Repository: quickwit-oss/tantivy
Branch: main
Commit: 545169c0d843
Files: 504
Total size: 29.6 MB

Directory structure:
gitextract_0oj2913e/

├── .claude/
│   └── skills/
│       ├── rationalize-deps/
│       │   └── SKILL.md
│       └── simple-pr/
│           └── SKILL.md
├── .github/
│   ├── FUNDING.yml
│   ├── ISSUE_TEMPLATE/
│   │   ├── actions.md
│   │   ├── bug_report.md
│   │   ├── feature_request.md
│   │   └── question.md
│   ├── dependabot.yml
│   └── workflows/
│       ├── coverage.yml
│       ├── long_running.yml
│       └── test.yml
├── .gitignore
├── ARCHITECTURE.md
├── AUTHORS
├── CHANGELOG.md
├── CITATION.cff
├── Cargo.toml
├── LICENSE
├── Makefile
├── README.md
├── RELEASE.md
├── TODO.txt
├── benches/
│   ├── agg_bench.rs
│   ├── alice.txt
│   ├── analyzer.rs
│   ├── and_or_queries.rs
│   ├── bool_queries_with_range.rs
│   ├── exists_json.rs
│   ├── gh.json
│   ├── hdfs.json
│   ├── index-bench.rs
│   ├── merge_segments.rs
│   ├── range_queries.rs
│   ├── range_query.rs
│   ├── regex_all_terms.rs
│   ├── str_search_and_get.rs
│   └── wiki.json
├── bitpacker/
│   ├── Cargo.toml
│   ├── benches/
│   │   └── bench.rs
│   └── src/
│       ├── bitpacker.rs
│       ├── blocked_bitpacker.rs
│       ├── filter_vec/
│       │   ├── avx2.rs
│       │   ├── mod.rs
│       │   └── scalar.rs
│       └── lib.rs
├── cliff.toml
├── columnar/
│   ├── Cargo.toml
│   ├── README.md
│   ├── benches/
│   │   ├── bench_access.rs
│   │   ├── bench_column_values_get.rs
│   │   ├── bench_create_column_values.rs
│   │   ├── bench_first_vals.rs
│   │   ├── bench_merge.rs
│   │   ├── bench_optional_index.rs
│   │   ├── bench_values_u128.rs
│   │   ├── bench_values_u64.rs
│   │   └── common.rs
│   ├── columnar-cli/
│   │   ├── Cargo.toml
│   │   └── src/
│   │       └── main.rs
│   ├── columnar-cli-inspect/
│   │   ├── Cargo.toml
│   │   └── src/
│   │       └── main.rs
│   ├── compat_tests_data/
│   │   ├── v1.columnar
│   │   └── v2.columnar
│   └── src/
│       ├── TODO.md
│       ├── block_accessor.rs
│       ├── column/
│       │   ├── dictionary_encoded.rs
│       │   ├── mod.rs
│       │   └── serialize.rs
│       ├── column_index/
│       │   ├── merge/
│       │   │   ├── mod.rs
│       │   │   ├── shuffled.rs
│       │   │   └── stacked.rs
│       │   ├── mod.rs
│       │   ├── multivalued_index.rs
│       │   ├── optional_index/
│       │   │   ├── mod.rs
│       │   │   ├── set.rs
│       │   │   ├── set_block/
│       │   │   │   ├── dense.rs
│       │   │   │   ├── mod.rs
│       │   │   │   ├── sparse.rs
│       │   │   │   └── tests.rs
│       │   │   └── tests.rs
│       │   └── serialize.rs
│       ├── column_values/
│       │   ├── merge.rs
│       │   ├── mod.rs
│       │   ├── monotonic_column.rs
│       │   ├── monotonic_mapping.rs
│       │   ├── monotonic_mapping_u128.rs
│       │   ├── stats.rs
│       │   ├── u128_based/
│       │   │   ├── compact_space/
│       │   │   │   ├── blank_range.rs
│       │   │   │   ├── build_compact_space.rs
│       │   │   │   └── mod.rs
│       │   │   └── mod.rs
│       │   ├── u64_based/
│       │   │   ├── bitpacked.rs
│       │   │   ├── blockwise_linear.rs
│       │   │   ├── line.rs
│       │   │   ├── linear.rs
│       │   │   ├── mod.rs
│       │   │   ├── stats_collector.rs
│       │   │   └── tests.rs
│       │   └── vec_column.rs
│       ├── columnar/
│       │   ├── column_type.rs
│       │   ├── format_version.rs
│       │   ├── merge/
│       │   │   ├── merge_dict_column.rs
│       │   │   ├── merge_mapping.rs
│       │   │   ├── mod.rs
│       │   │   ├── term_merger.rs
│       │   │   └── tests.rs
│       │   ├── mod.rs
│       │   ├── reader/
│       │   │   └── mod.rs
│       │   └── writer/
│       │       ├── column_operation.rs
│       │       ├── column_writers.rs
│       │       ├── mod.rs
│       │       ├── serializer.rs
│       │       └── value_index.rs
│       ├── compat_tests.rs
│       ├── dictionary.rs
│       ├── dynamic_column.rs
│       ├── iterable.rs
│       ├── lib.rs
│       ├── tests.rs
│       ├── utils.rs
│       └── value.rs
├── common/
│   ├── Cargo.toml
│   ├── benches/
│   │   └── bench.rs
│   └── src/
│       ├── bitset.rs
│       ├── bounds.rs
│       ├── byte_count.rs
│       ├── datetime.rs
│       ├── file_slice.rs
│       ├── group_by.rs
│       ├── json_path_writer.rs
│       ├── lib.rs
│       ├── serialize.rs
│       ├── vint.rs
│       └── writer.rs
├── doc/
│   ├── .gitignore
│   ├── book.toml
│   └── src/
│       ├── SUMMARY.md
│       ├── avant-propos.md
│       ├── basis.md
│       ├── best_practise.md.rs
│       ├── examples.md
│       ├── facetting.md
│       ├── faq.md
│       ├── index_sorting.md
│       ├── innerworkings.md
│       ├── inverted_index.md
│       ├── json.md
│       └── schema.md
├── examples/
│   ├── aggregation.rs
│   ├── basic_search.rs
│   ├── custom_collector.rs
│   ├── custom_tokenizer.rs
│   ├── date_time_field.rs
│   ├── deleting_updating_documents.rs
│   ├── faceted_search.rs
│   ├── faceted_search_with_tweaked_score.rs
│   ├── filter_aggregation.rs
│   ├── fuzzy_search.rs
│   ├── index_from_multiple_threads.rs
│   ├── index_with_json.rs
│   ├── integer_range_search.rs
│   ├── ip_field.rs
│   ├── iterating_docs_and_positions.rs
│   ├── json_field.rs
│   ├── phrase_prefix_search.rs
│   ├── pre_tokenized_text.rs
│   ├── snippet.rs
│   ├── stop_words.rs
│   └── warmer.rs
├── ownedbytes/
│   ├── Cargo.toml
│   └── src/
│       └── lib.rs
├── query-grammar/
│   ├── Cargo.toml
│   ├── README.md
│   └── src/
│       ├── infallible.rs
│       ├── lib.rs
│       ├── occur.rs
│       ├── query_grammar.rs
│       └── user_input_ast.rs
├── rustfmt.toml
├── src/
│   ├── aggregation/
│   │   ├── README.md
│   │   ├── accessor_helpers.rs
│   │   ├── agg_data.rs
│   │   ├── agg_limits.rs
│   │   ├── agg_req.rs
│   │   ├── agg_result.rs
│   │   ├── agg_tests.rs
│   │   ├── bucket/
│   │   │   ├── composite/
│   │   │   │   ├── accessors.rs
│   │   │   │   ├── calendar_interval.rs
│   │   │   │   ├── collector.rs
│   │   │   │   ├── map.rs
│   │   │   │   ├── mod.rs
│   │   │   │   └── numeric_types.rs
│   │   │   ├── filter.rs
│   │   │   ├── histogram/
│   │   │   │   ├── date_histogram.rs
│   │   │   │   ├── histogram.rs
│   │   │   │   └── mod.rs
│   │   │   ├── mod.rs
│   │   │   ├── range.rs
│   │   │   ├── term_agg.rs
│   │   │   └── term_missing_agg.rs
│   │   ├── cached_sub_aggs.rs
│   │   ├── collector.rs
│   │   ├── date.rs
│   │   ├── error.rs
│   │   ├── intermediate_agg_result.rs
│   │   ├── metric/
│   │   │   ├── average.rs
│   │   │   ├── cardinality.rs
│   │   │   ├── count.rs
│   │   │   ├── extended_stats.rs
│   │   │   ├── max.rs
│   │   │   ├── min.rs
│   │   │   ├── mod.rs
│   │   │   ├── percentiles.rs
│   │   │   ├── stats.rs
│   │   │   ├── sum.rs
│   │   │   └── top_hits.rs
│   │   ├── mod.rs
│   │   └── segment_agg_result.rs
│   ├── collector/
│   │   ├── count_collector.rs
│   │   ├── docset_collector.rs
│   │   ├── facet_collector.rs
│   │   ├── filter_collector_wrapper.rs
│   │   ├── histogram_collector.rs
│   │   ├── mod.rs
│   │   ├── multi_collector.rs
│   │   ├── sort_key/
│   │   │   ├── mod.rs
│   │   │   ├── order.rs
│   │   │   ├── sort_by_bytes.rs
│   │   │   ├── sort_by_erased_type.rs
│   │   │   ├── sort_by_score.rs
│   │   │   ├── sort_by_static_fast_value.rs
│   │   │   ├── sort_by_string.rs
│   │   │   └── sort_key_computer.rs
│   │   ├── sort_key_top_collector.rs
│   │   ├── tests.rs
│   │   ├── top_collector.rs
│   │   └── top_score_collector.rs
│   ├── compat_tests.rs
│   ├── core/
│   │   ├── executor.rs
│   │   ├── json_utils.rs
│   │   ├── mod.rs
│   │   ├── searcher.rs
│   │   └── tests.rs
│   ├── directory/
│   │   ├── composite_file.rs
│   │   ├── directory.rs
│   │   ├── directory_lock.rs
│   │   ├── error.rs
│   │   ├── footer.rs
│   │   ├── managed_directory.rs
│   │   ├── mmap_directory/
│   │   │   ├── file_watcher.rs
│   │   │   └── mod.rs
│   │   ├── mod.rs
│   │   ├── ram_directory.rs
│   │   ├── tests.rs
│   │   └── watch_event_router.rs
│   ├── docset.rs
│   ├── error.rs
│   ├── fastfield/
│   │   ├── alive_bitset.rs
│   │   ├── error.rs
│   │   ├── facet_reader.rs
│   │   ├── mod.rs
│   │   ├── readers.rs
│   │   └── writer.rs
│   ├── fieldnorm/
│   │   ├── code.rs
│   │   ├── mod.rs
│   │   ├── reader.rs
│   │   ├── serializer.rs
│   │   └── writer.rs
│   ├── functional_test.rs
│   ├── future_result.rs
│   ├── index/
│   │   ├── index.rs
│   │   ├── index_meta.rs
│   │   ├── inverted_index_reader.rs
│   │   ├── mod.rs
│   │   ├── segment.rs
│   │   ├── segment_component.rs
│   │   ├── segment_id.rs
│   │   └── segment_reader.rs
│   ├── indexer/
│   │   ├── delete_queue.rs
│   │   ├── doc_id_mapping.rs
│   │   ├── doc_opstamp_mapping.rs
│   │   ├── flat_map_with_buffer.rs
│   │   ├── index_writer.rs
│   │   ├── index_writer_status.rs
│   │   ├── indexing_term.rs
│   │   ├── log_merge_policy.rs
│   │   ├── merge_index_test.rs
│   │   ├── merge_operation.rs
│   │   ├── merge_policy.rs
│   │   ├── merger.rs
│   │   ├── mod.rs
│   │   ├── operation.rs
│   │   ├── path_to_unordered_id.rs
│   │   ├── prepared_commit.rs
│   │   ├── segment_entry.rs
│   │   ├── segment_manager.rs
│   │   ├── segment_register.rs
│   │   ├── segment_serializer.rs
│   │   ├── segment_updater.rs
│   │   ├── segment_writer.rs
│   │   ├── single_segment_index_writer.rs
│   │   └── stamper.rs
│   ├── lib.rs
│   ├── macros.rs
│   ├── positions/
│   │   ├── mod.rs
│   │   ├── reader.rs
│   │   └── serializer.rs
│   ├── postings/
│   │   ├── block_search.rs
│   │   ├── block_segment_postings.rs
│   │   ├── compression/
│   │   │   ├── mod.rs
│   │   │   └── vint.rs
│   │   ├── indexing_context.rs
│   │   ├── json_postings_writer.rs
│   │   ├── loaded_postings.rs
│   │   ├── mod.rs
│   │   ├── per_field_postings_writer.rs
│   │   ├── postings.rs
│   │   ├── postings_writer.rs
│   │   ├── recorder.rs
│   │   ├── segment_postings.rs
│   │   ├── serializer.rs
│   │   ├── skip.rs
│   │   └── term_info.rs
│   ├── query/
│   │   ├── all_query.rs
│   │   ├── automaton_weight.rs
│   │   ├── bitset/
│   │   │   └── mod.rs
│   │   ├── bm25.rs
│   │   ├── boolean_query/
│   │   │   ├── block_wand.rs
│   │   │   ├── boolean_query.rs
│   │   │   ├── boolean_weight.rs
│   │   │   └── mod.rs
│   │   ├── boost_query.rs
│   │   ├── const_score_query.rs
│   │   ├── disjunction.rs
│   │   ├── disjunction_max_query.rs
│   │   ├── empty_query.rs
│   │   ├── exclude.rs
│   │   ├── exist_query.rs
│   │   ├── explanation.rs
│   │   ├── fuzzy_query.rs
│   │   ├── intersection.rs
│   │   ├── mod.rs
│   │   ├── more_like_this/
│   │   │   ├── mod.rs
│   │   │   ├── more_like_this.rs
│   │   │   └── query.rs
│   │   ├── phrase_prefix_query/
│   │   │   ├── mod.rs
│   │   │   ├── phrase_prefix_query.rs
│   │   │   ├── phrase_prefix_scorer.rs
│   │   │   └── phrase_prefix_weight.rs
│   │   ├── phrase_query/
│   │   │   ├── mod.rs
│   │   │   ├── phrase_query.rs
│   │   │   ├── phrase_scorer.rs
│   │   │   ├── phrase_weight.rs
│   │   │   ├── regex_phrase_query.rs
│   │   │   └── regex_phrase_weight.rs
│   │   ├── query.rs
│   │   ├── query_parser/
│   │   │   ├── logical_ast.rs
│   │   │   ├── mod.rs
│   │   │   └── query_parser.rs
│   │   ├── range_query/
│   │   │   ├── fast_field_range_doc_set.rs
│   │   │   ├── mod.rs
│   │   │   ├── range_query.rs
│   │   │   └── range_query_fastfield.rs
│   │   ├── regex_query.rs
│   │   ├── reqopt_scorer.rs
│   │   ├── score_combiner.rs
│   │   ├── scorer.rs
│   │   ├── set_query.rs
│   │   ├── size_hint.rs
│   │   ├── term_query/
│   │   │   ├── mod.rs
│   │   │   ├── term_query.rs
│   │   │   ├── term_scorer.rs
│   │   │   └── term_weight.rs
│   │   ├── union/
│   │   │   ├── bitset_union.rs
│   │   │   ├── buffered_union.rs
│   │   │   ├── mod.rs
│   │   │   └── simple_union.rs
│   │   ├── vec_docset.rs
│   │   └── weight.rs
│   ├── reader/
│   │   ├── mod.rs
│   │   └── warming.rs
│   ├── schema/
│   │   ├── bytes_options.rs
│   │   ├── date_time_options.rs
│   │   ├── document/
│   │   │   ├── de.rs
│   │   │   ├── default_document.rs
│   │   │   ├── existing_type_impls.rs
│   │   │   ├── mod.rs
│   │   │   ├── owned_value.rs
│   │   │   ├── se.rs
│   │   │   └── value.rs
│   │   ├── facet.rs
│   │   ├── facet_options.rs
│   │   ├── field.rs
│   │   ├── field_entry.rs
│   │   ├── field_type.rs
│   │   ├── flags.rs
│   │   ├── index_record_option.rs
│   │   ├── ip_options.rs
│   │   ├── json_object_options.rs
│   │   ├── mod.rs
│   │   ├── named_field_document.rs
│   │   ├── numeric_options.rs
│   │   ├── schema.rs
│   │   ├── term.rs
│   │   └── text_options.rs
│   ├── snippet/
│   │   └── mod.rs
│   ├── space_usage/
│   │   └── mod.rs
│   ├── store/
│   │   ├── compression_lz4_block.rs
│   │   ├── compression_zstd_block.rs
│   │   ├── compressors.rs
│   │   ├── decompressors.rs
│   │   ├── footer.rs
│   │   ├── index/
│   │   │   ├── block.rs
│   │   │   ├── mod.rs
│   │   │   ├── skip_index.rs
│   │   │   └── skip_index_builder.rs
│   │   ├── mod.rs
│   │   ├── reader.rs
│   │   ├── store_compressor.rs
│   │   └── writer.rs
│   ├── termdict/
│   │   ├── fst_termdict/
│   │   │   ├── merger.rs
│   │   │   ├── mod.rs
│   │   │   ├── streamer.rs
│   │   │   ├── term_info_store.rs
│   │   │   └── termdict.rs
│   │   ├── mod.rs
│   │   ├── sstable_termdict/
│   │   │   ├── merger.rs
│   │   │   └── mod.rs
│   │   └── tests.rs
│   └── tokenizer/
│       ├── alphanum_only.rs
│       ├── ascii_folding_filter.rs
│       ├── empty_tokenizer.rs
│       ├── facet_tokenizer.rs
│       ├── lower_caser.rs
│       ├── mod.rs
│       ├── ngram_tokenizer.rs
│       ├── raw_tokenizer.rs
│       ├── regex_tokenizer.rs
│       ├── remove_long.rs
│       ├── simple_tokenizer.rs
│       ├── split_compound_words.rs
│       ├── stemmer.rs
│       ├── stop_word_filter/
│       │   ├── gen_stopwords.py
│       │   ├── mod.rs
│       │   └── stopwords.rs
│       ├── tokenized_string.rs
│       ├── tokenizer.rs
│       ├── tokenizer_manager.rs
│       └── whitespace_tokenizer.rs
├── sstable/
│   ├── Cargo.toml
│   ├── README.md
│   ├── benches/
│   │   ├── ord_to_term.rs
│   │   └── stream_bench.rs
│   ├── src/
│   │   ├── block_match_automaton.rs
│   │   ├── block_reader.rs
│   │   ├── delta.rs
│   │   ├── dictionary.rs
│   │   ├── lib.rs
│   │   ├── merge/
│   │   │   ├── heap_merge.rs
│   │   │   └── mod.rs
│   │   ├── sstable_index_v2.rs
│   │   ├── sstable_index_v3.rs
│   │   ├── streamer.rs
│   │   ├── value/
│   │   │   ├── index.rs
│   │   │   ├── mod.rs
│   │   │   ├── range.rs
│   │   │   ├── u64_monotonic.rs
│   │   │   ├── vec_u32.rs
│   │   │   └── void.rs
│   │   └── vint.rs
│   └── tests/
│       └── sstable_test.rs
├── stacker/
│   ├── Cargo.toml
│   ├── Performance.md
│   ├── benches/
│   │   └── bench.rs
│   ├── example/
│   │   └── hashmap.rs
│   ├── fuzz_test/
│   │   ├── Cargo.toml
│   │   └── src/
│   │       └── main.rs
│   └── src/
│       ├── arena_hashmap.rs
│       ├── expull.rs
│       ├── fastcmp.rs
│       ├── fastcpy.rs
│       ├── lib.rs
│       ├── memory_arena.rs
│       └── shared_arena_hashmap.rs
├── tests/
│   ├── compat_tests_data/
│   │   ├── index_v6/
│   │   │   ├── .managed.json
│   │   │   ├── 00000000000000000000000000000000.fast
│   │   │   ├── 00000000000000000000000000000000.fieldnorm
│   │   │   ├── 00000000000000000000000000000000.idx
│   │   │   ├── 00000000000000000000000000000000.pos
│   │   │   ├── 00000000000000000000000000000000.store
│   │   │   ├── 00000000000000000000000000000000.term
│   │   │   └── meta.json
│   │   └── index_v7/
│   │       ├── .managed.json
│   │       ├── 000002f0000000000000000000000000.fast
│   │       ├── 000002f0000000000000000000000000.fieldnorm
│   │       ├── 000002f0000000000000000000000000.idx
│   │       ├── 000002f0000000000000000000000000.pos
│   │       ├── 000002f0000000000000000000000000.store
│   │       ├── 000002f0000000000000000000000000.term
│   │       └── meta.json
│   └── failpoints/
│       └── mod.rs
└── tokenizer-api/
    ├── Cargo.toml
    ├── README.md
    └── src/
        └── lib.rs

================================================
FILE CONTENTS
================================================

================================================
FILE: .claude/skills/rationalize-deps/SKILL.md
================================================
---
name: rationalize-deps
description: Analyze Cargo.toml dependencies and attempt to remove unused features to reduce compile times and binary size
---

# Rationalize Dependencies

This skill analyzes Cargo.toml dependencies to identify and remove unused features.

## Overview

Many crates enable features by default that may not be needed. This skill:
1. Identifies dependencies with default features enabled
2. Tests if `default-features = false` works
3. Identifies which specific features are actually needed
4. Verifies compilation after changes

## Step 1: Identify the target

Ask the user which crate(s) to analyze:
- A specific crate name (e.g., "tokio", "serde")
- A specific workspace member (e.g., "quickwit-search")
- "all" to scan the entire workspace

## Step 2: Analyze current dependencies

For the workspace Cargo.toml (`quickwit/Cargo.toml`), list dependencies that:
- Do NOT have `default-features = false`
- Have default features that might be unnecessary

Run: `cargo tree -p <crate> -f "{p} {f}" --edges features` to see what features are actually used.

## Step 3: For each candidate dependency

### 3a: Check the crate's default features

Look up the crate on crates.io or check its Cargo.toml to understand:
- What features are enabled by default
- What each feature provides

Use: `cargo metadata --format-version=1 | jq '.packages[] | select(.name == "<crate>") | .features'`

### 3b: Try disabling default features

Modify the dependency in `quickwit/Cargo.toml`:

From:
```toml
some-crate = { version = "1.0" }
```

To:
```toml
some-crate = { version = "1.0", default-features = false }
```

### 3c: Run cargo check

Run: `cargo check --workspace` (or target specific packages for faster feedback)

If compilation fails:
1. Read the error messages to identify which features are needed
2. Add only the required features explicitly:
   ```toml
   some-crate = { version = "1.0", default-features = false, features = ["needed-feature"] }
   ```
3. Re-run cargo check

### 3d: Binary search for minimal features

If there are many default features, use binary search:
1. Start with no features
2. If it fails, add half the default features
3. Continue until you find the minimal set

## Step 4: Document findings

For each dependency analyzed, report:
- Original configuration
- New configuration (if changed)
- Features that were removed
- Any features that are required

## Step 5: Verify full build

After all changes, run:
```bash
cargo check --workspace --all-targets
cargo test --workspace --no-run
```

## Common Patterns

### Serde
Often only needs `derive`:
```toml
serde = { version = "1.0", default-features = false, features = ["derive", "std"] }
```

### Tokio
Identify which runtime features are actually used:
```toml
tokio = { version = "1.0", default-features = false, features = ["rt-multi-thread", "macros", "sync"] }
```

### Reqwest
Often doesn't need all TLS backends:
```toml
reqwest = { version = "0.11", default-features = false, features = ["rustls-tls", "json"] }
```

## Rollback

If changes cause issues:
```bash
git checkout quickwit/Cargo.toml
cargo check --workspace
```

## Tips

- Start with large crates that have many default features (tokio, reqwest, hyper)
- Use `cargo bloat --crates` to identify large dependencies
- Check `cargo tree -d` for duplicate dependencies that might indicate feature conflicts
- Some features are needed only for tests - consider using `[dev-dependencies]` features


================================================
FILE: .claude/skills/simple-pr/SKILL.md
================================================
---
name: simple-pr
description: Create a simple PR from staged changes with an auto-generated commit message
disable-model-invocation: true
---

# Simple PR

Follow these steps to create a simple PR from staged changes:

## Step 1: Check workspace state

Run: `git status`

Verify that all changes have been staged (no unstaged changes). If there are unstaged changes, abort and ask the user to stage their changes first with `git add`.

Also verify that we are on the `main` branch. If not, abort and ask the user to switch to main first.

## Step 2: Ensure main is up to date

Run: `git pull origin main`

This ensures we're working from the latest code.

## Step 3: Review staged changes

Run: `git diff --cached`

Review the staged changes to understand what the PR will contain.

## Step 4: Generate commit message

Based on the staged changes, generate a concise commit message (1-2 sentences) that describes the "why" rather than the "what".

Display the proposed commit message to the user and ask for confirmation before proceeding.

## Step 5: Create a new branch

Get the git username: `git config user.name | tr ' ' '-' | tr '[:upper:]' '[:lower:]'`

Create a short, descriptive branch name based on the changes (e.g., `fix-typo-in-readme`, `add-retry-logic`, `update-deps`).

Create and checkout the branch: `git checkout -b {username}/{short-descriptive-name}`

## Step 6: Commit changes

Commit with the message from step 4:
```
git commit -m "{commit-message}"
```

## Step 7: Push and open a PR

Push the branch and open a PR:
```
git push -u origin {branch-name}
gh pr create --title "{commit-message-title}" --body "{longer-description-if-needed}"
```

Report the PR URL to the user when complete.


================================================
FILE: .github/FUNDING.yml
================================================
# These are supported funding model platforms

github: fulmicoton
patreon: # Replace with a single Patreon username
open_collective: # Replace with a single Open Collective username
ko_fi: # Replace with a single Ko-fi username
tidelift: # Replace with a single Tidelift platform-name/package-name e.g., npm/babel
community_bridge: # Replace with a single Community Bridge project-name e.g., cloud-foundry
liberapay: # Replace with a single Liberapay username
issuehunt: # Replace with a single IssueHunt username
otechie: # Replace with a single Otechie username
custom: # Replace with up to 4 custom sponsorship URLs e.g., ['link1', 'link2']


================================================
FILE: .github/ISSUE_TEMPLATE/actions.md
================================================
---
name: Actions
about: Actions not directly related to producing code.

---

# Actions title

Action description. 
e.g. 
- benchmark
- investigate and report
- etc.


================================================
FILE: .github/ISSUE_TEMPLATE/bug_report.md
================================================
---
name: Bug report
about: Create a report to help us improve

---

**Describe the bug**
- What did you do?
- What happened?
- What was expected?

**Which version of tantivy are you using?**
If "main", ideally give the specific sha1 revision.

**To Reproduce**

If your bug is deterministic, can you give a minimal reproducing code?
Some bugs are not deterministic. Can you describe with precision in which context it happened?
If this is possible, can you share your code?


================================================
FILE: .github/ISSUE_TEMPLATE/feature_request.md
================================================
---
name: Feature request
about: Suggest an idea for this project

---

**Is your feature request related to a problem? Please describe.**
A clear and concise description of what the problem is. Ex. I'm always frustrated when [...]

**Describe the solution you'd like**
A clear and concise description of what you want to happen.

**[Optional] describe alternatives you've considered**
A clear and concise description of any alternative solutions or features you've considered.


================================================
FILE: .github/ISSUE_TEMPLATE/question.md
================================================
---
name: Question
about: Ask any question about tantivy's usage...

---

Try to be specific about your use case...


================================================
FILE: .github/dependabot.yml
================================================
version: 2
updates:
- package-ecosystem: cargo
  directory: "/"
  schedule:
    interval: daily
    time: "20:00"
  open-pull-requests-limit: 10

- package-ecosystem: "github-actions"
  directory: "/"
  schedule:
    interval: daily
    time: "20:00"
  open-pull-requests-limit: 10


================================================
FILE: .github/workflows/coverage.yml
================================================
name: Coverage

on:
  push:
    branches: [main]

# Ensures that we cancel running jobs for the same PR / same workflow.
concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
  cancel-in-progress: true

jobs:
  coverage:
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v4
      - name: Install Rust
        run: rustup toolchain install nightly-2025-12-01 --profile minimal --component llvm-tools-preview
      - uses: Swatinem/rust-cache@v2
      - uses: taiki-e/install-action@cargo-llvm-cov
      - name: Generate code coverage
        run: cargo +nightly-2025-12-01 llvm-cov --all-features --workspace --doctests --lcov --output-path lcov.info
      - name: Upload coverage to Codecov
        uses: codecov/codecov-action@v3
        continue-on-error: true
        with:
          token: ${{ secrets.CODECOV_TOKEN }} # not required for public repos
          files: lcov.info
          fail_ci_if_error: true


================================================
FILE: .github/workflows/long_running.yml
================================================
name: Long running tests

on:
  push:
    branches: [ main ]

env:
  CARGO_TERM_COLOR: always
  NUM_FUNCTIONAL_TEST_ITERATIONS: 20000

# Ensures that we cancel running jobs for the same PR / same workflow.
concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
  cancel-in-progress: true

jobs:
  test:

    runs-on: ubuntu-latest

    steps:
    - uses: actions/checkout@v4
    - name: Install stable
      uses: actions-rs/toolchain@v1
      with:
          toolchain: stable
          profile: minimal
          override: true

    - name: Run indexing_unsorted
      run: cargo test indexing_unsorted -- --ignored
    - name: Run indexing_sorted
      run: cargo test indexing_sorted -- --ignored


================================================
FILE: .github/workflows/test.yml
================================================
name: Unit tests

on:
  push:
    branches: [ main ]
  pull_request:
    branches: [ main ]

env:
  CARGO_TERM_COLOR: always

# Ensures that we cancel running jobs for the same PR / same workflow.
concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
  cancel-in-progress: true

jobs:
  check:

    runs-on: ubuntu-latest

    steps:
    - uses: actions/checkout@v4

    - name: Install nightly
      uses: actions-rs/toolchain@v1
      with:
            toolchain: nightly
            profile: minimal
            components: rustfmt
    - name: Install stable
      uses: actions-rs/toolchain@v1
      with:
            toolchain: stable
            profile: minimal
            components: clippy

    - uses: Swatinem/rust-cache@v2

    - name: Check Formatting
      run: cargo +nightly fmt --all -- --check

    - name: Check Stable Compilation
      run: cargo build --all-features


    - name: Check Bench Compilation
      run: cargo +nightly bench --no-run --profile=dev --all-features

    - uses: actions-rs/clippy-check@v1
      with:
        toolchain: stable
        token: ${{ secrets.GITHUB_TOKEN }}
        args: --tests

  test:

    runs-on: ubuntu-latest

    strategy:
      matrix:
        features:
          - { label: "all", flags: "mmap,stopwords,lz4-compression,zstd-compression,failpoints,stemmer" }
          - { label: "quickwit", flags: "mmap,quickwit,failpoints" }
          - { label: "none", flags: "" }

    name: test-${{ matrix.features.label}}

    steps:
    - uses: actions/checkout@v4

    - name: Install stable
      uses: actions-rs/toolchain@v1
      with:
            toolchain: stable
            profile: minimal
            override: true

    - uses: taiki-e/install-action@nextest
    - uses: Swatinem/rust-cache@v2

    - name: Run tests
      run: |
        # if matrix.features.flags is empty then run on --lib to avoid compiling examples
        # (as most of them rely on mmap) otherwise run all
        if [ -z "${{ matrix.features.flags }}" ]; then
          cargo +stable nextest run --lib --no-default-features --verbose --workspace
        else
          cargo +stable nextest run --features ${{ matrix.features.flags }} --no-default-features --verbose --workspace
        fi

    - name: Run doctests
      run: |
        # if matrix.features.flags is empty then skip the doctests entirely,
        # otherwise run them with the selected feature flags
        if [ -z "${{ matrix.features.flags }}" ]; then
          echo "no doctest for no feature flag"
        else
          cargo +stable test --doc --features ${{ matrix.features.flags }} --verbose --workspace
        fi


================================================
FILE: .gitignore
================================================
tantivy.iml
.cargo
proptest-regressions
*.swp
target
target/debug
.vscode
target/release
Cargo.lock
benchmark
.DS_Store
*.bk
.idea
trace.dat
cargo-timing*
control
variable


================================================
FILE: ARCHITECTURE.md
================================================
# Tantivy

## What is tantivy?

Tantivy is a library that is meant to build search engines. Although it is by no means a port of Lucene, its architecture is strongly inspired by it. If you are familiar with Lucene, you may be struck by the overlapping vocabulary.
This is not fortuitous.

Tantivy's bread and butter is to address the problem of full-text search :

Given a large set of textual documents, and a text query, return the K-most relevant documents in a very efficient way. To execute these queries rapidly, tantivy needs to build an index beforehand. The relevance score implemented in tantivy is not configurable. Tantivy uses the same score as the default similarity used in Lucene / Elasticsearch, called [BM25](https://en.wikipedia.org/wiki/Okapi_BM25).

But tantivy's scope does not stop there. Numerous features are required to power rich-search applications. For instance, one may want to:

- compute the count of documents matching a query in the different sections of an e-commerce website,
- display an average price per square meter for a real estate search engine,
- take into account historical user data to rank documents in a specific way,
- or even use tantivy to power an OLAP database.

A more abstract description of the problem space tantivy is trying to address is the following.

Ingest a large set of documents, create an index that makes it possible to
rapidly select all documents matching a given predicate (also known as a query) and
collect some information about them ([See collector](#collector-define-what-to-do-with-matched-documents)).

Roughly speaking the design is following these guiding principles:

- Search should be O(1) in memory.
- Indexing should be O(1) in memory. (In practice it is just sublinear)
- Search should be as fast as possible

This comes at the cost of the dynamicity of the index: while it is possible to add and delete documents from our corpus, tantivy is designed to handle these updates in large batches.

## [core/](src/core): Index, segments, searchers

Core contains all of the high-level code to make it possible to create an index, add documents, delete documents and commit.

This is at once the most high-level part of tantivy, the least performance-sensitive one, the seemingly most mundane code... And paradoxically the most complicated part.

### Index and Segments

A tantivy index is a collection of smaller independent immutable segments.
Each segment contains its own independent set of data structures.

A segment is identified by a segment id that is in fact a UUID.
The file of a segment has the format

 ```segment-id . ext```

The extension signals which data structure (or [`SegmentComponent`](src/index/segment_component.rs)) is stored in the file.

A small `meta.json` file is in charge of keeping track of the list of segments, as well as the schema.

On commit, one segment per indexing thread is written to disk, and the `meta.json` is then updated atomically.

For a better idea of how indexing works, you may read the [following blog post](https://fulmicoton.com/posts/behold-tantivy-part2/).

### Deletes

Deletes happen by deleting a "term". Tantivy does not offer any notion of primary id, so it is up to the user to use a field in their schema as if it was a primary id, and delete the associated term if they want to delete only one specific document.

On commit, tantivy will find all of the segments with documents matching this existing term and remove them from the [alive bitset file](src/fastfield/alive_bitset.rs) that represents the bitset of the alive document ids.
Like all segment files, this file is immutable. Because it is possible to have more than one alive bitset file at a given instant, the alive bitset filename has the format ```segment_id . commit_opstamp . del```.

An opstamp is simply an incremental id that identifies any operation applied to the index. For instance, performing a commit or adding a document.

### DocId

Within a segment, all documents are identified by a DocId that ranges within `[0, max_doc)`,
where `max_doc` is the number of documents in the segment (deleted or not). Having such a compact `DocId` space is key to the compression of our data structures.

The DocIds are simply allocated in the order documents are added to the index.

### Merges

In separate threads, tantivy's index writer searches for opportunities to merge segments.
The point of segment merge is to:

- eventually get rid of tombstoned documents
- reduce the otherwise ever-growing number of segments.

Indeed, while having several segments instead of one does not hurt search too much, having hundreds can have a measurable impact on the search performance.

### Searcher

The user of the library usually does not need to know about the existence of Segments.
Searching is done through an object called a [`Searcher`](src/core/searcher.rs), that captures a
snapshot of the index at one point of time, by holding a list of [SegmentReader](src/core/segment_reader.rs).

In other words, regardless of commits, file garbage collection, or segment merges that might happen, as long as the user holds and reuses the same [Searcher](src/core/searcher.rs), search will happen on an immutable snapshot of the index.

## [directory/](src/directory): Where should the data be stored?

Tantivy, like Lucene, abstracts the place where the data should be stored in a key-trait
called [`Directory`](src/directory/directory.rs).
Contrary to Lucene however, "files" are quite different from some kind of `io::Read` object.
Check out [`src/directory/directory.rs`](src/directory/directory.rs) trait for more details.

Tantivy ships two main directory implementations: the `MmapDirectory` and the `RamDirectory`,
but users can extend tantivy with their own implementation.

## [schema/](src/schema): What are documents?

Tantivy's document follows a very strict schema, decided before building any index.

The schema defines all of the fields that the index's documents (see [`Document`](src/schema/document/mod.rs)) may and should contain, their types (`text`, `i64`, `u64`, `Date`, ...), as well as how they should be indexed / represented in tantivy.

Depending on the type of the field, you can decide to

- put it in the docstore
- store it as a fast field
- index it

Practically, tantivy will push values associated with this type to up to 3 respective
data structures.

*Limitations*

As of today, tantivy's schema imposes a 1:1 relationship between a field that is being ingested and a field represented in the search index. In sophisticated search applications, it is fairly common to want to index a field twice using different tokenizers, or to index the concatenation of several fields together into one field.

This is not something tantivy supports, and it is up to the user to duplicate field / concatenate fields before feeding them to tantivy.

## General information about these data structures

All data structures in tantivy have:

- a writer
- a serializer
- a reader

The writer builds an in-memory representation of a batch of documents. This representation is not searchable. It is just meant as an intermediary mutable representation, to which we can sequentially add
the document of a batch. At the end of the batch (or if a memory limit is reached), this representation
is then converted into an on-disk immutable representation, that is extremely compact.
This conversion is done by the serializer.

Finally, the reader is in charge of offering an API to read on this on-disk read-only representation.
In tantivy, readers are designed to require very little anonymous memory. The data is read straight from an mmapped file, and loading an index is as fast as mmapping its files.

## [store/](src/store): Here is my DocId, Gimme my document

The docstore is a row-oriented storage that, for each document, stores a subset of the fields
that are marked as stored in the schema. The docstore is compressed using a general-purpose algorithm
like LZ4.

**Useful for**

In search engines, it is often used to display search results.
Once the top 10 documents have been identified, we fetch them from the store, and display them or their snippet on the search result page (aka SERP).

**Not useful for**

Fetching a document from the store is typically a "slow" operation. It usually consists in

- searching into a compact tree-like data structure to find the position of the right block.
- decompressing a small block
- returning the document from this block.

It is NOT meant to be called for every document matching a query.

As a rule of thumb, if you hit the docstore more than 100 times per search query, you are probably misusing tantivy.

## [fastfield/](src/fastfield): Here is my DocId, Gimme my value

Fast fields are stored in a column-oriented storage that allows for random access.
The only compression applied is bitpacking. The column comes with two pieces of metadata:
the minimum value in the column and the number of bits per doc.

Fetching a value for a `DocId` is then as simple as computing

```rust
min_value + fetch_bits(num_bits * doc_id..num_bits * (doc_id+1))
```

This operation just requires one memory fetch.
In addition, DocSets are scanned through in order (DocIds are iterated in a sorted manner), which
also helps locality.

In Lucene's jargon, fast fields are called DocValues.

**Useful for**

They are typically integer values that are useful to either rank or compute aggregate over
all of the documents matching a query (aka [DocSet](src/docset.rs)).

For instance, one could define a function to combine upvotes with tantivy's internal relevancy score.
This can be done by fetching a fast field during scoring.
One could also compute the mean price of the items matching a query in an e-commerce website.
This can be done by fetching a fast field in a collector.
Finally, one could decide to post-filter a docset to remove documents with a price within a specific range.
If the ratio of filtered out documents is not too low, an efficient way to do this is to fetch the price and apply the filter on the collector side.

Aside from integer values, it is also possible to store an actual byte payload.
For advanced search engines, it is possible to store all of the features required for learning-to-rank in a byte payload, access it during search, and apply the learning-to-rank model.

Finally facets are a specific kind of fast field, and the associated source code is in [`fastfield/facet_reader.rs`](src/fastfield/facet_reader.rs).

# The inverted search index

The inverted index is the core part of full-text search.
When presented with a new document with the text field "Hello, happy tax payer!", tantivy breaks it into a list of so-called tokens. In addition to just splitting these strings into tokens, it might also do different kinds of operations like dropping the punctuation, converting the characters to lowercase, applying stemming, etc. Tantivy makes it possible to configure the operations to be applied in the schema (tokenizer/ is the place where these operations are implemented).

For instance, the default tokenizer of tantivy would break our text into: `[hello, happy, tax, payer]`.
The document will therefore be registered in the inverted index as containing the terms
`[text:hello, text:happy, text:tax, text:payer]`.

The role of the inverted index is, when given a term, to give us in return a very fast iterator over the sorted doc ids that match the term.

Such an iterator is called a posting list. In addition to giving us `DocId`s, they can also optionally give us the number of occurrences of the term for each document, also called term frequency or TF.

These iterators being sorted by DocId, one can create an iterator over the documents containing `text:tax AND text:payer`, `(text:tax AND text:payer) OR (text:contribuable)` or any boolean expression.

In order to represent the function
```Term ⟶ Posting```

The inverted index actually consists of two data structures chained together.

- [Term](src/schema/term.rs) ⟶ [TermInfo](src/postings/term_info.rs) is addressed by the term dictionary.
- [TermInfo](src/postings/term_info.rs) ⟶ [Posting](src/postings/postings.rs) is addressed by the posting lists.

Where [TermInfo](src/postings/term_info.rs) is an object containing some meta data about a term.

## [termdict/](src/termdict): Here is a term, give me the [TermInfo](src/postings/term_info.rs)

Tantivy's term dictionary is mainly in charge of supplying the function

[Term](src/schema/term.rs) ⟶ [TermInfo](src/postings/term_info.rs)

It is itself broken into two parts.

- [Term](src/schema/term.rs) ⟶ [TermOrdinal](src/termdict/mod.rs) is addressed by a finite state transducer, implemented by the fst crate.
- [TermOrdinal](src/termdict/mod.rs) ⟶ [TermInfo](src/postings/term_info.rs) is addressed by the term info store.

## [postings/](src/postings): Iterate over documents... very fast

A posting list makes it possible to store a sorted list of doc ids and for each doc store
a term frequency as well.

The posting lists are stored in a separate file. The [TermInfo](src/postings/term_info.rs) contains an offset into that file and a number of documents for the given posting list. Both are required and sufficient to read the posting list.

The posting list is organized in blocks of 128 documents.
One block of doc ids is followed by one block of term frequencies.

The doc ids are delta encoded and bitpacked.
The term frequencies are bitpacked.

Because the number of docs is rarely a multiple of 128, the last block may contain anywhere between 1 and 127 documents. We then use variable int encoding instead of bitpacking.

## [positions/](src/positions): Where are my terms within the documents?

Phrase queries make it possible to search for documents containing a specific sequence of terms.
For instance, the phrase query "the art of war" does not match "the war of art".
To make this possible, one can specify in the schema that a field should store positions in addition to being indexed.

The token positions of all of the terms are then stored in a separate file with the extension `.pos`.
The [TermInfo](src/postings/term_info.rs) gives an offset (expressed in position this time) in this file. As we iterate through the docset,
we advance the position reader by the number of term frequencies of the current document.

## [fieldnorm/](src/fieldnorm): Here is my doc, how many tokens in this field?

The [BM25](https://en.wikipedia.org/wiki/Okapi_BM25) formula also requires knowing the number of tokens stored in a specific field for a given document. We store this information in one byte per document in the fieldnorm.
The fieldnorm is therefore compressed. Values up to 40 are encoded unchanged.

## [tokenizer/](src/tokenizer): How should we process text?

Text processing is key to a good search experience.
Split or normalize your text too much, and the search results will have a lower precision and a higher recall.
Do not normalize, or under-split your text, and you will end up with a higher precision and a lower recall.

Text processing can be configured by selecting an off-the-shelf [`Tokenizer`](./src/tokenizer/tokenizer.rs) or implementing your own to first split the text into tokens, and then chain different [`TokenFilter`](src/tokenizer/tokenizer.rs)'s to it.

Tantivy comes with a few tokenizers, but external crates offer more advanced tokenizers, such as [Lindera](https://crates.io/crates/lindera) for Japanese.

## [query/](src/query): Define and compose queries

The [Query](src/query/query.rs) trait defines what a query is.
Due to the necessity for some queries to compute some statistics over the entire index, and because the
index is composed of several `SegmentReader`, the path from transforming a `Query` to an iterator over documents is slightly convoluted, but fundamentally, this is what a Query is.

The iterator over documents comes with some scoring function. The resulting trait is called a
[Scorer](src/query/scorer.rs) and is specific to a segment.

Different queries can be combined using the [BooleanQuery](src/query/boolean_query/).
Tantivy comes with different types of queries and can be extended by implementing
the `Query`, `Weight`, and `Scorer` traits.

## [collector](src/collector): Define what to do with matched documents

Collectors define how to aggregate the documents matching a query, in the broadest sense possible.
The search will push matched documents one by one, calling their
`fn collect(doc: DocId, score: Score);` method.

Users may implement their own collectors by implementing the [Collector](src/collector/mod.rs) trait.

## [query-grammar](query-grammar): Defines the grammar of the query parser

While the [QueryParser](src/query/query_parser/query_parser.rs) struct is located in the `query/` directory, the actual parser combinator used to convert user queries into an AST is in an external crate called `query-grammar`. This part was externalized to lighten the work of the compiler.


================================================
FILE: AUTHORS
================================================
# This is the list of authors of tantivy for copyright purposes.
Paul Masurel
Laurentiu Nicola
Dru Sellers
Ashley Mannix
Michael J. Curry
Jason Wolfe
# As an employee of Google I am required to add Google LLC
# in the list of authors, but this project is not affiliated to Google
# in any other way.
Google LLC 


================================================
FILE: CHANGELOG.md
================================================
Tantivy 0.25
================================

## Bugfixes
- fix union performance regression in tantivy 0.24 [#2663](https://github.com/quickwit-oss/tantivy/pull/2663)(@PSeitz)
- make zstd optional in sstable [#2633](https://github.com/quickwit-oss/tantivy/pull/2633)(@Parth)
- Fix TopDocs::order_by_string_fast_field for asc order [#2672](https://github.com/quickwit-oss/tantivy/pull/2672)(@stuhood @PSeitz)

## Features/Improvements
- add docs/example and Vec<u32> values to sstable [#2660](https://github.com/quickwit-oss/tantivy/pull/2660)(@PSeitz)
- Add string fast field support to `TopDocs`. [#2642](https://github.com/quickwit-oss/tantivy/pull/2642)(@stuhood)
- update edition to 2024 [#2620](https://github.com/quickwit-oss/tantivy/pull/2620)(@PSeitz)
- Allow optional spaces between the field name and the value in the query parser [#2678](https://github.com/quickwit-oss/tantivy/pull/2678)(@Darkheir)
- Support mixed field types in query parser [#2676](https://github.com/quickwit-oss/tantivy/pull/2676)(@trinity-1686a)
- Add per-field size details [#2679](https://github.com/quickwit-oss/tantivy/pull/2679)(@fulmicoton)

Tantivy 0.24.2
================================
- Fix TopNComputer for reverse order. [#2672](https://github.com/quickwit-oss/tantivy/pull/2672)(@stuhood @PSeitz) 

Affected queries are [order_by_fast_field](https://docs.rs/tantivy/latest/tantivy/collector/struct.TopDocs.html#method.order_by_fast_field) and
[order_by_u64_field](https://docs.rs/tantivy/latest/tantivy/collector/struct.TopDocs.html#method.order_by_u64_field)
for `Order::Asc`

Tantivy 0.24.1
================================
- Fix: bump required rust version to 1.81
  
Tantivy 0.24
================================
Tantivy 0.24 will be backwards compatible with indices created with v0.22 and v0.21. The new minimum rust version will be 1.75. Tantivy 0.23 will be skipped.

#### Bugfixes
- fix potential endless loop in merge [#2457](https://github.com/quickwit-oss/tantivy/pull/2457)(@PSeitz)
- fix bug that causes out-of-order sstable key. [#2445](https://github.com/quickwit-oss/tantivy/pull/2445)(@fulmicoton)
- fix ReferenceValue API flaw [#2372](https://github.com/quickwit-oss/tantivy/pull/2372)(@PSeitz)
- fix `OwnedBytes` debug panic [#2512](https://github.com/quickwit-oss/tantivy/pull/2512)(@b41sh)
- catch panics during merges [#2582](https://github.com/quickwit-oss/tantivy/pull/2582)(@rdettai)
- switch from u32 to usize in bitpacker. This enables multivalued columns larger than 4GB, which crashed during merge before. [#2581](https://github.com/quickwit-oss/tantivy/pull/2581) [#2586](https://github.com/quickwit-oss/tantivy/pull/2586)(@fulmicoton-dd @PSeitz)

#### Breaking API Changes
- remove index sorting [#2434](https://github.com/quickwit-oss/tantivy/pull/2434)(@PSeitz)

#### Features/Improvements
- **Aggregation**
    - Support for cardinality aggregation [#2337](https://github.com/quickwit-oss/tantivy/pull/2337) [#2446](https://github.com/quickwit-oss/tantivy/pull/2446) (@raphaelcoeffic @PSeitz)
    - Support for extended stats aggregation [#2247](https://github.com/quickwit-oss/tantivy/pull/2247)(@giovannicuccu)
    - Add Key::I64 and Key::U64 variants in aggregation to avoid f64 precision issues [#2468](https://github.com/quickwit-oss/tantivy/pull/2468)(@PSeitz)
    - Faster term aggregation fetch terms [#2447](https://github.com/quickwit-oss/tantivy/pull/2447)(@PSeitz)
    - Improve custom order deserialization [#2451](https://github.com/quickwit-oss/tantivy/pull/2451)(@PSeitz)
    - Change AggregationLimits behavior [#2495](https://github.com/quickwit-oss/tantivy/pull/2495)(@PSeitz)
    - lower contention on AggregationLimits [#2394](https://github.com/quickwit-oss/tantivy/pull/2394)(@PSeitz)
    - fix postcard compatibility for top_hits, add postcard test [#2346](https://github.com/quickwit-oss/tantivy/pull/2346)(@PSeitz)
    - reduce top hits memory consumption [#2426](https://github.com/quickwit-oss/tantivy/pull/2426)(@PSeitz)
    - check unsupported parameters top_hits [#2351](https://github.com/quickwit-oss/tantivy/pull/2351)(@PSeitz)
    - Change AggregationLimits to AggregationLimitsGuard [#2495](https://github.com/quickwit-oss/tantivy/pull/2495)(@PSeitz)
    - add support for counting non integer in aggregation [#2547](https://github.com/quickwit-oss/tantivy/pull/2547)(@trinity-1686a)
- **Range Queries**
    - Support fast field range queries on json fields [#2456](https://github.com/quickwit-oss/tantivy/pull/2456)(@PSeitz)
    - Add support for str fast field range query [#2460](https://github.com/quickwit-oss/tantivy/pull/2460) [#2452](https://github.com/quickwit-oss/tantivy/pull/2452) [#2453](https://github.com/quickwit-oss/tantivy/pull/2453)(@PSeitz)
    - modify fastfield range query heuristic [#2375](https://github.com/quickwit-oss/tantivy/pull/2375)(@trinity-1686a)
    - add FastFieldRangeQuery for explicit range queries on fast field (for `RangeQuery` it is autodetected) [#2477](https://github.com/quickwit-oss/tantivy/pull/2477)(@PSeitz)

- add format backwards-compatibility tests [#2485](https://github.com/quickwit-oss/tantivy/pull/2485)(@PSeitz)
- add columnar format compatibility tests [#2433](https://github.com/quickwit-oss/tantivy/pull/2433)(@PSeitz)
- Improved snippet ranges algorithm [#2474](https://github.com/quickwit-oss/tantivy/pull/2474)(@gezihuzi)
- make find_field_with_default return json fields without path [#2476](https://github.com/quickwit-oss/tantivy/pull/2476)(@trinity-1686a)
- Make `BooleanQuery` support `minimum_number_should_match` [#2405](https://github.com/quickwit-oss/tantivy/pull/2405)(@LebranceBW)
- Make `NUM_MERGE_THREADS` configurable [#2535](https://github.com/quickwit-oss/tantivy/pull/2535)(@Barre)

- **RegexPhraseQuery** 
`RegexPhraseQuery` supports phrase queries with regex. E.g. query "b.* b.* wolf" matches "big bad wolf". Slop is supported as well: "b.* wolf"~2 matches "big bad wolf" [#2516](https://github.com/quickwit-oss/tantivy/pull/2516)(@PSeitz)

- **Optional Index in Multivalue Columnar Index** 
For mostly empty multivalued indices there was a large overhead during creation when iterating all docids (merge case). 
This is alleviated by placing an optional index in the multivalued index to mark documents that have values. 
This will slightly increase space and access time. [#2439](https://github.com/quickwit-oss/tantivy/pull/2439)(@PSeitz)

- **Store DateTime as nanoseconds in doc store** DateTime in the doc store was truncated to microseconds previously. This removes this truncation, while still keeping backwards compatibility. [#2486](https://github.com/quickwit-oss/tantivy/pull/2486)(@PSeitz)

- **Performance/Memory**
    - lift clauses in LogicalAst for optimized ast during execution [#2449](https://github.com/quickwit-oss/tantivy/pull/2449)(@PSeitz)
    - Use Vec instead of BTreeMap to back OwnedValue object [#2364](https://github.com/quickwit-oss/tantivy/pull/2364)(@fulmicoton)
    - Replace TantivyDocument with CompactDoc. CompactDoc is much smaller and provides similar performance. [#2402](https://github.com/quickwit-oss/tantivy/pull/2402)(@PSeitz)
    - Recycling buffer in PrefixPhraseScorer [#2443](https://github.com/quickwit-oss/tantivy/pull/2443)(@fulmicoton)

- **Json Type**
    - JSON supports now all values on the root level. Previously an object was required. This enables support for flat mixed types. allow more JSON values, fix i64 special case [#2383](https://github.com/quickwit-oss/tantivy/pull/2383)(@PSeitz)
    - add json path constructor to term [#2367](https://github.com/quickwit-oss/tantivy/pull/2367)(@PSeitz)

- **QueryParser**
    - fix de-escaping too much in query parser [#2427](https://github.com/quickwit-oss/tantivy/pull/2427)(@trinity-1686a)
    - improve query parser [#2416](https://github.com/quickwit-oss/tantivy/pull/2416)(@trinity-1686a)
    - Support field grouping `title:(return AND "pink panther")` [#2333](https://github.com/quickwit-oss/tantivy/pull/2333)(@trinity-1686a)
    - allow term starting with wildcard [#2568](https://github.com/quickwit-oss/tantivy/pull/2568)(@trinity-1686a)

- Exist queries match subpath fields [#2558](https://github.com/quickwit-oss/tantivy/pull/2558)(@rdettai)
- add access benchmark for columnar [#2432](https://github.com/quickwit-oss/tantivy/pull/2432)(@PSeitz)
- extend indexwriter proptests [#2342](https://github.com/quickwit-oss/tantivy/pull/2342)(@PSeitz)
- add bench & test for columnar merging [#2428](https://github.com/quickwit-oss/tantivy/pull/2428)(@PSeitz)
- Change in Executor API [#2391](https://github.com/quickwit-oss/tantivy/pull/2391)(@fulmicoton)
- Removed usage of num_cpus [#2387](https://github.com/quickwit-oss/tantivy/pull/2387)(@fulmicoton)
- use binggan for agg and stacker benchmark [#2378](https://github.com/quickwit-oss/tantivy/pull/2378) [#2492](https://github.com/quickwit-oss/tantivy/pull/2492)(@PSeitz)
- cleanup top level exports [#2382](https://github.com/quickwit-oss/tantivy/pull/2382)(@PSeitz)
- make convert_to_fast_value_and_append_to_json_term pub [#2370](https://github.com/quickwit-oss/tantivy/pull/2370)(@PSeitz)
- remove JsonTermWriter [#2238](https://github.com/quickwit-oss/tantivy/pull/2238)(@PSeitz)
- validate sort by field type [#2336](https://github.com/quickwit-oss/tantivy/pull/2336)(@PSeitz)
- Fix trait bound of StoreReader::iter [#2360](https://github.com/quickwit-oss/tantivy/pull/2360)(@adamreichold)
- remove read_postings_no_deletes [#2526](https://github.com/quickwit-oss/tantivy/pull/2526)(@PSeitz)

Tantivy 0.22.1
================================
- Fix TopNComputer for reverse order. [#2672](https://github.com/quickwit-oss/tantivy/pull/2672)(@stuhood @PSeitz) 

Affected queries are [order_by_fast_field](https://docs.rs/tantivy/latest/tantivy/collector/struct.TopDocs.html#method.order_by_fast_field) and
[order_by_u64_field](https://docs.rs/tantivy/latest/tantivy/collector/struct.TopDocs.html#method.order_by_u64_field)
for `Order::Asc`

Tantivy 0.22
================================

Tantivy 0.22 will be able to read indices created with Tantivy 0.21.

#### Bugfixes
- Fix null byte handling in JSON paths (null bytes in json keys caused panic during indexing) [#2345](https://github.com/quickwit-oss/tantivy/pull/2345)(@PSeitz)
- Fix bug that can cause `get_docids_for_value_range` to panic. [#2295](https://github.com/quickwit-oss/tantivy/pull/2295)(@fulmicoton)
- Avoid 1 document indices by increase min memory to 15MB for indexing [#2176](https://github.com/quickwit-oss/tantivy/pull/2176)(@PSeitz)
- Fix merge panic for JSON fields [#2284](https://github.com/quickwit-oss/tantivy/pull/2284)(@PSeitz)
- Fix bug occurring when merging JSON object indexed with positions. [#2253](https://github.com/quickwit-oss/tantivy/pull/2253)(@fulmicoton)
- Fix empty DateHistogram gap bug [#2183](https://github.com/quickwit-oss/tantivy/pull/2183)(@PSeitz)
- Fix range query end check (fields with less than 1 value per doc are affected) [#2226](https://github.com/quickwit-oss/tantivy/pull/2226)(@PSeitz)
- Handle exclusive out of bounds ranges on fastfield range queries [#2174](https://github.com/quickwit-oss/tantivy/pull/2174)(@PSeitz)

#### Breaking API Changes
- rename ReloadPolicy onCommit to onCommitWithDelay [#2235](https://github.com/quickwit-oss/tantivy/pull/2235)(@giovannicuccu)
- Move exports from the root into modules [#2220](https://github.com/quickwit-oss/tantivy/pull/2220)(@PSeitz)
- Accept field name instead of `Field` in FilterCollector [#2196](https://github.com/quickwit-oss/tantivy/pull/2196)(@PSeitz)
- remove deprecated IntOptions and DateTime [#2353](https://github.com/quickwit-oss/tantivy/pull/2353)(@PSeitz)

#### Features/Improvements
- Tantivy documents as a trait: Index data directly without converting to tantivy types first [#2071](https://github.com/quickwit-oss/tantivy/pull/2071)(@ChillFish8)
- encode some part of posting list as -1 instead of direct values (smaller inverted indices) [#2185](https://github.com/quickwit-oss/tantivy/pull/2185)(@trinity-1686a)
- **Aggregation**
  - Support to deserialize f64 from string [#2311](https://github.com/quickwit-oss/tantivy/pull/2311)(@PSeitz)
  - Add a top_hits aggregator [#2198](https://github.com/quickwit-oss/tantivy/pull/2198)(@ditsuke)
  - Support bool type in term aggregation [#2318](https://github.com/quickwit-oss/tantivy/pull/2318)(@PSeitz)
  - Support ip addresses in term aggregation [#2319](https://github.com/quickwit-oss/tantivy/pull/2319)(@PSeitz)
  - Support date type in term aggregation [#2172](https://github.com/quickwit-oss/tantivy/pull/2172)(@PSeitz)
  - Support escaped dot when addressing field [#2250](https://github.com/quickwit-oss/tantivy/pull/2250)(@PSeitz)

- Add ExistsQuery to check documents that have a value [#2160](https://github.com/quickwit-oss/tantivy/pull/2160)(@imotov)
- Expose TopDocs::order_by_u64_field again [#2282](https://github.com/quickwit-oss/tantivy/pull/2282)(@ditsuke)

- **Memory/Performance**
  - Faster TopN: replace BinaryHeap with TopNComputer [#2186](https://github.com/quickwit-oss/tantivy/pull/2186)(@PSeitz)
  - reduce number of allocations during indexing [#2257](https://github.com/quickwit-oss/tantivy/pull/2257)(@PSeitz)
  - Less Memory while indexing: docid deltas while indexing [#2249](https://github.com/quickwit-oss/tantivy/pull/2249)(@PSeitz)
  - Faster indexing: use term hashmap in fastfield [#2243](https://github.com/quickwit-oss/tantivy/pull/2243)(@PSeitz)
  - term hashmap remove copy in is_empty, unused unordered_id [#2229](https://github.com/quickwit-oss/tantivy/pull/2229)(@PSeitz)
  - add method to fetch block of first values in columnar [#2330](https://github.com/quickwit-oss/tantivy/pull/2330)(@PSeitz)
  - Faster aggregations: add fast path for full columns in fetch_block [#2328](https://github.com/quickwit-oss/tantivy/pull/2328)(@PSeitz)
  - Faster sstable loading: use fst for sstable index [#2268](https://github.com/quickwit-oss/tantivy/pull/2268)(@trinity-1686a)

- **QueryParser**
  - allow newline where we allow space in query parser [#2302](https://github.com/quickwit-oss/tantivy/pull/2302)(@trinity-1686a)
  - allow some mixing of occur and bool in strict query parser [#2323](https://github.com/quickwit-oss/tantivy/pull/2323)(@trinity-1686a)
  - handle * inside term in lenient query parser [#2228](https://github.com/quickwit-oss/tantivy/pull/2228)(@trinity-1686a)
  - add support for exists query syntax in query parser [#2170](https://github.com/quickwit-oss/tantivy/pull/2170)(@trinity-1686a)
- Add shared search executor [#2312](https://github.com/quickwit-oss/tantivy/pull/2312)(@MochiXu)
- Truncate keys to u16::MAX in term hashmap [#2299](https://github.com/quickwit-oss/tantivy/pull/2299)(@PSeitz)
- report if a term matched when warming up posting list [#2309](https://github.com/quickwit-oss/tantivy/pull/2309)(@trinity-1686a)
- Support json fields in FuzzyTermQuery [#2173](https://github.com/quickwit-oss/tantivy/pull/2173)(@PingXia-at)
- Read list of fields encoded in term dictionary for JSON fields [#2184](https://github.com/quickwit-oss/tantivy/pull/2184)(@PSeitz)
- add collect_block to BoxableSegmentCollector [#2331](https://github.com/quickwit-oss/tantivy/pull/2331)(@PSeitz)
- expose collect_block buffer size [#2326](https://github.com/quickwit-oss/tantivy/pull/2326)(@PSeitz)
- Forward regex parser errors [#2288](https://github.com/quickwit-oss/tantivy/pull/2288)(@adamreichold)
- Make FacetCounts defaultable and cloneable. [#2322](https://github.com/quickwit-oss/tantivy/pull/2322)(@adamreichold)
- Derive Debug for SchemaBuilder [#2254](https://github.com/quickwit-oss/tantivy/pull/2254)(@GodTamIt)
- add missing inlines to tantivy options [#2245](https://github.com/quickwit-oss/tantivy/pull/2245)(@PSeitz)

Tantivy 0.21.1
================================
#### Bugfixes
- Range queries on fast fields with less values on that field than documents had an invalid end condition, leading to missing results. [#2226](https://github.com/quickwit-oss/tantivy/issues/2226)(@appaquet @PSeitz)
- Increase the minimum memory budget from 3MB to 15MB to avoid single doc segments (API fix). [#2176](https://github.com/quickwit-oss/tantivy/issues/2176)(@PSeitz)

Tantivy 0.21
================================
#### Bugfixes
- Fix track fast field memory consumption, which led to higher memory consumption than the budget allowed during indexing [#2148](https://github.com/quickwit-oss/tantivy/issues/2148)[#2147](https://github.com/quickwit-oss/tantivy/issues/2147)(@PSeitz)
- Fix a regression from 0.20 where sort index by date wasn't working anymore [#2124](https://github.com/quickwit-oss/tantivy/issues/2124)(@PSeitz)
- Fix getting the root facet on the `FacetCollector`. [#2086](https://github.com/quickwit-oss/tantivy/issues/2086)(@adamreichold)
- Align numerical type priority order of columnar and query. [#2088](https://github.com/quickwit-oss/tantivy/issues/2088)(@fmassot)
#### Breaking Changes
- Remove support for Brotli and Snappy compression [#2123](https://github.com/quickwit-oss/tantivy/issues/2123)(@adamreichold)
#### Features/Improvements
- Implement lenient query parser [#2129](https://github.com/quickwit-oss/tantivy/pull/2129)(@trinity-1686a)
- order_by_u64_field and order_by_fast_field allow sorting in ascending and descending order [#2111](https://github.com/quickwit-oss/tantivy/issues/2111)(@naveenann)
- Allow dynamic filters in text analyzer builder [#2110](https://github.com/quickwit-oss/tantivy/issues/2110)(@fulmicoton @fmassot)
- **Aggregation**
  - Add missing parameter for term aggregation [#2149](https://github.com/quickwit-oss/tantivy/issues/2149)[#2103](https://github.com/quickwit-oss/tantivy/issues/2103)(@PSeitz)
  - Add missing parameter for percentiles [#2157](https://github.com/quickwit-oss/tantivy/issues/2157)(@PSeitz)
  - Add missing parameter for stats,min,max,count,sum,avg [#2151](https://github.com/quickwit-oss/tantivy/issues/2151)(@PSeitz)
  - Improve aggregation deserialization error message [#2150](https://github.com/quickwit-oss/tantivy/issues/2150)(@PSeitz)
  - Add validation for type Bytes to term_agg [#2077](https://github.com/quickwit-oss/tantivy/issues/2077)(@PSeitz)
  - Alternative mixed field collection [#2135](https://github.com/quickwit-oss/tantivy/issues/2135)(@PSeitz)
- Add missing query_terms impl for TermSetQuery. [#2120](https://github.com/quickwit-oss/tantivy/issues/2120)(@adamreichold)
- Minor improvements to OwnedBytes [#2134](https://github.com/quickwit-oss/tantivy/issues/2134)(@adamreichold)
- Remove allocations in split compound words [#2080](https://github.com/quickwit-oss/tantivy/issues/2080)(@PSeitz)
- Ngram tokenizer now returns an error with invalid arguments [#2102](https://github.com/quickwit-oss/tantivy/issues/2102)(@fmassot)
- Make TextAnalyzerBuilder public [#2097](https://github.com/quickwit-oss/tantivy/issues/2097)(@adamreichold)
- Return an error when tokenizer is not found while indexing [#2093](https://github.com/quickwit-oss/tantivy/issues/2093)(@naveenann)
- Delayed column opening during merge [#2132](https://github.com/quickwit-oss/tantivy/issues/2132)(@PSeitz)

Tantivy 0.20.2
================================
- Align numerical type priority order on the search side.  [#2088](https://github.com/quickwit-oss/tantivy/issues/2088) (@fmassot)
- Fix is_child_of function not considering the root facet. [#2086](https://github.com/quickwit-oss/tantivy/issues/2086) (@adamreichold)

Tantivy 0.20.1
================================
- Fix building on windows with mmap [#2070](https://github.com/quickwit-oss/tantivy/issues/2070) (@ChillFish8)

Tantivy 0.20
================================
#### Bugfixes
- Fix phrase queries with slop (slop now supports transpositions, algorithm that carries slop so far for num terms > 2) [#2031](https://github.com/quickwit-oss/tantivy/issues/2031)[#2020](https://github.com/quickwit-oss/tantivy/issues/2020)(@PSeitz)
- Handle error for exists on MMapDirectory [#1988](https://github.com/quickwit-oss/tantivy/issues/1988) (@PSeitz)
- Aggregation
  - Fix min doc_count empty merge bug [#2057](https://github.com/quickwit-oss/tantivy/issues/2057) (@PSeitz)
  - Fix: Sort order for term aggregations (sort order on key was inverted) [#1858](https://github.com/quickwit-oss/tantivy/issues/1858) (@PSeitz)

#### Features/Improvements
- Add PhrasePrefixQuery [#1842](https://github.com/quickwit-oss/tantivy/issues/1842) (@trinity-1686a)
- Add `coerce` option for text and numbers types (convert the value instead of returning an error during indexing) [#1904](https://github.com/quickwit-oss/tantivy/issues/1904) (@PSeitz)
- Add regex tokenizer [#1759](https://github.com/quickwit-oss/tantivy/issues/1759)(@mkleen)
- Move tokenizer API to separate crate. Having a separate crate with a stable API will allow us to use tokenizers with different tantivy versions. [#1767](https://github.com/quickwit-oss/tantivy/issues/1767) (@PSeitz)
- **Columnar crate**: New fast field handling (@fulmicoton @PSeitz) [#1806](https://github.com/quickwit-oss/tantivy/issues/1806)[#1809](https://github.com/quickwit-oss/tantivy/issues/1809)
  - Support for fast fields with optional values. Previously tantivy supported only single-valued and multi-value fast fields. The encoding of optional fast fields is now very compact.
  - Fast field Support for JSON (schemaless fast fields). Support multiple types on the same column. [#1876](https://github.com/quickwit-oss/tantivy/issues/1876) (@fulmicoton)
  - Unified access for fast fields over different cardinalities.
  - Unified storage for typed and untyped fields.
  - Move fastfield codecs into columnar. [#1782](https://github.com/quickwit-oss/tantivy/issues/1782) (@fulmicoton)
  - Sparse dense index for optional values [#1716](https://github.com/quickwit-oss/tantivy/issues/1716) (@PSeitz)
  - Switch to nanosecond precision in DateTime fastfield [#2016](https://github.com/quickwit-oss/tantivy/issues/2016) (@PSeitz)
- **Aggregation**
  - Add `date_histogram` aggregation (only `fixed_interval` for now) [#1900](https://github.com/quickwit-oss/tantivy/issues/1900) (@PSeitz)
  - Add `percentiles` aggregations [#1984](https://github.com/quickwit-oss/tantivy/issues/1984) (@PSeitz)
  - [**breaking**] Drop JSON support on intermediate agg result (we use postcard as format in `quickwit` to send intermediate results) [#1992](https://github.com/quickwit-oss/tantivy/issues/1992) (@PSeitz)
  - Set memory limit in bytes for aggregations after which they abort (Previously there was only the bucket limit) [#1942](https://github.com/quickwit-oss/tantivy/issues/1942)[#1957](https://github.com/quickwit-oss/tantivy/issues/1957)(@PSeitz)
  - Add support for u64,i64,f64 fields in term aggregation [#1883](https://github.com/quickwit-oss/tantivy/issues/1883) (@PSeitz)
  - Allow histogram bounds to be passed as Rfc3339 [#2076](https://github.com/quickwit-oss/tantivy/issues/2076) (@PSeitz)
  - Add count, min, max, and sum aggregations [#1794](https://github.com/quickwit-oss/tantivy/issues/1794) (@guilload)
  - Switch to Aggregation without serde_untagged => better deserialization errors. [#2003](https://github.com/quickwit-oss/tantivy/issues/2003) (@PSeitz)
  - Switch to ms in histogram for date type (ES compatibility) [#2045](https://github.com/quickwit-oss/tantivy/issues/2045) (@PSeitz)
  - Reduce term aggregation memory consumption [#2013](https://github.com/quickwit-oss/tantivy/issues/2013) (@PSeitz)
  - Reduce agg memory consumption: Replace generic aggregation collector (which has a high memory requirement per instance) in aggregation tree with optimized versions behind a trait.
  - Split term collection count and sub_agg (Faster term agg with less memory consumption for cases without sub-aggs) [#1921](https://github.com/quickwit-oss/tantivy/issues/1921) (@PSeitz)
  - Schemaless aggregations: In combination with stacker tantivy now supports schemaless aggregations via the JSON type.
    - Add aggregation support for JSON type [#1888](https://github.com/quickwit-oss/tantivy/issues/1888) (@PSeitz)
    - Mixed types support on JSON fields in aggs [#1971](https://github.com/quickwit-oss/tantivy/issues/1971) (@PSeitz)
  - Perf: Fetch blocks of vals in aggregation for all cardinality [#1950](https://github.com/quickwit-oss/tantivy/issues/1950) (@PSeitz)
  - Allow histogram bounds to be passed as Rfc3339 [#2076](https://github.com/quickwit-oss/tantivy/issues/2076) (@PSeitz)
- `Searcher` with disabled scoring via `EnableScoring::Disabled` [#1780](https://github.com/quickwit-oss/tantivy/issues/1780) (@shikhar)
- Enable tokenizer on json fields [#2053](https://github.com/quickwit-oss/tantivy/issues/2053) (@PSeitz)
- Enforcing "NOT" and "-" queries consistency in UserInputAst [#1609](https://github.com/quickwit-oss/tantivy/issues/1609) (@bazhenov)
- Faster indexing
  - Refactor tokenization pipeline to use GATs [#1924](https://github.com/quickwit-oss/tantivy/issues/1924) (@trinity-1686a)
  - Faster term hash map [#2058](https://github.com/quickwit-oss/tantivy/issues/2058)[#1940](https://github.com/quickwit-oss/tantivy/issues/1940) (@PSeitz)
  - tokenizer-api: reduce Tokenizer allocation overhead [#2062](https://github.com/quickwit-oss/tantivy/issues/2062) (@PSeitz)
  - Refactor vint [#2010](https://github.com/quickwit-oss/tantivy/issues/2010) (@PSeitz)
- Faster search
  - Work in batches of docs on the SegmentCollector (Only for cases without score for now) [#1937](https://github.com/quickwit-oss/tantivy/issues/1937) (@PSeitz)
  - Faster fast field range queries using SIMD [#1954](https://github.com/quickwit-oss/tantivy/issues/1954) (@fulmicoton)
  - Improve fast field range query performance [#1864](https://github.com/quickwit-oss/tantivy/issues/1864) (@PSeitz)
- Make BM25 scoring more flexible [#1855](https://github.com/quickwit-oss/tantivy/issues/1855) (@alexcole)
- Switch fs2 to fs4 as it is now unmaintained and does not support illumos [#1944](https://github.com/quickwit-oss/tantivy/issues/1944) (@Toasterson)
- Made BooleanWeight and BoostWeight public [#1991](https://github.com/quickwit-oss/tantivy/issues/1991) (@fulmicoton)
- Make index compatible with virtual drives on Windows [#1843](https://github.com/quickwit-oss/tantivy/issues/1843) (@gyk)
- Add stop words for Hungarian language [#2069](https://github.com/quickwit-oss/tantivy/issues/2069) (@tnxbutno)
- Auto downgrade index record option, instead of vint error [#1857](https://github.com/quickwit-oss/tantivy/issues/1857) (@PSeitz)
- Enable range query on fast field for u64 compatible types [#1762](https://github.com/quickwit-oss/tantivy/issues/1762) [#1876](https://github.com/quickwit-oss/tantivy/issues/1876) (@PSeitz)
- sstable
  - Isolating sstable and stacker in independent crates. [#1718](https://github.com/quickwit-oss/tantivy/issues/1718) (@fulmicoton)
  - New sstable format [#1943](https://github.com/quickwit-oss/tantivy/issues/1943)[#1953](https://github.com/quickwit-oss/tantivy/issues/1953) (@trinity-1686a)
  - Use DeltaReader directly to implement Dictionary::ord_to_term [#1928](https://github.com/quickwit-oss/tantivy/issues/1928) (@trinity-1686a)
  - Use DeltaReader directly to implement Dictionary::term_ord [#1925](https://github.com/quickwit-oss/tantivy/issues/1925) (@trinity-1686a)
- Add separate tokenizer manager for fast fields [#2019](https://github.com/quickwit-oss/tantivy/issues/2019) (@PSeitz)
- Make construction of LevenshteinAutomatonBuilder for FuzzyTermQuery instances lazy. [#1756](https://github.com/quickwit-oss/tantivy/issues/1756) (@adamreichold)
- Added support for madvise when opening an mmapped Index [#2036](https://github.com/quickwit-oss/tantivy/issues/2036) (@fulmicoton)
- Rename `DatePrecision` to `DateTimePrecision` [#2051](https://github.com/quickwit-oss/tantivy/issues/2051) (@guilload)
- Query Parser
  - Quotation mark can now be used for phrase queries. [#2050](https://github.com/quickwit-oss/tantivy/issues/2050) (@fulmicoton)
  - PhrasePrefixQuery is supported in the query parser via: `field:"phrase ter"*` [#2044](https://github.com/quickwit-oss/tantivy/issues/2044) (@adamreichold)
- Docs
  - Update examples for literate docs [#1880](https://github.com/quickwit-oss/tantivy/issues/1880) (@PSeitz)
  - Add ip field example [#1775](https://github.com/quickwit-oss/tantivy/issues/1775) (@PSeitz)
  - Fix doc store cache documentation [#1821](https://github.com/quickwit-oss/tantivy/issues/1821) (@PSeitz)
  - Fix BooleanQuery document [#1999](https://github.com/quickwit-oss/tantivy/issues/1999) (@RT_Enzyme)
  - Update comments in the faceted search example [#1737](https://github.com/quickwit-oss/tantivy/issues/1737) (@DawChihLiou)


Tantivy 0.19
================================
#### Bugfixes
- Fix missing fieldnorms for u64, i64, f64, bool, bytes and date [#1620](https://github.com/quickwit-oss/tantivy/pull/1620) (@PSeitz)
- Fix interpolation overflow in linear interpolation fastfield codec [#1480](https://github.com/quickwit-oss/tantivy/pull/1480) (@PSeitz @fulmicoton)

#### Features/Improvements
- Add support for `IN` in queryparser, e.g. `field: IN [val1 val2 val3]` [#1683](https://github.com/quickwit-oss/tantivy/pull/1683) (@trinity-1686a)
- Skip score calculation, when no scoring is required [#1646](https://github.com/quickwit-oss/tantivy/pull/1646) (@PSeitz)
- Limit fast fields to u32 (`get_val(u32)`) [#1644](https://github.com/quickwit-oss/tantivy/pull/1644) (@PSeitz)
- The `DateTime` type has been updated to hold timestamps with microseconds precision.
  `DateOptions` and `DatePrecision` have been added to configure Date fields. The precision is used to hint on fast values compression. Otherwise, seconds precision is used everywhere else (i.e terms, indexing) [#1396](https://github.com/quickwit-oss/tantivy/pull/1396) (@evanxg852000)
- Add IP address field type [#1553](https://github.com/quickwit-oss/tantivy/pull/1553) (@PSeitz)
- Add boolean field type [#1382](https://github.com/quickwit-oss/tantivy/pull/1382) (@boraarslan)
- Remove Searcher pool and make `Searcher` cloneable. (@PSeitz)
- Validate settings on create [#1570](https://github.com/quickwit-oss/tantivy/pull/1570) (@PSeitz)
- Detect and apply gcd on fastfield codecs [#1418](https://github.com/quickwit-oss/tantivy/pull/1418) (@PSeitz)
- Doc store
  - use separate thread to compress block store [#1389](https://github.com/quickwit-oss/tantivy/pull/1389) [#1510](https://github.com/quickwit-oss/tantivy/pull/1510) (@PSeitz @fulmicoton)
  - Expose doc store cache size [#1403](https://github.com/quickwit-oss/tantivy/pull/1403) (@PSeitz)
  - Enable compression levels for doc store [#1378](https://github.com/quickwit-oss/tantivy/pull/1378) (@PSeitz)
  - Make block size configurable [#1374](https://github.com/quickwit-oss/tantivy/pull/1374) (@kryesh)
- Make `tantivy::TantivyError` cloneable [#1402](https://github.com/quickwit-oss/tantivy/pull/1402) (@PSeitz)
- Add support for phrase slop in query language [#1393](https://github.com/quickwit-oss/tantivy/pull/1393) (@saroh)
- Aggregation
  - Add aggregation support for date type [#1693](https://github.com/quickwit-oss/tantivy/pull/1693)(@PSeitz)
  - Add support for keyed parameter in range and histogram aggregations [#1424](https://github.com/quickwit-oss/tantivy/pull/1424) (@k-yomo)
  - Add aggregation bucket limit [#1363](https://github.com/quickwit-oss/tantivy/pull/1363) (@PSeitz)
- Faster indexing
  - [#1610](https://github.com/quickwit-oss/tantivy/pull/1610) (@PSeitz)
  - [#1594](https://github.com/quickwit-oss/tantivy/pull/1594) (@PSeitz)
  - [#1582](https://github.com/quickwit-oss/tantivy/pull/1582) (@PSeitz)
  - [#1611](https://github.com/quickwit-oss/tantivy/pull/1611) (@PSeitz)
  - Added a pre-configured stop word filter for various languages [#1666](https://github.com/quickwit-oss/tantivy/pull/1666) (@adamreichold)

Tantivy 0.18
================================

- For date values `chrono` has been replaced with `time` (@uklotzde) #1304 :
  - The `time` crate is re-exported as `tantivy::time` instead of `tantivy::chrono`.
  - The type alias `tantivy::DateTime` has been removed.
  - `Value::Date` wraps `time::PrimitiveDateTime` without time zone information.
  - Internally date/time values are stored as seconds since UNIX epoch in UTC.
  - Converting a `time::OffsetDateTime` to `Value::Date` implicitly converts the value into UTC.
    If this is not desired do the time zone conversion yourself and use `time::PrimitiveDateTime`
    directly instead.
- Add [histogram](https://github.com/quickwit-oss/tantivy/pull/1306) aggregation (@PSeitz)
- Add support for fastfield on text fields (@PSeitz)
- Add terms aggregation (@PSeitz)
- Add support for zstd compression (@kryesh)

Tantivy 0.18.1
================================
- Hotfix: positions computation.  #1629 (@fmassot, @fulmicoton, @PSeitz)

Tantivy 0.17
================================

- LogMergePolicy now triggers merges if the ratio of deleted documents reaches a threshold (@shikhar @fulmicoton) [#115](https://github.com/quickwit-oss/tantivy/issues/115)
- Adds a searcher Warmer API (@shikhar @fulmicoton)
- Change to non-strict schema. Ignore fields in data which are not defined in schema. Previously this returned an error. #1211
- Facets are necessarily indexed. Existing index with indexed facets should work out of the box. Index without facets that are marked with index: false should be broken (but they were already broken in a sense). (@fulmicoton) #1195 .
- Bugfix that could in theory impact durability on some filesystems [#1224](https://github.com/quickwit-oss/tantivy/issues/1224)
- Schema now offers not indexing fieldnorms (@lpouget) [#922](https://github.com/quickwit-oss/tantivy/issues/922)
- Reduce the number of fsync calls [#1225](https://github.com/quickwit-oss/tantivy/issues/1225)
- Fix opening bytes index with dynamic codec (@PSeitz) [#1278](https://github.com/quickwit-oss/tantivy/issues/1278)
- Added an aggregation collector for range, average and stats compatible with Elasticsearch. (@PSeitz)
- Added a JSON schema type @fulmicoton [#1251](https://github.com/quickwit-oss/tantivy/issues/1251)
- Added support for slop in phrase queries @halvorboe [#1068](https://github.com/quickwit-oss/tantivy/issues/1068)

Tantivy 0.16.2
================================

- Bugfix in FuzzyTermQuery. (transposition_cost_one was not doing anything)

Tantivy 0.16.1
========================

- Major Bugfix on multivalued fastfield.  #1151
- Demux operation (@PSeitz)

Tantivy 0.16.0
=========================

- Bugfix in the filesum check. (@evanxg852000) #1127
- Bugfix in positions when the index is sorted by a field. (@appaquet) #1125

Tantivy 0.15.3
=========================

- Major bugfix. Deleting documents was broken when the index was sorted by a field. (@appaquet, @fulmicoton) #1101

Tantivy 0.15.2
========================

- Major bugfix. DocStore still panics when a deleted doc is at the beginning of a block. (@appaquet) #1088

Tantivy 0.15.1
=========================

- Major bugfix. DocStore panics when first block is deleted. (@appaquet) #1077

Tantivy 0.15.0
=========================

- API Changes. Using Range instead of (start, end) in the API and internals (`FileSlice`, `OwnedBytes`, `Snippets`, ...)
  This change is breaking but migration is trivial.
- Added a Histogram collector. (@fulmicoton) #994
- Added support for Option<TCollector>.  (@fulmicoton)
- DocAddress is now a struct (@scampi) #987
- Bugfix consistent tie break handling in facet's topk (@hardikpnsp) #357
- Date field support for range queries (@rihardsk) #516
- Added lz4-flex as the default compression scheme in tantivy (@PSeitz) #1009
- Renamed a lot of symbols to avoid all uppercasing on acronyms, as per new clippy recommendation. For instance, RAMDirectory -> RamDirectory. (@fulmicoton)
- Simplified positions index format (@fulmicoton) #1022
- Moved bitpacking to bitpacker subcrate and add BlockedBitpacker, which bitpacks blocks of 128 elements (@PSeitz) #1030
- Added support for more-like-this query in tantivy (@evanxg852000) #1011
- Added support for sorting an index, e.g presorting documents in an index by a timestamp field. This can heavily improve performance for certain scenarios, by utilizing the sorted data (Top-n optimizations)(@PSeitz). #1026
- Add iterator over documents in doc store (@PSeitz). #1044
- Fix log merge policy (@PSeitz). #1043
- Add detection to avoid small doc store blocks on merge (@PSeitz). #1054
- Make doc store compression dynamic (@PSeitz). #1060
- Switch to json for footer version handling (@PSeitz). #1060
- Updated TermMerger implementation to rely on the union feature of the FST (@scampi) #469
- Add boolean marking whether position is required in the query_terms API call (@fulmicoton). #1070

Tantivy 0.14.0
=========================

- Remove dependency to atomicwrites #833. (Implemented by @fulmicoton upon suggestion and research from @asafigan).
- Migrated tantivy error from the now deprecated `failure` crate to `thiserror` #760. (@hirevo)
- API Change. Accessing the typed value off a `Schema::Value` now returns an Option instead of panicking if the type does not match.
- Large API Change in the Directory API. Tantivy used to assume that all files could be somehow memory mapped. After this change, Directory returns a `FileSlice` that can be reduced and eventually read into an `OwnedBytes` object. Long and blocking io operations are still required but they do not span over the entire file.
- Added support for Brotli compression in the DocStore. (@ppodolsky)
- Added helper for building intersections and unions in BooleanQuery (@guilload)
- Bugfix in `Query::explain`
- Removed dependency on `notify` #924. Replaced with `FileWatcher` struct that polls meta file every 500ms in background thread. (@halvorboe @guilload)
- Added `FilterCollector`, which wraps another collector and filters docs using a predicate over a fast field (@barrotsteindev)
- Simplified the encoding of the skip reader struct. BlockWAND max tf is now encoded over a single byte. (@fulmicoton)
- `FilterCollector` now supports all Fast Field value types (@barrotsteindev)
- FastField are not all loaded when opening the segment reader. (@fulmicoton)
- Added an API to merge segments, see `tantivy::merge_segments` #1005. (@evanxg852000)

This version breaks compatibility and requires users to reindex everything.

Tantivy 0.13.2
===================

Bugfix. Acquiring a facet reader on a segment that does not contain any
doc with this facet returns `None`. (#896)

Tantivy 0.13.1
===================

Made `Query` and `Collector` `Send + Sync`.
Updated misc dependency versions.

Tantivy 0.13.0
======================

Tantivy 0.13 introduces a change in the index format that will require
you to reindex your index (BlockWAND information is added in the skiplist).
The index size increase is minor as this information is only added for
full blocks.
If you have a massive index for which reindexing is not an option, please contact me
so that we can discuss possible solutions.

- Bugfix in `FuzzyTermQuery` not matching terms by prefix when it should (@Peachball)
- Relaxed constraints on the custom/tweak score functions. At the segment level, they can be mut, and they are not required to be Sync + Send.
- `MMapDirectory::open` does not return a `Result` anymore.
- Change in the DocSet and Scorer API. (@fulmicoton).
A freshly created DocSet points directly to its first doc. A sentinel value called TERMINATED marks the end of a DocSet.
`.advance()` returns the new DocId. `Scorer::skip(target)` has been replaced by `Scorer::seek(target)` and returns the resulting DocId.
As a result, iterating through DocSet now looks as follows

```rust
let mut doc = docset.doc();
while doc != TERMINATED {
   // ...
   doc = docset.advance();
}
```

The change made it possible to greatly simplify a lot of the docset's code.

- Misc internal optimization and introduction of the `Scorer::for_each_pruning` function. (@fulmicoton)
- Added an offset option to the Top(.*)Collectors. (@robyoung)
- Added Block WAND. Performance on TOP-K on term-unions should be greatly increased. (@fulmicoton, and special thanks
to the PISA team for answering all my questions!)

Tantivy 0.12.0
======================

- Removing static dispatch in tokenizers for simplicity. (#762)
- Added backward iteration for `TermDictionary` stream. (@halvorboe)
- Fixed a performance issue when searching for the posting lists of a missing term (@audunhalland)
- Added a configurable maximum number of docs (10M by default) for a segment to be considered for merge (@hntd187, landed by @halvorboe #713)
- Important Bugfix #777, causing tantivy to retain memory mapping. (diagnosed by @poljar)
- Added support for field boosting. (#547, @fulmicoton)

## How to update?

Crates relying on custom tokenizer, or registering tokenizer in the manager will require some
minor changes. See <https://github.com/quickwit-oss/tantivy/blob/main/examples/custom_tokenizer.rs>
for a code sample.

Tantivy 0.11.3
=======================

- Fixed DateTime as a fast field (#735)

Tantivy 0.11.2
=======================

- The future returned by `IndexWriter::merge` does not borrow `self` mutably anymore (#732)
- Exposing a constructor for `WatchHandle` (#731)

Tantivy 0.11.1
=====================

- Bug fix #729

Tantivy 0.11.0
=====================

- Added f64 field. Internally reuse u64 code the same way i64 does (@fdb-hiroshima)
- Various bugfixes in the query parser.
  - Better handling of hyphens in query parser. (#609)
  - Better handling of whitespaces.
- Closes #498 - add support for Elastic-style unbounded range queries for alphanumeric types eg. "title:>hello", "weight:>=70.5", "height:<200" (@petr-tik)
- API change around `Box<BoxableTokenizer>`. See detail in #629
- Avoid rebuilding Regex automaton whenever a regex query is reused. #639 (@brainlock)
- Add footer with some metadata to index files. #605 (@fdb-hiroshima)
- Add a method to check the compatibility of the footer in the index with the running version of tantivy (@petr-tik)
- TopDocs collector: ensure stable sorting on equal score. #671 (@brainlock)
- Added handling of pre-tokenized text fields (#642), which will enable users to
  load tokens created outside tantivy. See usage in examples/pre_tokenized_text. (@kkoziara)
- Fix crash when committing multiple times with deleted documents. #681 (@brainlock)

## How to update?

- The index format is changed. You are required to reindex your data to use tantivy 0.11.
- `Box<dyn BoxableTokenizer>` has been replaced by a `BoxedTokenizer` struct.
- Regex are now compiled when the `RegexQuery` instance is built. As a result, it can now return
an error and handling the `Result` is required.
- `tantivy::version()` now returns a `Version` object. This object implements `ToString()`

Tantivy 0.10.2
=====================

- Closes #656. Solving memory leak.

Tantivy 0.10.1
=====================

- Closes #544.  A few users experienced problems with the directory watching system.
Avoid watching the mmap directory until someone effectively creates a reader that uses
this functionality.

Tantivy 0.10.0
=====================

*Tantivy 0.10.0 index format is compatible with the index format in 0.9.0.*

- Added an API to easily tweak or entirely replace the
 default score. See `TopDocs::tweak_score` and `TopScore::custom_score` (@fulmicoton)
- Added an ASCII folding filter (@drusellers)
- Bugfix in `query.count` in presence of deletes (@fulmicoton)
- Added `.explain(...)` in `Query` and `Weight` (@fulmicoton)
- Added an efficient way to `delete_all_documents` in `IndexWriter` (@petr-tik).
  All segments are simply removed.

Minor
---------

- Switched to Rust 2018 (@uvd)
- Small simplification of the code.
Calling .freq() or .doc() when .advance() has never been called
on segment postings should panic from now on.
- Tokens exceeding `u16::max_value() - 4` chars are discarded silently instead of panicking.
- Fast fields are now preloaded when the `SegmentReader` is created.
- `IndexMeta` is now public.  (@hntd187)
- `IndexWriter` `add_document`, `delete_term`. `IndexWriter` is `Sync`, making it possible to use it with a `Arc<RwLock<IndexWriter>>`. `add_document` and `delete_term` can
only require a read lock. (@fulmicoton)
- Introducing `Opstamp` as an expressive type alias for `u64`. (@petr-tik)
- Stamper now relies on `AtomicU64` on all platforms (@petr-tik)
- Bugfix - Files get deleted slightly earlier
- Compilation resources improved (@fdb-hiroshima)

## How to update?

Your program should be usable as is.

### Fast fields

Fast fields used to be accessed directly from the `SegmentReader`.
The API changed, you are now required to acquire your fast field reader via the
`segment_reader.fast_fields()`, and use one of the typed method:

- `.u64()`, `.i64()` if your field is single-valued ;
- `.u64s()`, `.i64s()` if your field is multi-valued ;
- `.bytes()` if your field is bytes fast field.

Tantivy 0.9.0
=====================

*0.9.0 index format is not compatible with the
previous index format.*

- MAJOR BUGFIX :
  Some `Mmap` objects were being leaked, and would never get released. (@fulmicoton)
- Removed most unsafe (@fulmicoton)
- Indexer memory footprint improved. (VInt comp, inlining the first block) (@fulmicoton)
- Stemming in other language possible (@pentlander)
- Segments with no docs are deleted earlier (@barrotsteindev)
- Added grouped add and delete operations.
  They are guaranteed to happen together (i.e. they cannot be split by a commit).
  In addition, adds are guaranteed to happen on the same segment. (@elbow-jason)
- Removed `INT_STORED` and `INT_INDEXED`. It is now possible to use `STORED` and `INDEXED`
  for int fields. (@fulmicoton)
- Added DateTime field (@barrotsteindev)
- Added IndexReader. By default, index is reloaded automatically upon new commits (@fulmicoton)
- SIMD linear search within blocks (@fulmicoton)

## How to update ?

tantivy 0.9 brought some API breaking change.
To update from tantivy 0.8, you will need to go through the following steps.

- `schema::INT_INDEXED` and `schema::INT_STORED` should be replaced by `schema::INDEXED` and `schema::STORED`.
- The index now does not hold the pool of searcher anymore. You are required to create an intermediary object called
`IndexReader` for this.

    ```rust
    // create the reader. You typically need to create 1 reader for the entire
    // lifetime of your program.
    let reader = index.reader()?;

    // Acquiring a searcher (previously `index.searcher()`) is now written:
    let searcher = reader.searcher();

    // With the default setting of the reader, you are not required to
    // call `index.load_searchers()` anymore.
    //
    // The IndexReader will pick up that change automatically, regardless
    // of whether the update was done in a different process or not.
    // If this behavior is not wanted, you can create your reader with
    // the `ReloadPolicy::Manual`, and manually decide when to reload the index
    // by calling `reader.reload()?`.

    ```

Tantivy 0.8.2
=====================

Fixing build for x86_64 platforms. (#496)
No need to update from 0.8.1 if tantivy
is building on your platform.

Tantivy 0.8.1
=====================

Hotfix of #476.

Merge was reflecting deletes before commit was passed.
Thanks @barrotsteindev  for reporting the bug.

Tantivy 0.8.0
=====================

*No change in the index format*

- API Breaking change in the collector API. (@jwolfe, @fulmicoton)
- Multithreaded search (@jwolfe, @fulmicoton)

Tantivy 0.7.1
=====================

*No change in the index format*

- Bugfix: NGramTokenizer panics on non ascii chars
- Added a space usage API

Tantivy 0.7
=====================

- Skip data for doc ids and positions (@fulmicoton),
  greatly improving performance
- Tantivy error now relies on the failure crate (@drusellers)
- Added support for `AND`, `OR`, `NOT` syntax in addition to the `+`,`-` syntax
- Added a snippet generator with highlight (@vigneshsarma, @fulmicoton)
- Added a `TopFieldCollector` (@pentlander)

Tantivy 0.6.1
=========================

- Bugfix #324. GC was removing files that were still in use
- Added support for parsing AllQuery and RangeQuery via QueryParser
  - AllQuery: `*`
  - RangeQuery:
    - Inclusive `field:[startIncl to endIncl]`
    - Exclusive `field:{startExcl to endExcl}`
    - Mixed `field:[startIncl to endExcl}` and vice versa
    - Unbounded `field:[start to *]`, `field:[* to end]`

Tantivy 0.6
==========================

Special thanks to @drusellers and @jason-wolfe for their contributions
to this release!

- Removed C code. Tantivy is now pure Rust. (@fulmicoton)
- BM25 (@fulmicoton)
- Approximate field norms encoded over 1 byte. (@fulmicoton)
- Compiles on stable rust (@fulmicoton)
- Add &[u8] fastfield for associating arbitrary bytes to each document (@jason-wolfe) (#270)
  - Completely uncompressed
  - Internally: One u64 fast field for indexes, one fast field for the bytes themselves.
- Add NGram token support (@drusellers)
- Add Stopword Filter support (@drusellers)
- Add a FuzzyTermQuery (@drusellers)
- Add a RegexQuery (@drusellers)
- Various performance improvements (@fulmicoton)

Tantivy 0.5.2
===========================

- bugfix #274
- bugfix #280
- bugfix #289

Tantivy 0.5.1
==========================

- bugfix #254 : tantivy failed if no documents in a segment contained a specific field.

Tantivy 0.5
==========================

- Faceting
- RangeQuery
- Configurable tokenization pipeline
- Bugfix in PhraseQuery
- Various query optimisation
- Allowing very large indexes
  - 64 bits file address
  - Smarter encoding of the `TermInfo` objects

Tantivy 0.4.3
==========================

- Bugfix race condition when deleting files. (#198)

Tantivy 0.4.2
==========================

- Prevent usage of AVX2 instructions (#201)

Tantivy 0.4.1
==========================

- Bugfix for non-indexed fields. (#199)

Tantivy 0.4.0
==========================

- Raise the limit of number of fields (previously 256 fields) (@fulmicoton)
- Removed u32 fields. They are replaced by u64 and i64 fields (#65) (@fulmicoton)
- Optimized skip in SegmentPostings (#130) (@lnicola)
- Replacing rustc_serialize by serde. Kudos to @KodrAus and @lnicola
- Using error-chain (@KodrAus)
- QueryParser: (@fulmicoton)
  - Explicit error returned when searched for a term that is not indexed
  - Searching for a int term via the query parser was broken `(age:1)`
  - Searching for a non-indexed field returns an explicit Error
  - Phrase queries for non-tokenized fields are not tokenized by the query parser.
- Faster/Better indexing (@fulmicoton)
  - using murmurhash2
  - faster merging
  - more memory efficient fast field writer (@lnicola )
  - better handling of collisions
  - lesser memory usage
- Added API, most notably to iterate over ranges of terms (@fulmicoton)
- Bugfix that was preventing to unmap segment files, on index drop (@fulmicoton)
- Made the doc! macro public (@fulmicoton)
- Added an alternative implementation of the streaming dictionary (@fulmicoton)

Tantivy 0.3.1
==========================

- Expose a method to trigger files garbage collection

Tantivy 0.3
==========================

Special thanks to @Kodraus @lnicola @Ameobea @manuel-woelker @celaus
for their contribution to this release.

Thanks also to everyone in tantivy gitter chat
for their advice and company :)

<https://gitter.im/tantivy-search/tantivy>

Warning:

Tantivy 0.3 is NOT backward compatible with tantivy 0.2
code and index format.
You should not expect backward compatibility before
tantivy 1.0.

New Features
------------

- Delete. You can now delete documents from an index.
- Support for windows (Thanks to @lnicola)

Various Bugfixes & small improvements
----------------------------------------

- Added CI for Windows (<https://ci.appveyor.com/project/fulmicoton/tantivy>)
Thanks to @KodrAus ! (#108)
- Various dependency version updates (Thanks to @Ameobea) #76
- Fixed several race conditions in `Index.wait_merge_threads`
- Fixed #72. Mmap were never released.
- Fixed #80. Fast field used to take an amplitude of 32 bits after a merge. (Ouch!)
- Fixed #92. u32 are now encoded using big endian in the fst
  in order to make their enumeration consistent with
  the natural ordering.
- Building binary targets for tantivy-cli (Thanks to @KodrAus)
- Misc invisible bug fixes, and code cleanup.
- Use


================================================
FILE: CITATION.cff
================================================
cff-version: 1.2.0
message: "If you use this software, please cite it as below."
authors:
  - alias: Quickwit Inc.
    website: "https://quickwit.io"
title: "tantivy"
version: 0.22.0
doi: 10.5281/zenodo.13942948
date-released: 2024-10-17
url: "https://github.com/quickwit-oss/tantivy"


================================================
FILE: Cargo.toml
================================================
[package]
name = "tantivy"
version = "0.26.0"
authors = ["Paul Masurel <paul.masurel@gmail.com>"]
license = "MIT"
categories = ["database-implementations", "data-structures"]
description = """Search engine library"""
documentation = "https://docs.rs/tantivy/"
homepage = "https://github.com/quickwit-oss/tantivy"
repository = "https://github.com/quickwit-oss/tantivy"
readme = "README.md"
keywords = ["search", "information", "retrieval"]
edition = "2021"
rust-version = "1.86"
exclude = ["benches/*.json", "benches/*.txt"]

[dependencies]
oneshot = "0.1.13"
base64 = "0.22.0"
byteorder = "1.4.3"
crc32fast = "1.3.2"
once_cell = "1.10.0"
regex = { version = "1.5.5", default-features = false, features = [
    "std",
    "unicode",
] }
aho-corasick = "1.0"
tantivy-fst = "0.5"
memmap2 = { version = "0.9.0", optional = true }
lz4_flex = { version = "0.12", default-features = false, optional = true }
zstd = { version = "0.13", optional = true, default-features = false }
tempfile = { version = "3.12.0", optional = true }
log = "0.4.16"
serde = { version = "1.0.219", features = ["derive"] }
serde_json = "1.0.140"
fs4 = { version = "0.13.1", optional = true }
levenshtein_automata = "0.2.1"
uuid = { version = "1.0.0", features = ["v4", "serde"] }
crossbeam-channel = "0.5.4"
rust-stemmers = { version = "1.2.0", optional = true }
downcast-rs = "2.0.1"
bitpacking = { version = "0.9.3", default-features = false, features = [
    "bitpacker4x",
] }
census = "0.4.2"
rustc-hash = "2.0.0"
thiserror = "2.0.1"
htmlescape = "0.3.1"
fail = { version = "0.5.0", optional = true }
time = { version = "0.3.47", features = ["serde-well-known"] }
smallvec = "1.8.0"
rayon = "1.5.2"
lru = "0.16.3"
fastdivide = "0.4.0"
itertools = "0.14.0"
measure_time = "0.9.0"
arc-swap = "1.5.0"
bon = "3.3.1"

columnar = { version = "0.6", path = "./columnar", package = "tantivy-columnar" }
sstable = { version = "0.6", path = "./sstable", package = "tantivy-sstable", optional = true }
stacker = { version = "0.6", path = "./stacker", package = "tantivy-stacker" }
query-grammar = { version = "0.25.0", path = "./query-grammar", package = "tantivy-query-grammar" }
tantivy-bitpacker = { version = "0.9", path = "./bitpacker" }
common = { version = "0.10", path = "./common/", package = "tantivy-common" }
tokenizer-api = { version = "0.6", path = "./tokenizer-api", package = "tantivy-tokenizer-api" }
sketches-ddsketch = { git = "https://github.com/quickwit-oss/rust-sketches-ddsketch.git", rev = "555caf1", features = ["use_serde"] }
datasketches = "0.2.0"
futures-util = { version = "0.3.28", optional = true }
futures-channel = { version = "0.3.28", optional = true }
fnv = "1.0.7"
typetag = "0.2.21"

[target.'cfg(windows)'.dependencies]
winapi = "0.3.9"

[dev-dependencies]
binggan = "0.14.2"
rand = "0.9"
maplit = "1.0.2"
matches = "0.1.9"
pretty_assertions = "1.2.1"
proptest = "1.7.0"
test-log = "0.2.10"
futures = "0.3.21"
paste = "1.0.11"
more-asserts = "0.3.1"
rand_distr = "0.5"
time = { version = "0.3.47", features = ["serde-well-known", "macros"] }
postcard = { version = "1.0.4", features = [
    "use-std",
], default-features = false }

[target.'cfg(not(windows))'.dev-dependencies]
criterion = { version = "0.5", default-features = false }

[dev-dependencies.fail]
version = "0.5.0"
features = ["failpoints"]

[profile.release]
opt-level = 3
debug = false
debug-assertions = false

[profile.bench]
opt-level = 3
debug = true
debug-assertions = false

[profile.test]
debug-assertions = true
overflow-checks = true

[features]
default = ["mmap", "stopwords", "lz4-compression", "columnar-zstd-compression", "stemmer"]
stemmer = ["rust-stemmers"]
mmap = ["fs4", "tempfile", "memmap2"]
stopwords = []

lz4-compression = ["lz4_flex"]
zstd-compression = ["zstd"]

# enable zstd-compression in columnar (and sstable)
columnar-zstd-compression = ["columnar/zstd-compression"]

failpoints = ["fail", "fail/failpoints"]
unstable = []                            # useful for benches.

quickwit = ["sstable", "futures-util", "futures-channel"]

# Compares only the hash of a string when indexing data.
# Increases indexing speed, but may lead to extremely rare missing terms, when there's a hash collision.
# Uses 64bit ahash.
compare_hash_only = ["stacker/compare_hash_only"]

[workspace]
members = [
    "query-grammar",
    "bitpacker",
    "common",
    "ownedbytes",
    "stacker",
    "sstable",
    "tokenizer-api",
    "columnar",
]

# Following the "fail" crate best practices, we isolate
# tests that define specific behavior in fail check points
# in a different binary.
#
# We do that because `fail` relies on a global definition of
# failpoints behavior and hence, it is incompatible with
# multithreading.
[[test]]
name = "failpoints"
path = "tests/failpoints/mod.rs"
required-features = ["failpoints"]

[[bench]]
name = "analyzer"
harness = false

[[bench]]
name = "index-bench"
harness = false

[[bench]]
name = "agg_bench"
harness = false

[[bench]]
name = "exists_json"
harness = false

[[bench]]
name = "range_query"
harness = false

[[bench]]
name = "and_or_queries"
harness = false

[[bench]]
name = "range_queries"
harness = false

[[bench]]
name = "bool_queries_with_range"
harness = false

[[bench]]
name = "str_search_and_get"
harness = false

[[bench]]
name = "merge_segments"
harness = false

[[bench]]
name = "regex_all_terms"
harness = false


================================================
FILE: LICENSE
================================================
Copyright (c) 2018 by the project authors, as listed in the AUTHORS file. 

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.


================================================
FILE: Makefile
================================================
test:
	@echo "Run test only... No examples."
	cargo test --tests --lib

fmt:
	cargo +nightly fmt --all


================================================
FILE: README.md
================================================
[![Docs](https://docs.rs/tantivy/badge.svg)](https://docs.rs/crate/tantivy/)
[![Build Status](https://github.com/quickwit-oss/tantivy/actions/workflows/test.yml/badge.svg)](https://github.com/quickwit-oss/tantivy/actions/workflows/test.yml)
[![codecov](https://codecov.io/gh/quickwit-oss/tantivy/branch/main/graph/badge.svg)](https://codecov.io/gh/quickwit-oss/tantivy)
[![Join the chat at https://discord.gg/MT27AG5EVE](https://shields.io/discord/908281611840282624?label=chat%20on%20discord)](https://discord.gg/MT27AG5EVE)
[![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
[![Crates.io](https://img.shields.io/crates/v/tantivy.svg)](https://crates.io/crates/tantivy)

<img src="https://tantivy-search.github.io/logo/tantivy-logo.png" alt="Tantivy, the fastest full-text search engine library written in Rust" height="250">

## Fast full-text search engine library written in Rust

**If you are looking for an alternative to Elasticsearch or Apache Solr, check out [Quickwit](https://github.com/quickwit-oss/quickwit), our distributed search engine built on top of Tantivy.**

Tantivy is closer to [Apache Lucene](https://lucene.apache.org/) than to [Elasticsearch](https://www.elastic.co/products/elasticsearch) or [Apache Solr](https://lucene.apache.org/solr/) in the sense it is not
an off-the-shelf search engine server, but rather a crate that can be used to build such a search engine.

Tantivy is, in fact, strongly inspired by Lucene's design.

## Benchmark

The following [benchmark](https://tantivy-search.github.io/bench/) breaks down the
performance for different types of queries/collections.

Your mileage WILL vary depending on the nature of queries and their load.

Details about the benchmark can be found at this [repository](https://github.com/quickwit-oss/search-benchmark-game).

## Features

- Full-text search
- Configurable tokenizer (stemming available for 17 Latin languages) with third party support for Chinese ([tantivy-jieba](https://crates.io/crates/tantivy-jieba) and [cang-jie](https://crates.io/crates/cang-jie)), Japanese ([lindera](https://github.com/lindera-morphology/lindera-tantivy), [Vaporetto](https://crates.io/crates/vaporetto_tantivy), and [tantivy-tokenizer-tiny-segmenter](https://crates.io/crates/tantivy-tokenizer-tiny-segmenter)) and Korean ([lindera](https://github.com/lindera-morphology/lindera-tantivy) + [lindera-ko-dic-builder](https://github.com/lindera-morphology/lindera-ko-dic-builder))
- Fast (check out the :racehorse: :sparkles: [benchmark](https://tantivy-search.github.io/bench/) :sparkles: :racehorse:)
- Tiny startup time (<10ms), perfect for command-line tools
- BM25 scoring (the same as Lucene)
- Natural query language (e.g. `(michael AND jackson) OR "king of pop"`)
- Phrase queries search (e.g. `"michael jackson"`)
- Incremental indexing
- Multithreaded indexing (indexing English Wikipedia takes < 3 minutes on my desktop)
- Mmap directory
- SIMD integer compression when the platform/CPU includes the SSE2 instruction set
- Single valued and multivalued u64, i64, and f64 fast fields (equivalent of doc values in Lucene)
- `&[u8]` fast fields
- Text, i64, u64, f64, dates, ip, bool, and hierarchical facet fields
- Compressed document store (LZ4, Zstd, None)
- Range queries
- Faceted search
- Configurable indexing (optional term frequency and position indexing)
- JSON Field
- Aggregation Collector: histogram, range buckets, average, and stats metrics
- LogMergePolicy with deletes
- Searcher Warmer API
- Cheesy logo with a horse

### Non-features

Distributed search is out of the scope of Tantivy, but if you are looking for this feature, check out [Quickwit](https://github.com/quickwit-oss/quickwit/).

## Getting started

Tantivy works on stable Rust and supports Linux, macOS, and Windows.

- [Tantivy's simple search example](https://tantivy-search.github.io/examples/basic_search.html)
- [tantivy-cli and its tutorial](https://github.com/quickwit-oss/tantivy-cli) - `tantivy-cli` is an actual command-line interface that makes it easy for you to create a search engine,
index documents, and search via the CLI or a small server with a REST API.
It walks you through getting a Wikipedia search engine up and running in a few minutes.
- [Reference doc for the last released version](https://docs.rs/tantivy/)

## How can I support this project?

There are many ways to support this project.

- Use Tantivy and tell us about your experience on [Discord](https://discord.gg/MT27AG5EVE) or by email (paul.masurel@gmail.com)
- Report bugs
- Write a blog post
- Help with documentation by asking questions or submitting PRs
- Contribute code (you can join [our Discord server](https://discord.gg/MT27AG5EVE))
- Talk about Tantivy around you

## Contributing code

We use the GitHub Pull Request workflow: reference a GitHub ticket and/or include a comprehensive commit message when opening a PR.
Feel free to update CHANGELOG.md with your contribution.

### Tokenizer

When implementing a tokenizer for tantivy, depend on the `tantivy-tokenizer-api` crate.

### Clone and build locally

Tantivy compiles on stable Rust.
To check out and run tests, you can simply run:

```bash
git clone https://github.com/quickwit-oss/tantivy.git
cd tantivy
cargo test
```

## Companies Using Tantivy

<p align="left">
<img align="center" src="doc/assets/images/etsy.png" alt="Etsy" height="25" width="auto" /> &nbsp;
<img align="center" src="doc/assets/images/paradedb.png" alt="ParadeDB" height="25" width="auto" /> &nbsp;
<img align="center" src="doc/assets/images/Nuclia.png#gh-light-mode-only" alt="Nuclia" height="25" width="auto" /> &nbsp;
<img align="center" src="doc/assets/images/humanfirst.png#gh-light-mode-only" alt="Humanfirst.ai" height="30" width="auto" />
<img align="center" src="doc/assets/images/element.io.svg#gh-light-mode-only" alt="Element.io" height="25" width="auto" />
<img align="center" src="doc/assets/images/nuclia-dark-theme.png#gh-dark-mode-only" alt="Nuclia" height="35" width="auto" /> &nbsp;
<img align="center" src="doc/assets/images/humanfirst.ai-dark-theme.png#gh-dark-mode-only" alt="Humanfirst.ai" height="25" width="auto" />&nbsp; &nbsp;
<img align="center" src="doc/assets/images/element-dark-theme.png#gh-dark-mode-only" alt="Element.io" height="25" width="auto" />
</p>

## FAQ

### Can I use Tantivy in other languages?

- Python → [tantivy-py](https://github.com/quickwit-oss/tantivy-py)
- Ruby → [tantiny](https://github.com/baygeldin/tantiny)

You can also find other bindings on [GitHub](https://github.com/search?q=tantivy) but they may be less maintained.

### What are some examples of Tantivy use?

- [seshat](https://github.com/matrix-org/seshat/): A matrix message database/indexer
- [tantiny](https://github.com/baygeldin/tantiny): Tiny full-text search for Ruby
- [lnx](https://github.com/lnx-search/lnx): adaptable, typo tolerant search engine with a REST API
- [Bichon](https://github.com/rustmailer/bichon): A lightweight, high-performance Rust email archiver with WebUI
- and [more](https://github.com/search?q=tantivy)!

### On average, how much faster is Tantivy compared to Lucene?

- According to our [search latency benchmark](https://tantivy-search.github.io/bench/), Tantivy is approximately 2x faster than Lucene.

### Does tantivy support incremental indexing?

- Yes.

### How can I edit documents?

- Data in tantivy is immutable. To edit a document, the document needs to be deleted and reindexed.

### When will my documents be searchable during indexing?

- Documents will be searchable after a `commit` is called on an `IndexWriter`. Existing `IndexReader`s will also need to be reloaded in order to reflect the changes. Finally, changes are only visible to newly acquired `Searcher`s.


================================================
FILE: RELEASE.md
================================================
# Releasing a new Tantivy Version

## Steps

1. Identify new packages in workspace since last release
2. Identify changed packages in workspace since last release
3. Bump version in `Cargo.toml` and their dependents for all changed packages
4. Update version of root `Cargo.toml`
5. Publish version starting with leaf nodes
6. Set git tag with new version


[`cargo-release`](https://github.com/crate-ci/cargo-release) will help us with steps 1-5:

Replace prev-tag-name
```bash
cargo release --workspace --no-publish -v --prev-tag-name 0.24 --push-remote origin minor --no-tag
```

Pass `--no-tag`, or it will create tags for all the subpackages.

cargo release will _not_ ignore unchanged packages, but it will print warnings for them.
e.g. "warning: updating ownedbytes to 0.10.0 despite no changes made since tag 0.24"

We need to manually ignore these unchanged packages
```bash
cargo release --workspace --no-publish -v --prev-tag-name 0.24 --push-remote origin minor --no-tag --exclude tokenizer-api
```

Add `--execute` to actually publish the packages, otherwise it will only print the commands that would be run.

### Tag Version
```bash
git tag 0.25.0
git push upstream tag 0.25.0
```


================================================
FILE: TODO.txt
================================================
Make schema_builder API fluent.
fix doc serialization and prevent compression problems

u64, etc. should return Result<Option> now that we support optional: missing a column is really not an error
remove fastfield codecs
ditch the first_or_default trick. if it is still useful, improve its implementation.
rename FastFieldReaders::open to load


remove fast field reader

find a way to unify the two DateTime.
re-add type check in the filter wrapper

add unit test on columnar list columns.

make sure sort works


================================================
FILE: benches/agg_bench.rs
================================================
use binggan::plugins::PeakMemAllocPlugin;
use binggan::{black_box, InputGroup, PeakMemAlloc, INSTRUMENTED_SYSTEM};
use rand::distr::weighted::WeightedIndex;
use rand::rngs::StdRng;
use rand::seq::IndexedRandom;
use rand::{Rng, SeedableRng};
use rand_distr::Distribution;
use serde_json::json;
use tantivy::aggregation::agg_req::Aggregations;
use tantivy::aggregation::AggregationCollector;
use tantivy::query::{AllQuery, TermQuery};
use tantivy::schema::{IndexRecordOption, Schema, TextFieldIndexing, FAST, STRING};
use tantivy::{doc, DateTime, Index, Term};

/// Process-wide allocator for this benchmark binary: binggan's instrumented
/// wrapper around the system allocator. The same handle is passed to
/// `PeakMemAllocPlugin` in `bench_agg`.
#[global_allocator]
pub static GLOBAL: &PeakMemAlloc<std::alloc::System> = &INSTRUMENTED_SYSTEM;

/// Registers a benchmark function on a runner, using the function's own
/// identifier as the benchmark name.
///
/// `register!(group, average_u64)` expands to
/// `group.register("average_u64", move |index| { average_u64(index); })`.
macro_rules! register {
    ($group:expr, $bench_fn:ident) => {
        $group.register(stringify!($bench_fn), move |index| {
            $bench_fn(index);
        })
    };
}

/// Builds one test index per `Cardinality` variant and runs the aggregation
/// benchmarks against each of them.
fn main() {
    // Benchmark input name paired with the cardinality its index is built with.
    let named_cardinalities = [
        ("full", Cardinality::Full),
        ("dense", Cardinality::OptionalDense),
        ("sparse", Cardinality::OptionalSparse),
        ("multivalue", Cardinality::Multivalued),
    ];
    let inputs: Vec<_> = named_cardinalities
        .into_iter()
        .map(|(name, cardinality)| (name, get_test_index_bench(cardinality).unwrap()))
        .collect();

    bench_agg(InputGroup::new_with_inputs(inputs));
}

fn bench_agg(mut group: InputGroup<Index>) {
    group.add_plugin(PeakMemAllocPlugin::new(GLOBAL));

    register!(group, average_u64);
    register!(group, average_f64);
    register!(group, average_f64_u64);
    register!(group, stats_f64);
    register!(group, extendedstats_f64);
    register!(group, percentiles_f64);
    register!(group, terms_7);
    register!(group, terms_all_unique);
    register!(group, terms_150_000);
    register!(group, terms_many_top_1000);
    register!(group, terms_many_order_by_term);
    register!(group, terms_many_with_top_hits);
    register!(group, terms_all_unique_with_avg_sub_agg);
    register!(group, terms_many_with_avg_sub_agg);
    register!(group, terms_status_with_avg_sub_agg);
    register!(group, terms_status_with_histogram);
    register!(group, terms_zipf_1000);
    register!(group, terms_zipf_1000_with_histogram);
    register!(group, terms_zipf_1000_with_avg_sub_agg);

    register!(group, terms_many_json_mixed_type_with_avg_sub_agg);

    register!(group, composite_term_many_page_1000);
    register!(group, composite_term_many_page_1000_with_avg_sub_agg);
    register!(group, composite_term_few);
    register!(group, composite_histogram);
    register!(group, composite_histogram_calendar);

    register!(group, cardinality_agg);
    register!(group, terms_status_with_cardinality_agg);

    register!(group, range_agg);
    register!(group, range_agg_with_avg_sub_agg);
    register!(group, range_agg_with_term_agg_status);
    register!(group, range_agg_with_term_agg_many);
    register!(group, histogram);
    register!(group, histogram_hard_bounds);
    register!(group, histogram_with_avg_sub_agg);
    register!(group, histogram_with_term_agg_status);
    register!(group, avg_and_range_with_avg_sub_agg);

    // Filter aggregation benchmarks
    register!(group, filter_agg_all_query_count_agg);
    register!(group, filter_agg_term_query_count_agg);
    register!(group, filter_agg_all_query_with_sub_aggs);
    register!(group, filter_agg_term_query_with_sub_aggs);

    group.run();
}

/// Runs the aggregation request `agg_req` over the documents matching the
/// term `cool` in the `text` field, and passes the result through `black_box`.
///
/// # Panics
///
/// Panics if `agg_req` cannot be deserialized into [`Aggregations`], if the
/// index reader cannot be created, if the schema has no `text` field, or if
/// the search itself fails.
fn exec_term_with_agg(index: &Index, agg_req: serde_json::Value) {
    let agg_req: Aggregations = serde_json::from_value(agg_req).unwrap();

    let reader = index.reader().unwrap();
    // Acquire a single searcher and use it for both the schema lookup and the
    // search, instead of acquiring a second one only to read the schema.
    let searcher = reader.searcher();
    let text_field = searcher.schema().get_field("text").unwrap();
    let term_query = TermQuery::new(
        Term::from_field_text(text_field, "cool"),
        IndexRecordOption::Basic,
    );
    let collector = get_collector(agg_req);
    black_box(searcher.search(&term_query, &collector).unwrap());
}

/// Benchmarks an `avg` aggregation on the `score` field, executed through
/// `exec_term_with_agg`.
fn average_u64(index: &Index) {
    exec_term_with_agg(
        index,
        json!({
            "average": {
                "avg": { "field": "score" }
            }
        }),
    );
}
/// Benchmarks an `avg` aggregation on the `score_f64` field, executed through
/// `exec_term_with_agg`.
fn average_f64(index: &Index) {
    exec_term_with_agg(
        index,
        json!({
            "average": {
                "avg": { "field": "score_f64" }
            }
        }),
    );
}
/// Benchmarks two `avg` aggregations in one request (on `score_f64` and on
/// `score`), executed through `exec_term_with_agg`.
fn average_f64_u64(index: &Index) {
    exec_term_with_agg(
        index,
        json!({
            "average_f64": {
                "avg": { "field": "score_f64" }
            },
            "average": {
                "avg": { "field": "score" }
            }
        }),
    );
}
/// Benchmarks a `stats` aggregation on the `score_f64` field, executed through
/// `exec_term_with_agg`.
fn stats_f64(index: &Index) {
    exec_term_with_agg(
        index,
        json!({
            "average_f64": {
                "stats": { "field": "score_f64" }
            }
        }),
    );
}
/// Benchmarks an `extended_stats` aggregation on the `score_f64` field,
/// executed through `exec_term_with_agg`.
fn extendedstats_f64(index: &Index) {
    exec_term_with_agg(
        index,
        json!({
            "extendedstats_f64": {
                "extended_stats": { "field": "score_f64" }
            }
        }),
    );
}
/// Benchmarks a `percentiles` aggregation (95, 99 and 99.9) on the
/// `score_f64` field, executed through `execute_agg`.
fn percentiles_f64(index: &Index) {
    execute_agg(
        index,
        json!({
            "mypercentiles": {
                "percentiles": { "field": "score_f64", "percents": [95, 99, 99.9] }
            }
        }),
    );
}

/// Benchmarks a `cardinality` aggregation on the `text_many_terms` field,
/// executed through `execute_agg`.
fn cardinality_agg(index: &Index) {
    execute_agg(
        index,
        json!({
            "cardinality": {
                "cardinality": { "field": "text_many_terms" }
            }
        }),
    );
}
/// Benchmarks a `terms` aggregation on `text_few_terms_status` with a
/// `cardinality` sub-aggregation on `text_many_terms`.
fn terms_status_with_cardinality_agg(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_texts": {
                "terms": { "field": "text_few_terms_status" },
                "aggs": {
                    "cardinality": {
                        "cardinality": { "field": "text_many_terms" }
                    }
                }
            }
        }),
    );
}

/// Benchmarks a `terms` aggregation on the `text_few_terms_status` field.
fn terms_7(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_texts": {
                "terms": { "field": "text_few_terms_status" }
            }
        }),
    );
}
/// Benchmarks a `terms` aggregation on the `text_all_unique_terms` field.
fn terms_all_unique(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_texts": {
                "terms": { "field": "text_all_unique_terms" }
            }
        }),
    );
}

/// Benchmarks a `terms` aggregation on the `text_many_terms` field.
fn terms_150_000(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_texts": {
                "terms": { "field": "text_many_terms" }
            }
        }),
    );
}
/// Benchmarks a `terms` aggregation on `text_many_terms` with `size` set to
/// 1000.
fn terms_many_top_1000(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_texts": {
                "terms": { "field": "text_many_terms", "size": 1000 }
            }
        }),
    );
}
/// Benchmarks a `terms` aggregation on `text_many_terms` ordered by `_key`
/// descending.
fn terms_many_order_by_term(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_texts": {
                "terms": {
                    "field": "text_many_terms",
                    "order": { "_key": "desc" }
                }
            }
        }),
    );
}
/// Benchmarks a `terms` aggregation on `text_many_terms` with a `top_hits`
/// sub-aggregation (2 hits, sorted by `score` descending, returning
/// `score_f64`).
fn terms_many_with_top_hits(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_texts": {
                "terms": { "field": "text_many_terms" },
                "aggs": {
                    "top_hits": {
                        "top_hits": {
                            "sort": [{ "score": "desc" }],
                            "size": 2,
                            "doc_value_fields": ["score_f64"]
                        }
                    }
                }
            }
        }),
    );
}
/// Benchmarks a `terms` aggregation on `text_many_terms` with an `avg`
/// sub-aggregation on `score_f64`.
fn terms_many_with_avg_sub_agg(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_texts": {
                "terms": { "field": "text_many_terms" },
                "aggs": {
                    "average_f64": {
                        "avg": { "field": "score_f64" }
                    }
                }
            }
        }),
    );
}
/// Benchmarks a `terms` aggregation on `text_all_unique_terms` with an `avg`
/// sub-aggregation on `score_f64`.
fn terms_all_unique_with_avg_sub_agg(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_texts": {
                "terms": { "field": "text_all_unique_terms" },
                "aggs": {
                    "average_f64": {
                        "avg": { "field": "score_f64" }
                    }
                }
            }
        }),
    );
}
/// Benchmarks a `terms` aggregation on `text_few_terms_status` with a
/// `histogram` sub-aggregation on `score_f64` (interval 10).
fn terms_status_with_histogram(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_texts": {
                "terms": { "field": "text_few_terms_status" },
                "aggs": {
                    "histo": {
                        "histogram": { "field": "score_f64", "interval": 10 }
                    }
                }
            }
        }),
    );
}

/// Benchmarks a `terms` aggregation on `text_1000_terms_zipf` with a
/// `histogram` sub-aggregation on `score_f64` (interval 10).
fn terms_zipf_1000_with_histogram(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_texts": {
                "terms": { "field": "text_1000_terms_zipf" },
                "aggs": {
                    "histo": {
                        "histogram": { "field": "score_f64", "interval": 10 }
                    }
                }
            }
        }),
    );
}

/// Benchmarks a `terms` aggregation on `text_few_terms_status` with an `avg`
/// sub-aggregation on `score_f64`.
fn terms_status_with_avg_sub_agg(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_texts": {
                "terms": { "field": "text_few_terms_status" },
                "aggs": {
                    "average_f64": {
                        "avg": { "field": "score_f64" }
                    }
                }
            }
        }),
    );
}

/// Benchmarks a `terms` aggregation on `text_1000_terms_zipf` with an `avg`
/// sub-aggregation on `score_f64`.
fn terms_zipf_1000_with_avg_sub_agg(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_texts": {
                "terms": { "field": "text_1000_terms_zipf" },
                "aggs": {
                    "average_f64": {
                        "avg": { "field": "score_f64" }
                    }
                }
            }
        }),
    );
}

/// Benchmarks a `terms` aggregation on the `text_1000_terms_zipf` field.
fn terms_zipf_1000(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_texts": {
                "terms": { "field": "text_1000_terms_zipf" }
            }
        }),
    );
}

/// Benchmarks a `terms` aggregation on the `json.mixed_type` field with an
/// `avg` sub-aggregation on `score_f64`.
fn terms_many_json_mixed_type_with_avg_sub_agg(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_texts": {
                "terms": { "field": "json.mixed_type" },
                "aggs": {
                    "average_f64": {
                        "avg": { "field": "score_f64" }
                    }
                }
            }
        }),
    );
}

/// Benchmarks a `composite` aggregation with a single `terms` source on
/// `text_few_terms` and a page size of 1000.
fn composite_term_few(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_ctf": {
                "composite": {
                    "sources": [
                        {
                            "text_few_terms": {
                                "terms": { "field": "text_few_terms" }
                            }
                        }
                    ],
                    "size": 1000
                }
            }
        }),
    );
}
/// Benchmarks a `composite` aggregation with a single `terms` source on
/// `text_many_terms` and a page size of 1000.
fn composite_term_many_page_1000(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_ctmp1000": {
                "composite": {
                    "sources": [
                        {
                            "text_many_terms": {
                                "terms": { "field": "text_many_terms" }
                            }
                        }
                    ],
                    "size": 1000
                }
            }
        }),
    );
}
/// Benchmarks a `composite` aggregation with a single `terms` source on
/// `text_many_terms` (page size 1000) and an `avg` sub-aggregation on
/// `score_f64`.
fn composite_term_many_page_1000_with_avg_sub_agg(index: &Index) {
    execute_agg(
        index,
        json!({
            "my_ctmp1000wasa": {
                "composite": {
                    "sources": [
                        {
                            "text_many_terms": {
                                "terms": { "field": "text_many_terms" }
                            }
                        }
                    ],
                    "size": 1000
                },
                "aggs": {
                    "average_f64": {
                        "avg": { "field": "score_f64" }
                    }
                }
            }
        }),
    );
}
/// Runs a `composite` aggregation with a single `histogram` source on `score_f64`
/// (interval 1) and a page size of 1000.
fn composite_histogram(index: &Index) {
    let sources = json!([
        { "f64_histogram": { "histogram": { "field": "score_f64", "interval": 1 } } }
    ]);
    execute_agg(
        index,
        json!({
            "my_ch": {
                "composite": { "sources": sources, "size": 1000 }
            },
        }),
    );
}
/// Runs a `composite` aggregation with a single `date_histogram` source on `timestamp`
/// (calendar interval `month`) and a page size of 1000.
fn composite_histogram_calendar(index: &Index) {
    let sources = json!([
        {
            "time_histogram": {
                "date_histogram": { "field": "timestamp", "calendar_interval": "month" }
            }
        }
    ]);
    execute_agg(
        index,
        json!({
            "my_chc": {
                "composite": { "sources": sources, "size": 1000 }
            },
        }),
    );
}

/// Deserializes `agg_req` into an aggregation request and runs it against every document
/// of `index` (via `AllQuery`).
///
/// The search result is passed through `black_box` so the work cannot be optimized away.
/// Panics if the request cannot be deserialized, the reader cannot be created, or the
/// search fails.
fn execute_agg(index: &Index, agg_req: serde_json::Value) {
    let request = serde_json::from_value::<Aggregations>(agg_req).unwrap();
    let collector = get_collector(request);

    let reader = index.reader().unwrap();
    let searcher = reader.searcher();
    let result = searcher.search(&AllQuery, &collector).unwrap();
    black_box(result);
}
/// Runs a `range` aggregation on `score_f64` with six contiguous ranges spanning 3..60000.
fn range_agg(index: &Index) {
    let ranges = json!([
        { "from": 3, "to": 7000 },
        { "from": 7000, "to": 20000 },
        { "from": 20000, "to": 30000 },
        { "from": 30000, "to": 40000 },
        { "from": 40000, "to": 50000 },
        { "from": 50000, "to": 60000 }
    ]);
    execute_agg(
        index,
        json!({
            "range_f64": {
                "range": { "field": "score_f64", "ranges": ranges }
            },
        }),
    );
}
/// Runs a `range` aggregation on `score_f64` (six contiguous ranges spanning 3..60000)
/// with an `avg` sub-aggregation over `score_f64` in every bucket.
fn range_agg_with_avg_sub_agg(index: &Index) {
    let ranges = json!([
        { "from": 3, "to": 7000 },
        { "from": 7000, "to": 20000 },
        { "from": 20000, "to": 30000 },
        { "from": 30000, "to": 40000 },
        { "from": 40000, "to": 50000 },
        { "from": 50000, "to": 60000 }
    ]);
    // Per-bucket metric, built separately and spliced into the request below.
    let per_bucket = json!({
        "average_f64": { "avg": { "field": "score_f64" } }
    });
    execute_agg(
        index,
        json!({
            "rangef64": {
                "range": { "field": "score_f64", "ranges": ranges },
                "aggs": per_bucket
            },
        }),
    );
}

/// Runs a `range` aggregation on `score_f64` (six contiguous ranges spanning 3..60000)
/// with a `terms` sub-aggregation on `text_few_terms_status` in every bucket.
fn range_agg_with_term_agg_status(index: &Index) {
    let ranges = json!([
        { "from": 3, "to": 7000 },
        { "from": 7000, "to": 20000 },
        { "from": 20000, "to": 30000 },
        { "from": 30000, "to": 40000 },
        { "from": 40000, "to": 50000 },
        { "from": 50000, "to": 60000 }
    ]);
    // Per-bucket terms aggregation, built separately and spliced into the request below.
    let per_bucket = json!({
        "my_texts": { "terms": { "field": "text_few_terms_status" } },
    });
    execute_agg(
        index,
        json!({
            "rangef64": {
                "range": { "field": "score_f64", "ranges": ranges },
                "aggs": per_bucket
            },
        }),
    );
}
/// Runs a `range` aggregation on `score_f64` (six contiguous ranges spanning 3..60000)
/// with a `terms` sub-aggregation on `text_many_terms` in every bucket.
fn range_agg_with_term_agg_many(index: &Index) {
    let ranges = json!([
        { "from": 3, "to": 7000 },
        { "from": 7000, "to": 20000 },
        { "from": 20000, "to": 30000 },
        { "from": 30000, "to": 40000 },
        { "from": 40000, "to": 50000 },
        { "from": 50000, "to": 60000 }
    ]);
    // Per-bucket terms aggregation, built separately and spliced into the request below.
    let per_bucket = json!({
        "my_texts": { "terms": { "field": "text_many_terms" } },
    });
    execute_agg(
        index,
        json!({
            "rangef64": {
                "range": { "field": "score_f64", "ranges": ranges },
                "aggs": per_bucket
            },
        }),
    );
}

/// Runs a `histogram` aggregation on `score_f64` with an interval of 100.
///
/// The number of resulting buckets depends on the range of `score_f64` values in the index.
fn histogram(index: &Index) {
    let histogram_params = json!({
        "field": "score_f64",
        "interval": 100
    });
    execute_agg(
        index,
        json!({
            "rangef64": { "histogram": histogram_params }
        }),
    );
}
/// Runs a `histogram` aggregation on `score_f64` (interval 100) restricted by
/// `hard_bounds` of 1000..300000.
fn histogram_hard_bounds(index: &Index) {
    let histogram_params = json!({
        "field": "score_f64",
        "interval": 100,
        "hard_bounds": { "min": 1000, "max": 300000 }
    });
    execute_agg(
        index,
        json!({
            "rangef64": { "histogram": histogram_params },
        }),
    );
}
/// Runs a `histogram` aggregation on `score_f64` (interval 100) with an `avg`
/// sub-aggregation over `score_f64` in every bucket.
fn histogram_with_avg_sub_agg(index: &Index) {
    // Per-bucket metric, built separately and spliced into the request below.
    let per_bucket = json!({
        "average_f64": { "avg": { "field": "score_f64" } }
    });
    execute_agg(
        index,
        json!({
            "rangef64": {
                "histogram": { "field": "score_f64", "interval": 100 },
                "aggs": per_bucket
            }
        }),
    );
}
/// Runs a `histogram` aggregation on `score_f64` (interval 10) with a `terms`
/// sub-aggregation on `text_few_terms_status` in every bucket.
fn histogram_with_term_agg_status(index: &Index) {
    // Per-bucket terms aggregation, built separately and spliced into the request below.
    let per_bucket = json!({
        "my_texts": { "terms": { "field": "text_few_terms_status" } }
    });
    execute_agg(
        index,
        json!({
            "rangef64": {
                "histogram": { "field": "score_f64", "interval": 10 },
                "aggs": per_bucket
            }
        }),
    );
}
/// Runs two top-level aggregations in one request: a `range` aggregation on `score_f64`
/// (three ranges spanning 3..60000) with a per-bucket `avg` of `score`, and a global
/// `avg` of `score`.
fn avg_and_range_with_avg_sub_agg(index: &Index) {
    let ranges = json!([
        { "from": 3, "to": 7000 },
        { "from": 7000, "to": 20000 },
        { "from": 20000, "to": 60000 }
    ]);
    let ranged = json!({
        "range": { "field": "score_f64", "ranges": ranges },
        "aggs": {
            "average_in_range": { "avg": { "field": "score" } }
        }
    });
    execute_agg(
        index,
        json!({
            "rangef64": ranged,
            "average": { "avg": { "field": "score" } }
        }),
    );
}

/// Column cardinality that the benchmark index is built to exhibit.
///
/// `get_test_index_bench` uses this to decide which extra documents to add so that the
/// same benchmark queries can be compared across cardinalities.
#[derive(Clone, Copy, Hash, Default, Debug, PartialEq, Eq, PartialOrd, Ord)]
enum Cardinality {
    /// All documents contain exactly one value.
    /// `Full` is the default for auto-detecting the Cardinality, since it is the most strict.
    #[default]
    Full = 0,
    /// All documents contain at most one value.
    OptionalDense = 1,
    /// All documents may contain any number of values.
    Multivalued = 2,
    /// Only a small fraction of documents has a value: the bench index adds 20 documents
    /// carrying only the `text` field after every populated document (about 1 in 21).
    OptionalSparse = 3,
}

/// Wraps `agg_req` in an `AggregationCollector`, using the default value for the
/// collector's second argument.
fn get_collector(agg_req: Aggregations) -> AggregationCollector {
    let defaults = Default::default();
    AggregationCollector::from_aggs(agg_req, defaults)
}

/// Builds the index used by the aggregation benchmarks, or re-opens a persisted one.
///
/// # Index location
/// * If the `REUSE_AGG_BENCH_INDEX` environment variable is set and the `agg_bench`
///   directory exists, that index is opened and returned as-is. In that case `cardinality`
///   is not consulted.
/// * If the variable is set but the directory is missing, the index is created in
///   `agg_bench` so later runs can reuse it.
/// * Otherwise the index is created in a temporary directory and `agg_bench` is left
///   untouched.
///
/// # Generated data
/// A fixed RNG seed is used, so the generated documents are deterministic.
/// * `OptionalDense`: one empty document is added first.
/// * `Multivalued`: one document carrying two values per field is added first.
/// * `OptionalSparse`: 50_000 populated documents, each followed by 20 documents that only
///   carry the `text` field.
/// * All other cases: 1_000_000 populated documents.
///
/// Everything is written by a single-threaded writer and committed once.
///
/// # Errors
/// Returns any error raised while creating the directory, creating/opening the index,
/// adding documents or committing.
fn get_test_index_bench(cardinality: Cardinality) -> tantivy::Result<Index> {
    // Flag to use existing index
    let reuse_index = std::env::var("REUSE_AGG_BENCH_INDEX").is_ok();
    if reuse_index && std::path::Path::new("agg_bench").exists() {
        return Index::open_in_dir("agg_bench");
    }
    let mut schema_builder = Schema::builder();
    let text_fieldtype = tantivy::schema::TextOptions::default()
        .set_indexing_options(
            TextFieldIndexing::default().set_index_option(IndexRecordOption::WithFreqs),
        )
        .set_stored();
    let text_field = schema_builder.add_text_field("text", text_fieldtype);
    let json_field = schema_builder.add_json_field("json", FAST);
    let text_field_all_unique_terms =
        schema_builder.add_text_field("text_all_unique_terms", STRING | FAST);
    let text_field_many_terms = schema_builder.add_text_field("text_many_terms", STRING | FAST);
    let text_field_few_terms = schema_builder.add_text_field("text_few_terms", STRING | FAST);
    let text_field_few_terms_status =
        schema_builder.add_text_field("text_few_terms_status", STRING | FAST);
    let text_field_1000_terms_zipf =
        schema_builder.add_text_field("text_1000_terms_zipf", STRING | FAST);
    let score_fieldtype = tantivy::schema::NumericOptions::default().set_fast();
    let score_field = schema_builder.add_u64_field("score", score_fieldtype.clone());
    let score_field_f64 = schema_builder.add_f64_field("score_f64", score_fieldtype.clone());
    let score_field_i64 = schema_builder.add_i64_field("score_i64", score_fieldtype);
    let date_field = schema_builder.add_date_field("timestamp", FAST);
    let index = if reuse_index {
        // Create the directory only when the index is actually persisted there. Creating it
        // unconditionally would leave an empty `agg_bench` behind after a tempdir run, and a
        // later run with REUSE_AGG_BENCH_INDEX set would then try to open that empty
        // directory as an index and fail.
        std::fs::create_dir_all("agg_bench")?;
        Index::create_in_dir("agg_bench", schema_builder.build())?
    } else {
        // use tmp dir
        Index::create_from_tempdir(schema_builder.build())?
    };
    // Approximate log proportions
    let status_field_data = [
        ("INFO", 8000),
        ("ERROR", 300),
        ("WARN", 1200),
        ("DEBUG", 500),
        ("OK", 500),
        ("CRITICAL", 20),
        ("EMERGENCY", 1),
    ];
    let log_level_distribution =
        WeightedIndex::new(status_field_data.iter().map(|item| item.1)).unwrap();

    let few_terms_data = ["INFO", "ERROR", "WARN", "DEBUG"];
    let lg_norm = rand_distr::LogNormal::new(2.996f64, 0.979f64).unwrap();

    let many_terms_data = (0..150_000)
        .map(|num| format!("author{num}"))
        .collect::<Vec<_>>();

    // Prepare 1000 unique terms sampled using a Zipf distribution.
    // Exponent ~1.1 approximates top-20 terms covering around ~20%.
    let terms_1000: Vec<String> = (1..=1000).map(|i| format!("term_{i}")).collect();
    let zipf_1000 = rand_distr::Zipf::new(1000.0, 1.1f64).unwrap();

    {
        // Fixed seed: every run generates the same documents.
        let mut rng = StdRng::from_seed([1u8; 32]);
        let mut index_writer = index.writer_with_num_threads(1, 200_000_000)?;
        // To make the different test cases comparable we just change one doc to force the
        // cardinality
        if cardinality == Cardinality::OptionalDense {
            index_writer.add_document(doc!())?;
        }
        if cardinality == Cardinality::Multivalued {
            let log_level_sample_a = status_field_data[log_level_distribution.sample(&mut rng)].0;
            let log_level_sample_b = status_field_data[log_level_distribution.sample(&mut rng)].0;
            // The Zipf samples are used as 1-based ranks, hence the `- 1` to index `terms_1000`.
            let idx_a = zipf_1000.sample(&mut rng) as usize - 1;
            let idx_b = zipf_1000.sample(&mut rng) as usize - 1;
            let term_1000_a = &terms_1000[idx_a];
            let term_1000_b = &terms_1000[idx_b];
            index_writer.add_document(doc!(
                json_field => json!({"mixed_type": 10.0}),
                json_field => json!({"mixed_type": 10.0}),
                text_field => "cool",
                text_field => "cool",
                text_field_all_unique_terms => "cool",
                text_field_all_unique_terms => "coolo",
                text_field_many_terms => "cool",
                text_field_many_terms => "cool",
                text_field_few_terms => "cool",
                text_field_few_terms => "cool",
                text_field_few_terms_status => log_level_sample_a,
                text_field_few_terms_status => log_level_sample_b,
                text_field_1000_terms_zipf => term_1000_a.as_str(),
                text_field_1000_terms_zipf => term_1000_b.as_str(),
                score_field => 1u64,
                score_field => 1u64,
                score_field_f64 => lg_norm.sample(&mut rng),
                score_field_f64 => lg_norm.sample(&mut rng),
                score_field_i64 => 1i64,
                score_field_i64 => 1i64,
            ))?;
        }
        let mut doc_with_value = 1_000_000;
        if cardinality == Cardinality::OptionalSparse {
            doc_with_value /= 20;
        }
        for _ in 0..doc_with_value {
            let val: f64 = rng.random_range(0.0..1_000_000.0);
            let json = if rng.random_bool(0.1) {
                // 10% are numeric values
                json!({ "mixed_type": val })
            } else {
                json!({"mixed_type": many_terms_data.choose(&mut rng).unwrap().to_string()})
            };
            index_writer.add_document(doc!(
                text_field => "cool",
                json_field => json,
                text_field_all_unique_terms => format!("unique_term_{}", rng.random::<u64>()),
                text_field_many_terms => many_terms_data.choose(&mut rng).unwrap().to_string(),
                text_field_few_terms => few_terms_data.choose(&mut rng).unwrap().to_string(),
                text_field_few_terms_status => status_field_data[log_level_distribution.sample(&mut rng)].0,
                text_field_1000_terms_zipf => terms_1000[zipf_1000.sample(&mut rng) as usize - 1].as_str(),
                score_field => val as u64,
                score_field_f64 => lg_norm.sample(&mut rng),
                score_field_i64 => val as i64,
                date_field => DateTime::from_timestamp_millis((val * 1_000_000.) as i64),
            ))?;
            if cardinality == Cardinality::OptionalSparse {
                // Pad with documents that only carry `text`, so the other fields are sparse.
                for _ in 0..20 {
                    index_writer.add_document(doc!(text_field => "cool"))?;
                }
            }
        }
        // writing the segment
        index_writer.commit()?;
    }

    Ok(index)
}

// Filter aggregation benchmarks

/// Runs a `filter` aggregation with the match-all filter `*` and a `value_count`
/// sub-aggregation on `score`.
fn filter_agg_all_query_count_agg(index: &Index) {
    let sub_aggs = json!({
        "count": { "value_count": { "field": "score" } }
    });
    execute_agg(
        index,
        json!({
            "filtered": {
                "filter": "*",
                "aggs": sub_aggs
            }
        }),
    );
}

/// Runs a `filter` aggregation with the term filter `text:cool` and a `value_count`
/// sub-aggregation on `score`.
fn filter_agg_term_query_count_agg(index: &Index) {
    let sub_aggs = json!({
        "count": { "value_count": { "field": "score" } }
    });
    execute_agg(
        index,
        json!({
            "filtered": {
                "filter": "text:cool",
                "aggs": sub_aggs
            }
        }),
    );
}

/// Runs a `filter` aggregation with the match-all filter `*` and three sub-aggregations:
/// `avg` of `score`, `stats` of `score_f64` and `terms` on `text_few_terms_status`.
fn filter_agg_all_query_with_sub_aggs(index: &Index) {
    let sub_aggs = json!({
        "avg_score": { "avg": { "field": "score" } },
        "stats_score": { "stats": { "field": "score_f64" } },
        "terms_text": {
            "terms": { "field": "text_few_terms_status" }
        }
    });
    execute_agg(
        index,
        json!({
            "filtered": {
                "filter": "*",
                "aggs": sub_aggs
            }
        }),
    );
}

/// Runs a `filter` aggregation with the term filter `text:cool` and three sub-aggregations:
/// `avg` of `score`, `stats` of `score_f64` and `terms` on `text_few_terms_status`.
fn filter_agg_term_query_with_sub_aggs(index: &Index) {
    let sub_aggs = json!({
        "avg_score": { "avg": { "field": "score" } },
        "stats_score": { "stats": { "field": "score_f64" } },
        "terms_text": {
            "terms": { "field": "text_few_terms_status" }
        }
    });
    execute_agg(
        index,
        json!({
            "filtered": {
                "filter": "text:cool",
                "aggs": sub_aggs
            }
        }),
    );
}


================================================
FILE: benches/alice.txt
================================================
﻿The Project Gutenberg EBook of Alice’s Adventures in Wonderland, by Lewis Carroll

This eBook is for the use of anyone anywhere in the United States and most
other parts of the world at no cost and with almost no restrictions
whatsoever.  You may copy it, give it away or re-use it under the terms of
the Project Gutenberg License included with this eBook or online at
www.gutenberg.org.  If you are not located in the United States, you'll have
to check the laws of the country where you are located before using this ebook.

Title: Alice’s Adventures in Wonderland

Author: Lewis Carroll

Release Date: June 25, 2008 [EBook #11]
[Most recently updated: October 12, 2020]

Language: English

Character set encoding: UTF-8

*** START OF THIS PROJECT GUTENBERG EBOOK ALICE’S ADVENTURES IN WONDERLAND ***


Produced by Arthur DiBianca and David Widger

[Illustration]


Alice’s Adventures in Wonderland

by Lewis Carroll

THE MILLENNIUM FULCRUM EDITION 3.0

Contents

 CHAPTER I.     Down the Rabbit-Hole
 CHAPTER II.    The Pool of Tears
 CHAPTER III.   A Caucus-Race and a Long Tale
 CHAPTER IV.    The Rabbit Sends in a Little Bill
 CHAPTER V.     Advice from a Caterpillar
 CHAPTER VI.    Pig and Pepper
 CHAPTER VII.   A Mad Tea-Party
 CHAPTER VIII.  The Queen’s Croquet-Ground
 CHAPTER IX.    The Mock Turtle’s Story
 CHAPTER X.     The Lobster Quadrille
 CHAPTER XI.    Who Stole the Tarts?
 CHAPTER XII.   Alice’s Evidence


CHAPTER I.
Down the Rabbit-Hole


Alice was beginning to get very tired of sitting by her sister on the
bank, and of having nothing to do: once or twice she had peeped into
the book her sister was reading, but it had no pictures or
conversations in it, “and what is the use of a book,” thought Alice
“without pictures or conversations?”

So she was considering in her own mind (as well as she could, for the
hot day made her feel very sleepy and stupid), whether the pleasure of
making a daisy-chain would be worth the trouble of getting up and
picking the daisies, when suddenly a White Rabbit with pink eyes ran
close by her.

There was nothing so _very_ remarkable in that; nor did Alice think it
so _very_ much out of the way to hear the Rabbit say to itself, “Oh
dear! Oh dear! I shall be late!” (when she thought it over afterwards,
it occurred to her that she ought to have wondered at this, but at the
time it all seemed quite natural); but when the Rabbit actually _took a
watch out of its waistcoat-pocket_, and looked at it, and then hurried
on, Alice started to her feet, for it flashed across her mind that she
had never before seen a rabbit with either a waistcoat-pocket, or a
watch to take out of it, and burning with curiosity, she ran across the
field after it, and fortunately was just in time to see it pop down a
large rabbit-hole under the hedge.

In another moment down went Alice after it, never once considering how
in the world she was to get out again.

The rabbit-hole went straight on like a tunnel for some way, and then
dipped suddenly down, so suddenly that Alice had not a moment to think
about stopping herself before she found herself falling down a very
deep well.

Either the well was very deep, or she fell very slowly, for she had
plenty of time as she went down to look about her and to wonder what
was going to happen next. First, she tried to look down and make out
what she was coming to, but it was too dark to see anything; then she
looked at the sides of the well, and noticed that they were filled with
cupboards and book-shelves; here and there she saw maps and pictures
hung upon pegs. She took down a jar from one of the shelves as she
passed; it was labelled “ORANGE MARMALADE”, but to her great
disappointment it was empty: she did not like to drop the jar for fear
of killing somebody underneath, so managed to put it into one of the
cupboards as she fell past it.

“Well!” thought Alice to herself, “after such a fall as this, I shall
think nothing of tumbling down stairs! How brave they’ll all think me
at home! Why, I wouldn’t say anything about it, even if I fell off the
top of the house!” (Which was very likely true.)

Down, down, down. Would the fall _never_ come to an end? “I wonder how
many miles I’ve fallen by this time?” she said aloud. “I must be
getting somewhere near the centre of the earth. Let me see: that would
be four thousand miles down, I think—” (for, you see, Alice had learnt
several things of this sort in her lessons in the schoolroom, and
though this was not a _very_ good opportunity for showing off her
knowledge, as there was no one to listen to her, still it was good
practice to say it over) “—yes, that’s about the right distance—but
then I wonder what Latitude or Longitude I’ve got to?” (Alice had no
idea what Latitude was, or Longitude either, but thought they were nice
grand words to say.)

Presently she began again. “I wonder if I shall fall right _through_
the earth! How funny it’ll seem to come out among the people that walk
with their heads downward! The Antipathies, I think—” (she was rather
glad there _was_ no one listening, this time, as it didn’t sound at all
the right word) “—but I shall have to ask them what the name of the
country is, you know. Please, Ma’am, is this New Zealand or Australia?”
(and she tried to curtsey as she spoke—fancy _curtseying_ as you’re
falling through the air! Do you think you could manage it?) “And what
an ignorant little girl she’ll think me for asking! No, it’ll never do
to ask: perhaps I shall see it written up somewhere.”

Down, down, down. There was nothing else to do, so Alice soon began
talking again. “Dinah’ll miss me very much to-night, I should think!”
(Dinah was the cat.) “I hope they’ll remember her saucer of milk at
tea-time. Dinah my dear! I wish you were down here with me! There are
no mice in the air, I’m afraid, but you might catch a bat, and that’s
very like a mouse, you know. But do cats eat bats, I wonder?” And here
Alice began to get rather sleepy, and went on saying to herself, in a
dreamy sort of way, “Do cats eat bats? Do cats eat bats?” and
sometimes, “Do bats eat cats?” for, you see, as she couldn’t answer
either question, it didn’t much matter which way she put it. She felt
that she was dozing off, and had just begun to dream that she was
walking hand in hand with Dinah, and saying to her very earnestly,
“Now, Dinah, tell me the truth: did you ever eat a bat?” when suddenly,
thump! thump! down she came upon a heap of sticks and dry leaves, and
the fall was over.

Alice was not a bit hurt, and she jumped up on to her feet in a moment:
she looked up, but it was all dark overhead; before her was another
long passage, and the White Rabbit was still in sight, hurrying down
it. There was not a moment to be lost: away went Alice like the wind,
and was just in time to hear it say, as it turned a corner, “Oh my ears
and whiskers, how late it’s getting!” She was close behind it when she
turned the corner, but the Rabbit was no longer to be seen: she found
herself in a long, low hall, which was lit up by a row of lamps hanging
from the roof.

There were doors all round the hall, but they were all locked; and when
Alice had been all the way down one side and up the other, trying every
door, she walked sadly down the middle, wondering how she was ever to
get out again.

Suddenly she came upon a little three-legged table, all made of solid
glass; there was nothing on it except a tiny golden key, and Alice’s
first thought was that it might belong to one of the doors of the hall;
but, alas! either the locks were too large, or the key was too small,
but at any rate it would not open any of them. However, on the second
time round, she came upon a low curtain she had not noticed before, and
behind it was a little door about fifteen inches high: she tried the
little golden key in the lock, and to her great delight it fitted!

Alice opened the door and found that it led into a small passage, not
much larger than a rat-hole: she knelt down and looked along the
passage into the loveliest garden you ever saw. How she longed to get
out of that dark hall, and wander about among those beds of bright
flowers and those cool fountains, but she could not even get her head
through the doorway; “and even if my head would go through,” thought
poor Alice, “it would be of very little use without my shoulders. Oh,
how I wish I could shut up like a telescope! I think I could, if I only
knew how to begin.” For, you see, so many out-of-the-way things had
happened lately, that Alice had begun to think that very few things
indeed were really impossible.

There seemed to be no use in waiting by the little door, so she went
back to the table, half hoping she might find another key on it, or at
any rate a book of rules for shutting people up like telescopes: this
time she found a little bottle on it, (“which certainly was not here
before,” said Alice,) and round the neck of the bottle was a paper
label, with the words “DRINK ME,” beautifully printed on it in large
letters.

It was all very well to say “Drink me,” but the wise little Alice was
not going to do _that_ in a hurry. “No, I’ll look first,” she said,
“and see whether it’s marked ‘_poison_’ or not”; for she had read
several nice little histories about children who had got burnt, and
eaten up by wild beasts and other unpleasant things, all because they
_would_ not remember the simple rules their friends had taught them:
such as, that a red-hot poker will burn you if you hold it too long;
and that if you cut your finger _very_ deeply with a knife, it usually
bleeds; and she had never forgotten that, if you drink much from a
bottle marked “poison,” it is almost certain to disagree with you,
sooner or later.

However, this bottle was _not_ marked “poison,” so Alice ventured to
taste it, and finding it very nice, (it had, in fact, a sort of mixed
flavour of cherry-tart, custard, pine-apple, roast turkey, toffee, and
hot buttered toast,) she very soon finished it off.

*      *      *      *      *      *      *

    *      *      *      *      *      *

*      *      *      *      *      *      *


“What a curious feeling!” said Alice; “I must be shutting up like a
telescope.”

And so it was indeed: she was now only ten inches high, and her face
brightened up at the thought that she was now the right size for going
through the little door into that lovely garden. First, however, she
waited for a few minutes to see if she was going to shrink any further:
she felt a little nervous about this; “for it might end, you know,”
said Alice to herself, “in my going out altogether, like a candle. I
wonder what I should be like then?” And she tried to fancy what the
flame of a candle is like after the candle is blown out, for she could
not remember ever having seen such a thing.

After a while, finding that nothing more happened, she decided on going
into the garden at once; but, alas for poor Alice! when she got to the
door, she found she had forgotten the little golden key, and when she
went back to the table for it, she found she could not possibly reach
it: she could see it quite plainly through the glass, and she tried her
best to climb up one of the legs of the table, but it was too slippery;
and when she had tired herself out with trying, the poor little thing
sat down and cried.

“Come, there’s no use in crying like that!” said Alice to herself,
rather sharply; “I advise you to leave off this minute!” She generally
gave herself very good advice, (though she very seldom followed it),
and sometimes she scolded herself so severely as to bring tears into
her eyes; and once she remembered trying to box her own ears for having
cheated herself in a game of croquet she was playing against herself,
for this curious child was very fond of pretending to be two people.
“But it’s no use now,” thought poor Alice, “to pretend to be two
people! Why, there’s hardly enough of me left to make _one_ respectable
person!”

Soon her eye fell on a little glass box that was lying under the table:
she opened it, and found in it a very small cake, on which the words
“EAT ME” were beautifully marked in currants. “Well, I’ll eat it,” said
Alice, “and if it makes me grow larger, I can reach the key; and if it
makes me grow smaller, I can creep under the door; so either way I’ll
get into the garden, and I don’t care which happens!”

She ate a little bit, and said anxiously to herself, “Which way? Which
way?”, holding her hand on the top of her head to feel which way it was
growing, and she was quite surprised to find that she remained the same
size: to be sure, this generally happens when one eats cake, but Alice
had got so much into the way of expecting nothing but out-of-the-way
things to happen, that it seemed quite dull and stupid for life to go
on in the common way.

So she set to work, and very soon finished off the cake.

*      *      *      *      *      *      *

    *      *      *      *      *      *

*      *      *      *      *      *      *


CHAPTER II.
The Pool of Tears


“Curiouser and curiouser!” cried Alice (she was so much surprised, that
for the moment she quite forgot how to speak good English); “now I’m
opening out like the largest telescope that ever was! Good-bye, feet!”
(for when she looked down at her feet, they seemed to be almost out of
sight, they were getting so far off). “Oh, my poor little feet, I
wonder who will put on your shoes and stockings for you now, dears? I’m
sure _I_ shan’t be able! I shall be a great deal too far off to trouble
myself about you: you must manage the best way you can;—but I must be
kind to them,” thought Alice, “or perhaps they won’t walk the way I
want to go! Let me see: I’ll give them a new pair of boots every
Christmas.”

And she went on planning to herself how she would manage it. “They must
go by the carrier,” she thought; “and how funny it’ll seem, sending
presents to one’s own feet! And how odd the directions will look!

     _Alice’s Right Foot, Esq., Hearthrug, near the Fender,_ (_with
     Alice’s love_).

Oh dear, what nonsense I’m talking!”

Just then her head struck against the roof of the hall: in fact she was
now more than nine feet high, and she at once took up the little golden
key and hurried off to the garden door.

Poor Alice! It was as much as she could do, lying down on one side, to
look through into the garden with one eye; but to get through was more
hopeless than ever: she sat down and began to cry again.

“You ought to be ashamed of yourself,” said Alice, “a great girl like
you,” (she might well say this), “to go on crying in this way! Stop
this moment, I tell you!” But she went on all the same, shedding
gallons of tears, until there was a large pool all round her, about
four inches deep and reaching half down the hall.

After a time she heard a little pattering of feet in the distance, and
she hastily dried her eyes to see what was coming. It was the White
Rabbit returning, splendidly dressed, with a pair of white kid gloves
in one hand and a large fan in the other: he came trotting along in a
great hurry, muttering to himself as he came, “Oh! the Duchess, the
Duchess! Oh! won’t she be savage if I’ve kept her waiting!” Alice felt
so desperate that she was ready to ask help of any one; so, when the
Rabbit came near her, she began, in a low, timid voice, “If you please,
sir—” The Rabbit started violently, dropped the white kid gloves and
the fan, and skurried away into the darkness as hard as he could go.

Alice took up the fan and gloves, and, as the hall was very hot, she
kept fanning herself all the time she went on talking: “Dear, dear! How
queer everything is to-day! And yesterday things went on just as usual.
I wonder if I’ve been changed in the night? Let me think: was I the
same when I got up this morning? I almost think I can remember feeling
a little different. But if I’m not the same, the next question is, Who
in the world am I? Ah, _that’s_ the great puzzle!” And she began
thinking over all the children she knew that were of the same age as
herself, to see if she could have been changed for any of them.

“I’m sure I’m not Ada,” she said, “for her hair goes in such long
ringlets, and mine doesn’t go in ringlets at all; and I’m sure I can’t
be Mabel, for I know all sorts of things, and she, oh! she knows such a
very little! Besides, _she’s_ she, and _I’m_ I, and—oh dear, how
puzzling it all is! I’ll try if I know all the things I used to know.
Let me see: four times five is twelve, and four times six is thirteen,
and four times seven is—oh dear! I shall never get to twenty at that
rate! However, the Multiplication Table doesn’t signify: let’s try
Geography. London is the capital of Paris, and Paris is the capital of
Rome, and Rome—no, _that’s_ all wrong, I’m certain! I must have been
changed for Mabel! I’ll try and say ‘_How doth the little_—’” and she
crossed her hands on her lap as if she were saying lessons, and began
to repeat it, but her voice sounded hoarse and strange, and the words
did not come the same as they used to do:—

“How doth the little crocodile
    Improve his shining tail,
And pour the waters of the Nile
    On every golden scale!

“How cheerfully he seems to grin,
    How neatly spread his claws,
And welcome little fishes in
    With gently smiling jaws!”


“I’m sure those are not the right words,” said poor Alice, and her eyes
filled with tears again as she went on, “I must be Mabel after all, and
I shall have to go and live in that poky little house, and have next to
no toys to play with, and oh! ever so many lessons to learn! No, I’ve
made up my mind about it; if I’m Mabel, I’ll stay down here! It’ll be
no use their putting their heads down and saying ‘Come up again, dear!’
I shall only look up and say ‘Who am I then? Tell me that first, and
then, if I like being that person, I’ll come up: if not, I’ll stay down
here till I’m somebody else’—but, oh dear!” cried Alice, with a sudden
burst of tears, “I do wish they _would_ put their heads down! I am so
_very_ tired of being all alone here!”

As she said this she looked down at her hands, and was surprised to see
that she had put on one of the Rabbit’s little white kid gloves while
she was talking. “How _can_ I have done that?” she thought. “I must be
growing small again.” She got up and went to the table to measure
herself by it, and found that, as nearly as she could guess, she was
now about two feet high, and was going on shrinking rapidly: she soon
found out that the cause of this was the fan she was holding, and she
dropped it hastily, just in time to avoid shrinking away altogether.

“That _was_ a narrow escape!” said Alice, a good deal frightened at the
sudden change, but very glad to find herself still in existence; “and
now for the garden!” and she ran with all speed back to the little
door: but, alas! the little door was shut again, and the little golden
key was lying on the glass table as before, “and things are worse than
ever,” thought the poor child, “for I never was so small as this
before, never! And I declare it’s too bad, that it is!”

As she said these words her foot slipped, and in another moment,
splash! she was up to her chin in salt water. Her first idea was that
she had somehow fallen into the sea, “and in that case I can go back by
railway,” she said to herself. (Alice had been to the seaside once in
her life, and had come to the general conclusion, that wherever you go
to on the English coast you find a number of bathing machines in the
sea, some children digging in the sand with wooden spades, then a row
of lodging houses, and behind them a railway station.) However, she
soon made out that she was in the pool of tears which she had wept when
she was nine feet high.

“I wish I hadn’t cried so much!” said Alice, as she swam about, trying
to find her way out. “I shall be punished for it now, I suppose, by
being drowned in my own tears! That _will_ be a queer thing, to be
sure! However, everything is queer to-day.”

Just then she heard something splashing about in the pool a little way
off, and she swam nearer to make out what it was: at first she thought
it must be a walrus or hippopotamus, but then she remembered how small
she was now, and she soon made out that it was only a mouse that had
slipped in like herself.

“Would it be of any use, now,” thought Alice, “to speak to this mouse?
Everything is so out-of-the-way down here, that I should think very
likely it can talk: at any rate, there’s no harm in trying.” So she
began: “O Mouse, do you know the way out of this pool? I am very tired
of swimming about here, O Mouse!” (Alice thought this must be the right
way of speaking to a mouse: she had never done such a thing before, but
she remembered having seen in her brother’s Latin Grammar, “A mouse—of
a mouse—to a mouse—a mouse—O mouse!”) The Mouse looked at her rather
inquisitively, and seemed to her to wink with one of its little eyes,
but it said nothing.

“Perhaps it doesn’t understand English,” thought Alice; “I daresay it’s
a French mouse, come over with William the Conqueror.” (For, with all
her knowledge of history, Alice had no very clear notion how long ago
anything had happened.) So she began again: “Où est ma chatte?” which
was the first sentence in her French lesson-book. The Mouse gave a
sudden leap out of the water, and seemed to quiver all over with
fright. “Oh, I beg your pardon!” cried Alice hastily, afraid that she
had hurt the poor animal’s feelings. “I quite forgot you didn’t like
cats.”

“Not like cats!” cried the Mouse, in a shrill, passionate voice. “Would
_you_ like cats if you were me?”

“Well, perhaps not,” said Alice in a soothing tone: “don’t be angry
about it. And yet I wish I could show you our cat Dinah: I think you’d
take a fancy to cats if you could only see her. She is such a dear
quiet thing,” Alice went on, half to herself, as she swam lazily about
in the pool, “and she sits purring so nicely by the fire, licking her
paws and washing her face—and she is such a nice soft thing to
nurse—and she’s such a capital one for catching mice—oh, I beg your
pardon!” cried Alice again, for this time the Mouse was bristling all
over, and she felt certain it must be really offended. “We won’t talk
about her any more if you’d rather not.”

“We indeed!” cried the Mouse, who was trembling down to the end of his
tail. “As if _I_ would talk on such a subject! Our family always
_hated_ cats: nasty, low, vulgar things! Don’t let me hear the name
again!”

“I won’t indeed!” said Alice, in a great hurry to change the subject of
conversation. “Are you—are you fond—of—of dogs?” The Mouse did not
answer, so Alice went on eagerly: “There is such a nice little dog near
our house I should like to show you! A little bright-eyed terrier, you
know, with oh, such long curly brown hair! And it’ll fetch things when
you throw them, and it’ll sit up and beg for its dinner, and all sorts
of things—I can’t remember half of them—and it belongs to a farmer, you
know, and he says it’s so useful, it’s worth a hundred pounds! He says
it kills all the rats and—oh dear!” cried Alice in a sorrowful tone,
“I’m afraid I’ve offended it again!” For the Mouse was swimming away
from her as hard as it could go, and making quite a commotion in the
pool as it went.

So she called softly after it, “Mouse dear! Do come back again, and we
won’t talk about cats or dogs either, if you don’t like them!” When the
Mouse heard this, it turned round and swam slowly back to her: its face
was quite pale (with passion, Alice thought), and it said in a low
trembling voice, “Let us get to the shore, and then I’ll tell you my
history, and you’ll understand why it is I hate cats and dogs.”

It was high time to go, for the pool was getting quite crowded with the
birds and animals that had fallen into it: there were a Duck and a
Dodo, a Lory and an Eaglet, and several other curious creatures. Alice
led the way, and the whole party swam to the shore.


CHAPTER III.
A Caucus-Race and a Long Tale


They were indeed a queer-looking party that assembled on the bank—the
birds with draggled feathers, the animals with their fur clinging close
to them, and all dripping wet, cross, and uncomfortable.

The first question of course was, how to get dry again: they had a
consultation about this, and after a few minutes it seemed quite
natural to Alice to find herself talking familiarly with them, as if
she had known them all her life. Indeed, she had quite a long argument
with the Lory, who at last turned sulky, and would only say, “I am
older than you, and must know better;” and this Alice would not allow
without knowing how old it was, and, as the Lory positively refused to
tell its age, there was no more to be said.

At last the Mouse, who seemed to be a person of authority among them,
called out, “Sit down, all of you, and listen to me! _I’ll_ soon make
you dry enough!” They all sat down at once, in a large ring, with the
Mouse in the middle. Alice kept her eyes anxiously fixed on it, for she
felt sure she would catch a bad cold if she did not get dry very soon.

“Ahem!” said the Mouse with an important air, “are you all ready? This
is the driest thing I know. Silence all round, if you please! ‘William
the Conqueror, whose cause was favoured by the pope, was soon submitted
to by the English, who wanted leaders, and had been of late much
accustomed to usurpation and conquest. Edwin and Morcar, the earls of
Mercia and Northumbria—’”

“Ugh!” said the Lory, with a shiver.

“I beg your pardon!” said the Mouse, frowning, but very politely: “Did
you speak?”

“Not I!” said the Lory hastily.

“I thought you did,” said the Mouse. “—I proceed. ‘Edwin and Morcar,
the earls of Mercia and Northumbria, declared for him: and even
Stigand, the patriotic archbishop of Canterbury, found it advisable—’”

“Found _what_?” said the Duck.

“Found _it_,” the Mouse replied rather crossly: “of course you know
what ‘it’ means.”

“I know what ‘it’ means well enough, when _I_ find a thing,” said the
Duck: “it’s generally a frog or a worm. The question is, what did the
archbishop find?”

The Mouse did not notice this question, but hurriedly went on, “‘—found
it advisable to go with Edgar Atheling to meet William and offer him
the crown. William’s conduct at first was moderate. But the insolence
of his Normans—’ How are you getting on now, my dear?” it continued,
turning to Alice as it spoke.

“As wet as ever,” said Alice in a melancholy tone: “it doesn’t seem to
dry me at all.”

“In that case,” said the Dodo solemnly, rising to its feet, “I move
that the meeting adjourn, for the immediate adoption of more energetic
remedies—”

“Speak English!” said the Eaglet. “I don’t know the meaning of half
those long words, and, what’s more, I don’t believe you do either!” And
the Eaglet bent down its head to hide a smile: some of the other birds
tittered audibly.

“What I was going to say,” said the Dodo in an offended tone, “was,
that the best thing to get us dry would be a Caucus-race.”

“What _is_ a Caucus-race?” said Alice; not that she wanted much to
know, but the Dodo had paused as if it thought that _somebody_ ought to
speak, and no one else seemed inclined to say anything.

“Why,” said the Dodo, “the best way to explain it is to do it.” (And,
as you might like to try the thing yourself, some winter day, I will
tell you how the Dodo managed it.)

First it marked out a race-course, in a sort of circle, (“the exact
shape doesn’t matter,” it said,) and then all the party were placed
along the course, here and there. There was no “One, two, three, and
away,” but they began running when they liked, and left off when they
liked, so that it was not easy to know when the race was over. However,
when they had been running half an hour or so, and were quite dry
again, the Dodo suddenly called out “The race is over!” and they all
crowded round it, panting, and asking, “But who has won?”

This question the Dodo could not answer without a great deal of
thought, and it sat for a long time with one finger pressed upon its
forehead (the position in which you usually see Shakespeare, in the
pictures of him), while the rest waited in silence. At last the Dodo
said, “_Everybody_ has won, and all must have prizes.”

“But who is to give the prizes?” quite a chorus of voices asked.

“Why, _she_, of course,” said the Dodo, pointing to Alice with one
finger; and the whole party at once crowded round her, calling out in a
confused way, “Prizes! Prizes!”

Alice had no idea what to do, and in despair she put her hand in her
pocket, and pulled out a box of comfits, (luckily the salt water had
not got into it), and handed them round as prizes. There was exactly
one a-piece, all round.

“But she must have a prize herself, you know,” said the Mouse.

“Of course,” the Dodo replied very gravely. “What else have you got in
your pocket?” he went on, turning to Alice.

“Only a thimble,” said Alice sadly.

“Hand it over here,” said the Dodo.

Then they all crowded round her once more, while the Dodo solemnly
presented the thimble, saying “We beg your acceptance of this elegant
thimble;” and, when it had finished this short speech, they all
cheered.

Alice thought the whole thing very absurd, but they all looked so grave
that she did not dare to laugh; and, as she could not think of anything
to say, she simply bowed, and took the thimble, looking as solemn as
she could.

The next thing was to eat the comfits: this caused some noise and
confusion, as the large birds complained that they could not taste
theirs, and the small ones choked and had to be patted on the back.
However, it was over at last, and they sat down again in a ring, and
begged the Mouse to tell them something more.

“You promised to tell me your history, you know,” said Alice, “and why
it is you hate—C and D,” she added in a whisper, half afraid that it
would be offended again.

“Mine is a long and a sad tale!” said the Mouse, turning to Alice, and
sighing.

“It _is_ a long tail, certainly,” said Alice, looking down with wonder
at the Mouse’s tail; “but why do you call it sad?” And she kept on
puzzling about it while the Mouse was speaking, so that her idea of the
tale was something like this:—

         “Fury said to a mouse, That he met in the house, ‘Let us both
         go to law: _I_ will prosecute _you_.—Come, I’ll take no
         denial; We must have a trial: For really this morning I’ve
         nothing to do.’ Said the mouse to the cur, ‘Such a trial, dear
         sir, With no jury or judge, would be wasting our breath.’
         ‘I’ll be judge, I’ll be jury,’ Said cunning old Fury: ‘I’ll
         try the whole cause, and condemn you to death.’”

“You are not attending!” said the Mouse to Alice severely. “What are
you thinking of?”

“I beg your pardon,” said Alice very humbly: “you had got to the fifth
bend, I think?”

“I had _not!_” cried the Mouse, sharply and very angrily.

“A knot!” said Alice, always ready to make herself useful, and looking
anxiously about her. “Oh, do let me help to undo it!”

“I shall do nothing of the sort,” said the Mouse, getting up and
walking away. “You insult me by talking such nonsense!”

“I didn’t mean it!” pleaded poor Alice. “But you’re so easily offended,
you know!”

The Mouse only growled in reply.

“Please come back and finish your story!” Alice called after it; and
the others all joined in chorus, “Yes, please do!” but the Mouse only
shook its head impatiently, and walked a little quicker.

“What a pity it wouldn’t stay!” sighed the Lory, as soon as it was
quite out of sight; and an old Crab took the opportunity of saying to
her daughter “Ah, my dear! Let this be a lesson to you never to lose
_your_ temper!” “Hold your tongue, Ma!” said the young Crab, a little
snappishly. “You’re enough to try the patience of an oyster!”

“I wish I had our Dinah here, I know I do!” said Alice aloud,
addressing nobody in particular. “She’d soon fetch it back!”

“And who is Dinah, if I might venture to ask the question?” said the
Lory.

Alice replied eagerly, for she was always ready to talk about her pet:
“Dinah’s our cat. And she’s such a capital one for catching mice you
can’t think! And oh, I wish you could see her after the birds! Why,
she’ll eat a little bird as soon as look at it!”

This speech caused a remarkable sensation among the party. Some of the
birds hurried off at once: one old Magpie began wrapping itself up very
carefully, remarking, “I really must be getting home; the night-air
doesn’t suit my throat!” and a Canary called out in a trembling voice
to its children, “Come away, my dears! It’s high time you were all in
bed!” On various pretexts they all moved off, and Alice was soon left
alone.

“I wish I hadn’t mentioned Dinah!” she said to herself in a melancholy
tone. “Nobody seems to like her, down here, and I’m sure she’s the best
cat in the world! Oh, my dear Dinah! I wonder if I shall ever see you
any more!” And here poor Alice began to cry again, for she felt very
lonely and low-spirited. In a little while, however, she again heard a
little pattering of footsteps in the distance, and she looked up
eagerly, half hoping that the Mouse had changed his mind, and was
coming back to finish his story.


CHAPTER IV.
The Rabbit Sends in a Little Bill


It was the White Rabbit, trotting slowly back again, and looking
anxiously about as it went, as if it had lost something; and she heard
it muttering to itself “The Duchess! The Duchess! Oh my dear paws! Oh
my fur and whiskers! She’ll get me executed, as sure as ferrets are
ferrets! Where _can_ I have dropped them, I wonder?” Alice guessed in a
moment that it was looking for the fan and the pair of white kid
gloves, and she very good-naturedly began hunting about for them, but
they were nowhere to be seen—everything seemed to have changed since
her swim in the pool, and the great hall, with the glass table and the
little door, had vanished completely.

Very soon the Rabbit noticed Alice, as she went hunting about, and
called out to her in an angry tone, “Why, Mary Ann, what _are_ you
doing out here? Run home this moment, and fetch me a pair of gloves and
a fan! Quick, now!” And Alice was so much frightened that she ran off
at once in the direction it pointed to, without trying to explain the
mistake it had made.

“He took me for his housemaid,” she said to herself as she ran. “How
surprised he’ll be when he finds out who I am! But I’d better take him
his fan and gloves—that is, if I can find them.” As she said this, she
came upon a neat little house, on the door of which was a bright brass
plate with the name “W. RABBIT,” engraved upon it. She went in without
knocking, and hurried upstairs, in great fear lest she should meet the
real Mary Ann, and be turned out of the house before she had found the
fan and gloves.

“How queer it seems,” Alice said to herself, “to be going messages for
a rabbit! I suppose Dinah’ll be sending me on messages next!” And she
began fancying the sort of thing that would happen: “‘Miss Alice! Come
here directly, and get ready for your walk!’ ‘Coming in a minute,
nurse! But I’ve got to see that the mouse doesn’t get out.’ Only I
don’t think,” Alice went on, “that they’d let Dinah stop in the house
if it began ordering people about like that!”

By this time she had found her way into a tidy little room with a table
in the window, and on it (as she had hoped) a fan and two or three
pairs of tiny white kid gloves: she took up the fan and a pair of the
gloves, and was just going to leave the room, when her eye fell upon a
little bottle that stood near the looking-glass. There was no label
this time with the words “DRINK ME,” but nevertheless she uncorked it
and put it to her lips. “I know _something_ interesting is sure to
happen,” she said to herself, “whenever I eat or drink anything; so
I’ll just see what this bottle does. I do hope it’ll make me grow large
again, for really I’m quite tired of being such a tiny little thing!”

It did so indeed, and much sooner than she had expected: before she had
drunk half the bottle, she found her head pressing against the ceiling,
and had to stoop to save her neck from being broken. She hastily put
down the bottle, saying to herself “That’s quite enough—I hope I shan’t
grow any more—As it is, I can’t get out at the door—I do wish I hadn’t
drunk quite so much!”

Alas! it was too late to wish that! She went on growing, and growing,
and very soon had to kneel down on the floor: in another minute there
was not even room for this, and she tried the effect of lying down with
one elbow against the door, and the other arm curled round her head.
Still she went on growing, and, as a last resource, she put one arm out
of the window, and one foot up the chimney, and said to herself “Now I
can do no more, whatever happens. What _will_ become of me?”

Luckily for Alice, the little magic bottle had now had its full effect,
and she grew no larger: still it was very uncomfortable, and, as there
seemed to be no sort of chance of her ever getting out of the room
again, no wonder she felt unhappy.

“It was much pleasanter at home,” thought poor Alice, “when one wasn’t
always growing larger and smaller, and being ordered about by mice and
rabbits. I almost wish I hadn’t gone down that rabbit-hole—and yet—and
yet—it’s rather curious, you know, this sort of life! I do wonder what
_can_ have happened to me! When I used to read fairy-tales, I fancied
that kind of thing never happened, and now here I am in the middle of
one! There ought to be a book written about me, that there ought! And
when I grow up, I’ll write one—but I’m grown up now,” she added in a
sorrowful tone; “at least there’s no room to grow up any more _here_.”

“But then,” thought Alice, “shall I _never_ get any older than I am
now? That’ll be a comfort, one way—never to be an old woman—but
then—always to have lessons to learn! Oh, I shouldn’t like _that!_”

“Oh, you foolish Alice!” she answered herself. “How can you learn
lessons in here? Why, there’s hardly room for _you_, and no room at all
for any lesson-books!”

And so she went on, taking first one side and then the other, and
making quite a conversation of it altogether; but after a few minutes
she heard a voice outside, and stopped to listen.

“Mary Ann! Mary Ann!” said the voice. “Fetch me my gloves this moment!”
Then came a little pattering of feet on the stairs. Alice knew it was
the Rabbit coming to look for her, and she trembled till she shook the
house, quite forgetting that she was now about a thousand times as
large as the Rabbit, and had no reason to be afraid of it.

Presently the Rabbit came up to the door, and tried to open it; but, as
the door opened inwards, and Alice’s elbow was pressed hard against it,
that attempt proved a failure. Alice heard it say to itself “Then I’ll
go round and get in at the window.”

“_That_ you won’t!” thought Alice, and, after waiting till she fancied
she heard the Rabbit just under the window, she suddenly spread out her
hand, and made a snatch in the air. She did not get hold of anything,
but she heard a little shriek and a fall, and a crash of broken glass,
from which she concluded that it was just possible it had fallen into a
cucumber-frame, or something of the sort.

Next came an angry voice—the Rabbit’s—“Pat! Pat! Where are you?” And
then a voice she had never heard before, “Sure then I’m here! Digging
for apples, yer honour!”

“Digging for apples, indeed!” said the Rabbit angrily. “Here! Come and
help me out of _this!_” (Sounds of more broken glass.)

“Now tell me, Pat, what’s that in the window?”

“Sure, it’s an arm, yer honour!” (He pronounced it “arrum.”)

“An arm, you goose! Who ever saw one that size? Why, it fills the whole
window!”

“Sure, it does, yer honour: but it’s an arm for all that.”

“Well, it’s got no business there, at any rate: go and take it away!”

There was a long silence after this, and Alice could only hear whispers
now and then; such as, “Sure, I don’t like it, yer honour, at all, at
all!” “Do as I tell you, you coward!” and at last she spread out her
hand again, and made another snatch in the air. This time there were
_two_ little shrieks, and more sounds of broken glass. “What a number
of cucumber-frames there must be!” thought Alice. “I wonder what
they’ll do next! As for pulling me out of the window, I only wish they
_could!_ I’m sure _I_ don’t want to stay in here any longer!”

She waited for some time without hearing anything more: at last came a
rumbling of little cartwheels, and the sound of a good many voices all
talking together: she made out the words: “Where’s the other
ladder?—Why, I hadn’t to bring but one; Bill’s got the other—Bill!
fetch it here, lad!—Here, put ’em up at this corner—No, tie ’em
together first—they don’t reach half high enough yet—Oh! they’ll do
well enough; don’t be particular—Here, Bill! catch hold of this
rope—Will the roof bear?—Mind that loose slate—Oh, it’s coming down!
Heads below!” (a loud crash)—“Now, who did that?—It was Bill, I
fancy—Who’s to go down the chimney?—Nay, _I_ shan’t! _You_ do
it!—_That_ I won’t, then!—Bill’s to go down—Here, Bill! the master says
you’re to go down the chimney!”

“Oh! So Bill’s got to come down the chimney, has he?” said Alice to
herself. “Why, they seem to put everything upon Bill! I wouldn’t be in
Bill’s place for a good deal: this fireplace is narrow, to be sure; but
I _think_ I can kick a little!”

She drew her foot as far down the chimney as she could, and waited till
she heard a little animal (she couldn’t guess of what sort it was)
scratching and scrambling about in the chimney close above her: then,
saying to herself “This is Bill,” she gave one sharp kick, and waited
to see what would happen next.

The first thing she heard was a general chorus of “There goes Bill!”
then the Rabbit’s voice alone—“Catch him, you by the hedge!” then
silence, and then another confusion of voices—“Hold up his head—Brandy
now—Don’t choke him—How was it, old fellow? What happened to you? Tell
us all about it!”

Last came a little feeble, squeaking voice, (“That’s Bill,” thought
Alice,) “Well, I hardly know—No more, thank ye; I’m better now—but I’m
a deal too flustered to tell you—all I know is, something comes at me
like a Jack-in-the-box, and up I goes like a sky-rocket!”

“So you did, old fellow!” said the others.

“We must burn the house down!” said the Rabbit’s voice; and Alice
called out as loud as she could, “If you do, I’ll set Dinah at you!”

There was a dead silence instantly, and Alice thought to herself, “I
wonder what they _will_ do next! If they had any sense, they’d take the
roof off.” After a minute or two, they began moving about again, and
Alice heard the Rabbit say, “A barrowful will do, to begin with.”

“A barrowful of _what?_” thought Alice; but she had not long to doubt,
for the next moment a shower of little pebbles came rattling in at the
window, and some of them hit her in the face. “I’ll put a stop to
this,” she said to herself, and shouted out, “You’d better not do that
again!” which produced another dead silence.

Alice noticed with some surprise that the pebbles were all turning into
little cakes as they lay on the floor, and a bright idea came into her
head. “If I eat one of these cakes,” she thought, “it’s sure to make
_some_ change in my size; and as it can’t possibly make me larger, it
must make me smaller, I suppose.”

So she swallowed one of the cakes, and was delighted to find that she
began shrinking directly. As soon as she was small enough to get
through the door, she ran out of the house, and found quite a crowd of
little animals and birds waiting outside. The poor little Lizard, Bill,
was in the middle, being held up by two guinea-pigs, who were giving it
something out of a bottle. They all made a rush at Alice the moment she
appeared; but she ran off as hard as she could, and soon found herself
safe in a thick wood.

“The first thing I’ve got to do,” said Alice to herself, as she
wandered about in the wood, “is to grow to my right size again; and the
second thing is to find my way into that lovely garden. I think that
will be the best plan.”

It sounded an excellent plan, no doubt, and very neatly and simply
arranged; the only difficulty was, that she had not the smallest idea
how to set about it; and while she was peering about anxiously among
the trees, a little sharp bark just over her head made her look up in a
great hurry.

An enormous puppy was looking down at her with large round eyes, and
feebly stretching out one paw, trying to touch her. “Poor little
thing!” said Alice, in a coaxing tone, and she tried hard to whistle to
it; but she was terribly frightened all the time at the thought that it
might be hungry, in which case it would be very likely to eat her up in
spite of all her coaxing.

Hardly knowing what she did, she picked up a little bit of stick, and
held it out to the puppy; whereupon the puppy jumped into the air off
all its feet at once, with a yelp of delight, and rushed at the stick,
and made believe to worry it; then Alice dodged behind a great thistle,
to keep herself from being run over; and the moment she appeared on the
other side, the puppy made another rush at the stick, and tumbled head
over heels in its hurry to get hold of it; then Alice, thinking it was
very like having a game of play with a cart-horse, and expecting every
moment to be trampled under its feet, ran round the thistle again; then
the puppy began a series of short charges at the stick, running a very
little way forwards each time and a long way back, and barking hoarsely
all the while, till at last it sat down a good way off, panting, with
its tongue hanging out of its mouth, and its great eyes half shut.

This seemed to Alice a good opportunity for making her escape; so she
set off at once, and ran till she was quite tired and out of breath,
and till the puppy’s bark sounded quite faint in the distance.

“And yet what a dear little puppy it was!” said Alice, as she leant
against a buttercup to rest herself, and fanned herself with one of the
leaves: “I should have liked teaching it tricks very much, if—if I’d
only been the right size to do it! Oh dear! I’d nearly forgotten that
I’ve got to grow up again! Let me see—how _is_ it to be managed? I
suppose I ought to eat or drink something or other; but the great
question is, what?”

The great question certainly was, what? Alice looked all round her at
the flowers and the blades of grass, but she did not see anything that
looked like the right thing to eat or drink under the circumstances.
There was a large mushroom growing near her, about the same height as
herself; and when she had looked under it, and on both sides of it, and
behind it, it occurred to her that she might as well look and see what
was on the top of it.

She stretched herself up on tiptoe, and peeped over the edge of the
mushroom, and her eyes immediately met those of a large blue
caterpillar, that was sitting on the top with its arms folded, quietly
smoking a long hookah, and taking not the smallest notice of her or of
anything else.


CHAPTER V.
Advice from a Caterpillar


The Caterpillar and Alice looked at each other for some time in
silence: at last the Caterpillar took the hookah out of its mouth, and
addressed her in a languid, sleepy voice.

“Who are _you?_” said the Caterpillar.

This was not an encouraging opening for a conversation. Alice replied,
rather shyly, “I—I hardly know, sir, just at present—at least I know
who I _was_ when I got up this morning, but I think I must have been
changed several times since then.”

“What do you mean by that?” said the Caterpillar sternly. “Explain
yourself!”

“I can’t explain _myself_, I’m afraid, sir,” said Alice, “because I’m
not myself, you see.”

“I don’t see,” said the Caterpillar.

“I’m afraid I can’t put it more clearly,” Alice replied very politely,
“for I can’t understand it myself to begin with; and being so many
different sizes in a day is very confusing.”

“It isn’t,” said the Caterpillar.

“Well, perhaps you haven’t found it so yet,” said Alice; “but when you
have to turn into a chrysalis—you will some day, you know—and then
after that into a butterfly, I should think you’ll feel it a little
queer, won’t you?”

“Not a bit,” said the Caterpillar.

“Well, perhaps your feelings may be different,” said Alice; “all I know
is, it would feel very queer to _me_.”

“You!” said the Caterpillar contemptuously. “Who are _you?_”

Which brought them back again to the beginning of the conversation.
Alice felt a little irritated at the Caterpillar’s making such _very_
short remarks, and she drew herself up and said, very gravely, “I
think, you ought to tell me who _you_ are, first.”

“Why?” said the Caterpillar.

Here was another puzzling question; and as Alice could not think of any
good reason, and as the Caterpillar seemed to be in a _very_ unpleasant
state of mind, she turned away.

“Come back!” the Caterpillar called after her. “I’ve something
important to say!”

This sounded promising, certainly: Alice turned and came back again.

“Keep your temper,” said the Caterpillar.

“Is that all?” said Alice, swallowing down her anger as well as she
could.

“No,” said the Caterpillar.

Alice thought she might as well wait, as she had nothing else to do,
and perhaps after all it might tell her something worth hearing. For
some minutes it puffed away without speaking, but at last it unfolded
its arms, took the hookah out of its mouth again, and said, “So you
think you’re changed, do you?”

“I’m afraid I am, sir,” said Alice; “I can’t remember things as I
used—and I don’t keep the same size for ten minutes together!”

“Can’t remember _what_ things?” said the Caterpillar.

“Well, I’ve tried to say ‘How doth the little busy bee,’ but it all
came different!” Alice replied in a very melancholy voice.

“Repeat, ‘_You are old, Father William_,’” said the Caterpillar.

Alice folded her hands, and began:—

“You are old, Father William,” the young man said,
    “And your hair has become very white;
And yet you incessantly stand on your head—
    Do you think, at your age, it is right?”

“In my youth,” Father William replied to his son,
    “I feared it might injure the brain;
But, now that I’m perfectly sure I have none,
    Why, I do it again and again.”

“You are old,” said the youth, “as I mentioned before,
    And have grown most uncommonly fat;
Yet you turned a back-somersault in at the door—
    Pray, what is the reason of that?”

“In my youth,” said the sage, as he shook his grey locks,
    “I kept all my limbs very supple
By the use of this ointment—one shilling the box—
    Allow me to sell you a couple?”

“You are old,” said the youth, “and your jaws are too weak
    For anything tougher than suet;
Yet you finished the goose, with the bones and the beak—
    Pray, how did you manage to do it?”

“In my youth,” said his father, “I took to the law,
    And argued each case with my wife;
And the muscular strength, which it gave to my jaw,
    Has lasted the rest of my life.”

“You are old,” said the youth, “one would hardly suppose
    That your eye was as steady as ever;
Yet you balanced an eel on the end of your nose—
    What made you so awfully clever?”

“I have answered three questions, and that is enough,”
    Said his father; “don’t give yourself airs!
Do you think I can listen all day to such stuff?
    Be off, or I’ll kick you down stairs!”


“That is not said right,” said the Caterpillar.

“Not _quite_ right, I’m afraid,” said Alice, timidly; “some of the
words have got altered.”

“It is wrong from beginning to end,” said the Caterpillar decidedly,
and there was silence for some minutes.

The Caterpillar was the first to speak.

“What size do you want to be?” it asked.

“Oh, I’m not particular as to size,” Alice hastily replied; “only one
doesn’t like changing so often, you know.”

“I _don’t_ know,” said the Caterpillar.

Alice said nothing: she had never been so much contradicted in her life
before, and she felt that she was losing her temper.

“Are you content now?” said the Caterpillar.

“Well, I should like to be a _little_ larger, sir, if you wouldn’t
mind,” said Alice: “three inches is such a wretched height to be.”

“It is a very good height indeed!” said the Caterpillar angrily,
rearing itself upright as it spoke (it was exactly three inches high).

“But I’m not used to it!” pleaded poor Alice in a piteous tone. And she
thought to herself, “I wish the creatures wouldn’t be so easily
offended!”

“You’ll get used to it in time,” said the Caterpillar; and it put the
hookah into its mouth and began smoking again.

This time Alice waited patiently until it chose to speak again. In a
minute or two the Caterpillar took the hookah out of its mouth and
yawned once or twice, and shook itself. Then it got down off the
mushroom, and crawled away in the grass, merely remarking as it went,
“One side will make you grow taller, and the other side will make you
grow shorter.”

“One side of _what?_ The other side of _what?_” thought Alice to
herself.

“Of the mushroom,” said the Caterpillar, just as if she had asked it
aloud; and in another moment it was out of sight.

Alice remained looking thoughtfully at the mushroom for a minute,
trying to make out which were the two sides of it; and as it was
perfectly round, she found this a very difficult question. However, at
last she stretched her arms round it as far as they would go, and broke
off a bit of the edge with each hand.

“And now which is which?” she said to herself, and nibbled a little of
the right-hand bit to try the effect: the next moment she felt a
violent blow underneath her chin: it had struck her foot!

She was a good deal frightened by this very sudden change, but she felt
that there was no time to be lost, as she was shrinking rapidly; so she
set to work at once to eat some of the other bit. Her chin was pressed
so closely against her foot, that there was hardly room to open her
mouth; but she did it at last, and managed to swallow a morsel of the
left-hand bit.

*      *      *      *      *      *      *

    *      *      *      *      *      *

*      *      *      *      *      *      *


“Come, my head’s free at last!” said Alice in a tone of delight, which
changed into alarm in another moment, when she found that her shoulders
were nowhere to be found: all she could see, when she looked down, was
an immense length of neck, which seemed to rise like a stalk out of a
sea of green leaves that lay far below her.

“What _can_ all that green stuff be?” said Alice. “And where _have_ my
shoulders got to? And oh, my poor hands, how is it I can’t see you?”
She was moving them about as she spoke, but no result seemed to follow,
except a little shaking among the distant green leaves.

As there seemed to be no chance of getting her hands up to her head,
she tried to get her head down to them, and was delighted to find that
her neck would bend about easily in any direction, like a serpent. She
had just succeeded in curving it down into a graceful zigzag, and was
going to dive in among the leaves, which she found to be nothing but
the tops of the trees under which she had been wandering, when a sharp
hiss made her draw back in a hurry: a large pigeon had flown into her
face, and was beating her violently with its wings.

“Serpent!” screamed the Pigeon.

“I’m _not_ a serpent!” said Alice indignantly. “Let me alone!”

“Serpent, I say again!” repeated the Pigeon, but in a more subdued
tone, and added with a kind of sob, “I’ve tried every way, and nothing
seems to suit them!”

“I haven’t the least idea what you’re talking about,” said Alice.

“I’ve tried the roots of trees, and I’ve tried banks, and I’ve tried
hedges,” the Pigeon went on, without attending to her; “but those
serpents! There’s no pleasing them!”

Alice was more and more puzzled, but she thought there was no use in
saying anything more till the Pigeon had finished.

“As if it wasn’t trouble enough hatching the eggs,” said the Pigeon;
“but I must be on the look-out for serpents night and day! Why, I
haven’t had a wink of sleep these three weeks!”

“I’m very sorry you’ve been annoyed,” said Alice, who was beginning to
see its meaning.

“And just as I’d taken the highest tree in the wood,” continued the
Pigeon, raising its voice to a shriek, “and just as I was thinking I
should be free of them at last, they must needs come wriggling down
from the sky! Ugh, Serpent!”

“But I’m _not_ a serpent, I tell you!” said Alice. “I’m a—I’m a—”

“Well! _What_ are you?” said the Pigeon. “I can see you’re trying to
invent something!”

“I—I’m a little girl,” said Alice, rather doubtfully, as she remembered
the number of changes she had gone through that day.

“A likely story indeed!” said the Pigeon in a tone of the deepest
contempt. “I’ve seen a good many little girls in my time, but never
_one_ with such a neck as that! No, no! You’re a serpent; and there’s
no use denying it. I suppose you’ll be telling me next that you never
tasted an egg!”

“I _have_ tasted eggs, certainly,” said Alice, who was a very truthful
child; “but little girls eat eggs quite as much as serpents do, you
know.”

“I don’t believe it,” said the Pigeon; “but if they do, why then
they’re a kind of serpent, that’s all I can say.”

This was such a new idea to Alice, that she was quite silent for a
minute or two, which gave the Pigeon the opportunity of adding, “You’re
looking for eggs, I know _that_ well enough; and what does it matter to
me whether you’re a little girl or a serpent?”

“It matters a good deal to _me_,” said Alice hastily; “but I’m not
looking for eggs, as it happens; and if I was, I shouldn’t want
_yours_: I don’t like them raw.”

“Well, be off, then!” said the Pigeon in a sulky tone, as it settled
down again into its nest. Alice crouched down among the trees as well
as she could, for her neck kept getting entangled among the branches,
and every now and then she had to stop and untwist it. After a while
she remembered that she still held the pieces of mushroom in her hands,
and she set to work very carefully, nibbling first at one and then at
the other, and growing sometimes taller and sometimes shorter, until
she had succeeded in bringing herself down to her usual height.

It was so long since she had been anything near the right size, that it
felt quite strange at first; but she got used to it in a few minutes,
and began talking to herself, as usual. “Come, there’s half my plan
done now! How puzzling all these changes are! I’m never sure what I’m
going to be, from one minute to another! However, I’ve got back to my
right size: the next thing is, to get into that beautiful garden—how
_is_ that to be done, I wonder?” As she said this, she came suddenly
upon an open place, with a little house in it about four feet high.
“Whoever lives there,” thought Alice, “it’ll never do to come upon them
_this_ size: why, I should frighten them out of their wits!” So she
began nibbling at the right-hand bit again, and did not venture to go
near the house till she had brought herself down to nine inches high.


CHAPTER VI.
Pig and Pepper


For a minute or two she stood looking at the house, and wondering what
to do next, when suddenly a footman in livery came running out of the
wood—(she considered him to be a footman because he was in livery:
otherwise, judging by his face only, she would have called him a
fish)—and rapped loudly at the door with his knuckles. It was opened by
another footman in livery, with a round face, and large eyes like a
frog; and both footmen, Alice noticed, had powdered hair that curled
all over their heads. She felt very curious to know what it was all
about, and crept a little way out of the wood to listen.

The Fish-Footman began by producing from under his arm a great letter,
nearly as large as himself, and this he handed over to the other,
saying, in a solemn tone, “For the Duchess. An invitation from the
Queen to play croquet.” The Frog-Footman repeated, in the same solemn
tone, only changing the order of the words a little, “From the Queen.
An invitation for the Duchess to play croquet.”

Then they both bowed low, and their curls got entangled together.

Alice laughed so much at this, that she had to run back into the wood
for fear of their hearing her; and when she next peeped out the
Fish-Footman was gone, and the other was sitting on the ground near the
door, staring stupidly up into the sky.

Alice went timidly up to the door, and knocked.

“There’s no sort of use in knocking,” said the Footman, “and that for
two reasons. First, because I’m on the same side of the door as you
are; secondly, because they’re making such a noise inside, no one could
possibly hear you.” And certainly there _was_ a most extraordinary
noise going on within—a constant howling and sneezing, and every now
and then a great crash, as if a dish or kettle had been broken to
pieces.

“Please, then,” said Alice, “how am I to get in?”

“There might be some sense in your knocking,” the Footman went on
without attending to her, “if we had the door between us. For instance,
if you were _inside_, you might knock, and I could let you out, you
know.” He was looking up into the sky all the time he was speaking, and
this Alice thought decidedly uncivil. “But perhaps he can’t help it,”
she said to herself; “his eyes are so _very_ nearly at the top of his
head. But at any rate he might answer questions.—How am I to get in?”
she repeated, aloud.

“I shall sit here,” the Footman remarked, “till tomorrow—”

At this moment the door of the house opened, and a large plate came
skimming out, straight at the Footman’s head: it just grazed his nose,
and broke to pieces against one of the trees behind him.

“—or next day, maybe,” the Footman continued in the same tone, exactly
as if nothing had happened.

“How am I to get in?” asked Alice again, in a louder tone.

“_Are_ you to get in at all?” said the Footman. “That’s the first
question, you know.”

It was, no doubt: only Alice did not like to be told so. “It’s really
dreadful,” she muttered to herself, “the way all the creatures argue.
It’s enough to drive one crazy!”

The Footman seemed to think this a good opportunity for repeating his
remark, with variations. “I shall sit here,” he said, “on and off, for
days and days.”

“But what am _I_ to do?” said Alice.

“Anything you like,” said the Footman, and began whistling.

“Oh, there’s no use in talking to him,” said Alice desperately: “he’s
perfectly idiotic!” And she opened the door and went in.

The door led right into a large kitchen, which was full of smoke from
one end to the other: the Duchess was sitting on a three-legged stool
in the middle, nursing a baby; the cook was leaning over the fire,
stirring a large cauldron which seemed to be full of soup.

“There’s certainly too much pepper in that soup!” Alice said to
herself, as well as she could for sneezing.

There was certainly too much of it in the air. Even the Duchess sneezed
occasionally; and as for the baby, it was sneezing and howling
alternately without a moment’s pause. The only things in the kitchen
that did not sneeze, were the cook, and a large cat which was sitting
on the hearth and grinning from ear to ear.

“Please would you tell me,” said Alice, a little timidly, for she was
not quite sure whether it was good manners for her to speak first, “why
your cat grins like that?”

“It’s a Cheshire cat,” said the Duchess, “and that’s why. Pig!”

She said the last word with such sudden violence that Alice quite
jumped; but she saw in another moment that it was addressed to the
baby, and not to her, so she took courage, and went on again:—

“I didn’t know that Cheshire cats always grinned; in fact, I didn’t
know that cats _could_ grin.”

“They all can,” said the Duchess; “and most of ’em do.”

“I don’t know of any that do,” Alice said very politely, feeling quite
pleased to have got into a conversation.

“You don’t know much,” said the Duchess; “and that’s a fact.”

Alice did not at all like the tone of this remark, and thought it would
be as well to introduce some other subject of conversation. While she
was trying to fix on one, the cook took the cauldron of soup off the
fire, and at once set to work throwing everything within her reach at
the Duchess and the baby—the fire-irons came first; then followed a
shower of saucepans, plates, and dishes. The Duchess took no notice of
them even when they hit her; and the baby was howling so much already,
that it was quite impossible to say whether the blows hurt it or not.

“Oh, _please_ mind what you’re doing!” cried Alice, jumping up and down
in an agony of terror. “Oh, there goes his _precious_ nose!” as an
unusually large saucepan flew close by it, and very nearly carried it
off.

“If everybody minded their own business,” the Duchess said in a hoarse
growl, “the world would go round a deal faster than it does.”

“Which would _not_ be an advantage,” said Alice, who felt very glad to
get an opportunity of showing off a little of her knowledge. “Just
think of what work it would make with the day and night! You see the
earth takes twenty-four hours to turn round on its axis—”

“Talking of axes,” said the Duchess, “chop off her head!”

Alice glanced rather anxiously at the cook, to see if she meant to take
the hint; but the cook was busily stirring the soup, and seemed not to
be listening, so she went on again: “Twenty-four hours, I _think_; or
is it twelve? I—”

“Oh, don’t bother _me_,” said the Duchess; “I never could abide
figures!” And with that she began nursing her child again, singing a
sort of lullaby to it as she did so, and giving it a violent shake at
the end of every line:

“Speak roughly to your little boy,
    And beat him when he sneezes:
He only does it to annoy,
    Because he knows it teases.”


CHORUS.
(In which the cook and the baby joined):


“Wow! wow! wow!”


While the Duchess sang the second verse of the song, she kept tossing
the baby violently up and down, and the poor little thing howled so,
that Alice could hardly hear the words:—

“I speak severely to my boy,
    I beat him when he sneezes;
For he can thoroughly enjoy
    The pepper when he pleases!”


CHORUS.


“Wow! wow! wow!”


“Here! you may nurse it a bit, if you like!” the Duchess said to Alice,
flinging the baby at her as she spoke. “I must go and get ready to play
croquet with the Queen,” and she hurried out of the room. The cook
threw a frying-pan after her as she went out, but it just missed her.

Alice caught the baby with some difficulty, as it was a queer-shaped
little creature, and held out its arms and legs in all directions,
“just like a star-fish,” thought Alice. The poor little thing was
snorting like a steam-engine when she caught it, and kept doubling
itself up and straightening itself out again, so that altogether, for
the first minute or two, it was as much as she could do to hold it.

As soon as she had made out the proper way of nursing it, (which was to
twist it up into a sort of knot, and then keep tight hold of its right
ear and left foot, so as to prevent its undoing itself,) she carried it
out into the open air. “If I don’t take this child away with me,”
thought Alice, “they’re sure to kill it in a day or two: wouldn’t it be
murder to leave it behind?” She said the last words out loud, and the
little thing grunted in reply (it had left off sneezing by this time).
“Don’t grunt,” said Alice; “that’s not at all a proper way of
expressing yourself.”

The baby grunted again, and Alice looked very anxiously into its face
to see what was the matter with it. There could be no doubt that it had
a _very_ turn-up nose, much more like a snout than a real nose; also
its eyes were getting extremely small for a baby: altogether Alice did
not like the look of the thing at all. “But perhaps it was only
sobbing,” she thought, and looked into its eyes again, to see if there
were any tears.

No, there were no tears. “If you’re going to turn into a pig, my dear,”
said Alice, seriously, “I’ll have nothing more to do with you. Mind
now!” The poor little thing sobbed again (or grunted, it was impossible
to say which), and they went on for some while in silence.

Alice was just beginning to think to herself, “Now, what am I to do
with this creature when I get it home?” when it grunted again, so
violently, that she looked down into its face in some alarm. This time
there could be _no_ mistake about it: it was neither more nor less than
a pig, and she felt that it would be quite absurd for her to carry it
further.

So she set the little creature down, and felt quite relieved to see it
trot away quietly into the wood. “If it had grown up,” she said to
herself, “it would have made a dreadfully ugly child: but it makes
rather a handsome pig, I think.” And she began thinking over other
children she knew, who might do very well as pigs, and was just saying
to herself, “if one only knew the right way to change them—” when she
was a little startled by seeing the Cheshire Cat sitting on a bough of
a tree a few yards off.

The Cat only grinned when it saw Alice. It looked good-natured, she
thought: still it had _very_ long claws and a great many teeth, so she
felt that it ought to be treated with respect.

“Cheshire Puss,” she began, rather timidly, as she did not at all know
whether it would like the name: however, it only grinned a little
wider. “Come, it’s pleased so far,” thought Alice, and she went on.
“Would you tell me, please, which way I ought to go from here?”

“That depends a good deal on where you want to get to,” said the Cat.

“I don’t much care where—” said Alice.

“Then it doesn’t matter which way you go,” said the Cat.

“—so long as I get _somewhere_,” Alice added as an explanation.

“Oh, you’re sure to do that,” said the Cat, “if you only walk long
enough.”

Alice felt that this could not be denied, so she tried another
question. “What sort of people live about here?”

“In _that_ direction,” the Cat said, waving its right paw round, “lives
a Hatter: and in _that_ direction,” waving the other paw, “lives a
March Hare. Visit either you like: they’re both mad.”

“But I don’t want to go among mad people,” Alice remarked.

“Oh, you can’t help that,” said the Cat: “we’re all mad here. I’m mad.
You’re mad.”

“How do you know I’m mad?” said Alice.

“You must be,” said the Cat, “or you wouldn’t have come here.”

Alice didn’t think that proved it at all; however, she went on “And how
do you know that you’re mad?”

“To begin with,” said the Cat, “a dog’s not mad. You grant that?”

“I suppose so,” said Alice.

“Well, then,” the Cat went on, “you see, a dog growls when it’s angry,
and wags its tail when it’s pleased. Now _I_ growl when I’m pleased,
and wag my tail when I’m angry. Therefore I’m mad.”

“_I_ call it purring, not growling,” said Alice.

“Call it what you like,” said the Cat. “Do you play croquet with the
Queen to-day?”

“I should like it very much,” said Alice, “but I haven’t been invited
yet.”

“You’ll see me there,” said the Cat, and vanished.

Alice was not much surprised at this, she was getting so used to queer
things happening. While she was looking at the place where it had been,
it suddenly appeared again.

“By-the-bye, what became of the baby?” said the Cat. “I’d nearly
forgotten to ask.”

“It turned into a pig,” Alice quietly said, just as if it had come back
in a natural way.

“I thought it would,” said the Cat, and vanished again.

Alice waited a little, half expecting to see it again, but it did not
appear, and after a minute or two she walked on in the direction in
which the March Hare was said to live. “I’ve seen hatters before,” she
said to herself; “the March Hare will be much the most interesting, and
perhaps as this is May it won’t be raving mad—at least not so mad as it
was in March.” As she said this, she looked up, and there was the Cat
again, sitting on a branch of a tree.

“Did you say pig, or fig?” said the Cat.

“I said pig,” replied Alice; “and I wish you wouldn’t keep appearing
and vanishing so suddenly: you make one quite giddy.”

“All right,” said the Cat; and this time it vanished quite slowly,
beginning with the end of the tail, and ending with the grin, which
remained some time after the rest of it had gone.

“Well! I’ve often seen a cat without a grin,” thought Alice; “but a
grin without a cat! It’s the most curious thing I ever saw in my life!”

She had not gone much farther before she came in sight of the house of
the March Hare: she thought it must be the right house, because the
chimneys were shaped like ears and the roof was thatched with fur. It
was so large a house, that she did not like to go nearer till she had
nibbled some more of the left-hand bit of mushroom, and raised herself
to about two feet high: even then she walked up towards it rather
timidly, saying to herself “Suppose it should be raving mad after all!
I almost wish I’d gone to see the Hatter instead!”


CHAPTER VII.
A Mad Tea-Party


There was a table set out under a tree in front of the house, and the
March Hare and the Hatter were having tea at it: a Dormouse was sitting
between them, fast asleep, and the other two were using it as a
cushion, resting their elbows on it, and talking over its head. “Very
uncomfortable for the Dormouse,” thought Alice; “only, as it’s asleep,
I suppose it doesn’t mind.”

The table was a large one, but the three were all crowded together at
one corner of it: “No room! No room!” they cried out when they saw
Alice coming. “There’s _plenty_ of room!” said Alice indignantly, and
she sat down in a large arm-chair at one end of the table.

“Have some wine,” the March Hare said in an encouraging tone.

Alice looked all round the table, but there was nothing on it but tea.
“I don’t see any wine,” she remarked.

“There isn’t any,” said the March Hare.

“Then it wasn’t very civil of you to offer it,” said Alice angrily.

“It wasn’t very civil of you to sit down without being invited,” said
the March Hare.

“I didn’t know it was _your_ table,” said Alice; “it’s laid for a great
many more than three.”

“Your hair wants cutting,” said the Hatter. He had been looking at
Alice for some time with great curiosity, and this was his first
speech.

“You should learn not to make personal remarks,” Alice said with some
severity; “it’s very rude.”

The Hatter opened his eyes very wide on hearing this; but all he _said_
was, “Why is a raven like a writing-desk?”

“Come, we shall have some fun now!” thought Alice. “I’m glad they’ve
begun asking riddles.—I believe I can guess that,” she added aloud.

“Do you mean that you think you can find out the answer to it?” said
the March Hare.

“Exactly so,” said Alice.

“Then you should say what you mean,” the March Hare went on.

“I do,” Alice hastily replied; “at least—at least I mean what I
say—that’s the same thing, you know.”

“Not the same thing a bit!” said the Hatter. “You might just as well
say that ‘I see what I eat’ is the same thing as ‘I eat what I see’!”

“You might just as well say,” added the March Hare, “that ‘I like what
I get’ is the same thing as ‘I get what I like’!”

“You might just as well say,” added the Dormouse, who seemed to be
talking in his sleep, “that ‘I breathe when I sleep’ is the same thing
as ‘I sleep when I breathe’!”

“It _is_ the same thing with you,” said the Hatter, and here the
conversation dropped, and the party sat silent for a minute, while
Alice thought over all she could remember about ravens and
writing-desks, which wasn’t much.

The Hatter was the first to break the silence. “What day of the month
is it?” he said, turning to Alice: he had taken his watch out of his
pocket, and was looking at it uneasily, shaking it every now and then,
and holding it to his ear.

Alice considered a little, and then said “The fourth.”

“Two days wrong!” sighed the Hatter. “I told you butter wouldn’t suit
the works!” he added looking angrily at the March Hare.

“It was the _best_ butter,” the March Hare meekly replied.

“Yes, but some crumbs must have got in as well,” the Hatter grumbled:
“you shouldn’t have put it in with the bread-knife.”

The March Hare took the watch and looked at it gloomily: then he dipped
it into his cup of tea, and looked at it again: but he could think of
nothing better to say than his first remark, “It was the _best_ butter,
you know.”

Alice had been looking over his shoulder with some curiosity. “What a
funny watch!” she remarked. “It tells the day of the month, and doesn’t
tell what o’clock it is!”

“Why should it?” muttered the Hatter. “Does _your_ watch tell you what
year it is?”

“Of course not,” Alice replied very readily: “but that’s because it
stays the same year for such a long time together.”

“Which is just the case with _mine_,” said the Hatter.

Alice felt dreadfully puzzled. The Hatter’s remark seemed to have no
sort of meaning in it, and yet it was certainly English. “I don’t quite
understand you,” she said, as politely as she could.

“The Dormouse is asleep again,” said the Hatter, and he poured a little
hot tea upon its nose.

The Dormouse shook its head impatiently, and said, without opening its
eyes, “Of course, of course; just what I was going to remark myself.”

“Have you guessed the riddle yet?” the Hatter said, turning to Alice
again.

“No, I give it up,” Alice replied: “what’s the answer?”

“I haven’t the slightest idea,” said the Hatter.

“Nor I,” said the March Hare.

Alice sighed wearily. “I think you might do something better with the
time,” she said, “than waste it in asking riddles that have no
answers.”

“If you knew Time as well as I do,” said the Hatter, “you wouldn’t talk
about wasting _it_. It’s _him_.”

“I don’t know what you mean,” said Alice.

“Of course you don’t!” the Hatter said, tossing his head
contemptuously. “I dare say you never even spoke to Time!”

“Perhaps not,” Alice cautiously replied: “but I know I have to beat
time when I learn music.”

“Ah! that accounts for it,” said the Hatter. “He won’t stand beating.
Now, if you only kept on good terms with him, he’d do almost anything
you liked with the clock. For instance, suppose it were nine o’clock in
the morning, just time to begin lessons: you’d only have to whisper a
hint to Time, and round goes the clock in a twinkling! Half-past one,
time for dinner!”

(“I only wish it was,” the March Hare said to itself in a whisper.)

“That would be grand, certainly,” said Alice thoughtfully: “but then—I
shouldn’t be hungry for it, you know.”

“Not at first, perhaps,” said the Hatter: “but you could keep it to
half-past one as long as you liked.”

“Is that the way _you_ manage?” Alice asked.

The Hatter shook his head mournfully. “Not I!” he replied. “We
quarrelled last March—just before _he_ went mad, you know—” (pointing
with his tea spoon at the March Hare,) “—it was at the great concert
given by the Queen of Hearts, and I had to sing

‘Twinkle, twinkle, little bat!
How I wonder what you’re at!’


You know the song, perhaps?”

“I’ve heard something like it,” said Alice.

“It goes on, you know,” the Hatter continued, “in this way:—

‘Up above the world you fly,
Like a tea-tray in the sky.
                    Twinkle, twinkle—’”


Here the Dormouse shook itself, and began singing in its sleep
“_Twinkle, twinkle, twinkle, twinkle_—” and went on so long that they
had to pinch it to make it stop.

“Well, I’d hardly finished the first verse,” said the Hatter, “when the
Queen jumped up and bawled out, ‘He’s murdering the time! Off with his
head!’”

“How dreadfully savage!” exclaimed Alice.

“And ever since that,” the Hatter went on in a mournful tone, “he won’t
do a thing I ask! It’s always six o’clock now.”

A bright idea came into Alice’s head. “Is that the reason so many
tea-things are put out here?” she asked.

“Yes, that’s it,” said the Hatter with a sigh: “it’s always tea-time,
and we’ve no time to wash the things between whiles.”

“Then you keep moving round, I suppose?” said Alice.

“Exactly so,” said the Hatter: “as the things get used up.”

“But what happens when you come to the beginning again?” Alice ventured
to ask.

“Suppose we change the subject,” the March Hare interrupted, yawning.
“I’m getting tired of this. I vote the young lady tells us a story.”

“I’m afraid I don’t know one,” said Alice, rather alarmed at the
proposal.

“Then the Dormouse shall!” they both cried. “Wake up, Dormouse!” And
they pinched it on both sides at once.

The Dormouse slowly opened his eyes. “I wasn’t asleep,” he said in a
hoarse, feeble voice: “I heard every word you fellows were saying.”

“Tell us a story!” said the March Hare.

“Yes, please do!” pleaded Alice.

“And be quick about it,” added the Hatter, “or you’ll be asleep again
before it’s done.”

“Once upon a time there were three little sisters,” the Dormouse began
in a great hurry; “and their names were Elsie, Lacie, and Tillie; and
they lived at the bottom of a well—”

“What did they live on?” said Alice, who always took a great interest
in questions of eating and drinking.

“They lived on treacle,” said the Dormouse, after thinking a minute or
two.

“They couldn’t have done that, you know,” Alice gently remarked;
“they’d have been ill.”

“So they were,” said the Dormouse; “_very_ ill.”

Alice tried to fancy to herself what such an extraordinary way of
living would be like, but it puzzled her too much, so she went on: “But
why did they live at the bottom of a well?”

“Take some more tea,” the March Hare said to Alice, very earnestly.

“I’ve had nothing yet,” Alice replied in an offended tone, “so I can’t
take more.”

“You mean you can’t take _less_,” said the Hatter: “it’s very easy to
take _more_ than nothing.”

“Nobody asked _your_ opinion,” said Alice.

“Who’s making personal remarks now?” the Hatter asked triumphantly.

Alice did not quite know what to say to this: so she helped herself to
some tea and bread-and-butter, and then turned to the Dormouse, and
repeated her question. “Why did they live at the bottom of a well?”

The Dormouse again took a minute or two to think about it, and then
said, “It was a treacle-well.”

“There’s no such thing!” Alice was beginning very angrily, but the
Hatter and the March Hare went “Sh! sh!” and the Dormouse sulkily
remarked, “If you can’t be civil, you’d better finish the story for
yourself.”

“No, please go on!” Alice said very humbly; “I won’t interrupt again. I
dare say there may be _one_.”

“One, indeed!” said the Dormouse indignantly. However, he consented to
go on. “And so these three little sisters—they were learning to draw,
you know—”

“What did they draw?” said Alice, quite forgetting her promise.

“Treacle,” said the Dormouse, without considering at all this time.

“I want a clean cup,” interrupted the Hatter: “let’s all move one place
on.”

He moved on as he spoke, and the Dormouse followed him: the March Hare
moved into the Dormouse’s place, and Alice rather unwillingly took the
place of the March Hare. The Hatter was the only one who got any
advantage from the change: and Alice was a good deal worse off than
before, as the March Hare had just upset the milk-jug into his plate.

Alice did not wish to offend the Dormouse again, so she began very
cautiously: “But I don’t understand. Where did they draw the treacle
from?”

“You can draw water out of a water-well,” said the Hatter; “so I should
think you could draw treacle out of a treacle-well—eh, stupid?”

“But they were _in_ the well,” Alice said to the Dormouse, not choosing
to notice this last remark.

“Of course they were,” said the Dormouse; “—well in.”

This answer so confused poor Alice, that she let the Dormouse go on for
some time without interrupting it.

“They were learning to draw,” the Dormouse went on, yawning and rubbing
its eyes, for it was getting very sleepy; “and they drew all manner of
things—everything that begins with an M—”

“Why with an M?” said Alice.

“Why not?” said the March Hare.

Alice was silent.

The Dormouse had closed its eyes by this time, and was going off into a
doze; but, on being pinched by the Hatter, it woke up again with a
little shriek, and went on: “—that begins with an M, such as
mouse-traps, and the moon, and memory, and muchness—you know you say
things are ‘much of a muchness’—did you ever see such a thing as a
drawing of a muchness?”

“Really, now you ask me,” said Alice, very much confused, “I don’t
think—”

“Then you shouldn’t talk,” said the Hatter.

This piece of rudeness was more than Alice could bear: she got up in
great disgust, and walked off; the Dormouse fell asleep instantly, and
neither of the others took the least notice of her going, though she
looked back once or twice, half hoping that they would call after her:
the last time she saw them, they were trying to put the Dormouse into
the teapot.

“At any rate I’ll never go _there_ again!” said Alice as she picked her
way through the wood. “It’s the stupidest tea-party I ever was at in
all my life!”

Just as she said this, she noticed that one of the trees had a door
leading right into it. “That’s very curious!” she thought. “But
everything’s curious today. I think I may as well go in at once.” And
in she went.

Once more she found herself in the long hall, and close to the little
glass table. “Now, I’ll manage better this time,” she said to herself,
and began by taking the little golden key, and unlocking the door that
led into the garden. Then she went to work nibbling at the mushroom
(she had kept a piece of it in her pocket) till she was about a foot
high: then she walked down the little passage: and _then_—she found
herself at last in the beautiful garden, among the bright flower-beds
and the cool fountains.


CHAPTER VIII.
The Queen’s Croquet-Ground


A large rose-tree stood near the entrance of the garden: the roses
growing on it were white, but there were three gardeners at it, busily
painting them red. Alice thought this a very curious thing, and she
went nearer to watch them, and just as she came up to them she heard
one of them say, “Look out now, Five! Don’t go splashing paint over me
like that!”

“I couldn’t help it,” said Five, in a sulky tone; “Seven jogged my
elbow.”

On which Seven looked up and said, “That’s right, Five! Always lay the
blame on others!”

“_You’d_ better not talk!” said Five. “I heard the Queen say only
yesterday you deserved to be beheaded!”

“What for?” said the one who had spoken first.

“That’s none of _your_ business, Two!” said Seven.

“Yes, it _is_ his business!” said Five, “and I’ll tell him—it was for
bringing the cook tulip-roots instead of onions.”

Seven flung down his brush, and had just begun “Well, of all the unjust
things—” when his eye chanced to fall upon Alice, as she stood watching
them, and he checked himself suddenly: the others looked round also,
and all of them bowed low.

“Would you tell me,” said Alice, a little timidly, “why you are
painting those roses?”

Five and Seven said nothing, but looked at Two. Two began in a low
voice, “Why the fact is, you see, Miss, this here ought to have been a
_red_ rose-tree, and we put a white one in by mistake; and if the Queen
was to find it out, we should all have our heads cut off, you know. So
you see, Miss, we’re doing our best, afore she comes, to—” At this
moment Five, who had been anxiously looking across the garden, called
out “The Queen! The Queen!” and the three gardeners instantly threw
themselves flat upon their faces. There was a sound of many footsteps,
and Alice looked round, eager to see the Queen.

First came ten soldiers carrying clubs; these were all shaped like the
three gardeners, oblong and flat, with their hands and feet at the
corners: next the ten courtiers; these were ornamented all over with
diamonds, and walked two and two, as the soldiers did. After these came
the royal children; there were ten of them, and the little dears came
jumping merrily along hand in hand, in couples: they were all
ornamented with hearts. Next came the guests, mostly Kings and Queens,
and among them Alice recognised the White Rabbit: it was talking in a
hurried nervous manner, smiling at everything that was said, and went
by without noticing her. Then followed the Knave of Hearts, carrying
the King’s crown on a crimson velvet cushion; and, last of all this
grand procession, came THE KING AND QUEEN OF HEARTS.

Alice was rather doubtful whether she ought not to lie down on her face
like the three gardeners, but she could not remember ever having heard
of such a rule at processions; “and besides, what would be the use of a
procession,” thought she, “if people had all to lie down upon their
faces, so that they couldn’t see it?” So she stood still where she was,
and waited.

When the procession came opposite to Alice, they all stopped and looked
at her, and the Queen said severely “Who is this?” She said it to the
Knave of Hearts, who only bowed and smiled in reply.

“Idiot!” said the Queen, tossing her head impatiently; and, turning to
Alice, she went on, “What’s your name, child?”

“My name is Alice, so please your Majesty,” said Alice very politely;
but she added, to herself, “Why, they’re only a pack of cards, after
all. I needn’t be afraid of them!”

“And who are _these?_” said the Queen, pointing to the three gardeners
who were lying round the rose-tree; for, you see, as they were lying on
their faces, and the pattern on their backs was the same as the rest of
the pack, she could not tell whether they were gardeners, or soldiers,
or courtiers, or three of her own children.

“How should _I_ know?” said Alice, surprised at her own courage. “It’s
no business of _mine_.”

The Queen turned crimson with fury, and, after glaring at her for a
moment like a wild beast, screamed “Off with her head! Off—”

“Nonsense!” said Alice, very loudly and decidedly, and the Queen was
silent.

The King laid his hand upon her arm, and timidly said “Consider, my
dear: she is only a child!”

The Queen turned angrily away from him, and said to the Knave “Turn
them over!”

The Knave did so, very carefully, with one foot.

“Get up!” said the Queen, in a shrill, loud voice, and the three
gardeners instantly jumped up, and began bowing to the King, the Queen,
the royal children, and everybody else.

“Leave off that!” screamed the Queen. “You make me giddy.” And then,
turning to the rose-tree, she went on, “What _have_ you been doing
here?”

“May it please your Majesty,” said Two, in a very humble tone, going
down on one knee as he spoke, “we were trying—”

“_I_ see!” said the Queen, who had meanwhile been examining the roses.
“Off with their heads!” and the procession moved on, three of the
soldiers remaining behind to execute the unfortunate gardeners, who ran
to Alice for protection.

“You shan’t be beheaded!” said Alice, and she put them into a large
flower-pot that stood near. The three soldiers wandered about for a
minute or two, looking for them, and then quietly marched off after the
others.

“Are their heads off?” shouted the Queen.

“Their heads are gone, if it please your Majesty!” the soldiers shouted
in reply.

“That’s right!” shouted the Queen. “Can you play croquet?”

The soldiers were silent, and looked at Alice, as the question was
evidently meant for her.

“Yes!” shouted Alice.

“Come on, then!” roared the Queen, and Alice joined the procession,
wondering very much what would happen next.

“It’s—it’s a very fine day!” said a timid voice at her side. She was
walking by the White Rabbit, who was peeping anxiously into her face.

“Very,” said Alice: “—where’s the Duchess?”

“Hush! Hush!” said the Rabbit in a low, hurried tone. He looked
anxiously over his shoulder as he spoke, and then raised himself upon
tiptoe, put his mouth close to her ear, and whispered “She’s under
sentence of execution.”

“What for?” said Alice.

“Did you say ‘What a pity!’?” the Rabbit asked.

“No, I didn’t,” said Alice: “I don’t think it’s at all a pity. I said
‘What for?’”

“She boxed the Queen’s ears—” the Rabbit began. Alice gave a little
scream of laughter. “Oh, hush!” the Rabbit whispered in a frightened
tone. “The Queen will hear you! You see, she came rather late, and the
Queen said—”

“Get to your places!” shouted the Queen in a voice of thunder, and
people began running about in all directions, tumbling up against each
other; however, they got settled down in a minute or two, and the game
began. Alice thought she had never seen such a curious croquet-ground
in her life; it was all ridges and furrows; the balls were live
hedgehogs, the mallets live flamingoes, and the soldiers had to double
themselves up and to stand on their hands and feet, to make the arches.

The chief difficulty Alice found at first was in managing her flamingo:
she succeeded in getting its body tucked away, comfortably enough,
under her arm, with its legs hanging down, but generally, just as she
had got its neck nicely straightened out, and was going to give the
hedgehog a blow with its head, it _would_ twist itself round and look
up in her face, with such a puzzled expression that she could not help
bursting out laughing: and when she had got its head down, and was
going to begin again, it was very provoking to find that the hedgehog
had unrolled itself, and was in the act of crawling away: besides all
this, there was generally a ridge or furrow in the way wherever she
wanted to send the hedgehog to, and, as the doubled-up soldiers were
always getting up and walking off to other parts of the ground, Alice
soon came to the conclusion that it was a very difficult game indeed.

The players all played at once without waiting for turns, quarrelling
all the while, and fighting for the hedgehogs; and in a very short time
the Queen was in a furious passion, and went stamping about, and
shouting “Off with his head!” or “Off with her head!” about once in a
minute.

Alice began to feel very uneasy: to be sure, she had not as yet had any
dispute with the Queen, but she knew that it might happen any minute,
“and then,” thought she, “what would become of me? They’re dreadfully
fond of beheading people here; the great wonder is, that there’s any
one left alive!”

She was looking about for some way of escape, and wondering whether she
could get away without being seen, when she noticed a curious
appearance in the air: it puzzled her very much at first, but, after
watching it a minute or two, she made it out to be a grin, and she said
to herself “It’s the Cheshire Cat: now I shall have somebody to talk
to.”

“How are you getting on?” said the Cat, as soon as there was mouth
enough for it to speak with.

Alice waited till the eyes appeared, and then nodded. “It’s no use
speaking to it,” she thought, “till its ears have come, or at least one
of them.” In another minute the whole head appeared, and then Alice put
down her flamingo, and began an account of the game, feeling very glad
she had someone to listen to her. The Cat seemed to think that there
was enough of it now in sight, and no more of it appeared.

“I don’t think they play at all fairly,” Alice began, in rather a
complaining tone, “and they all quarrel so dreadfully one can’t hear
oneself speak—and they don’t seem to have any rules in particular; at
least, if there are, nobody attends to them—and you’ve no idea how
confusing it is all the things being alive; for instance, there’s the
arch I’ve got to go through next walking about at the other end of the
ground—and I should have croqueted the Queen’s hedgehog just now, only
it ran away when it saw mine coming!”

“How do you like the Queen?” said the Cat in a low voice.

“Not at all,” said Alice: “she’s so extremely—” Just then she noticed
that the Queen was close behind her, listening: so she went on,
“—likely to win, that it’s hardly worth while finishing the game.”

The Queen smiled and passed on.

“Who _are_ you talking to?” said the King, going up to Alice, and
looking at the Cat’s head with great curiosity.

“It’s a friend of mine—a Cheshire Cat,” said Alice: “allow me to
introduce it.”

“I don’t like the look of it at all,” said the King: “however, it may
kiss my hand if it likes.”

“I’d rather not,” the Cat remarked.

“Don’t be impertinent,” said the King, “and don’t look at me like
that!” He got behind Alice as he spoke.

“A cat may look at a king,” said Alice. “I’ve read that in some book,
but I don’t remember where.”

“Well, it must be removed,” said the King very decidedly, and he called
the Queen, who was passing at the moment, “My dear! I wish you would
have this cat removed!”

The Queen had only one way of settling all difficulties, great or
small. “Off with his head!” she said, without even looking round.

“I’ll fetch the executioner myself,” said the King eagerly, and he
hurried off.

Alice thought she might as well go back, and see how the game was going
on, as she heard the Queen’s voice in the distance, screaming with
passion. She had already heard her sentence three of the players to be
executed for having missed their turns, and she did not like the look
of things at all, as the game was in such confusion that she never knew
whether it was her turn or not. So she went in search of her hedgehog.

The hedgehog was engaged in a fight with another hedgehog, which seemed
to Alice an excellent opportunity for croqueting one of them with the
other: the only difficulty was, that her flamingo was gone across to
the other side of the garden, where Alice could see it trying in a
helpless sort of way to fly up into a tree.

By the time she had caught the flamingo and brought it back, the fight
was over, and both the hedgehogs were out of sight: “but it doesn’t
matter much,” thought Alice, “as all the arches are gone from this side
of the ground.” So she tucked it away under her arm, that it might not
escape again, and went back for a little more conversation with her
friend.

When she got back to the Cheshire Cat, she was surprised to find quite
a large crowd collected round it: there was a dispute going on between
the executioner, the King, and the Queen, who were all talking at once,
while all the rest were quite silent, and looked very uncomfortable.

The moment Alice appeared, she was appealed to by all three to settle
the question, and they repeated their arguments to her, though, as they
all spoke at once, she found it very hard indeed to make out exactly
what they said.

The executioner’s argument was, that you couldn’t cut off a head unless
there was a body to cut it off from: that he had never had to do such a
thing before, and he wasn’t going to begin at _his_ time of life.

The King’s argument was, that anything that had a head could be
beheaded, and that you weren’t to talk nonsense.

The Queen’s argument was, that if something wasn’t done about it in
less than no time she’d have everybody executed, all round. (It was
this last remark that had made the whole party look so grave and
anxious.)

Alice could think of nothing else to say but “It belongs to the
Duchess: you’d better ask _her_ about it.”

“She’s in prison,” the Queen said to the executioner: “fetch her here.”
And the executioner went off like an arrow.

The Cat’s head began fading away the moment he was gone, and, by the
time he had come back with the Duchess, it had entirely disappeared; so
the King and the executioner ran wildly up and down looking for it,
while the rest of the party went back to the game.


CHAPTER IX.
The Mock Turtle’s Story


“You can’t think how glad I am to see you again, you dear old thing!”
said the Duchess, as she tucked her arm affectionately into Alice’s,
and they walked off together.

Alice was very glad to find her in such a pleasant temper, and thought
to herself that perhaps it was only the pepper that had made her so
savage when they met in the kitchen.

“When _I’m_ a Duchess,” she said to herself, (not in a very hopeful
tone though), “I won’t have any pepper in my kitchen _at all_. Soup
does very well without—Maybe it’s always pepper that makes people
hot-tempered,” she went on, very much pleased at having found out a new
kind of rule, “and vinegar that makes them sour—and camomile that makes
them bitter—and—and barley-sugar and such things that make children
sweet-tempered. I only wish people knew _that_: then they wouldn’t be
so stingy about it, you know—”

She had quite forgotten the Duchess by this time, and was a little
startled when she heard her voice close to her ear. “You’re thinking
about something, my dear, and that makes you forget to talk. I can’t
tell you just now what the moral of that is, but I shall remember it in
a bit.”

“Perhaps it hasn’t one,” Alice ventured to remark.

“Tut, tut, child!” said the Duchess. “Everything’s got a moral, if only
you can find it.” And she squeezed herself up closer to Alice’s side as
she spoke.

Alice did not much like keeping so close to her: first, because the
Duchess was _very_ ugly; and secondly, because she was exactly the
right height to rest her chin upon Alice’s shoulder, and it was an
uncomfortably sharp chin. However, she did not like to be rude, so she
bore it as well as she could.

“The game’s going on rather better now,” she said, by way of keeping up
the conversation a little.

“’Tis so,” said the Duchess: “and the moral of that is—‘Oh, ’tis love,
’tis love, that makes the world go round!’”

“Somebody said,” Alice whispered, “that it’s done by everybody minding
their own business!”

“Ah, well! It means much the same thing,” said the Duchess, digging her
sharp little chin into Alice’s shoulder as she added, “and the moral of
_that_ is—‘Take care of the sense, and the sounds will take care of
themselves.’”

“How fond she is of finding morals in things!” Alice thought to
herself.

“I dare say you’re wondering why I don’t put my arm round your waist,”
the Duchess said after a pause: “the reason is, that I’m doubtful about
the temper of your flamingo. Shall I try the experiment?”

“He might bite,” Alice cautiously replied, not feeling at all anxious
to have the experiment tried.

“Very true,” said the Duchess: “flamingoes and mustard both bite. And
the moral of that is—‘Birds of a feather flock together.’”

“Only mustard isn’t a bird,” Alice remarked.

“Right, as usual,” said the Duchess: “what a clear way you have of
putting things!”

“It’s a mineral, I _think_,” said Alice.

“Of course it is,” said the Duchess, who seemed ready to agree to
everything that Alice said; “there’s a large mustard-mine near here.
And the moral of that is—‘The more there is of mine, the less there is
of yours.’”

“Oh, I know!” exclaimed Alice, who had not attended to this last
remark, “it’s a vegetable. It doesn’t look like one, but it is.”

“I quite agree with you,” said the Duchess; “and the moral of that
is—‘Be what you would seem to be’—or if you’d like it put more
simply—‘Never imagine yourself not to be otherwise than what it might
appear to others that what you were or might have been was not
otherwise than what you had been would have appeared to them to be
otherwise.’”

“I think I should understand that better,” Alice said very politely,
“if I had it written down: but I can’t quite follow it as you say it.”

“That’s nothing to what I could say if I chose,” the Duchess replied,
in a pleased tone.

“Pray don’t trouble yourself to say it any longer than that,” said
Alice.

“Oh, don’t talk about trouble!” said the Duchess. “I make you a present
of everything I’ve said as yet.”

“A cheap sort of present!” thought Alice. “I’m glad they don’t give
birthday presents like that!” But she did not venture to say it out
loud.

“Thinking again?” the Duchess asked, with another dig of her sharp
little chin.

“I’ve a right to think,” said Alice sharply, for she was beginning to
feel a little worried.

“Just about as much right,” said the Duchess, “as pigs have to fly; and
the m—”

But here, to Alice’s great surprise, the Duchess’s voice died away,
even in the middle of her favourite word ‘moral,’ and the arm that was
linked into hers began to tremble. Alice looked up, and there stood the
Queen in front of them, with her arms folded, frowning like a
thunderstorm.

“A fine day, your Majesty!” the Duchess began in a low, weak voice.

“Now, I give you fair warning,” shouted the Queen, stamping on the
ground as she spoke; “either you or your head must be off, and that in
about half no time! Take your choice!”

The Duchess took her choice, and was gone in a moment.

“Let’s go on with the game,” the Queen said to Alice; and Alice was too
much frightened to say a word, but slowly followed her back to the
croquet-ground.

The other guests had taken advantage of the Queen’s absence, and were
resting in the shade: however, the moment they saw her, they hurried
back to the game, the Queen merely remarking that a moment’s delay
would cost them their lives.

All the time they were playing the Queen never left off quarrelling
with the other players, and shouting “Off with his head!” or “Off with
her head!” Those whom she sentenced were taken into custody by the
soldiers, who of course had to leave off being arches to do this, so
that by the end of half an hour or so there were no arches left, and
all the players, except the King, the Queen, and Alice, were in custody
and under sentence of execution.

Then the Queen left off, quite out of breath, and said to Alice, “Have
you seen the Mock Turtle yet?”

“No,” said Alice. “I don’t even know what a Mock Turtle is.”

“It’s the thing Mock Turtle Soup is made from,” said the Queen.

“I never saw one, or heard of one,” said Alice.

“Come on, then,” said the Queen, “and he shall tell you his history.”

As they walked off together, Alice heard the King say in a low voice,
to the company generally, “You are all pardoned.” “Come, _that’s_ a
good thing!” she said to herself, for she had felt quite unhappy at the
number of executions the Queen had ordered.

They very soon came upon a Gryphon, lying fast asleep in the sun. (If
you don’t know what a Gryphon is, look at the picture.) “Up, lazy
thing!” said the Queen, “and take this young lady to see the Mock
Turtle, and to hear his history. I must go back and see after some
executions I have ordered;” and she walked off, leaving Alice alone
with the Gryphon. Alice did not quite like the look of the creature,
but on the whole she thought it would be quite as safe to stay with it
as to go after that savage Queen: so she waited.

The Gryphon sat up and rubbed its eyes: then it watched the Queen till
she was out of sight: then it chuckled. “What fun!” said the Gryphon,
half to itself, half to Alice.

“What _is_ the fun?” said Alice.

“Why, _she_,” said the Gryphon. “It’s all her fancy, that: they never
executes nobody, you know. Come on!”

“Everybody says ‘come on!’ here,” thought Alice, as she went slowly
after it: “I never was so ordered about in all my life, never!”

They had not gone far before they saw the Mock Turtle in the distance,
sitting sad and lonely on a little ledge of rock, and, as they came
nearer, Alice could hear him sighing as if his heart would break. She
pitied him deeply. “What is his sorrow?” she asked the Gryphon, and the
Gryphon answered, very nearly in the same words as before, “It’s all
his fancy, that: he hasn’t got no sorrow, you know. Come on!”

So they went up to the Mock Turtle, who looked at them with large eyes
full of tears, but said nothing.

“This here young lady,” said the Gryphon, “she wants for to know your
history, she do.”

“I’ll tell it her,” said the Mock Turtle in a deep, hollow tone: “sit
down, both of you, and don’t speak a word till I’ve finished.”

So they sat down, and nobody spoke for some minutes. Alice thought to
herself, “I don’t see how he can _ever_ finish, if he doesn’t begin.”
But she waited patiently.

“Once,” said the Mock Turtle at last, with a deep sigh, “I was a real
Turtle.”

These words were followed by a very long silence, broken only by an
occasional exclamation of “Hjckrrh!” from the Gryphon, and the constant
heavy sobbing of the Mock Turtle. Alice was very nearly getting up and
saying, “Thank you, sir, for your interesting story,” but she could not
help thinking there _must_ be more to come, so she sat still and said
nothing.

“When we were little,” the Mock Turtle went on at last, more calmly,
though still sobbing a little now and then, “we went to school in the
sea. The master was an old Turtle—we used to call him Tortoise—”

“Why did you call him Tortoise, if he wasn’t one?” Alice asked.

“We called him Tortoise because he taught us,” said the Mock Turtle
angrily: “really you are very dull!”

“You ought to be ashamed of yourself for asking such a simple
question,” added the Gryphon; and then they both sat silent and looked
at poor Alice, who felt ready to sink into the earth. At last the
Gryphon said to the Mock Turtle, “Drive on, old fellow! Don’t be all
day about it!” and he went on in these words:

“Yes, we went to school in the sea, though you mayn’t believe it—”

“I never said I didn’t!” interrupted Alice.

“You did,” said the Mock Turtle.

“Hold your tongue!” added the Gryphon, before Alice could speak again.
The Mock Turtle went on.

“We had the best of educations—in fact, we went to school every day—”

“_I’ve_ been to a day-school, too,” said Alice; “you needn’t be so
proud as all that.”

“With extras?” asked the Mock Turtle a little anxiously.

“Yes,” said Alice, “we learned French and music.”

“And washing?” said the Mock Turtle.

“Certainly not!” said Alice indignantly.

“Ah! then yours wasn’t a really good school,” said the Mock Turtle in a
tone of great relief. “Now at _ours_ they had at the end of the bill,
‘French, music, _and washing_—extra.’”

“You couldn’t have wanted it much,” said Alice; “living at the bottom
of the sea.”

“I couldn’t afford to learn it,” said the Mock Turtle with a sigh. “I
only took the regular course.”

“What was that?” inquired Alice.

“Reeling and Writhing, of course, to begin with,” the Mock Turtle
replied; “and then the different branches of Arithmetic—Ambition,
Distraction, Uglification, and Derision.”

“I never heard of ‘Uglification,’” Alice ventured to say. “What is it?”

The Gryphon lifted up both its paws in surprise. “What! Never heard of
uglifying!” it exclaimed. “You know what to beautify is, I suppose?”

“Yes,” said Alice doubtfully: “it means—to—make—anything—prettier.”

“Well, then,” the Gryphon went on, “if you don’t know what to uglify
is, you _are_ a simpleton.”

Alice did not feel encouraged to ask any more questions about it, so
she turned to the Mock Turtle, and said “What else had you to learn?”

“Well, there was Mystery,” the Mock Turtle replied, counting off the
subjects on his flappers, “—Mystery, ancient and modern, with
Seaography: then Drawling—the Drawling-master was an old conger-eel,
that used to come once a week: _he_ taught us Drawling, Stretching, and
Fainting in Coils.”

“What was _that_ like?” said Alice.

“Well, I can’t show it you myself,” the Mock Turtle said: “I’m too
stiff. And the Gryphon never learnt it.”

“Hadn’t time,” said the Gryphon: “I went to the Classics master,
though. He was an old crab, _he_ was.”

“I never went to him,” the Mock Turtle said with a sigh: “he taught
Laughing and Grief, they used to say.”

“So he did, so he did,” said the Gryphon, sighing in his turn; and both
creatures hid their faces in their paws.

“And how many hours a day did you do lessons?” said Alice, in a hurry
to change the subject.

“Ten hours the first day,” said the Mock Turtle: “nine the next, and so
on.”

“What a curious plan!” exclaimed Alice.

“That’s the reason they’re called lessons,” the Gryphon remarked:
“because they lessen from day to day.”

This was quite a new idea to Alice, and she thought it over a little
before she made her next remark. “Then the eleventh day must have been
a holiday?”

“Of course it was,” said the Mock Turtle.

“And how did you manage on the twelfth?” Alice went on eagerly.

“That’s enough about lessons,” the Gryphon interrupted in a very
decided tone: “tell her something about the games now.”


CHAPTER X.
The Lobster Quadrille


The Mock Turtle sighed deeply, and drew the back of one flapper across
his eyes. He looked at Alice, and tried to speak, but for a minute or
two sobs choked his voice. “Same as if he had a bone in his throat,”
said the Gryphon: and it set to work shaking him and punching him in
the back. At last the Mock Turtle recovered his voice, and, with tears
running down his cheeks, he went on again:—

“You may not have lived much under the sea—” (“I haven’t,” said
Alice)—“and perhaps you were never even introduced to a lobster—”
(Alice began to say “I once tasted—” but checked herself hastily, and
said “No, never”) “—so you can have no idea what a delightful thing a
Lobster Quadrille is!”

“No, indeed,” said Alice. “What sort of a dance is it?”

“Why,” said the Gryphon, “you first form into a line along the
sea-shore—”

“Two lines!” cried the Mock Turtle. “Seals, turtles, salmon, and so on;
then, when you’ve cleared all the jelly-fish out of the way—”

“_That_ generally takes some time,” interrupted the Gryphon.

“—you advance twice—”

“Each with a lobster as a partner!” cried the Gryphon.

“Of course,” the Mock Turtle said: “advance twice, set to partners—”

“—change lobsters, and retire in same order,” continued the Gryphon.

“Then, you know,” the Mock Turtle went on, “you throw the—”

“The lobsters!” shouted the Gryphon, with a bound into the air.

“—as far out to sea as you can—”

“Swim after them!” screamed the Gryphon.

“Turn a somersault in the sea!” cried the Mock Turtle, capering wildly
about.

“Change lobsters again!” yelled the Gryphon at the top of its voice.

“Back to land again, and that’s all the first figure,” said the Mock
Turtle, suddenly dropping his voice; and the two creatures, who had
been jumping about like mad things all this time, sat down again very
sadly and quietly, and looked at Alice.

“It must be a very pretty dance,” said Alice timidly.

“Would you like to see a little of it?” said the Mock Turtle.

“Very much indeed,” said Alice.

“Come, let’s try the first figure!” said the Mock Turtle to the
Gryphon. “We can do without lobsters, you know. Which shall sing?”

“Oh, _you_ sing,” said the Gryphon. “I’ve forgotten the words.”

So they began solemnly dancing round and round Alice, every now and
then treading on her toes when they passed too close, and waving their
forepaws to mark the time, while the Mock Turtle sang this, very slowly
and sadly:—

“Will you walk a little faster?” said a whiting to a snail.
“There’s a porpoise close behind us, and he’s treading on my tail.
See how eagerly the lobsters and the turtles all advance!
They are waiting on the shingle—will you come and join the dance?
Will you, won’t you, will you, won’t you, will you join the dance?
Will you, won’t you, will you, won’t you, won’t you join the dance?

“You can really have no notion how delightful it will be
When they take us up and throw us, with the lobsters, out to sea!”
But the snail replied “Too far, too far!” and gave a look askance—
Said he thanked the whiting kindly, but he would not join the dance.
Would not, could not, would not, could not, would not join the dance.
Would not, could not, would not, could not, could not join the dance.

“What matters it how far we go?” his scaly friend replied.
“There is another shore, you know, upon the other side.
The further off from England the nearer is to France—
Then turn not pale, beloved snail, but come and join the dance.
Will you, won’t you, will you, won’t you, will you join the dance?
Will you, won’t you, will you, won’t you, won’t you join the dance?”


“Thank you, it’s a very interesting dance to watch,” said Alice,
feeling very glad that it was over at last: “and I do so like that
curious song about the whiting!”

“Oh, as to the whiting,” said the Mock Turtle, “they—you’ve seen them,
of course?”

“Yes,” said Alice, “I’ve often seen them at dinn—” she checked herself
hastily.

“I don’t know where Dinn may be,” said the Mock Turtle, “but if you’ve
seen them so often, of course you know what they’re like.”

“I believe so,” Alice replied thoughtfully. “They have their tails in
their mouths—and they’re all over crumbs.”

“You’re wrong about the crumbs,” said the Mock Turtle: “crumbs would
all wash off in the sea. But they _have_ their tails in their mouths;
and the reason is—” here the Mock Turtle yawned and shut his
eyes.—“Tell her about the reason and all that,” he said to the Gryphon.

“The reason is,” said the Gryphon, “that they _would_ go with the
lobsters to the dance. So they got thrown out to sea. So they had to
fall a long way. So they got their tails fast in their mouths. So they
couldn’t get them out again. That’s all.”

“Thank you,” said Alice, “it’s very interesting. I never knew so much
about a whiting before.”

“I can tell you more than that, if you like,” said the Gryphon. “Do you
know why it’s called a whiting?”

“I never thought about it,” said Alice. “Why?”

“_It does the boots and shoes_,” the Gryphon replied very solemnly.

Alice was thoroughly puzzled. “Does the boots and shoes!” she repeated
in a wondering tone.

“Why, what are _your_ shoes done with?” said the Gryphon. “I mean, what
makes them so shiny?”

Alice looked down at them, and considered a little before she gave her
answer. “They’re done with blacking, I believe.”

“Boots and shoes under the sea,” the Gryphon went on in a deep voice,
“are done with a whiting. Now you know.”

“And what are they made of?” Alice asked in a tone of great curiosity.

“Soles and eels, of course,” the Gryphon replied rather impatiently:
“any shrimp could have told you that.”

“If I’d been the whiting,” said Alice, whose thoughts were still
running on the song, “I’d have said to the porpoise, ‘Keep back,
please: we don’t want _you_ with us!’”

“They were obliged to have him with them,” the Mock Turtle said: “no
wise fish would go anywhere without a porpoise.”

“Wouldn’t it really?” said Alice in a tone of great surprise.

“Of course not,” said the Mock Turtle: “why, if a fish came to _me_,
and told me he was going a journey, I should say ‘With what porpoise?’”

“Don’t you mean ‘purpose’?” said Alice.

“I mean what I say,” the Mock Turtle replied in an offended tone. And
the Gryphon added “Come, let’s hear some of _your_ adventures.”

“I could tell you my adventures—beginning from this morning,” said
Alice a little timidly: “but it’s no use going back to yesterday,
because I was a different person then.”

“Explain all that,” said the Mock Turtle.

“No, no! The adventures first,” said the Gryphon in an impatient tone:
“explanations take such a dreadful time.”

So Alice began telling them her adventures from the time when she first
saw the White Rabbit. She was a little nervous about it just at first,
the two creatures got so close to her, one on each side, and opened
their eyes and mouths so _very_ wide, but she gained courage as she
went on. Her listeners were perfectly quiet till she got to the part
about her repeating “_You are old, Father William_,” to the
Caterpillar, and the words all coming different, and then the Mock
Turtle drew a long breath, and said “That’s very curious.”

“It’s all about as curious as it can be,” said the Gryphon.

“It all came different!” the Mock Turtle repeated thoughtfully. “I
should like to hear her try and repeat something now. Tell her to
begin.” He looked at the Gryphon as if he thought it had some kind of
authority over Alice.

“Stand up and repeat ‘’_Tis the voice of the sluggard_,’” said the
Gryphon.

“How the creatures order one about, and make one repeat lessons!”
thought Alice; “I might as well be at school at once.” However, she got
up, and began to repeat it, but her head was so full of the Lobster
Quadrille, that she hardly knew what she was saying, and the words came
very queer indeed:—

“’Tis the voice of the Lobster; I heard him declare,
“You have baked me too brown, I must sugar my hair.”
As a duck with its eyelids, so he with his nose
Trims his belt and his buttons, and turns out his toes.”

[later editions continued as follows
When the sands are all dry, he is gay as a lark,
And will talk in contemptuous tones of the Shark,
But, when the tide rises and sharks are around,
His voice has a timid and tremulous sound.]


“That’s different from what _I_ used to say when I was a child,” said
the Gryphon.

“Well, I never heard it before,” said the Mock Turtle; “but it sounds
uncommon nonsense.”

Alice said nothing; she had sat down with her face in her hands,
wondering if anything would _ever_ happen in a natural way again.

“I should like to have it explained,” said the Mock Turtle.

“She can’t explain it,” said the Gryphon hastily. “Go on with the next
verse.”

“But about his toes?” the Mock Turtle persisted. “How _could_ he turn
them out with his nose, you know?”

“It’s the first position in dancing,” Alice said; but was dreadfully
puzzled by the whole thing, and longed to change the subject.

“Go on with the next verse,” the Gryphon repeated impatiently: “it
begins ‘_I passed by his garden_.’”

Alice did not dare to disobey, though she felt sure it would all come
wrong, and she went on in a trembling voice:—

“I passed by his garden, and marked, with one eye,
How the Owl and the Panther were sharing a pie—”

[later editions continued as follows
The Panther took pie-crust, and gravy, and meat,
While the Owl had the dish as its share of the treat.
When the pie was all finished, the Owl, as a boon,
Was kindly permitted to pocket the spoon:
While the Panther received knife and fork with a growl,
And concluded the banquet—]


“What _is_ the use of repeating all that stuff,” the Mock Turtle
interrupted, “if you don’t explain it as you go on? It’s by far the
most confusing thing _I_ ever heard!”

“Yes, I think you’d better leave off,” said the Gryphon: and Alice was
only too glad to do so.

“Shall we try another figure of the Lobster Quadrille?” the Gryphon
went on. “Or would you like the Mock Turtle to sing you a song?”

“Oh, a song, please, if the Mock Turtle would be so kind,” Alice
replied, so eagerly that the Gryphon said, in a rather offended tone,
“Hm! No accounting for tastes! Sing her ‘_Turtle Soup_,’ will you, old
fellow?”

The Mock Turtle sighed deeply, and began, in a voice sometimes choked
with sobs, to sing this:—

“Beautiful Soup, so rich and green,
Waiting in a hot tureen!
Who for such dainties would not stoop?
Soup of the evening, beautiful Soup!
Soup of the evening, beautiful Soup!
    Beau—ootiful Soo—oop!
    Beau—ootiful Soo—oop!
Soo—oop of the e—e—evening,
    Beautiful, beautiful Soup!

“Beautiful Soup! Who cares for fish,
Game, or any other dish?
Who would not give all else for two p
ennyworth only of beautiful Soup?
Pennyworth only of beautiful Soup?
    Beau—ootiful Soo—oop!
    Beau—ootiful Soo—oop!
Soo—oop of the e—e—evening,
    Beautiful, beauti—FUL SOUP!”


“Chorus again!” cried the Gryphon, and the Mock Turtle had just begun
to repeat it, when a cry of “The trial’s beginning!” was heard in the
distance.

“Come on!” cried the Gryphon, and, taking Alice by the hand, it hurried
off, without waiting for the end of the song.

“What trial is it?” Alice panted as she ran; but the Gryphon only
answered “Come on!” and ran the faster, while more and more faintly
came, carried on the breeze that followed them, the melancholy words:—

“Soo—oop of the e—e—evening,
    Beautiful, beautiful Soup!”


CHAPTER XI.
Who Stole the Tarts?


The King and Queen of Hearts were seated on their throne when they
arrived, with a great crowd assembled about them—all sorts of little
birds and beasts, as well as the whole pack of cards: the Knave was
standing before them, in chains, with a soldier on each side to guard
him; and near the King was the White Rabbit, with a trumpet in one
hand, and a scroll of parchment in the other. In the very middle of the
court was a table, with a large dish of tarts upon it: they looked so
good, that it made Alice quite hungry to look at them—“I wish they’d
get the trial done,” she thought, “and hand round the refreshments!”
But there seemed to be no chance of this, so she began looking at
everything about her, to pass away the time.

Alice had never been in a court of justice before, but she had read
about them in books, and she was quite pleased to find that she knew
the name of nearly everything there. “That’s the judge,” she said to
herself, “because of his great wig.”

The judge, by the way, was the King; and as he wore his crown over the
wig, (look at the frontispiece if you want to see how he did it,) he
did not look at all comfortable, and it was certainly not becoming.

“And that’s the jury-box,” thought Alice, “and those twelve creatures,”
(she was obliged to say “creatures,” you see, because some of them were
animals, and some were birds,) “I suppose they are the jurors.” She
said this last word two or three times over to herself, being rather
proud of it: for she thought, and rightly too, that very few little
girls of her age knew the meaning of it at all. However, “jury-men”
would have done just as well.

The twelve jurors were all writing very busily on slates. “What are
they doing?” Alice whispered to the Gryphon. “They can’t have anything
to put down yet, before the trial’s begun.”

“They’re putting down their names,” the Gryphon whispered in reply,
“for fear they should forget them before the end of the trial.”

“Stupid things!” Alice began in a loud, indignant voice, but she
stopped hastily, for the White Rabbit cried out, “Silence in the
court!” and the King put on his spectacles and looked anxiously round,
to make out who was talking.

Alice could see, as well as if she were looking over their shoulders,
that all the jurors were writing down “stupid things!” on their slates,
and she could even make out that one of them didn’t know how to spell
“stupid,” and that he had to ask his neighbour to tell him. “A nice
muddle their slates’ll be in before the trial’s over!” thought Alice.

One of the jurors had a pencil that squeaked. This of course, Alice
could _not_ stand, and she went round the court and got behind him, and
very soon found an opportunity of taking it away. She did it so quickly
that the poor little juror (it was Bill, the Lizard) could not make out
at all what had become of it; so, after hunting all about for it, he
was obliged to write with one finger for the rest of the day; and this
was of very little use, as it left no mark on the slate.

“Herald, read the accusation!” said the King.

On this the White Rabbit blew three blasts on the trumpet, and then
unrolled the parchment scroll, and read as follows:—

“The Queen of Hearts, she made some tarts,
    All on a summer day:
The Knave of Hearts, he stole those tarts,
    And took them quite away!”


“Consider your verdict,” the King said to the jury.

“Not yet, not yet!” the Rabbit hastily interrupted. “There’s a great
deal to come before that!”

“Call the first witness,” said the King; and the White Rabbit blew
three blasts on the trumpet, and called out, “First witness!”

The first witness was the Hatter. He came in with a teacup in one hand
and a piece of bread-and-butter in the other. “I beg pardon, your
Majesty,” he began, “for bringing these in: but I hadn’t quite finished
my tea when I was sent for.”

“You ought to have finished,” said the King. “When did you begin?”

The Hatter looked at the March Hare, who had followed him into the
court, arm-in-arm with the Dormouse. “Fourteenth of March, I _think_ it
was,” he said.

“Fifteenth,” said the March Hare.

“Sixteenth,” added the Dormouse.

“Write that down,” the King said to the jury, and the jury eagerly
wrote down all three dates on their slates, and then added them up, and
reduced the answer to shillings and pence.

“Take off your hat,” the King said to the Hatter.

“It isn’t mine,” said the Hatter.

“_Stolen!_” the King exclaimed, turning to the jury, who instantly made
a memorandum of the fact.

“I keep them to sell,” the Hatter added as an explanation; “I’ve none
of my own. I’m a hatter.”

Here the Queen put on her spectacles, and began staring at the Hatter,
who turned pale and fidgeted.

“Give your evidence,” said the King; “and don’t be nervous, or I’ll
have you executed on the spot.”

This did not seem to encourage the witness at all: he kept shifting
from one foot to the other, looking uneasily at the Queen, and in his
confusion he bit a large piece out of his teacup instead of the
bread-and-butter.

Just at this moment Alice felt a very curious sensation, which puzzled
her a good deal until she made out what it was: she was beginning to
grow larger again, and she thought at first she would get up and leave
the court; but on second thoughts she decided to remain where she was
as long as there was room for her.

“I wish you wouldn’t squeeze so,” said the Dormouse, who was sitting
next to her. “I can hardly breathe.”

“I can’t help it,” said Alice very meekly: “I’m growing.”

“You’ve no right to grow _here_,” said the Dormouse.

“Don’t talk nonsense,” said Alice more boldly: “you know you’re growing
too.”

“Yes, but _I_ grow at a reasonable pace,” said the Dormouse: “not in
that ridiculous fashion.” And he got up very sulkily and crossed over
to the other side of the court.

All this time the Queen had never left off staring at the Hatter, and,
just as the Dormouse crossed the court, she said to one of the officers
of the court, “Bring me the list of the singers in the last concert!”
on which the wretched Hatter trembled so, that he shook both his shoes
off.

“Give your evidence,” the King repeated angrily, “or I’ll have you
executed, whether you’re nervous or not.”

“I’m a poor man, your Majesty,” the Hatter began, in a trembling voice,
“—and I hadn’t begun my tea—not above a week or so—and what with the
bread-and-butter getting so thin—and the twinkling of the tea—”

“The twinkling of the _what?_” said the King.

“It _began_ with the tea,” the Hatter replied.

“Of course twinkling begins with a T!” said the King sharply. “Do you
take me for a dunce? Go on!”

“I’m a poor man,” the Hatter went on, “and most things twinkled after
that—only the March Hare said—”

“I didn’t!” the March Hare interrupted in a great hurry.

“You did!” said the Hatter.

“I deny it!” said the March Hare.

“He denies it,” said the King: “leave out that part.”

“Well, at any rate, the Dormouse said—” the Hatter went on, looking
anxiously round to see if he would deny it too: but the Dormouse denied
nothing, being fast asleep.

“After that,” continued the Hatter, “I cut some more bread-and-butter—”

“But what did the Dormouse say?” one of the jury asked.

“That I can’t remember,” said the Hatter.

“You _must_ remember,” remarked the King, “or I’ll have you executed.”

The miserable Hatter dropped his teacup and bread-and-butter, and went
down on one knee. “I’m a poor man, your Majesty,” he began.

“You’re a _very_ poor _speaker_,” said the King.

Here one of the guinea-pigs cheered, and was immediately suppressed by
the officers of the court. (As that is rather a hard word, I will just
explain to you how it was done. They had a large canvas bag, which tied
up at the mouth with strings: into this they slipped the guinea-pig,
head first, and then sat upon it.)

“I’m glad I’ve seen that done,” thought Alice. “I’ve so often read in
the newspapers, at the end of trials, ‘There was some attempts at
applause, which was immediately suppressed by the officers of the
court,’ and I never understood what it meant till now.”

“If that’s all you know about it, you may stand down,” continued the
King.

“I can’t go no lower,” said the Hatter: “I’m on the floor, as it is.”

“Then you may _sit_ down,” the King replied.

Here the other guinea-pig cheered, and was suppressed.

“Come, that finished the guinea-pigs!” thought Alice. “Now we shall get
on better.”

“I’d rather finish my tea,” said the Hatter, with an anxious look at
the Queen, who was reading the list of singers.

“You may go,” said the King, and the Hatter hurriedly left the court,
without even waiting to put his shoes on.

“—and just take his head off outside,” the Queen added to one of the
officers: but the Hatter was out of sight before the officer could get
to the door.

“Call the next witness!” said the King.

The next witness was the Duchess’s cook. She carried the pepper-box in
her hand, and Alice guessed who it was, even before she got into the
court, by the way the people near the door began sneezing all at once.

“Give your evidence,” said the King.

“Shan’t,” said the cook.

The King looked anxiously at the White Rabbit, who said in a low voice,
“Your Majesty must cross-examine _this_ witness.”

“Well, if I must, I must,” the King said, with a melancholy air, and,
after folding his arms and frowning at the cook till his eyes were
nearly out of sight, he said in a deep voice, “What are tarts made of?”

“Pepper, mostly,” said the cook.

“Treacle,” said a sleepy voice behind her.

“Collar that Dormouse,” the Queen shrieked out. “Behead that Dormouse!
Turn that Dormouse out of court! Suppress him! Pinch him! Off with his
whiskers!”

For some minutes the whole court was in confusion, getting the Dormouse
turned out, and, by the time they had settled down again, the cook had
disappeared.

“Never mind!” said the King, with an air of great relief. “Call the
next witness.” And he added in an undertone to the Queen, “Really, my
dear, _you_ must cross-examine the next witness. It quite makes my
forehead ache!”

Alice watched the White Rabbit as he fumbled over the list, feeling
very curious to see what the next witness would be like, “—for they
haven’t got much evidence _yet_,” she said to herself. Imagine her
surprise, when the White Rabbit read out, at the top of his shrill
little voice, the name “Alice!”


CHAPTER XII.
Alice’s Evidence


“Here!” cried Alice, quite forgetting in the flurry of the moment how
large she had grown in the last few minutes, and she jumped up in such
a hurry that she tipped over the jury-box with the edge of her skirt,
upsetting all the jurymen on to the heads of the crowd below, and there
they lay sprawling about, reminding her very much of a globe of
goldfish she had accidentally upset the week before.

“Oh, I _beg_ your pardon!” she exclaimed in a tone of great dismay, and
began picking them up again as quickly as she could, for the accident
of the goldfish kept running in her head, and she had a vague sort of
idea that they must be collected at once and put back into the
jury-box, or they would die.

“The trial cannot proceed,” said the King in a very grave voice, “until
all the jurymen are back in their proper places—_all_,” he repeated
with great emphasis, looking hard at Alice as he said so.

Alice looked at the jury-box, and saw that, in her haste, she had put
the Lizard in head downwards, and the poor little thing was waving its
tail about in a melancholy way, being quite unable to move. She soon
got it out again, and put it right; “not that it signifies much,” she
said to herself; “I should think it would be _quite_ as much use in the
trial one way up as the other.”

As soon as the jury had a little recovered from the shock of being
upset, and their slates and pencils had been found and handed back to
them, they set to work very diligently to write out a history of the
accident, all except the Lizard, who seemed too much overcome to do
anything but sit with its mouth open, gazing up into the roof of the
court.

“What do you know about this business?” the King said to Alice.

“Nothing,” said Alice.

“Nothing _whatever?_” persisted the King.

“Nothing whatever,” said Alice.

“That’s very important,” the King said, turning to the jury. They were
just beginning to write this down on their slates, when the White
Rabbit interrupted: “_Un_important, your Majesty means, of course,” he
said in a very respectful tone, but frowning and making faces at him as
he spoke.

“_Un_important, of course, I meant,” the King hastily said, and went on
to himself in an undertone, “important—unimportant—unimportant—important—”
as if he were trying which word sounded best.

Some of the jury wrote it down “important,” and some “unimportant.”
Alice could see this, as she was near enough to look over their slates;
“but it doesn’t matter a bit,” she thought to herself.

At this moment the King, who had been for some time busily writing in
his note-book, cackled out “Silence!” and read out from his book, “Rule
Forty-two. _All persons more than a mile high to leave the court_.”

Everybody looked at Alice.

“_I’m_ not a mile high,” said Alice.

“You are,” said the King.

“Nearly two miles high,” added the Queen.

“Well, I shan’t go, at any rate,” said Alice: “besides, that’s not a
regular rule: you invented it just now.”

“It’s the oldest rule in the book,” said the King.

“Then it ought to be Number One,” said Alice.

The King turned pale, and shut his note-book hastily. “Consider your
verdict,” he said to the jury, in a low, trembling voice.

“There’s more evidence to come yet, please your Majesty,” said the
White Rabbit, jumping up in a great hurry; “this paper has just been
picked up.”

“What’s in it?” said the Queen.

“I haven’t opened it yet,” said the White Rabbit, “but it seems to be a
letter, written by the prisoner to—to somebody.”

“It must have been that,” said the King, “unless it was written to
nobody, which isn’t usual, you know.”

“Who is it directed to?” said one of the jurymen.

“It isn’t directed at all,” said the White Rabbit; “in fact, there’s
nothing written on the _outside_.” He unfolded the paper as he spoke,
and added “It isn’t a letter, after all: it’s a set of verses.”

“Are they in the prisoner’s handwriting?” asked another of the jurymen.

“No, they’re not,” said the White Rabbit, “and that’s the queerest
thing about it.” (The jury all looked puzzled.)

“He must have imitated somebody else’s hand,” said the King. (The jury
all brightened up again.)

“Please your Majesty,” said the Knave, “I didn’t write it, and they
can’t prove I did: there’s no name signed at the end.”

“If you didn’t sign it,” said the King, “that only makes the matter
worse. You _must_ have meant some mischief, or else you’d have signed
your name like an honest man.”

There was a general clapping of hands at this: it was the first really
clever thing the King had said that day.

“That _proves_ his guilt,” said the Queen.

“It proves nothing of the sort!” said Alice. “Why, you don’t even know
what they’re about!”

“Read them,” said the King.

The White Rabbit put on his spectacles. “Where shall I begin, please
your Majesty?” he asked.

“Begin at the beginning,” the King said gravely, “and go on till you
come to the end: then stop.”

These were the verses the White Rabbit read:—

“They told me you had been to her,
    And mentioned me to him:
She gave me a good character,
    But said I could not swim.

He sent them word I had not gone
    (We know it to be true):
If she should push the matter on,
    What would become of you?

I gave her one, they gave him two,
    You gave us three or more;
They all returned from him to you,
    Though they were mine before.

If I or she should chance to be
    Involved in this affair,
He trusts to you to set them free,
    Exactly as we were.

My notion was that you had been
    (Before she had this fit)
An obstacle that came between
    Him, and ourselves, and it.

Don’t let him know she liked them best,
    For this must ever be
A secret, kept from all the rest,
    Between yourself and me.”


“That’s the most important piece of evidence we’ve heard yet,” said the
King, rubbing his hands; “so now let the jury—”

“If any one of them can explain it,” said Alice, (she had grown so
large in the last few minutes that she wasn’t a bit afraid of
interrupting him,) “I’ll give him sixpence. _I_ don’t believe there’s
an atom of meaning in it.”

The jury all wrote down on their slates, “_She_ doesn’t believe there’s
an atom of meaning in it,” but none of them attempted to explain the
paper.

“If there’s no meaning in it,” said the King, “that saves a world of
trouble, you know, as we needn’t try to find any. And yet I don’t
know,” he went on, spreading out the verses on his knee, and looking at
them with one eye; “I seem to see some meaning in them, after all.
‘—_said I could not swim_—’ you can’t swim, can you?” he added, turning
to the Knave.

The Knave shook his head sadly. “Do I look like it?” he said. (Which he
certainly did _not_, being made entirely of cardboard.)

“All right, so far,” said the King, and he went on muttering over the
verses to himself: “‘_We know it to be true_—’ that’s the jury, of
course—‘_I gave her one, they gave him two_—’ why, that must be what he
did with the tarts, you know—”

“But, it goes on ‘_they all returned from him to you_,’” said Alice.

“Why, there they are!” said the King triumphantly, pointing to the
tarts on the table. “Nothing can be clearer than _that_. Then
again—‘_before she had this fit_—’ you never had fits, my dear, I
think?” he said to the Queen.

“Never!” said the Queen furiously, throwing an inkstand at the Lizard
as she spoke. (The unfortunate little Bill had left off writing on his
slate with one finger, as he found it made no mark; but he now hastily
began again, using the ink, that was trickling down his face, as long
as it lasted.)

“Then the words don’t _fit_ you,” said the King, looking round the
court with a smile. There was a dead silence.

“It’s a pun!” the King added in an offended tone, and everybody
laughed. “Let the jury consider their verdict,” the King said, for
about the twentieth time that day.

“No, no!” said the Queen. “Sentence first—verdict afterwards.”

“Stuff and nonsense!” said Alice loudly. “The idea of having the
sentence first!”

“Hold your tongue!” said the Queen, turning purple.

“I won’t!” said Alice.

“Off with her head!” the Queen shouted at the top of her voice. Nobody
moved.

“Who cares for you?” said Alice, (she had grown to her full size by
this time.) “You’re nothing but a pack of cards!”

At this the whole pack rose up into the air, and came flying down upon
her: she gave a little scream, half of fright and half of anger, and
tried to beat them off, and found herself lying on the bank, with her
head in the lap of her sister, who was gently brushing away some dead
leaves that had fluttered down from the trees upon her face.

“Wake up, Alice dear!” said her sister; “Why, what a long sleep you’ve
had!”

“Oh, I’ve had such a curious dream!” said Alice, and she told her
sister, as well as she could remember them, all these strange
Adventures of hers that you have just been reading about; and when she
had finished, her sister kissed her, and said, “It _was_ a curious
dream, dear, certainly: but now run in to your tea; it’s getting late.”
So Alice got up and ran off, thinking while she ran, as well she might,
what a wonderful dream it had been.


But her sister sat still just as she left her, leaning her head on her
hand, watching the setting sun, and thinking of little Alice and all
her wonderful Adventures, till she too began dreaming after a fashion,
and this was her dream:—

First, she dreamed of little Alice herself, and once again the tiny
hands were clasped upon her knee, and the bright eager eyes were
looking up into hers—she could hear the very tones of her voice, and
see that queer little toss of her head to keep back the wandering hair
that _would_ always get into her eyes—and still as she listened, or
seemed to listen, the whole place around her became alive with the
strange creatures of her little sister’s dream.

The long grass rustled at her feet as the White Rabbit hurried by—the
frightened Mouse splashed his way through the neighbouring pool—she
could hear the rattle of the teacups as the March Hare and his friends
shared their never-ending meal, and the shrill voice of the Queen
ordering off her unfortunate guests to execution—once more the pig-baby
was sneezing on the Duchess’s knee, while plates and dishes crashed
around it—once more the shriek of the Gryphon, the squeaking of the
Lizard’s slate-pencil, and the choking of the suppressed guinea-pigs,
filled the air, mixed up with the distant sobs of the miserable Mock
Turtle.

So she sat on, with closed eyes, and half believed herself in
Wonderland, though she knew she had but to open them again, and all
would change to dull reality—the grass would be only rustling in the
wind, and the pool rippling to the waving of the reeds—the rattling
teacups would change to tinkling sheep-bells, and the Queen’s shrill
cries to the voice of the shepherd boy—and the sneeze of the baby, the
shriek of the Gryphon, and all the other queer noises, would change
(she knew) to the confused clamour of the busy farm-yard—while the
lowing of the cattle in the distance would take the place of the Mock
Turtle’s heavy sobs.

Lastly, she pictured to herself how this same little sister of hers
would, in the after-time, be herself a grown woman; and how she would
keep, through all her riper years, the simple and loving heart of her
childhood: and how she would gather about her other little children,
and make _their_ eyes bright and eager with many a strange tale,
perhaps even with the dream of Wonderland of long ago: and how she
would feel with all their simple sorrows, and find a pleasure in all
their simple joys, remembering her own child-life, and the happy summer
days.

THE END 


End of Project Gutenberg’s Alice’s Adventures in Wonderland, by Lewis Carroll

*** END OF THIS PROJECT GUTENBERG EBOOK ALICE’S ADVENTURES IN WONDERLAND ***

***** This file should be named 11-0.txt or 11-0.zip *****
This and all associated files of various formats will be found in:
        http://www.gutenberg.org/1/11/

Produced by Arthur DiBianca and David Widger

Updated editions will replace the previous one--the old editions will
be renamed.

Creating the works from print editions not protected by U.S. copyright
law means that no one owns a United States copyright in these works,
so the Foundation (and you!) can copy and distribute it in the United
States without permission and without paying copyright
royalties. Special rules, set forth in the General Terms of Use part
of this license, apply to copying and distributing Project
Gutenberg-tm electronic works to protect the PROJECT GUTENBERG-tm
concept and trademark. Project Gutenberg is a registered trademark,
and may not be used if you charge for the eBooks, unless you receive
specific permission. If you do not charge anything for copies of this
eBook, complying with the rules is very easy. You may use this eBook
for nearly any purpose such as creation of derivative works, reports,
performances and research. They may be modified and printed and given
away--you may do practically ANYTHING in the United States with eBooks
not protected by U.S. copyright law. Redistribution is subject to the
trademark license, especially commercial redistribution.

START: FULL LICENSE

THE FULL PROJECT GUTENBERG LICENSE
PLEASE READ THIS BEFORE YOU DISTRIBUTE OR USE THIS WORK

To protect the Project Gutenberg-tm mission of promoting the free
distribution of electronic works, by using or distributing this work
(or any other work associated in any way with the phrase "Project
Gutenberg"), you agree to comply with all the terms of the Full
Project Gutenberg-tm License available with this file or online at
www.gutenberg.org/license.

Section 1. General Terms of Use and Redistributing Project
Gutenberg-tm electronic works

1.A. By reading or using any part of this Project Gutenberg-tm
electronic work, you indicate that you have read, understand, agree to
and accept all the terms of this license and intellectual property
(trademark/copyright) agreement. If you do not agree to abide by all
the terms of this agreement, you must cease using and return or
destroy all copies of Project Gutenberg-tm electronic works in your
possession. If you paid a fee for obtaining a copy of or access to a
Project Gutenberg-tm electronic work and you do not agree to be bound
by the terms of this agreement, you may obtain a refund from the
person or entity to whom you paid the fee as set forth in paragraph
1.E.8.

1.B. "Project Gutenberg" is a registered trademark. It may only be
used on or associated in any way with an electronic work by people who
agree to be bound by the terms of this agreement. There are a few
things that you can do with most Project Gutenberg-tm electronic works
even without complying with the full terms of this agreement. See
paragraph 1.C below. There are a lot of things you can do with Project
Gutenberg-tm electronic works if you follow the terms of this
agreement and help preserve free future access to Project Gutenberg-tm
electronic works. See paragraph 1.E below.

1.C. The Project Gutenberg Literary Archive Foundation ("the
Foundation" or PGLAF), owns a compilation copyright in the collection
of Project Gutenberg-tm electronic works. Nearly all the individual
works in the collection are in the public domain in the United
States. If an individual work is unprotected by copyright law in the
United States and you are located in the United States, we do not
claim a right to prevent you from copying, distributing, performing,
displaying or creating derivative works based on the work as long as
all references to Project Gutenberg are removed. Of course, we hope
that you will support the Project Gutenberg-tm mission of promoting
free access to electronic works by freely sharing Project Gutenberg-tm
works in compliance with the terms of this agreement for keeping the
Project Gutenberg-tm name associated with the work. You can easily
comply with the terms of this agreement by keeping this work in the
same format with its attached full Project Gutenberg-tm License when
you share it without charge with others.

1.D. The copyright laws of the place where you are located also govern
what you can do with this work. Copyright laws in most countries are
in a constant state of change. If you are outside the United States,
check the laws of your country in addition to the terms of this
agreement before downloading, copying, displaying, performing,
distributing or creating derivative works based on this work or any
other Project Gutenberg-tm work. The Foundation makes no
representations concerning the copyright status of any work in any
country outside the United States.

1.E. Unless you have removed all references to Project Gutenberg:

1.E.1. The following sentence, with active links to, or other
immediate access to, the full Project Gutenberg-tm License must appear
prominently whenever any copy of a Project Gutenberg-tm work (any work
on which the phrase "Project Gutenberg" appears, or with which the
phrase "Project Gutenberg" is associated) is accessed, displayed,
performed, viewed, copied or distributed:

  This eBook is for the use of anyone anywhere in the United States and
  most other parts of the world at no cost and with almost no
  restrictions whatsoever. You may copy it, give it away or re-use it
  under the terms of the Project Gutenberg License included with this
  eBook or online at www.gutenberg.org. If you are not located in the
  United States, you'll have to check the laws of the country where you
  are located before using this ebook.

1.E.2. If an individual Project Gutenberg-tm electronic work is
derived from texts not protected by U.S. copyright law (does not
contain a notice indicating that it is posted with permission of the
copyright holder), the work can be copied and distributed to anyone in
the United States without paying any fees or charges. If you are
redistributing or providing access to a work with the phrase "Project
Gutenberg" associated with or appearing on the work, you must comply
either with the requirements of paragraphs 1.E.1 through 1.E.7 or
obtain permission for the use of the work and the Project Gutenberg-tm
trademark as set forth in paragraphs 1.E.8 or 1.E.9.

1.E.3. If an individual Project Gutenberg-tm electronic work is posted
with the permission of the copyright holder, your use and distribution
must comply with both paragraphs 1.E.1 through 1.E.7 and any
additional terms imposed by the copyright holder. Additional terms
will be linked to the Project Gutenberg-tm License for all works
posted with the permission of the copyright holder found at the
beginning of this work.

1.E.4. Do not unlink or detach or remove the full Project Gutenberg-tm
License terms from this work, or any files containing a part of this
work or any other work associated with Project Gutenberg-tm.

1.E.5. Do not copy, display, perform, distribute or redistribute this
electronic work, or any part of this electronic work, without
prominently displaying the sentence set forth in paragraph 1.E.1 with
active links or immediate access to the full terms of the Project
Gutenberg-tm License.

1.E.6. You may convert to and distribute this work in any binary,
compressed, marked up, nonproprietary or proprietary form, including
any word processing or hypertext form. However, if you provide access
to or distribute copies of a Project Gutenberg-tm work in a format
other than "Plain Vanilla ASCII" or other format used in the official
version posted on the official Project Gutenberg-tm web site
(www.gutenberg.org), you must, at no additional cost, fee or expense
to the user, provide a copy, a means of exporting a copy, or a means
of obtaining a copy upon request, of the work in its original "Plain
Vanilla ASCII" or other form. Any alternate format must include the
full Project Gutenberg-tm License as specified in paragraph 1.E.1.

1.E.7. Do not charge a fee for access to, viewing, displaying,
performing, copying or distributing any Project Gutenberg-tm works
unless you comply with paragraph 1.E.8 or 1.E.9.

1.E.8. You may charge a reasonable fee for copies of or providing
access to or distributing Project Gutenberg-tm electronic works
provided that

* You pay a royalty fee of 20% of the gross profits you derive from
  the use of Project Gutenberg-tm works calculated using the method
  you already use to calculate your applicable taxes. The fee is owed
  to the owner of the Project Gutenberg-tm trademark, but he has
  agreed to donate royalties under this paragraph to the Project
  Gutenberg Literary Archive Foundation. Royalty payments must be paid
  within 60 days following each date on which you prepare (or are
  legally required to prepare) your periodic tax returns. Royalty
  payments should be clearly marked as such and sent to the Project
  Gutenberg Literary Archive Foundation at the address specified in
  Section 4, "Information about donations to the Project Gutenberg
  Literary Archive Foundation."

* You provide a full refund of any money paid by a user who notifies
  you in writing (or by e-mail) within 30 days of receipt that s/he
  does not agree to the terms of the full Project Gutenberg-tm
  License. You must require such a user to return or destroy all
  copies of the works possessed in a physical medium and discontinue
  all use of and all access to other copies of Project Gutenberg-tm
  works.

* You provide, in accordance with paragraph 1.F.3, a full refund of
  any money paid for a work or a replacement copy, if a defect in the
  electronic work is discovered and reported to you within 90 days of
  receipt of the work.

* You comply with all other terms of this agreement for free
  distribution of Project Gutenberg-tm works.

1.E.9. If you wish to charge a fee or distribute a Project
Gutenberg-tm electronic work or group of works on different terms than
are set forth in this agreement, you must obtain permission in writing
from both the Project Gutenberg Literary Archive Foundation and The
Project Gutenberg Trademark LLC, the owner of the Project Gutenberg-tm
trademark. Contact the Foundation as set forth in Section 3 below.

1.F.

1.F.1. Project Gutenberg volunteers and employees expend considerable
effort to identify, do copyright research on, transcribe and proofread
works not protected by U.S. copyright law in creating the Project
Gutenberg-tm collection. Despite these efforts, Project Gutenberg-tm
electronic works, and the medium on which they may be stored, may
contain "Defects," such as, but not limited to, incomplete, inaccurate
or corrupt data, transcription errors, a copyright or other
intellectual property infringement, a defective or damaged disk or
other medium, a computer virus, or computer codes that damage or
cannot be read by your equipment.

1.F.2. LIMITED WARRANTY, DISCLAIMER OF DAMAGES - Except for the "Right
of Replacement or Refund" described in paragraph 1.F.3, the Project
Gutenberg Literary Archive Foundation, the owner of the Project
Gutenberg-tm trademark, and any other party distributing a Project
Gutenberg-tm electronic work under this agreement, disclaim all
liability to you for damages, costs and expenses, including legal
fees. YOU AGREE THAT YOU HAVE NO REMEDIES FOR NEGLIGENCE, STRICT
LIABILITY, BREACH OF WARRANTY OR BREACH OF CONTRACT EXCEPT THOSE
PROVIDED IN PARAGRAPH 1.F.3. YOU AGREE THAT THE FOUNDATION, THE
TRADEMARK OWNER, AND ANY DISTRIBUTOR UNDER THIS AGREEMENT WILL NOT BE
LIABLE TO YOU FOR ACTUAL, DIRECT, INDIRECT, CONSEQUENTIAL, PUNITIVE OR
INCIDENTAL DAMAGES EVEN IF YOU GIVE NOTICE OF THE POSSIBILITY OF SUCH
DAMAGE.

1.F.3. LIMITED RIGHT OF REPLACEMENT OR REFUND - If you discover a
defect in this electronic work within 90 days of receiving it, you can
receive a refund of the money (if any) you paid for it by sending a
written explanation to the person you received the work from. If you
received the work on a physical medium, you must return the medium
with your written explanation. The person or entity that provided you
with the defective work may elect to provide a replacement copy in
lieu of a refund. If you received the work electronically, the person
or entity providing it to you may choose to give you a second
opportunity to receive the work electronically in lieu of a refund. If
the second copy is also defective, you may demand a refund in writing
without further opportunities to fix the problem.

1.F.4. Except for the limited right of replacement or refund set forth
in paragraph 1.F.3, this work is provided to you 'AS-IS', WITH NO
OTHER WARRANTIES OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT
LIMITED TO WARRANTIES OF MERCHANTABILITY OR FITNESS FOR ANY PURPOSE.

1.F.5. Some states do not allow disclaimers of certain implied
warranties or the exclusion or limitation of certain types of
damages. If any disclaimer or limitation set forth in this agreement
violates the law of the state applicable to this agreement, the
agreement shall be interpreted to make the maximum disclaimer or
limitation permitted by the applicable state law. The invalidity or
unenforceability of any provision of this agreement shall not void the
remaining provisions.

1.F.6. INDEMNITY - You agree to indemnify and hold the Foundation, the
trademark owner, any agent or employee of the Foundation, anyone
providing copies of Project Gutenberg-tm electronic works in
accordance with this agreement, and any volunteers associated with the
production, promotion and distribution of Project Gutenberg-tm
electronic works, harmless from all liability, costs and expenses,
including legal fees, that arise directly or indirectly from any of
the following which you do or cause to occur: (a) distribution of this
or any Project Gutenberg-tm work, (b) alteration, modification, or
additions or deletions to any Project Gutenberg-tm work, and (c) any
Defect you cause.

Section 2. Information about the Mission of Project Gutenberg-tm

Project Gutenberg-tm is synonymous with the free distribution of
electronic works in formats readable by the widest variety of
computers including obsolete, old, middle-aged and new computers. It
exists because of the efforts of hundreds of volunteers and donations
from people in all walks of life.

Volunteers and financial support to provide volunteers with the
assistance they need are critical to reaching Project Gutenberg-tm's
goals and ensuring that the Project Gutenberg-tm collection will
remain freely available for generations to come. In 2001, the Project
Gutenberg Literary Archive Foundation was created to provide a secure
and permanent future for Project Gutenberg-tm and future
generations. To learn more about the Project Gutenberg Literary
Archive Foundation and how your efforts and donations can help, see
Sections 3 and 4 and the Foundation information page at
www.gutenberg.org


Section 3. Information about the Project Gutenberg Literary Archive Foundation

The Project Gutenberg Literary Archive Foundation is a non profit
501(c)(3) educational corporation organized under the laws of the
state of Mississippi and granted tax exempt status by the Internal
Revenue Service. The Foundation's EIN or federal tax identification
number is 64-6221541. Contributions to the Project Gutenberg Literary
Archive Foundation are tax deductible to the full extent permitted by
U.S. federal laws and your state's laws.

The Foundation's principal office is in Fairbanks, Alaska, with the
mailing address: PO Box 750175, Fairbanks, AK 99775, but its
volunteers and employees are scattered throughout numerous
locations. Its business office is located at 809 North 1500 West, Salt
Lake City, UT 84116, (801) 596-1887. Email contact links and up to
date contact information can be found at the Foundation's web site and
official page at www.gutenberg.org/contact

For additional contact information:

    Dr. Gregory B. Newby
    Chief Executive and Director
    gbnewby@pglaf.org

Section 4. Information about Donations to the Project Gutenberg
Literary Archive Foundation

Project Gutenberg-tm depends upon and cannot survive without wide
spread public support and donations to carry out its mission of
increasing the number of public domain and licensed works that can be
freely distributed in machine readable form accessible by the widest
array of equipment including outdated equipment. Many small donations
($1 to $5,000) are particularly important to maintaining tax exempt
status with the IRS.

The Foundation is committed to complying with the laws regulating
charities and charitable donations in all 50 states of the United
States. Compliance requirements are not uniform and it takes a
considerable effort, much paperwork and many fees to meet and keep up
with these requirements. We do not solicit donations in locations
where we have not received written confirmation of compliance. To SEND
DONATIONS or determine the status of compliance for any particular
state visit www.gutenberg.org/donate

While we cannot and do not solicit contributions from states where we
have not met the solicitation requirements, we know of no prohibition
against accepting unsolicited donations from donors in such states who
approach us with offers to donate.

International donations are gratefully accepted, but we cannot make
any statements concerning tax treatment of donations received from
outside the United States. U.S. laws alone swamp our small staff.

Please check the Project Gutenberg Web pages for current donation
methods and addresses. Donations are accepted in a number of other
ways including checks, online payments and credit card donations. To
donate, please visit: www.gutenberg.org/donate

Section 5. General Information About Project Gutenberg-tm electronic works.

Professor Michael S. Hart was the originator of the Project
Gutenberg-tm concept of a library of electronic works that could be
freely shared with anyone. For forty years, he produced and
distributed Project Gutenberg-tm eBooks with only a loose network of
volunteer support.

Project Gutenberg-tm eBooks are often created from several printed
editions, all of which are confirmed as not protected by copyright in
the U.S. unless a copyright notice is included. Thus, we do not
necessarily keep eBooks in compliance with any particular paper
edition.

Most people start at our Web site which has the main PG search
facility: www.gutenberg.org

This Web site includes information about Project Gutenberg-tm,
including how to make donations to the Project Gutenberg Literary
Archive Foundation, how to help produce our new eBooks, and how to
subscribe to our email newsletter to hear about new eBooks.


================================================
FILE: benches/analyzer.rs
================================================
use criterion::{criterion_group, criterion_main, Criterion};
use tantivy::tokenizer::{
    LowerCaser, RemoveLongFilter, SimpleTokenizer, TextAnalyzer, TokenizerManager,
};

const ALICE_TXT: &str = include_str!("alice.txt");

pub fn criterion_benchmark(c: &mut Criterion) {
    let tokenizer_manager = TokenizerManager::default();
    let mut tokenizer = tokenizer_manager.get("default").unwrap();
    c.bench_function("default-tokenize-alice", |b| {
        b.iter(|| {
            let mut word_count = 0;
            let mut token_stream = tokenizer.token_stream(ALICE_TXT);
            while token_stream.advance() {
                word_count += 1;
            }
            assert_eq!(word_count, 30_731);
        })
    });
    let mut dynamic_analyzer = TextAnalyzer::builder(SimpleTokenizer::default())
        .dynamic()
        .filter_dynamic(RemoveLongFilter::limit(40))
        .filter_dynamic(LowerCaser)
        .build();
    c.bench_function("dynamic-tokenize-alice", |b| {
        b.iter(|| {
            let mut word_count = 0;
            let mut token_stream = dynamic_analyzer.token_stream(ALICE_TXT);
            while token_stream.advance() {
                word_count += 1;
            }
            assert_eq!(word_count, 30_731);
        })
    });
}

// Declares the `benches` group: it runs `criterion_benchmark` with a Criterion
// instance whose sample size is set to 200.
criterion_group! {
    name = benches;
    config = Criterion::default().sample_size(200);
    targets = criterion_benchmark
}
// Hands the `benches` group to Criterion's main macro for this bench target.
criterion_main!(benches);


================================================
FILE: benches/and_or_queries.rs
================================================
// Benchmarks boolean AND/OR queries using binggan.
//
// What’s measured:
// - OR and AND queries with varying selectivity (the leaves are only `Term` queries for now)
// - Nested AND/OR combinations (on multiple fields)
// - No-scoring path using the Count collector (focus on iterator/skip performance)
// - Top-K retrieval (k=10) using the TopDocs collector
//
// Corpus model:
// - Synthetic docs; each token a/b/c is independently included per doc
// - If none of a/b/c are included, emit a neutral filler token to keep doc length similar
//
// Notes:
// - After optimization, when scoring is disabled Tantivy reads doc-only postings
//   (IndexRecordOption::Basic), avoiding frequency decoding overhead.
// - This bench isolates boolean iteration speed and intersection/union cost.
// - Use `cargo bench --bench and_or_queries` to run.

use binggan::{black_box, BenchGroup, BenchRunner};
use rand::prelude::*;
use rand::rngs::StdRng;
use rand::SeedableRng;
use tantivy::collector::sort_key::SortByStaticFastValue;
use tantivy::collector::{Collector, Count, TopDocs};
use tantivy::query::{Query, QueryParser};
use tantivy::schema::{Schema, FAST, TEXT};
use tantivy::{doc, Index, Order, ReloadPolicy, Searcher};

/// One benchmark "view": a searcher paired with the query parser used to turn
/// the benchmark query strings into queries.
#[derive(Clone)]
struct BenchIndex {
    /// The underlying index. Not read by the benchmark code (hence the
    /// `dead_code` allowance); presumably kept so the view owns a handle to it.
    #[allow(dead_code)]
    index: Index,
    /// Searcher the benchmark tasks run their queries against.
    searcher: Searcher,
    /// Parser whose default fields determine which fields a bare term targets.
    query_parser: QueryParser,
}

/// Creates one in-RAM index holding the text fields `title` and `body` plus the
/// fast fields `score` and `score2`, fills it with `num_docs` synthetic documents
/// and hands back two BenchIndex views over that same index:
/// - single_field: its QueryParser defaults to "body" only
/// - multi_field:  its QueryParser defaults to ["title", "body"]
///
/// `p_a`, `p_b` and `p_c` are the per-document probabilities that the tokens
/// "a", "b" and "c" are present.
fn build_shared_indices(num_docs: usize, p_a: f32, p_b: f32, p_c: f32) -> (BenchIndex, BenchIndex) {
    // One schema shared by both views.
    let mut schema_builder = Schema::builder();
    let f_title = schema_builder.add_text_field("title", TEXT);
    let f_body = schema_builder.add_text_field("body", TEXT);
    let f_score = schema_builder.add_u64_field("score", FAST);
    let f_score2 = schema_builder.add_u64_field("score2", FAST);
    let index = Index::create_in_ram(schema_builder.build());

    // Fixed seed so every run indexes the same corpus.
    let mut rng = StdRng::from_seed([7u8; 32]);

    let mut writer = index.writer_with_num_threads(1, 500_000_000).unwrap();
    for _ in 0..num_docs {
        // The order of the RNG draws is part of the corpus definition:
        // presence flags first, then both scores, then one placement draw per
        // token that is present.
        let has_a = rng.random_bool(f64::from(p_a));
        let has_b = rng.random_bool(f64::from(p_b));
        let has_c = rng.random_bool(f64::from(p_c));
        let score = rng.random_range(0u64..100u64);
        let score2 = rng.random_range(0u64..100_000u64);

        let mut title_tokens: Vec<&str> = Vec::new();
        let mut body_tokens: Vec<&str> = Vec::new();
        for (is_present, token) in [(has_a, "a"), (has_b, "b"), (has_c, "c")] {
            if !is_present {
                continue;
            }
            // A present token lands in the title 10% of the time, else in the body.
            let destination = if rng.random_bool(0.1) {
                &mut title_tokens
            } else {
                &mut body_tokens
            };
            destination.push(token);
        }
        // Documents without any of a/b/c get a neutral filler token.
        if title_tokens.is_empty() && body_tokens.is_empty() {
            body_tokens.push("z");
        }

        let document = doc!(
            f_title=>title_tokens.join(" "),
            f_body=>body_tokens.join(" "),
            f_score=>score,
            f_score2=>score2,
        );
        writer.add_document(document).unwrap();
    }
    writer.commit().unwrap();
    // Release the writer before the reader is created.
    drop(writer);

    // A single reader/searcher is shared by both views.
    let reader = index
        .reader_builder()
        .reload_policy(ReloadPolicy::Manual)
        .try_into()
        .unwrap();
    let searcher = reader.searcher();

    // The views differ only in the default fields of their query parser.
    let single_view = BenchIndex {
        query_parser: QueryParser::for_index(&index, vec![f_body]),
        index: index.clone(),
        searcher: searcher.clone(),
    };
    let multi_view = BenchIndex {
        query_parser: QueryParser::for_index(&index, vec![f_title, f_body]),
        index,
        searcher,
    };
    (single_view, multi_view)
}

/// Entry point: for every corpus scenario, builds one shared index, then runs
/// one benchmark group per view (single-field and multi-field). Each group
/// registers every query with four collectors: count, top-10 by score,
/// top-10 by one fast field and top-10 by two fast fields.
fn main() {
    // Corpora with varying selectivity: (label, num_docs, p(a), p(b), p(c)).
    let scenarios = [
        ("N=1M, p(a)=5%, p(b)=1%, p(c)=15%", 1_000_000, 0.05, 0.01, 0.15),
        ("N=1M, p(a)=1%, p(b)=1%, p(c)=15%", 1_000_000, 0.01, 0.01, 0.15),
    ];

    let queries = ["a", "+a +b", "+a +b +c", "a OR b", "a OR b OR c"];

    let mut runner = BenchRunner::new();
    for (label, num_docs, p_a, p_b, p_c) in scenarios {
        // One index per scenario, exposed through two query-parser views.
        let (single_view, multi_view) = build_shared_indices(num_docs, p_a, p_b, p_c);
        let views = [("single_field", single_view), ("multi_field", multi_view)];

        for (view_name, bench_index) in views {
            // One group per (view, scenario) pair.
            let mut group = runner.new_group();
            group.set_name(format!("{} — {}", view_name, label));
            for query_str in queries {
                add_bench_task(&mut group, &bench_index, query_str, Count, "count");

                let top10_by_score = TopDocs::with_limit(10).order_by_score();
                add_bench_task(&mut group, &bench_index, query_str, top10_by_score, "top10");

                let top10_by_ff =
                    TopDocs::with_limit(10).order_by_fast_field::<u64>("score", Order::Asc);
                add_bench_task(
                    &mut group,
                    &bench_index,
                    query_str,
                    top10_by_ff,
                    "top10_by_ff",
                );

                let top10_by_2ff = TopDocs::with_limit(10).order_by((
                    SortByStaticFastValue::<u64>::for_field("score"),
                    SortByStaticFastValue::<u64>::for_field("score2"),
                ));
                add_bench_task(
                    &mut group,
                    &bench_index,
                    query_str,
                    top10_by_2ff,
                    "top10_by_2ff",
                );
            }
            group.run();
        }
    }
}

/// Parses `query_str` with the view's query parser and registers a task on
/// `bench_group` that runs the resulting query with `collector`.
///
/// The task is named `<query with spaces replaced by '_'>_<collector_name>`.
/// Panics if the query string cannot be parsed.
fn add_bench_task<C: Collector + 'static>(
    bench_group: &mut BenchGroup,
    bench_index: &BenchIndex,
    query_str: &str,
    collector: C,
    collector_name: &str,
) {
    let sanitized_query = query_str.replace(' ', "_");
    let task_name = format!("{}_{}", sanitized_query, collector_name);

    // The task owns everything it needs so the closure can be `move`.
    let search_task = SearchTask {
        searcher: bench_index.searcher.clone(),
        collector,
        query: bench_index.query_parser.parse_query(query_str).unwrap(),
    };
    bench_group.register(task_name, move |_| black_box(search_task.run()));
}

/// A self-contained unit of benchmark work: one parsed query to be executed
/// with one collector on one searcher.
struct SearchTask<C: Collector> {
    /// Searcher the query is executed on.
    searcher: Searcher,
    /// Collector passed to the search.
    collector: C,
    /// The already-parsed query.
    query: Box<dyn Query>,
}

impl<C: Collector> SearchTask<C> {
    /// Executes the stored query with the stored collector and panics if the
    /// search fails. The search result is discarded; the constant `1` is
    /// returned so the caller has a value to hand to `black_box`.
    #[inline(never)]
    pub fn run(&self) -> usize {
        let Self {
            searcher,
            collector,
            query,
        } = self;
        searcher.search(query, collector).unwrap();
        1
    }
}


================================================
FILE: benches/bool_queries_with_range.rs
================================================
use binggan::{black_box, BenchGroup, BenchRunner};
use rand::prelude::*;
use rand::rngs::StdRng;
use rand::SeedableRng;
use tantivy::collector::{Collector, Count, DocSetCollector, TopDocs};
use tantivy::query::{Query, QueryParser};
use tantivy::schema::{Schema, FAST, INDEXED, TEXT};
use tantivy::{doc, Index, Order, ReloadPolicy, Searcher};

/// Bundle of everything a benchmark task needs to query the benchmark index.
#[derive(Clone)]
struct BenchIndex {
    /// The underlying index. Marked `dead_code`-allowed because it is not read;
    /// presumably kept so the bundle owns a handle to the index.
    #[allow(dead_code)]
    index: Index,
    /// Searcher over the index.
    searcher: Searcher,
    /// Query parser for the index.
    query_parser: QueryParser,
}

/// Builds an in-RAM index holding `num_docs` documents and returns it together with a
/// searcher and a query parser that defaults to the `title` field.
///
/// Every document carries:
/// - `title`: the token `"a"` with probability `p_title_a`, otherwise `"b"`;
/// - `num_rand` and `num_rand_fast`: the same random `u64`;
/// - `num_asc` and `num_asc_fast`: the same value derived from the insertion position.
///
/// `distribution` selects the value ranges:
/// - `"dense"`: random values drawn from `0..1000`, ascending value is `position / 10000`;
/// - `"sparse"`: random values drawn from `0..10000000`, ascending value is the position.
///
/// The RNG is seeded with a constant, so repeated calls with the same arguments draw the
/// same sequence of values.
///
/// # Panics
///
/// Panics if `distribution` is neither `"dense"` nor `"sparse"`, or if any index
/// operation fails.
fn build_shared_indices(num_docs: usize, p_title_a: f32, distribution: &str) -> BenchIndex {
    // One schema shared by every scenario.
    let mut builder = Schema::builder();
    let title = builder.add_text_field("title", TEXT);
    let num_rand = builder.add_u64_field("num_rand", INDEXED);
    let num_asc = builder.add_u64_field("num_asc", INDEXED);
    let num_rand_fast = builder.add_u64_field("num_rand_fast", INDEXED | FAST);
    let num_asc_fast = builder.add_u64_field("num_asc_fast", INDEXED | FAST);
    let index = Index::create_in_ram(builder.build());

    // Fixed seed: the generated corpus is the same on every run.
    let mut rng = StdRng::from_seed([7u8; 32]);
    let title_a_probability = f64::from(p_title_a);

    {
        let mut writer = index.writer_with_num_threads(1, 4_000_000_000).unwrap();

        // The distributions differ only in the exclusive upper bound of the random value
        // and in how many consecutive documents share one ascending value.
        let (rand_upper_bound, docs_per_asc_value): (u64, usize) = match distribution {
            "dense" => (1000, 10000),
            "sparse" => (10000000, 1),
            _ => panic!("Unsupported distribution type"),
        };

        for position in 0..num_docs {
            // A title is always present, so no document is empty.
            let token = if rng.random_bool(title_a_probability) {
                "a"
            } else {
                "b"
            };
            let rand_value = rng.random_range(0u64..rand_upper_bound);
            let asc_value = (position / docs_per_asc_value) as u64;

            writer
                .add_document(doc!(
                    title => token,
                    num_rand => rand_value,
                    num_asc => asc_value,
                    num_rand_fast => rand_value,
                    num_asc_fast => asc_value,
                ))
                .unwrap();
        }
        writer.commit().unwrap();
    }

    // The reader and searcher are created once, after the only commit.
    let reader = index
        .reader_builder()
        .reload_policy(ReloadPolicy::Manual)
        .try_into()
        .unwrap();
    let searcher = reader.searcher();

    // Bare terms in a query string are looked up in `title`.
    let query_parser = QueryParser::for_index(&index, vec![title]);

    BenchIndex {
        index,
        searcher,
        query_parser,
    }
}

/// Entry point: benchmarks term-and-range and range-and-range queries on every scenario.
///
/// Each scenario builds a fresh 10,000,000-document index whose title is `a` with
/// probability 0.99, using either the `"dense"` or the `"sparse"` value distribution, and
/// queries it with a single numeric range.
fn main() {
    const NUM_DOCS: usize = 10_000_000;
    const P_TITLE_A: f32 = 0.99;

    // (distribution, range lower bound, range upper bound)
    let scenarios = [
        ("dense", 0, 9),
        ("dense", 990, 999),
        ("sparse", 0, 9),
        ("sparse", 9_999_990, 9_999_999),
    ];

    // The four numeric fields: indexed-only and indexed + fast, random and ascending.
    let field_names = ["num_rand", "num_asc", "num_rand_fast", "num_asc_fast"];
    // `a` and `b` are the only title tokens ever indexed; `z` matches no title.
    let terms = ["a", "b", "z"];

    let mut runner = BenchRunner::new();
    for (distribution, range_low, range_high) in scenarios {
        let bench_index = build_shared_indices(NUM_DOCS, P_TITLE_A, distribution);

        let mut group = runner.new_group();
        group.set_name(format!("{} and 99% a", distribution));

        // Every (term, field) pair, terms varying slowest.
        let term_and_range = terms.iter().flat_map(|&term| {
            field_names.iter().map(move |&field_name| {
                let query_str = format!(
                    "{} AND {}:[{} TO {}]",
                    term, field_name, range_low, range_high
                );
                (query_str, field_name)
            })
        });

        // One extra query intersecting the two fast-field ranges.
        let range_and_range = std::iter::once((
            format!(
                "{}:[{} TO {}] AND {}:[{} TO {}]",
                "num_rand_fast", range_low, range_high, "num_asc_fast", range_low, range_high
            ),
            "num_asc_fast",
        ));

        for (query_str, field_name) in term_and_range.chain(range_and_range) {
            run_benchmark_tasks(&mut group, &bench_index, &query_str, field_name);
        }

        group.run();
    }
}

/// Registers every collector variant for one query string.
///
/// A `Count` task and a `DocSetCollector` task are always registered. When `field_name`
/// ends with `_fast`, two more tasks collect the top 100 documents ordered by that field,
/// first ascending and then descending.
fn run_benchmark_tasks(
    bench_group: &mut BenchGroup,
    bench_index: &BenchIndex,
    query_str: &str,
    field_name: &str,
) {
    add_bench_task(bench_group, bench_index, query_str, Count, "count");
    add_bench_task(
        bench_group,
        bench_index,
        query_str,
        DocSetCollector,
        "all results",
    );

    // Ordering by field value is only benchmarked for the `*_fast` fields.
    if !field_name.ends_with("_fast") {
        return;
    }

    for (order, direction) in [(Order::Asc, "asc"), (Order::Desc, "desc")] {
        let collector_name = format!("top100_by_{}_{}", field_name, direction);
        let top_by_field =
            TopDocs::with_limit(100).order_by_fast_field::<u64>(field_name.to_string(), order);
        add_bench_task(
            bench_group,
            bench_index,
            query_str,
            top_by_field,
            &collector_name,
        );
    }
}

/// Registers one search benchmark on `bench_group`.
///
/// `query_str` is parsed with the query parser of `bench_index`; the registered task runs
/// the parsed query with `collector` on a clone of the index's searcher. The task is
/// named `<query_str with spaces replaced by underscores>_<collector_name>`.
///
/// # Panics
///
/// Panics if `query_str` cannot be parsed.
fn add_bench_task<C: Collector + 'static>(
    bench_group: &mut BenchGroup,
    bench_index: &BenchIndex,
    query_str: &str,
    collector: C,
    collector_name: &str,
) {
    let label = format!("{}_{}", query_str.replace(' ', "_"), collector_name);
    let parsed_query = bench_index.query_parser.parse_query(query_str).unwrap();
    let searcher = bench_index.searcher.clone();
    let task = SearchTask {
        searcher,
        collector,
        query: parsed_query,
    };
    // The task is moved into the closure so that it owns everything it needs.
    bench_group.register(label, move |_| {
        let result_size = task.run();
        black_box(result_size)
    });
}

/// One benchmark unit: a parsed query paired with the collector and searcher used to run it.
struct SearchTask<C: Collector> {
    /// Searcher the query is executed on.
    searcher: Searcher,
    /// Collector handed to every search.
    collector: C,
    /// Parsed query to execute.
    query: Box<dyn Query>,
}

impl<C: Collector> SearchTask<C> {
    /// Executes the query and returns the size of what the collector produced.
    ///
    /// The fruit type depends on `C`, so it is inspected dynamically:
    /// - `usize`: returned as is;
    /// - `Vec<(Option<u64>, DocAddress)>` or `Vec<(u64, DocAddress)>`: its length;
    /// - `HashSet<DocAddress>`: its length.
    ///
    /// For any other fruit type a message naming the type is written to stderr and `0`
    /// is returned.
    ///
    /// # Panics
    ///
    /// Panics if the search returns an error.
    #[inline(never)]
    pub fn run(&self) -> usize {
        let fruit = self.searcher.search(&self.query, &self.collector).unwrap();
        // Erase the type once and probe the known fruit shapes in turn.
        let erased: &dyn std::any::Any = &fruit;

        if let Some(&count) = erased.downcast_ref::<usize>() {
            return count;
        }
        if let Some(hits) = erased.downcast_ref::<Vec<(Option<u64>, tantivy::DocAddress)>>() {
            return hits.len();
        }
        if let Some(hits) = erased.downcast_ref::<Vec<(u64, tantivy::DocAddress)>>() {
            return hits.len();
        }
        if let Some(docs) =
            erased.downcast_ref::<std::collections::HashSet<tantivy::DocAddress>>()
        {
            return docs.len();
        }

        eprintln!(
            "Unknown collector result type: {:?}",
            std::any::type_name::<C::Fruit>()
        );
        0
    }
}


================================================
FILE: benches/exists_json.rs
================================================
use binggan::plugins::PeakMemAllocPlugin;
use binggan::{black_box, InputGroup, PeakMemAlloc, INSTRUMENTED_SYSTEM};
use serde_json::json;
use tantivy::collector::Count;
use tantivy::query::ExistsQuery;
use tantivy::schema::{Schema, FAST, TEXT};
use tantivy::{doc, Index};

/// Process-wide allocator: binggan's `INSTRUMENTED_SYSTEM` wrapper around the system
/// allocator. `main` hands this same static to `PeakMemAllocPlugin`.
// NOTE(review): presumably this is what lets the plugin report peak memory — confirm
// against the binggan documentation.
#[global_allocator]
pub static GLOBAL: &PeakMemAlloc<std::alloc::System> = &INSTRUMENTED_SYSTEM;

/// Entry point: benchmarks `exists_json_union` on indices whose JSON field has a growing
/// number of distinct subfields.
///
/// One 500,000-document index is built per subfield count. Each is registered as a named
/// input (`subfields=<count>`), and the group and bench iteration counts are both set
/// to 1.
fn main() {
    let doc_count: usize = 500_000;
    let subfield_counts: [usize; 13] = [1, 2, 3, 4, 5, 6, 7, 8, 16, 256, 4096, 65536, 262144];

    let mut inputs: Vec<(String, Index)> = Vec::with_capacity(subfield_counts.len());
    for sub_fields in subfield_counts {
        let label = format!("subfields={sub_fields}");
        let index = build_index_with_json_subfields(doc_count, sub_fields);
        inputs.push((label, index));
    }

    let mut group = InputGroup::new_with_inputs(inputs);
    group.add_plugin(PeakMemAllocPlugin::new(GLOBAL));

    group.config().num_iter_group = Some(1);
    group.config().num_iter_bench = Some(1);
    group.register("exists_json", exists_json_union);

    group.run();
}

/// Benchmark body: opens a reader on `index` and counts the documents matched by an
/// `ExistsQuery` on the `json` field.
// NOTE(review): the `true` argument presumably makes the query cover every JSON subpath
// (hence "union") — confirm against the `ExistsQuery::new` documentation.
fn exists_json_union(index: &Index) {
    let reader = index.reader().expect("reader");
    let searcher = reader.searcher();
    let exists_query = ExistsQuery::new("json".to_string(), true);
    let matching_docs = searcher
        .search(&exists_query, &Count)
        .expect("exists search");
    // Feed the count to `black_box` so the search cannot be optimized away.
    black_box(matching_docs);
}

/// Creates a temp-dir index of `num_docs` documents, each carrying a single
/// JSON sub-field chosen round-robin from `num_subfields` distinct keys.
///
/// Document `i` is `{ "field_<i % num_subfields>": i }`, so no single sub-path
/// is present in every document (once `num_subfields > 1`), while the union
/// of all sub-paths covers every document.
///
/// # Panics
///
/// Panics if `num_subfields` is 0 (and `num_docs > 0`), or if creating the
/// index, creating the writer, adding a document, or committing fails.
fn build_index_with_json_subfields(num_docs: usize, num_subfields: usize) -> Index {
    // A single JSON field, declared TEXT | FAST; the FAST flag is what the
    // ExistsQuery benchmark relies on.
    let mut builder = Schema::builder();
    let json_field = builder.add_json_field("json", TEXT | FAST);
    let index = Index::create_from_tempdir(builder.build()).expect("create index");

    let mut writer = index
        .writer_with_num_threads(1, 200_000_000)
        .expect("writer");

    for doc_ord in 0..num_docs {
        // Rotate through the sub-paths: exactly one key is set per document.
        let key = format!("field_{}", doc_ord % num_subfields);
        let payload = json!({ key: doc_ord as u64 });
        writer
            .add_document(doc!(json_field => payload))
            .expect("add_document");
    }
    writer.commit().expect("commit");

    // Release the writer before handing the index back to the caller.
    drop(writer);

    index
}


================================================
FILE: benches/gh.json
================================================
{"id":"2489395767","type":"PushEvent","actor":{"id":1310570,"login":"soumith","gravatar_id":"","url":"https://api.github.com/users/soumith","avatar_url":"https://avatars.githubusercontent.com/u/1310570?"},"repo":{"id":28067809,"name":"soumith/fbcunn","url":"https://api.github.com/repos/soumith/fbcunn"},"payload":{"push_id":536752122,"size":4,"distinct_size":4,"ref":"refs/heads/master","head":"fa6048ec9b9eeafd12cee5f81324f355e1f2a198","before":"2d06657267b32e0c8e193c617039da200f710195","commits":[{"sha":"dbd68d30ee1f7b60d404553fc1c6226ebb374c8e","author":{"email":"88de463b5797707cf3425f85a415c3d869db732b@gmail.com","name":"Soumith Chintala"},"message":"back to old structure, except lua files moved out","distinct":true,"url":"https://api.github.com/repos/soumith/fbcunn/commits/dbd68d30ee1f7b60d404553fc1c6226ebb374c8e"},{"sha":"5567f9f5a83d7fe3320b18e5b89405e8a5ca77e6","author":{"email":"88de463b5797707cf3425f85a415c3d869db732b@gmail.com","name":"Soumith Chintala"},"message":"...","distinct":true,"url":"https://api.github.com/repos/soumith/fbcunn/commits/5567f9f5a83d7fe3320b18e5b89405e8a5ca77e6"},{"sha":"58a83b277328eca811d3a37cf171b2fc4fcd87af","author":{"email":"88de463b5797707cf3425f85a415c3d869db732b@gmail.com","name":"Soumith Chintala"},"message":"...","distinct":true,"url":"https://api.github.com/repos/soumith/fbcunn/commits/58a83b277328eca811d3a37cf171b2fc4fcd87af"},{"sha":"fa6048ec9b9eeafd12cee5f81324f355e1f2a198","author":{"email":"88de463b5797707cf3425f85a415c3d869db732b@gmail.com","name":"Soumith Chintala"},"message":"...","distinct":true,"url":"https://api.github.com/repos/soumith/fbcunn/commits/fa6048ec9b9eeafd12cee5f81324f355e1f2a198"}]},"public":true,"created_at":"2015-01-01T01:00:00Z"}
{"id":"2489395768","type":"PushEvent","actor":{"id":227068,"login":"radix","gravatar_id":"","url":"https://api.github.com/users/radix","avatar_url":"https://avatars.githubusercontent.com/u/227068?"},"repo":{"id":20022094,"name":"radix/effect","url":"https://api.github.com/repos/radix/effect"},"payload":{"push_id":536752123,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"defdbe78db98ad69d72f42b09194309f47616592","before":"d4c2903c26a8e50e7605405281b9d407855ff4c3","commits":[{"sha":"defdbe78db98ad69d72f42b09194309f47616592","author":{"email":"5f33e8ddd36b0c849687df732835b9abbe9b347b@twistedmatrix.com","name":"Christopher Armstrong"},"message":"put the auto-generated API docs in the repository so readthedocs will work.\nsigh.","distinct":true,"url":"https://api.github.com/repos/radix/effect/commits/defdbe78db98ad69d72f42b09194309f47616592"}]},"public":true,"created_at":"2015-01-01T01:00:00Z"}
{"id":"2489395770","type":"PullRequestEvent","actor":{"id":1341245,"login":"asfgit","gravatar_id":"","url":"https://api.github.com/users/asfgit","avatar_url":"https://avatars.githubusercontent.com/u/1341245?"},"repo":{"id":17165658,"name":"apache/spark","url":"https://api.github.com/repos/apache/spark"},"payload":{"action":"closed","number":3842,"pull_request":{"url":"https://api.github.com/repos/apache/spark/pulls/3842","id":26684124,"html_url":"https://github.com/apache/spark/pull/3842","diff_url":"https://github.com/apache/spark/pull/3842.diff","patch_url":"https://github.com/apache/spark/pull/3842.patch","issue_url":"https://api.github.com/repos/apache/spark/issues/3842","number":3842,"state":"closed","locked":false,"title":"SPARK-2757 [BUILD] [STREAMING] Add Mima test for Spark Sink after 1.10 is released","user":{"login":"srowen","id":822522,"avatar_url":"https://avatars.githubusercontent.com/u/822522?v=3","gravatar_id":"","url":"https://api.github.com/users/srowen","html_url":"https://github.com/srowen","followers_url":"https://api.github.com/users/srowen/followers","following_url":"https://api.github.com/users/srowen/following{/other_user}","gists_url":"https://api.github.com/users/srowen/gists{/gist_id}","starred_url":"https://api.github.com/users/srowen/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/srowen/subscriptions","organizations_url":"https://api.github.com/users/srowen/orgs","repos_url":"https://api.github.com/users/srowen/repos","events_url":"https://api.github.com/users/srowen/events{/privacy}","received_events_url":"https://api.github.com/users/srowen/received_events","type":"User","site_admin":false},"body":"Re-enable MiMa for Streaming Flume Sink module, now that 1.1.0 is released, per the JIRA TO-DO. 
That's pretty much all there is to this.","created_at":"2014-12-30T12:47:17Z","updated_at":"2015-01-01T01:00:02Z","closed_at":"2015-01-01T01:00:02Z","merged_at":null,"merge_commit_sha":"c66df2c9084212b592f5eb7a47fcebec542fda65","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/apache/spark/pulls/3842/commits","review_comments_url":"https://api.github.com/repos/apache/spark/pulls/3842/comments","review_comment_url":"https://api.github.com/repos/apache/spark/pulls/comments/{number}","comments_url":"https://api.github.com/repos/apache/spark/issues/3842/comments","statuses_url":"https://api.github.com/repos/apache/spark/statuses/50ff80e4498c2cb0a30793fb41fa2d20942811d6","head":{"label":"srowen:SPARK-2757","ref":"SPARK-2757","sha":"50ff80e4498c2cb0a30793fb41fa2d20942811d6","user":{"login":"srowen","id":822522,"avatar_url":"https://avatars.githubusercontent.com/u/822522?v=3","gravatar_id":"","url":"https://api.github.com/users/srowen","html_url":"https://github.com/srowen","followers_url":"https://api.github.com/users/srowen/followers","following_url":"https://api.github.com/users/srowen/following{/other_user}","gists_url":"https://api.github.com/users/srowen/gists{/gist_id}","starred_url":"https://api.github.com/users/srowen/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/srowen/subscriptions","organizations_url":"https://api.github.com/users/srowen/orgs","repos_url":"https://api.github.com/users/srowen/repos","events_url":"https://api.github.com/users/srowen/events{/privacy}","received_events_url":"https://api.github.com/users/srowen/received_events","type":"User","site_admin":false},"repo":{"id":17241201,"name":"spark","full_name":"srowen/spark","owner":{"login":"srowen","id":822522,"avatar_url":"https://avatars.githubusercontent.com/u/822522?v=3","gravatar_id":"","url":"https://api.github.com/users/srowen","html_url":"https://github.com/srowen","followers_url":"https://api.github.com/users/srowen/followers","followi
ng_url":"https://api.github.com/users/srowen/following{/other_user}","gists_url":"https://api.github.com/users/srowen/gists{/gist_id}","starred_url":"https://api.github.com/users/srowen/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/srowen/subscriptions","organizations_url":"https://api.github.com/users/srowen/orgs","repos_url":"https://api.github.com/users/srowen/repos","events_url":"https://api.github.com/users/srowen/events{/privacy}","received_events_url":"https://api.github.com/users/srowen/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/srowen/spark","description":"Mirror of Apache Spark","fork":true,"url":"https://api.github.com/repos/srowen/spark","forks_url":"https://api.github.com/repos/srowen/spark/forks","keys_url":"https://api.github.com/repos/srowen/spark/keys{/key_id}","collaborators_url":"https://api.github.com/repos/srowen/spark/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/srowen/spark/teams","hooks_url":"https://api.github.com/repos/srowen/spark/hooks","issue_events_url":"https://api.github.com/repos/srowen/spark/issues/events{/number}","events_url":"https://api.github.com/repos/srowen/spark/events","assignees_url":"https://api.github.com/repos/srowen/spark/assignees{/user}","branches_url":"https://api.github.com/repos/srowen/spark/branches{/branch}","tags_url":"https://api.github.com/repos/srowen/spark/tags","blobs_url":"https://api.github.com/repos/srowen/spark/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/srowen/spark/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/srowen/spark/git/refs{/sha}","trees_url":"https://api.github.com/repos/srowen/spark/git/trees{/sha}","statuses_url":"https://api.github.com/repos/srowen/spark/statuses/{sha}","languages_url":"https://api.github.com/repos/srowen/spark/languages","stargazers_url":"https://api.github.com/repos/srowen/spark/stargazers","contributors_url":"https://api.github.
com/repos/srowen/spark/contributors","subscribers_url":"https://api.github.com/repos/srowen/spark/subscribers","subscription_url":"https://api.github.com/repos/srowen/spark/subscription","commits_url":"https://api.github.com/repos/srowen/spark/commits{/sha}","git_commits_url":"https://api.github.com/repos/srowen/spark/git/commits{/sha}","comments_url":"https://api.github.com/repos/srowen/spark/comments{/number}","issue_comment_url":"https://api.github.com/repos/srowen/spark/issues/comments/{number}","contents_url":"https://api.github.com/repos/srowen/spark/contents/{+path}","compare_url":"https://api.github.com/repos/srowen/spark/compare/{base}...{head}","merges_url":"https://api.github.com/repos/srowen/spark/merges","archive_url":"https://api.github.com/repos/srowen/spark/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/srowen/spark/downloads","issues_url":"https://api.github.com/repos/srowen/spark/issues{/number}","pulls_url":"https://api.github.com/repos/srowen/spark/pulls{/number}","milestones_url":"https://api.github.com/repos/srowen/spark/milestones{/number}","notifications_url":"https://api.github.com/repos/srowen/spark/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/srowen/spark/labels{/name}","releases_url":"https://api.github.com/repos/srowen/spark/releases{/id}","created_at":"2014-02-27T07:57:07Z","updated_at":"2014-12-31T22:16:53Z","pushed_at":"2014-12-31T23:34:36Z","git_url":"git://github.com/srowen/spark.git","ssh_url":"git@github.com:srowen/spark.git","clone_url":"https://github.com/srowen/spark.git","svn_url":"https://github.com/srowen/spark","homepage":null,"size":84942,"stargazers_count":1,"watchers_count":1,"language":"Scala","has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":1,"mirror_url":null,"open_issues_count":0,"forks":1,"open_issues":0,"watchers":1,"default_branch":"master"}},"base":{"label":"apache:master","ref":"master","sha":"040d6f2d13b132b3ef
2a1e4f12f9f0e781c5a0b8","user":{"login":"apache","id":47359,"avatar_url":"https://avatars.githubusercontent.com/u/47359?v=3","gravatar_id":"","url":"https://api.github.com/users/apache","html_url":"https://github.com/apache","followers_url":"https://api.github.com/users/apache/followers","following_url":"https://api.github.com/users/apache/following{/other_user}","gists_url":"https://api.github.com/users/apache/gists{/gist_id}","starred_url":"https://api.github.com/users/apache/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/apache/subscriptions","organizations_url":"https://api.github.com/users/apache/orgs","repos_url":"https://api.github.com/users/apache/repos","events_url":"https://api.github.com/users/apache/events{/privacy}","received_events_url":"https://api.github.com/users/apache/received_events","type":"Organization","site_admin":false},"repo":{"id":17165658,"name":"spark","full_name":"apache/spark","owner":{"login":"apache","id":47359,"avatar_url":"https://avatars.githubusercontent.com/u/47359?v=3","gravatar_id":"","url":"https://api.github.com/users/apache","html_url":"https://github.com/apache","followers_url":"https://api.github.com/users/apache/followers","following_url":"https://api.github.com/users/apache/following{/other_user}","gists_url":"https://api.github.com/users/apache/gists{/gist_id}","starred_url":"https://api.github.com/users/apache/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/apache/subscriptions","organizations_url":"https://api.github.com/users/apache/orgs","repos_url":"https://api.github.com/users/apache/repos","events_url":"https://api.github.com/users/apache/events{/privacy}","received_events_url":"https://api.github.com/users/apache/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/apache/spark","description":"Mirror of Apache 
Spark","fork":false,"url":"https://api.github.com/repos/apache/spark","forks_url":"https://api.github.com/repos/apache/spark/forks","keys_url":"https://api.github.com/repos/apache/spark/keys{/key_id}","collaborators_url":"https://api.github.com/repos/apache/spark/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/apache/spark/teams","hooks_url":"https://api.github.com/repos/apache/spark/hooks","issue_events_url":"https://api.github.com/repos/apache/spark/issues/events{/number}","events_url":"https://api.github.com/repos/apache/spark/events","assignees_url":"https://api.github.com/repos/apache/spark/assignees{/user}","branches_url":"https://api.github.com/repos/apache/spark/branches{/branch}","tags_url":"https://api.github.com/repos/apache/spark/tags","blobs_url":"https://api.github.com/repos/apache/spark/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/apache/spark/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/apache/spark/git/refs{/sha}","trees_url":"https://api.github.com/repos/apache/spark/git/trees{/sha}","statuses_url":"https://api.github.com/repos/apache/spark/statuses/{sha}","languages_url":"https://api.github.com/repos/apache/spark/languages","stargazers_url":"https://api.github.com/repos/apache/spark/stargazers","contributors_url":"https://api.github.com/repos/apache/spark/contributors","subscribers_url":"https://api.github.com/repos/apache/spark/subscribers","subscription_url":"https://api.github.com/repos/apache/spark/subscription","commits_url":"https://api.github.com/repos/apache/spark/commits{/sha}","git_commits_url":"https://api.github.com/repos/apache/spark/git/commits{/sha}","comments_url":"https://api.github.com/repos/apache/spark/comments{/number}","issue_comment_url":"https://api.github.com/repos/apache/spark/issues/comments/{number}","contents_url":"https://api.github.com/repos/apache/spark/contents/{+path}","compare_url":"https://api.github.com/repos/apache/spark/compare/{base}...{head}","merges_
url":"https://api.github.com/repos/apache/spark/merges","archive_url":"https://api.github.com/repos/apache/spark/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/apache/spark/downloads","issues_url":"https://api.github.com/repos/apache/spark/issues{/number}","pulls_url":"https://api.github.com/repos/apache/spark/pulls{/number}","milestones_url":"https://api.github.com/repos/apache/spark/milestones{/number}","notifications_url":"https://api.github.com/repos/apache/spark/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/apache/spark/labels{/name}","releases_url":"https://api.github.com/repos/apache/spark/releases{/id}","created_at":"2014-02-25T08:00:08Z","updated_at":"2015-01-01T00:59:33Z","pushed_at":"2015-01-01T00:59:33Z","git_url":"git://github.com/apache/spark.git","ssh_url":"git@github.com:apache/spark.git","clone_url":"https://github.com/apache/spark.git","svn_url":"https://github.com/apache/spark","homepage":null,"size":1083068,"stargazers_count":2458,"watchers_count":2458,"language":"Scala","has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":2179,"mirror_url":"git://git.apache.org/spark.git","open_issues_count":268,"forks":2179,"open_issues":268,"watchers":2458,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/apache/spark/pulls/3842"},"html":{"href":"https://github.com/apache/spark/pull/3842"},"issue":{"href":"https://api.github.com/repos/apache/spark/issues/3842"},"comments":{"href":"https://api.github.com/repos/apache/spark/issues/3842/comments"},"review_comments":{"href":"https://api.github.com/repos/apache/spark/pulls/3842/comments"},"review_comment":{"href":"https://api.github.com/repos/apache/spark/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/apache/spark/pulls/3842/commits"},"statuses":{"href":"https://api.github.com/repos/apache/spark/statuses/50ff80e4498c2cb0a30793fb41fa2d20942811d6"}},"merged":fals
e,"mergeable":null,"mergeable_state":"unknown","merged_by":null,"comments":13,"review_comments":0,"commits":2,"additions":6,"deletions":1,"changed_files":2}},"public":true,"created_at":"2015-01-01T01:00:02Z","org":{"id":47359,"login":"apache","gravatar_id":"","url":"https://api.github.com/orgs/apache","avatar_url":"https://avatars.githubusercontent.com/u/47359?"}}
{"id":"2489395771","type":"PushEvent","actor":{"id":1341245,"login":"asfgit","gravatar_id":"","url":"https://api.github.com/users/asfgit","avatar_url":"https://avatars.githubusercontent.com/u/1341245?"},"repo":{"id":17165658,"name":"apache/spark","url":"https://api.github.com/repos/apache/spark"},"payload":{"push_id":536752124,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"4bb12488d56ea651c56d9688996b464b99095582","before":"fe6efacc0b865e9e827a1565877077000e63976e","commits":[{"sha":"4bb12488d56ea651c56d9688996b464b99095582","author":{"email":"291c18f3fb7528c712d9098b0e50a515ea0b91d5@cloudera.com","name":"Sean Owen"},"message":"SPARK-2757 [BUILD] [STREAMING] Add Mima test for Spark Sink after 1.10 is released\n\nRe-enable MiMa for Streaming Flume Sink module, now that 1.1.0 is released, per the JIRA TO-DO. That's pretty much all there is to this.\n\nAuthor: Sean Owen <sowen@cloudera.com>\n\nCloses #3842 from srowen/SPARK-2757 and squashes the following commits:\n\n50ff80e [Sean Owen] Exclude apparent false positive turned up by re-enabling MiMa checks for Streaming Flume Sink\n0e5ba5c [Sean Owen] Re-enable MiMa for Streaming Flume Sink module","distinct":true,"url":"https://api.github.com/repos/apache/spark/commits/4bb12488d56ea651c56d9688996b464b99095582"}]},"public":true,"created_at":"2015-01-01T01:00:02Z","org":{"id":47359,"login":"apache","gravatar_id":"","url":"https://api.github.com/orgs/apache","avatar_url":"https://avatars.githubusercontent.com/u/47359?"}}
{"id":"2489395775","type":"WatchEvent","actor":{"id":8562461,"login":"jamezb","gravatar_id":"","url":"https://api.github.com/users/jamezb","avatar_url":"https://avatars.githubusercontent.com/u/8562461?"},"repo":{"id":3073296,"name":"SirVer/ultisnips","url":"https://api.github.com/repos/SirVer/ultisnips"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:00:03Z"}
{"id":"2489395777","type":"PushEvent","actor":{"id":3471313,"login":"uygunuks","gravatar_id":"","url":"https://api.github.com/users/uygunuks","avatar_url":"https://avatars.githubusercontent.com/u/3471313?"},"repo":{"id":28677766,"name":"uygunuks/AsalSayiKalibi","url":"https://api.github.com/repos/uygunuks/AsalSayiKalibi"},"payload":{"push_id":536752126,"size":1,"distinct_size":1,"ref":"refs/heads/uygunuks","head":"0fb2391e7aabeb57f358d5d51c70c766e6fa00d1","before":"e47f1e095b582a95143e414b3d449b1105345994","commits":[{"sha":"0fb2391e7aabeb57f358d5d51c70c766e6fa00d1","author":{"email":"821f468726cd384db724fde38ddabae6642cf80c@gmail.com","name":"Uygun BODUR"},"message":".","distinct":true,"url":"https://api.github.com/repos/uygunuks/AsalSayiKalibi/commits/0fb2391e7aabeb57f358d5d51c70c766e6fa00d1"}]},"public":true,"created_at":"2015-01-01T01:00:03Z"}
{"id":"2489395778","type":"PushEvent","actor":{"id":9201970,"login":"qdm","gravatar_id":"","url":"https://api.github.com/users/qdm","avatar_url":"https://avatars.githubusercontent.com/u/9201970?"},"repo":{"id":25173910,"name":"qdm/qdm.github.io","url":"https://api.github.com/repos/qdm/qdm.github.io"},"payload":{"push_id":536752127,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"05438aee0e5572a6e4adf91d7eef32917812d9e9","before":"c68bef59c42e21a898e59516233d5968deab61ca","commits":[{"sha":"05438aee0e5572a6e4adf91d7eef32917812d9e9","author":{"email":"de163e90d3aeef9f404d1de71c48e234a211e3c3@gmail.com","name":"KT"},"message":"Update","distinct":true,"url":"https://api.github.com/repos/qdm/qdm.github.io/commits/05438aee0e5572a6e4adf91d7eef32917812d9e9"}]},"public":true,"created_at":"2015-01-01T01:00:03Z"}
{"id":"2489395780","type":"PushEvent","actor":{"id":3495129,"login":"sundaymtn","gravatar_id":"","url":"https://api.github.com/users/sundaymtn","avatar_url":"https://avatars.githubusercontent.com/u/3495129?"},"repo":{"id":24147122,"name":"sundaymtn/waterline","url":"https://api.github.com/repos/sundaymtn/waterline"},"payload":{"push_id":536752128,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"44753191dc8f615ccda4f0afe31a09342172cfe4","before":"edee9761c08f76560fba328ea671c40f132f1afe","commits":[{"sha":"44753191dc8f615ccda4f0afe31a09342172cfe4","author":{"email":"7fbc091194a9488bfb16868527a7c3a8ba469dba@gmail.com","name":"Seth Carter"},"message":"Wed Dec 31 20:00:02 EST 2014","distinct":true,"url":"https://api.github.com/repos/sundaymtn/waterline/commits/44753191dc8f615ccda4f0afe31a09342172cfe4"}]},"public":true,"created_at":"2015-01-01T01:00:04Z"}
{"id":"2489395781","type":"IssueCommentEvent","actor":{"id":383994,"login":"jonschlinkert","gravatar_id":"","url":"https://api.github.com/users/jonschlinkert","avatar_url":"https://avatars.githubusercontent.com/u/383994?"},"repo":{"id":27114957,"name":"jonschlinkert/alphabet","url":"https://api.github.com/repos/jonschlinkert/alphabet"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/jonschlinkert/alphabet/issues/1","labels_url":"https://api.github.com/repos/jonschlinkert/alphabet/issues/1/labels{/name}","comments_url":"https://api.github.com/repos/jonschlinkert/alphabet/issues/1/comments","events_url":"https://api.github.com/repos/jonschlinkert/alphabet/issues/1/events","html_url":"https://github.com/jonschlinkert/alphabet/issues/1","id":53200509,"number":1,"title":"any reason this isn't 1.0?","user":{"login":"tkellen","id":1004324,"avatar_url":"https://avatars.githubusercontent.com/u/1004324?v=3","gravatar_id":"","url":"https://api.github.com/users/tkellen","html_url":"https://github.com/tkellen","followers_url":"https://api.github.com/users/tkellen/followers","following_url":"https://api.github.com/users/tkellen/following{/other_user}","gists_url":"https://api.github.com/users/tkellen/gists{/gist_id}","starred_url":"https://api.github.com/users/tkellen/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/tkellen/subscriptions","organizations_url":"https://api.github.com/users/tkellen/orgs","repos_url":"https://api.github.com/users/tkellen/repos","events_url":"https://api.github.com/users/tkellen/events{/privacy}","received_events_url":"https://api.github.com/users/tkellen/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2014-12-31T19:50:51Z","updated_at":"2015-01-01T01:00:04Z","closed_at":"2015-01-01T01:00:04Z","body":":P"},"comment":{"url":"https://api.github.com/repos/jonschlinkert/alphabet/issues/comments/6847
7208","html_url":"https://github.com/jonschlinkert/alphabet/issues/1#issuecomment-68477208","issue_url":"https://api.github.com/repos/jonschlinkert/alphabet/issues/1","id":68477208,"user":{"login":"jonschlinkert","id":383994,"avatar_url":"https://avatars.githubusercontent.com/u/383994?v=3","gravatar_id":"","url":"https://api.github.com/users/jonschlinkert","html_url":"https://github.com/jonschlinkert","followers_url":"https://api.github.com/users/jonschlinkert/followers","following_url":"https://api.github.com/users/jonschlinkert/following{/other_user}","gists_url":"https://api.github.com/users/jonschlinkert/gists{/gist_id}","starred_url":"https://api.github.com/users/jonschlinkert/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jonschlinkert/subscriptions","organizations_url":"https://api.github.com/users/jonschlinkert/orgs","repos_url":"https://api.github.com/users/jonschlinkert/repos","events_url":"https://api.github.com/users/jonschlinkert/events{/privacy}","received_events_url":"https://api.github.com/users/jonschlinkert/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:00:04Z","updated_at":"2015-01-01T01:00:04Z","body":"done. the English alphabet is officially stable."}},"public":true,"created_at":"2015-01-01T01:00:04Z"}
{"id":"2489395782","type":"IssuesEvent","actor":{"id":383994,"login":"jonschlinkert","gravatar_id":"","url":"https://api.github.com/users/jonschlinkert","avatar_url":"https://avatars.githubusercontent.com/u/383994?"},"repo":{"id":27114957,"name":"jonschlinkert/alphabet","url":"https://api.github.com/repos/jonschlinkert/alphabet"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/jonschlinkert/alphabet/issues/1","labels_url":"https://api.github.com/repos/jonschlinkert/alphabet/issues/1/labels{/name}","comments_url":"https://api.github.com/repos/jonschlinkert/alphabet/issues/1/comments","events_url":"https://api.github.com/repos/jonschlinkert/alphabet/issues/1/events","html_url":"https://github.com/jonschlinkert/alphabet/issues/1","id":53200509,"number":1,"title":"any reason this isn't 1.0?","user":{"login":"tkellen","id":1004324,"avatar_url":"https://avatars.githubusercontent.com/u/1004324?v=3","gravatar_id":"","url":"https://api.github.com/users/tkellen","html_url":"https://github.com/tkellen","followers_url":"https://api.github.com/users/tkellen/followers","following_url":"https://api.github.com/users/tkellen/following{/other_user}","gists_url":"https://api.github.com/users/tkellen/gists{/gist_id}","starred_url":"https://api.github.com/users/tkellen/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/tkellen/subscriptions","organizations_url":"https://api.github.com/users/tkellen/orgs","repos_url":"https://api.github.com/users/tkellen/repos","events_url":"https://api.github.com/users/tkellen/events{/privacy}","received_events_url":"https://api.github.com/users/tkellen/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2014-12-31T19:50:51Z","updated_at":"2015-01-01T01:00:04Z","closed_at":"2015-01-01T01:00:04Z","body":":P"}},"public":true,"created_at":"2015-01-01T01:00:04Z"}
{"id":"2489395784","type":"PushEvent","actor":{"id":954353,"login":"byronmccollum","gravatar_id":"","url":"https://api.github.com/users/byronmccollum","avatar_url":"https://avatars.githubusercontent.com/u/954353?"},"repo":{"id":28677943,"name":"byronmccollum/html-lua","url":"https://api.github.com/repos/byronmccollum/html-lua"},"payload":{"push_id":536752130,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"4fc83167bc7fd4520a8c01e2a0cca1ae7b5f191a","before":"f2b6358fbc7c23443f40a51dea7a21aed96c3df3","commits":[{"sha":"4fc83167bc7fd4520a8c01e2a0cca1ae7b5f191a","author":{"email":"5c33cd3f0e8876e7150963b90c8e5c3e219c1462@rackspace.com","name":"Byron McCollum"},"message":"Update and rename htmlparser.lua to diff.lua","distinct":true,"url":"https://api.github.com/repos/byronmccollum/html-lua/commits/4fc83167bc7fd4520a8c01e2a0cca1ae7b5f191a"}]},"public":true,"created_at":"2015-01-01T01:00:04Z"}
{"id":"2489395786","type":"PushEvent","actor":{"id":4070158,"login":"caleb-eades","gravatar_id":"","url":"https://api.github.com/users/caleb-eades","avatar_url":"https://avatars.githubusercontent.com/u/4070158?"},"repo":{"id":20469468,"name":"caleb-eades/MinecraftServers","url":"https://api.github.com/repos/caleb-eades/MinecraftServers"},"payload":{"push_id":536752131,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"60172d1d82e6e7a353b92353ee214a4960d39023","before":"049abf23362ba353c697f1c88d54250ebd073ce1","commits":[{"sha":"60172d1d82e6e7a353b92353ee214a4960d39023","author":{"email":"5bbfe2c07a3ef0b22b72711a2edf1c023f6433c5@gmail.com","name":"caleb-eades"},"message":"Auto Snapshot Server State","distinct":true,"url":"https://api.github.com/repos/caleb-eades/MinecraftServers/commits/60172d1d82e6e7a353b92353ee214a4960d39023"}]},"public":true,"created_at":"2015-01-01T01:00:04Z"}
{"id":"2489395789","type":"PushEvent","actor":{"id":6372134,"login":"Stuntddude","gravatar_id":"","url":"https://api.github.com/users/Stuntddude","avatar_url":"https://avatars.githubusercontent.com/u/6372134?"},"repo":{"id":28654554,"name":"Stuntddude/Blockade-Runner","url":"https://api.github.com/repos/Stuntddude/Blockade-Runner"},"payload":{"push_id":536752132,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b9ec439b0ecc1f79b1b08fa5c0a2abe1f14856c9","before":"8289316476b4f01149046d43c34bb6aec0318b17","commits":[{"sha":"b9ec439b0ecc1f79b1b08fa5c0a2abe1f14856c9","author":{"email":"648fb0198c1960b14fbfb0124dd6b81f9019bc45@gmail.com","name":"Miles Fogle"},"message":"Implemented InputHandler\n\nCreated the first draft of a generic input handler in ld31.InputHandler,\nwhich is now used to handle keyboard input, and will be used to handle\nmouse input and provide options for keybindings. Moved most\ninput-handling code out of LD31.","distinct":true,"url":"https://api.github.com/repos/Stuntddude/Blockade-Runner/commits/b9ec439b0ecc1f79b1b08fa5c0a2abe1f14856c9"}]},"public":true,"created_at":"2015-01-01T01:00:06Z"}
{"id":"2489395790","type":"PullRequestReviewCommentEvent","actor":{"id":4195632,"login":"KA101","gravatar_id":"","url":"https://api.github.com/users/KA101","avatar_url":"https://avatars.githubusercontent.com/u/4195632?"},"repo":{"id":5973855,"name":"CleverRaven/Cataclysm-DDA","url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/pulls/comments/22397251","id":22397251,"diff_hunk":"@@ -469,14 +469,23 @@ std::string effect::disp_desc(bool reduced) const\n     std::vector<desc_freq> values;\n     // Add various desc_freq structs to values. If more effects wish to be placed in the descriptions this is the\n     // place to add them.\n-    values.push_back(desc_freq(get_percentage(\"PAIN\", reduced), get_avg_mod(\"PAIN\", reduced), _(\"pain\"), _(\"pain\")));\n-    values.push_back(desc_freq(get_percentage(\"HURT\", reduced), get_avg_mod(\"HURT\", reduced), _(\"damage\"), _(\"damage\")));\n-    values.push_back(desc_freq(get_percentage(\"THIRST\", reduced), get_avg_mod(\"THIRST\", reduced), _(\"thirst\"), _(\"quench\")));\n-    values.push_back(desc_freq(get_percentage(\"HUNGER\", reduced), get_avg_mod(\"HUNGER\", reduced), _(\"hunger\"), _(\"sate\")));\n-    values.push_back(desc_freq(get_percentage(\"FATIGUE\", reduced), get_avg_mod(\"FATIGUE\", reduced), _(\"fatigue\"), _(\"rest\")));\n-    values.push_back(desc_freq(get_percentage(\"COUGH\", reduced), get_avg_mod(\"COUGH\", reduced), _(\"coughing\"), _(\"coughing\")));\n-    values.push_back(desc_freq(get_percentage(\"VOMIT\", reduced), get_avg_mod(\"VOMIT\", reduced), _(\"vomiting\"), _(\"vomiting\")));\n-    values.push_back(desc_freq(get_percentage(\"SLEEP\", reduced), get_avg_mod(\"SLEEP\", reduced), _(\"blackouts\"), _(\"blackouts\")));\n+    int val = 0;\n+    val = get_avg_mod(\"PAIN\", reduced);\n+    values.push_back(desc_freq(get_percentage(\"PAIN\", val, reduced), val, _(\"pain\"), 
_(\"pain\")));","path":"src/effect.cpp","position":14,"original_position":14,"commit_id":"63238b1c8a9b7551d891f9d2595f53f43d91e776","original_commit_id":"63238b1c8a9b7551d891f9d2595f53f43d91e776","user":{"login":"KA101","id":4195632,"avatar_url":"https://avatars.githubusercontent.com/u/4195632?v=3","gravatar_id":"","url":"https://api.github.com/users/KA101","html_url":"https://github.com/KA101","followers_url":"https://api.github.com/users/KA101/followers","following_url":"https://api.github.com/users/KA101/following{/other_user}","gists_url":"https://api.github.com/users/KA101/gists{/gist_id}","starred_url":"https://api.github.com/users/KA101/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/KA101/subscriptions","organizations_url":"https://api.github.com/users/KA101/orgs","repos_url":"https://api.github.com/users/KA101/repos","events_url":"https://api.github.com/users/KA101/events{/privacy}","received_events_url":"https://api.github.com/users/KA101/received_events","type":"User","site_admin":false},"body":"Huh.  This looks like it might be workable for the mutation fix.  
I wasn't sure how best to handle that.","created_at":"2015-01-01T01:00:05Z","updated_at":"2015-01-01T01:00:05Z","html_url":"https://github.com/CleverRaven/Cataclysm-DDA/pull/10698#discussion_r22397251","pull_request_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/pulls/10698","_links":{"self":{"href":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/pulls/comments/22397251"},"html":{"href":"https://github.com/CleverRaven/Cataclysm-DDA/pull/10698#discussion_r22397251"},"pull_request":{"href":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/pulls/10698"}}},"pull_request":{"url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/pulls/10698","id":26739248,"html_url":"https://github.com/CleverRaven/Cataclysm-DDA/pull/10698","diff_url":"https://github.com/CleverRaven/Cataclysm-DDA/pull/10698.diff","patch_url":"https://github.com/CleverRaven/Cataclysm-DDA/pull/10698.patch","issue_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/issues/10698","number":10698,"state":"open","locked":false,"title":"Fix effect triggering","user":{"login":"i2amroy","id":4275617,"avatar_url":"https://avatars.githubusercontent.com/u/4275617?v=3","gravatar_id":"","url":"https://api.github.com/users/i2amroy","html_url":"https://github.com/i2amroy","followers_url":"https://api.github.com/users/i2amroy/followers","following_url":"https://api.github.com/users/i2amroy/following{/other_user}","gists_url":"https://api.github.com/users/i2amroy/gists{/gist_id}","starred_url":"https://api.github.com/users/i2amroy/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/i2amroy/subscriptions","organizations_url":"https://api.github.com/users/i2amroy/orgs","repos_url":"https://api.github.com/users/i2amroy/repos","events_url":"https://api.github.com/users/i2amroy/events{/privacy}","received_events_url":"https://api.github.com/users/i2amroy/received_events","type":"User","site_admin":false},"body":"Fixes some <= 0 confusion stuff and makes having a 
nonzero addition value properly override having a default (0) chance to trigger.\r\n\r\nFixes #10617","created_at":"2015-01-01T00:42:50Z","updated_at":"2015-01-01T01:00:05Z","closed_at":null,"merged_at":null,"merge_commit_sha":"88ebf4a7e6d454d6b8bd6757a0bab31855a9ea1d","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/pulls/10698/commits","review_comments_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/pulls/10698/comments","review_comment_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/pulls/comments/{number}","comments_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/issues/10698/comments","statuses_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/statuses/63238b1c8a9b7551d891f9d2595f53f43d91e776","head":{"label":"i2amroy:PKILL","ref":"PKILL","sha":"63238b1c8a9b7551d891f9d2595f53f43d91e776","user":{"login":"i2amroy","id":4275617,"avatar_url":"https://avatars.githubusercontent.com/u/4275617?v=3","gravatar_id":"","url":"https://api.github.com/users/i2amroy","html_url":"https://github.com/i2amroy","followers_url":"https://api.github.com/users/i2amroy/followers","following_url":"https://api.github.com/users/i2amroy/following{/other_user}","gists_url":"https://api.github.com/users/i2amroy/gists{/gist_id}","starred_url":"https://api.github.com/users/i2amroy/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/i2amroy/subscriptions","organizations_url":"https://api.github.com/users/i2amroy/orgs","repos_url":"https://api.github.com/users/i2amroy/repos","events_url":"https://api.github.com/users/i2amroy/events{/privacy}","received_events_url":"https://api.github.com/users/i2amroy/received_events","type":"User","site_admin":false},"repo":{"id":9722704,"name":"Cataclysm-DDA","full_name":"i2amroy/Cataclysm-DDA","owner":{"login":"i2amroy","id":4275617,"avatar_url":"https://avatars.githubusercontent.com/u/4275617?v=3","gravatar_id":"","url":"https://api.gi
thub.com/users/i2amroy","html_url":"https://github.com/i2amroy","followers_url":"https://api.github.com/users/i2amroy/followers","following_url":"https://api.github.com/users/i2amroy/following{/other_user}","gists_url":"https://api.github.com/users/i2amroy/gists{/gist_id}","starred_url":"https://api.github.com/users/i2amroy/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/i2amroy/subscriptions","organizations_url":"https://api.github.com/users/i2amroy/orgs","repos_url":"https://api.github.com/users/i2amroy/repos","events_url":"https://api.github.com/users/i2amroy/events{/privacy}","received_events_url":"https://api.github.com/users/i2amroy/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/i2amroy/Cataclysm-DDA","description":"Cataclysm - Dark Days Ahead. A fork/variant of Cataclysm Roguelike by Whales.","fork":true,"url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA","forks_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/forks","keys_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/keys{/key_id}","collaborators_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/teams","hooks_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/hooks","issue_events_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/issues/events{/number}","events_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/events","assignees_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/assignees{/user}","branches_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/branches{/branch}","tags_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/tags","blobs_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/git/refs
{/sha}","trees_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/git/trees{/sha}","statuses_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/statuses/{sha}","languages_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/languages","stargazers_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/stargazers","contributors_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/contributors","subscribers_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/subscribers","subscription_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/subscription","commits_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/commits{/sha}","git_commits_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/git/commits{/sha}","comments_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/comments{/number}","issue_comment_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/issues/comments/{number}","contents_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/contents/{+path}","compare_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/compare/{base}...{head}","merges_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/merges","archive_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/downloads","issues_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/issues{/number}","pulls_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/pulls{/number}","milestones_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/milestones{/number}","notifications_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/labels{/name}","releases_url":"https://api.github.com/repos/i2amroy/Cataclysm-DDA/releases{/id}","created_at":"2013-04-27T23:43:26Z","updated_at":"2014-12-31T21:47:23Z","pushed_at":"2015-01-01T00:39:41Z","git_url"
:"git://github.com/i2amroy/Cataclysm-DDA.git","ssh_url":"git@github.com:i2amroy/Cataclysm-DDA.git","clone_url":"https://github.com/i2amroy/Cataclysm-DDA.git","svn_url":"https://github.com/i2amroy/Cataclysm-DDA","homepage":"http://www.cataclysm.glyphgryph.com/","size":324783,"stargazers_count":0,"watchers_count":0,"language":"C++","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"CleverRaven:master","ref":"master","sha":"ddef397944dacbc1a57f0fb4900f3f3cf9a2045a","user":{"login":"CleverRaven","id":4367009,"avatar_url":"https://avatars.githubusercontent.com/u/4367009?v=3","gravatar_id":"","url":"https://api.github.com/users/CleverRaven","html_url":"https://github.com/CleverRaven","followers_url":"https://api.github.com/users/CleverRaven/followers","following_url":"https://api.github.com/users/CleverRaven/following{/other_user}","gists_url":"https://api.github.com/users/CleverRaven/gists{/gist_id}","starred_url":"https://api.github.com/users/CleverRaven/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/CleverRaven/subscriptions","organizations_url":"https://api.github.com/users/CleverRaven/orgs","repos_url":"https://api.github.com/users/CleverRaven/repos","events_url":"https://api.github.com/users/CleverRaven/events{/privacy}","received_events_url":"https://api.github.com/users/CleverRaven/received_events","type":"Organization","site_admin":false},"repo":{"id":5973855,"name":"Cataclysm-DDA","full_name":"CleverRaven/Cataclysm-DDA","owner":{"login":"CleverRaven","id":4367009,"avatar_url":"https://avatars.githubusercontent.com/u/4367009?v=3","gravatar_id":"","url":"https://api.github.com/users/CleverRaven","html_url":"https://github.com/CleverRaven","followers_url":"https://api.github.com/users/CleverRaven/followers","following_url":"https://api.github.com/users/CleverRaven/following{/oth
er_user}","gists_url":"https://api.github.com/users/CleverRaven/gists{/gist_id}","starred_url":"https://api.github.com/users/CleverRaven/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/CleverRaven/subscriptions","organizations_url":"https://api.github.com/users/CleverRaven/orgs","repos_url":"https://api.github.com/users/CleverRaven/repos","events_url":"https://api.github.com/users/CleverRaven/events{/privacy}","received_events_url":"https://api.github.com/users/CleverRaven/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/CleverRaven/Cataclysm-DDA","description":"Cataclysm - Dark Days Ahead. A fork/variant of Cataclysm Roguelike by Whales.","fork":false,"url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA","forks_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/forks","keys_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/keys{/key_id}","collaborators_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/teams","hooks_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/hooks","issue_events_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/issues/events{/number}","events_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/events","assignees_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/assignees{/user}","branches_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/branches{/branch}","tags_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/tags","blobs_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/git/refs{/sha}","trees_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/git/trees{/sha}","status
es_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/statuses/{sha}","languages_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/languages","stargazers_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/stargazers","contributors_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/contributors","subscribers_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/subscribers","subscription_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/subscription","commits_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/commits{/sha}","git_commits_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/git/commits{/sha}","comments_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/comments{/number}","issue_comment_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/issues/comments/{number}","contents_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/contents/{+path}","compare_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/compare/{base}...{head}","merges_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/merges","archive_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/downloads","issues_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/issues{/number}","pulls_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/pulls{/number}","milestones_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/milestones{/number}","notifications_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/labels{/name}","releases_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/releases{/id}","created_at":"2012-09-26T22:57:43Z","updated_at":"2014-12-31T07:31:31Z","pushed_at":"2014-12-31T07:31:30Z","git_url":"git://gith
ub.com/CleverRaven/Cataclysm-DDA.git","ssh_url":"git@github.com:CleverRaven/Cataclysm-DDA.git","clone_url":"https://github.com/CleverRaven/Cataclysm-DDA.git","svn_url":"https://github.com/CleverRaven/Cataclysm-DDA","homepage":"http://en.cataclysmdda.com/","size":400119,"stargazers_count":556,"watchers_count":556,"language":"C++","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":619,"mirror_url":null,"open_issues_count":774,"forks":619,"open_issues":774,"watchers":556,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/pulls/10698"},"html":{"href":"https://github.com/CleverRaven/Cataclysm-DDA/pull/10698"},"issue":{"href":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/issues/10698"},"comments":{"href":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/issues/10698/comments"},"review_comments":{"href":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/pulls/10698/comments"},"review_comment":{"href":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/pulls/10698/commits"},"statuses":{"href":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/statuses/63238b1c8a9b7551d891f9d2595f53f43d91e776"}}}},"public":true,"created_at":"2015-01-01T01:00:05Z","org":{"id":4367009,"login":"CleverRaven","gravatar_id":"","url":"https://api.github.com/orgs/CleverRaven","avatar_url":"https://avatars.githubusercontent.com/u/4367009?"}}
{"id":"2489395794","type":"CreateEvent","actor":{"id":5762348,"login":"JasonYang96","gravatar_id":"","url":"https://api.github.com/users/JasonYang96","avatar_url":"https://avatars.githubusercontent.com/u/5762348?"},"repo":{"id":28678050,"name":"JasonYang96/Leet-Code-OJ","url":"https://api.github.com/repos/JasonYang96/Leet-Code-OJ"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"Solutions to Problems found at https://oj.leetcode.com/problems/","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:00:06Z"}
{"id":"2489395795","type":"WatchEvent","actor":{"id":119853,"login":"mcddx330","gravatar_id":"","url":"https://api.github.com/users/mcddx330","avatar_url":"https://avatars.githubusercontent.com/u/119853?"},"repo":{"id":8257106,"name":"jessesquires/JSQMessagesViewController","url":"https://api.github.com/repos/jessesquires/JSQMessagesViewController"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:00:06Z"}
{"id":"2489395796","type":"ForkEvent","actor":{"id":8518239,"login":"gitter-badger","gravatar_id":"","url":"https://api.github.com/users/gitter-badger","avatar_url":"https://avatars.githubusercontent.com/u/8518239?"},"repo":{"id":8540783,"name":"russmatney/dotfiles","url":"https://api.github.com/repos/russmatney/dotfiles"},"payload":{"forkee":{"id":28678212,"name":"dotfiles-15","full_name":"gitter-badger/dotfiles-15","owner":{"login":"gitter-badger","id":8518239,"avatar_url":"https://avatars.githubusercontent.com/u/8518239?v=3","gravatar_id":"","url":"https://api.github.com/users/gitter-badger","html_url":"https://github.com/gitter-badger","followers_url":"https://api.github.com/users/gitter-badger/followers","following_url":"https://api.github.com/users/gitter-badger/following{/other_user}","gists_url":"https://api.github.com/users/gitter-badger/gists{/gist_id}","starred_url":"https://api.github.com/users/gitter-badger/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/gitter-badger/subscriptions","organizations_url":"https://api.github.com/users/gitter-badger/orgs","repos_url":"https://api.github.com/users/gitter-badger/repos","events_url":"https://api.github.com/users/gitter-badger/events{/privacy}","received_events_url":"https://api.github.com/users/gitter-badger/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/gitter-badger/dotfiles-15","description":"","fork":true,"url":"https://api.github.com/repos/gitter-badger/dotfiles-15","forks_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/forks","keys_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/keys{/key_id}","collaborators_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/teams","hooks_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/hooks","issue_events_url":"https://api.github.com/repos/gitter-bad
ger/dotfiles-15/issues/events{/number}","events_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/events","assignees_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/assignees{/user}","branches_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/branches{/branch}","tags_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/tags","blobs_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/git/refs{/sha}","trees_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/git/trees{/sha}","statuses_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/statuses/{sha}","languages_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/languages","stargazers_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/stargazers","contributors_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/contributors","subscribers_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/subscribers","subscription_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/subscription","commits_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/commits{/sha}","git_commits_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/git/commits{/sha}","comments_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/comments{/number}","issue_comment_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/issues/comments/{number}","contents_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/contents/{+path}","compare_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/compare/{base}...{head}","merges_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/merges","archive_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/{archive_format}{/ref}","downloads_url":"https://api.github.com/r
epos/gitter-badger/dotfiles-15/downloads","issues_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/issues{/number}","pulls_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/pulls{/number}","milestones_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/milestones{/number}","notifications_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/labels{/name}","releases_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/releases{/id}","created_at":"2015-01-01T01:00:07Z","updated_at":"2014-12-30T19:07:15Z","pushed_at":"2014-12-30T19:07:15Z","git_url":"git://github.com/gitter-badger/dotfiles-15.git","ssh_url":"git@github.com:gitter-badger/dotfiles-15.git","clone_url":"https://github.com/gitter-badger/dotfiles-15.git","svn_url":"https://github.com/gitter-badger/dotfiles-15","homepage":"","size":620,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:00:08Z"}
{"id":"2489395797","type":"PullRequestEvent","actor":{"id":1235097,"login":"rmarinho","gravatar_id":"","url":"https://api.github.com/users/rmarinho","avatar_url":"https://avatars.githubusercontent.com/u/1235097?"},"repo":{"id":20463939,"name":"XLabs/Xamarin-Forms-Labs","url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs"},"payload":{"action":"closed","number":533,"pull_request":{"url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/pulls/533","id":26426443,"html_url":"https://github.com/XLabs/Xamarin-Forms-Labs/pull/533","diff_url":"https://github.com/XLabs/Xamarin-Forms-Labs/pull/533.diff","patch_url":"https://github.com/XLabs/Xamarin-Forms-Labs/pull/533.patch","issue_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/533","number":533,"state":"closed","locked":false,"title":"android & ios screenshots","user":{"login":"jguertl","id":7988662,"avatar_url":"https://avatars.githubusercontent.com/u/7988662?v=3","gravatar_id":"","url":"https://api.github.com/users/jguertl","html_url":"https://github.com/jguertl","followers_url":"https://api.github.com/users/jguertl/followers","following_url":"https://api.github.com/users/jguertl/following{/other_user}","gists_url":"https://api.github.com/users/jguertl/gists{/gist_id}","starred_url":"https://api.github.com/users/jguertl/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jguertl/subscriptions","organizations_url":"https://api.github.com/users/jguertl/orgs","repos_url":"https://api.github.com/users/jguertl/repos","events_url":"https://api.github.com/users/jguertl/events{/privacy}","received_events_url":"https://api.github.com/users/jguertl/received_events","type":"User","site_admin":false},"body":"","created_at":"2014-12-21T10:31:17Z","updated_at":"2015-01-01T01:00:07Z","closed_at":"2015-01-01T01:00:07Z","merged_at":"2015-01-01T01:00:07Z","merge_commit_sha":"f60ed691a53c54c0e9f7254f072dc92a46d2652d","assignee":null,"milestone":null,"commits_url":"https://api.github.com/
repos/XLabs/Xamarin-Forms-Labs/pulls/533/commits","review_comments_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/pulls/533/comments","review_comment_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/pulls/comments/{number}","comments_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/533/comments","statuses_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/statuses/1fb29e8b83f96badb55e4dfecc19392f498df57a","head":{"label":"jguertl:master","ref":"master","sha":"1fb29e8b83f96badb55e4dfecc19392f498df57a","user":{"login":"jguertl","id":7988662,"avatar_url":"https://avatars.githubusercontent.com/u/7988662?v=3","gravatar_id":"","url":"https://api.github.com/users/jguertl","html_url":"https://github.com/jguertl","followers_url":"https://api.github.com/users/jguertl/followers","following_url":"https://api.github.com/users/jguertl/following{/other_user}","gists_url":"https://api.github.com/users/jguertl/gists{/gist_id}","starred_url":"https://api.github.com/users/jguertl/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jguertl/subscriptions","organizations_url":"https://api.github.com/users/jguertl/orgs","repos_url":"https://api.github.com/users/jguertl/repos","events_url":"https://api.github.com/users/jguertl/events{/privacy}","received_events_url":"https://api.github.com/users/jguertl/received_events","type":"User","site_admin":false},"repo":{"id":28277803,"name":"Xamarin-Forms-Labs","full_name":"jguertl/Xamarin-Forms-Labs","owner":{"login":"jguertl","id":7988662,"avatar_url":"https://avatars.githubusercontent.com/u/7988662?v=3","gravatar_id":"","url":"https://api.github.com/users/jguertl","html_url":"https://github.com/jguertl","followers_url":"https://api.github.com/users/jguertl/followers","following_url":"https://api.github.com/users/jguertl/following{/other_user}","gists_url":"https://api.github.com/users/jguertl/gists{/gist_id}","starred_url":"https://api.github.com/users/jguertl/starred{/owne
r}{/repo}","subscriptions_url":"https://api.github.com/users/jguertl/subscriptions","organizations_url":"https://api.github.com/users/jguertl/orgs","repos_url":"https://api.github.com/users/jguertl/repos","events_url":"https://api.github.com/users/jguertl/events{/privacy}","received_events_url":"https://api.github.com/users/jguertl/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/jguertl/Xamarin-Forms-Labs","description":"Xamarin Forms Labs is a open source project that aims to provide a powerful and cross platform set of controls and helpers tailored to work with Xamarin Forms.","fork":true,"url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs","forks_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/forks","keys_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/keys{/key_id}","collaborators_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/teams","hooks_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/hooks","issue_events_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/issues/events{/number}","events_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/events","assignees_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/assignees{/user}","branches_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/branches{/branch}","tags_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/tags","blobs_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/git/refs{/sha}","trees_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/git/trees{/sha}","statuses_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/statuses/{sha}",
"languages_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/languages","stargazers_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/stargazers","contributors_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/contributors","subscribers_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/subscribers","subscription_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/subscription","commits_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/commits{/sha}","git_commits_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/git/commits{/sha}","comments_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/comments{/number}","issue_comment_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/issues/comments/{number}","contents_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/contents/{+path}","compare_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/compare/{base}...{head}","merges_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/merges","archive_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/downloads","issues_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/issues{/number}","pulls_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/pulls{/number}","milestones_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/milestones{/number}","notifications_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/labels{/name}","releases_url":"https://api.github.com/repos/jguertl/Xamarin-Forms-Labs/releases{/id}","created_at":"2014-12-20T20:17:25Z","updated_at":"2014-12-21T10:30:08Z","pushed_at":"2014-12-21T10:30:08Z","git_url":"git://github.com/jguertl/Xamarin-Forms-Labs.git","ssh_url":"git@github
.com:jguertl/Xamarin-Forms-Labs.git","clone_url":"https://github.com/jguertl/Xamarin-Forms-Labs.git","svn_url":"https://github.com/jguertl/Xamarin-Forms-Labs","homepage":"","size":96864,"stargazers_count":0,"watchers_count":0,"language":"C#","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"XLabs:master","ref":"master","sha":"6906dd38ff69debcc304cb05b6877fae71747acd","user":{"login":"XLabs","id":7787062,"avatar_url":"https://avatars.githubusercontent.com/u/7787062?v=3","gravatar_id":"","url":"https://api.github.com/users/XLabs","html_url":"https://github.com/XLabs","followers_url":"https://api.github.com/users/XLabs/followers","following_url":"https://api.github.com/users/XLabs/following{/other_user}","gists_url":"https://api.github.com/users/XLabs/gists{/gist_id}","starred_url":"https://api.github.com/users/XLabs/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/XLabs/subscriptions","organizations_url":"https://api.github.com/users/XLabs/orgs","repos_url":"https://api.github.com/users/XLabs/repos","events_url":"https://api.github.com/users/XLabs/events{/privacy}","received_events_url":"https://api.github.com/users/XLabs/received_events","type":"Organization","site_admin":false},"repo":{"id":20463939,"name":"Xamarin-Forms-Labs","full_name":"XLabs/Xamarin-Forms-Labs","owner":{"login":"XLabs","id":7787062,"avatar_url":"https://avatars.githubusercontent.com/u/7787062?v=3","gravatar_id":"","url":"https://api.github.com/users/XLabs","html_url":"https://github.com/XLabs","followers_url":"https://api.github.com/users/XLabs/followers","following_url":"https://api.github.com/users/XLabs/following{/other_user}","gists_url":"https://api.github.com/users/XLabs/gists{/gist_id}","starred_url":"https://api.github.com/users/XLabs/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/u
sers/XLabs/subscriptions","organizations_url":"https://api.github.com/users/XLabs/orgs","repos_url":"https://api.github.com/users/XLabs/repos","events_url":"https://api.github.com/users/XLabs/events{/privacy}","received_events_url":"https://api.github.com/users/XLabs/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/XLabs/Xamarin-Forms-Labs","description":"Xamarin Forms Labs is a open source project that aims to provide a powerful and cross platform set of controls and helpers tailored to work with Xamarin Forms.","fork":false,"url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs","forks_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/forks","keys_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/keys{/key_id}","collaborators_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/teams","hooks_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/hooks","issue_events_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/events{/number}","events_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/events","assignees_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/assignees{/user}","branches_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/branches{/branch}","tags_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/tags","blobs_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/git/refs{/sha}","trees_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/git/trees{/sha}","statuses_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/statuses/{sha}","languages_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/languages","stargaze
rs_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/stargazers","contributors_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/contributors","subscribers_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/subscribers","subscription_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/subscription","commits_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/commits{/sha}","git_commits_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/git/commits{/sha}","comments_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/comments{/number}","issue_comment_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/comments/{number}","contents_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/contents/{+path}","compare_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/compare/{base}...{head}","merges_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/merges","archive_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/downloads","issues_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues{/number}","pulls_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/pulls{/number}","milestones_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/milestones{/number}","notifications_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/labels{/name}","releases_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/releases{/id}","created_at":"2014-06-03T23:53:11Z","updated_at":"2015-01-01T00:59:13Z","pushed_at":"2015-01-01T01:00:07Z","git_url":"git://github.com/XLabs/Xamarin-Forms-Labs.git","ssh_url":"git@github.com:XLabs/Xamarin-Forms-Labs.git","clone_url":"https://github.com/XLabs/Xamarin-Forms-Labs.git","svn_url":"https://github.com/XLabs/
Xamarin-Forms-Labs","homepage":"","size":104805,"stargazers_count":340,"watchers_count":340,"language":"C#","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":210,"mirror_url":null,"open_issues_count":91,"forks":210,"open_issues":91,"watchers":340,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/pulls/533"},"html":{"href":"https://github.com/XLabs/Xamarin-Forms-Labs/pull/533"},"issue":{"href":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/533"},"comments":{"href":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/533/comments"},"review_comments":{"href":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/pulls/533/comments"},"review_comment":{"href":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/pulls/533/commits"},"statuses":{"href":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/statuses/1fb29e8b83f96badb55e4dfecc19392f498df57a"}},"merged":true,"mergeable":null,"mergeable_state":"unknown","merged_by":{"login":"rmarinho","id":1235097,"avatar_url":"https://avatars.githubusercontent.com/u/1235097?v=3","gravatar_id":"","url":"https://api.github.com/users/rmarinho","html_url":"https://github.com/rmarinho","followers_url":"https://api.github.com/users/rmarinho/followers","following_url":"https://api.github.com/users/rmarinho/following{/other_user}","gists_url":"https://api.github.com/users/rmarinho/gists{/gist_id}","starred_url":"https://api.github.com/users/rmarinho/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/rmarinho/subscriptions","organizations_url":"https://api.github.com/users/rmarinho/orgs","repos_url":"https://api.github.com/users/rmarinho/repos","events_url":"https://api.github.com/users/rmarinho/events{/privacy}","received_events_url":"https://api.github.com/users/rmarinho/received_events","type":"
User","site_admin":false},"comments":1,"review_comments":0,"commits":1,"additions":0,"deletions":0,"changed_files":9}},"public":true,"created_at":"2015-01-01T01:00:08Z","org":{"id":7787062,"login":"XLabs","gravatar_id":"","url":"https://api.github.com/orgs/XLabs","avatar_url":"https://avatars.githubusercontent.com/u/7787062?"}}
{"id":"2489395801","type":"PushEvent","actor":{"id":1235097,"login":"rmarinho","gravatar_id":"","url":"https://api.github.com/users/rmarinho","avatar_url":"https://avatars.githubusercontent.com/u/1235097?"},"repo":{"id":20463939,"name":"XLabs/Xamarin-Forms-Labs","url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs"},"payload":{"push_id":536752137,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"5b5d95052d67e79b27788b0e498ec6a9e240046e","before":"4db7138d78546f01b9782f8b1fcfe4fb27e861b6","commits":[{"sha":"1fb29e8b83f96badb55e4dfecc19392f498df57a","author":{"email":"9191838847179d50d9ec96fb4d4274d728e70c57@me.com","name":"Jakob Gürtl"},"message":"android & ios screenshots","distinct":true,"url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/commits/1fb29e8b83f96badb55e4dfecc19392f498df57a"},{"sha":"5b5d95052d67e79b27788b0e498ec6a9e240046e","author":{"email":"b1c1d8736f20db3fb6c1c66bb1455ed43909f0d8@ruimarinho.net","name":"Rui Marinho"},"message":"Merge pull request #533 from jguertl/master\n\nandroid & ios screenshots","distinct":true,"url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/commits/5b5d95052d67e79b27788b0e498ec6a9e240046e"}]},"public":true,"created_at":"2015-01-01T01:00:08Z","org":{"id":7787062,"login":"XLabs","gravatar_id":"","url":"https://api.github.com/orgs/XLabs","avatar_url":"https://avatars.githubusercontent.com/u/7787062?"}}
{"id":"2489395802","type":"PushEvent","actor":{"id":926454,"login":"lukeis","gravatar_id":"","url":"https://api.github.com/users/lukeis","avatar_url":"https://avatars.githubusercontent.com/u/926454?"},"repo":{"id":9457897,"name":"SeleniumHQ/irc-logs","url":"https://api.github.com/repos/SeleniumHQ/irc-logs"},"payload":{"push_id":536752139,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d8aa1d441301788eeacffb3408616863637fecd8","before":"50c406047545cdb0be48743b4de97620f1ce5f48","commits":[{"sha":"d8aa1d441301788eeacffb3408616863637fecd8","author":{"email":"c7f2353e77fbd59227c091422ca81210965ba01d","name":"selloggingbot"},"message":"updating logs","distinct":true,"url":"https://api.github.com/repos/SeleniumHQ/irc-logs/commits/d8aa1d441301788eeacffb3408616863637fecd8"}]},"public":true,"created_at":"2015-01-01T01:00:08Z","org":{"id":983927,"login":"SeleniumHQ","gravatar_id":"","url":"https://api.github.com/orgs/SeleniumHQ","avatar_url":"https://avatars.githubusercontent.com/u/983927?"}}
{"id":"2489395805","type":"WatchEvent","actor":{"id":1390347,"login":"Addvilz","gravatar_id":"","url":"https://api.github.com/users/Addvilz","avatar_url":"https://avatars.githubusercontent.com/u/1390347?"},"repo":{"id":23615534,"name":"DanielGorlo/ISIS.js","url":"https://api.github.com/repos/DanielGorlo/ISIS.js"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:00:08Z"}
{"id":"2489395808","type":"PushEvent","actor":{"id":1844764,"login":"ianblenke","gravatar_id":"","url":"https://api.github.com/users/ianblenke","avatar_url":"https://avatars.githubusercontent.com/u/1844764?"},"repo":{"id":28671505,"name":"ianblenke/docker-packetbeat-agent","url":"https://api.github.com/repos/ianblenke/docker-packetbeat-agent"},"payload":{"push_id":536752144,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"80ef4b415c08ccaaa009bfb07b807a3fc8864454","before":"8d67307dd90527ef7771a0304d5469a5387271b1","commits":[{"sha":"80ef4b415c08ccaaa009bfb07b807a3fc8864454","author":{"email":"57a33a5496950fec8433e4dd83347673459dcdfc@blenke.com","name":"Ian Blenke"},"message":"snaplen is an integer, not a string","distinct":true,"url":"https://api.github.com/repos/ianblenke/docker-packetbeat-agent/commits/80ef4b415c08ccaaa009bfb07b807a3fc8864454"}]},"public":true,"created_at":"2015-01-01T01:00:08Z"}
{"id":"2489395809","type":"PushEvent","actor":{"id":1221156,"login":"fyfe","gravatar_id":"","url":"https://api.github.com/users/fyfe","avatar_url":"https://avatars.githubusercontent.com/u/1221156?"},"repo":{"id":28673837,"name":"fyfe/git-test","url":"https://api.github.com/repos/fyfe/git-test"},"payload":{"push_id":536752143,"size":0,"distinct_size":0,"ref":"refs/heads/develop","head":"4a252ca6b0d37d0714710d57ba524ff0601806df","before":"279e85c74e9a85941ce223bd8a8f3ac37fa891fc","commits":[]},"public":true,"created_at":"2015-01-01T01:00:08Z"}
{"id":"2489395811","type":"PushEvent","actor":{"id":7727148,"login":"ThadHouse","gravatar_id":"","url":"https://api.github.com/users/ThadHouse","avatar_url":"https://avatars.githubusercontent.com/u/7727148?"},"repo":{"id":26708360,"name":"ThadHouse/SplineGenerator","url":"https://api.github.com/repos/ThadHouse/SplineGenerator"},"payload":{"push_id":536752145,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"3a313300b8a8694a20be00b74b25763b015f3549","before":"a2b94fbe206b40060f076c185ef431200083aaf4","commits":[{"sha":"3a313300b8a8694a20be00b74b25763b015f3549","author":{"email":"ba841f95fa6d615b6e0ccbf97085c32d1f18fdef@users.noreply.github.com","name":"ThadHouse"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/ThadHouse/SplineGenerator/commits/3a313300b8a8694a20be00b74b25763b015f3549"}]},"public":true,"created_at":"2015-01-01T01:00:08Z"}
{"id":"2489395812","type":"PushEvent","actor":{"id":6158630,"login":"greatfire","gravatar_id":"","url":"https://api.github.com/users/greatfire","avatar_url":"https://avatars.githubusercontent.com/u/6158630?"},"repo":{"id":18126008,"name":"greatfire/z","url":"https://api.github.com/repos/greatfire/z"},"payload":{"push_id":536752146,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1c095ccf0c45826798d494d477eef16082e2919f","before":"0fae830fbc8591e9b4e3faf0794a1b73c460f9e6","commits":[{"sha":"1c095ccf0c45826798d494d477eef16082e2919f","author":{"email":"24bf68e341ce0fbd9259a5d51feed79682ea4eba@greatfire.org","name":"Ubuntu"},"message":"a","distinct":true,"url":"https://api.github.com/repos/greatfire/z/commits/1c095ccf0c45826798d494d477eef16082e2919f"}]},"public":true,"created_at":"2015-01-01T01:00:09Z"}
{"id":"2489395813","type":"CreateEvent","actor":{"id":8518239,"login":"gitter-badger","gravatar_id":"","url":"https://api.github.com/users/gitter-badger","avatar_url":"https://avatars.githubusercontent.com/u/8518239?"},"repo":{"id":28678212,"name":"gitter-badger/dotfiles-15","url":"https://api.github.com/repos/gitter-badger/dotfiles-15"},"payload":{"ref":"gitter-badge","ref_type":"branch","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:00:09Z"}
{"id":"2489395822","type":"PushEvent","actor":{"id":8518239,"login":"gitter-badger","gravatar_id":"","url":"https://api.github.com/users/gitter-badger","avatar_url":"https://avatars.githubusercontent.com/u/8518239?"},"repo":{"id":28678212,"name":"gitter-badger/dotfiles-15","url":"https://api.github.com/repos/gitter-badger/dotfiles-15"},"payload":{"push_id":536752152,"size":1,"distinct_size":1,"ref":"refs/heads/gitter-badge","head":"e4f636ddb08f1811808e3f872a7a323aa80c8a7b","before":"7ca425b3dc133cd625f3f2e2e014ebee508eb39d","commits":[{"sha":"e4f636ddb08f1811808e3f872a7a323aa80c8a7b","author":{"email":"4e199b4a1c40b497a95fcd1cd896351733849949@gitter.im","name":"The Gitter Badger"},"message":"Added Gitter badge","distinct":true,"url":"https://api.github.com/repos/gitter-badger/dotfiles-15/commits/e4f636ddb08f1811808e3f872a7a323aa80c8a7b"}]},"public":true,"created_at":"2015-01-01T01:00:10Z"}
{"id":"2489395823","type":"IssueCommentEvent","actor":{"id":2068437,"login":"ahaurw01","gravatar_id":"","url":"https://api.github.com/users/ahaurw01","avatar_url":"https://avatars.githubusercontent.com/u/2068437?"},"repo":{"id":18271693,"name":"ahaurw01/gulp-remember","url":"https://api.github.com/repos/ahaurw01/gulp-remember"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/ahaurw01/gulp-remember/issues/13","labels_url":"https://api.github.com/repos/ahaurw01/gulp-remember/issues/13/labels{/name}","comments_url":"https://api.github.com/repos/ahaurw01/gulp-remember/issues/13/comments","events_url":"https://api.github.com/repos/ahaurw01/gulp-remember/issues/13/events","html_url":"https://github.com/ahaurw01/gulp-remember/pull/13","id":53012936,"number":13,"title":"Handle file's history","user":{"login":"efolio","id":2078815,"avatar_url":"https://avatars.githubusercontent.com/u/2078815?v=3","gravatar_id":"","url":"https://api.github.com/users/efolio","html_url":"https://github.com/efolio","followers_url":"https://api.github.com/users/efolio/followers","following_url":"https://api.github.com/users/efolio/following{/other_user}","gists_url":"https://api.github.com/users/efolio/gists{/gist_id}","starred_url":"https://api.github.com/users/efolio/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/efolio/subscriptions","organizations_url":"https://api.github.com/users/efolio/orgs","repos_url":"https://api.github.com/users/efolio/repos","events_url":"https://api.github.com/users/efolio/events{/privacy}","received_events_url":"https://api.github.com/users/efolio/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":11,"created_at":"2014-12-28T23:47:50Z","updated_at":"2015-01-01T01:00:09Z","closed_at":"2015-01-01T01:00:09Z","pull_request":{"url":"https://api.github.com/repos/ahaurw01/gulp-remember/pulls/13","html_url":"https://github.com/ahaurw0
1/gulp-remember/pull/13","diff_url":"https://github.com/ahaurw01/gulp-remember/pull/13.diff","patch_url":"https://github.com/ahaurw01/gulp-remember/pull/13.patch"},"body":"Mostly add a `forgetUsingHistory` method in order to tackle the need to forget files using the original filename instead of the processed filename.\r\n\r\nI'll be glad to tweak this PR anyway you want.\r\n\r\nThanks a lot,"},"comment":{"url":"https://api.github.com/repos/ahaurw01/gulp-remember/issues/comments/68477210","html_url":"https://github.com/ahaurw01/gulp-remember/pull/13#issuecomment-68477210","issue_url":"https://api.github.com/repos/ahaurw01/gulp-remember/issues/13","id":68477210,"user":{"login":"ahaurw01","id":2068437,"avatar_url":"https://avatars.githubusercontent.com/u/2068437?v=3","gravatar_id":"","url":"https://api.github.com/users/ahaurw01","html_url":"https://github.com/ahaurw01","followers_url":"https://api.github.com/users/ahaurw01/followers","following_url":"https://api.github.com/users/ahaurw01/following{/other_user}","gists_url":"https://api.github.com/users/ahaurw01/gists{/gist_id}","starred_url":"https://api.github.com/users/ahaurw01/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ahaurw01/subscriptions","organizations_url":"https://api.github.com/users/ahaurw01/orgs","repos_url":"https://api.github.com/users/ahaurw01/repos","events_url":"https://api.github.com/users/ahaurw01/events{/privacy}","received_events_url":"https://api.github.com/users/ahaurw01/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:00:09Z","updated_at":"2015-01-01T01:00:09Z","body":"@efolio @qraynaud \r\nI'm not comfortable adding this feature as it nearly doubles the complexity of this plugin while solving (to me) a seemingly orthogonal problem. And opening the door to tweaking and expanding this feature in the future to better solve use cases that are slightly different from yours is not attractive to me either. 
\r\n\r\nI believe that the beauty of gulp plugins is that they are simple, unopinionated, imperative, and get incorporated into the workflow of your own code. Grunt, for example, encourages API creep within its plugins because they are used declaratively; they are simply configured. Gulp allows you to take micro-helpers and mix and match them in ways that conform to really specific workflow needs. If a gulp plugin begins to make assumptions about workflow, it has the opportunity for a quick expansion of complexity and/or a need for the plugin to be configured in more ways. \r\n\r\nI am of the opinion that more stupid-simple modules is better than fewer slightly more complex modules, especially in the gulp environment."}},"public":true,"created_at":"2015-01-01T01:00:10Z"}
{"id":"2489395824","type":"PullRequestEvent","actor":{"id":2068437,"login":"ahaurw01","gravatar_id":"","url":"https://api.github.com/users/ahaurw01","avatar_url":"https://avatars.githubusercontent.com/u/2068437?"},"repo":{"id":18271693,"name":"ahaurw01/gulp-remember","url":"https://api.github.com/repos/ahaurw01/gulp-remember"},"payload":{"action":"closed","number":13,"pull_request":{"url":"https://api.github.com/repos/ahaurw01/gulp-remember/pulls/13","id":26629069,"html_url":"https://github.com/ahaurw01/gulp-remember/pull/13","diff_url":"https://github.com/ahaurw01/gulp-remember/pull/13.diff","patch_url":"https://github.com/ahaurw01/gulp-remember/pull/13.patch","issue_url":"https://api.github.com/repos/ahaurw01/gulp-remember/issues/13","number":13,"state":"closed","locked":false,"title":"Handle file's history","user":{"login":"efolio","id":2078815,"avatar_url":"https://avatars.githubusercontent.com/u/2078815?v=3","gravatar_id":"","url":"https://api.github.com/users/efolio","html_url":"https://github.com/efolio","followers_url":"https://api.github.com/users/efolio/followers","following_url":"https://api.github.com/users/efolio/following{/other_user}","gists_url":"https://api.github.com/users/efolio/gists{/gist_id}","starred_url":"https://api.github.com/users/efolio/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/efolio/subscriptions","organizations_url":"https://api.github.com/users/efolio/orgs","repos_url":"https://api.github.com/users/efolio/repos","events_url":"https://api.github.com/users/efolio/events{/privacy}","received_events_url":"https://api.github.com/users/efolio/received_events","type":"User","site_admin":false},"body":"Mostly add a `forgetUsingHistory` method in order to tackle the need to forget files using the original filename instead of the processed filename.\r\n\r\nI'll be glad to tweak this PR anyway you want.\r\n\r\nThanks a 
lot,","created_at":"2014-12-28T23:47:50Z","updated_at":"2015-01-01T01:00:09Z","closed_at":"2015-01-01T01:00:09Z","merged_at":null,"merge_commit_sha":"77da51e98bbc8a636fabf2ec70de46338199e570","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/ahaurw01/gulp-remember/pulls/13/commits","review_comments_url":"https://api.github.com/repos/ahaurw01/gulp-remember/pulls/13/comments","review_comment_url":"https://api.github.com/repos/ahaurw01/gulp-remember/pulls/comments/{number}","comments_url":"https://api.github.com/repos/ahaurw01/gulp-remember/issues/13/comments","statuses_url":"https://api.github.com/repos/ahaurw01/gulp-remember/statuses/b54cbec37e97f1b472eabdced02d07847a536f9e","head":{"label":"efolio:master","ref":"master","sha":"b54cbec37e97f1b472eabdced02d07847a536f9e","user":{"login":"efolio","id":2078815,"avatar_url":"https://avatars.githubusercontent.com/u/2078815?v=3","gravatar_id":"","url":"https://api.github.com/users/efolio","html_url":"https://github.com/efolio","followers_url":"https://api.github.com/users/efolio/followers","following_url":"https://api.github.com/users/efolio/following{/other_user}","gists_url":"https://api.github.com/users/efolio/gists{/gist_id}","starred_url":"https://api.github.com/users/efolio/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/efolio/subscriptions","organizations_url":"https://api.github.com/users/efolio/orgs","repos_url":"https://api.github.com/users/efolio/repos","events_url":"https://api.github.com/users/efolio/events{/privacy}","received_events_url":"https://api.github.com/users/efolio/received_events","type":"User","site_admin":false},"repo":{"id":28569993,"name":"gulp-remember","full_name":"efolio/gulp-remember","owner":{"login":"efolio","id":2078815,"avatar_url":"https://avatars.githubusercontent.com/u/2078815?v=3","gravatar_id":"","url":"https://api.github.com/users/efolio","html_url":"https://github.com/efolio","followers_url":"https://api.github.com/users/efolio
/followers","following_url":"https://api.github.com/users/efolio/following{/other_user}","gists_url":"https://api.github.com/users/efolio/gists{/gist_id}","starred_url":"https://api.github.com/users/efolio/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/efolio/subscriptions","organizations_url":"https://api.github.com/users/efolio/orgs","repos_url":"https://api.github.com/users/efolio/repos","events_url":"https://api.github.com/users/efolio/events{/privacy}","received_events_url":"https://api.github.com/users/efolio/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/efolio/gulp-remember","description":"A plugin for gulp that remembers and recalls files passed through it","fork":true,"url":"https://api.github.com/repos/efolio/gulp-remember","forks_url":"https://api.github.com/repos/efolio/gulp-remember/forks","keys_url":"https://api.github.com/repos/efolio/gulp-remember/keys{/key_id}","collaborators_url":"https://api.github.com/repos/efolio/gulp-remember/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/efolio/gulp-remember/teams","hooks_url":"https://api.github.com/repos/efolio/gulp-remember/hooks","issue_events_url":"https://api.github.com/repos/efolio/gulp-remember/issues/events{/number}","events_url":"https://api.github.com/repos/efolio/gulp-remember/events","assignees_url":"https://api.github.com/repos/efolio/gulp-remember/assignees{/user}","branches_url":"https://api.github.com/repos/efolio/gulp-remember/branches{/branch}","tags_url":"https://api.github.com/repos/efolio/gulp-remember/tags","blobs_url":"https://api.github.com/repos/efolio/gulp-remember/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/efolio/gulp-remember/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/efolio/gulp-remember/git/refs{/sha}","trees_url":"https://api.github.com/repos/efolio/gulp-remember/git/trees{/sha}","statuses_url":"https://api.github.com/repos/efolio/gulp-reme
mber/statuses/{sha}","languages_url":"https://api.github.com/repos/efolio/gulp-remember/languages","stargazers_url":"https://api.github.com/repos/efolio/gulp-remember/stargazers","contributors_url":"https://api.github.com/repos/efolio/gulp-remember/contributors","subscribers_url":"https://api.github.com/repos/efolio/gulp-remember/subscribers","subscription_url":"https://api.github.com/repos/efolio/gulp-remember/subscription","commits_url":"https://api.github.com/repos/efolio/gulp-remember/commits{/sha}","git_commits_url":"https://api.github.com/repos/efolio/gulp-remember/git/commits{/sha}","comments_url":"https://api.github.com/repos/efolio/gulp-remember/comments{/number}","issue_comment_url":"https://api.github.com/repos/efolio/gulp-remember/issues/comments/{number}","contents_url":"https://api.github.com/repos/efolio/gulp-remember/contents/{+path}","compare_url":"https://api.github.com/repos/efolio/gulp-remember/compare/{base}...{head}","merges_url":"https://api.github.com/repos/efolio/gulp-remember/merges","archive_url":"https://api.github.com/repos/efolio/gulp-remember/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/efolio/gulp-remember/downloads","issues_url":"https://api.github.com/repos/efolio/gulp-remember/issues{/number}","pulls_url":"https://api.github.com/repos/efolio/gulp-remember/pulls{/number}","milestones_url":"https://api.github.com/repos/efolio/gulp-remember/milestones{/number}","notifications_url":"https://api.github.com/repos/efolio/gulp-remember/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/efolio/gulp-remember/labels{/name}","releases_url":"https://api.github.com/repos/efolio/gulp-remember/releases{/id}","created_at":"2014-12-28T19:41:58Z","updated_at":"2014-12-28T23:45:40Z","pushed_at":"2014-12-28T23:45:40Z","git_url":"git://github.com/efolio/gulp-remember.git","ssh_url":"git@github.com:efolio/gulp-remember.git","clone_url":"https://github.com/efolio/gulp-remember.git","svn_url":"https
://github.com/efolio/gulp-remember","homepage":null,"size":275,"stargazers_count":0,"watchers_count":0,"language":"JavaScript","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"ahaurw01:master","ref":"master","sha":"8bba77a2fb8f692192c3499f50a9a53036e5fb60","user":{"login":"ahaurw01","id":2068437,"avatar_url":"https://avatars.githubusercontent.com/u/2068437?v=3","gravatar_id":"","url":"https://api.github.com/users/ahaurw01","html_url":"https://github.com/ahaurw01","followers_url":"https://api.github.com/users/ahaurw01/followers","following_url":"https://api.github.com/users/ahaurw01/following{/other_user}","gists_url":"https://api.github.com/users/ahaurw01/gists{/gist_id}","starred_url":"https://api.github.com/users/ahaurw01/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ahaurw01/subscriptions","organizations_url":"https://api.github.com/users/ahaurw01/orgs","repos_url":"https://api.github.com/users/ahaurw01/repos","events_url":"https://api.github.com/users/ahaurw01/events{/privacy}","received_events_url":"https://api.github.com/users/ahaurw01/received_events","type":"User","site_admin":false},"repo":{"id":18271693,"name":"gulp-remember","full_name":"ahaurw01/gulp-remember","owner":{"login":"ahaurw01","id":2068437,"avatar_url":"https://avatars.githubusercontent.com/u/2068437?v=3","gravatar_id":"","url":"https://api.github.com/users/ahaurw01","html_url":"https://github.com/ahaurw01","followers_url":"https://api.github.com/users/ahaurw01/followers","following_url":"https://api.github.com/users/ahaurw01/following{/other_user}","gists_url":"https://api.github.com/users/ahaurw01/gists{/gist_id}","starred_url":"https://api.github.com/users/ahaurw01/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ahaurw01/subscriptions","organizations_url":"https://api.github.
com/users/ahaurw01/orgs","repos_url":"https://api.github.com/users/ahaurw01/repos","events_url":"https://api.github.com/users/ahaurw01/events{/privacy}","received_events_url":"https://api.github.com/users/ahaurw01/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/ahaurw01/gulp-remember","description":"A plugin for gulp that remembers and recalls files passed through it","fork":false,"url":"https://api.github.com/repos/ahaurw01/gulp-remember","forks_url":"https://api.github.com/repos/ahaurw01/gulp-remember/forks","keys_url":"https://api.github.com/repos/ahaurw01/gulp-remember/keys{/key_id}","collaborators_url":"https://api.github.com/repos/ahaurw01/gulp-remember/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/ahaurw01/gulp-remember/teams","hooks_url":"https://api.github.com/repos/ahaurw01/gulp-remember/hooks","issue_events_url":"https://api.github.com/repos/ahaurw01/gulp-remember/issues/events{/number}","events_url":"https://api.github.com/repos/ahaurw01/gulp-remember/events","assignees_url":"https://api.github.com/repos/ahaurw01/gulp-remember/assignees{/user}","branches_url":"https://api.github.com/repos/ahaurw01/gulp-remember/branches{/branch}","tags_url":"https://api.github.com/repos/ahaurw01/gulp-remember/tags","blobs_url":"https://api.github.com/repos/ahaurw01/gulp-remember/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/ahaurw01/gulp-remember/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/ahaurw01/gulp-remember/git/refs{/sha}","trees_url":"https://api.github.com/repos/ahaurw01/gulp-remember/git/trees{/sha}","statuses_url":"https://api.github.com/repos/ahaurw01/gulp-remember/statuses/{sha}","languages_url":"https://api.github.com/repos/ahaurw01/gulp-remember/languages","stargazers_url":"https://api.github.com/repos/ahaurw01/gulp-remember/stargazers","contributors_url":"https://api.github.com/repos/ahaurw01/gulp-remember/contributors","subscribers_url":"https://api
.github.com/repos/ahaurw01/gulp-remember/subscribers","subscription_url":"https://api.github.com/repos/ahaurw01/gulp-remember/subscription","commits_url":"https://api.github.com/repos/ahaurw01/gulp-remember/commits{/sha}","git_commits_url":"https://api.github.com/repos/ahaurw01/gulp-remember/git/commits{/sha}","comments_url":"https://api.github.com/repos/ahaurw01/gulp-remember/comments{/number}","issue_comment_url":"https://api.github.com/repos/ahaurw01/gulp-remember/issues/comments/{number}","contents_url":"https://api.github.com/repos/ahaurw01/gulp-remember/contents/{+path}","compare_url":"https://api.github.com/repos/ahaurw01/gulp-remember/compare/{base}...{head}","merges_url":"https://api.github.com/repos/ahaurw01/gulp-remember/merges","archive_url":"https://api.github.com/repos/ahaurw01/gulp-remember/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/ahaurw01/gulp-remember/downloads","issues_url":"https://api.github.com/repos/ahaurw01/gulp-remember/issues{/number}","pulls_url":"https://api.github.com/repos/ahaurw01/gulp-remember/pulls{/number}","milestones_url":"https://api.github.com/repos/ahaurw01/gulp-remember/milestones{/number}","notifications_url":"https://api.github.com/repos/ahaurw01/gulp-remember/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/ahaurw01/gulp-remember/labels{/name}","releases_url":"https://api.github.com/repos/ahaurw01/gulp-remember/releases{/id}","created_at":"2014-03-30T19:21:07Z","updated_at":"2014-12-29T04:09:25Z","pushed_at":"2014-12-21T15:42:48Z","git_url":"git://github.com/ahaurw01/gulp-remember.git","ssh_url":"git@github.com:ahaurw01/gulp-remember.git","clone_url":"https://github.com/ahaurw01/gulp-remember.git","svn_url":"https://github.com/ahaurw01/gulp-remember","homepage":null,"size":275,"stargazers_count":35,"watchers_count":35,"language":"JavaScript","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":6,"mirror_url":null,"open_issues_co
unt":0,"forks":6,"open_issues":0,"watchers":35,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/ahaurw01/gulp-remember/pulls/13"},"html":{"href":"https://github.com/ahaurw01/gulp-remember/pull/13"},"issue":{"href":"https://api.github.com/repos/ahaurw01/gulp-remember/issues/13"},"comments":{"href":"https://api.github.com/repos/ahaurw01/gulp-remember/issues/13/comments"},"review_comments":{"href":"https://api.github.com/repos/ahaurw01/gulp-remember/pulls/13/comments"},"review_comment":{"href":"https://api.github.com/repos/ahaurw01/gulp-remember/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/ahaurw01/gulp-remember/pulls/13/commits"},"statuses":{"href":"https://api.github.com/repos/ahaurw01/gulp-remember/statuses/b54cbec37e97f1b472eabdced02d07847a536f9e"}},"merged":false,"mergeable":true,"mergeable_state":"clean","merged_by":null,"comments":11,"review_comments":0,"commits":1,"additions":195,"deletions":14,"changed_files":3}},"public":true,"created_at":"2015-01-01T01:00:10Z"}
{"id":"2489395826","type":"PullRequestEvent","actor":{"id":8518239,"login":"gitter-badger","gravatar_id":"","url":"https://api.github.com/users/gitter-badger","avatar_url":"https://avatars.githubusercontent.com/u/8518239?"},"repo":{"id":8540783,"name":"russmatney/dotfiles","url":"https://api.github.com/repos/russmatney/dotfiles"},"payload":{"action":"opened","number":1,"pull_request":{"url":"https://api.github.com/repos/russmatney/dotfiles/pulls/1","id":26739403,"html_url":"https://github.com/russmatney/dotfiles/pull/1","diff_url":"https://github.com/russmatney/dotfiles/pull/1.diff","patch_url":"https://github.com/russmatney/dotfiles/pull/1.patch","issue_url":"https://api.github.com/repos/russmatney/dotfiles/issues/1","number":1,"state":"open","locked":false,"title":"Add a Gitter chat badge to README.md","user":{"login":"gitter-badger","id":8518239,"avatar_url":"https://avatars.githubusercontent.com/u/8518239?v=3","gravatar_id":"","url":"https://api.github.com/users/gitter-badger","html_url":"https://github.com/gitter-badger","followers_url":"https://api.github.com/users/gitter-badger/followers","following_url":"https://api.github.com/users/gitter-badger/following{/other_user}","gists_url":"https://api.github.com/users/gitter-badger/gists{/gist_id}","starred_url":"https://api.github.com/users/gitter-badger/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/gitter-badger/subscriptions","organizations_url":"https://api.github.com/users/gitter-badger/orgs","repos_url":"https://api.github.com/users/gitter-badger/repos","events_url":"https://api.github.com/users/gitter-badger/events{/privacy}","received_events_url":"https://api.github.com/users/gitter-badger/received_events","type":"User","site_admin":false},"body":"### russmatney/dotfiles now has a Chat Room on Gitter\n\n@russmatney has just created a chat room. 
You can visit it here: [https://gitter.im/russmatney/dotfiles](https://gitter.im/russmatney/dotfiles?utm_source=badge&utm_medium=badge&utm_campaign=pr-badge&content=body_link).\n\nThis pull-request adds this badge to your README.md:\n\n\n[![Gitter](https://badges.gitter.im/Join%20Chat.svg)](https://gitter.im/russmatney/dotfiles?utm_source=badge&utm_medium=badge&utm_campaign=pr-badge&utm_content=body_badge)\n\nHappy chatting.\n\n\nPS: [Click here](https://gitter.im/settings/badger/opt-out) if you would prefer not to receive automatic pull-requests from Gitter in future.\n","created_at":"2015-01-01T01:00:09Z","updated_at":"2015-01-01T01:00:09Z","closed_at":null,"merged_at":null,"merge_commit_sha":null,"assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/russmatney/dotfiles/pulls/1/commits","review_comments_url":"https://api.github.com/repos/russmatney/dotfiles/pulls/1/comments","review_comment_url":"https://api.github.com/repos/russmatney/dotfiles/pulls/comments/{number}","comments_url":"https://api.github.com/repos/russmatney/dotfiles/issues/1/comments","statuses_url":"https://api.github.com/repos/russmatney/dotfiles/statuses/e4f636ddb08f1811808e3f872a7a323aa80c8a7b","head":{"label":"gitter-badger:gitter-badge","ref":"gitter-badge","sha":"e4f636ddb08f1811808e3f872a7a323aa80c8a7b","user":{"login":"gitter-badger","id":8518239,"avatar_url":"https://avatars.githubusercontent.com/u/8518239?v=3","gravatar_id":"","url":"https://api.github.com/users/gitter-badger","html_url":"https://github.com/gitter-badger","followers_url":"https://api.github.com/users/gitter-badger/followers","following_url":"https://api.github.com/users/gitter-badger/following{/other_user}","gists_url":"https://api.github.com/users/gitter-badger/gists{/gist_id}","starred_url":"https://api.github.com/users/gitter-badger/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/gitter-badger/subscriptions","organizations_url":"https://api.github.com/users/gitter-badg
er/orgs","repos_url":"https://api.github.com/users/gitter-badger/repos","events_url":"https://api.github.com/users/gitter-badger/events{/privacy}","received_events_url":"https://api.github.com/users/gitter-badger/received_events","type":"User","site_admin":false},"repo":{"id":28678212,"name":"dotfiles-15","full_name":"gitter-badger/dotfiles-15","owner":{"login":"gitter-badger","id":8518239,"avatar_url":"https://avatars.githubusercontent.com/u/8518239?v=3","gravatar_id":"","url":"https://api.github.com/users/gitter-badger","html_url":"https://github.com/gitter-badger","followers_url":"https://api.github.com/users/gitter-badger/followers","following_url":"https://api.github.com/users/gitter-badger/following{/other_user}","gists_url":"https://api.github.com/users/gitter-badger/gists{/gist_id}","starred_url":"https://api.github.com/users/gitter-badger/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/gitter-badger/subscriptions","organizations_url":"https://api.github.com/users/gitter-badger/orgs","repos_url":"https://api.github.com/users/gitter-badger/repos","events_url":"https://api.github.com/users/gitter-badger/events{/privacy}","received_events_url":"https://api.github.com/users/gitter-badger/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/gitter-badger/dotfiles-15","description":"","fork":true,"url":"https://api.github.com/repos/gitter-badger/dotfiles-15","forks_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/forks","keys_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/keys{/key_id}","collaborators_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/teams","hooks_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/hooks","issue_events_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/issues/events{/number}","events_url":"https://api.github.c
om/repos/gitter-badger/dotfiles-15/events","assignees_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/assignees{/user}","branches_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/branches{/branch}","tags_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/tags","blobs_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/git/refs{/sha}","trees_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/git/trees{/sha}","statuses_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/statuses/{sha}","languages_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/languages","stargazers_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/stargazers","contributors_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/contributors","subscribers_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/subscribers","subscription_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/subscription","commits_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/commits{/sha}","git_commits_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/git/commits{/sha}","comments_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/comments{/number}","issue_comment_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/issues/comments/{number}","contents_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/contents/{+path}","compare_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/compare/{base}...{head}","merges_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/merges","archive_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/downloads","issues_url":"https://api.github
.com/repos/gitter-badger/dotfiles-15/issues{/number}","pulls_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/pulls{/number}","milestones_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/milestones{/number}","notifications_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/labels{/name}","releases_url":"https://api.github.com/repos/gitter-badger/dotfiles-15/releases{/id}","created_at":"2015-01-01T01:00:07Z","updated_at":"2015-01-01T01:00:08Z","pushed_at":"2015-01-01T01:00:09Z","git_url":"git://github.com/gitter-badger/dotfiles-15.git","ssh_url":"git@github.com:gitter-badger/dotfiles-15.git","clone_url":"https://github.com/gitter-badger/dotfiles-15.git","svn_url":"https://github.com/gitter-badger/dotfiles-15","homepage":"","size":620,"stargazers_count":0,"watchers_count":0,"language":"VimL","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"russmatney:master","ref":"master","sha":"7ca425b3dc133cd625f3f2e2e014ebee508eb39d","user":{"login":"russmatney","id":1596350,"avatar_url":"https://avatars.githubusercontent.com/u/1596350?v=3","gravatar_id":"","url":"https://api.github.com/users/russmatney","html_url":"https://github.com/russmatney","followers_url":"https://api.github.com/users/russmatney/followers","following_url":"https://api.github.com/users/russmatney/following{/other_user}","gists_url":"https://api.github.com/users/russmatney/gists{/gist_id}","starred_url":"https://api.github.com/users/russmatney/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/russmatney/subscriptions","organizations_url":"https://api.github.com/users/russmatney/orgs","repos_url":"https://api.github.com/users/russmatney/repos","events_url":"https://api.github.com/use
rs/russmatney/events{/privacy}","received_events_url":"https://api.github.com/users/russmatney/received_events","type":"User","site_admin":false},"repo":{"id":8540783,"name":"dotfiles","full_name":"russmatney/dotfiles","owner":{"login":"russmatney","id":1596350,"avatar_url":"https://avatars.githubusercontent.com/u/1596350?v=3","gravatar_id":"","url":"https://api.github.com/users/russmatney","html_url":"https://github.com/russmatney","followers_url":"https://api.github.com/users/russmatney/followers","following_url":"https://api.github.com/users/russmatney/following{/other_user}","gists_url":"https://api.github.com/users/russmatney/gists{/gist_id}","starred_url":"https://api.github.com/users/russmatney/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/russmatney/subscriptions","organizations_url":"https://api.github.com/users/russmatney/orgs","repos_url":"https://api.github.com/users/russmatney/repos","events_url":"https://api.github.com/users/russmatney/events{/privacy}","received_events_url":"https://api.github.com/users/russmatney/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/russmatney/dotfiles","description":"","fork":false,"url":"https://api.github.com/repos/russmatney/dotfiles","forks_url":"https://api.github.com/repos/russmatney/dotfiles/forks","keys_url":"https://api.github.com/repos/russmatney/dotfiles/keys{/key_id}","collaborators_url":"https://api.github.com/repos/russmatney/dotfiles/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/russmatney/dotfiles/teams","hooks_url":"https://api.github.com/repos/russmatney/dotfiles/hooks","issue_events_url":"https://api.github.com/repos/russmatney/dotfiles/issues/events{/number}","events_url":"https://api.github.com/repos/russmatney/dotfiles/events","assignees_url":"https://api.github.com/repos/russmatney/dotfiles/assignees{/user}","branches_url":"https://api.github.com/repos/russmatney/dotfiles/branches{/branch}","tags_
url":"https://api.github.com/repos/russmatney/dotfiles/tags","blobs_url":"https://api.github.com/repos/russmatney/dotfiles/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/russmatney/dotfiles/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/russmatney/dotfiles/git/refs{/sha}","trees_url":"https://api.github.com/repos/russmatney/dotfiles/git/trees{/sha}","statuses_url":"https://api.github.com/repos/russmatney/dotfiles/statuses/{sha}","languages_url":"https://api.github.com/repos/russmatney/dotfiles/languages","stargazers_url":"https://api.github.com/repos/russmatney/dotfiles/stargazers","contributors_url":"https://api.github.com/repos/russmatney/dotfiles/contributors","subscribers_url":"https://api.github.com/repos/russmatney/dotfiles/subscribers","subscription_url":"https://api.github.com/repos/russmatney/dotfiles/subscription","commits_url":"https://api.github.com/repos/russmatney/dotfiles/commits{/sha}","git_commits_url":"https://api.github.com/repos/russmatney/dotfiles/git/commits{/sha}","comments_url":"https://api.github.com/repos/russmatney/dotfiles/comments{/number}","issue_comment_url":"https://api.github.com/repos/russmatney/dotfiles/issues/comments/{number}","contents_url":"https://api.github.com/repos/russmatney/dotfiles/contents/{+path}","compare_url":"https://api.github.com/repos/russmatney/dotfiles/compare/{base}...{head}","merges_url":"https://api.github.com/repos/russmatney/dotfiles/merges","archive_url":"https://api.github.com/repos/russmatney/dotfiles/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/russmatney/dotfiles/downloads","issues_url":"https://api.github.com/repos/russmatney/dotfiles/issues{/number}","pulls_url":"https://api.github.com/repos/russmatney/dotfiles/pulls{/number}","milestones_url":"https://api.github.com/repos/russmatney/dotfiles/milestones{/number}","notifications_url":"https://api.github.com/repos/russmatney/dotfiles/notifications{?since,all,participating}","labels_url":"https://ap
i.github.com/repos/russmatney/dotfiles/labels{/name}","releases_url":"https://api.github.com/repos/russmatney/dotfiles/releases{/id}","created_at":"2013-03-03T18:57:40Z","updated_at":"2014-12-30T19:07:15Z","pushed_at":"2014-12-30T19:07:15Z","git_url":"git://github.com/russmatney/dotfiles.git","ssh_url":"git@github.com:russmatney/dotfiles.git","clone_url":"https://github.com/russmatney/dotfiles.git","svn_url":"https://github.com/russmatney/dotfiles","homepage":"","size":620,"stargazers_count":1,"watchers_count":1,"language":"VimL","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":1,"mirror_url":null,"open_issues_count":1,"forks":1,"open_issues":1,"watchers":1,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/russmatney/dotfiles/pulls/1"},"html":{"href":"https://github.com/russmatney/dotfiles/pull/1"},"issue":{"href":"https://api.github.com/repos/russmatney/dotfiles/issues/1"},"comments":{"href":"https://api.github.com/repos/russmatney/dotfiles/issues/1/comments"},"review_comments":{"href":"https://api.github.com/repos/russmatney/dotfiles/pulls/1/comments"},"review_comment":{"href":"https://api.github.com/repos/russmatney/dotfiles/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/russmatney/dotfiles/pulls/1/commits"},"statuses":{"href":"https://api.github.com/repos/russmatney/dotfiles/statuses/e4f636ddb08f1811808e3f872a7a323aa80c8a7b"}},"merged":false,"mergeable":null,"mergeable_state":"unknown","merged_by":null,"comments":0,"review_comments":0,"commits":1,"additions":2,"deletions":0,"changed_files":1}},"public":true,"created_at":"2015-01-01T01:00:10Z"}
{"id":"2489395827","type":"PushEvent","actor":{"id":6158630,"login":"greatfire","gravatar_id":"","url":"https://api.github.com/users/greatfire","avatar_url":"https://avatars.githubusercontent.com/u/6158630?"},"repo":{"id":15100395,"name":"greatfire/wiki","url":"https://api.github.com/repos/greatfire/wiki"},"payload":{"push_id":536752151,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"ba5bb9726f655f8acd29ecb3f89f1ae55305e680","before":"60adcb73302844b76926dc2b33a941f4f5069836","commits":[{"sha":"ba5bb9726f655f8acd29ecb3f89f1ae55305e680","author":{"email":"24bf68e341ce0fbd9259a5d51feed79682ea4eba@greatfire.org","name":"Ubuntu"},"message":"a","distinct":true,"url":"https://api.github.com/repos/greatfire/wiki/commits/ba5bb9726f655f8acd29ecb3f89f1ae55305e680"}]},"public":true,"created_at":"2015-01-01T01:00:10Z"}
{"id":"2489395828","type":"PushEvent","actor":{"id":314716,"login":"astrofrog","gravatar_id":"","url":"https://api.github.com/users/astrofrog","avatar_url":"https://avatars.githubusercontent.com/u/314716?"},"repo":{"id":22914622,"name":"astrofrog/reproject-benchmarks","url":"https://api.github.com/repos/astrofrog/reproject-benchmarks"},"payload":{"push_id":536752153,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"0e9b7c43a998d5386212968a8b55899c507a7288","before":"399b664da8fdf3dd344e09740700a45eabd8377b","commits":[{"sha":"0e9b7c43a998d5386212968a8b55899c507a7288","author":{"email":"5a30e73bb3eb7866ce4ccff234d7add82054e98d@gmail.com","name":"Thomas Robitaille"},"message":"Generated from sources","distinct":true,"url":"https://api.github.com/repos/astrofrog/reproject-benchmarks/commits/0e9b7c43a998d5386212968a8b55899c507a7288"}]},"public":true,"created_at":"2015-01-01T01:00:10Z"}
{"id":"2489395834","type":"PushEvent","actor":{"id":429529,"login":"cato-","gravatar_id":"","url":"https://api.github.com/users/cato-","avatar_url":"https://avatars.githubusercontent.com/u/429529?"},"repo":{"id":7588969,"name":"xenim/livestatus-publicpage","url":"https://api.github.com/repos/xenim/livestatus-publicpage"},"payload":{"push_id":536752158,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"39684ee741d07cd9c8f1ca9f5333b805f3c67ec2","before":"aaa220dfce3ed980c25e7277cb174b4705cc23af","commits":[{"sha":"39684ee741d07cd9c8f1ca9f5333b805f3c67ec2","author":{"email":"12e9293ec6b30c7fa8a0926af42807e929c1684f@niob.xnis.de","name":"Robert Weidlich"},"message":"update","distinct":true,"url":"https://api.github.com/repos/xenim/livestatus-publicpage/commits/39684ee741d07cd9c8f1ca9f5333b805f3c67ec2"}]},"public":true,"created_at":"2015-01-01T01:00:10Z","org":{"id":1789841,"login":"xenim","gravatar_id":"","url":"https://api.github.com/orgs/xenim","avatar_url":"https://avatars.githubusercontent.com/u/1789841?"}}
{"id":"2489395835","type":"PushEvent","actor":{"id":16432,"login":"tardate","gravatar_id":"","url":"https://api.github.com/users/tardate","avatar_url":"https://avatars.githubusercontent.com/u/16432?"},"repo":{"id":28238617,"name":"tardate/visual555","url":"https://api.github.com/repos/tardate/visual555"},"payload":{"push_id":536752159,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"a2e48f3da6ae2425950266f6f02857172d33af0a","before":"c9b4675aa616e728733541ce7ce42b161fe92b8a","commits":[{"sha":"a2e48f3da6ae2425950266f6f02857172d33af0a","author":{"email":"136d28fa799cf1dc4e2c5bcef36214a038721fe5@gmail.com","name":"Paul Gallagher"},"message":"add some book recommendations","distinct":true,"url":"https://api.github.com/repos/tardate/visual555/commits/a2e48f3da6ae2425950266f6f02857172d33af0a"}]},"public":true,"created_at":"2015-01-01T01:00:10Z"}
{"id":"2489395838","type":"PushEvent","actor":{"id":4447136,"login":"su-github-machine-user","gravatar_id":"","url":"https://api.github.com/users/su-github-machine-user","avatar_url":"https://avatars.githubusercontent.com/u/4447136?"},"repo":{"id":10314483,"name":"su-github-machine-user/github-nagios-check","url":"https://api.github.com/repos/su-github-machine-user/github-nagios-check"},"payload":{"push_id":536752162,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"2320a2b78da315d43fa018bba258dc9b1d07e6b9","before":"e9d1b5d1e3bdac7c2aabe75094d401db3ee35f65","commits":[{"sha":"2320a2b78da315d43fa018bba258dc9b1d07e6b9","author":{"email":"875a8f2f42c570f5f4ea7bfd154f582bcf95673a@su.se","name":"su-githubmirror"},"message":"New timestamp: 1420074002","distinct":true,"url":"https://api.github.com/repos/su-github-machine-user/github-nagios-check/commits/2320a2b78da315d43fa018bba258dc9b1d07e6b9"}]},"public":true,"created_at":"2015-01-01T01:00:10Z"}
{"id":"2489395842","type":"PushEvent","actor":{"id":2275298,"login":"enjoydiy","gravatar_id":"","url":"https://api.github.com/users/enjoydiy","avatar_url":"https://avatars.githubusercontent.com/u/2275298?"},"repo":{"id":6275680,"name":"enjoydiy/ttautovpn","url":"https://api.github.com/repos/enjoydiy/ttautovpn"},"payload":{"push_id":536752166,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"947cbd06a44b1f1e2970af802bda84a62b876285","before":"b4694b448e512278f83daf0d6c41e3bce241e2e3","commits":[{"sha":"947cbd06a44b1f1e2970af802bda84a62b876285","author":{"email":"d033e22ae348aeb5660fc2140aec35850c4da997@enjoydiy.com","name":"zijiao"},"message":"The routes include china IPs,created on 2015/01/01","distinct":true,"url":"https://api.github.com/repos/enjoydiy/ttautovpn/commits/947cbd06a44b1f1e2970af802bda84a62b876285"}]},"public":true,"created_at":"2015-01-01T01:00:10Z"}
{"id":"2489395845","type":"WatchEvent","actor":{"id":681965,"login":"wonbyte","gravatar_id":"","url":"https://api.github.com/users/wonbyte","avatar_url":"https://avatars.githubusercontent.com/u/681965?"},"repo":{"id":14490265,"name":"idris-lang/idris-tutorial","url":"https://api.github.com/repos/idris-lang/idris-tutorial"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:00:11Z","org":{"id":5552910,"login":"idris-lang","gravatar_id":"","url":"https://api.github.com/orgs/idris-lang","avatar_url":"https://avatars.githubusercontent.com/u/5552910?"}}
{"id":"2489395846","type":"PushEvent","actor":{"id":5186562,"login":"wynot","gravatar_id":"","url":"https://api.github.com/users/wynot","avatar_url":"https://avatars.githubusercontent.com/u/5186562?"},"repo":{"id":28301051,"name":"wynot/bizmarkio_app","url":"https://api.github.com/repos/wynot/bizmarkio_app"},"payload":{"push_id":536752167,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1e8c2f76bb60291f62859804bd999e48ac8baf26","before":"ed7d2b523d98421614bfbef2eee59d256ef43118","commits":[{"sha":"1e8c2f76bb60291f62859804bd999e48ac8baf26","author":{"email":"a586fcf1f3b216ef769d3cfdb1ef68d895375da3@gmail.com","name":"Will Young"},"message":"Add user microposts","distinct":true,"url":"https://api.github.com/repos/wynot/bizmarkio_app/commits/1e8c2f76bb60291f62859804bd999e48ac8baf26"}]},"public":true,"created_at":"2015-01-01T01:00:11Z"}
{"id":"2489395848","type":"PushEvent","actor":{"id":3004602,"login":"mattkirby","gravatar_id":"","url":"https://api.github.com/users/mattkirby","avatar_url":"https://avatars.githubusercontent.com/u/3004602?"},"repo":{"id":25184298,"name":"mattkirby/puppet-zpr","url":"https://api.github.com/repos/mattkirby/puppet-zpr"},"payload":{"push_id":536752169,"size":1,"distinct_size":1,"ref":"refs/heads/standard_params","head":"9f6831aef1e36ee6af01f7dacc12c5a082d8c587","before":"25e6dd22e0302c18ab830e43e5448ac6c8f74f86","commits":[{"sha":"9f6831aef1e36ee6af01f7dacc12c5a082d8c587","author":{"email":"992efda4ce64b989ffc2f2114584c88f5d0d9310@puppetlabs.com","name":"kirby@puppetlabs.com"},"message":"Remove notify since file resource doesn't work like the exec did","distinct":true,"url":"https://api.github.com/repos/mattkirby/puppet-zpr/commits/9f6831aef1e36ee6af01f7dacc12c5a082d8c587"}]},"public":true,"created_at":"2015-01-01T01:00:11Z"}
{"id":"2489395849","type":"PushEvent","actor":{"id":10176820,"login":"chalavadivishnu","gravatar_id":"","url":"https://api.github.com/users/chalavadivishnu","avatar_url":"https://avatars.githubusercontent.com/u/10176820?"},"repo":{"id":28678150,"name":"chalavadivishnu/Face-Detection","url":"https://api.github.com/repos/chalavadivishnu/Face-Detection"},"payload":{"push_id":536752170,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"8069b04a69d5729520e64e6c88c262a77407bd75","before":"b252ace8548afd9d1806bffffbe5c6497ca58edf","commits":[{"sha":"8069b04a69d5729520e64e6c88c262a77407bd75","author":{"email":"ce8044f02eb2a26b631671f5297317036d398e79@gmail.com","name":"Chalavadi Vishnu"},"message":"main","distinct":true,"url":"https://api.github.com/repos/chalavadivishnu/Face-Detection/commits/8069b04a69d5729520e64e6c88c262a77407bd75"}]},"public":true,"created_at":"2015-01-01T01:00:11Z"}
{"id":"2489395850","type":"PushEvent","actor":{"id":8147971,"login":"machchk","gravatar_id":"","url":"https://api.github.com/users/machchk","avatar_url":"https://avatars.githubusercontent.com/u/8147971?"},"repo":{"id":21783823,"name":"machchk/report","url":"https://api.github.com/repos/machchk/report"},"payload":{"push_id":536752171,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"7b1e68cdc33154e42d97302cf36ed4bfe7d280be","before":"34370ef489c66eedc0d0169a95898cc7f82c1c3e","commits":[{"sha":"7b1e68cdc33154e42d97302cf36ed4bfe7d280be","author":{"email":"dc76e9f0c0006e8f919e0c515c66dbba3982f785@localhost","name":"root"},"message":"update","distinct":true,"url":"https://api.github.com/repos/machchk/report/commits/7b1e68cdc33154e42d97302cf36ed4bfe7d280be"}]},"public":true,"created_at":"2015-01-01T01:00:11Z"}
{"id":"2489395853","type":"PushEvent","actor":{"id":8838361,"login":"benjamincaldwell","gravatar_id":"","url":"https://api.github.com/users/benjamincaldwell","avatar_url":"https://avatars.githubusercontent.com/u/8838361?"},"repo":{"id":28570090,"name":"benjamincaldwell/Website","url":"https://api.github.com/repos/benjamincaldwell/Website"},"payload":{"push_id":536752174,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"1bce253e7632d45b428be6d1e4b02e39a3d477de","before":"d4a7f3e628110633e87261aa0661277ccbd8b75f","commits":[{"sha":"1bce253e7632d45b428be6d1e4b02e39a3d477de","author":{"email":"8ffda5448dc6d9eb6fc0b9b1283b3b20a847a4a2@gmail.com","name":"Benjamin Caldwell"},"message":"different background image method","distinct":true,"url":"https://api.github.com/repos/benjamincaldwell/Website/commits/1bce253e7632d45b428be6d1e4b02e39a3d477de"}]},"public":true,"created_at":"2015-01-01T01:00:11Z"}
{"id":"2489395862","type":"PushEvent","actor":{"id":8770348,"login":"HouseMonitor","gravatar_id":"","url":"https://api.github.com/users/HouseMonitor","avatar_url":"https://avatars.githubusercontent.com/u/8770348?"},"repo":{"id":24030380,"name":"HouseMonitor/Logs2014-2015","url":"https://api.github.com/repos/HouseMonitor/Logs2014-2015"},"payload":{"push_id":536752177,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"a84a03375407c8616b1a105a052f5f29f8e43261","before":"68ebc9a7d6ad3a823361e4f3cebda44e42342fee","commits":[{"sha":"a84a03375407c8616b1a105a052f5f29f8e43261","author":{"email":"17e72c8f1b0781cefad8c299a70b47a752ed01a6@gmail.com","name":"Matej Drolc"},"message":"automated commit","distinct":true,"url":"https://api.github.com/repos/HouseMonitor/Logs2014-2015/commits/a84a03375407c8616b1a105a052f5f29f8e43261"}]},"public":true,"created_at":"2015-01-01T01:00:12Z"}
{"id":"2489395865","type":"CreateEvent","actor":{"id":3521359,"login":"ssomnoremac","gravatar_id":"","url":"https://api.github.com/users/ssomnoremac","avatar_url":"https://avatars.githubusercontent.com/u/3521359?"},"repo":{"id":28655796,"name":"ssomnoremac/mean","url":"https://api.github.com/repos/ssomnoremac/mean"},"payload":{"ref":"dev","ref_type":"branch","master_branch":"master","description":"MEAN.JS - Full-Stack JavaScript Using MongoDB, Express, AngularJS, and Node.js - ","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:00:12Z"}
{"id":"2489395866","type":"PushEvent","actor":{"id":9101573,"login":"megantmcginley","gravatar_id":"","url":"https://api.github.com/users/megantmcginley","avatar_url":"https://avatars.githubusercontent.com/u/9101573?"},"repo":{"id":25549968,"name":"megantmcginley/megantmcginley.github.io","url":"https://api.github.com/repos/megantmcginley/megantmcginley.github.io"},"payload":{"push_id":536752179,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e613a42ea94329f38b4f9994b48ccd4f845a5225","before":"0d1eeb608f9fbcc69047690dbb9019ac8217def7","commits":[{"sha":"e613a42ea94329f38b4f9994b48ccd4f845a5225","author":{"email":"92f56e51255edbb80c74150d0115560b34c2bc35@users.noreply.github.com","name":"megantmcginley"},"message":"Update projects.html","distinct":true,"url":"https://api.github.com/repos/megantmcginley/megantmcginley.github.io/commits/e613a42ea94329f38b4f9994b48ccd4f845a5225"}]},"public":true,"created_at":"2015-01-01T01:00:12Z"}
{"id":"2489395869","type":"WatchEvent","actor":{"id":4725234,"login":"xuhf","gravatar_id":"","url":"https://api.github.com/users/xuhf","avatar_url":"https://avatars.githubusercontent.com/u/4725234?"},"repo":{"id":10197269,"name":"xiaobozi/youku-lixian","url":"https://api.github.com/repos/xiaobozi/youku-lixian"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:00:12Z"}
{"id":"2489395875","type":"PushEvent","actor":{"id":2318343,"login":"treckstar","gravatar_id":"","url":"https://api.github.com/users/treckstar","avatar_url":"https://avatars.githubusercontent.com/u/2318343?"},"repo":{"id":17101123,"name":"treckstar/yolo-octo-hipster","url":"https://api.github.com/repos/treckstar/yolo-octo-hipster"},"payload":{"push_id":536752182,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e8d20aa6bc5d4da90d065848c17e0abd7ee1bc9b","before":"025bfa80305fd4f33670e6cfd1ced7e3dfcc5c94","commits":[{"sha":"e8d20aa6bc5d4da90d065848c17e0abd7ee1bc9b","author":{"email":"28cf8d5dd63a27bb1a047ac2fe7ded863d3bc56c@gmail.com","name":"treckstar"},"message":"Got the words that burn like fire in my mouth.","distinct":true,"url":"https://api.github.com/repos/treckstar/yolo-octo-hipster/commits/e8d20aa6bc5d4da90d065848c17e0abd7ee1bc9b"}]},"public":true,"created_at":"2015-01-01T01:00:13Z"}
{"id":"2489395882","type":"PullRequestReviewCommentEvent","actor":{"id":412280,"login":"kayone","gravatar_id":"","url":"https://api.github.com/users/kayone","avatar_url":"https://avatars.githubusercontent.com/u/412280?"},"repo":{"id":2565137,"name":"SynoCommunity/spksrc","url":"https://api.github.com/repos/SynoCommunity/spksrc"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/SynoCommunity/spksrc/pulls/comments/22397252","id":22397252,"diff_hunk":"@@ -0,0 +1,60 @@\n+SPK_NAME = nzbdrone","path":"spk/sonarr/Makefile","position":1,"original_position":1,"commit_id":"d7db1b629ab3e2894060967467f483fa936bf048","original_commit_id":"cc43ff5895bb3cd025dee598705e1a0404c8db6f","user":{"login":"kayone","id":412280,"avatar_url":"https://avatars.githubusercontent.com/u/412280?v=3","gravatar_id":"","url":"https://api.github.com/users/kayone","html_url":"https://github.com/kayone","followers_url":"https://api.github.com/users/kayone/followers","following_url":"https://api.github.com/users/kayone/following{/other_user}","gists_url":"https://api.github.com/users/kayone/gists{/gist_id}","starred_url":"https://api.github.com/users/kayone/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/kayone/subscriptions","organizations_url":"https://api.github.com/users/kayone/orgs","repos_url":"https://api.github.com/users/kayone/repos","events_url":"https://api.github.com/users/kayone/events{/privacy}","received_events_url":"https://api.github.com/users/kayone/received_events","type":"User","site_admin":false},"body":"makes sense,\r\nthanks, wasn't sure if we needed to maintain backwards 
compatibility.","created_at":"2015-01-01T01:00:13Z","updated_at":"2015-01-01T01:00:13Z","html_url":"https://github.com/SynoCommunity/spksrc/pull/1409#discussion_r22397252","pull_request_url":"https://api.github.com/repos/SynoCommunity/spksrc/pulls/1409","_links":{"self":{"href":"https://api.github.com/repos/SynoCommunity/spksrc/pulls/comments/22397252"},"html":{"href":"https://github.com/SynoCommunity/spksrc/pull/1409#discussion_r22397252"},"pull_request":{"href":"https://api.github.com/repos/SynoCommunity/spksrc/pulls/1409"}}},"pull_request":{"url":"https://api.github.com/repos/SynoCommunity/spksrc/pulls/1409","id":26606843,"html_url":"https://github.com/SynoCommunity/spksrc/pull/1409","diff_url":"https://github.com/SynoCommunity/spksrc/pull/1409.diff","patch_url":"https://github.com/SynoCommunity/spksrc/pull/1409.patch","issue_url":"https://api.github.com/repos/SynoCommunity/spksrc/issues/1409","number":1409,"state":"open","locked":false,"title":"NzbDrone to Sonarr + dependencies updated","user":{"login":"maxrogers","id":265707,"avatar_url":"https://avatars.githubusercontent.com/u/265707?v=3","gravatar_id":"","url":"https://api.github.com/users/maxrogers","html_url":"https://github.com/maxrogers","followers_url":"https://api.github.com/users/maxrogers/followers","following_url":"https://api.github.com/users/maxrogers/following{/other_user}","gists_url":"https://api.github.com/users/maxrogers/gists{/gist_id}","starred_url":"https://api.github.com/users/maxrogers/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/maxrogers/subscriptions","organizations_url":"https://api.github.com/users/maxrogers/orgs","repos_url":"https://api.github.com/users/maxrogers/repos","events_url":"https://api.github.com/users/maxrogers/events{/privacy}","received_events_url":"https://api.github.com/users/maxrogers/received_events","type":"User","site_admin":false},"body":"","created_at":"2014-12-26T21:05:05Z","updated_at":"2015-01-01T01:00:13Z","closed_at":null,"merg
ed_at":null,"merge_commit_sha":"673d66d273703a319d6a3b626e070cd37957f218","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/SynoCommunity/spksrc/pulls/1409/commits","review_comments_url":"https://api.github.com/repos/SynoCommunity/spksrc/pulls/1409/comments","review_comment_url":"https://api.github.com/repos/SynoCommunity/spksrc/pulls/comments/{number}","comments_url":"https://api.github.com/repos/SynoCommunity/spksrc/issues/1409/comments","statuses_url":"https://api.github.com/repos/SynoCommunity/spksrc/statuses/d7db1b629ab3e2894060967467f483fa936bf048","head":{"label":"maxrogers:sonarr","ref":"sonarr","sha":"d7db1b629ab3e2894060967467f483fa936bf048","user":{"login":"maxrogers","id":265707,"avatar_url":"https://avatars.githubusercontent.com/u/265707?v=3","gravatar_id":"","url":"https://api.github.com/users/maxrogers","html_url":"https://github.com/maxrogers","followers_url":"https://api.github.com/users/maxrogers/followers","following_url":"https://api.github.com/users/maxrogers/following{/other_user}","gists_url":"https://api.github.com/users/maxrogers/gists{/gist_id}","starred_url":"https://api.github.com/users/maxrogers/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/maxrogers/subscriptions","organizations_url":"https://api.github.com/users/maxrogers/orgs","repos_url":"https://api.github.com/users/maxrogers/repos","events_url":"https://api.github.com/users/maxrogers/events{/privacy}","received_events_url":"https://api.github.com/users/maxrogers/received_events","type":"User","site_admin":false},"repo":{"id":28520597,"name":"spksrc","full_name":"maxrogers/spksrc","owner":{"login":"maxrogers","id":265707,"avatar_url":"https://avatars.githubusercontent.com/u/265707?v=3","gravatar_id":"","url":"https://api.github.com/users/maxrogers","html_url":"https://github.com/maxrogers","followers_url":"https://api.github.com/users/maxrogers/followers","following_url":"https://api.github.com/users/maxrogers/following{/other_u
ser}","gists_url":"https://api.github.com/users/maxrogers/gists{/gist_id}","starred_url":"https://api.github.com/users/maxrogers/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/maxrogers/subscriptions","organizations_url":"https://api.github.com/users/maxrogers/orgs","repos_url":"https://api.github.com/users/maxrogers/repos","events_url":"https://api.github.com/users/maxrogers/events{/privacy}","received_events_url":"https://api.github.com/users/maxrogers/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/maxrogers/spksrc","description":"Cross compilation framework to create native packages for the Synology's NAS","fork":true,"url":"https://api.github.com/repos/maxrogers/spksrc","forks_url":"https://api.github.com/repos/maxrogers/spksrc/forks","keys_url":"https://api.github.com/repos/maxrogers/spksrc/keys{/key_id}","collaborators_url":"https://api.github.com/repos/maxrogers/spksrc/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/maxrogers/spksrc/teams","hooks_url":"https://api.github.com/repos/maxrogers/spksrc/hooks","issue_events_url":"https://api.github.com/repos/maxrogers/spksrc/issues/events{/number}","events_url":"https://api.github.com/repos/maxrogers/spksrc/events","assignees_url":"https://api.github.com/repos/maxrogers/spksrc/assignees{/user}","branches_url":"https://api.github.com/repos/maxrogers/spksrc/branches{/branch}","tags_url":"https://api.github.com/repos/maxrogers/spksrc/tags","blobs_url":"https://api.github.com/repos/maxrogers/spksrc/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/maxrogers/spksrc/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/maxrogers/spksrc/git/refs{/sha}","trees_url":"https://api.github.com/repos/maxrogers/spksrc/git/trees{/sha}","statuses_url":"https://api.github.com/repos/maxrogers/spksrc/statuses/{sha}","languages_url":"https://api.github.com/repos/maxrogers/spksrc/languages","stargazers_url":"https://a
pi.github.com/repos/maxrogers/spksrc/stargazers","contributors_url":"https://api.github.com/repos/maxrogers/spksrc/contributors","subscribers_url":"https://api.github.com/repos/maxrogers/spksrc/subscribers","subscription_url":"https://api.github.com/repos/maxrogers/spksrc/subscription","commits_url":"https://api.github.com/repos/maxrogers/spksrc/commits{/sha}","git_commits_url":"https://api.github.com/repos/maxrogers/spksrc/git/commits{/sha}","comments_url":"https://api.github.com/repos/maxrogers/spksrc/comments{/number}","issue_comment_url":"https://api.github.com/repos/maxrogers/spksrc/issues/comments/{number}","contents_url":"https://api.github.com/repos/maxrogers/spksrc/contents/{+path}","compare_url":"https://api.github.com/repos/maxrogers/spksrc/compare/{base}...{head}","merges_url":"https://api.github.com/repos/maxrogers/spksrc/merges","archive_url":"https://api.github.com/repos/maxrogers/spksrc/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/maxrogers/spksrc/downloads","issues_url":"https://api.github.com/repos/maxrogers/spksrc/issues{/number}","pulls_url":"https://api.github.com/repos/maxrogers/spksrc/pulls{/number}","milestones_url":"https://api.github.com/repos/maxrogers/spksrc/milestones{/number}","notifications_url":"https://api.github.com/repos/maxrogers/spksrc/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/maxrogers/spksrc/labels{/name}","releases_url":"https://api.github.com/repos/maxrogers/spksrc/releases{/id}","created_at":"2014-12-26T20:36:05Z","updated_at":"2014-12-26T20:36:07Z","pushed_at":"2014-12-31T22:30:08Z","git_url":"git://github.com/maxrogers/spksrc.git","ssh_url":"git@github.com:maxrogers/spksrc.git","clone_url":"https://github.com/maxrogers/spksrc.git","svn_url":"https://github.com/maxrogers/spksrc","homepage":"https://github.com/SynoCommunity/spksrc","size":6160,"stargazers_count":0,"watchers_count":0,"language":"Makefile","has_issues":false,"has_downloads":true,"has_wiki":true
,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"develop"}},"base":{"label":"SynoCommunity:develop","ref":"develop","sha":"9e6205a91eb2c59cccbe8d1d479065b07727f061","user":{"login":"SynoCommunity","id":1123581,"avatar_url":"https://avatars.githubusercontent.com/u/1123581?v=3","gravatar_id":"","url":"https://api.github.com/users/SynoCommunity","html_url":"https://github.com/SynoCommunity","followers_url":"https://api.github.com/users/SynoCommunity/followers","following_url":"https://api.github.com/users/SynoCommunity/following{/other_user}","gists_url":"https://api.github.com/users/SynoCommunity/gists{/gist_id}","starred_url":"https://api.github.com/users/SynoCommunity/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/SynoCommunity/subscriptions","organizations_url":"https://api.github.com/users/SynoCommunity/orgs","repos_url":"https://api.github.com/users/SynoCommunity/repos","events_url":"https://api.github.com/users/SynoCommunity/events{/privacy}","received_events_url":"https://api.github.com/users/SynoCommunity/received_events","type":"Organization","site_admin":false},"repo":{"id":2565137,"name":"spksrc","full_name":"SynoCommunity/spksrc","owner":{"login":"SynoCommunity","id":1123581,"avatar_url":"https://avatars.githubusercontent.com/u/1123581?v=3","gravatar_id":"","url":"https://api.github.com/users/SynoCommunity","html_url":"https://github.com/SynoCommunity","followers_url":"https://api.github.com/users/SynoCommunity/followers","following_url":"https://api.github.com/users/SynoCommunity/following{/other_user}","gists_url":"https://api.github.com/users/SynoCommunity/gists{/gist_id}","starred_url":"https://api.github.com/users/SynoCommunity/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/SynoCommunity/subscriptions","organizations_url":"https://api.github.com/users/SynoCommunity/orgs","repos_url":"https://api.github.com/users/Syno
Community/repos","events_url":"https://api.github.com/users/SynoCommunity/events{/privacy}","received_events_url":"https://api.github.com/users/SynoCommunity/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/SynoCommunity/spksrc","description":"Cross compilation framework to create native packages for the Synology's NAS","fork":false,"url":"https://api.github.com/repos/SynoCommunity/spksrc","forks_url":"https://api.github.com/repos/SynoCommunity/spksrc/forks","keys_url":"https://api.github.com/repos/SynoCommunity/spksrc/keys{/key_id}","collaborators_url":"https://api.github.com/repos/SynoCommunity/spksrc/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/SynoCommunity/spksrc/teams","hooks_url":"https://api.github.com/repos/SynoCommunity/spksrc/hooks","issue_events_url":"https://api.github.com/repos/SynoCommunity/spksrc/issues/events{/number}","events_url":"https://api.github.com/repos/SynoCommunity/spksrc/events","assignees_url":"https://api.github.com/repos/SynoCommunity/spksrc/assignees{/user}","branches_url":"https://api.github.com/repos/SynoCommunity/spksrc/branches{/branch}","tags_url":"https://api.github.com/repos/SynoCommunity/spksrc/tags","blobs_url":"https://api.github.com/repos/SynoCommunity/spksrc/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/SynoCommunity/spksrc/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/SynoCommunity/spksrc/git/refs{/sha}","trees_url":"https://api.github.com/repos/SynoCommunity/spksrc/git/trees{/sha}","statuses_url":"https://api.github.com/repos/SynoCommunity/spksrc/statuses/{sha}","languages_url":"https://api.github.com/repos/SynoCommunity/spksrc/languages","stargazers_url":"https://api.github.com/repos/SynoCommunity/spksrc/stargazers","contributors_url":"https://api.github.com/repos/SynoCommunity/spksrc/contributors","subscribers_url":"https://api.github.com/repos/SynoCommunity/spksrc/subscribers","subscription_url":"https://
api.github.com/repos/SynoCommunity/spksrc/subscription","commits_url":"https://api.github.com/repos/SynoCommunity/spksrc/commits{/sha}","git_commits_url":"https://api.github.com/repos/SynoCommunity/spksrc/git/commits{/sha}","comments_url":"https://api.github.com/repos/SynoCommunity/spksrc/comments{/number}","issue_comment_url":"https://api.github.com/repos/SynoCommunity/spksrc/issues/comments/{number}","contents_url":"https://api.github.com/repos/SynoCommunity/spksrc/contents/{+path}","compare_url":"https://api.github.com/repos/SynoCommunity/spksrc/compare/{base}...{head}","merges_url":"https://api.github.com/repos/SynoCommunity/spksrc/merges","archive_url":"https://api.github.com/repos/SynoCommunity/spksrc/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/SynoCommunity/spksrc/downloads","issues_url":"https://api.github.com/repos/SynoCommunity/spksrc/issues{/number}","pulls_url":"https://api.github.com/repos/SynoCommunity/spksrc/pulls{/number}","milestones_url":"https://api.github.com/repos/SynoCommunity/spksrc/milestones{/number}","notifications_url":"https://api.github.com/repos/SynoCommunity/spksrc/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/SynoCommunity/spksrc/labels{/name}","releases_url":"https://api.github.com/repos/SynoCommunity/spksrc/releases{/id}","created_at":"2011-10-12T20:25:50Z","updated_at":"2014-12-31T13:44:45Z","pushed_at":"2014-12-31T11:23:04Z","git_url":"git://github.com/SynoCommunity/spksrc.git","ssh_url":"git@github.com:SynoCommunity/spksrc.git","clone_url":"https://github.com/SynoCommunity/spksrc.git","svn_url":"https://github.com/SynoCommunity/spksrc","homepage":"https://github.com/SynoCommunity/spksrc","size":30572,"stargazers_count":617,"watchers_count":617,"language":"Makefile","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":294,"mirror_url":null,"open_issues_count":229,"forks":294,"open_issues":229,"watchers":617,"default_branch":"develop"}
},"_links":{"self":{"href":"https://api.github.com/repos/SynoCommunity/spksrc/pulls/1409"},"html":{"href":"https://github.com/SynoCommunity/spksrc/pull/1409"},"issue":{"href":"https://api.github.com/repos/SynoCommunity/spksrc/issues/1409"},"comments":{"href":"https://api.github.com/repos/SynoCommunity/spksrc/issues/1409/comments"},"review_comments":{"href":"https://api.github.com/repos/SynoCommunity/spksrc/pulls/1409/comments"},"review_comment":{"href":"https://api.github.com/repos/SynoCommunity/spksrc/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/SynoCommunity/spksrc/pulls/1409/commits"},"statuses":{"href":"https://api.github.com/repos/SynoCommunity/spksrc/statuses/d7db1b629ab3e2894060967467f483fa936bf048"}}}},"public":true,"created_at":"2015-01-01T01:00:13Z","org":{"id":1123581,"login":"SynoCommunity","gravatar_id":"","url":"https://api.github.com/orgs/SynoCommunity","avatar_url":"https://avatars.githubusercontent.com/u/1123581?"}}
{"id":"2489395883","type":"PushEvent","actor":{"id":4102215,"login":"d3stats","gravatar_id":"","url":"https://api.github.com/users/d3stats","avatar_url":"https://avatars.githubusercontent.com/u/4102215?"},"repo":{"id":9317463,"name":"d3stats/d3.fuzz.me.uk","url":"https://api.github.com/repos/d3stats/d3.fuzz.me.uk"},"payload":{"push_id":536752185,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"87f4b08c009c2cecc8f8411f48be921f9f5ab4f8","before":"09f4bcab487b3cf4bb8101c28fde4ddb4326b95c","commits":[{"sha":"87f4b08c009c2cecc8f8411f48be921f9f5ab4f8","author":{"email":"4f26aeafdb2367620a393c973eddbe8f8b846ebd@fuzz.me.uk","name":"d3stats"},"message":"scheduled update","distinct":true,"url":"https://api.github.com/repos/d3stats/d3.fuzz.me.uk/commits/87f4b08c009c2cecc8f8411f48be921f9f5ab4f8"}]},"public":true,"created_at":"2015-01-01T01:00:13Z"}
{"id":"2489395884","type":"PushEvent","actor":{"id":3160808,"login":"trustedsec","gravatar_id":"","url":"https://api.github.com/users/trustedsec","avatar_url":"https://avatars.githubusercontent.com/u/3160808?"},"repo":{"id":7391261,"name":"trustedsec/social-engineer-toolkit","url":"https://api.github.com/repos/trustedsec/social-engineer-toolkit"},"payload":{"push_id":536752186,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"8f07649e93f94728dd876e7bcbd3cef21e8add69","before":"981c2c1a0fbea08bf5555725afa8e1b2d6d6fe2e","commits":[{"sha":"8f07649e93f94728dd876e7bcbd3cef21e8add69","author":{"email":"863b5d643be6fa3d7c1bad8d1f065e00f75dc0c2@trustedsec.com","name":"trustedsec"},"message":"Updated Java Applet with obfuscation.","distinct":true,"url":"https://api.github.com/repos/trustedsec/social-engineer-toolkit/commits/8f07649e93f94728dd876e7bcbd3cef21e8add69"}]},"public":true,"created_at":"2015-01-01T01:00:14Z"}
{"id":"2489395885","type":"WatchEvent","actor":{"id":489911,"login":"vasanthela","gravatar_id":"","url":"https://api.github.com/users/vasanthela","avatar_url":"https://avatars.githubusercontent.com/u/489911?"},"repo":{"id":27021112,"name":"sorentwo/readthis","url":"https://api.github.com/repos/sorentwo/readthis"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:00:16Z"}
{"id":"2489395886","type":"IssuesEvent","actor":{"id":1414603,"login":"zoldello","gravatar_id":"","url":"https://api.github.com/users/zoldello","avatar_url":"https://avatars.githubusercontent.com/u/1414603?"},"repo":{"id":26617214,"name":"ChicagoVeg/restaurantList","url":"https://api.github.com/repos/ChicagoVeg/restaurantList"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/ChicagoVeg/restaurantList/issues/9","labels_url":"https://api.github.com/repos/ChicagoVeg/restaurantList/issues/9/labels{/name}","comments_url":"https://api.github.com/repos/ChicagoVeg/restaurantList/issues/9/comments","events_url":"https://api.github.com/repos/ChicagoVeg/restaurantList/issues/9/events","html_url":"https://github.com/ChicagoVeg/restaurantList/issues/9","id":53210171,"number":9,"title":"When I filter out restaurants by type, the removed restaurant pins remain in the map","user":{"login":"zoldello","id":1414603,"avatar_url":"https://avatars.githubusercontent.com/u/1414603?v=3","gravatar_id":"","url":"https://api.github.com/users/zoldello","html_url":"https://github.com/zoldello","followers_url":"https://api.github.com/users/zoldello/followers","following_url":"https://api.github.com/users/zoldello/following{/other_user}","gists_url":"https://api.github.com/users/zoldello/gists{/gist_id}","starred_url":"https://api.github.com/users/zoldello/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/zoldello/subscriptions","organizations_url":"https://api.github.com/users/zoldello/orgs","repos_url":"https://api.github.com/users/zoldello/repos","events_url":"https://api.github.com/users/zoldello/events{/privacy}","received_events_url":"https://api.github.com/users/zoldello/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/ChicagoVeg/restaurantList/labels/bug","name":"bug","color":"fc2929"},{"url":"https://api.github.com/repos/ChicagoVeg/restaurantList/labels/Great+to+Have","name":"Great to 
Have","color":"f7c6c7"}],"state":"open","locked":false,"assignee":{"login":"zoldello","id":1414603,"avatar_url":"https://avatars.githubusercontent.com/u/1414603?v=3","gravatar_id":"","url":"https://api.github.com/users/zoldello","html_url":"https://github.com/zoldello","followers_url":"https://api.github.com/users/zoldello/followers","following_url":"https://api.github.com/users/zoldello/following{/other_user}","gists_url":"https://api.github.com/users/zoldello/gists{/gist_id}","starred_url":"https://api.github.com/users/zoldello/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/zoldello/subscriptions","organizations_url":"https://api.github.com/users/zoldello/orgs","repos_url":"https://api.github.com/users/zoldello/repos","events_url":"https://api.github.com/users/zoldello/events{/privacy}","received_events_url":"https://api.github.com/users/zoldello/received_events","type":"User","site_admin":false},"milestone":{"url":"https://api.github.com/repos/ChicagoVeg/restaurantList/milestones/3","labels_url":"https://api.github.com/repos/ChicagoVeg/restaurantList/milestones/3/labels","id":894444,"number":3,"title":"Release 
1","description":"","creator":{"login":"vadim424","id":10101875,"avatar_url":"https://avatars.githubusercontent.com/u/10101875?v=3","gravatar_id":"","url":"https://api.github.com/users/vadim424","html_url":"https://github.com/vadim424","followers_url":"https://api.github.com/users/vadim424/followers","following_url":"https://api.github.com/users/vadim424/following{/other_user}","gists_url":"https://api.github.com/users/vadim424/gists{/gist_id}","starred_url":"https://api.github.com/users/vadim424/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/vadim424/subscriptions","organizations_url":"https://api.github.com/users/vadim424/orgs","repos_url":"https://api.github.com/users/vadim424/repos","events_url":"https://api.github.com/users/vadim424/events{/privacy}","received_events_url":"https://api.github.com/users/vadim424/received_events","type":"User","site_admin":false},"open_issues":3,"closed_issues":4,"state":"open","created_at":"2014-12-07T00:34:16Z","updated_at":"2015-01-01T01:00:14Z","due_on":"2014-12-14T06:00:00Z","closed_at":null},"comments":0,"created_at":"2015-01-01T01:00:14Z","updated_at":"2015-01-01T01:00:14Z","closed_at":null,"body":""}},"public":true,"created_at":"2015-01-01T01:00:16Z","org":{"id":9426295,"login":"ChicagoVeg","gravatar_id":"","url":"https://api.github.com/orgs/ChicagoVeg","avatar_url":"https://avatars.githubusercontent.com/u/9426295?"}}
{"id":"2489395891","type":"WatchEvent","actor":{"id":3514976,"login":"trupin","gravatar_id":"","url":"https://api.github.com/users/trupin","avatar_url":"https://avatars.githubusercontent.com/u/3514976?"},"repo":{"id":2544305,"name":"tomakehurst/wiremock","url":"https://api.github.com/repos/tomakehurst/wiremock"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:00:16Z"}
{"id":"2489395900","type":"PushEvent","actor":{"id":2101973,"login":"konjac","gravatar_id":"","url":"https://api.github.com/users/konjac","avatar_url":"https://avatars.githubusercontent.com/u/2101973?"},"repo":{"id":24664906,"name":"konjac/calendars","url":"https://api.github.com/repos/konjac/calendars"},"payload":{"push_id":536752192,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"e0cebd9186ac0e326934d5fa27e8d350c4b1cf87","before":"ef7f231d67bd83d9569d1c34fe99fba72e961c19","commits":[{"sha":"e0cebd9186ac0e326934d5fa27e8d350c4b1cf87","author":{"email":"6dc96bd73a12a2b22abd88d2fca39328a25102c5@gmail.com","name":"konjac"},"message":"update","distinct":true,"url":"https://api.github.com/repos/konjac/calendars/commits/e0cebd9186ac0e326934d5fa27e8d350c4b1cf87"}]},"public":true,"created_at":"2015-01-01T01:00:16Z"}
{"id":"2489395899","type":"PushEvent","actor":{"id":739159,"login":"lessthanoptimal","gravatar_id":"","url":"https://api.github.com/users/lessthanoptimal","avatar_url":"https://avatars.githubusercontent.com/u/739159?"},"repo":{"id":28421901,"name":"lessthanoptimal/bow","url":"https://api.github.com/repos/lessthanoptimal/bow"},"payload":{"push_id":536752193,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"05bf0882abaf590379176a0c0093d0cc49d8390e","before":"40e23734127f500478caeb3071ea184752fa99c3","commits":[{"sha":"c10a64918fb1deb7edd5c8d9ed7f31bb715ccb1e","author":{"email":"d4f7bed66133e57602ad989e685eeed7b4535dfc@gmail.com","name":"Peter Abeles"},"message":"- Octave code is more mature","distinct":true,"url":"https://api.github.com/repos/lessthanoptimal/bow/commits/c10a64918fb1deb7edd5c8d9ed7f31bb715ccb1e"},{"sha":"05bf0882abaf590379176a0c0093d0cc49d8390e","author":{"email":"d4f7bed66133e57602ad989e685eeed7b4535dfc@gmail.com","name":"Peter Abeles"},"message":"- renamed src to python","distinct":true,"url":"https://api.github.com/repos/lessthanoptimal/bow/commits/05bf0882abaf590379176a0c0093d0cc49d8390e"}]},"public":true,"created_at":"2015-01-01T01:00:16Z"}
{"id":"2489395903","type":"PushEvent","actor":{"id":1396247,"login":"hemstreet","gravatar_id":"","url":"https://api.github.com/users/hemstreet","avatar_url":"https://avatars.githubusercontent.com/u/1396247?"},"repo":{"id":18146818,"name":"Handbid/Handbid-WordPress","url":"https://api.github.com/repos/Handbid/Handbid-WordPress"},"payload":{"push_id":536752194,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"7c3d9244dd7646d85e8028493125e6306bf32070","before":"52a447d2c80786cd9c1ef7d9e861562ced30e4d9","commits":[{"sha":"7c3d9244dd7646d85e8028493125e6306bf32070","author":{"email":"5e0a51686c7b5ffc310cf0f73a7ea38c001a4814@gmail.com","name":"Hemstreet"},"message":"receipt markup","distinct":true,"url":"https://api.github.com/repos/Handbid/Handbid-WordPress/commits/7c3d9244dd7646d85e8028493125e6306bf32070"}]},"public":true,"created_at":"2015-01-01T01:00:16Z","org":{"id":7072597,"login":"Handbid","gravatar_id":"","url":"https://api.github.com/orgs/Handbid","avatar_url":"https://avatars.githubusercontent.com/u/7072597?"}}
{"id":"2489395904","type":"PushEvent","actor":{"id":5684907,"login":"martin-williams","gravatar_id":"","url":"https://api.github.com/users/martin-williams","avatar_url":"https://avatars.githubusercontent.com/u/5684907?"},"repo":{"id":25208939,"name":"martin-williams/tpp_imdb","url":"https://api.github.com/repos/martin-williams/tpp_imdb"},"payload":{"push_id":536752195,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"317709a0e7b17b5eea34d28a6623e90d8d693304","before":"ad1a720f71ec001edefc3f743f83b1fe2917c0db","commits":[{"sha":"317709a0e7b17b5eea34d28a6623e90d8d693304","author":{"email":"c9a2ee53052a131cbb42f619416968acbd6ad458@beardon.com","name":"Martin Williams"},"message":"more adjustments to pageant search page","distinct":true,"url":"https://api.github.com/repos/martin-williams/tpp_imdb/commits/317709a0e7b17b5eea34d28a6623e90d8d693304"}]},"public":true,"created_at":"2015-01-01T01:00:16Z"}
{"id":"2489395905","type":"PushEvent","actor":{"id":8882603,"login":"pinaet","gravatar_id":"","url":"https://api.github.com/users/pinaet","avatar_url":"https://avatars.githubusercontent.com/u/8882603?"},"repo":{"id":24382269,"name":"pinaet/pinaet.github.io","url":"https://api.github.com/repos/pinaet/pinaet.github.io"},"payload":{"push_id":536752196,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"cfd66e5e7aa225813d3fb60231142d47533bad02","before":"be40427e7b0488333d4658aad8c763591b77e794","commits":[{"sha":"cfd66e5e7aa225813d3fb60231142d47533bad02","author":{"email":"8207655137af68a9e81af8e7a2b0dcaa36726d43@gmail.com","name":"Pinaet"},"message":"modified facebook plugin 3","distinct":true,"url":"https://api.github.com/repos/pinaet/pinaet.github.io/commits/cfd66e5e7aa225813d3fb60231142d47533bad02"}]},"public":true,"created_at":"2015-01-01T01:00:16Z"}
{"id":"2489395906","type":"PushEvent","actor":{"id":8077771,"login":"camsc","gravatar_id":"","url":"https://api.github.com/users/camsc","avatar_url":"https://avatars.githubusercontent.com/u/8077771?"},"repo":{"id":22777322,"name":"camsc/camsc.github.io","url":"https://api.github.com/repos/camsc/camsc.github.io"},"payload":{"push_id":536752197,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"22e97dea8206b1c5f2e0d5b058f9fb887462a887","before":"4b6c8016628865488fb78d8dbbfc93d057999ef4","commits":[{"sha":"22e97dea8206b1c5f2e0d5b058f9fb887462a887","author":{"email":"1d572acbfa68c7c6e541c7b840d6b622e5c0dc91@khanacademy.org","name":"Cam"},"message":"small update","distinct":true,"url":"https://api.github.com/repos/camsc/camsc.github.io/commits/22e97dea8206b1c5f2e0d5b058f9fb887462a887"}]},"public":true,"created_at":"2015-01-01T01:00:16Z"}
{"id":"2489395909","type":"PushEvent","actor":{"id":6267945,"login":"lakotadlustig","gravatar_id":"","url":"https://api.github.com/users/lakotadlustig","avatar_url":"https://avatars.githubusercontent.com/u/6267945?"},"repo":{"id":28615365,"name":"korlabs/tippr","url":"https://api.github.com/repos/korlabs/tippr"},"payload":{"push_id":536752200,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"010ba4d2a839b14d435b0d2c2ea75a861cab3e5d","before":"a306207249b2eaceb9668541e8dcb159dcf33c3f","commits":[{"sha":"010ba4d2a839b14d435b0d2c2ea75a861cab3e5d","author":{"email":"3280e741e838010abad30f9c64878ae2d3f3e766@podbe.at","name":"Lakota Lustig"},"message":"Update app.php","distinct":true,"url":"https://api.github.com/repos/korlabs/tippr/commits/010ba4d2a839b14d435b0d2c2ea75a861cab3e5d"}]},"public":true,"created_at":"2015-01-01T01:00:16Z","org":{"id":7786022,"login":"korlabs","gravatar_id":"","url":"https://api.github.com/orgs/korlabs","avatar_url":"https://avatars.githubusercontent.com/u/7786022?"}}
{"id":"2489395912","type":"WatchEvent","actor":{"id":681965,"login":"wonbyte","gravatar_id":"","url":"https://api.github.com/users/wonbyte","avatar_url":"https://avatars.githubusercontent.com/u/681965?"},"repo":{"id":2386778,"name":"idris-lang/Idris-dev","url":"https://api.github.com/repos/idris-lang/Idris-dev"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:00:17Z","org":{"id":5552910,"login":"idris-lang","gravatar_id":"","url":"https://api.github.com/orgs/idris-lang","avatar_url":"https://avatars.githubusercontent.com/u/5552910?"}}
{"id":"2489395917","type":"PushEvent","actor":{"id":10161953,"login":"vanceavalon","gravatar_id":"","url":"https://api.github.com/users/vanceavalon","avatar_url":"https://avatars.githubusercontent.com/u/10161953?"},"repo":{"id":28676586,"name":"vanceavalon/cassandra","url":"https://api.github.com/repos/vanceavalon/cassandra"},"payload":{"push_id":536752202,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"474fbd83268b21d63b61739e30e95c58e7121b3c","before":"3724660f44fe83771180e377e88f6bdcc23d7053","commits":[{"sha":"474fbd83268b21d63b61739e30e95c58e7121b3c","author":{"email":"eb40dd603b6777633aefcd015011472550a9e731@gmail.com","name":"vanceavalon"},"message":"Update variable SEEDS\n\nUpdate variable SEEDS get to /services/db/cassandra/node1","distinct":true,"url":"https://api.github.com/repos/vanceavalon/cassandra/commits/474fbd83268b21d63b61739e30e95c58e7121b3c"}]},"public":true,"created_at":"2015-01-01T01:00:17Z"}
{"id":"2489395919","type":"CreateEvent","actor":{"id":10081364,"login":"celiaks","gravatar_id":"","url":"https://api.github.com/users/celiaks","avatar_url":"https://avatars.githubusercontent.com/u/10081364?"},"repo":{"id":28678214,"name":"celiaks/formcheckerSL","url":"https://api.github.com/repos/celiaks/formcheckerSL"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"form checker plugin for jquery","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:00:17Z"}
{"id":"2489395921","type":"ForkEvent","actor":{"id":1402662,"login":"jamcar23","gravatar_id":"","url":"https://api.github.com/users/jamcar23","avatar_url":"https://avatars.githubusercontent.com/u/1402662?"},"repo":{"id":2990192,"name":"WhisperSystems/TextSecure","url":"https://api.github.com/repos/WhisperSystems/TextSecure"},"payload":{"forkee":{"id":28678215,"name":"TextSecure","full_name":"jamcar23/TextSecure","owner":{"login":"jamcar23","id":1402662,"avatar_url":"https://avatars.githubusercontent.com/u/1402662?v=3","gravatar_id":"","url":"https://api.github.com/users/jamcar23","html_url":"https://github.com/jamcar23","followers_url":"https://api.github.com/users/jamcar23/followers","following_url":"https://api.github.com/users/jamcar23/following{/other_user}","gists_url":"https://api.github.com/users/jamcar23/gists{/gist_id}","starred_url":"https://api.github.com/users/jamcar23/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jamcar23/subscriptions","organizations_url":"https://api.github.com/users/jamcar23/orgs","repos_url":"https://api.github.com/users/jamcar23/repos","events_url":"https://api.github.com/users/jamcar23/events{/privacy}","received_events_url":"https://api.github.com/users/jamcar23/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/jamcar23/TextSecure","description":"A secure text messaging application for 
Android.","fork":true,"url":"https://api.github.com/repos/jamcar23/TextSecure","forks_url":"https://api.github.com/repos/jamcar23/TextSecure/forks","keys_url":"https://api.github.com/repos/jamcar23/TextSecure/keys{/key_id}","collaborators_url":"https://api.github.com/repos/jamcar23/TextSecure/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/jamcar23/TextSecure/teams","hooks_url":"https://api.github.com/repos/jamcar23/TextSecure/hooks","issue_events_url":"https://api.github.com/repos/jamcar23/TextSecure/issues/events{/number}","events_url":"https://api.github.com/repos/jamcar23/TextSecure/events","assignees_url":"https://api.github.com/repos/jamcar23/TextSecure/assignees{/user}","branches_url":"https://api.github.com/repos/jamcar23/TextSecure/branches{/branch}","tags_url":"https://api.github.com/repos/jamcar23/TextSecure/tags","blobs_url":"https://api.github.com/repos/jamcar23/TextSecure/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/jamcar23/TextSecure/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/jamcar23/TextSecure/git/refs{/sha}","trees_url":"https://api.github.com/repos/jamcar23/TextSecure/git/trees{/sha}","statuses_url":"https://api.github.com/repos/jamcar23/TextSecure/statuses/{sha}","languages_url":"https://api.github.com/repos/jamcar23/TextSecure/languages","stargazers_url":"https://api.github.com/repos/jamcar23/TextSecure/stargazers","contributors_url":"https://api.github.com/repos/jamcar23/TextSecure/contributors","subscribers_url":"https://api.github.com/repos/jamcar23/TextSecure/subscribers","subscription_url":"https://api.github.com/repos/jamcar23/TextSecure/subscription","commits_url":"https://api.github.com/repos/jamcar23/TextSecure/commits{/sha}","git_commits_url":"https://api.github.com/repos/jamcar23/TextSecure/git/commits{/sha}","comments_url":"https://api.github.com/repos/jamcar23/TextSecure/comments{/number}","issue_comment_url":"https://api.github.com/repos/jamcar23/TextSecure/issues/comments
/{number}","contents_url":"https://api.github.com/repos/jamcar23/TextSecure/contents/{+path}","compare_url":"https://api.github.com/repos/jamcar23/TextSecure/compare/{base}...{head}","merges_url":"https://api.github.com/repos/jamcar23/TextSecure/merges","archive_url":"https://api.github.com/repos/jamcar23/TextSecure/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/jamcar23/TextSecure/downloads","issues_url":"https://api.github.com/repos/jamcar23/TextSecure/issues{/number}","pulls_url":"https://api.github.com/repos/jamcar23/TextSecure/pulls{/number}","milestones_url":"https://api.github.com/repos/jamcar23/TextSecure/milestones{/number}","notifications_url":"https://api.github.com/repos/jamcar23/TextSecure/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/jamcar23/TextSecure/labels{/name}","releases_url":"https://api.github.com/repos/jamcar23/TextSecure/releases{/id}","created_at":"2015-01-01T01:00:17Z","updated_at":"2015-01-01T00:00:47Z","pushed_at":"2015-01-01T00:00:45Z","git_url":"git://github.com/jamcar23/TextSecure.git","ssh_url":"git@github.com:jamcar23/TextSecure.git","clone_url":"https://github.com/jamcar23/TextSecure.git","svn_url":"https://github.com/jamcar23/TextSecure","homepage":"","size":54519,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:00:18Z","org":{"id":702459,"login":"WhisperSystems","gravatar_id":"","url":"https://api.github.com/orgs/WhisperSystems","avatar_url":"https://avatars.githubusercontent.com/u/702459?"}}
{"id":"2489395933","type":"PushEvent","actor":{"id":1856621,"login":"InternetDevels","gravatar_id":"","url":"https://api.github.com/users/InternetDevels","avatar_url":"https://avatars.githubusercontent.com/u/1856621?"},"repo":{"id":20291263,"name":"InternetDevels/drupalcores","url":"https://api.github.com/repos/InternetDevels/drupalcores"},"payload":{"push_id":536752208,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"11b1d13135fd0d4a56a916b0a99468b9e50a3061","before":"dbb4ef6b7364169b3ef3433e6bb5579555e78353","commits":[{"sha":"11b1d13135fd0d4a56a916b0a99468b9e50a3061","author":{"email":"141a748f5c0795fdf68eaad85b65480c92abbe5f@internetdevels.com","name":"mula"},"message":"Update bump.","distinct":true,"url":"https://api.github.com/repos/InternetDevels/drupalcores/commits/11b1d13135fd0d4a56a916b0a99468b9e50a3061"}]},"public":true,"created_at":"2015-01-01T01:00:21Z"}
{"id":"2489395934","type":"PushEvent","actor":{"id":3196313,"login":"dpastoor","gravatar_id":"","url":"https://api.github.com/users/dpastoor","avatar_url":"https://avatars.githubusercontent.com/u/3196313?"},"repo":{"id":16302099,"name":"dpastoor/PKPDmisc","url":"https://api.github.com/repos/dpastoor/PKPDmisc"},"payload":{"push_id":536752210,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"81e56dd1160f5bbe8628cb61de33f4636e4588f0","before":"9e3b7585ba59c6f8e7c80cca0420d954164ff648","commits":[{"sha":"d705ff1bd6889fb2beb7483e203b3234d1ce62df","author":{"email":"5480d79f0d3b1ca7acc7421688b095f8d1e51564@gmail.com","name":"Devin Pastoor"},"message":"refactor, change api to give pauc as a range, fix bug in partial auc calculation where concentration and time points did not match","distinct":true,"url":"https://api.github.com/repos/dpastoor/PKPDmisc/commits/d705ff1bd6889fb2beb7483e203b3234d1ce62df"},{"sha":"81e56dd1160f5bbe8628cb61de33f4636e4588f0","author":{"email":"5480d79f0d3b1ca7acc7421688b095f8d1e51564@gmail.com","name":"Devin Pastoor"},"message":"partial AUC summarization functions","distinct":true,"url":"https://api.github.com/repos/dpastoor/PKPDmisc/commits/81e56dd1160f5bbe8628cb61de33f4636e4588f0"}]},"public":true,"created_at":"2015-01-01T01:00:21Z"}
{"id":"2489395935","type":"PushEvent","actor":{"id":50891,"login":"westurner","gravatar_id":"","url":"https://api.github.com/users/westurner","avatar_url":"https://avatars.githubusercontent.com/u/50891?"},"repo":{"id":23823526,"name":"wrdrd/docs","url":"https://api.github.com/repos/wrdrd/docs"},"payload":{"push_id":536752212,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"43ccb4fcce46afbf06307e1272e0fa8fb08558e3","before":"6929c4af15e4293d16bdc64edcd9568b30994dbe","commits":[{"sha":"43ccb4fcce46afbf06307e1272e0fa8fb08558e3","author":{"email":"dd516747aaff812d65b57b832bbf2900e5471cbc@wrd.nu","name":"Wes Turner"},"message":"Update documentation","distinct":true,"url":"https://api.github.com/repos/wrdrd/docs/commits/43ccb4fcce46afbf06307e1272e0fa8fb08558e3"}]},"public":true,"created_at":"2015-01-01T01:00:21Z","org":{"id":8705413,"login":"wrdrd","gravatar_id":"","url":"https://api.github.com/orgs/wrdrd","avatar_url":"https://avatars.githubusercontent.com/u/8705413?"}}
{"id":"2489395944","type":"PushEvent","actor":{"id":50891,"login":"westurner","gravatar_id":"","url":"https://api.github.com/users/westurner","avatar_url":"https://avatars.githubusercontent.com/u/50891?"},"repo":{"id":23823526,"name":"wrdrd/docs","url":"https://api.github.com/repos/wrdrd/docs"},"payload":{"push_id":536752217,"size":1,"distinct_size":1,"ref":"refs/heads/develop","head":"a55294c22ea1c069306bb13a2fd47ff3950e7b47","before":"e44784669180fe7c0c3014aa307b0df1722afa1a","commits":[{"sha":"a55294c22ea1c069306bb13a2fd47ff3950e7b47","author":{"email":"dd516747aaff812d65b57b832bbf2900e5471cbc@wrd.nu","name":"Wes Turner"},"message":"BLD: Add sphinxcontrib-srclinks https://github.com/westurner/sphinxcontrib-srclinks","distinct":true,"url":"https://api.github.com/repos/wrdrd/docs/commits/a55294c22ea1c069306bb13a2fd47ff3950e7b47"}]},"public":true,"created_at":"2015-01-01T01:00:21Z","org":{"id":8705413,"login":"wrdrd","gravatar_id":"","url":"https://api.github.com/orgs/wrdrd","avatar_url":"https://avatars.githubusercontent.com/u/8705413?"}}
{"id":"2489395950","type":"CreateEvent","actor":{"id":10263666,"login":"katiekroik","gravatar_id":"","url":"https://api.github.com/users/katiekroik","avatar_url":"https://avatars.githubusercontent.com/u/10263666?"},"repo":{"id":28677679,"name":"jl4282/swirlwebsite","url":"https://api.github.com/repos/jl4282/swirlwebsite"},"payload":{"ref":"Develop","ref_type":"branch","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:00:21Z"}
{"id":"2489395958","type":"PushEvent","actor":{"id":7387879,"login":"dsm-git","gravatar_id":"","url":"https://api.github.com/users/dsm-git","avatar_url":"https://avatars.githubusercontent.com/u/7387879?"},"repo":{"id":28354666,"name":"Door43/d43-ar-x-dcv","url":"https://api.github.com/repos/Door43/d43-ar-x-dcv"},"payload":{"push_id":536752224,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"6158b50e1a2b200c5efba979f08248b153ced502","before":"6e5fca555cca6b3531b17347936d26dc7ddc89e4","commits":[{"sha":"6158b50e1a2b200c5efba979f08248b153ced502","author":{"email":"62eb0db178518a8376b23676c2639eb2732c0be8@us.door43.org","name":"Apache"},"message":"Page Edit [39]:  [EricWatt]","distinct":true,"url":"https://api.github.com/repos/Door43/d43-ar-x-dcv/commits/6158b50e1a2b200c5efba979f08248b153ced502"}]},"public":true,"created_at":"2015-01-01T01:00:22Z","org":{"id":4982125,"login":"Door43","gravatar_id":"","url":"https://api.github.com/orgs/Door43","avatar_url":"https://avatars.githubusercontent.com/u/4982125?"}}
{"id":"2489395959","type":"PushEvent","actor":{"id":4083697,"login":"benkrikler","gravatar_id":"","url":"https://api.github.com/users/benkrikler","avatar_url":"https://avatars.githubusercontent.com/u/4083697?"},"repo":{"id":20542797,"name":"alcap-org/alcap-org.github.io","url":"https://api.github.com/repos/alcap-org/alcap-org.github.io"},"payload":{"push_id":536752225,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"7a97c7e4c1ebbc0e9fb204be5c2d8f29588c081a","before":"67705976f15e45db781567aa3533c147042b380b","commits":[{"sha":"7a97c7e4c1ebbc0e9fb204be5c2d8f29588c081a","author":{"email":"a7d7c4a65fd9795221a11ba0ae55ee302ba5e64d@googlemail.com","name":"benkrikler"},"message":"Automatically regenerated doxygen documentation for branch 'master' of 'g4sim' on Thu Jan  1 01:00:01 GMT 2015","distinct":true,"url":"https://api.github.com/repos/alcap-org/alcap-org.github.io/commits/7a97c7e4c1ebbc0e9fb204be5c2d8f29588c081a"}]},"public":true,"created_at":"2015-01-01T01:00:22Z","org":{"id":7251877,"login":"alcap-org","gravatar_id":"","url":"https://api.github.com/orgs/alcap-org","avatar_url":"https://avatars.githubusercontent.com/u/7251877?"}}
{"id":"2489395962","type":"CreateEvent","actor":{"id":16432,"login":"tardate","gravatar_id":"","url":"https://api.github.com/users/tardate","avatar_url":"https://avatars.githubusercontent.com/u/16432?"},"repo":{"id":28238617,"name":"tardate/visual555","url":"https://api.github.com/repos/tardate/visual555"},"payload":{"ref":"1.0.1","ref_type":"tag","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:00:23Z"}
{"id":"2489395967","type":"PushEvent","actor":{"id":5314189,"login":"panpawn","gravatar_id":"","url":"https://api.github.com/users/panpawn","avatar_url":"https://avatars.githubusercontent.com/u/5314189?"},"repo":{"id":12385273,"name":"panpawn/Pokemon-Showdown","url":"https://api.github.com/repos/panpawn/Pokemon-Showdown"},"payload":{"push_id":536752228,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"a8f530712351c080960f0ff0ed94bc68b3e3a760","before":"a1301b53905292c61da4352a0acbe5145edbb32b","commits":[{"sha":"a8f530712351c080960f0ff0ed94bc68b3e3a760","author":{"email":"cf2a241a02ff3bf0bd910964e03ee01c59e44ac0@gmail.com","name":"panpawn"},"message":"add AbidE","distinct":true,"url":"https://api.github.com/repos/panpawn/Pokemon-Showdown/commits/a8f530712351c080960f0ff0ed94bc68b3e3a760"}]},"public":true,"created_at":"2015-01-01T01:00:23Z"}
{"id":"2489395974","type":"CreateEvent","actor":{"id":1640798,"login":"langorn","gravatar_id":"","url":"https://api.github.com/users/langorn","avatar_url":"https://avatars.githubusercontent.com/u/1640798?"},"repo":{"id":28678190,"name":"langorn/crm","url":"https://api.github.com/repos/langorn/crm"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"a crm for content management","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:00:24Z"}
{"id":"2489395980","type":"PushEvent","actor":{"id":4153853,"login":"jlumijarvi","gravatar_id":"","url":"https://api.github.com/users/jlumijarvi","avatar_url":"https://avatars.githubusercontent.com/u/4153853?"},"repo":{"id":28678176,"name":"jlumijarvi/csv2xml","url":"https://api.github.com/repos/jlumijarvi/csv2xml"},"payload":{"push_id":536752237,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"0366b227c1b20d451524d9712bb67771daa739f3","before":"65f5ec025e3a0fd0cb5175e765477a051c20570f","commits":[{"sha":"0366b227c1b20d451524d9712bb67771daa739f3","author":{"email":"40e6fc59d2535c98bfd5d19357e20df6e95cef64@gmail.com","name":"jlumijarvi"},"message":"Create LICENSE.md","distinct":true,"url":"https://api.github.com/repos/jlumijarvi/csv2xml/commits/0366b227c1b20d451524d9712bb67771daa739f3"}]},"public":true,"created_at":"2015-01-01T01:00:25Z"}
{"id":"2489395981","type":"IssuesEvent","actor":{"id":10361074,"login":"CFLPlayer","gravatar_id":"","url":"https://api.github.com/users/CFLPlayer","avatar_url":"https://avatars.githubusercontent.com/u/10361074?"},"repo":{"id":3112411,"name":"mcMMO-Dev/mcMMO","url":"https://api.github.com/repos/mcMMO-Dev/mcMMO"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/mcMMO-Dev/mcMMO/issues/2395","labels_url":"https://api.github.com/repos/mcMMO-Dev/mcMMO/issues/2395/labels{/name}","comments_url":"https://api.github.com/repos/mcMMO-Dev/mcMMO/issues/2395/comments","events_url":"https://api.github.com/repos/mcMMO-Dev/mcMMO/issues/2395/events","html_url":"https://github.com/mcMMO-Dev/mcMMO/issues/2395","id":53210174,"number":2395,"title":"Specialisation for axes, swords and unarmed.","user":{"login":"CFLPlayer","id":10361074,"avatar_url":"https://avatars.githubusercontent.com/u/10361074?v=3","gravatar_id":"","url":"https://api.github.com/users/CFLPlayer","html_url":"https://github.com/CFLPlayer","followers_url":"https://api.github.com/users/CFLPlayer/followers","following_url":"https://api.github.com/users/CFLPlayer/following{/other_user}","gists_url":"https://api.github.com/users/CFLPlayer/gists{/gist_id}","starred_url":"https://api.github.com/users/CFLPlayer/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/CFLPlayer/subscriptions","organizations_url":"https://api.github.com/users/CFLPlayer/orgs","repos_url":"https://api.github.com/users/CFLPlayer/repos","events_url":"https://api.github.com/users/CFLPlayer/events{/privacy}","received_events_url":"https://api.github.com/users/CFLPlayer/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:00:25Z","updated_at":"2015-01-01T01:00:25Z","closed_at":null,"body":"Berserk, skull splitter and serrated strikes. 
In hypothetical terms, every person who wields an axe isnt always going to crack a skull open. A martial arts expert is hardly going to go into a full Celtic berserk are they?\r\nSo. My point is that there is no diversity. As you train up your skill you should be able to choose what you focus on when wielding your weapon. I'm proposing we add a progression system, which allows players to build upon a basic foundation of an ability. Using a point every 100 levels you should be able to build a \"ability specialisation\" that is unique to the player. I will use unarmed as an example;\r\nWhen your reach level 100 in unarmed you receive a small menu (possibly use the chest menu system?) from this you select a foundation perk, this gives you your beginning ability. Here's some ideas of unarmed abilities:\r\nForceful Kick. Ready your feet and deal astounding knock back damage to your foe.\r\nBerserk (changed). Ready your fists and enter a rage dealing more damage per hit though hitting slower.\r\nKneck Snap. Ready your hands as you approach your target, and if they are weak enough instantly put them to rest.\r\nDrunken Slugging. Ready your fists and enter a drunken state where you take less damage and deal a small amount more.\r\nClaws. Ready your hands as you tear at your enemy adding the bleed effect to them.\r\nLow Blow. Raise your foot and aim low, dazing your opponent.\r\n\r\nLets say I select Drunken Slugging. I cannot go back on that decision. Then I receive another menu giving me options into which aspect of drunken slugging I should focus on. My options would be:\r\nDrunken Resistance. Take less damage\r\nDrunken Bravery. Do slightly more damage\r\nDrunken belching. When fighting you belch causing a nausea effect to enemies around you.\r\n\r\nI would then gain more points every 100 levels to improve myself even more. These skills would cap at 1000 giving a varied result. Once completed you can rename your Technique for all to fear. 
This would be available for axe users and sword users to just different foundations.\r\n\r\nThank you for reading. Pls criticise / praise. Ask for more if you want it.\r\n-Regards CFLPlayer"}},"public":true,"created_at":"2015-01-01T01:00:25Z","org":{"id":1429663,"login":"mcMMO-Dev","gravatar_id":"","url":"https://api.github.com/orgs/mcMMO-Dev","avatar_url":"https://avatars.githubusercontent.com/u/1429663?"}}
{"id":"2489395982","type":"PushEvent","actor":{"id":624632,"login":"gusennan","gravatar_id":"","url":"https://api.github.com/users/gusennan","avatar_url":"https://avatars.githubusercontent.com/u/624632?"},"repo":{"id":28673499,"name":"gusennan/xamarin-forms-samples","url":"https://api.github.com/repos/gusennan/xamarin-forms-samples"},"payload":{"push_id":536752238,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"aa16d946ccf840fa6a1b57ee7d0fa8c44dad087a","before":"9e570dc829e7b3e9eb2e67769edd189cd0c8a723","commits":[{"sha":"aa16d946ccf840fa6a1b57ee7d0fa8c44dad087a","author":{"email":"b3a2a659a9d22951edeb5874b5d21f350b75f00e@riseup.net","name":"Nate Guerin"},"message":"revert some formatting changes","distinct":true,"url":"https://api.github.com/repos/gusennan/xamarin-forms-samples/commits/aa16d946ccf840fa6a1b57ee7d0fa8c44dad087a"}]},"public":true,"created_at":"2015-01-01T01:00:25Z"}
{"id":"2489395984","type":"WatchEvent","actor":{"id":5286446,"login":"otmjka","gravatar_id":"","url":"https://api.github.com/users/otmjka","avatar_url":"https://avatars.githubusercontent.com/u/5286446?"},"repo":{"id":1195004,"name":"angular/angular-seed","url":"https://api.github.com/repos/angular/angular-seed"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:00:25Z","org":{"id":139426,"login":"angular","gravatar_id":"","url":"https://api.github.com/orgs/angular","avatar_url":"https://avatars.githubusercontent.com/u/139426?"}}
{"id":"2489395985","type":"PushEvent","actor":{"id":1432111,"login":"cubiclesoft","gravatar_id":"","url":"https://api.github.com/users/cubiclesoft","avatar_url":"https://avatars.githubusercontent.com/u/1432111?"},"repo":{"id":28677735,"name":"cubiclesoft/barebones-cms-shortcode-bb_syntaxhighlight","url":"https://api.github.com/repos/cubiclesoft/barebones-cms-shortcode-bb_syntaxhighlight"},"payload":{"push_id":536752240,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"51c7ea91a05fed5f7a7065da857de0fbf1eb6e2e","before":"9631619d7d26f9f5aff0641c78cf198ef21f46d0","commits":[{"sha":"51c7ea91a05fed5f7a7065da857de0fbf1eb6e2e","author":{"email":"50f3f01caa053693ce619d596e14b0ff3901ab49@cubiclesoft.com","name":"cubiclesoft"},"message":"Added extension ID.","distinct":true,"url":"https://api.github.com/repos/cubiclesoft/barebones-cms-shortcode-bb_syntaxhighlight/commits/51c7ea91a05fed5f7a7065da857de0fbf1eb6e2e"}]},"public":true,"created_at":"2015-01-01T01:00:25Z"}
{"id":"2489395992","type":"PushEvent","actor":{"id":1356088,"login":"Zaryafaraj","gravatar_id":"","url":"https://api.github.com/users/Zaryafaraj","avatar_url":"https://avatars.githubusercontent.com/u/1356088?"},"repo":{"id":26995510,"name":"Fathalian/Guild","url":"https://api.github.com/repos/Fathalian/Guild"},"payload":{"push_id":536752245,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"29abf0e942463dd27cf0666ddf54abda099859b2","before":"9a773fc648910c7a2499401f44a6e5f71eb30460","commits":[{"sha":"29abf0e942463dd27cf0666ddf54abda099859b2","author":{"email":"de8898f6c55e335aa0a2b937fae65fb756ee038f@gmail.com","name":"Zaryafaraj"},"message":"added back change from ali","distinct":true,"url":"https://api.github.com/repos/Fathalian/Guild/commits/29abf0e942463dd27cf0666ddf54abda099859b2"}]},"public":true,"created_at":"2015-01-01T01:00:26Z"}
{"id":"2489395993","type":"PushEvent","actor":{"id":1120754,"login":"dobkeratops","gravatar_id":"","url":"https://api.github.com/users/dobkeratops","avatar_url":"https://avatars.githubusercontent.com/u/1120754?"},"repo":{"id":27616619,"name":"dobkeratops/compiler","url":"https://api.github.com/repos/dobkeratops/compiler"},"payload":{"push_id":536752246,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"aa88601009f892e8890b2f47f2610d62c37e858b","before":"9a5138f5617f14feb94326b0673d9779d8ec70b8","commits":[{"sha":"aa88601009f892e8890b2f47f2610d62c37e858b","author":{"email":"f8c234822f2256bfec32be392872f65b14509346@gmail.com","name":"dobkeratops"},"message":"adding rvalue references","distinct":true,"url":"https://api.github.com/repos/dobkeratops/compiler/commits/aa88601009f892e8890b2f47f2610d62c37e858b"}]},"public":true,"created_at":"2015-01-01T01:00:26Z"}
{"id":"2489396002","type":"PushEvent","actor":{"id":1130906,"login":"eliben","gravatar_id":"","url":"https://api.github.com/users/eliben","avatar_url":"https://avatars.githubusercontent.com/u/1130906?"},"repo":{"id":13198211,"name":"python/cpython","url":"https://api.github.com/repos/python/cpython"},"payload":{"push_id":536752255,"size":6,"distinct_size":2,"ref":"refs/heads/master","head":"fa28e5ed9fb0bc5bed7fc7921c6638c8082cc3c4","before":"461185cc199dac7ce94a8699be66adb4d97288ab","commits":[{"sha":"44d315ac0e2cc59df9107f0853843ff7b461e32c","author":{"email":"fe09bc2ef2737a3258f978e26226dcbac1b3f948@python.org","name":"Benjamin Peterson"},"message":"update for copyright for 2015","distinct":false,"url":"https://api.github.com/repos/python/cpython/commits/44d315ac0e2cc59df9107f0853843ff7b461e32c"},{"sha":"615249dda22c98fdb9c5dfd7724b1e24eb62e71d","author":{"email":"fe09bc2ef2737a3258f978e26226dcbac1b3f948@python.org","name":"Benjamin Peterson"},"message":"merge 3.2","distinct":false,"url":"https://api.github.com/repos/python/cpython/commits/615249dda22c98fdb9c5dfd7724b1e24eb62e71d"},{"sha":"8f6109316e19f20ee94e39eef4a24ffd9db6dd10","author":{"email":"fe09bc2ef2737a3258f978e26226dcbac1b3f948@python.org","name":"Benjamin Peterson"},"message":"merge 3.3","distinct":false,"url":"https://api.github.com/repos/python/cpython/commits/8f6109316e19f20ee94e39eef4a24ffd9db6dd10"},{"sha":"db989c1d39c1a201fed41f0f8adacd589ede0a8f","author":{"email":"fe09bc2ef2737a3258f978e26226dcbac1b3f948@python.org","name":"Benjamin Peterson"},"message":"merge 3.4","distinct":true,"url":"https://api.github.com/repos/python/cpython/commits/db989c1d39c1a201fed41f0f8adacd589ede0a8f"},{"sha":"6c97ab26377576eaa2f10d451511cf10ba7cde12","author":{"email":"43f2a2d2c86e22bc80f5acc690d97a5dcf4c4b2f@acm.org","name":"Ned Deily"},"message":"Update copyright dates in OS X 
installer.","distinct":false,"url":"https://api.github.com/repos/python/cpython/commits/6c97ab26377576eaa2f10d451511cf10ba7cde12"},{"sha":"fa28e5ed9fb0bc5bed7fc7921c6638c8082cc3c4","author":{"email":"43f2a2d2c86e22bc80f5acc690d97a5dcf4c4b2f@acm.org","name":"Ned Deily"},"message":"Update copyright dates in OS X installer.","distinct":true,"url":"https://api.github.com/repos/python/cpython/commits/fa28e5ed9fb0bc5bed7fc7921c6638c8082cc3c4"}]},"public":true,"created_at":"2015-01-01T01:00:27Z","org":{"id":1525981,"login":"python","gravatar_id":"","url":"https://api.github.com/orgs/python","avatar_url":"https://avatars.githubusercontent.com/u/1525981?"}}
{"id":"2489396009","type":"PushEvent","actor":{"id":1297496,"login":"milkmanjack","gravatar_id":"","url":"https://api.github.com/users/milkmanjack","avatar_url":"https://avatars.githubusercontent.com/u/1297496?"},"repo":{"id":28675501,"name":"milkmanjack/twitch-intermission-testv1","url":"https://api.github.com/repos/milkmanjack/twitch-intermission-testv1"},"payload":{"push_id":536752260,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"1d30906590d5ab58448dd68c71f0f8ff4852da8c","before":"11a03a864e00804d1274b168e5bb07cbbab29502","commits":[{"sha":"1d30906590d5ab58448dd68c71f0f8ff4852da8c","author":{"email":"1a6575c57e84915cbf78e3fafdf0c16be650b9d0@gmail.com","name":"Curtis Erickson"},"message":"Update main.js","distinct":true,"url":"https://api.github.com/repos/milkmanjack/twitch-intermission-testv1/commits/1d30906590d5ab58448dd68c71f0f8ff4852da8c"}]},"public":true,"created_at":"2015-01-01T01:00:28Z"}
{"id":"2489396019","type":"PushEvent","actor":{"id":1130906,"login":"eliben","gravatar_id":"","url":"https://api.github.com/users/eliben","avatar_url":"https://avatars.githubusercontent.com/u/1130906?"},"repo":{"id":13198211,"name":"python/cpython","url":"https://api.github.com/repos/python/cpython"},"payload":{"push_id":536752266,"size":4,"distinct_size":0,"ref":"refs/heads/3.4","head":"6c97ab26377576eaa2f10d451511cf10ba7cde12","before":"7f6073da37c859f32b3a9bfcb0faa41d24db1230","commits":[{"sha":"44d315ac0e2cc59df9107f0853843ff7b461e32c","author":{"email":"fe09bc2ef2737a3258f978e26226dcbac1b3f948@python.org","name":"Benjamin Peterson"},"message":"update for copyright for 2015","distinct":false,"url":"https://api.github.com/repos/python/cpython/commits/44d315ac0e2cc59df9107f0853843ff7b461e32c"},{"sha":"615249dda22c98fdb9c5dfd7724b1e24eb62e71d","author":{"email":"fe09bc2ef2737a3258f978e26226dcbac1b3f948@python.org","name":"Benjamin Peterson"},"message":"merge 3.2","distinct":false,"url":"https://api.github.com/repos/python/cpython/commits/615249dda22c98fdb9c5dfd7724b1e24eb62e71d"},{"sha":"8f6109316e19f20ee94e39eef4a24ffd9db6dd10","author":{"email":"fe09bc2ef2737a3258f978e26226dcbac1b3f948@python.org","name":"Benjamin Peterson"},"message":"merge 3.3","distinct":false,"url":"https://api.github.com/repos/python/cpython/commits/8f6109316e19f20ee94e39eef4a24ffd9db6dd10"},{"sha":"6c97ab26377576eaa2f10d451511cf10ba7cde12","author":{"email":"43f2a2d2c86e22bc80f5acc690d97a5dcf4c4b2f@acm.org","name":"Ned Deily"},"message":"Update copyright dates in OS X installer.","distinct":false,"url":"https://api.github.com/repos/python/cpython/commits/6c97ab26377576eaa2f10d451511cf10ba7cde12"}]},"public":true,"created_at":"2015-01-01T01:00:28Z","org":{"id":1525981,"login":"python","gravatar_id":"","url":"https://api.github.com/orgs/python","avatar_url":"https://avatars.githubusercontent.com/u/1525981?"}}
{"id":"2489396023","type":"PushEvent","actor":{"id":5225396,"login":"zzzTNTzzz","gravatar_id":"","url":"https://api.github.com/users/zzzTNTzzz","avatar_url":"https://avatars.githubusercontent.com/u/5225396?"},"repo":{"id":28316263,"name":"zzzTNTzzz/TNT","url":"https://api.github.com/repos/zzzTNTzzz/TNT"},"payload":{"push_id":536752267,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f4d5d7cef16304ef8787c96a9808a401c7578eb4","before":"9c700d0a24416ab735b1b45bce5de2531da02b4c","commits":[{"sha":"f4d5d7cef16304ef8787c96a9808a401c7578eb4","author":{"email":"c20044e993b98218b0a612f57dae8d33d3a1a159@live.com","name":"Tony"},"message":"small edits / removed fx for large mult","distinct":true,"url":"https://api.github.com/repos/zzzTNTzzz/TNT/commits/f4d5d7cef16304ef8787c96a9808a401c7578eb4"}]},"public":true,"created_at":"2015-01-01T01:00:29Z"}
{"id":"2489396028","type":"PushEvent","actor":{"id":1130906,"login":"eliben","gravatar_id":"","url":"https://api.github.com/users/eliben","avatar_url":"https://avatars.githubusercontent.com/u/1130906?"},"repo":{"id":13198211,"name":"python/cpython","url":"https://api.github.com/repos/python/cpython"},"payload":{"push_id":536752268,"size":2,"distinct_size":0,"ref":"refs/heads/3.3","head":"615249dda22c98fdb9c5dfd7724b1e24eb62e71d","before":"c917dcb370e4f785f4d5eabfb406bfd5949ce84b","commits":[{"sha":"44d315ac0e2cc59df9107f0853843ff7b461e32c","author":{"email":"fe09bc2ef2737a3258f978e26226dcbac1b3f948@python.org","name":"Benjamin Peterson"},"message":"update for copyright for 2015","distinct":false,"url":"https://api.github.com/repos/python/cpython/commits/44d315ac0e2cc59df9107f0853843ff7b461e32c"},{"sha":"615249dda22c98fdb9c5dfd7724b1e24eb62e71d","author":{"email":"fe09bc2ef2737a3258f978e26226dcbac1b3f948@python.org","name":"Benjamin Peterson"},"message":"merge 3.2","distinct":false,"url":"https://api.github.com/repos/python/cpython/commits/615249dda22c98fdb9c5dfd7724b1e24eb62e71d"}]},"public":true,"created_at":"2015-01-01T01:00:31Z","org":{"id":1525981,"login":"python","gravatar_id":"","url":"https://api.github.com/orgs/python","avatar_url":"https://avatars.githubusercontent.com/u/1525981?"}}
{"id":"2489396030","type":"IssueCommentEvent","actor":{"id":1540132,"login":"carltonwhitehead","gravatar_id":"","url":"https://api.github.com/users/carltonwhitehead","avatar_url":"https://avatars.githubusercontent.com/u/1540132?"},"repo":{"id":28649714,"name":"carltonwhitehead/coner","url":"https://api.github.com/repos/carltonwhitehead/coner"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/carltonwhitehead/coner/issues/2","labels_url":"https://api.github.com/repos/carltonwhitehead/coner/issues/2/labels{/name}","comments_url":"https://api.github.com/repos/carltonwhitehead/coner/issues/2/comments","events_url":"https://api.github.com/repos/carltonwhitehead/coner/issues/2/events","html_url":"https://github.com/carltonwhitehead/coner/issues/2","id":53190006,"number":2,"title":"Integrate checkstyle","user":{"login":"carltonwhitehead","id":1540132,"avatar_url":"https://avatars.githubusercontent.com/u/1540132?v=3","gravatar_id":"","url":"https://api.github.com/users/carltonwhitehead","html_url":"https://github.com/carltonwhitehead","followers_url":"https://api.github.com/users/carltonwhitehead/followers","following_url":"https://api.github.com/users/carltonwhitehead/following{/other_user}","gists_url":"https://api.github.com/users/carltonwhitehead/gists{/gist_id}","starred_url":"https://api.github.com/users/carltonwhitehead/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/carltonwhitehead/subscriptions","organizations_url":"https://api.github.com/users/carltonwhitehead/orgs","repos_url":"https://api.github.com/users/carltonwhitehead/repos","events_url":"https://api.github.com/users/carltonwhitehead/events{/privacy}","received_events_url":"https://api.github.com/users/carltonwhitehead/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":{"login":"jshort","id":1186444,"avatar_url":"https://avatars.githubusercontent.com/u/1186444?v=3","gravatar_id":"","url":"https://api.git
hub.com/users/jshort","html_url":"https://github.com/jshort","followers_url":"https://api.github.com/users/jshort/followers","following_url":"https://api.github.com/users/jshort/following{/other_user}","gists_url":"https://api.github.com/users/jshort/gists{/gist_id}","starred_url":"https://api.github.com/users/jshort/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jshort/subscriptions","organizations_url":"https://api.github.com/users/jshort/orgs","repos_url":"https://api.github.com/users/jshort/repos","events_url":"https://api.github.com/users/jshort/events{/privacy}","received_events_url":"https://api.github.com/users/jshort/received_events","type":"User","site_admin":false},"milestone":null,"comments":4,"created_at":"2014-12-31T16:01:06Z","updated_at":"2015-01-01T01:00:30Z","closed_at":null,"body":""},"comment":{"url":"https://api.github.com/repos/carltonwhitehead/coner/issues/comments/68477218","html_url":"https://github.com/carltonwhitehead/coner/issues/2#issuecomment-68477218","issue_url":"https://api.github.com/repos/carltonwhitehead/coner/issues/2","id":68477218,"user":{"login":"carltonwhitehead","id":1540132,"avatar_url":"https://avatars.githubusercontent.com/u/1540132?v=3","gravatar_id":"","url":"https://api.github.com/users/carltonwhitehead","html_url":"https://github.com/carltonwhitehead","followers_url":"https://api.github.com/users/carltonwhitehead/followers","following_url":"https://api.github.com/users/carltonwhitehead/following{/other_user}","gists_url":"https://api.github.com/users/carltonwhitehead/gists{/gist_id}","starred_url":"https://api.github.com/users/carltonwhitehead/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/carltonwhitehead/subscriptions","organizations_url":"https://api.github.com/users/carltonwhitehead/orgs","repos_url":"https://api.github.com/users/carltonwhitehead/repos","events_url":"https://api.github.com/users/carltonwhitehead/events{/privacy}","received_events_url":"https://
api.github.com/users/carltonwhitehead/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:00:30Z","updated_at":"2015-01-01T01:00:30Z","body":"I agree we should have good javadocs. I'm happy to flag those as failures"}},"public":true,"created_at":"2015-01-01T01:00:31Z"}
{"id":"2489396036","type":"PushEvent","actor":{"id":1130906,"login":"eliben","gravatar_id":"","url":"https://api.github.com/users/eliben","avatar_url":"https://avatars.githubusercontent.com/u/1130906?"},"repo":{"id":13198211,"name":"python/cpython","url":"https://api.github.com/repos/python/cpython"},"payload":{"push_id":536752269,"size":1,"distinct_size":0,"ref":"refs/heads/3.2","head":"44d315ac0e2cc59df9107f0853843ff7b461e32c","before":"acc6002f0c33d1a29555e4a52322c7a20901ffe2","commits":[{"sha":"44d315ac0e2cc59df9107f0853843ff7b461e32c","author":{"email":"fe09bc2ef2737a3258f978e26226dcbac1b3f948@python.org","name":"Benjamin Peterson"},"message":"update for copyright for 2015","distinct":false,"url":"https://api.github.com/repos/python/cpython/commits/44d315ac0e2cc59df9107f0853843ff7b461e32c"}]},"public":true,"created_at":"2015-01-01T01:00:31Z","org":{"id":1525981,"login":"python","gravatar_id":"","url":"https://api.github.com/orgs/python","avatar_url":"https://avatars.githubusercontent.com/u/1525981?"}}
{"id":"2489396037","type":"PushEvent","actor":{"id":280212,"login":"KenanSulayman","gravatar_id":"","url":"https://api.github.com/users/KenanSulayman","avatar_url":"https://avatars.githubusercontent.com/u/280212?"},"repo":{"id":21481110,"name":"KenanSulayman/heartbeat","url":"https://api.github.com/repos/KenanSulayman/heartbeat"},"payload":{"push_id":536752271,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"9ceb5cdffe02cef186b379026ce6c2dc0d74b3d4","before":"a51c727e5f7d975cad627cddcbafb200a4fb5967","commits":[{"sha":"9ceb5cdffe02cef186b379026ce6c2dc0d74b3d4","author":{"email":"9176253dfc0bc82671a5e984646605f93319147a@sly.mn","name":"Kenan Sulayman"},"message":"1420074028174\n\n8KwesSwq0wt6hgDqwgssdjZHjXiw3zHu47um9GjGlvY=","distinct":true,"url":"https://api.github.com/repos/KenanSulayman/heartbeat/commits/9ceb5cdffe02cef186b379026ce6c2dc0d74b3d4"}]},"public":true,"created_at":"2015-01-01T01:00:31Z"}
{"id":"2489396038","type":"PushEvent","actor":{"id":2645146,"login":"daniel-beard","gravatar_id":"","url":"https://api.github.com/users/daniel-beard","avatar_url":"https://avatars.githubusercontent.com/u/2645146?"},"repo":{"id":28644199,"name":"daniel-beard/JuliaProjectEuler","url":"https://api.github.com/repos/daniel-beard/JuliaProjectEuler"},"payload":{"push_id":536752272,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"7881c902dceed5e101e6e42e96a792fefc0a9830","before":"e8f26d280d6ef9080a4d4dad3c3bde3bafaa3fab","commits":[{"sha":"7881c902dceed5e101e6e42e96a792fefc0a9830","author":{"email":"734c834e28fd1bd905b71456871f8daf85204b1a@groupon.com","name":"Daniel Beard"},"message":"Solution to p25, fix p2","distinct":true,"url":"https://api.github.com/repos/daniel-beard/JuliaProjectEuler/commits/7881c902dceed5e101e6e42e96a792fefc0a9830"}]},"public":true,"created_at":"2015-01-01T01:00:31Z"}
{"id":"2489396039","type":"CreateEvent","actor":{"id":1995168,"login":"bigtunacan","gravatar_id":"","url":"https://api.github.com/users/bigtunacan","avatar_url":"https://avatars.githubusercontent.com/u/1995168?"},"repo":{"id":28678198,"name":"bigtunacan/pages","url":"https://api.github.com/repos/bigtunacan/pages"},"payload":{"ref":"gh-pages","ref_type":"branch","master_branch":"gh-pages","description":"Jekyll Pages Blog","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:00:31Z"}
{"id":"2489396050","type":"PushEvent","actor":{"id":4181161,"login":"colin350","gravatar_id":"","url":"https://api.github.com/users/colin350","avatar_url":"https://avatars.githubusercontent.com/u/4181161?"},"repo":{"id":28090675,"name":"colin350/AMPlug","url":"https://api.github.com/repos/colin350/AMPlug"},"payload":{"push_id":536752284,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"68f22e3bc1dcf3f067f744a049977257c95cb45a","before":"2213bf636d7fe6ecf0d0a35aa8bc9bf3b4907c77","commits":[{"sha":"68f22e3bc1dcf3f067f744a049977257c95cb45a","author":{"email":"ca987d55a775ffdf8dd75c235e509848e0c30c0d@gmail.com","name":"colin350"},"message":"Update","distinct":true,"url":"https://api.github.com/repos/colin350/AMPlug/commits/68f22e3bc1dcf3f067f744a049977257c95cb45a"}]},"public":true,"created_at":"2015-01-01T01:00:31Z"}
{"id":"2489396053","type":"PushEvent","actor":{"id":532183,"login":"herry13","gravatar_id":"","url":"https://api.github.com/users/herry13","avatar_url":"https://avatars.githubusercontent.com/u/532183?"},"repo":{"id":26089827,"name":"nurilabs/nuri-lang","url":"https://api.github.com/repos/nurilabs/nuri-lang"},"payload":{"push_id":536752286,"size":5,"distinct_size":5,"ref":"refs/heads/refactor-type","head":"47ed22c2d952b6ce942a136189afe1de1b62c809","before":"4ae6e32a27fd491b5cc698fa26ef106bfa34b707","commits":[{"sha":"85b8ab769d6535156dcdd39b75fe2eaf56de1b84","author":{"email":"26abebc618a7c031a4cf36426687793911eeb0c3@gmail.com","name":"Herry"},"message":"Add forward-type reference-index (T_Forward T_RefIndex).","distinct":true,"url":"https://api.github.com/repos/nurilabs/nuri-lang/commits/85b8ab769d6535156dcdd39b75fe2eaf56de1b84"},{"sha":"42a9572c1bb841dd7e3c7daf51eb9a2e62bf113b","author":{"email":"26abebc618a7c031a4cf36426687793911eeb0c3@gmail.com","name":"Herry"},"message":"Define func 'at': return type of array-element. Implement forward-type of reference-index. Refactor forward-type substitution function (replace_forward_type).","distinct":true,"url":"https://api.github.com/repos/nurilabs/nuri-lang/commits/42a9572c1bb841dd7e3c7daf51eb9a2e62bf113b"},{"sha":"ec2e1143a239fed7dfd56fae987f277de80f411d","author":{"email":"26abebc618a7c031a4cf36426687793911eeb0c3@gmail.com","name":"Herry"},"message":"Removing func 'nuri_array_at_index', and replacing it with func 'Type.at'.","distinct":true,"url":"https://api.github.com/repos/nurilabs/nuri-lang/commits/ec2e1143a239fed7dfd56fae987f277de80f411d"},{"sha":"ae4ce825f60fdd621b47175d39974c158c36ba3d","author":{"email":"26abebc618a7c031a4cf36426687793911eeb0c3@gmail.com","name":"Herry"},"message":"Refactor 'array1.nuri'. 
Add files array{2,3}.nuri: test-cases of reference-index in function and forward-reference-index.","distinct":true,"url":"https://api.github.com/repos/nurilabs/nuri-lang/commits/ae4ce825f60fdd621b47175d39974c158c36ba3d"},{"sha":"47ed22c2d952b6ce942a136189afe1de1b62c809","author":{"email":"26abebc618a7c031a4cf36426687793911eeb0c3@gmail.com","name":"Herry"},"message":"Add array{2,3}.nuri to good test-files.","distinct":true,"url":"https://api.github.com/repos/nurilabs/nuri-lang/commits/47ed22c2d952b6ce942a136189afe1de1b62c809"}]},"public":true,"created_at":"2015-01-01T01:00:31Z","org":{"id":7775038,"login":"nurilabs","gravatar_id":"","url":"https://api.github.com/orgs/nurilabs","avatar_url":"https://avatars.githubusercontent.com/u/7775038?"}}
{"id":"2489396055","type":"PushEvent","actor":{"id":1456047,"login":"kyokomi","gravatar_id":"","url":"https://api.github.com/users/kyokomi","avatar_url":"https://avatars.githubusercontent.com/u/1456047?"},"repo":{"id":25506232,"name":"kyokomi/gomajan","url":"https://api.github.com/repos/kyokomi/gomajan"},"payload":{"push_id":536752287,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"33d7ed3c98a7cfb19ce924735a7420de0ca57ef7","before":"fb389c371934eb30c750195f1bff5e09627860aa","commits":[{"sha":"33d7ed3c98a7cfb19ce924735a7420de0ca57ef7","author":{"email":"2ea0042be6760fbcd1e13c4e2076e1e54e82d1d5@gmail.com","name":"kyokomi"},"message":"fix: 混全帯么九, 純全帯么九判定","distinct":true,"url":"https://api.github.com/repos/kyokomi/gomajan/commits/33d7ed3c98a7cfb19ce924735a7420de0ca57ef7"}]},"public":true,"created_at":"2015-01-01T01:00:32Z"}
{"id":"2489396057","type":"PushEvent","actor":{"id":1525481,"login":"timholy","gravatar_id":"","url":"https://api.github.com/users/timholy","avatar_url":"https://avatars.githubusercontent.com/u/1525481?"},"repo":{"id":9519622,"name":"timholy/ImageView.jl","url":"https://api.github.com/repos/timholy/ImageView.jl"},"payload":{"push_id":536752289,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"ddf2c3b25177c1cc75a47443cf401c235029c052","before":"a666eede913e449bcc3f91ac7a27fe8e67fd99f7","commits":[{"sha":"ddf2c3b25177c1cc75a47443cf401c235029c052","author":{"email":"cc3de660a22a4f0e231dde9743ac1c9a7d407254@gmail.com","name":"Tim Holy"},"message":"SubArrays are immutable in julia 0.4","distinct":true,"url":"https://api.github.com/repos/timholy/ImageView.jl/commits/ddf2c3b25177c1cc75a47443cf401c235029c052"}]},"public":true,"created_at":"2015-01-01T01:00:32Z"}
{"id":"2489396062","type":"PushEvent","actor":{"id":1130906,"login":"eliben","gravatar_id":"","url":"https://api.github.com/users/eliben","avatar_url":"https://avatars.githubusercontent.com/u/1130906?"},"repo":{"id":13198211,"name":"python/cpython","url":"https://api.github.com/repos/python/cpython"},"payload":{"push_id":536752291,"size":2,"distinct_size":2,"ref":"refs/heads/2.7","head":"23eea0071b058be9601a97f44835111a32127c2b","before":"bfce62ccfbf18d91f14357851d6dc959cfb66f72","commits":[{"sha":"9ab0287cda68aeb11567844635573caf0d55bb32","author":{"email":"fe09bc2ef2737a3258f978e26226dcbac1b3f948@python.org","name":"Benjamin Peterson"},"message":"update for copyright for 2015","distinct":true,"url":"https://api.github.com/repos/python/cpython/commits/9ab0287cda68aeb11567844635573caf0d55bb32"},{"sha":"23eea0071b058be9601a97f44835111a32127c2b","author":{"email":"43f2a2d2c86e22bc80f5acc690d97a5dcf4c4b2f@acm.org","name":"Ned Deily"},"message":"Update copyright dates in OS X installer.","distinct":true,"url":"https://api.github.com/repos/python/cpython/commits/23eea0071b058be9601a97f44835111a32127c2b"}]},"public":true,"created_at":"2015-01-01T01:00:32Z","org":{"id":1525981,"login":"python","gravatar_id":"","url":"https://api.github.com/orgs/python","avatar_url":"https://avatars.githubusercontent.com/u/1525981?"}}
{"id":"2489396071","type":"PushEvent","actor":{"id":775165,"login":"bingo2011","gravatar_id":"","url":"https://api.github.com/users/bingo2011","avatar_url":"https://avatars.githubusercontent.com/u/775165?"},"repo":{"id":26621366,"name":"bingo2011/build_my_own_angularjs","url":"https://api.github.com/repos/bingo2011/build_my_own_angularjs"},"payload":{"push_id":536752295,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"92be8c499b4444d5fa81526c236d786f5d7a72e7","before":"51d241ce6e96e416dd85444f19394836c649e20d","commits":[{"sha":"92be8c499b4444d5fa81526c236d786f5d7a72e7","author":{"email":"332f63e5fcc114b9df574d567c4a465ad2c0cc59@foxmail.com","name":"bingo2013"},"message":"compile section","distinct":true,"url":"https://api.github.com/repos/bingo2011/build_my_own_angularjs/commits/92be8c499b4444d5fa81526c236d786f5d7a72e7"}]},"public":true,"created_at":"2015-01-01T01:00:33Z"}
{"id":"2489396073","type":"PushEvent","actor":{"id":3730551,"login":"rjrobinson","gravatar_id":"","url":"https://api.github.com/users/rjrobinson","avatar_url":"https://avatars.githubusercontent.com/u/3730551?"},"repo":{"id":28096670,"name":"rjrobinson/js_advanced_fund","url":"https://api.github.com/repos/rjrobinson/js_advanced_fund"},"payload":{"push_id":536752296,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"90a1821a6b454797e205bb1fe6c25636b1b69af4","before":"85877570f9371cf50634c12350baba226706092e","commits":[{"sha":"90a1821a6b454797e205bb1fe6c25636b1b69af4","author":{"email":"a000d77e361dc814b63406f3083337032f0ff8f0@gmail.com","name":"RJ Robinson"},"message":"added todo list","distinct":true,"url":"https://api.github.com/repos/rjrobinson/js_advanced_fund/commits/90a1821a6b454797e205bb1fe6c25636b1b69af4"}]},"public":true,"created_at":"2015-01-01T01:00:33Z"}
{"id":"2489396077","type":"PushEvent","actor":{"id":4779042,"login":"catbox","gravatar_id":"","url":"https://api.github.com/users/catbox","avatar_url":"https://avatars.githubusercontent.com/u/4779042?"},"repo":{"id":21256946,"name":"catbox/spring","url":"https://api.github.com/repos/catbox/spring"},"payload":{"push_id":536752299,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"83bf3f6366f5426aeaea1e08f1f41232110a52fa","before":"6078a2bf85fdabb3702235219a5ad0c10d88013c","commits":[{"sha":"83bf3f6366f5426aeaea1e08f1f41232110a52fa","author":{"email":"bef99c22f6b2d87df8a9065e8478a3a5ff8b4a6c@gmail.com","name":"cocolekat"},"message":"app not needed\n\nSigned-off-by: cocolekat <cocolekat@gmail.com>","distinct":true,"url":"https://api.github.com/repos/catbox/spring/commits/83bf3f6366f5426aeaea1e08f1f41232110a52fa"}]},"public":true,"created_at":"2015-01-01T01:00:34Z"}
{"id":"2489396084","type":"PushEvent","actor":{"id":10225575,"login":"ExclusiveOrange","gravatar_id":"","url":"https://api.github.com/users/ExclusiveOrange","avatar_url":"https://avatars.githubusercontent.com/u/10225575?"},"repo":{"id":28677579,"name":"ExclusiveOrange/synthesizer","url":"https://api.github.com/repos/ExclusiveOrange/synthesizer"},"payload":{"push_id":536752304,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"0e64036d5ac0d9c24b4cbe39bb778570db49caba","before":"5e99a85807e01f44fed53f71bba0e0eaa3893084","commits":[{"sha":"0e64036d5ac0d9c24b4cbe39bb778570db49caba","author":{"email":"de3bd7888dcfc4f7d00a4ef606710f57cbba1dbb@hotmail.com","name":"ExclusiveOrange"},"message":"included release .exe","distinct":true,"url":"https://api.github.com/repos/ExclusiveOrange/synthesizer/commits/0e64036d5ac0d9c24b4cbe39bb778570db49caba"}]},"public":true,"created_at":"2015-01-01T01:00:35Z"}
{"id":"2489396087","type":"PushEvent","actor":{"id":1131743,"login":"rchurchley","gravatar_id":"","url":"https://api.github.com/users/rchurchley","avatar_url":"https://avatars.githubusercontent.com/u/1131743?"},"repo":{"id":11164964,"name":"rchurchley/copernicus","url":"https://api.github.com/repos/rchurchley/copernicus"},"payload":{"push_id":536752306,"size":22,"distinct_size":22,"ref":"refs/heads/master","head":"9c662abe7ba1c41dd88b82fdd2e5d3db6c58ad5b","before":"a8f7305f29a00541d042b1bef59ed103cfb6ee00","commits":[{"sha":"a69843ef6e07019640823112b0da21e25a85694f","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Generalize: remove nanoc-specific items","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/a69843ef6e07019640823112b0da21e25a85694f"},{"sha":"40ad2a87d890d196d2a7be7c5ae115e5942299e6","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Generalize: rename reset.scss","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/40ad2a87d890d196d2a7be7c5ae115e5942299e6"},{"sha":"4d2eda35659b203eae035775e616e15e6d196e25","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Generalize: remove experimental styles","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/4d2eda35659b203eae035775e616e15e6d196e25"},{"sha":"82b76a86f4652e7df9f66d8d1a3469ba88ca711c","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Generalize: remove list thumbnails","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/82b76a86f4652e7df9f66d8d1a3469ba88ca711c"},{"sha":"9520cb0fa5c5a4b023326a1a2b294a06f097ffba","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross 
Churchley"},"message":"Generalize: make default figure style a class","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/9520cb0fa5c5a4b023326a1a2b294a06f097ffba"},{"sha":"78c41b207c2ff17d6f3045c42d464b022e933f54","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Generalize: tidy up","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/78c41b207c2ff17d6f3045c42d464b022e933f54"},{"sha":"9b2bec162526dd2eec69b892a67690c51e5ee8b4","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Generalize: change nanoc defs to default colours","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/9b2bec162526dd2eec69b892a67690c51e5ee8b4"},{"sha":"2d61026dd7195c44054d5b9716ec5e86f2b170a8","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Generalize: document colour constraints","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/2d61026dd7195c44054d5b9716ec5e86f2b170a8"},{"sha":"b42debf95608dcf289e6fc6f3b3c5ecda804924d","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Generalize: remove unused colour styles","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/b42debf95608dcf289e6fc6f3b3c5ecda804924d"},{"sha":"31be9980e714276088438763326624b2ecbf562c","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Generalize: rearrange #site-navigation colour defs","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/31be9980e714276088438763326624b2ecbf562c"},{"sha":"ddeb3eb6fb4336c2308b769faf584c94c0c9872e","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross 
Churchley"},"message":"Generalize: don't hardcode menu colours","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/ddeb3eb6fb4336c2308b769faf584c94c0c9872e"},{"sha":"f1c8ce16fd1c8fcb5ad7286a639388d1d3a6a4c9","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Tidy","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/f1c8ce16fd1c8fcb5ad7286a639388d1d3a6a4c9"},{"sha":"9a11940e31e0bb8d8287a8c31116a67e0da142b6","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Rename files","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/9a11940e31e0bb8d8287a8c31116a67e0da142b6"},{"sha":"d83ab8c50466b9f8ec0a6844156f144084fdf0bf","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Move scss files to /source","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/d83ab8c50466b9f8ec0a6844156f144084fdf0bf"},{"sha":"4596b9fd19e0b3f3d45660ee66542d1b4fe9dbde","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Generalize: add hooks to add site specific styles","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/4596b9fd19e0b3f3d45660ee66542d1b4fe9dbde"},{"sha":"2116e5956af622c03ab4f520200a02079bdd4d94","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Generalize: update README","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/2116e5956af622c03ab4f520200a02079bdd4d94"},{"sha":"fbad248750a9f726da527ce461948bc8bfafac2f","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Generalize: document HTML structure assumed by 
CSS","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/fbad248750a9f726da527ce461948bc8bfafac2f"},{"sha":"98c3e6ab4a3823b08a22aa4b80b187460a203271","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Consolidate stylesheets","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/98c3e6ab4a3823b08a22aa4b80b187460a203271"},{"sha":"b12319ea726684152f0834c476ec1065aedf3162","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Fully separate customizations from code","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/b12319ea726684152f0834c476ec1065aedf3162"},{"sha":"733a490644efcb99e808ff7ef0fb532c84e71c4b","author":{"email":"4557ca660bca40225ba58749d212d65c650d01ed@rosschurchley.com","name":"Ross Churchley"},"message":"Documentation style","distinct":true,"url":"https://api.github.com/repos/rchurchley/copernicus/commits/733a490644efcb99e808ff7ef0fb532c84e71c4b"}]},"public":true,"created_at":"2015-01-01T01:00:35Z"}
{"id":"2489396088","type":"PushEvent","actor":{"id":210312,"login":"micahyoung","gravatar_id":"","url":"https://api.github.com/users/micahyoung","avatar_url":"https://avatars.githubusercontent.com/u/210312?"},"repo":{"id":25281621,"name":"micahyoung/citibike-data","url":"https://api.github.com/repos/micahyoung/citibike-data"},"payload":{"push_id":536752307,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"2f65fdd10fec0238a57fb81531e3c308dcf78515","before":"563bc4bc7f24f05120ff9007ae5e52b3853fcbf9","commits":[{"sha":"2f65fdd10fec0238a57fb81531e3c308dcf78515","author":{"email":"45b9372d3d6883e588eb18cca37878d6aa2d5cd5@young.io","name":"Micah Young"},"message":"1420074001","distinct":true,"url":"https://api.github.com/repos/micahyoung/citibike-data/commits/2f65fdd10fec0238a57fb81531e3c308dcf78515"}]},"public":true,"created_at":"2015-01-01T01:00:35Z"}
{"id":"2489396089","type":"IssueCommentEvent","actor":{"id":2605378,"login":"fivdi","gravatar_id":"","url":"https://api.github.com/users/fivdi","avatar_url":"https://avatars.githubusercontent.com/u/2605378?"},"repo":{"id":3880513,"name":"rwaldron/johnny-five","url":"https://api.github.com/repos/rwaldron/johnny-five"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/rwaldron/johnny-five/issues/524","labels_url":"https://api.github.com/repos/rwaldron/johnny-five/issues/524/labels{/name}","comments_url":"https://api.github.com/repos/rwaldron/johnny-five/issues/524/comments","events_url":"https://api.github.com/repos/rwaldron/johnny-five/issues/524/events","html_url":"https://github.com/rwaldron/johnny-five/issues/524","id":51204388,"number":524,"title":"beaglebone-io & i2c head scratcher","user":{"login":"MrYsLab","id":5189838,"avatar_url":"https://avatars.githubusercontent.com/u/5189838?v=3","gravatar_id":"","url":"https://api.github.com/users/MrYsLab","html_url":"https://github.com/MrYsLab","followers_url":"https://api.github.com/users/MrYsLab/followers","following_url":"https://api.github.com/users/MrYsLab/following{/other_user}","gists_url":"https://api.github.com/users/MrYsLab/gists{/gist_id}","starred_url":"https://api.github.com/users/MrYsLab/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/MrYsLab/subscriptions","organizations_url":"https://api.github.com/users/MrYsLab/orgs","repos_url":"https://api.github.com/users/MrYsLab/repos","events_url":"https://api.github.com/users/MrYsLab/events{/privacy}","received_events_url":"https://api.github.com/users/MrYsLab/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":23,"created_at":"2014-12-07T02:10:56Z","updated_at":"2015-01-01T01:00:34Z","closed_at":"2014-12-30T16:41:06Z","body":"I have implemented i2c support for the beaglebone-io plugin using the i2c npm module. 
I have tested the code with eg/led-matrix-demo.js and it works identically on both Arduino and the BBB. I have also tested a TMP-102 temperature module with a quick and dirty lib module/demo (not yet ready for publishing). Again, both Arduino and BBB work identically and correctly.\r\n\r\nI am having problems however when i run eg/compass.js. It works fine on my Arduino, but when I run it on the BBB I get one good sample and then it just reports back \"data undefined\" ad infinitum. I am using a 2 amp external power supply with the BBB so I don't think this is a power issue.\r\n\r\nHere is my console output:\r\n\r\ndebian@beaglebone:~$ sudo node compass.js\r\n1417880024942 Device(s) BeagleBone-IO \r\n1417880024975 Connected BeagleBone-IO \r\n1417880024979 Repl Initialized\r\n\r\nheading 339\r\nbearing { name: 'North-NorthWest',\r\nabbr: 'NNW',\r\nlow: 331.88,\r\nmid: 337.5,\r\nhigh: 343.12,\r\nheading: 339 }\r\n(node) warning: possible EventEmitter memory leak detected. 11 listeners added. Use emitter.setMaxListeners() to increase limit.\r\nTrace\r\nat process.EventEmitter.addListener (events.js:160:15)\r\nat process.on.process.addListener (node.js:769:26)\r\nat new i2c (/home/debian/node_modules/beaglebone-io/node_modules/i2c/lib/i2c.coffee:34:15)\r\nat BeagleBone.sendI2CReadRequest (/home/debian/node_modules/beaglebone-io/lib/beaglebone.js:367:14)\r\nat Compass. 
(/home/debian/node_modules/johnny-five/lib/compass.js:91:13)\r\nat wrapper as _onTimeout\r\nat Timer.listOnTimeout as ontimeout\r\ndata undefined\r\n\r\nAny ideas what I might look at or try?"},"comment":{"url":"https://api.github.com/repos/rwaldron/johnny-five/issues/comments/68477220","html_url":"https://github.com/rwaldron/johnny-five/issues/524#issuecomment-68477220","issue_url":"https://api.github.com/repos/rwaldron/johnny-five/issues/524","id":68477220,"user":{"login":"fivdi","id":2605378,"avatar_url":"https://avatars.githubusercontent.com/u/2605378?v=3","gravatar_id":"","url":"https://api.github.com/users/fivdi","html_url":"https://github.com/fivdi","followers_url":"https://api.github.com/users/fivdi/followers","following_url":"https://api.github.com/users/fivdi/following{/other_user}","gists_url":"https://api.github.com/users/fivdi/gists{/gist_id}","starred_url":"https://api.github.com/users/fivdi/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/fivdi/subscriptions","organizations_url":"https://api.github.com/users/fivdi/orgs","repos_url":"https://api.github.com/users/fivdi/repos","events_url":"https://api.github.com/users/fivdi/events{/privacy}","received_events_url":"https://api.github.com/users/fivdi/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:00:34Z","updated_at":"2015-01-01T01:00:34Z","body":"I'd say that's correct."}},"public":true,"created_at":"2015-01-01T01:00:35Z"}
{"id":"2489396094","type":"PushEvent","actor":{"id":10144074,"login":"carodew","gravatar_id":"","url":"https://api.github.com/users/carodew","avatar_url":"https://avatars.githubusercontent.com/u/10144074?"},"repo":{"id":27844858,"name":"carodew/carodew.github.io","url":"https://api.github.com/repos/carodew/carodew.github.io"},"payload":{"push_id":536752311,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"8b73f1d4d2ee61797b2d644ff44cda0f9b691aeb","before":"513a97293441c42fc14d311e273107115d210e1d","commits":[{"sha":"8b73f1d4d2ee61797b2d644ff44cda0f9b691aeb","author":{"email":"6e3c6f0214740e9061d9ca5c79eb6e0ff9cc1741@unknown542696dd77af.gateway.pace.com","name":"Carolyn"},"message":"update styling for base typography","distinct":true,"url":"https://api.github.com/repos/carodew/carodew.github.io/commits/8b73f1d4d2ee61797b2d644ff44cda0f9b691aeb"}]},"public":true,"created_at":"2015-01-01T01:00:35Z"}
{"id":"2489396097","type":"PushEvent","actor":{"id":909300,"login":"Bike","gravatar_id":"","url":"https://api.github.com/users/Bike","avatar_url":"https://avatars.githubusercontent.com/u/909300?"},"repo":{"id":24974235,"name":"Bike/burke","url":"https://api.github.com/repos/Bike/burke"},"payload":{"push_id":536752314,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"a99f8efe85dd17d4cf79fcf39405f003a4c39ffe","before":"c6a01ee88e26326a841c4364b607ff52c656fd48","commits":[{"sha":"a99f8efe85dd17d4cf79fcf39405f003a4c39ffe","author":{"email":"a15d8c4f8a46f6b42ad26134f414c80bc96140d6@gmail.com","name":"James Kalenius"},"message":"Make ground environment init functional, & add package objects\n\ninitialize_ground is replaced with make_ground, which returns an environment. It\nalso takes a \"package\" as an argument. Packages are lisp-accessible objects that\nhold symbols, which we did globally before this commit. Packages are also c\naccessible so, well, check main.c if you want to see how I'm envisioning the use\nAPI at this time.\n\nThis change may break a few things, namely read (called from within lisp).\nHaven't checked.","distinct":true,"url":"https://api.github.com/repos/Bike/burke/commits/a99f8efe85dd17d4cf79fcf39405f003a4c39ffe"}]},"public":true,"created_at":"2015-01-01T01:00:35Z"}
{"id":"2489396098","type":"PushEvent","actor":{"id":7866761,"login":"calmhorizons","gravatar_id":"","url":"https://api.github.com/users/calmhorizons","avatar_url":"https://avatars.githubusercontent.com/u/7866761?"},"repo":{"id":28292022,"name":"calmhorizons/innerworlds","url":"https://api.github.com/repos/calmhorizons/innerworlds"},"payload":{"push_id":536752315,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"24d4bf91156e009c55831b7fe8e030ed6c41c66c","before":"63c069a3407c634a81c53021d796d2083b6ac602","commits":[{"sha":"24d4bf91156e009c55831b7fe8e030ed6c41c66c","author":{"email":"5d0ccff408c420fe4db31c1ed4e6bb373cdb71a5@internode.on.net","name":"calmhorizons"},"message":"Retired example mod.","distinct":true,"url":"https://api.github.com/repos/calmhorizons/innerworlds/commits/24d4bf91156e009c55831b7fe8e030ed6c41c66c"}]},"public":true,"created_at":"2015-01-01T01:00:35Z"}
{"id":"2489396099","type":"PushEvent","actor":{"id":7727148,"login":"ThadHouse","gravatar_id":"","url":"https://api.github.com/users/ThadHouse","avatar_url":"https://avatars.githubusercontent.com/u/7727148?"},"repo":{"id":26708360,"name":"ThadHouse/SplineGenerator","url":"https://api.github.com/repos/ThadHouse/SplineGenerator"},"payload":{"push_id":536752316,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"8754d22a1254a5a372af8b00928187947e622c60","before":"3a313300b8a8694a20be00b74b25763b015f3549","commits":[{"sha":"9e6bad2c25af5d7d54d364b294933d54e29a0fc2","author":{"email":"3c6d060800eb1ad0bfd1a00db59ad460de4097ae@athometech.com","name":"ThadHouse"},"message":"accidentally typed something...","distinct":true,"url":"https://api.github.com/repos/ThadHouse/SplineGenerator/commits/9e6bad2c25af5d7d54d364b294933d54e29a0fc2"},{"sha":"8754d22a1254a5a372af8b00928187947e622c60","author":{"email":"3c6d060800eb1ad0bfd1a00db59ad460de4097ae@athometech.com","name":"ThadHouse"},"message":"Merge branch 'master' of https://github.com/ThadHouse/SplineGenerator.git","distinct":true,"url":"https://api.github.com/repos/ThadHouse/SplineGenerator/commits/8754d22a1254a5a372af8b00928187947e622c60"}]},"public":true,"created_at":"2015-01-01T01:00:35Z"}
{"id":"2489396101","type":"PushEvent","actor":{"id":210312,"login":"micahyoung","gravatar_id":"","url":"https://api.github.com/users/micahyoung","avatar_url":"https://avatars.githubusercontent.com/u/210312?"},"repo":{"id":16091467,"name":"micahyoung/cbstats-data","url":"https://api.github.com/repos/micahyoung/cbstats-data"},"payload":{"push_id":536752318,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"fed920aaffa850292184a7083200488d6c81c84c","before":"56100d60a9dcf0137f35638266d574c1500b330c","commits":[{"sha":"fed920aaffa850292184a7083200488d6c81c84c","author":{"email":"45b9372d3d6883e588eb18cca37878d6aa2d5cd5@young.io","name":"Micah Young"},"message":"1420074001","distinct":true,"url":"https://api.github.com/repos/micahyoung/cbstats-data/commits/fed920aaffa850292184a7083200488d6c81c84c"}]},"public":true,"created_at":"2015-01-01T01:00:36Z"}
{"id":"2489396118","type":"PushEvent","actor":{"id":370793,"login":"Ratmir15","gravatar_id":"","url":"https://api.github.com/users/Ratmir15","avatar_url":"https://avatars.githubusercontent.com/u/370793?"},"repo":{"id":3652623,"name":"Ratmir15/hz-base","url":"https://api.github.com/repos/Ratmir15/hz-base"},"payload":{"push_id":536752326,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d94072efcb38808e10382a7c4828e6a191375a4e","before":"3fa465de3d29cd3806fadb2fbda9dab0375b1113","commits":[{"sha":"d94072efcb38808e10382a7c4828e6a191375a4e","author":{"email":"1de0837f738a2fcf8dd0b85edef8d919b335fdeb@yandex.ru","name":"Ratmir"},"message":"dump","distinct":true,"url":"https://api.github.com/repos/Ratmir15/hz-base/commits/d94072efcb38808e10382a7c4828e6a191375a4e"}]},"public":true,"created_at":"2015-01-01T01:00:38Z"}
{"id":"2489396123","type":"IssueCommentEvent","actor":{"id":865203,"login":"mrjoelkemp","gravatar_id":"","url":"https://api.github.com/users/mrjoelkemp","avatar_url":"https://avatars.githubusercontent.com/u/865203?"},"repo":{"id":10697582,"name":"jscs-dev/node-jscs","url":"https://api.github.com/repos/jscs-dev/node-jscs"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/jscs-dev/node-jscs/issues/869","labels_url":"https://api.github.com/repos/jscs-dev/node-jscs/issues/869/labels{/name}","comments_url":"https://api.github.com/repos/jscs-dev/node-jscs/issues/869/comments","events_url":"https://api.github.com/repos/jscs-dev/node-jscs/issues/869/events","html_url":"https://github.com/jscs-dev/node-jscs/issues/869","id":53207615,"number":869,"title":"Bug? Node v0.11 and modules/checker checkStdin test","user":{"login":"zxqfox","id":677518,"avatar_url":"https://avatars.githubusercontent.com/u/677518?v=3","gravatar_id":"","url":"https://api.github.com/users/zxqfox","html_url":"https://github.com/zxqfox","followers_url":"https://api.github.com/users/zxqfox/followers","following_url":"https://api.github.com/users/zxqfox/following{/other_user}","gists_url":"https://api.github.com/users/zxqfox/gists{/gist_id}","starred_url":"https://api.github.com/users/zxqfox/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/zxqfox/subscriptions","organizations_url":"https://api.github.com/users/zxqfox/orgs","repos_url":"https://api.github.com/users/zxqfox/repos","events_url":"https://api.github.com/users/zxqfox/events{/privacy}","received_events_url":"https://api.github.com/users/zxqfox/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2014-12-31T23:06:47Z","updated_at":"2015-01-01T01:00:38Z","closed_at":null,"body":"I've used node 0.11 via nvm, ran mocha, and saw:\r\n```\r\n  1 failing\r\n\r\n  1) modules/checker checkStdin returns a 
promise:\r\n     TypeError: Attempted to wrap on which is already wrapped\r\n      at Object.wrapMethod (/home/alex/repos/node-jscs/node_modules/sinon/lib/sinon/util/core.js:78:25)\r\n      at Object.spy (/home/alex/repos/node-jscs/node_modules/sinon/lib/sinon/spy.js:34:26)\r\n      at Context.<anonymous> (/home/alex/repos/node-jscs/test/checker.js:62:29)\r\n      at callFn (/home/alex/repos/node-jscs/node_modules/mocha/lib/runnable.js:251:21)\r\n      at Test.Runnable.run (/home/alex/repos/node-jscs/node_modules/mocha/lib/runnable.js:244:7)\r\n      at Runner.runTest (/home/alex/repos/node-jscs/node_modules/mocha/lib/runner.js:374:10)\r\n      at /home/alex/repos/node-jscs/node_modules/mocha/lib/runner.js:452:12\r\n      at next (/home/alex/repos/node-jscs/node_modules/mocha/lib/runner.js:299:14)\r\n      at /home/alex/repos/node-jscs/node_modules/mocha/lib/runner.js:309:7\r\n      at next (/home/alex/repos/node-jscs/node_modules/mocha/lib/runner.js:248:23)\r\n      at Immediate._onImmediate (/home/alex/repos/node-jscs/node_modules/mocha/lib/runner.js:276:5)\r\n      at processImmediate [as _immediateCallback] (timers.js:374:17)\r\n  --------------\r\n  Error: Stack Trace for original\r\n      at Object.wrapMethod (/home/alex/repos/node-jscs/node_modules/sinon/lib/sinon/util/core.js:98:34)\r\n      at Object.spy (/home/alex/repos/node-jscs/node_modules/sinon/lib/sinon/spy.js:34:26)\r\n      at Context.<anonymous> (/home/alex/repos/node-jscs/test/checker.js:54:29)\r\n      at callFn (/home/alex/repos/node-jscs/node_modules/mocha/lib/runnable.js:251:21)\r\n      at Test.Runnable.run (/home/alex/repos/node-jscs/node_modules/mocha/lib/runnable.js:244:7)\r\n      at Runner.runTest (/home/alex/repos/node-jscs/node_modules/mocha/lib/runner.js:374:10)\r\n      at /home/alex/repos/node-jscs/node_modules/mocha/lib/runner.js:452:12\r\n      at next (/home/alex/repos/node-jscs/node_modules/mocha/lib/runner.js:299:14)\r\n      at 
/home/alex/repos/node-jscs/node_modules/mocha/lib/runner.js:309:7\r\n      at next (/home/alex/repos/node-jscs/node_modules/mocha/lib/runner.js:248:23)\r\n      at Immediate._onImmediate (/home/alex/repos/node-jscs/node_modules/mocha/lib/runner.js:276:5)\r\n      at processImmediate [as _immediateCallback] (timers.js:374:17)\r\n```\r\n\r\n/cc @mrjoelkemp\r\n\r\n<bountysource-plugin>\r\n\r\n---\r\nWant to back this issue? **[Place a bounty on it!](https://www.bountysource.com/issues/7416038-bug-node-v0-11-and-modules-checker-checkstdin-test?utm_campaign=plugin&utm_content=tracker%2F281640&utm_medium=issues&utm_source=github)** We accept bounties via [Bountysource](https://www.bountysource.com/?utm_campaign=plugin&utm_content=tracker%2F281640&utm_medium=issues&utm_source=github).\r\n</bountysource-plugin>"},"comment":{"url":"https://api.github.com/repos/jscs-dev/node-jscs/issues/comments/68477222","html_url":"https://github.com/jscs-dev/node-jscs/issues/869#issuecomment-68477222","issue_url":"https://api.github.com/repos/jscs-dev/node-jscs/issues/869","id":68477222,"user":{"login":"mrjoelkemp","id":865203,"avatar_url":"https://avatars.githubusercontent.com/u/865203?v=3","gravatar_id":"","url":"https://api.github.com/users/mrjoelkemp","html_url":"https://github.com/mrjoelkemp","followers_url":"https://api.github.com/users/mrjoelkemp/followers","following_url":"https://api.github.com/users/mrjoelkemp/following{/other_user}","gists_url":"https://api.github.com/users/mrjoelkemp/gists{/gist_id}","starred_url":"https://api.github.com/users/mrjoelkemp/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/mrjoelkemp/subscriptions","organizations_url":"https://api.github.com/users/mrjoelkemp/orgs","repos_url":"https://api.github.com/users/mrjoelkemp/repos","events_url":"https://api.github.com/users/mrjoelkemp/events{/privacy}","received_events_url":"https://api.github.com/users/mrjoelkemp/received_events","type":"User","site_admin":false},"created_at":"2015
-01-01T01:00:38Z","updated_at":"2015-01-01T01:00:38Z","body":"Thanks for the report! Seems like it's specific to your node version. I had the same thing happen some time ago with an older version of node. Travis doesn't like your fix likely because it's running a newer stable version of node. \r\n\r\nTry upgrading locally if you can? \r\n\r\nHappy new year,  friend :) "}},"public":true,"created_at":"2015-01-01T01:00:39Z","org":{"id":8018201,"login":"jscs-dev","gravatar_id":"","url":"https://api.github.com/orgs/jscs-dev","avatar_url":"https://avatars.githubusercontent.com/u/8018201?"}}
{"id":"2489396126","type":"CreateEvent","actor":{"id":9874887,"login":"Akheon23","gravatar_id":"","url":"https://api.github.com/users/Akheon23","avatar_url":"https://avatars.githubusercontent.com/u/9874887?"},"repo":{"id":28678169,"name":"Akheon23/Node.js","url":"https://api.github.com/repos/Akheon23/Node.js"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:00:39Z"}
{"id":"2489396130","type":"ForkEvent","actor":{"id":9831378,"login":"Amit-P-Amin","gravatar_id":"","url":"https://api.github.com/users/Amit-P-Amin","avatar_url":"https://avatars.githubusercontent.com/u/9831378?"},"repo":{"id":12024210,"name":"appacademy/active_record_lite","url":"https://api.github.com/repos/appacademy/active_record_lite"},"payload":{"forkee":{"id":28678217,"name":"active_record_lite","full_name":"Amit-P-Amin/active_record_lite","owner":{"login":"Amit-P-Amin","id":9831378,"avatar_url":"https://avatars.githubusercontent.com/u/9831378?v=3","gravatar_id":"","url":"https://api.github.com/users/Amit-P-Amin","html_url":"https://github.com/Amit-P-Amin","followers_url":"https://api.github.com/users/Amit-P-Amin/followers","following_url":"https://api.github.com/users/Amit-P-Amin/following{/other_user}","gists_url":"https://api.github.com/users/Amit-P-Amin/gists{/gist_id}","starred_url":"https://api.github.com/users/Amit-P-Amin/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Amit-P-Amin/subscriptions","organizations_url":"https://api.github.com/users/Amit-P-Amin/orgs","repos_url":"https://api.github.com/users/Amit-P-Amin/repos","events_url":"https://api.github.com/users/Amit-P-Amin/events{/privacy}","received_events_url":"https://api.github.com/users/Amit-P-Amin/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/Amit-P-Amin/active_record_lite","description":"","fork":true,"url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite","forks_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/forks","keys_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/keys{/key_id}","collaborators_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/teams","hooks_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/hooks","issue_events_url":
"https://api.github.com/repos/Amit-P-Amin/active_record_lite/issues/events{/number}","events_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/events","assignees_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/assignees{/user}","branches_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/branches{/branch}","tags_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/tags","blobs_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/git/refs{/sha}","trees_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/git/trees{/sha}","statuses_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/statuses/{sha}","languages_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/languages","stargazers_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/stargazers","contributors_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/contributors","subscribers_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/subscribers","subscription_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/subscription","commits_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/commits{/sha}","git_commits_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/git/commits{/sha}","comments_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/comments{/number}","issue_comment_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/issues/comments/{number}","contents_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/contents/{+path}","compare_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/compare/{base}...{head}","merges_url":"https://api.github.com/repos/Amit-P-Amin/active_recor
d_lite/merges","archive_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/downloads","issues_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/issues{/number}","pulls_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/pulls{/number}","milestones_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/milestones{/number}","notifications_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/labels{/name}","releases_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/releases{/id}","created_at":"2015-01-01T01:00:39Z","updated_at":"2014-10-23T23:33:55Z","pushed_at":"2014-10-26T23:37:38Z","git_url":"git://github.com/Amit-P-Amin/active_record_lite.git","ssh_url":"git@github.com:Amit-P-Amin/active_record_lite.git","clone_url":"https://github.com/Amit-P-Amin/active_record_lite.git","svn_url":"https://github.com/Amit-P-Amin/active_record_lite","homepage":null,"size":632,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:00:39Z","org":{"id":2138704,"login":"appacademy","gravatar_id":"","url":"https://api.github.com/orgs/appacademy","avatar_url":"https://avatars.githubusercontent.com/u/2138704?"}}
{"id":"2489396135","type":"PushEvent","actor":{"id":6462036,"login":"samhillman","gravatar_id":"","url":"https://api.github.com/users/samhillman","avatar_url":"https://avatars.githubusercontent.com/u/6462036?"},"repo":{"id":28253700,"name":"samhillman/newdotcom","url":"https://api.github.com/repos/samhillman/newdotcom"},"payload":{"push_id":536752336,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"eb166d0e9ff48e250e0b322ef42013d02dca159c","before":"83eb012480e646f8a84e490bf3700f7441e875a7","commits":[{"sha":"eb166d0e9ff48e250e0b322ef42013d02dca159c","author":{"email":"3f12132dd817f39877292097b6071939bf5ccbcd@cvbay.co.uk","name":"Sam Hillman"},"message":"changed css","distinct":true,"url":"https://api.github.com/repos/samhillman/newdotcom/commits/eb166d0e9ff48e250e0b322ef42013d02dca159c"}]},"public":true,"created_at":"2015-01-01T01:00:40Z"}
{"id":"2489396143","type":"PushEvent","actor":{"id":20114,"login":"jdillon","gravatar_id":"","url":"https://api.github.com/users/jdillon","avatar_url":"https://avatars.githubusercontent.com/u/20114?"},"repo":{"id":10146961,"name":"sonatype/nexus-oss","url":"https://api.github.com/repos/sonatype/nexus-oss"},"payload":{"push_id":536752341,"size":6,"distinct_size":6,"ref":"refs/heads/nexus-cma","head":"bdb37c4b14d58c8f958f15050517a1ef1bf01c27","before":"f0590dba44a66b8a2ac16a74c3d7c387d6c33f90","commits":[{"sha":"c965763022e63b350354f1b49905bdee35cac22b","author":{"email":"68c46a606457643eab92053c1c05574abb26f861@planet57.com","name":"Jason Dillon"},"message":"Fix injected type name","distinct":true,"url":"https://api.github.com/repos/sonatype/nexus-oss/commits/c965763022e63b350354f1b49905bdee35cac22b"},{"sha":"9ae76c75d6fbe07d50d9563f156a909552ff07e9","author":{"email":"68c46a606457643eab92053c1c05574abb26f861@planet57.com","name":"Jason Dillon"},"message":"Add start of simple proxy recipe","distinct":true,"url":"https://api.github.com/repos/sonatype/nexus-oss/commits/9ae76c75d6fbe07d50d9563f156a909552ff07e9"},{"sha":"b8faa254870db34b17c660b6f263f6b85e300c81","author":{"email":"68c46a606457643eab92053c1c05574abb26f861@planet57.com","name":"Jason Dillon"},"message":"Mark as component, Simplify, update cheetsheet","distinct":true,"url":"https://api.github.com/repos/sonatype/nexus-oss/commits/b8faa254870db34b17c660b6f263f6b85e300c81"},{"sha":"659f782ed5530e2a659f69ed10c2462d5955b8de","author":{"email":"68c46a606457643eab92053c1c05574abb26f861@planet57.com","name":"Jason Dillon"},"message":"Simplify names","distinct":true,"url":"https://api.github.com/repos/sonatype/nexus-oss/commits/659f782ed5530e2a659f69ed10c2462d5955b8de"},{"sha":"2c07fa298017131e484db9bce2f91d8a7dc16335","author":{"email":"68c46a606457643eab92053c1c05574abb26f861@planet57.com","name":"Jason Dillon"},"message":"debug -> 
trace","distinct":true,"url":"https://api.github.com/repos/sonatype/nexus-oss/commits/2c07fa298017131e484db9bce2f91d8a7dc16335"},{"sha":"bdb37c4b14d58c8f958f15050517a1ef1bf01c27","author":{"email":"68c46a606457643eab92053c1c05574abb26f861@planet57.com","name":"Jason Dillon"},"message":"blah","distinct":true,"url":"https://api.github.com/repos/sonatype/nexus-oss/commits/bdb37c4b14d58c8f958f15050517a1ef1bf01c27"}]},"public":true,"created_at":"2015-01-01T01:00:41Z","org":{"id":44938,"login":"sonatype","gravatar_id":"","url":"https://api.github.com/orgs/sonatype","avatar_url":"https://avatars.githubusercontent.com/u/44938?"}}
{"id":"2489396149","type":"ForkEvent","actor":{"id":8484018,"login":"dskae","gravatar_id":"","url":"https://api.github.com/users/dskae","avatar_url":"https://avatars.githubusercontent.com/u/8484018?"},"repo":{"id":26194619,"name":"EKGAPI/webAppEKGAPI","url":"https://api.github.com/repos/EKGAPI/webAppEKGAPI"},"payload":{"forkee":{"id":28678218,"name":"webAppEKGAPI","full_name":"dskae/webAppEKGAPI","owner":{"login":"dskae","id":8484018,"avatar_url":"https://avatars.githubusercontent.com/u/8484018?v=3","gravatar_id":"","url":"https://api.github.com/users/dskae","html_url":"https://github.com/dskae","followers_url":"https://api.github.com/users/dskae/followers","following_url":"https://api.github.com/users/dskae/following{/other_user}","gists_url":"https://api.github.com/users/dskae/gists{/gist_id}","starred_url":"https://api.github.com/users/dskae/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/dskae/subscriptions","organizations_url":"https://api.github.com/users/dskae/orgs","repos_url":"https://api.github.com/users/dskae/repos","events_url":"https://api.github.com/users/dskae/events{/privacy}","received_events_url":"https://api.github.com/users/dskae/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/dskae/webAppEKGAPI","description":"webAppEKGAPI","fork":true,"url":"https://api.github.com/repos/dskae/webAppEKGAPI","forks_url":"https://api.github.com/repos/dskae/webAppEKGAPI/forks","keys_url":"https://api.github.com/repos/dskae/webAppEKGAPI/keys{/key_id}","collaborators_url":"https://api.github.com/repos/dskae/webAppEKGAPI/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/dskae/webAppEKGAPI/teams","hooks_url":"https://api.github.com/repos/dskae/webAppEKGAPI/hooks","issue_events_url":"https://api.github.com/repos/dskae/webAppEKGAPI/issues/events{/number}","events_url":"https://api.github.com/repos/dskae/webAppEKGAPI/events","assignees_url":"https://api.github.com/repos/dskae
/webAppEKGAPI/assignees{/user}","branches_url":"https://api.github.com/repos/dskae/webAppEKGAPI/branches{/branch}","tags_url":"https://api.github.com/repos/dskae/webAppEKGAPI/tags","blobs_url":"https://api.github.com/repos/dskae/webAppEKGAPI/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/dskae/webAppEKGAPI/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/dskae/webAppEKGAPI/git/refs{/sha}","trees_url":"https://api.github.com/repos/dskae/webAppEKGAPI/git/trees{/sha}","statuses_url":"https://api.github.com/repos/dskae/webAppEKGAPI/statuses/{sha}","languages_url":"https://api.github.com/repos/dskae/webAppEKGAPI/languages","stargazers_url":"https://api.github.com/repos/dskae/webAppEKGAPI/stargazers","contributors_url":"https://api.github.com/repos/dskae/webAppEKGAPI/contributors","subscribers_url":"https://api.github.com/repos/dskae/webAppEKGAPI/subscribers","subscription_url":"https://api.github.com/repos/dskae/webAppEKGAPI/subscription","commits_url":"https://api.github.com/repos/dskae/webAppEKGAPI/commits{/sha}","git_commits_url":"https://api.github.com/repos/dskae/webAppEKGAPI/git/commits{/sha}","comments_url":"https://api.github.com/repos/dskae/webAppEKGAPI/comments{/number}","issue_comment_url":"https://api.github.com/repos/dskae/webAppEKGAPI/issues/comments/{number}","contents_url":"https://api.github.com/repos/dskae/webAppEKGAPI/contents/{+path}","compare_url":"https://api.github.com/repos/dskae/webAppEKGAPI/compare/{base}...{head}","merges_url":"https://api.github.com/repos/dskae/webAppEKGAPI/merges","archive_url":"https://api.github.com/repos/dskae/webAppEKGAPI/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/dskae/webAppEKGAPI/downloads","issues_url":"https://api.github.com/repos/dskae/webAppEKGAPI/issues{/number}","pulls_url":"https://api.github.com/repos/dskae/webAppEKGAPI/pulls{/number}","milestones_url":"https://api.github.com/repos/dskae/webAppEKGAPI/milestones{/number}","notifications_url":"https://api.gith
ub.com/repos/dskae/webAppEKGAPI/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/dskae/webAppEKGAPI/labels{/name}","releases_url":"https://api.github.com/repos/dskae/webAppEKGAPI/releases{/id}","created_at":"2015-01-01T01:00:41Z","updated_at":"2015-01-01T00:57:42Z","pushed_at":"2015-01-01T00:57:42Z","git_url":"git://github.com/dskae/webAppEKGAPI.git","ssh_url":"git@github.com:dskae/webAppEKGAPI.git","clone_url":"https://github.com/dskae/webAppEKGAPI.git","svn_url":"https://github.com/dskae/webAppEKGAPI","homepage":null,"size":2776,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:00:41Z","org":{"id":9016021,"login":"EKGAPI","gravatar_id":"","url":"https://api.github.com/orgs/EKGAPI","avatar_url":"https://avatars.githubusercontent.com/u/9016021?"}}
{"id":"2489396153","type":"PushEvent","actor":{"id":1221156,"login":"fyfe","gravatar_id":"","url":"https://api.github.com/users/fyfe","avatar_url":"https://avatars.githubusercontent.com/u/1221156?"},"repo":{"id":28673837,"name":"fyfe/git-test","url":"https://api.github.com/repos/fyfe/git-test"},"payload":{"push_id":536752348,"size":1,"distinct_size":1,"ref":"refs/heads/feature/documentation","head":"ff2bf3e6e5ca5f2db8d995fb7e1a982b0d6c54ac","before":"5a1391eb7be74927581985100b2274f264a28386","commits":[{"sha":"ff2bf3e6e5ca5f2db8d995fb7e1a982b0d6c54ac","author":{"email":"02e0a999c50b1f88df7a8f5a04e1b76b35ea6a88@neptune-one.net","name":"Andrew Fyfe"},"message":"docs(developer-notes.md): documentation for developers/contributers","distinct":true,"url":"https://api.github.com/repos/fyfe/git-test/commits/ff2bf3e6e5ca5f2db8d995fb7e1a982b0d6c54ac"}]},"public":true,"created_at":"2015-01-01T01:00:42Z"}
{"id":"2489396163","type":"PushEvent","actor":{"id":6737270,"login":"JorgeX","gravatar_id":"","url":"https://api.github.com/users/JorgeX","avatar_url":"https://avatars.githubusercontent.com/u/6737270?"},"repo":{"id":25890220,"name":"JorgeX/dojo_rules","url":"https://api.github.com/repos/JorgeX/dojo_rules"},"payload":{"push_id":536752355,"size":1,"distinct_size":1,"ref":"refs/heads/deadly_skills","head":"923b0ffbc6a7f2fc6ff55b6d415fe70f824ea5e0","before":"fa8f9c257f146f27b1fbdc561e0f5c0b5e50e07c","commits":[{"sha":"923b0ffbc6a7f2fc6ff55b6d415fe70f824ea5e0","author":{"email":"33f927344e079e00d3fa45d8833b04e735223eec@Jorges-MacBook-Pro.local","name":"Jörge Ojanen"},"message":"ok323","distinct":true,"url":"https://api.github.com/repos/JorgeX/dojo_rules/commits/923b0ffbc6a7f2fc6ff55b6d415fe70f824ea5e0"}]},"public":true,"created_at":"2015-01-01T01:00:43Z"}
{"id":"2489396164","type":"PushEvent","actor":{"id":4153853,"login":"jlumijarvi","gravatar_id":"","url":"https://api.github.com/users/jlumijarvi","avatar_url":"https://avatars.githubusercontent.com/u/4153853?"},"repo":{"id":28678176,"name":"jlumijarvi/csv2xml","url":"https://api.github.com/repos/jlumijarvi/csv2xml"},"payload":{"push_id":536752356,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"8c339f97ba859406034a4b4803ff9f10986c16ea","before":"0366b227c1b20d451524d9712bb67771daa739f3","commits":[{"sha":"8c339f97ba859406034a4b4803ff9f10986c16ea","author":{"email":"40e6fc59d2535c98bfd5d19357e20df6e95cef64@gmail.com","name":"jlumijarvi"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/jlumijarvi/csv2xml/commits/8c339f97ba859406034a4b4803ff9f10986c16ea"}]},"public":true,"created_at":"2015-01-01T01:00:43Z"}
{"id":"2489396174","type":"PushEvent","actor":{"id":3990482,"login":"rosbuild","gravatar_id":"","url":"https://api.github.com/users/rosbuild","avatar_url":"https://avatars.githubusercontent.com/u/3990482?"},"repo":{"id":14125815,"name":"osrf/www.ros.org","url":"https://api.github.com/repos/osrf/www.ros.org"},"payload":{"push_id":536752363,"size":1,"distinct_size":1,"ref":"refs/heads/wordpressdb","head":"e37c3ad58cd26e5d95ba8209561ff1d54f68ff67","before":"0b551ea0ff449633f82f355144e7633b6d19380d","commits":[{"sha":"e37c3ad58cd26e5d95ba8209561ff1d54f68ff67","author":{"email":"c2678b3531040209f84244ce8534556c3494c8b3@osrfoundation.org","name":"Your Name"},"message":"automatic db update","distinct":true,"url":"https://api.github.com/repos/osrf/www.ros.org/commits/e37c3ad58cd26e5d95ba8209561ff1d54f68ff67"}]},"public":true,"created_at":"2015-01-01T01:00:43Z","org":{"id":3999730,"login":"osrf","gravatar_id":"","url":"https://api.github.com/orgs/osrf","avatar_url":"https://avatars.githubusercontent.com/u/3999730?"}}
{"id":"2489396182","type":"PushEvent","actor":{"id":3013275,"login":"rohatiro","gravatar_id":"","url":"https://api.github.com/users/rohatiro","avatar_url":"https://avatars.githubusercontent.com/u/3013275?"},"repo":{"id":23979538,"name":"rohatiro/apis","url":"https://api.github.com/repos/rohatiro/apis"},"payload":{"push_id":536752368,"size":9,"distinct_size":0,"ref":"refs/heads/soundcloud","head":"e60a4d532602c4df08a1a019d759ecac297fce89","before":"9a0c6b42bb3d3a112784abfe86f937d033e59689","commits":[{"sha":"a0cc0cf97f7c94da62dcfb80a0c71ff1d3e2a43e","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Utilizando Passport con el API de Github","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/a0cc0cf97f7c94da62dcfb80a0c71ff1d3e2a43e"},{"sha":"05031ae044ff6a66569b6caa61bdea7cfb80f6b9","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Obtención de perfil de usuario en github","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/05031ae044ff6a66569b6caa61bdea7cfb80f6b9"},{"sha":"d64269c3a069b30cc148086ca1d4e450b0cf074c","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Manejo de información del usuario","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/d64269c3a069b30cc148086ca1d4e450b0cf074c"},{"sha":"c104fa4b165a5a0f98c7fc8c8f1bd4f64d6bbabb","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Utilización de Bootstrap para estilos de las paginas","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/c104fa4b165a5a0f98c7fc8c8f1bd4f64d6bbabb"},{"sha":"5f746f48b8a9c9ad896e67045d41894fe311d7f3","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda 
Rodríguez"},"message":"Obteniendo repositorios de Usuario de Github con request","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/5f746f48b8a9c9ad896e67045d41894fe311d7f3"},{"sha":"604f5ac73f6e928852e5ea727f03bf3c15ab95f0","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Modularizando la funcionalidad de autorización de apis","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/604f5ac73f6e928852e5ea727f03bf3c15ab95f0"},{"sha":"7ab8b993d9c7b23a887a9ff035ebeefa5c677baa","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Autorizando usuarios con la api de SoundCloud","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/7ab8b993d9c7b23a887a9ff035ebeefa5c677baa"},{"sha":"a1ed42e4db1832f9c1e0352cf4dd79b62dec2b0d","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Utilización de proxy para obtener streams de tracks de soundcloud","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/a1ed42e4db1832f9c1e0352cf4dd79b62dec2b0d"},{"sha":"e60a4d532602c4df08a1a019d759ecac297fce89","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Corrigiendo repositorio para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/e60a4d532602c4df08a1a019d759ecac297fce89"}]},"public":true,"created_at":"2015-01-01T01:00:44Z"}
{"id":"2489396183","type":"PushEvent","actor":{"id":3013275,"login":"rohatiro","gravatar_id":"","url":"https://api.github.com/users/rohatiro","avatar_url":"https://avatars.githubusercontent.com/u/3013275?"},"repo":{"id":23979538,"name":"rohatiro/apis","url":"https://api.github.com/repos/rohatiro/apis"},"payload":{"push_id":536752369,"size":125,"distinct_size":0,"ref":"refs/heads/temp","head":"9192bc90762e7b78ecc1e5ce5c0787cf13436cf8","before":"85d2f655fd86f8b77dc07ad12284e1d65542be22","commits":[{"sha":"a0cc0cf97f7c94da62dcfb80a0c71ff1d3e2a43e","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Utilizando Passport con el API de Github","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/a0cc0cf97f7c94da62dcfb80a0c71ff1d3e2a43e"},{"sha":"05031ae044ff6a66569b6caa61bdea7cfb80f6b9","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Obtención de perfil de usuario en github","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/05031ae044ff6a66569b6caa61bdea7cfb80f6b9"},{"sha":"d64269c3a069b30cc148086ca1d4e450b0cf074c","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Manejo de información del usuario","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/d64269c3a069b30cc148086ca1d4e450b0cf074c"},{"sha":"c104fa4b165a5a0f98c7fc8c8f1bd4f64d6bbabb","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Utilización de Bootstrap para estilos de las paginas","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/c104fa4b165a5a0f98c7fc8c8f1bd4f64d6bbabb"},{"sha":"5f746f48b8a9c9ad896e67045d41894fe311d7f3","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda 
Rodríguez"},"message":"Obteniendo repositorios de Usuario de Github con request","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/5f746f48b8a9c9ad896e67045d41894fe311d7f3"},{"sha":"604f5ac73f6e928852e5ea727f03bf3c15ab95f0","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Modularizando la funcionalidad de autorización de apis","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/604f5ac73f6e928852e5ea727f03bf3c15ab95f0"},{"sha":"7ab8b993d9c7b23a887a9ff035ebeefa5c677baa","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Autorizando usuarios con la api de SoundCloud","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/7ab8b993d9c7b23a887a9ff035ebeefa5c677baa"},{"sha":"a1ed42e4db1832f9c1e0352cf4dd79b62dec2b0d","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Utilización de proxy para obtener streams de tracks de soundcloud","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/a1ed42e4db1832f9c1e0352cf4dd79b62dec2b0d"},{"sha":"e60a4d532602c4df08a1a019d759ecac297fce89","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Corrigiendo repositorio para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/e60a4d532602c4df08a1a019d759ecac297fce89"},{"sha":"41827cebc27d1c20c37f9d1663afff27bf56985c","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Corrigiendo repositorio para 
heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/41827cebc27d1c20c37f9d1663afff27bf56985c"},{"sha":"f27ba51a8ca648f180fb95ce336b7d4ed2db6cf2","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Corrigiendo repositorio para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/f27ba51a8ca648f180fb95ce336b7d4ed2db6cf2"},{"sha":"5010b01e82fc526a16402712710dd7ef73d8086f","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Corrigiendo repositorio para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/5010b01e82fc526a16402712710dd7ef73d8086f"},{"sha":"7a903d21c5d3199520737de1228307b71e717a95","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Corrigiendo repositorio para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/7a903d21c5d3199520737de1228307b71e717a95"},{"sha":"ffbdb7c9aafdeb531a75b4cf64bdf1339058e8b9","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Cambios para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/ffbdb7c9aafdeb531a75b4cf64bdf1339058e8b9"},{"sha":"2c5fc015ed0b0dfcb893dec64f74cddf17e8d0c6","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Cambios en la vista de la pagina inicial de soundcloud","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/2c5fc015ed0b0dfcb893dec64f74cddf17e8d0c6"},{"sha":"76068ac452376c96f6feb6f07ff99566efa3a285","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Cambios para 
heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/76068ac452376c96f6feb6f07ff99566efa3a285"},{"sha":"30c618724a70fe1bf06a5b484345b939b89f15e9","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Cambios para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/30c618724a70fe1bf06a5b484345b939b89f15e9"},{"sha":"9633445f2d373e68703b30f3fd15fd7240d31f6b","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Cambios para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/9633445f2d373e68703b30f3fd15fd7240d31f6b"},{"sha":"e3328c01916e16f2cb14ee5613dd0b9c04a4c067","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Cambios para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/e3328c01916e16f2cb14ee5613dd0b9c04a4c067"},{"sha":"f99a48fcedea35168b2e23421745fa2c16d232a4","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Prueba para obtener el waveform","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/f99a48fcedea35168b2e23421745fa2c16d232a4"}]},"public":true,"created_at":"2015-01-01T01:00:44Z"}
{"id":"2489396185","type":"PushEvent","actor":{"id":3013275,"login":"rohatiro","gravatar_id":"","url":"https://api.github.com/users/rohatiro","avatar_url":"https://avatars.githubusercontent.com/u/3013275?"},"repo":{"id":23979538,"name":"rohatiro/apis","url":"https://api.github.com/repos/rohatiro/apis"},"payload":{"push_id":536752370,"size":126,"distinct_size":1,"ref":"refs/heads/master","head":"36d1b23ede8251ca74685fad9fdbf219733be4dd","before":"3d37eb7613b5559e4eb66c0555ecbd589b25922d","commits":[{"sha":"a0cc0cf97f7c94da62dcfb80a0c71ff1d3e2a43e","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Utilizando Passport con el API de Github","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/a0cc0cf97f7c94da62dcfb80a0c71ff1d3e2a43e"},{"sha":"05031ae044ff6a66569b6caa61bdea7cfb80f6b9","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Obtención de perfil de usuario en github","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/05031ae044ff6a66569b6caa61bdea7cfb80f6b9"},{"sha":"d64269c3a069b30cc148086ca1d4e450b0cf074c","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Manejo de información del usuario","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/d64269c3a069b30cc148086ca1d4e450b0cf074c"},{"sha":"c104fa4b165a5a0f98c7fc8c8f1bd4f64d6bbabb","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Utilización de Bootstrap para estilos de las paginas","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/c104fa4b165a5a0f98c7fc8c8f1bd4f64d6bbabb"},{"sha":"5f746f48b8a9c9ad896e67045d41894fe311d7f3","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda 
Rodríguez"},"message":"Obteniendo repositorios de Usuario de Github con request","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/5f746f48b8a9c9ad896e67045d41894fe311d7f3"},{"sha":"604f5ac73f6e928852e5ea727f03bf3c15ab95f0","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Modularizando la funcionalidad de autorización de apis","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/604f5ac73f6e928852e5ea727f03bf3c15ab95f0"},{"sha":"7ab8b993d9c7b23a887a9ff035ebeefa5c677baa","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Autorizando usuarios con la api de SoundCloud","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/7ab8b993d9c7b23a887a9ff035ebeefa5c677baa"},{"sha":"a1ed42e4db1832f9c1e0352cf4dd79b62dec2b0d","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Utilización de proxy para obtener streams de tracks de soundcloud","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/a1ed42e4db1832f9c1e0352cf4dd79b62dec2b0d"},{"sha":"e60a4d532602c4df08a1a019d759ecac297fce89","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Corrigiendo repositorio para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/e60a4d532602c4df08a1a019d759ecac297fce89"},{"sha":"41827cebc27d1c20c37f9d1663afff27bf56985c","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Corrigiendo repositorio para 
heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/41827cebc27d1c20c37f9d1663afff27bf56985c"},{"sha":"f27ba51a8ca648f180fb95ce336b7d4ed2db6cf2","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Corrigiendo repositorio para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/f27ba51a8ca648f180fb95ce336b7d4ed2db6cf2"},{"sha":"5010b01e82fc526a16402712710dd7ef73d8086f","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Corrigiendo repositorio para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/5010b01e82fc526a16402712710dd7ef73d8086f"},{"sha":"7a903d21c5d3199520737de1228307b71e717a95","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Corrigiendo repositorio para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/7a903d21c5d3199520737de1228307b71e717a95"},{"sha":"ffbdb7c9aafdeb531a75b4cf64bdf1339058e8b9","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Cambios para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/ffbdb7c9aafdeb531a75b4cf64bdf1339058e8b9"},{"sha":"2c5fc015ed0b0dfcb893dec64f74cddf17e8d0c6","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Cambios en la vista de la pagina inicial de soundcloud","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/2c5fc015ed0b0dfcb893dec64f74cddf17e8d0c6"},{"sha":"76068ac452376c96f6feb6f07ff99566efa3a285","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Cambios para 
heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/76068ac452376c96f6feb6f07ff99566efa3a285"},{"sha":"30c618724a70fe1bf06a5b484345b939b89f15e9","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Cambios para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/30c618724a70fe1bf06a5b484345b939b89f15e9"},{"sha":"9633445f2d373e68703b30f3fd15fd7240d31f6b","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Cambios para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/9633445f2d373e68703b30f3fd15fd7240d31f6b"},{"sha":"e3328c01916e16f2cb14ee5613dd0b9c04a4c067","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Cambios para heroku","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/e3328c01916e16f2cb14ee5613dd0b9c04a4c067"},{"sha":"f99a48fcedea35168b2e23421745fa2c16d232a4","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Prueba para obtener el waveform","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/f99a48fcedea35168b2e23421745fa2c16d232a4"}]},"public":true,"created_at":"2015-01-01T01:00:44Z"}
{"id":"2489396186","type":"PushEvent","actor":{"id":3013275,"login":"rohatiro","gravatar_id":"","url":"https://api.github.com/users/rohatiro","avatar_url":"https://avatars.githubusercontent.com/u/3013275?"},"repo":{"id":23979538,"name":"rohatiro/apis","url":"https://api.github.com/repos/rohatiro/apis"},"payload":{"push_id":536752371,"size":7,"distinct_size":1,"ref":"refs/heads/github","head":"0c6236cbbaa52265af1510ec177e26ebef449cd2","before":"e9070469477c9228dd12da0a32072b4a0a271912","commits":[{"sha":"a0cc0cf97f7c94da62dcfb80a0c71ff1d3e2a43e","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Utilizando Passport con el API de Github","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/a0cc0cf97f7c94da62dcfb80a0c71ff1d3e2a43e"},{"sha":"05031ae044ff6a66569b6caa61bdea7cfb80f6b9","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Obtención de perfil de usuario en github","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/05031ae044ff6a66569b6caa61bdea7cfb80f6b9"},{"sha":"d64269c3a069b30cc148086ca1d4e450b0cf074c","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Manejo de información del usuario","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/d64269c3a069b30cc148086ca1d4e450b0cf074c"},{"sha":"c104fa4b165a5a0f98c7fc8c8f1bd4f64d6bbabb","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Utilización de Bootstrap para estilos de las paginas","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/c104fa4b165a5a0f98c7fc8c8f1bd4f64d6bbabb"},{"sha":"5f746f48b8a9c9ad896e67045d41894fe311d7f3","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda 
Rodríguez"},"message":"Obteniendo repositorios de Usuario de Github con request","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/5f746f48b8a9c9ad896e67045d41894fe311d7f3"},{"sha":"604f5ac73f6e928852e5ea727f03bf3c15ab95f0","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Modularizando la funcionalidad de autorización de apis","distinct":false,"url":"https://api.github.com/repos/rohatiro/apis/commits/604f5ac73f6e928852e5ea727f03bf3c15ab95f0"},{"sha":"0c6236cbbaa52265af1510ec177e26ebef449cd2","author":{"email":"cf4c21b09c947740db10e2ccb7d10819767cd724@gmail.com","name":"Roberto Haziel Tienda Rodríguez"},"message":"Rediseño del api de github","distinct":true,"url":"https://api.github.com/repos/rohatiro/apis/commits/0c6236cbbaa52265af1510ec177e26ebef449cd2"}]},"public":true,"created_at":"2015-01-01T01:00:44Z"}
{"id":"2489396195","type":"PushEvent","actor":{"id":1371300,"login":"hovida","gravatar_id":"","url":"https://api.github.com/users/hovida","avatar_url":"https://avatars.githubusercontent.com/u/1371300?"},"repo":{"id":27575221,"name":"MyChannel-Apps/KFramework","url":"https://api.github.com/repos/MyChannel-Apps/KFramework"},"payload":{"push_id":536752374,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f88618316a96ef97448b5595dd54c5e3478f69e9","before":"bb9b1c88fa505fdf0ad50ab8547141c597127549","commits":[{"sha":"f88618316a96ef97448b5595dd54c5e3478f69e9","author":{"email":"59bd0a3ff43b32849b319e645d4798d8a5d1e889@adi-code.de","name":"Adrian Preuß"},"message":"Cronjob: Comment out","distinct":true,"url":"https://api.github.com/repos/MyChannel-Apps/KFramework/commits/f88618316a96ef97448b5595dd54c5e3478f69e9"}]},"public":true,"created_at":"2015-01-01T01:00:45Z","org":{"id":10083083,"login":"MyChannel-Apps","gravatar_id":"","url":"https://api.github.com/orgs/MyChannel-Apps","avatar_url":"https://avatars.githubusercontent.com/u/10083083?"}}
{"id":"2489396203","type":"IssueCommentEvent","actor":{"id":18191,"login":"jc00ke","gravatar_id":"","url":"https://api.github.com/users/jc00ke","avatar_url":"https://avatars.githubusercontent.com/u/18191?"},"repo":{"id":10488201,"name":"JeanMertz/chruby-fish","url":"https://api.github.com/repos/JeanMertz/chruby-fish"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/JeanMertz/chruby-fish/issues/14","labels_url":"https://api.github.com/repos/JeanMertz/chruby-fish/issues/14/labels{/name}","comments_url":"https://api.github.com/repos/JeanMertz/chruby-fish/issues/14/comments","events_url":"https://api.github.com/repos/JeanMertz/chruby-fish/issues/14/events","html_url":"https://github.com/JeanMertz/chruby-fish/issues/14","id":52577720,"number":14,"title":"\"path component may not be valid\" warning","user":{"login":"jc00ke","id":18191,"avatar_url":"https://avatars.githubusercontent.com/u/18191?v=3","gravatar_id":"","url":"https://api.github.com/users/jc00ke","html_url":"https://github.com/jc00ke","followers_url":"https://api.github.com/users/jc00ke/followers","following_url":"https://api.github.com/users/jc00ke/following{/other_user}","gists_url":"https://api.github.com/users/jc00ke/gists{/gist_id}","starred_url":"https://api.github.com/users/jc00ke/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jc00ke/subscriptions","organizations_url":"https://api.github.com/users/jc00ke/orgs","repos_url":"https://api.github.com/users/jc00ke/repos","events_url":"https://api.github.com/users/jc00ke/events{/privacy}","received_events_url":"https://api.github.com/users/jc00ke/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2014-12-20T21:52:33Z","updated_at":"2015-01-01T01:00:45Z","closed_at":"2015-01-01T01:00:45Z","body":"```\r\n$> cd ~/projects/foo/\r\nset: Warning: path component 
/home/jesse/.rubies/ruby-2.1.5/lib/ruby/gems/2.1.0/bin may not be valid in PATH.\r\nset: No such file or directory\r\n$> cat .ruby-version\r\n2.1.5\r\n$> chruby --version\r\nchruby: 0.3.9\r\nchruby-fish: 0.6.0\r\n```\r\n\r\n`chruby-fish` is actuall `HEAD` as of e8f28035e7\r\n\r\nIdeas on how to suppress the warning? There's definitely no `bin/` in that `path` above."},"comment":{"url":"https://api.github.com/repos/JeanMertz/chruby-fish/issues/comments/68477225","html_url":"https://github.com/JeanMertz/chruby-fish/issues/14#issuecomment-68477225","issue_url":"https://api.github.com/repos/JeanMertz/chruby-fish/issues/14","id":68477225,"user":{"login":"jc00ke","id":18191,"avatar_url":"https://avatars.githubusercontent.com/u/18191?v=3","gravatar_id":"","url":"https://api.github.com/users/jc00ke","html_url":"https://github.com/jc00ke","followers_url":"https://api.github.com/users/jc00ke/followers","following_url":"https://api.github.com/users/jc00ke/following{/other_user}","gists_url":"https://api.github.com/users/jc00ke/gists{/gist_id}","starred_url":"https://api.github.com/users/jc00ke/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jc00ke/subscriptions","organizations_url":"https://api.github.com/users/jc00ke/orgs","repos_url":"https://api.github.com/users/jc00ke/repos","events_url":"https://api.github.com/users/jc00ke/events{/privacy}","received_events_url":"https://api.github.com/users/jc00ke/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:00:45Z","updated_at":"2015-01-01T01:00:45Z","body":"Thanks @britishtea, I ended up creating the missing directories. Since multiple people reported this, maybe it's worth mentioning in the README? I'll open a PR for that, but I understand if it won't be merged."}},"public":true,"created_at":"2015-01-01T01:00:46Z"}
{"id":"2489396204","type":"IssuesEvent","actor":{"id":18191,"login":"jc00ke","gravatar_id":"","url":"https://api.github.com/users/jc00ke","avatar_url":"https://avatars.githubusercontent.com/u/18191?"},"repo":{"id":10488201,"name":"JeanMertz/chruby-fish","url":"https://api.github.com/repos/JeanMertz/chruby-fish"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/JeanMertz/chruby-fish/issues/14","labels_url":"https://api.github.com/repos/JeanMertz/chruby-fish/issues/14/labels{/name}","comments_url":"https://api.github.com/repos/JeanMertz/chruby-fish/issues/14/comments","events_url":"https://api.github.com/repos/JeanMertz/chruby-fish/issues/14/events","html_url":"https://github.com/JeanMertz/chruby-fish/issues/14","id":52577720,"number":14,"title":"\"path component may not be valid\" warning","user":{"login":"jc00ke","id":18191,"avatar_url":"https://avatars.githubusercontent.com/u/18191?v=3","gravatar_id":"","url":"https://api.github.com/users/jc00ke","html_url":"https://github.com/jc00ke","followers_url":"https://api.github.com/users/jc00ke/followers","following_url":"https://api.github.com/users/jc00ke/following{/other_user}","gists_url":"https://api.github.com/users/jc00ke/gists{/gist_id}","starred_url":"https://api.github.com/users/jc00ke/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jc00ke/subscriptions","organizations_url":"https://api.github.com/users/jc00ke/orgs","repos_url":"https://api.github.com/users/jc00ke/repos","events_url":"https://api.github.com/users/jc00ke/events{/privacy}","received_events_url":"https://api.github.com/users/jc00ke/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2014-12-20T21:52:33Z","updated_at":"2015-01-01T01:00:45Z","closed_at":"2015-01-01T01:00:45Z","body":"```\r\n$> cd ~/projects/foo/\r\nset: Warning: path component /home/jesse/.rubies/ruby-2.1.5/lib/ruby/gems/2.1.0/bin 
may not be valid in PATH.\r\nset: No such file or directory\r\n$> cat .ruby-version\r\n2.1.5\r\n$> chruby --version\r\nchruby: 0.3.9\r\nchruby-fish: 0.6.0\r\n```\r\n\r\n`chruby-fish` is actuall `HEAD` as of e8f28035e7\r\n\r\nIdeas on how to suppress the warning? There's definitely no `bin/` in that `path` above."}},"public":true,"created_at":"2015-01-01T01:00:46Z"}
{"id":"2489396213","type":"PushEvent","actor":{"id":1181205,"login":"malekbr","gravatar_id":"","url":"https://api.github.com/users/malekbr","avatar_url":"https://avatars.githubusercontent.com/u/1181205?"},"repo":{"id":28657751,"name":"malekbr/PeevedPenguinsTemplate-Spritebuilder","url":"https://api.github.com/repos/malekbr/PeevedPenguinsTemplate-Spritebuilder"},"payload":{"push_id":536752379,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"3084e78941af25cb8d49f4a9483e17ad41bcfd3e","before":"711944c3b36b8c6cc591c507db7c442d70ab02cf","commits":[{"sha":"3084e78941af25cb8d49f4a9483e17ad41bcfd3e","author":{"email":"73d3febb659ea118d8f1f9f1ff5f5ae09f3ca6d6@Mings-MacBook-Air.local","name":"Malek Ben Romdhane"},"message":"Automatically Committed for MakeGamesWithUs","distinct":true,"url":"https://api.github.com/repos/malekbr/PeevedPenguinsTemplate-Spritebuilder/commits/3084e78941af25cb8d49f4a9483e17ad41bcfd3e"}]},"public":true,"created_at":"2015-01-01T01:00:46Z"}
{"id":"2489396216","type":"CreateEvent","actor":{"id":6982503,"login":"josephsands","gravatar_id":"","url":"https://api.github.com/users/josephsands","avatar_url":"https://avatars.githubusercontent.com/u/6982503?"},"repo":{"id":28678205,"name":"josephsands/josephsands.github.io","url":"https://api.github.com/repos/josephsands/josephsands.github.io"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"Independent iOS Developer Blog","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:00:46Z"}
{"id":"2489396218","type":"PushEvent","actor":{"id":954353,"login":"byronmccollum","gravatar_id":"","url":"https://api.github.com/users/byronmccollum","avatar_url":"https://avatars.githubusercontent.com/u/954353?"},"repo":{"id":14756639,"name":"byronmccollum/webscript.io-modules","url":"https://api.github.com/repos/byronmccollum/webscript.io-modules"},"payload":{"push_id":536752382,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"a6c25ed5f1bf15abfa2a8aa67dbcd6e560953296","before":"e90f21829951d8cc8d6dd79effefcda4cb7712e2","commits":[{"sha":"a6c25ed5f1bf15abfa2a8aa67dbcd6e560953296","author":{"email":"5c33cd3f0e8876e7150963b90c8e5c3e219c1462@rackspace.com","name":"Byron McCollum"},"message":"Create diff.lua","distinct":true,"url":"https://api.github.com/repos/byronmccollum/webscript.io-modules/commits/a6c25ed5f1bf15abfa2a8aa67dbcd6e560953296"}]},"public":true,"created_at":"2015-01-01T01:00:46Z"}
{"id":"2489396220","type":"PushEvent","actor":{"id":1167760,"login":"afawcett","gravatar_id":"","url":"https://api.github.com/users/afawcett","avatar_url":"https://avatars.githubusercontent.com/u/1167760?"},"repo":{"id":28570910,"name":"afawcett/littlebits-connector","url":"https://api.github.com/repos/afawcett/littlebits-connector"},"payload":{"push_id":536752383,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"3f4328e42d2051646d27b9ab14c011d4794c99bd","before":"0679908a11f472cc3787d2542850550b3dff2e5d","commits":[{"sha":"3f4328e42d2051646d27b9ab14c011d4794c99bd","author":{"email":"e3579b1e47f273529f0f929453e939a68ede9fd1@andyinthecloud.com","name":"Andrew Fawcett"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/afawcett/littlebits-connector/commits/3f4328e42d2051646d27b9ab14c011d4794c99bd"}]},"public":true,"created_at":"2015-01-01T01:00:46Z"}
{"id":"2489396223","type":"WatchEvent","actor":{"id":6186720,"login":"NyanKiyoshi","gravatar_id":"","url":"https://api.github.com/users/NyanKiyoshi","avatar_url":"https://avatars.githubusercontent.com/u/6186720?"},"repo":{"id":17528018,"name":"erming/shout","url":"https://api.github.com/repos/erming/shout"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:00:46Z"}
{"id":"2489396225","type":"PushEvent","actor":{"id":1909779,"login":"omero","gravatar_id":"","url":"https://api.github.com/users/omero","avatar_url":"https://avatars.githubusercontent.com/u/1909779?"},"repo":{"id":19432745,"name":"omero/DrupalAppConsole","url":"https://api.github.com/repos/omero/DrupalAppConsole"},"payload":{"push_id":536752390,"size":1,"distinct_size":1,"ref":"refs/heads/remove_spaces_enity_class","head":"251788240077ded991d18f2bce83e89f1b09c864","before":"95d331818e7794dd248c75b6b7fbde933436e9f6","commits":[{"sha":"251788240077ded991d18f2bce83e89f1b09c864","author":{"email":"767e3cfe24a214e93dd88e66d7764801877079e9@gmail.com","name":"Omar Aguirre Tenorio"},"message":"#272 Adding askAndValidate function for helper dialog","distinct":true,"url":"https://api.github.com/repos/omero/DrupalAppConsole/commits/251788240077ded991d18f2bce83e89f1b09c864"}]},"public":true,"created_at":"2015-01-01T01:00:46Z"}
{"id":"2489396229","type":"PushEvent","actor":{"id":327833,"login":"dobesv","gravatar_id":"","url":"https://api.github.com/users/dobesv","avatar_url":"https://avatars.githubusercontent.com/u/327833?"},"repo":{"id":13713978,"name":"dobesv/functionaljava","url":"https://api.github.com/repos/dobesv/functionaljava"},"payload":{"push_id":536752391,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"3e1e6018a84070a70f0fe4c3f66b84719b98f6d7","before":"c98564f62dabfbeb4d8605f1578808575b18934d","commits":[{"sha":"e5425b09bc4ad462da121eedde1b2d8fb2d30f72","author":{"email":"686276df1403a18d9915ffe92f243f413570b0fc@gmail.com","name":"Dobes Vandermeer"},"message":"More NonNull annotations.","distinct":true,"url":"https://api.github.com/repos/dobesv/functionaljava/commits/e5425b09bc4ad462da121eedde1b2d8fb2d30f72"},{"sha":"3e1e6018a84070a70f0fe4c3f66b84719b98f6d7","author":{"email":"686276df1403a18d9915ffe92f243f413570b0fc@gmail.com","name":"Dobes Vandermeer"},"message":"More added annotations and helper methods.","distinct":true,"url":"https://api.github.com/repos/dobesv/functionaljava/commits/3e1e6018a84070a70f0fe4c3f66b84719b98f6d7"}]},"public":true,"created_at":"2015-01-01T01:00:47Z"}
{"id":"2489396233","type":"IssueCommentEvent","actor":{"id":3650755,"login":"scpeters","gravatar_id":"","url":"https://api.github.com/users/scpeters","avatar_url":"https://avatars.githubusercontent.com/u/3650755?"},"repo":{"id":11771697,"name":"osrf/homebrew-simulation","url":"https://api.github.com/repos/osrf/homebrew-simulation"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/osrf/homebrew-simulation/issues/29","labels_url":"https://api.github.com/repos/osrf/homebrew-simulation/issues/29/labels{/name}","comments_url":"https://api.github.com/repos/osrf/homebrew-simulation/issues/29/comments","events_url":"https://api.github.com/repos/osrf/homebrew-simulation/issues/29/events","html_url":"https://github.com/osrf/homebrew-simulation/issues/29","id":44603425,"number":29,"title":"gazebo failed to build on 10.9.5","user":{"login":"kdorsel","id":2569415,"avatar_url":"https://avatars.githubusercontent.com/u/2569415?v=3","gravatar_id":"","url":"https://api.github.com/users/kdorsel","html_url":"https://github.com/kdorsel","followers_url":"https://api.github.com/users/kdorsel/followers","following_url":"https://api.github.com/users/kdorsel/following{/other_user}","gists_url":"https://api.github.com/users/kdorsel/gists{/gist_id}","starred_url":"https://api.github.com/users/kdorsel/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/kdorsel/subscriptions","organizations_url":"https://api.github.com/users/kdorsel/orgs","repos_url":"https://api.github.com/users/kdorsel/repos","events_url":"https://api.github.com/users/kdorsel/events{/privacy}","received_events_url":"https://api.github.com/users/kdorsel/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":5,"created_at":"2014-10-01T19:10:39Z","updated_at":"2015-01-01T01:00:47Z","closed_at":null,"body":"Failing to build gazebo while trying to install ROS 
Hydro.\r\n\r\nhttps://gist.github.com/anonymous/3d72d247d7126bb44660"},"comment":{"url":"https://api.github.com/repos/osrf/homebrew-simulation/issues/comments/68477227","html_url":"https://github.com/osrf/homebrew-simulation/issues/29#issuecomment-68477227","issue_url":"https://api.github.com/repos/osrf/homebrew-simulation/issues/29","id":68477227,"user":{"login":"scpeters","id":3650755,"avatar_url":"https://avatars.githubusercontent.com/u/3650755?v=3","gravatar_id":"","url":"https://api.github.com/users/scpeters","html_url":"https://github.com/scpeters","followers_url":"https://api.github.com/users/scpeters/followers","following_url":"https://api.github.com/users/scpeters/following{/other_user}","gists_url":"https://api.github.com/users/scpeters/gists{/gist_id}","starred_url":"https://api.github.com/users/scpeters/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/scpeters/subscriptions","organizations_url":"https://api.github.com/users/scpeters/orgs","repos_url":"https://api.github.com/users/scpeters/repos","events_url":"https://api.github.com/users/scpeters/events{/privacy}","received_events_url":"https://api.github.com/users/scpeters/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:00:47Z","updated_at":"2015-01-01T01:00:47Z","body":"The protobuf issues were resolved in [gazebo pull request 1346](https://bitbucket.org/osrf/gazebo/pull-request/1346/fix-build-for-os-x-1010-1304-1289/diff), though there are now some other issues with boost 1.57 that prevent gazebo from building. I have a fix for them waiting for code review. I'll close this when gazebo is building again."}},"public":true,"created_at":"2015-01-01T01:00:47Z","org":{"id":3999730,"login":"osrf","gravatar_id":"","url":"https://api.github.com/orgs/osrf","avatar_url":"https://avatars.githubusercontent.com/u/3999730?"}}
{"id":"2489396234","type":"ForkEvent","actor":{"id":8252171,"login":"WangXYZ","gravatar_id":"","url":"https://api.github.com/users/WangXYZ","avatar_url":"https://avatars.githubusercontent.com/u/8252171?"},"repo":{"id":7673434,"name":"blueboy/portaltbc","url":"https://api.github.com/repos/blueboy/portaltbc"},"payload":{"forkee":{"id":28678219,"name":"portaltbc","full_name":"WangXYZ/portaltbc","owner":{"login":"WangXYZ","id":8252171,"avatar_url":"https://avatars.githubusercontent.com/u/8252171?v=3","gravatar_id":"","url":"https://api.github.com/users/WangXYZ","html_url":"https://github.com/WangXYZ","followers_url":"https://api.github.com/users/WangXYZ/followers","following_url":"https://api.github.com/users/WangXYZ/following{/other_user}","gists_url":"https://api.github.com/users/WangXYZ/gists{/gist_id}","starred_url":"https://api.github.com/users/WangXYZ/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/WangXYZ/subscriptions","organizations_url":"https://api.github.com/users/WangXYZ/orgs","repos_url":"https://api.github.com/users/WangXYZ/repos","events_url":"https://api.github.com/users/WangXYZ/events{/privacy}","received_events_url":"https://api.github.com/users/WangXYZ/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/WangXYZ/portaltbc","description":"playerbot support for C(ontinued)-MaNGOS (tbc 
fork)","fork":true,"url":"https://api.github.com/repos/WangXYZ/portaltbc","forks_url":"https://api.github.com/repos/WangXYZ/portaltbc/forks","keys_url":"https://api.github.com/repos/WangXYZ/portaltbc/keys{/key_id}","collaborators_url":"https://api.github.com/repos/WangXYZ/portaltbc/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/WangXYZ/portaltbc/teams","hooks_url":"https://api.github.com/repos/WangXYZ/portaltbc/hooks","issue_events_url":"https://api.github.com/repos/WangXYZ/portaltbc/issues/events{/number}","events_url":"https://api.github.com/repos/WangXYZ/portaltbc/events","assignees_url":"https://api.github.com/repos/WangXYZ/portaltbc/assignees{/user}","branches_url":"https://api.github.com/repos/WangXYZ/portaltbc/branches{/branch}","tags_url":"https://api.github.com/repos/WangXYZ/portaltbc/tags","blobs_url":"https://api.github.com/repos/WangXYZ/portaltbc/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/WangXYZ/portaltbc/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/WangXYZ/portaltbc/git/refs{/sha}","trees_url":"https://api.github.com/repos/WangXYZ/portaltbc/git/trees{/sha}","statuses_url":"https://api.github.com/repos/WangXYZ/portaltbc/statuses/{sha}","languages_url":"https://api.github.com/repos/WangXYZ/portaltbc/languages","stargazers_url":"https://api.github.com/repos/WangXYZ/portaltbc/stargazers","contributors_url":"https://api.github.com/repos/WangXYZ/portaltbc/contributors","subscribers_url":"https://api.github.com/repos/WangXYZ/portaltbc/subscribers","subscription_url":"https://api.github.com/repos/WangXYZ/portaltbc/subscription","commits_url":"https://api.github.com/repos/WangXYZ/portaltbc/commits{/sha}","git_commits_url":"https://api.github.com/repos/WangXYZ/portaltbc/git/commits{/sha}","comments_url":"https://api.github.com/repos/WangXYZ/portaltbc/comments{/number}","issue_comment_url":"https://api.github.com/repos/WangXYZ/portaltbc/issues/comments/{number}","contents_url":"https://api.github.com/rep
os/WangXYZ/portaltbc/contents/{+path}","compare_url":"https://api.github.com/repos/WangXYZ/portaltbc/compare/{base}...{head}","merges_url":"https://api.github.com/repos/WangXYZ/portaltbc/merges","archive_url":"https://api.github.com/repos/WangXYZ/portaltbc/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/WangXYZ/portaltbc/downloads","issues_url":"https://api.github.com/repos/WangXYZ/portaltbc/issues{/number}","pulls_url":"https://api.github.com/repos/WangXYZ/portaltbc/pulls{/number}","milestones_url":"https://api.github.com/repos/WangXYZ/portaltbc/milestones{/number}","notifications_url":"https://api.github.com/repos/WangXYZ/portaltbc/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/WangXYZ/portaltbc/labels{/name}","releases_url":"https://api.github.com/repos/WangXYZ/portaltbc/releases{/id}","created_at":"2015-01-01T01:00:47Z","updated_at":"2014-12-02T15:01:09Z","pushed_at":"2014-12-02T15:00:53Z","git_url":"git://github.com/WangXYZ/portaltbc.git","ssh_url":"git@github.com:WangXYZ/portaltbc.git","clone_url":"https://github.com/WangXYZ/portaltbc.git","svn_url":"https://github.com/WangXYZ/portaltbc","homepage":null,"size":46000,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:00:47Z"}
{"id":"2489396235","type":"IssuesEvent","actor":{"id":1414603,"login":"zoldello","gravatar_id":"","url":"https://api.github.com/users/zoldello","avatar_url":"https://avatars.githubusercontent.com/u/1414603?"},"repo":{"id":26617214,"name":"ChicagoVeg/restaurantList","url":"https://api.github.com/repos/ChicagoVeg/restaurantList"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/ChicagoVeg/restaurantList/issues/9","labels_url":"https://api.github.com/repos/ChicagoVeg/restaurantList/issues/9/labels{/name}","comments_url":"https://api.github.com/repos/ChicagoVeg/restaurantList/issues/9/comments","events_url":"https://api.github.com/repos/ChicagoVeg/restaurantList/issues/9/events","html_url":"https://github.com/ChicagoVeg/restaurantList/issues/9","id":53210171,"number":9,"title":"When I filter out restaurants by type, the removed restaurant pins remain in the map","user":{"login":"zoldello","id":1414603,"avatar_url":"https://avatars.githubusercontent.com/u/1414603?v=3","gravatar_id":"","url":"https://api.github.com/users/zoldello","html_url":"https://github.com/zoldello","followers_url":"https://api.github.com/users/zoldello/followers","following_url":"https://api.github.com/users/zoldello/following{/other_user}","gists_url":"https://api.github.com/users/zoldello/gists{/gist_id}","starred_url":"https://api.github.com/users/zoldello/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/zoldello/subscriptions","organizations_url":"https://api.github.com/users/zoldello/orgs","repos_url":"https://api.github.com/users/zoldello/repos","events_url":"https://api.github.com/users/zoldello/events{/privacy}","received_events_url":"https://api.github.com/users/zoldello/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/ChicagoVeg/restaurantList/labels/bug","name":"bug","color":"fc2929"},{"url":"https://api.github.com/repos/ChicagoVeg/restaurantList/labels/Great+to+Have","name":"Great to 
Have","color":"f7c6c7"}],"state":"closed","locked":false,"assignee":{"login":"zoldello","id":1414603,"avatar_url":"https://avatars.githubusercontent.com/u/1414603?v=3","gravatar_id":"","url":"https://api.github.com/users/zoldello","html_url":"https://github.com/zoldello","followers_url":"https://api.github.com/users/zoldello/followers","following_url":"https://api.github.com/users/zoldello/following{/other_user}","gists_url":"https://api.github.com/users/zoldello/gists{/gist_id}","starred_url":"https://api.github.com/users/zoldello/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/zoldello/subscriptions","organizations_url":"https://api.github.com/users/zoldello/orgs","repos_url":"https://api.github.com/users/zoldello/repos","events_url":"https://api.github.com/users/zoldello/events{/privacy}","received_events_url":"https://api.github.com/users/zoldello/received_events","type":"User","site_admin":false},"milestone":{"url":"https://api.github.com/repos/ChicagoVeg/restaurantList/milestones/3","labels_url":"https://api.github.com/repos/ChicagoVeg/restaurantList/milestones/3/labels","id":894444,"number":3,"title":"Release 
1","description":"","creator":{"login":"vadim424","id":10101875,"avatar_url":"https://avatars.githubusercontent.com/u/10101875?v=3","gravatar_id":"","url":"https://api.github.com/users/vadim424","html_url":"https://github.com/vadim424","followers_url":"https://api.github.com/users/vadim424/followers","following_url":"https://api.github.com/users/vadim424/following{/other_user}","gists_url":"https://api.github.com/users/vadim424/gists{/gist_id}","starred_url":"https://api.github.com/users/vadim424/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/vadim424/subscriptions","organizations_url":"https://api.github.com/users/vadim424/orgs","repos_url":"https://api.github.com/users/vadim424/repos","events_url":"https://api.github.com/users/vadim424/events{/privacy}","received_events_url":"https://api.github.com/users/vadim424/received_events","type":"User","site_admin":false},"open_issues":2,"closed_issues":5,"state":"open","created_at":"2014-12-07T00:34:16Z","updated_at":"2015-01-01T01:00:47Z","due_on":"2014-12-14T06:00:00Z","closed_at":null},"comments":0,"created_at":"2015-01-01T01:00:14Z","updated_at":"2015-01-01T01:00:47Z","closed_at":"2015-01-01T01:00:47Z","body":""}},"public":true,"created_at":"2015-01-01T01:00:47Z","org":{"id":9426295,"login":"ChicagoVeg","gravatar_id":"","url":"https://api.github.com/orgs/ChicagoVeg","avatar_url":"https://avatars.githubusercontent.com/u/9426295?"}}
{"id":"2489396238","type":"PushEvent","actor":{"id":1414603,"login":"zoldello","gravatar_id":"","url":"https://api.github.com/users/zoldello","avatar_url":"https://avatars.githubusercontent.com/u/1414603?"},"repo":{"id":26617214,"name":"ChicagoVeg/restaurantList","url":"https://api.github.com/repos/ChicagoVeg/restaurantList"},"payload":{"push_id":536752394,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"dae6d7b4323b0a3102a1decf5b9b0c12f51989a5","before":"6549a2eb06d7449819f2da7eba6015c413093315","commits":[{"sha":"dae6d7b4323b0a3102a1decf5b9b0c12f51989a5","author":{"email":"444a4929803744c29fad4ab600e75220d121ff93@gmail.com","name":"Phil"},"message":"removed filtered out pins, Fixes #9","distinct":true,"url":"https://api.github.com/repos/ChicagoVeg/restaurantList/commits/dae6d7b4323b0a3102a1decf5b9b0c12f51989a5"}]},"public":true,"created_at":"2015-01-01T01:00:47Z","org":{"id":9426295,"login":"ChicagoVeg","gravatar_id":"","url":"https://api.github.com/orgs/ChicagoVeg","avatar_url":"https://avatars.githubusercontent.com/u/9426295?"}}
{"id":"2489396239","type":"PushEvent","actor":{"id":3599988,"login":"wesdizzle","gravatar_id":"","url":"https://api.github.com/users/wesdizzle","avatar_url":"https://avatars.githubusercontent.com/u/3599988?"},"repo":{"id":28250120,"name":"wesdizzle/gagglelog","url":"https://api.github.com/repos/wesdizzle/gagglelog"},"payload":{"push_id":536752395,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"699893742e393b99eb2250f17b2aad8979d7b454","before":"bbd74811366cd3da6de3522bb2a9403b7e778a34","commits":[{"sha":"699893742e393b99eb2250f17b2aad8979d7b454","author":{"email":"baaa01a5d45f86e3d8f7008866cf0d37bea55570@gmail.com","name":"Wesley Miller"},"message":"added index values to DistributionMethods for sorting through multiple distribution methods on a single platform of a single type when alphabetical order is not sufficient","distinct":true,"url":"https://api.github.com/repos/wesdizzle/gagglelog/commits/699893742e393b99eb2250f17b2aad8979d7b454"}]},"public":true,"created_at":"2015-01-01T01:00:48Z"}
{"id":"2489396248","type":"PushEvent","actor":{"id":1681249,"login":"Toeler","gravatar_id":"","url":"https://api.github.com/users/Toeler","avatar_url":"https://avatars.githubusercontent.com/u/1681249?"},"repo":{"id":28678136,"name":"Toeler/Handmade-Hero","url":"https://api.github.com/repos/Toeler/Handmade-Hero"},"payload":{"push_id":536752397,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"408100c353fa4aa5b211754d5cfc1d83b8c359a3","before":"cdf1922395b7f019ed27b3a8ea4022d5e130c8f7","commits":[{"sha":"d028d9792ca92f20f8a1cde584e1a82d97acbdf6","author":{"email":"908cd16f96776f758750763d02c45f03b1281e90@gmail.com","name":"Toeler"},"message":"Initial commit of work as at end of ep20 (week 4).","distinct":true,"url":"https://api.github.com/repos/Toeler/Handmade-Hero/commits/d028d9792ca92f20f8a1cde584e1a82d97acbdf6"},{"sha":"408100c353fa4aa5b211754d5cfc1d83b8c359a3","author":{"email":"908cd16f96776f758750763d02c45f03b1281e90@gmail.com","name":"Toeler"},"message":"Merge branch 'master' of https://github.com/Toeler/Handmade-Hero","distinct":true,"url":"https://api.github.com/repos/Toeler/Handmade-Hero/commits/408100c353fa4aa5b211754d5cfc1d83b8c359a3"}]},"public":true,"created_at":"2015-01-01T01:00:49Z"}
{"id":"2489396253","type":"PushEvent","actor":{"id":9244168,"login":"gaokuan","gravatar_id":"","url":"https://api.github.com/users/gaokuan","avatar_url":"https://avatars.githubusercontent.com/u/9244168?"},"repo":{"id":27301392,"name":"208121222/gaokuan","url":"https://api.github.com/repos/208121222/gaokuan"},"payload":{"push_id":536752398,"size":1,"distinct_size":1,"ref":"refs/heads/xunni","head":"8eced38fc32bbcc27c5e449f3c774a90666034a6","before":"64237471e72a59de1744997734962a4df2f9b852","commits":[{"sha":"8eced38fc32bbcc27c5e449f3c774a90666034a6","author":{"email":"7ed3207dcf2d842d5b4994c386d23da61b479781@qq.com","name":"gaokuan"},"message":"pinlvji.vhd\n\npinlvji.vhd","distinct":true,"url":"https://api.github.com/repos/208121222/gaokuan/commits/8eced38fc32bbcc27c5e449f3c774a90666034a6"}]},"public":true,"created_at":"2015-01-01T01:00:50Z","org":{"id":9999410,"login":"208121222","gravatar_id":"","url":"https://api.github.com/orgs/208121222","avatar_url":"https://avatars.githubusercontent.com/u/9999410?"}}
{"id":"2489396256","type":"PushEvent","actor":{"id":5043639,"login":"akbar-sh","gravatar_id":"","url":"https://api.github.com/users/akbar-sh","avatar_url":"https://avatars.githubusercontent.com/u/5043639?"},"repo":{"id":28675338,"name":"akbar-sh/tracker","url":"https://api.github.com/repos/akbar-sh/tracker"},"payload":{"push_id":536752401,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"c45885fad735da88cd6dc0fbabd83a647a7c0289","before":"182a9b651f97650023f4b8d4a09f13b5e9b8f614","commits":[{"sha":"c45885fad735da88cd6dc0fbabd83a647a7c0289","author":{"email":"7eb7e51160615686946d5e19147edf697a6d53a2@MacBook.local","name":"Akbar Sharifi"},"message":"Removing facebook keys.","distinct":true,"url":"https://api.github.com/repos/akbar-sh/tracker/commits/c45885fad735da88cd6dc0fbabd83a647a7c0289"}]},"public":true,"created_at":"2015-01-01T01:00:50Z"}
{"id":"2489396258","type":"PushEvent","actor":{"id":1063076,"login":"Praneeta","gravatar_id":"","url":"https://api.github.com/users/Praneeta","avatar_url":"https://avatars.githubusercontent.com/u/1063076?"},"repo":{"id":28235730,"name":"Praneeta/animation","url":"https://api.github.com/repos/Praneeta/animation"},"payload":{"push_id":536752403,"size":2,"distinct_size":2,"ref":"refs/heads/new-year-simple","head":"c2486dbe0d16c6cc6a57e27470e475aff4e329f7","before":"3d60e5c7b0906f0fdf5f924c6a2a88b6d247e27a","commits":[{"sha":"e1f605daf044dcc0b529df04a88017715a9d41f6","author":{"email":"07cf5b0397e51b26de5d8e7005579c15dd1c2956@gmail.com","name":"IntroToCoding"},"message":"more cards","distinct":true,"url":"https://api.github.com/repos/Praneeta/animation/commits/e1f605daf044dcc0b529df04a88017715a9d41f6"},{"sha":"c2486dbe0d16c6cc6a57e27470e475aff4e329f7","author":{"email":"07cf5b0397e51b26de5d8e7005579c15dd1c2956@gmail.com","name":"IntroToCoding"},"message":"Merge branch 'new-year-simple' of https://github.com/Praneeta/animation into new-year-simple","distinct":true,"url":"https://api.github.com/repos/Praneeta/animation/commits/c2486dbe0d16c6cc6a57e27470e475aff4e329f7"}]},"public":true,"created_at":"2015-01-01T01:00:50Z"}
{"id":"2489396268","type":"PushEvent","actor":{"id":2539292,"login":"wmfgerrit","gravatar_id":"","url":"https://api.github.com/users/wmfgerrit","avatar_url":"https://avatars.githubusercontent.com/u/2539292?"},"repo":{"id":6495889,"name":"wikimedia/mediawiki-extensions-WikimediaMessages","url":"https://api.github.com/repos/wikimedia/mediawiki-extensions-WikimediaMessages"},"payload":{"push_id":536752404,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"61ec5c645adae968e353a778c4f7e82a86ad3468","before":"cdd4f8d557f206f88f06fb458ea07fa9359f0d15","commits":[{"sha":"b41f0ccd50df420206b77bb2c359a1d61202655a","author":{"email":"f2a16c7d37923d357c1a0ea372900e4a57158c3c@gmail.com","name":"Kunal Mehta"},"message":"Add missing wikibase-sitelinks-sitename-wikidatawiki message\n\nChange-Id: I1edd3a55f4c8240a2317828adcb9eedccbe904f4","distinct":true,"url":"https://api.github.com/repos/wikimedia/mediawiki-extensions-WikimediaMessages/commits/b41f0ccd50df420206b77bb2c359a1d61202655a"},{"sha":"61ec5c645adae968e353a778c4f7e82a86ad3468","author":{"email":"61a1c7c885f4fc173424af2875d459c32bdc4fee@gerrit.wikimedia.org","name":"jenkins-bot"},"message":"Merge \"Add missing wikibase-sitelinks-sitename-wikidatawiki message\"","distinct":true,"url":"https://api.github.com/repos/wikimedia/mediawiki-extensions-WikimediaMessages/commits/61ec5c645adae968e353a778c4f7e82a86ad3468"}]},"public":true,"created_at":"2015-01-01T01:00:51Z","org":{"id":56668,"login":"wikimedia","gravatar_id":"","url":"https://api.github.com/orgs/wikimedia","avatar_url":"https://avatars.githubusercontent.com/u/56668?"}}
{"id":"2489396273","type":"PushEvent","actor":{"id":5869772,"login":"felixonmars-bot","gravatar_id":"","url":"https://api.github.com/users/felixonmars-bot","avatar_url":"https://avatars.githubusercontent.com/u/5869772?"},"repo":{"id":14887549,"name":"felixonmars/community-mirror","url":"https://api.github.com/repos/felixonmars/community-mirror"},"payload":{"push_id":536752407,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"b60e989186fb5c092e27586953095c3c4c20c113","before":"09aa1bafd2e0d0fb066d1223e749425bd73dc640","commits":[{"sha":"d2ffde669aca182b3f737a4e3369d81d69bfdc10","author":{"email":"e841b73a36e3b1b8d38130b3ade2600d4fac5ad3@9fca08f4-af9d-4005-b8df-a31f2cc04f65","name":"fyan"},"message":"upgpkg: python-sh 1.11-1\n\nupstream new release\n\n\ngit-svn-id: file:///srv/repos/svn-community/svn@125087 9fca08f4-af9d-4005-b8df-a31f2cc04f65","distinct":true,"url":"https://api.github.com/repos/felixonmars/community-mirror/commits/d2ffde669aca182b3f737a4e3369d81d69bfdc10"},{"sha":"b60e989186fb5c092e27586953095c3c4c20c113","author":{"email":"e841b73a36e3b1b8d38130b3ade2600d4fac5ad3@9fca08f4-af9d-4005-b8df-a31f2cc04f65","name":"fyan"},"message":"archrelease: copy trunk to community-any\n\ngit-svn-id: file:///srv/repos/svn-community/svn@125088 9fca08f4-af9d-4005-b8df-a31f2cc04f65","distinct":true,"url":"https://api.github.com/repos/felixonmars/community-mirror/commits/b60e989186fb5c092e27586953095c3c4c20c113"}]},"public":true,"created_at":"2015-01-01T01:00:52Z"}
{"id":"2489396274","type":"IssuesEvent","actor":{"id":2791237,"login":"lauriegao","gravatar_id":"","url":"https://api.github.com/users/lauriegao","avatar_url":"https://avatars.githubusercontent.com/u/2791237?"},"repo":{"id":7064308,"name":"jisaacks/GitGutter","url":"https://api.github.com/repos/jisaacks/GitGutter"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/jisaacks/GitGutter/issues/207","labels_url":"https://api.github.com/repos/jisaacks/GitGutter/issues/207/labels{/name}","comments_url":"https://api.github.com/repos/jisaacks/GitGutter/issues/207/comments","events_url":"https://api.github.com/repos/jisaacks/GitGutter/issues/207/events","html_url":"https://github.com/jisaacks/GitGutter/issues/207","id":53210180,"number":207,"title":"Gitgutter icons not showing after updating to MAC OS X Yosemite","user":{"login":"lauriegao","id":2791237,"avatar_url":"https://avatars.githubusercontent.com/u/2791237?v=3","gravatar_id":"","url":"https://api.github.com/users/lauriegao","html_url":"https://github.com/lauriegao","followers_url":"https://api.github.com/users/lauriegao/followers","following_url":"https://api.github.com/users/lauriegao/following{/other_user}","gists_url":"https://api.github.com/users/lauriegao/gists{/gist_id}","starred_url":"https://api.github.com/users/lauriegao/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/lauriegao/subscriptions","organizations_url":"https://api.github.com/users/lauriegao/orgs","repos_url":"https://api.github.com/users/lauriegao/repos","events_url":"https://api.github.com/users/lauriegao/events{/privacy}","received_events_url":"https://api.github.com/users/lauriegao/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:00:52Z","updated_at":"2015-01-01T01:00:52Z","closed_at":null,"body":"My Gitgutter icons won't display after updating to Yosemite recently.\r\n\r\nI am 
using Sublme Text 2.  I tried uninstalling and reinstalling Gitgutter through Package Control and Git with no luck. \r\n\r\nFound this repeated three times in console every time I save changes.\r\n\r\n```\r\nTraceback (most recent call last):\r\n  File \"./sublime_plugin.py\", line 339, in run_\r\n  File \"./git_gutter.py\", line 33, in run\r\n  File \"./view_collection.py\", line 50, in diff\r\n  File \"./git_gutter_handler.py\", line 156, in diff\r\n  File \"./git_gutter_handler.py\", line 248, in run_command\r\n  File \"/System/Library/Frameworks/Python.framework/Versions/2.6/lib/python2.6/subprocess.py\", line 623, in __init__\r\n    errread, errwrite)\r\n  File \"/System/Library/Frameworks/Python.framework/Versions/2.6/lib/python2.6/subprocess.py\", line 1141, in _execute_child\r\n    raise child_exception\r\nOSError: [Errno 13] Permission denied\r\n```"}},"public":true,"created_at":"2015-01-01T01:00:52Z"}
{"id":"2489396276","type":"PushEvent","actor":{"id":6298185,"login":"salrodgom","gravatar_id":"","url":"https://api.github.com/users/salrodgom","avatar_url":"https://avatars.githubusercontent.com/u/6298185?"},"repo":{"id":28646555,"name":"salrodgom/MC-MD_hybrid_cycles","url":"https://api.github.com/repos/salrodgom/MC-MD_hybrid_cycles"},"payload":{"push_id":536752408,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"a762ae78e5c09457dcced64e3a6f6138906759f3","before":"dad880c5428f67cec42c7bc4a054befee370856a","commits":[{"sha":"a762ae78e5c09457dcced64e3a6f6138906759f3","author":{"email":"db47db2091bca5e23c026e50e0b9d2e8e7a8e001@upo.es","name":"Salvador R. G. Balestra"},"message":"\trenamed:    objsMC/RHO_i43m_C1.cif -> objsMC/RHO_i43m_80.cif\n\tnew file:   objsMC/RHO_i43m_92.cif\n\tnew file:   objsMC/RHO_im3m_80.cif\n\tnew file:   objsMC/RHO_im3m_92.cif","distinct":true,"url":"https://api.github.com/repos/salrodgom/MC-MD_hybrid_cycles/commits/a762ae78e5c09457dcced64e3a6f6138906759f3"}]},"public":true,"created_at":"2015-01-01T01:00:52Z"}
{"id":"2489396277","type":"PushEvent","actor":{"id":10343396,"login":"sosostris","gravatar_id":"","url":"https://api.github.com/users/sosostris","avatar_url":"https://avatars.githubusercontent.com/u/10343396?"},"repo":{"id":28607481,"name":"sosostris/javapetmarket","url":"https://api.github.com/repos/sosostris/javapetmarket"},"payload":{"push_id":536752410,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"4048ae0f8434f2ac9a5c4550f3b8252059e83594","before":"53bf643993375c731a60a6fa0c15b5ee043ef00a","commits":[{"sha":"4048ae0f8434f2ac9a5c4550f3b8252059e83594","author":{"email":"4dde01cb51e645a1a51fda7beda48cb0ddc0314e@zhenhuaxu-ltm.internal.salesforce.com","name":"Zhenhua Xu"},"message":"PetsVSAnantou","distinct":true,"url":"https://api.github.com/repos/sosostris/javapetmarket/commits/4048ae0f8434f2ac9a5c4550f3b8252059e83594"}]},"public":true,"created_at":"2015-01-01T01:00:52Z"}
{"id":"2489396280","type":"PushEvent","actor":{"id":1301018,"login":"Harinlen","gravatar_id":"","url":"https://api.github.com/users/Harinlen","avatar_url":"https://avatars.githubusercontent.com/u/1301018?"},"repo":{"id":22275454,"name":"Kreogist/Mu","url":"https://api.github.com/repos/Kreogist/Mu"},"payload":{"push_id":536752412,"size":53,"distinct_size":1,"ref":"refs/heads/master","head":"3f141a0111ec1b68690d6f23fd96abd42cfa1d87","before":"60056c7f8ff214177a84bda7bc7fee8bb7cecc48","commits":[{"sha":"064d1e3f9e31cd232468a7c81a0f94271536de21","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.21\n\nNew Features:\n1. Add experimental ttplayer lyrics downloader, but cannot use.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/064d1e3f9e31cd232468a7c81a0f94271536de21"},{"sha":"2d484f08c3886d0e0c379403b91067c083deda61","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.22\n\nNew Features:\n1. Support download lyrics from TTPlayer server.\n2. Add main player base file.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/2d484f08c3886d0e0c379403b91067c083deda61"},{"sha":"f9f4b8e12d9256fe132b8df61e45162725b2f4f1","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.23\n\nNew Features:\n1. Support download lyrics from TTPod server.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/f9f4b8e12d9256fe132b8df61e45162725b2f4f1"},{"sha":"d5d1f8463ede80378b4f9cf334bd892c4be9f97b","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.24\n\nNew Features:\n1. 
Add SAO Style sub menu.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/d5d1f8463ede80378b4f9cf334bd892c4be9f97b"},{"sha":"6d054cad0737d6776bbf634c022b10749f10d846","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.25\n\nNew Features:\n1. Support show in actions in append menu.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/6d054cad0737d6776bbf634c022b10749f10d846"},{"sha":"32f25a9a70c3b322afeb0fdecffae0194c049c11","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.26\n\nNew Features:\n1. Support better album shadow.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/32f25a9a70c3b322afeb0fdecffae0194c049c11"},{"sha":"f51ddf0213a95c037aa02023625d856da4893212","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.27\n\nBug Fixed:\n1. Fixed the Windows menu indicator display bug.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/f51ddf0213a95c037aa02023625d856da4893212"},{"sha":"100f2969eefac4ce8558c239ae43c155f58d87f5","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.28\n\nNew Features:\n1. Tweak the WIN32 single property.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/100f2969eefac4ce8558c239ae43c155f58d87f5"},{"sha":"5ec46f5972932993d0fdb9afa1a6983e0ef55f5d","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.29\n\nUpdates:\n1. Update the music kind to fixed string.\n2. 
Update the number and path item value sync policy.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/5ec46f5972932993d0fdb9afa1a6983e0ef55f5d"},{"sha":"01ea187618722bfaaf4dce1defa2d9cc3c01f384","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.30\nWARNING:\nThis commit can be ONLY compile on Linux, do not try on Windows or Mac OS X.\nNew Features:\n1. Change the library dir on Linux to /.kreogist/mu/library.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/01ea187618722bfaaf4dce1defa2d9cc3c01f384"},{"sha":"aecb03334f03845ee09b43a657110fd3d416513f","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.30\nWARNING:\nThis commit can be ONLY compiled under Linux, don't try it on Windows or Mac OS X.\nNew Features:\n1. Update Linux user path.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/aecb03334f03845ee09b43a657110fd3d416513f"},{"sha":"cf842e5cba099c1795de7e48bddf32505c83a87c","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.31\n\nWARNING:\nThis commit can ONLY be compiled under Windows and Linux, don't try it\non Mac OS X.\nUpdates:\n1. Tweak the Windows document dir.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/cf842e5cba099c1795de7e48bddf32505c83a87c"},{"sha":"b12c6bfd0de1600d34a4c32ded9275169e72fe2a","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.29\n\nUpdates:\n1. Now shadow can automatically set their position via the increase\nparameters.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/b12c6bfd0de1600d34a4c32ded9275169e72fe2a"},{"sha":"ce01605b171063699e908fa40b085cae3d77193a","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.32\n\nMerge:\n1. 
Apply the merge.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/ce01605b171063699e908fa40b085cae3d77193a"},{"sha":"9d3d4009e60161217944fe2afe8fd62a3d7edb0f","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.33\n\nNew Features:\n1. Now locale manager can set the directory position.\n2. Tweak the Mac OS X folder.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/9d3d4009e60161217944fe2afe8fd62a3d7edb0f"},{"sha":"0d368ca3131cf6cc754d38509dc674dbea86b587","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.34\n\nNew Features:\n1. Add the rename function for single file.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/0d368ca3131cf6cc754d38509dc674dbea86b587"},{"sha":"5d4940624bc23f14c83518e06c5673d359b6ccfb","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.35\n\nNew Features:\n1. Experimental support KNMessageBox question static function.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/5d4940624bc23f14c83518e06c5673d359b6ccfb"},{"sha":"210278fa178920b30bd7ecefa1faf1b9e9369027","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.36\n\nNew Features:\n1. Initial add rename function.\n2. Change the drag class initial to QScopePointer.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/210278fa178920b30bd7ecefa1faf1b9e9369027"},{"sha":"fba3bd8198c4e7cf26885059982ae754400fe03e","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.37\n\nBug Fixed:\n1. 
Fixed the database won't change the file name bug.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/fba3bd8198c4e7cf26885059982ae754400fe03e"},{"sha":"823ec79cb522f564c43b35f6f7d830143b431b21","author":{"email":"59ee19a92dc49eba15e3c296949ec051e29e0063@126.com","name":"Saki"},"message":"Major: 0.4.38\n\nUpdates:\n1. Replace the unavailable characters to '_' to avoid the name bug under\nWindows.","distinct":false,"url":"https://api.github.com/repos/Kreogist/Mu/commits/823ec79cb522f564c43b35f6f7d830143b431b21"}]},"public":true,"created_at":"2015-01-01T01:00:53Z","org":{"id":5064132,"login":"Kreogist","gravatar_id":"","url":"https://api.github.com/orgs/Kreogist","avatar_url":"https://avatars.githubusercontent.com/u/5064132?"}}
{"id":"2489396281","type":"PushEvent","actor":{"id":1253444,"login":"nathan-osman","gravatar_id":"","url":"https://api.github.com/users/nathan-osman","avatar_url":"https://avatars.githubusercontent.com/u/1253444?"},"repo":{"id":28151446,"name":"nathan-osman/django-archive","url":"https://api.github.com/repos/nathan-osman/django-archive"},"payload":{"push_id":536752413,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"ad9166116ced36397fca45582a93ab5d188df18f","before":"4e90d1956c0596dd0e2f546d2456c3ab2d0b749a","commits":[{"sha":"ad9166116ced36397fca45582a93ab5d188df18f","author":{"email":"2e8aa918660411855c6d44d5bb2da677aa033255@quickmediasolutions.com","name":"Nathan Osman"},"message":"Once again fixed the module paths in setup.py.","distinct":true,"url":"https://api.github.com/repos/nathan-osman/django-archive/commits/ad9166116ced36397fca45582a93ab5d188df18f"}]},"public":true,"created_at":"2015-01-01T01:00:53Z"}
{"id":"2489396285","type":"PushEvent","actor":{"id":236741,"login":"bryankennedy","gravatar_id":"","url":"https://api.github.com/users/bryankennedy","avatar_url":"https://avatars.githubusercontent.com/u/236741?"},"repo":{"id":28671124,"name":"scimusmn/chondrite","url":"https://api.github.com/repos/scimusmn/chondrite"},"payload":{"push_id":536752416,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"41a6c1af77a62f1f29c162ee4544b7094545fc2a","before":"723a5c3a1daadb296857b0c59df586b59f664d7c","commits":[{"sha":"41a6c1af77a62f1f29c162ee4544b7094545fc2a","author":{"email":"a2bc4ee92ccb7070799160edd9f39024dd8797ad@smm.org","name":"bryan kennedy"},"message":"Adding credits to the readme","distinct":true,"url":"https://api.github.com/repos/scimusmn/chondrite/commits/41a6c1af77a62f1f29c162ee4544b7094545fc2a"}]},"public":true,"created_at":"2015-01-01T01:00:54Z","org":{"id":777830,"login":"scimusmn","gravatar_id":"","url":"https://api.github.com/orgs/scimusmn","avatar_url":"https://avatars.githubusercontent.com/u/777830?"}}
{"id":"2489396287","type":"IssuesEvent","actor":{"id":8890114,"login":"speeldoos","gravatar_id":"","url":"https://api.github.com/users/speeldoos","avatar_url":"https://avatars.githubusercontent.com/u/8890114?"},"repo":{"id":28678093,"name":"speeldoos/hello-world","url":"https://api.github.com/repos/speeldoos/hello-world"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/speeldoos/hello-world/issues/1","labels_url":"https://api.github.com/repos/speeldoos/hello-world/issues/1/labels{/name}","comments_url":"https://api.github.com/repos/speeldoos/hello-world/issues/1/comments","events_url":"https://api.github.com/repos/speeldoos/hello-world/issues/1/events","html_url":"https://github.com/speeldoos/hello-world/issues/1","id":53210181,"number":1,"title":"Finish README","user":{"login":"speeldoos","id":8890114,"avatar_url":"https://avatars.githubusercontent.com/u/8890114?v=3","gravatar_id":"","url":"https://api.github.com/users/speeldoos","html_url":"https://github.com/speeldoos","followers_url":"https://api.github.com/users/speeldoos/followers","following_url":"https://api.github.com/users/speeldoos/following{/other_user}","gists_url":"https://api.github.com/users/speeldoos/gists{/gist_id}","starred_url":"https://api.github.com/users/speeldoos/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/speeldoos/subscriptions","organizations_url":"https://api.github.com/users/speeldoos/orgs","repos_url":"https://api.github.com/users/speeldoos/repos","events_url":"https://api.github.com/users/speeldoos/events{/privacy}","received_events_url":"https://api.github.com/users/speeldoos/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:00:54Z","updated_at":"2015-01-01T01:00:54Z","closed_at":null,"body":"So I can finish this tutorial ASAP!"}},"public":true,"created_at":"2015-01-01T01:00:55Z"}
{"id":"2489396288","type":"IssueCommentEvent","actor":{"id":253237,"login":"Jamesking56","gravatar_id":"","url":"https://api.github.com/users/Jamesking56","avatar_url":"https://avatars.githubusercontent.com/u/253237?"},"repo":{"id":26730195,"name":"cachethq/Cachet","url":"https://api.github.com/repos/cachethq/Cachet"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/cachethq/Cachet/issues/173","labels_url":"https://api.github.com/repos/cachethq/Cachet/issues/173/labels{/name}","comments_url":"https://api.github.com/repos/cachethq/Cachet/issues/173/comments","events_url":"https://api.github.com/repos/cachethq/Cachet/issues/173/events","html_url":"https://github.com/cachethq/Cachet/issues/173","id":53210024,"number":173,"title":"Bug: Forms let you submit multiple times","user":{"login":"Jamesking56","id":253237,"avatar_url":"https://avatars.githubusercontent.com/u/253237?v=3","gravatar_id":"","url":"https://api.github.com/users/Jamesking56","html_url":"https://github.com/Jamesking56","followers_url":"https://api.github.com/users/Jamesking56/followers","following_url":"https://api.github.com/users/Jamesking56/following{/other_user}","gists_url":"https://api.github.com/users/Jamesking56/gists{/gist_id}","starred_url":"https://api.github.com/users/Jamesking56/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Jamesking56/subscriptions","organizations_url":"https://api.github.com/users/Jamesking56/orgs","repos_url":"https://api.github.com/users/Jamesking56/repos","events_url":"https://api.github.com/users/Jamesking56/events{/privacy}","received_events_url":"https://api.github.com/users/Jamesking56/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2015-01-01T00:52:06Z","updated_at":"2015-01-01T01:00:54Z","closed_at":null,"body":"When adding a new incident, I noticed a weird bug.\r\n\r\nIf you fill in the form as normal, 
then click the submit button twice really quickly, it'll create __TWO__ identical new incidents!\r\n\r\nThis could be a bit annoying, a simple fix is using a bit of JS that on submit, disables the submit button so that once clicked, it cannot be clicked again."},"comment":{"url":"https://api.github.com/repos/cachethq/Cachet/issues/comments/68477229","html_url":"https://github.com/cachethq/Cachet/issues/173#issuecomment-68477229","issue_url":"https://api.github.com/repos/cachethq/Cachet/issues/173","id":68477229,"user":{"login":"Jamesking56","id":253237,"avatar_url":"https://avatars.githubusercontent.com/u/253237?v=3","gravatar_id":"","url":"https://api.github.com/users/Jamesking56","html_url":"https://github.com/Jamesking56","followers_url":"https://api.github.com/users/Jamesking56/followers","following_url":"https://api.github.com/users/Jamesking56/following{/other_user}","gists_url":"https://api.github.com/users/Jamesking56/gists{/gist_id}","starred_url":"https://api.github.com/users/Jamesking56/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Jamesking56/subscriptions","organizations_url":"https://api.github.com/users/Jamesking56/orgs","repos_url":"https://api.github.com/users/Jamesking56/repos","events_url":"https://api.github.com/users/Jamesking56/events{/privacy}","received_events_url":"https://api.github.com/users/Jamesking56/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:00:54Z","updated_at":"2015-01-01T01:00:54Z","body":"How do you suppose it could be fixed in Laravel?"}},"public":true,"created_at":"2015-01-01T01:00:55Z","org":{"id":9951502,"login":"cachethq","gravatar_id":"","url":"https://api.github.com/orgs/cachethq","avatar_url":"https://avatars.githubusercontent.com/u/9951502?"}}
{"id":"2489396289","type":"CommitCommentEvent","actor":{"id":3372342,"login":"bors","gravatar_id":"","url":"https://api.github.com/users/bors","avatar_url":"https://avatars.githubusercontent.com/u/3372342?"},"repo":{"id":724712,"name":"rust-lang/rust","url":"https://api.github.com/repos/rust-lang/rust"},"payload":{"comment":{"url":"https://api.github.com/repos/rust-lang/rust/comments/9131359","html_url":"https://github.com/rust-lang/rust/commit/8f98078b1508c7ebd488c4ab864a4d2fb02d44f8#commitcomment-9131359","id":9131359,"user":{"login":"bors","id":3372342,"avatar_url":"https://avatars.githubusercontent.com/u/3372342?v=3","gravatar_id":"","url":"https://api.github.com/users/bors","html_url":"https://github.com/bors","followers_url":"https://api.github.com/users/bors/followers","following_url":"https://api.github.com/users/bors/following{/other_user}","gists_url":"https://api.github.com/users/bors/gists{/gist_id}","starred_url":"https://api.github.com/users/bors/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/bors/subscriptions","organizations_url":"https://api.github.com/users/bors/orgs","repos_url":"https://api.github.com/users/bors/repos","events_url":"https://api.github.com/users/bors/events{/privacy}","received_events_url":"https://api.github.com/users/bors/received_events","type":"User","site_admin":false},"position":null,"line":null,"path":null,"commit_id":"8f98078b1508c7ebd488c4ab864a4d2fb02d44f8","created_at":"2015-01-01T01:00:54Z","updated_at":"2015-01-01T01:00:54Z","body":"saw approval from nmatsakis\nat https://github.com/japaric/rust/commit/8f98078b1508c7ebd488c4ab864a4d2fb02d44f8"}},"public":true,"created_at":"2015-01-01T01:00:54Z","org":{"id":5430905,"login":"rust-lang","gravatar_id":"","url":"https://api.github.com/orgs/rust-lang","avatar_url":"https://avatars.githubusercontent.com/u/5430905?"}}
{"id":"2489396293","type":"ForkEvent","actor":{"id":3245033,"login":"ZheYuan","gravatar_id":"","url":"https://api.github.com/users/ZheYuan","avatar_url":"https://avatars.githubusercontent.com/u/3245033?"},"repo":{"id":18537678,"name":"FiloSottile/Heartbleed","url":"https://api.github.com/repos/FiloSottile/Heartbleed"},"payload":{"forkee":{"id":28678220,"name":"Heartbleed","full_name":"ZheYuan/Heartbleed","owner":{"login":"ZheYuan","id":3245033,"avatar_url":"https://avatars.githubusercontent.com/u/3245033?v=3","gravatar_id":"","url":"https://api.github.com/users/ZheYuan","html_url":"https://github.com/ZheYuan","followers_url":"https://api.github.com/users/ZheYuan/followers","following_url":"https://api.github.com/users/ZheYuan/following{/other_user}","gists_url":"https://api.github.com/users/ZheYuan/gists{/gist_id}","starred_url":"https://api.github.com/users/ZheYuan/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ZheYuan/subscriptions","organizations_url":"https://api.github.com/users/ZheYuan/orgs","repos_url":"https://api.github.com/users/ZheYuan/repos","events_url":"https://api.github.com/users/ZheYuan/events{/privacy}","received_events_url":"https://api.github.com/users/ZheYuan/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/ZheYuan/Heartbleed","description":"A checker (site and tool) for 
CVE-2014-0160","fork":true,"url":"https://api.github.com/repos/ZheYuan/Heartbleed","forks_url":"https://api.github.com/repos/ZheYuan/Heartbleed/forks","keys_url":"https://api.github.com/repos/ZheYuan/Heartbleed/keys{/key_id}","collaborators_url":"https://api.github.com/repos/ZheYuan/Heartbleed/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/ZheYuan/Heartbleed/teams","hooks_url":"https://api.github.com/repos/ZheYuan/Heartbleed/hooks","issue_events_url":"https://api.github.com/repos/ZheYuan/Heartbleed/issues/events{/number}","events_url":"https://api.github.com/repos/ZheYuan/Heartbleed/events","assignees_url":"https://api.github.com/repos/ZheYuan/Heartbleed/assignees{/user}","branches_url":"https://api.github.com/repos/ZheYuan/Heartbleed/branches{/branch}","tags_url":"https://api.github.com/repos/ZheYuan/Heartbleed/tags","blobs_url":"https://api.github.com/repos/ZheYuan/Heartbleed/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/ZheYuan/Heartbleed/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/ZheYuan/Heartbleed/git/refs{/sha}","trees_url":"https://api.github.com/repos/ZheYuan/Heartbleed/git/trees{/sha}","statuses_url":"https://api.github.com/repos/ZheYuan/Heartbleed/statuses/{sha}","languages_url":"https://api.github.com/repos/ZheYuan/Heartbleed/languages","stargazers_url":"https://api.github.com/repos/ZheYuan/Heartbleed/stargazers","contributors_url":"https://api.github.com/repos/ZheYuan/Heartbleed/contributors","subscribers_url":"https://api.github.com/repos/ZheYuan/Heartbleed/subscribers","subscription_url":"https://api.github.com/repos/ZheYuan/Heartbleed/subscription","commits_url":"https://api.github.com/repos/ZheYuan/Heartbleed/commits{/sha}","git_commits_url":"https://api.github.com/repos/ZheYuan/Heartbleed/git/commits{/sha}","comments_url":"https://api.github.com/repos/ZheYuan/Heartbleed/comments{/number}","issue_comment_url":"https://api.github.com/repos/ZheYuan/Heartbleed/issues/comments/{number}","contents
_url":"https://api.github.com/repos/ZheYuan/Heartbleed/contents/{+path}","compare_url":"https://api.github.com/repos/ZheYuan/Heartbleed/compare/{base}...{head}","merges_url":"https://api.github.com/repos/ZheYuan/Heartbleed/merges","archive_url":"https://api.github.com/repos/ZheYuan/Heartbleed/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/ZheYuan/Heartbleed/downloads","issues_url":"https://api.github.com/repos/ZheYuan/Heartbleed/issues{/number}","pulls_url":"https://api.github.com/repos/ZheYuan/Heartbleed/pulls{/number}","milestones_url":"https://api.github.com/repos/ZheYuan/Heartbleed/milestones{/number}","notifications_url":"https://api.github.com/repos/ZheYuan/Heartbleed/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/ZheYuan/Heartbleed/labels{/name}","releases_url":"https://api.github.com/repos/ZheYuan/Heartbleed/releases{/id}","created_at":"2015-01-01T01:00:55Z","updated_at":"2014-12-30T05:34:14Z","pushed_at":"2014-10-31T14:10:43Z","git_url":"git://github.com/ZheYuan/Heartbleed.git","ssh_url":"git@github.com:ZheYuan/Heartbleed.git","clone_url":"https://github.com/ZheYuan/Heartbleed.git","svn_url":"https://github.com/ZheYuan/Heartbleed","homepage":"http://filippo.io/Heartbleed","size":3139,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:00:56Z"}
{"id":"2489396297","type":"WatchEvent","actor":{"id":1015032,"login":"miketahani","gravatar_id":"","url":"https://api.github.com/users/miketahani","avatar_url":"https://avatars.githubusercontent.com/u/1015032?"},"repo":{"id":28179549,"name":"substack/geodetic-to-ecef","url":"https://api.github.com/repos/substack/geodetic-to-ecef"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:00:56Z"}
{"id":"2489396300","type":"PushEvent","actor":{"id":10176820,"login":"chalavadivishnu","gravatar_id":"","url":"https://api.github.com/users/chalavadivishnu","avatar_url":"https://avatars.githubusercontent.com/u/10176820?"},"repo":{"id":28678150,"name":"chalavadivishnu/Face-Detection","url":"https://api.github.com/repos/chalavadivishnu/Face-Detection"},"payload":{"push_id":536752420,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"9b5858f96f8d101afa8e568dbe8424c32d010166","before":"8069b04a69d5729520e64e6c88c262a77407bd75","commits":[{"sha":"9b5858f96f8d101afa8e568dbe8424c32d010166","author":{"email":"ce8044f02eb2a26b631671f5297317036d398e79@gmail.com","name":"Chalavadi Vishnu"},"message":"create gabor","distinct":true,"url":"https://api.github.com/repos/chalavadivishnu/Face-Detection/commits/9b5858f96f8d101afa8e568dbe8424c32d010166"}]},"public":true,"created_at":"2015-01-01T01:00:56Z"}
{"id":"2489396301","type":"PushEvent","actor":{"id":66577,"login":"JakeWharton","gravatar_id":"","url":"https://api.github.com/users/JakeWharton","avatar_url":"https://avatars.githubusercontent.com/u/66577?"},"repo":{"id":5152285,"name":"square/okhttp","url":"https://api.github.com/repos/square/okhttp"},"payload":{"push_id":536752417,"size":1,"distinct_size":1,"ref":"refs/heads/jw/websocket-call","head":"aa126df6b62dfc1c5b442a8a53ee601ac2579ef7","before":"bc4462296aec3798ee5f2be993f851552b0e1215","commits":[{"sha":"aa126df6b62dfc1c5b442a8a53ee601ac2579ef7","author":{"email":"9ec2b9d5f2203d75c2b0f7885bd663d9d57a2d20@squareup.com","name":"Jake Wharton"},"message":"Add a web socket call concept for connecting.\n\nSimilar to HTTP and Call, the WebSocketCall is a representation of a pending HTTP request and subsequent upgrade to speak web sockets. Upon synchronous execution you are handed a WebSocket instance for synchronous writing and also pass in a WebSocketListener for async callbacks due to reading.\n\nThe API changes in this commits also generalize WebSocket such that it's agnostic to being a client or server peer.","distinct":true,"url":"https://api.github.com/repos/square/okhttp/commits/aa126df6b62dfc1c5b442a8a53ee601ac2579ef7"}]},"public":true,"created_at":"2015-01-01T01:00:56Z","org":{"id":82592,"login":"square","gravatar_id":"","url":"https://api.github.com/orgs/square","avatar_url":"https://avatars.githubusercontent.com/u/82592?"}}
{"id":"2489396303","type":"PushEvent","actor":{"id":1373703,"login":"team3cord","gravatar_id":"","url":"https://api.github.com/users/team3cord","avatar_url":"https://avatars.githubusercontent.com/u/1373703?"},"repo":{"id":20268125,"name":"team3cord/mc-dotfiles","url":"https://api.github.com/repos/team3cord/mc-dotfiles"},"payload":{"push_id":536752421,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"c274de69b1397e2b2b3a92b5cbba22b87211ffa0","before":"57e4c5c28b8fed6b308b24f86432d3676fd8d96e","commits":[{"sha":"c274de69b1397e2b2b3a92b5cbba22b87211ffa0","author":{"email":"67bcad84ab1facdcd6a44cf7083c26cfa2e421e4@gmail.com","name":"MattCordeiro"},"message":"Updated vim configuration","distinct":true,"url":"https://api.github.com/repos/team3cord/mc-dotfiles/commits/c274de69b1397e2b2b3a92b5cbba22b87211ffa0"}]},"public":true,"created_at":"2015-01-01T01:00:56Z"}
{"id":"2489396304","type":"PushEvent","actor":{"id":6972205,"login":"K-Niu","gravatar_id":"","url":"https://api.github.com/users/K-Niu","avatar_url":"https://avatars.githubusercontent.com/u/6972205?"},"repo":{"id":28167043,"name":"K-Niu/K-Niu.github.io","url":"https://api.github.com/repos/K-Niu/K-Niu.github.io"},"payload":{"push_id":536752423,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f7edf3b95aaa966869a8fa8c38b9ff806578a6ef","before":"c62ef93bb13e2d3e3aa1539782d65e3850b08230","commits":[{"sha":"f7edf3b95aaa966869a8fa8c38b9ff806578a6ef","author":{"email":"13bbb662ce51dd619e7c17a547e4f7c5b3d9c40d@gmail.com","name":"K-Niu"},"message":"Updated README","distinct":true,"url":"https://api.github.com/repos/K-Niu/K-Niu.github.io/commits/f7edf3b95aaa966869a8fa8c38b9ff806578a6ef"}]},"public":true,"created_at":"2015-01-01T01:00:56Z"}
{"id":"2489396306","type":"PushEvent","actor":{"id":9828988,"login":"alexformagio","gravatar_id":"","url":"https://api.github.com/users/alexformagio","avatar_url":"https://avatars.githubusercontent.com/u/9828988?"},"repo":{"id":28678021,"name":"alexformagio/python30min","url":"https://api.github.com/repos/alexformagio/python30min"},"payload":{"push_id":536752424,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"6148df2e7babc92c0568cc452deae2b683a041da","before":"c20ef006701c56b5440a24d782a2330ddc465619","commits":[{"sha":"6148df2e7babc92c0568cc452deae2b683a041da","author":{"email":"eb51c250a6d7f2b7307829ec95405c85965e34b2@gmail.com","name":"alex_formagio"},"message":"adding gitignore","distinct":true,"url":"https://api.github.com/repos/alexformagio/python30min/commits/6148df2e7babc92c0568cc452deae2b683a041da"}]},"public":true,"created_at":"2015-01-01T01:00:56Z"}
{"id":"2489396307","type":"PushEvent","actor":{"id":10144074,"login":"carodew","gravatar_id":"","url":"https://api.github.com/users/carodew","avatar_url":"https://avatars.githubusercontent.com/u/10144074?"},"repo":{"id":27844858,"name":"carodew/carodew.github.io","url":"https://api.github.com/repos/carodew/carodew.github.io"},"payload":{"push_id":536752425,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"19643dcb3388a0ae99570e176fc592e0fd666c81","before":"8b73f1d4d2ee61797b2d644ff44cda0f9b691aeb","commits":[{"sha":"19643dcb3388a0ae99570e176fc592e0fd666c81","author":{"email":"6e3c6f0214740e9061d9ca5c79eb6e0ff9cc1741@unknown542696dd77af.gateway.pace.com","name":"Carolyn"},"message":"tweak project layout","distinct":true,"url":"https://api.github.com/repos/carodew/carodew.github.io/commits/19643dcb3388a0ae99570e176fc592e0fd666c81"}]},"public":true,"created_at":"2015-01-01T01:00:56Z"}
{"id":"2489396314","type":"CommitCommentEvent","actor":{"id":3372342,"login":"bors","gravatar_id":"","url":"https://api.github.com/users/bors","avatar_url":"https://avatars.githubusercontent.com/u/3372342?"},"repo":{"id":724712,"name":"rust-lang/rust","url":"https://api.github.com/repos/rust-lang/rust"},"payload":{"comment":{"url":"https://api.github.com/repos/rust-lang/rust/comments/9131360","html_url":"https://github.com/rust-lang/rust/commit/8f98078b1508c7ebd488c4ab864a4d2fb02d44f8#commitcomment-9131360","id":9131360,"user":{"login":"bors","id":3372342,"avatar_url":"https://avatars.githubusercontent.com/u/3372342?v=3","gravatar_id":"","url":"https://api.github.com/users/bors","html_url":"https://github.com/bors","followers_url":"https://api.github.com/users/bors/followers","following_url":"https://api.github.com/users/bors/following{/other_user}","gists_url":"https://api.github.com/users/bors/gists{/gist_id}","starred_url":"https://api.github.com/users/bors/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/bors/subscriptions","organizations_url":"https://api.github.com/users/bors/orgs","repos_url":"https://api.github.com/users/bors/repos","events_url":"https://api.github.com/users/bors/events{/privacy}","received_events_url":"https://api.github.com/users/bors/received_events","type":"User","site_admin":false},"position":null,"line":null,"path":null,"commit_id":"8f98078b1508c7ebd488c4ab864a4d2fb02d44f8","created_at":"2015-01-01T01:00:56Z","updated_at":"2015-01-01T01:00:56Z","body":"merging japaric/rust/moar-uc = 8f98078b into auto"}},"public":true,"created_at":"2015-01-01T01:00:56Z","org":{"id":5430905,"login":"rust-lang","gravatar_id":"","url":"https://api.github.com/orgs/rust-lang","avatar_url":"https://avatars.githubusercontent.com/u/5430905?"}}
{"id":"2489396315","type":"PushEvent","actor":{"id":3372342,"login":"bors","gravatar_id":"","url":"https://api.github.com/users/bors","avatar_url":"https://avatars.githubusercontent.com/u/3372342?"},"repo":{"id":724712,"name":"rust-lang/rust","url":"https://api.github.com/repos/rust-lang/rust"},"payload":{"push_id":536752427,"size":0,"distinct_size":0,"ref":"refs/heads/auto","head":"10d99a973498c5a1be6ba318210751efc1c2cf61","before":"7013291b3c4b85fb9ffe356630d9aa575aa7f35a","commits":[]},"public":true,"created_at":"2015-01-01T01:00:57Z","org":{"id":5430905,"login":"rust-lang","gravatar_id":"","url":"https://api.github.com/orgs/rust-lang","avatar_url":"https://avatars.githubusercontent.com/u/5430905?"}}
{"id":"2489396316","type":"PushEvent","actor":{"id":5869772,"login":"felixonmars-bot","gravatar_id":"","url":"https://api.github.com/users/felixonmars-bot","avatar_url":"https://avatars.githubusercontent.com/u/5869772?"},"repo":{"id":14148979,"name":"felixonmars/aur-mirror","url":"https://api.github.com/repos/felixonmars/aur-mirror"},"payload":{"push_id":536752431,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e54aae07fb256cafa088c8fc82f21b2931fa0b12","before":"27b0aad8faabf64ecd13ba93090ebe43d2706d55","commits":[{"sha":"e54aae07fb256cafa088c8fc82f21b2931fa0b12","author":{"email":"b68e87e72ad86ae664b595742624a5b780191f69@gmail.com","name":"Kyle Keen"},"message":"updated on Thu Jan  1 00:00:32 UTC 2015","distinct":true,"url":"https://api.github.com/repos/felixonmars/aur-mirror/commits/e54aae07fb256cafa088c8fc82f21b2931fa0b12"}]},"public":true,"created_at":"2015-01-01T01:00:57Z"}
{"id":"2489396319","type":"PushEvent","actor":{"id":3828361,"login":"kiahosseini","gravatar_id":"","url":"https://api.github.com/users/kiahosseini","avatar_url":"https://avatars.githubusercontent.com/u/3828361?"},"repo":{"id":27885085,"name":"kiahosseini/kiahosseini.github.io","url":"https://api.github.com/repos/kiahosseini/kiahosseini.github.io"},"payload":{"push_id":536752434,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"c916f5f5ebe46499985ca552a6e0a1fd74599d54","before":"31b0d34e0a62d3b38e348a29a7e89079982080c4","commits":[{"sha":"ffd765729e0c8362490a5488cec37f072654cfec","author":{"email":"268618c87e98ee43d06d901feef069e47f43f688@gmail.com","name":"Kiarash Hosseini"},"message":".","distinct":true,"url":"https://api.github.com/repos/kiahosseini/kiahosseini.github.io/commits/ffd765729e0c8362490a5488cec37f072654cfec"},{"sha":"c916f5f5ebe46499985ca552a6e0a1fd74599d54","author":{"email":"268618c87e98ee43d06d901feef069e47f43f688@gmail.com","name":"Kiarash Hosseini"},"message":".","distinct":true,"url":"https://api.github.com/repos/kiahosseini/kiahosseini.github.io/commits/c916f5f5ebe46499985ca552a6e0a1fd74599d54"}]},"public":true,"created_at":"2015-01-01T01:00:57Z"}
{"id":"2489396320","type":"GollumEvent","actor":{"id":7797609,"login":"ivanwfr","gravatar_id":"","url":"https://api.github.com/users/ivanwfr","avatar_url":"https://avatars.githubusercontent.com/u/7797609?"},"repo":{"id":808316,"name":"cswetenham/tabspace2.1","url":"https://api.github.com/repos/cswetenham/tabspace2.1"},"payload":{"pages":[{"page_name":"Home","title":"Home","summary":null,"action":"edited","sha":"425ecdb18436e26cab4dcaa4db8d7b57650a5e27","html_url":"https://github.com/cswetenham/tabspace2.1/wiki/Home"}]},"public":true,"created_at":"2015-01-01T01:00:57Z"}
{"id":"2489396321","type":"PushEvent","actor":{"id":18257,"login":"keisukefukuda","gravatar_id":"","url":"https://api.github.com/users/keisukefukuda","avatar_url":"https://avatars.githubusercontent.com/u/18257?"},"repo":{"id":4476852,"name":"keisukefukuda/dotfiles","url":"https://api.github.com/repos/keisukefukuda/dotfiles"},"payload":{"push_id":536752435,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"32f4510f99c1963b3500fafe4a0373160f9290b6","before":"5c497bfeed64eb68e6b46645270222111ac51a4e","commits":[{"sha":"32f4510f99c1963b3500fafe4a0373160f9290b6","author":{"email":"e20d997393fae6e64f65ca9b73604073336c9900@gmail.com","name":"Keisuke Fukuda"},"message":"commented out unnecessary zsh fpath","distinct":true,"url":"https://api.github.com/repos/keisukefukuda/dotfiles/commits/32f4510f99c1963b3500fafe4a0373160f9290b6"}]},"public":true,"created_at":"2015-01-01T01:00:57Z"}
{"id":"2489396322","type":"PushEvent","actor":{"id":5631503,"login":"Autodidact24","gravatar_id":"","url":"https://api.github.com/users/Autodidact24","avatar_url":"https://avatars.githubusercontent.com/u/5631503?"},"repo":{"id":21542754,"name":"Autodidact24/autodidact24.github.io","url":"https://api.github.com/repos/Autodidact24/autodidact24.github.io"},"payload":{"push_id":536752436,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"2ee7b23cb5d65a89d79b88734e606fc0a1b2acac","before":"8b2eadf9f36df15261e7c2dbd502a0978fadfb82","commits":[{"sha":"2ee7b23cb5d65a89d79b88734e606fc0a1b2acac","author":{"email":"7e51ff80808f27ff5907bcc8c43a3f5980edcc6f@gmail.com","name":"Shubham Singh Tomar"},"message":"new post","distinct":true,"url":"https://api.github.com/repos/Autodidact24/autodidact24.github.io/commits/2ee7b23cb5d65a89d79b88734e606fc0a1b2acac"}]},"public":true,"created_at":"2015-01-01T01:00:57Z"}
{"id":"2489396324","type":"CommitCommentEvent","actor":{"id":3372342,"login":"bors","gravatar_id":"","url":"https://api.github.com/users/bors","avatar_url":"https://avatars.githubusercontent.com/u/3372342?"},"repo":{"id":724712,"name":"rust-lang/rust","url":"https://api.github.com/repos/rust-lang/rust"},"payload":{"comment":{"url":"https://api.github.com/repos/rust-lang/rust/comments/9131361","html_url":"https://github.com/rust-lang/rust/commit/8f98078b1508c7ebd488c4ab864a4d2fb02d44f8#commitcomment-9131361","id":9131361,"user":{"login":"bors","id":3372342,"avatar_url":"https://avatars.githubusercontent.com/u/3372342?v=3","gravatar_id":"","url":"https://api.github.com/users/bors","html_url":"https://github.com/bors","followers_url":"https://api.github.com/users/bors/followers","following_url":"https://api.github.com/users/bors/following{/other_user}","gists_url":"https://api.github.com/users/bors/gists{/gist_id}","starred_url":"https://api.github.com/users/bors/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/bors/subscriptions","organizations_url":"https://api.github.com/users/bors/orgs","repos_url":"https://api.github.com/users/bors/repos","events_url":"https://api.github.com/users/bors/events{/privacy}","received_events_url":"https://api.github.com/users/bors/received_events","type":"User","site_admin":false},"position":null,"line":null,"path":null,"commit_id":"8f98078b1508c7ebd488c4ab864a4d2fb02d44f8","created_at":"2015-01-01T01:00:57Z","updated_at":"2015-01-01T01:00:57Z","body":"status: {\"merge_sha\": \"a570791cd4118c97b4a14b4a27a273a2f3ed466e\"}"}},"public":true,"created_at":"2015-01-01T01:00:57Z","org":{"id":5430905,"login":"rust-lang","gravatar_id":"","url":"https://api.github.com/orgs/rust-lang","avatar_url":"https://avatars.githubusercontent.com/u/5430905?"}}
{"id":"2489396329","type":"PushEvent","actor":{"id":283089,"login":"openemr","gravatar_id":"","url":"https://api.github.com/users/openemr","avatar_url":"https://avatars.githubusercontent.com/u/283089?"},"repo":{"id":1473462,"name":"openemr/translations_development_openemr","url":"https://api.github.com/repos/openemr/translations_development_openemr"},"payload":{"push_id":536752438,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"6af5103f19520b8aa4560b55c1c5eedb668aea29","before":"d7c7b8cc839d9724d49a5f45176ed896226ca068","commits":[{"sha":"6af5103f19520b8aa4560b55c1c5eedb668aea29","author":{"email":"cbb210ee4c1aeabb7ba82d51bf63db966bfa0e88@users.sourceforge.net","name":"bradymiller"},"message":"Routine Automated Development Translations Update","distinct":true,"url":"https://api.github.com/repos/openemr/translations_development_openemr/commits/6af5103f19520b8aa4560b55c1c5eedb668aea29"}]},"public":true,"created_at":"2015-01-01T01:00:58Z"}
{"id":"2489396331","type":"PushEvent","actor":{"id":3372342,"login":"bors","gravatar_id":"","url":"https://api.github.com/users/bors","avatar_url":"https://avatars.githubusercontent.com/u/3372342?"},"repo":{"id":724712,"name":"rust-lang/rust","url":"https://api.github.com/repos/rust-lang/rust"},"payload":{"push_id":536752437,"size":24,"distinct_size":24,"ref":"refs/heads/auto","head":"a570791cd4118c97b4a14b4a27a273a2f3ed466e","before":"10d99a973498c5a1be6ba318210751efc1c2cf61","commits":[{"sha":"ea94a90488e6b4701581079339de3595389e5b15","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"unicode: unbox closures used in function arguments","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/ea94a90488e6b4701581079339de3595389e5b15"},{"sha":"a17c2b60e1c32e950b011296025a9f88f4d3c4e4","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"collections: fix fallout","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/a17c2b60e1c32e950b011296025a9f88f4d3c4e4"},{"sha":"44dc9196d3854e43e921800dea5d939b2ca178ce","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"std: unbox closures used in function arguments","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/44dc9196d3854e43e921800dea5d939b2ca178ce"},{"sha":"bcbe9f2e7ae8cbea9f85100d50c00f3dd492b318","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"syntax: unbox closures used in function arguments","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/bcbe9f2e7ae8cbea9f85100d50c00f3dd492b318"},{"sha":"3c1b5d3aa23ea16c804c1a7dbfab5ad932efd940","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"rustc: unbox closures used in function 
arguments","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/3c1b5d3aa23ea16c804c1a7dbfab5ad932efd940"},{"sha":"c3baa1800105e2cb6e6d58b3f835812e150f50b2","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"rustc_trans: unbox closures used in function arguments","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/c3baa1800105e2cb6e6d58b3f835812e150f50b2"},{"sha":"79b36818e4dc825dd843c2ee500b5969acee6068","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"rustc_borrowck: unbox closures used in function arguments","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/79b36818e4dc825dd843c2ee500b5969acee6068"},{"sha":"9168e0f270783ce9e5238f87830c18df63c394a6","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"core: unbox closures used in let bindings","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/9168e0f270783ce9e5238f87830c18df63c394a6"},{"sha":"e4397075acbb241926f142ed6b54a6d4abc198a9","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"getopts: unbox closures used in let bindings","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/e4397075acbb241926f142ed6b54a6d4abc198a9"},{"sha":"aaed78886dbf819914c48fde4890f080548adcea","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"rustc: unbox closures used in let bindings","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/aaed78886dbf819914c48fde4890f080548adcea"},{"sha":"d4bfc5c9cf24f0428124e1257dc631a7d9125088","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"rustc_back: unbox closures used in let 
bindings","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/d4bfc5c9cf24f0428124e1257dc631a7d9125088"},{"sha":"e0ed73bd1d5308922c7f4a2e60e565e97b06160c","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"rustc_borrowck: unbox closures used in let bindings","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/e0ed73bd1d5308922c7f4a2e60e565e97b06160c"},{"sha":"8c842f8ebf4f67e19e1d7e1e7538212575f10319","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"rustc_driver: unbox closures used in let bindings","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/8c842f8ebf4f67e19e1d7e1e7538212575f10319"},{"sha":"48a1e43b92c46586f1ec77e63eb9c3b72468c00b","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"rustc_resolve: unbox closures used in let bindings","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/48a1e43b92c46586f1ec77e63eb9c3b72468c00b"},{"sha":"5ac73e12e844b575961bf61a10f9b23e48e90c89","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"rustc_trans: unbox closures used in let bindings","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/5ac73e12e844b575961bf61a10f9b23e48e90c89"},{"sha":"450e6793327408f14659b922b9ce0169798d1b07","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"rustc_typeck: unbox closures used in let bindings","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/450e6793327408f14659b922b9ce0169798d1b07"},{"sha":"653f372b59f5465fac5f808e02c7dd82da7cdbd7","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"rustdoc: unbox closures used in let 
bindings","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/653f372b59f5465fac5f808e02c7dd82da7cdbd7"},{"sha":"0da9d07e2d331a57304809e5cfc26b4b8d938b44","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"std: unbox closures used in let bindings","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/0da9d07e2d331a57304809e5cfc26b4b8d938b44"},{"sha":"bbc0ce866d5f7db982eefbca6d184e2ce0c6ebe8","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"syntax: unbox closures used in let bindings","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/bbc0ce866d5f7db982eefbca6d184e2ce0c6ebe8"},{"sha":"26278cea5afd35166415dcaede78c3b9b3fdaeac","author":{"email":"550518ab9d14bd32155907315f74849d7b5c2b36@gmail.com","name":"Jorge Aparicio"},"message":"time: unbox closures used in let bindings","distinct":true,"url":"https://api.github.com/repos/rust-lang/rust/commits/26278cea5afd35166415dcaede78c3b9b3fdaeac"}]},"public":true,"created_at":"2015-01-01T01:00:58Z","org":{"id":5430905,"login":"rust-lang","gravatar_id":"","url":"https://api.github.com/orgs/rust-lang","avatar_url":"https://avatars.githubusercontent.com/u/5430905?"}}
{"id":"2489396334","type":"CommitCommentEvent","actor":{"id":3372342,"login":"bors","gravatar_id":"","url":"https://api.github.com/users/bors","avatar_url":"https://avatars.githubusercontent.com/u/3372342?"},"repo":{"id":724712,"name":"rust-lang/rust","url":"https://api.github.com/repos/rust-lang/rust"},"payload":{"comment":{"url":"https://api.github.com/repos/rust-lang/rust/comments/9131362","html_url":"https://github.com/rust-lang/rust/commit/8f98078b1508c7ebd488c4ab864a4d2fb02d44f8#commitcomment-9131362","id":9131362,"user":{"login":"bors","id":3372342,"avatar_url":"https://avatars.githubusercontent.com/u/3372342?v=3","gravatar_id":"","url":"https://api.github.com/users/bors","html_url":"https://github.com/bors","followers_url":"https://api.github.com/users/bors/followers","following_url":"https://api.github.com/users/bors/following{/other_user}","gists_url":"https://api.github.com/users/bors/gists{/gist_id}","starred_url":"https://api.github.com/users/bors/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/bors/subscriptions","organizations_url":"https://api.github.com/users/bors/orgs","repos_url":"https://api.github.com/users/bors/repos","events_url":"https://api.github.com/users/bors/events{/privacy}","received_events_url":"https://api.github.com/users/bors/received_events","type":"User","site_admin":false},"position":null,"line":null,"path":null,"commit_id":"8f98078b1508c7ebd488c4ab864a4d2fb02d44f8","created_at":"2015-01-01T01:00:58Z","updated_at":"2015-01-01T01:00:58Z","body":"japaric/rust/moar-uc = 8f98078b merged ok, testing candidate = a570791c"}},"public":true,"created_at":"2015-01-01T01:00:58Z","org":{"id":5430905,"login":"rust-lang","gravatar_id":"","url":"https://api.github.com/orgs/rust-lang","avatar_url":"https://avatars.githubusercontent.com/u/5430905?"}}
{"id":"2489396336","type":"PushEvent","actor":{"id":6154548,"login":"chrisanthropic","gravatar_id":"","url":"https://api.github.com/users/chrisanthropic","avatar_url":"https://avatars.githubusercontent.com/u/6154548?"},"repo":{"id":28470344,"name":"chrisanthropic/comical-jekyll-theme","url":"https://api.github.com/repos/chrisanthropic/comical-jekyll-theme"},"payload":{"push_id":536752440,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"51a3f37c2253a92322a371d8dac0024c94929c77","before":"18691cb662324d1431eda0263f67f414d53b4870","commits":[{"sha":"51a3f37c2253a92322a371d8dac0024c94929c77","author":{"email":"a9c72f90f6fdaaea784cb28e2da787f981b8fb43@gmail.com","name":"Christopher Tarwater"},"message":"updates","distinct":true,"url":"https://api.github.com/repos/chrisanthropic/comical-jekyll-theme/commits/51a3f37c2253a92322a371d8dac0024c94929c77"}]},"public":true,"created_at":"2015-01-01T01:00:59Z"}
{"id":"2489396337","type":"ForkEvent","actor":{"id":7366091,"login":"coryasato","gravatar_id":"","url":"https://api.github.com/users/coryasato","avatar_url":"https://avatars.githubusercontent.com/u/7366091?"},"repo":{"id":28153049,"name":"EKGAPI/KardiaApp","url":"https://api.github.com/repos/EKGAPI/KardiaApp"},"payload":{"forkee":{"id":28678221,"name":"KardiaApp","full_name":"coryasato/KardiaApp","owner":{"login":"coryasato","id":7366091,"avatar_url":"https://avatars.githubusercontent.com/u/7366091?v=3","gravatar_id":"","url":"https://api.github.com/users/coryasato","html_url":"https://github.com/coryasato","followers_url":"https://api.github.com/users/coryasato/followers","following_url":"https://api.github.com/users/coryasato/following{/other_user}","gists_url":"https://api.github.com/users/coryasato/gists{/gist_id}","starred_url":"https://api.github.com/users/coryasato/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/coryasato/subscriptions","organizations_url":"https://api.github.com/users/coryasato/orgs","repos_url":"https://api.github.com/users/coryasato/repos","events_url":"https://api.github.com/users/coryasato/events{/privacy}","received_events_url":"https://api.github.com/users/coryasato/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/coryasato/KardiaApp","description":"","fork":true,"url":"https://api.github.com/repos/coryasato/KardiaApp","forks_url":"https://api.github.com/repos/coryasato/KardiaApp/forks","keys_url":"https://api.github.com/repos/coryasato/KardiaApp/keys{/key_id}","collaborators_url":"https://api.github.com/repos/coryasato/KardiaApp/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/coryasato/KardiaApp/teams","hooks_url":"https://api.github.com/repos/coryasato/KardiaApp/hooks","issue_events_url":"https://api.github.com/repos/coryasato/KardiaApp/issues/events{/number}","events_url":"https://api.github.com/repos/coryasato/KardiaApp/events","assig
nees_url":"https://api.github.com/repos/coryasato/KardiaApp/assignees{/user}","branches_url":"https://api.github.com/repos/coryasato/KardiaApp/branches{/branch}","tags_url":"https://api.github.com/repos/coryasato/KardiaApp/tags","blobs_url":"https://api.github.com/repos/coryasato/KardiaApp/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/coryasato/KardiaApp/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/coryasato/KardiaApp/git/refs{/sha}","trees_url":"https://api.github.com/repos/coryasato/KardiaApp/git/trees{/sha}","statuses_url":"https://api.github.com/repos/coryasato/KardiaApp/statuses/{sha}","languages_url":"https://api.github.com/repos/coryasato/KardiaApp/languages","stargazers_url":"https://api.github.com/repos/coryasato/KardiaApp/stargazers","contributors_url":"https://api.github.com/repos/coryasato/KardiaApp/contributors","subscribers_url":"https://api.github.com/repos/coryasato/KardiaApp/subscribers","subscription_url":"https://api.github.com/repos/coryasato/KardiaApp/subscription","commits_url":"https://api.github.com/repos/coryasato/KardiaApp/commits{/sha}","git_commits_url":"https://api.github.com/repos/coryasato/KardiaApp/git/commits{/sha}","comments_url":"https://api.github.com/repos/coryasato/KardiaApp/comments{/number}","issue_comment_url":"https://api.github.com/repos/coryasato/KardiaApp/issues/comments/{number}","contents_url":"https://api.github.com/repos/coryasato/KardiaApp/contents/{+path}","compare_url":"https://api.github.com/repos/coryasato/KardiaApp/compare/{base}...{head}","merges_url":"https://api.github.com/repos/coryasato/KardiaApp/merges","archive_url":"https://api.github.com/repos/coryasato/KardiaApp/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/coryasato/KardiaApp/downloads","issues_url":"https://api.github.com/repos/coryasato/KardiaApp/issues{/number}","pulls_url":"https://api.github.com/repos/coryasato/KardiaApp/pulls{/number}","milestones_url":"https://api.github.com/repos/coryasat
o/KardiaApp/milestones{/number}","notifications_url":"https://api.github.com/repos/coryasato/KardiaApp/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/coryasato/KardiaApp/labels{/name}","releases_url":"https://api.github.com/repos/coryasato/KardiaApp/releases{/id}","created_at":"2015-01-01T01:00:59Z","updated_at":"2014-12-31T23:06:40Z","pushed_at":"2014-12-31T23:06:38Z","git_url":"git://github.com/coryasato/KardiaApp.git","ssh_url":"git@github.com:coryasato/KardiaApp.git","clone_url":"https://github.com/coryasato/KardiaApp.git","svn_url":"https://github.com/coryasato/KardiaApp","homepage":null,"size":362,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:00:59Z","org":{"id":9016021,"login":"EKGAPI","gravatar_id":"","url":"https://api.github.com/orgs/EKGAPI","avatar_url":"https://avatars.githubusercontent.com/u/9016021?"}}
{"id":"2489396340","type":"CreateEvent","actor":{"id":1734986,"login":"Adamwgoh","gravatar_id":"","url":"https://api.github.com/users/Adamwgoh","avatar_url":"https://avatars.githubusercontent.com/u/1734986?"},"repo":{"id":28678222,"name":"Adamwgoh/Laura","url":"https://api.github.com/repos/Adamwgoh/Laura"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"G52GRP re-upload","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:00:59Z"}
{"id":"2489396341","type":"WatchEvent","actor":{"id":1570089,"login":"sirvon","gravatar_id":"","url":"https://api.github.com/users/sirvon","avatar_url":"https://avatars.githubusercontent.com/u/1570089?"},"repo":{"id":1971346,"name":"msgpack/msgpack-java","url":"https://api.github.com/repos/msgpack/msgpack-java"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:00:59Z","org":{"id":198264,"login":"msgpack","gravatar_id":"","url":"https://api.github.com/orgs/msgpack","avatar_url":"https://avatars.githubusercontent.com/u/198264?"}}
{"id":"2489396342","type":"PushEvent","actor":{"id":6900864,"login":"abuehab","gravatar_id":"","url":"https://api.github.com/users/abuehab","avatar_url":"https://avatars.githubusercontent.com/u/6900864?"},"repo":{"id":26771667,"name":"smss123/BylsanSystem","url":"https://api.github.com/repos/smss123/BylsanSystem"},"payload":{"push_id":536752442,"size":0,"distinct_size":0,"ref":"refs/heads/master","head":"fc430dab978b650fcf7d828048be9dfacce2f4b7","before":"fc430dab978b650fcf7d828048be9dfacce2f4b7","commits":[]},"public":true,"created_at":"2015-01-01T01:00:59Z"}
{"id":"2489396343","type":"ForkEvent","actor":{"id":18191,"login":"jc00ke","gravatar_id":"","url":"https://api.github.com/users/jc00ke","avatar_url":"https://avatars.githubusercontent.com/u/18191?"},"repo":{"id":10488201,"name":"JeanMertz/chruby-fish","url":"https://api.github.com/repos/JeanMertz/chruby-fish"},"payload":{"forkee":{"id":28678223,"name":"chruby-fish","full_name":"jc00ke/chruby-fish","owner":{"login":"jc00ke","id":18191,"avatar_url":"https://avatars.githubusercontent.com/u/18191?v=3","gravatar_id":"","url":"https://api.github.com/users/jc00ke","html_url":"https://github.com/jc00ke","followers_url":"https://api.github.com/users/jc00ke/followers","following_url":"https://api.github.com/users/jc00ke/following{/other_user}","gists_url":"https://api.github.com/users/jc00ke/gists{/gist_id}","starred_url":"https://api.github.com/users/jc00ke/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jc00ke/subscriptions","organizations_url":"https://api.github.com/users/jc00ke/orgs","repos_url":"https://api.github.com/users/jc00ke/repos","events_url":"https://api.github.com/users/jc00ke/events{/privacy}","received_events_url":"https://api.github.com/users/jc00ke/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/jc00ke/chruby-fish","description":"Thin wrapper around chruby to make it work with the Fish 
shell","fork":true,"url":"https://api.github.com/repos/jc00ke/chruby-fish","forks_url":"https://api.github.com/repos/jc00ke/chruby-fish/forks","keys_url":"https://api.github.com/repos/jc00ke/chruby-fish/keys{/key_id}","collaborators_url":"https://api.github.com/repos/jc00ke/chruby-fish/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/jc00ke/chruby-fish/teams","hooks_url":"https://api.github.com/repos/jc00ke/chruby-fish/hooks","issue_events_url":"https://api.github.com/repos/jc00ke/chruby-fish/issues/events{/number}","events_url":"https://api.github.com/repos/jc00ke/chruby-fish/events","assignees_url":"https://api.github.com/repos/jc00ke/chruby-fish/assignees{/user}","branches_url":"https://api.github.com/repos/jc00ke/chruby-fish/branches{/branch}","tags_url":"https://api.github.com/repos/jc00ke/chruby-fish/tags","blobs_url":"https://api.github.com/repos/jc00ke/chruby-fish/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/jc00ke/chruby-fish/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/jc00ke/chruby-fish/git/refs{/sha}","trees_url":"https://api.github.com/repos/jc00ke/chruby-fish/git/trees{/sha}","statuses_url":"https://api.github.com/repos/jc00ke/chruby-fish/statuses/{sha}","languages_url":"https://api.github.com/repos/jc00ke/chruby-fish/languages","stargazers_url":"https://api.github.com/repos/jc00ke/chruby-fish/stargazers","contributors_url":"https://api.github.com/repos/jc00ke/chruby-fish/contributors","subscribers_url":"https://api.github.com/repos/jc00ke/chruby-fish/subscribers","subscription_url":"https://api.github.com/repos/jc00ke/chruby-fish/subscription","commits_url":"https://api.github.com/repos/jc00ke/chruby-fish/commits{/sha}","git_commits_url":"https://api.github.com/repos/jc00ke/chruby-fish/git/commits{/sha}","comments_url":"https://api.github.com/repos/jc00ke/chruby-fish/comments{/number}","issue_comment_url":"https://api.github.com/repos/jc00ke/chruby-fish/issues/comments/{number}","contents_url":"h
ttps://api.github.com/repos/jc00ke/chruby-fish/contents/{+path}","compare_url":"https://api.github.com/repos/jc00ke/chruby-fish/compare/{base}...{head}","merges_url":"https://api.github.com/repos/jc00ke/chruby-fish/merges","archive_url":"https://api.github.com/repos/jc00ke/chruby-fish/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/jc00ke/chruby-fish/downloads","issues_url":"https://api.github.com/repos/jc00ke/chruby-fish/issues{/number}","pulls_url":"https://api.github.com/repos/jc00ke/chruby-fish/pulls{/number}","milestones_url":"https://api.github.com/repos/jc00ke/chruby-fish/milestones{/number}","notifications_url":"https://api.github.com/repos/jc00ke/chruby-fish/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/jc00ke/chruby-fish/labels{/name}","releases_url":"https://api.github.com/repos/jc00ke/chruby-fish/releases{/id}","created_at":"2015-01-01T01:00:59Z","updated_at":"2015-01-01T01:00:59Z","pushed_at":"2014-12-14T22:38:55Z","git_url":"git://github.com/jc00ke/chruby-fish.git","ssh_url":"git@github.com:jc00ke/chruby-fish.git","clone_url":"https://github.com/jc00ke/chruby-fish.git","svn_url":"https://github.com/jc00ke/chruby-fish","homepage":"","size":1047,"stargazers_count":0,"watchers_count":0,"language":"Shell","has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:00:59Z"}
{"id":"2489396345","type":"IssueCommentEvent","actor":{"id":3318117,"login":"Z0mbine","gravatar_id":"","url":"https://api.github.com/users/Z0mbine","avatar_url":"https://avatars.githubusercontent.com/u/3318117?"},"repo":{"id":15829679,"name":"alexgrist/ServerGuard","url":"https://api.github.com/repos/alexgrist/ServerGuard"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/alexgrist/ServerGuard/issues/118","labels_url":"https://api.github.com/repos/alexgrist/ServerGuard/issues/118/labels{/name}","comments_url":"https://api.github.com/repos/alexgrist/ServerGuard/issues/118/comments","events_url":"https://api.github.com/repos/alexgrist/ServerGuard/issues/118/events","html_url":"https://github.com/alexgrist/ServerGuard/issues/118","id":53203105,"number":118,"title":"[REQUEST] Chat","user":{"login":"SkyWalker3200","id":9349382,"avatar_url":"https://avatars.githubusercontent.com/u/9349382?v=3","gravatar_id":"","url":"https://api.github.com/users/SkyWalker3200","html_url":"https://github.com/SkyWalker3200","followers_url":"https://api.github.com/users/SkyWalker3200/followers","following_url":"https://api.github.com/users/SkyWalker3200/following{/other_user}","gists_url":"https://api.github.com/users/SkyWalker3200/gists{/gist_id}","starred_url":"https://api.github.com/users/SkyWalker3200/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/SkyWalker3200/subscriptions","organizations_url":"https://api.github.com/users/SkyWalker3200/orgs","repos_url":"https://api.github.com/users/SkyWalker3200/repos","events_url":"https://api.github.com/users/SkyWalker3200/events{/privacy}","received_events_url":"https://api.github.com/users/SkyWalker3200/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2014-12-31T20:57:23Z","updated_at":"2015-01-01T01:00:59Z","closed_at":null,"body":"Something that was brought up to me by one of my clan 
members is to have an option of chat prefixes.\r\nFor the ranks.\r\n\r\n[VIP] SkyWalker: Blah blah blah\r\n\r\nThought it would be a good addon.\r\n\r\n-SkyWalker"},"comment":{"url":"https://api.github.com/repos/alexgrist/ServerGuard/issues/comments/68477230","html_url":"https://github.com/alexgrist/ServerGuard/issues/118#issuecomment-68477230","issue_url":"https://api.github.com/repos/alexgrist/ServerGuard/issues/118","id":68477230,"user":{"login":"Z0mbine","id":3318117,"avatar_url":"https://avatars.githubusercontent.com/u/3318117?v=3","gravatar_id":"","url":"https://api.github.com/users/Z0mbine","html_url":"https://github.com/Z0mbine","followers_url":"https://api.github.com/users/Z0mbine/followers","following_url":"https://api.github.com/users/Z0mbine/following{/other_user}","gists_url":"https://api.github.com/users/Z0mbine/gists{/gist_id}","starred_url":"https://api.github.com/users/Z0mbine/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Z0mbine/subscriptions","organizations_url":"https://api.github.com/users/Z0mbine/orgs","repos_url":"https://api.github.com/users/Z0mbine/repos","events_url":"https://api.github.com/users/Z0mbine/events{/privacy}","received_events_url":"https://api.github.com/users/Z0mbine/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:00:59Z","updated_at":"2015-01-01T01:00:59Z","body":"Someone already requested this.\r\n#51 "}},"public":true,"created_at":"2015-01-01T01:01:00Z"}
{"id":"2489396346","type":"WatchEvent","actor":{"id":7291605,"login":"jtmancilla","gravatar_id":"","url":"https://api.github.com/users/jtmancilla","avatar_url":"https://avatars.githubusercontent.com/u/7291605?"},"repo":{"id":12711013,"name":"ropensci/webservices","url":"https://api.github.com/repos/ropensci/webservices"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:01:00Z","org":{"id":1200269,"login":"ropensci","gravatar_id":"","url":"https://api.github.com/orgs/ropensci","avatar_url":"https://avatars.githubusercontent.com/u/1200269?"}}
{"id":"2489396354","type":"PushEvent","actor":{"id":10125388,"login":"vowsentente","gravatar_id":"","url":"https://api.github.com/users/vowsentente","avatar_url":"https://avatars.githubusercontent.com/u/10125388?"},"repo":{"id":28586913,"name":"vowsentente/P1-NYC-MTA-Dataset","url":"https://api.github.com/repos/vowsentente/P1-NYC-MTA-Dataset"},"payload":{"push_id":536752446,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"ff747f0fd326bc2942004bc3cd89f7235d58cb18","before":"aed0f46e9f6f914fe3ae2ba78026590f90bef4af","commits":[{"sha":"ff747f0fd326bc2942004bc3cd89f7235d58cb18","author":{"email":"5e402b391f4e77b9a75e1e07b1348ffeae489b97@gmail.com","name":"Steve"},"message":"Update Short_Questions.md","distinct":true,"url":"https://api.github.com/repos/vowsentente/P1-NYC-MTA-Dataset/commits/ff747f0fd326bc2942004bc3cd89f7235d58cb18"}]},"public":true,"created_at":"2015-01-01T01:01:01Z"}
{"id":"2489396355","type":"PushEvent","actor":{"id":7256509,"login":"ww44ss","gravatar_id":"","url":"https://api.github.com/users/ww44ss","avatar_url":"https://avatars.githubusercontent.com/u/7256509?"},"repo":{"id":28677457,"name":"ww44ss/Titanic","url":"https://api.github.com/repos/ww44ss/Titanic"},"payload":{"push_id":536752445,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"dbd6831a613af879e35527ea486c559c23fd9b4a","before":"346e3c7b8a56b797dcbe3d5cfdeea9ff9f2963f8","commits":[{"sha":"dbd6831a613af879e35527ea486c559c23fd9b4a","author":{"email":"f3f15001ba38afaee860a89905381c5bde0dd27e@gmail.com","name":"Winston Saunders"},"message":"model1","distinct":true,"url":"https://api.github.com/repos/ww44ss/Titanic/commits/dbd6831a613af879e35527ea486c559c23fd9b4a"}]},"public":true,"created_at":"2015-01-01T01:01:01Z"}
{"id":"2489396356","type":"PushEvent","actor":{"id":4167278,"login":"frechei","gravatar_id":"","url":"https://api.github.com/users/frechei","avatar_url":"https://avatars.githubusercontent.com/u/4167278?"},"repo":{"id":9475465,"name":"frechei/frechei.github.com","url":"https://api.github.com/repos/frechei/frechei.github.com"},"payload":{"push_id":536752447,"size":3,"distinct_size":3,"ref":"refs/heads/master","head":"ecc17f6817f60facb356cd2431fcae42aa1adde6","before":"2781f52cf83cccff5a44c2cd5e5a31c71507bc5d","commits":[{"sha":"11498120a07a44ddb0303eec31672e4a3cf7d26f","author":{"email":"3ba795b10b0bab9eb3b0f6e5eaa6ef981f2e220e@163.com¨","name":"¨frechei¨"},"message":"Octopress init","distinct":true,"url":"https://api.github.com/repos/frechei/frechei.github.com/commits/11498120a07a44ddb0303eec31672e4a3cf7d26f"},{"sha":"01faf6dabf6d005d77d2433a509a34017fd5a800","author":{"email":"3ba795b10b0bab9eb3b0f6e5eaa6ef981f2e220e@163.com¨","name":"¨frechei¨"},"message":"合并冲突","distinct":true,"url":"https://api.github.com/repos/frechei/frechei.github.com/commits/01faf6dabf6d005d77d2433a509a34017fd5a800"},{"sha":"ecc17f6817f60facb356cd2431fcae42aa1adde6","author":{"email":"3ba795b10b0bab9eb3b0f6e5eaa6ef981f2e220e@163.com¨","name":"¨frechei¨"},"message":"Site updated at 2015-01-01 01:00:53 UTC","distinct":true,"url":"https://api.github.com/repos/frechei/frechei.github.com/commits/ecc17f6817f60facb356cd2431fcae42aa1adde6"}]},"public":true,"created_at":"2015-01-01T01:01:01Z"}
{"id":"2489396357","type":"PushEvent","actor":{"id":1903079,"login":"krizvi","gravatar_id":"","url":"https://api.github.com/users/krizvi","avatar_url":"https://avatars.githubusercontent.com/u/1903079?"},"repo":{"id":20293030,"name":"VHAINNOVATIONS/Mental-Health-eScreening","url":"https://api.github.com/repos/VHAINNOVATIONS/Mental-Health-eScreening"},"payload":{"push_id":536752448,"size":1,"distinct_size":1,"ref":"refs/heads/t651","head":"df757ed8ad0c31af27c6099cc0c2d8818cb2ff6b","before":"89b68f2e450ba74e169210925a0b02b1b02e2d9f","commits":[{"sha":"df757ed8ad0c31af27c6099cc0c2d8818cb2ff6b","author":{"email":"e0c3a02e4102d2b5ed70e51bf9a27df65846d12e@gmail.com","name":"Khalid R. Rizvi"},"message":"t651 fixed json data response by plucking unncessary data and also Lint the section controller","distinct":true,"url":"https://api.github.com/repos/VHAINNOVATIONS/Mental-Health-eScreening/commits/df757ed8ad0c31af27c6099cc0c2d8818cb2ff6b"}]},"public":true,"created_at":"2015-01-01T01:01:01Z","org":{"id":1252476,"login":"VHAINNOVATIONS","gravatar_id":"","url":"https://api.github.com/orgs/VHAINNOVATIONS","avatar_url":"https://avatars.githubusercontent.com/u/1252476?"}}
{"id":"2489396359","type":"PushEvent","actor":{"id":6952185,"login":"krico","gravatar_id":"","url":"https://api.github.com/users/krico","avatar_url":"https://avatars.githubusercontent.com/u/6952185?"},"repo":{"id":25744696,"name":"krico/jas","url":"https://api.github.com/repos/krico/jas"},"payload":{"push_id":536752450,"size":16,"distinct_size":12,"ref":"refs/heads/jas-95","head":"08bf4359f7d54b6a488c650b08fe8f31a8e1703a","before":"0459dc09acd412b54aba4a18c3463173938fbe02","commits":[{"sha":"7ad7fa31bafceb692bfad082cd0893a25ab5140a","author":{"email":"a6066a030a600eca8738f6d597ace912fc74e459@wp.pl","name":"wszarmach"},"message":"jas-83 Complete specification","distinct":false,"url":"https://api.github.com/repos/krico/jas/commits/7ad7fa31bafceb692bfad082cd0893a25ab5140a"},{"sha":"6d5a4ab572693869e6ed99d95e0016c51bbb2082","author":{"email":"a6066a030a600eca8738f6d597ace912fc74e459@wp.pl","name":"wszarmach"},"message":"Merge pull request #97 from krico/jas-83\n\njas-83 Complete specification","distinct":false,"url":"https://api.github.com/repos/krico/jas/commits/6d5a4ab572693869e6ed99d95e0016c51bbb2082"},{"sha":"904f8b941ac5bfb140ebb52cb7e990955af60252","author":{"email":"a6066a030a600eca8738f6d597ace912fc74e459@wp.pl","name":"wszarmach"},"message":"fixes jas-93 Google and Facebook sign up have wrong symbols","distinct":false,"url":"https://api.github.com/repos/krico/jas/commits/904f8b941ac5bfb140ebb52cb7e990955af60252"},{"sha":"3cc7fce7bc815199132b04070fac7abf133e2a85","author":{"email":"a6066a030a600eca8738f6d597ace912fc74e459@wp.pl","name":"wszarmach"},"message":"Merge pull request #98 from krico/jas-93\n\nfixes jas-93 Google and Facebook sign up have wrong symbols","distinct":false,"url":"https://api.github.com/repos/krico/jas/commits/3cc7fce7bc815199132b04070fac7abf133e2a85"},{"sha":"17f2f8288a44307d644e53442aa2af8da4f06ef9","author":{"email":"64b2b6d12bfe4baae7dad3d018f8cbf6b0e7a044@cwa.to","name":"krico"},"message":"Refactored, cleaned up and tested 
api","distinct":true,"url":"https://api.github.com/repos/krico/jas/commits/17f2f8288a44307d644e53442aa2af8da4f06ef9"},{"sha":"afc0c40bd91051010ec51f179370b20a9df659f7","author":{"email":"64b2b6d12bfe4baae7dad3d018f8cbf6b0e7a044@cwa.to","name":"krico"},"message":"fixes #93","distinct":true,"url":"https://api.github.com/repos/krico/jas/commits/afc0c40bd91051010ec51f179370b20a9df659f7"},{"sha":"6e9fc012e2904977605aea893fc6cbb48bd2e958","author":{"email":"64b2b6d12bfe4baae7dad3d018f8cbf6b0e7a044@cwa.to","name":"krico"},"message":"fixes #93","distinct":true,"url":"https://api.github.com/repos/krico/jas/commits/6e9fc012e2904977605aea893fc6cbb48bd2e958"},{"sha":"befe1cef92f320fccdeccc0a695d8662e2a70ada","author":{"email":"64b2b6d12bfe4baae7dad3d018f8cbf6b0e7a044@cwa.to","name":"krico"},"message":"First javascript service (UserLogin) based on the jasify API","distinct":true,"url":"https://api.github.com/repos/krico/jas/commits/befe1cef92f320fccdeccc0a695d8662e2a70ada"},{"sha":"30042e5952af29070eeea08a3191aeedd745431f","author":{"email":"64b2b6d12bfe4baae7dad3d018f8cbf6b0e7a044@cwa.to","name":"krico"},"message":"JasUserLoginTransformer: had to change methods to be based on  UserLogin.id","distinct":true,"url":"https://api.github.com/repos/krico/jas/commits/30042e5952af29070eeea08a3191aeedd745431f"},{"sha":"0e38de2350dce0face64ce29ad79830ecca4ecae","author":{"email":"64b2b6d12bfe4baae7dad3d018f8cbf6b0e7a044@cwa.to","name":"krico"},"message":"UsernameServlet replaced by JasifyEndpoint","distinct":true,"url":"https://api.github.com/repos/krico/jas/commits/0e38de2350dce0face64ce29ad79830ecca4ecae"},{"sha":"d1af5a8f4d5f6c2cf379eeaa61c56a3e9d63af0e","author":{"email":"64b2b6d12bfe4baae7dad3d018f8cbf6b0e7a044@cwa.to","name":"krico"},"message":"UsernameServlet replaced by JasifyEndpoint (forgot js 
tests)","distinct":true,"url":"https://api.github.com/repos/krico/jas/commits/d1af5a8f4d5f6c2cf379eeaa61c56a3e9d63af0e"},{"sha":"04fdbb02d22c599d5697e87668b269113c51f77d","author":{"email":"64b2b6d12bfe4baae7dad3d018f8cbf6b0e7a044@cwa.to","name":"krico"},"message":"ChangePasswordServlet decommed and moved to JasifyEndpoint\n\n**LAST COMMIT OF 2014!!!!**","distinct":true,"url":"https://api.github.com/repos/krico/jas/commits/04fdbb02d22c599d5697e87668b269113c51f77d"},{"sha":"83676e90be82ad7e4401a5f1f7e8fe4eaf9235c3","author":{"email":"64b2b6d12bfe4baae7dad3d018f8cbf6b0e7a044@cwa.to","name":"krico"},"message":"Cannot use `@Named` parameters for password as they show in the URL","distinct":true,"url":"https://api.github.com/repos/krico/jas/commits/83676e90be82ad7e4401a5f1f7e8fe4eaf9235c3"},{"sha":"638d40f314d059beee89b841684d816f10973bff","author":{"email":"64b2b6d12bfe4baae7dad3d018f8cbf6b0e7a044@cwa.to","name":"krico"},"message":"Moved changePassword to auth","distinct":true,"url":"https://api.github.com/repos/krico/jas/commits/638d40f314d059beee89b841684d816f10973bff"},{"sha":"3dea0fdecaef71683ba7398586de15704f2803c6","author":{"email":"64b2b6d12bfe4baae7dad3d018f8cbf6b0e7a044@cwa.to","name":"krico"},"message":"LogoutServlet replaced with API","distinct":true,"url":"https://api.github.com/repos/krico/jas/commits/3dea0fdecaef71683ba7398586de15704f2803c6"},{"sha":"08bf4359f7d54b6a488c650b08fe8f31a8e1703a","author":{"email":"64b2b6d12bfe4baae7dad3d018f8cbf6b0e7a044@cwa.to","name":"krico"},"message":"Merge branch 'jas-95' of github.com:krico/jas into jas-95","distinct":true,"url":"https://api.github.com/repos/krico/jas/commits/08bf4359f7d54b6a488c650b08fe8f31a8e1703a"}]},"public":true,"created_at":"2015-01-01T01:01:02Z"}
{"id":"2489396363","type":"PushEvent","actor":{"id":2539292,"login":"wmfgerrit","gravatar_id":"","url":"https://api.github.com/users/wmfgerrit","avatar_url":"https://avatars.githubusercontent.com/u/2539292?"},"repo":{"id":6495082,"name":"wikimedia/mediawiki-extensions","url":"https://api.github.com/repos/wikimedia/mediawiki-extensions"},"payload":{"push_id":536752453,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"88b2fc95cfa3af5741e02f01e950b1f7c16cdfe8","before":"c5cc7199b6ff16671222f91c173945875911bc32","commits":[{"sha":"88b2fc95cfa3af5741e02f01e950b1f7c16cdfe8","author":{"email":"61a1c7c885f4fc173424af2875d459c32bdc4fee@gerrit.wikimedia.org","name":"jenkins-bot"},"message":"Updated mediawiki/extensions\nProject: mediawiki/extensions/WikimediaMessages  61ec5c645adae968e353a778c4f7e82a86ad3468\n\nAdd missing wikibase-sitelinks-sitename-wikidatawiki message\n\nChange-Id: I1edd3a55f4c8240a2317828adcb9eedccbe904f4","distinct":true,"url":"https://api.github.com/repos/wikimedia/mediawiki-extensions/commits/88b2fc95cfa3af5741e02f01e950b1f7c16cdfe8"}]},"public":true,"created_at":"2015-01-01T01:01:02Z","org":{"id":56668,"login":"wikimedia","gravatar_id":"","url":"https://api.github.com/orgs/wikimedia","avatar_url":"https://avatars.githubusercontent.com/u/56668?"}}
{"id":"2489396366","type":"IssueCommentEvent","actor":{"id":134455,"login":"whit537","gravatar_id":"","url":"https://api.github.com/users/whit537","avatar_url":"https://avatars.githubusercontent.com/u/134455?"},"repo":{"id":16488998,"name":"gratipay/inside.gratipay.com","url":"https://api.github.com/repos/gratipay/inside.gratipay.com"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/gratipay/inside.gratipay.com/issues/86","labels_url":"https://api.github.com/repos/gratipay/inside.gratipay.com/issues/86/labels{/name}","comments_url":"https://api.github.com/repos/gratipay/inside.gratipay.com/issues/86/comments","events_url":"https://api.github.com/repos/gratipay/inside.gratipay.com/issues/86/events","html_url":"https://github.com/gratipay/inside.gratipay.com/issues/86","id":42198005,"number":86,"title":"RSVP List","user":{"login":"clone1018","id":226638,"avatar_url":"https://avatars.githubusercontent.com/u/226638?v=3","gravatar_id":"","url":"https://api.github.com/users/clone1018","html_url":"https://github.com/clone1018","followers_url":"https://api.github.com/users/clone1018/followers","following_url":"https://api.github.com/users/clone1018/following{/other_user}","gists_url":"https://api.github.com/users/clone1018/gists{/gist_id}","starred_url":"https://api.github.com/users/clone1018/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/clone1018/subscriptions","organizations_url":"https://api.github.com/users/clone1018/orgs","repos_url":"https://api.github.com/users/clone1018/repos","events_url":"https://api.github.com/users/clone1018/events{/privacy}","received_events_url":"https://api.github.com/users/clone1018/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":{"url":"https://api.github.com/repos/gratipay/inside.gratipay.com/milestones/2","labels_url":"https://api.github.com/repos/gratipay/inside.gratipay.com/milestones/2/labels","id":782050,"num
ber":2,"title":"Gratipay Retreat 2015","description":"This is an encompassing milestone for planning the Gratipay Retreat. ","creator":{"login":"clone1018","id":226638,"avatar_url":"https://avatars.githubusercontent.com/u/226638?v=3","gravatar_id":"","url":"https://api.github.com/users/clone1018","html_url":"https://github.com/clone1018","followers_url":"https://api.github.com/users/clone1018/followers","following_url":"https://api.github.com/users/clone1018/following{/other_user}","gists_url":"https://api.github.com/users/clone1018/gists{/gist_id}","starred_url":"https://api.github.com/users/clone1018/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/clone1018/subscriptions","organizations_url":"https://api.github.com/users/clone1018/orgs","repos_url":"https://api.github.com/users/clone1018/repos","events_url":"https://api.github.com/users/clone1018/events{/privacy}","received_events_url":"https://api.github.com/users/clone1018/received_events","type":"User","site_admin":false},"open_issues":2,"closed_issues":1,"state":"open","created_at":"2014-09-08T13:35:41Z","updated_at":"2015-01-01T00:49:37Z","due_on":"2015-01-02T08:00:00Z","closed_at":null},"comments":36,"created_at":"2014-09-08T13:52:30Z","updated_at":"2015-01-01T01:01:02Z","closed_at":null,"body":"## What?\r\n\r\nThe purpose of the Gratipay company retreat is to strategize about the year ahead, sprint on Gratipay and related projects, and to continue to build meaningful relationships.\r\n\r\n## When?\r\n\r\n![countdown!](http://secondapps.com/countdown/t1420236000z1.png)\r\n(Due to GitHub's image caching this may be out of date)\r\n\r\nStarts: Friday January 2, 2014 at 5:00pm\r\nEnds: Monday, January 5, 2014 at 12:00pm\r\n\r\n## Where?\r\n\r\n716 Park Road, Ambridge, PA 15003\r\n\r\n## Who?\r\n### Yes: 1\r\n1 @clone1018\r\n1 @seanlinsley \r\n1 @whit537 \r\n1 @rummik \r\n1 @colindean \r\n1 @kaguillera \r\n\r\n### Maybe: 0\r\n\r\n### No: 1\r\n1 @chrisdev\r\n1 
@patcon"},"comment":{"url":"https://api.github.com/repos/gratipay/inside.gratipay.com/issues/comments/68477232","html_url":"https://github.com/gratipay/inside.gratipay.com/issues/86#issuecomment-68477232","issue_url":"https://api.github.com/repos/gratipay/inside.gratipay.com/issues/86","id":68477232,"user":{"login":"whit537","id":134455,"avatar_url":"https://avatars.githubusercontent.com/u/134455?v=3","gravatar_id":"","url":"https://api.github.com/users/whit537","html_url":"https://github.com/whit537","followers_url":"https://api.github.com/users/whit537/followers","following_url":"https://api.github.com/users/whit537/following{/other_user}","gists_url":"https://api.github.com/users/whit537/gists{/gist_id}","starred_url":"https://api.github.com/users/whit537/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/whit537/subscriptions","organizations_url":"https://api.github.com/users/whit537/orgs","repos_url":"https://api.github.com/users/whit537/repos","events_url":"https://api.github.com/users/whit537/events{/privacy}","received_events_url":"https://api.github.com/users/whit537/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:01:02Z","updated_at":"2015-01-01T01:01:02Z","body":"Heard from @kaguillera in private email, sounds like he's planning to make it!"}},"public":true,"created_at":"2015-01-01T01:01:02Z","org":{"id":1744073,"login":"gratipay","gravatar_id":"","url":"https://api.github.com/orgs/gratipay","avatar_url":"https://avatars.githubusercontent.com/u/1744073?"}}
{"id":"2489396374","type":"ForkEvent","actor":{"id":1291511,"login":"aamedina","gravatar_id":"","url":"https://api.github.com/users/aamedina","avatar_url":"https://avatars.githubusercontent.com/u/1291511?"},"repo":{"id":10082287,"name":"clojure/core.async","url":"https://api.github.com/repos/clojure/core.async"},"payload":{"forkee":{"id":28678224,"name":"core.async","full_name":"aamedina/core.async","owner":{"login":"aamedina","id":1291511,"avatar_url":"https://avatars.githubusercontent.com/u/1291511?v=3","gravatar_id":"","url":"https://api.github.com/users/aamedina","html_url":"https://github.com/aamedina","followers_url":"https://api.github.com/users/aamedina/followers","following_url":"https://api.github.com/users/aamedina/following{/other_user}","gists_url":"https://api.github.com/users/aamedina/gists{/gist_id}","starred_url":"https://api.github.com/users/aamedina/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/aamedina/subscriptions","organizations_url":"https://api.github.com/users/aamedina/orgs","repos_url":"https://api.github.com/users/aamedina/repos","events_url":"https://api.github.com/users/aamedina/events{/privacy}","received_events_url":"https://api.github.com/users/aamedina/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/aamedina/core.async","description":"Facilities for async programming and communication in 
Clojure","fork":true,"url":"https://api.github.com/repos/aamedina/core.async","forks_url":"https://api.github.com/repos/aamedina/core.async/forks","keys_url":"https://api.github.com/repos/aamedina/core.async/keys{/key_id}","collaborators_url":"https://api.github.com/repos/aamedina/core.async/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/aamedina/core.async/teams","hooks_url":"https://api.github.com/repos/aamedina/core.async/hooks","issue_events_url":"https://api.github.com/repos/aamedina/core.async/issues/events{/number}","events_url":"https://api.github.com/repos/aamedina/core.async/events","assignees_url":"https://api.github.com/repos/aamedina/core.async/assignees{/user}","branches_url":"https://api.github.com/repos/aamedina/core.async/branches{/branch}","tags_url":"https://api.github.com/repos/aamedina/core.async/tags","blobs_url":"https://api.github.com/repos/aamedina/core.async/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/aamedina/core.async/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/aamedina/core.async/git/refs{/sha}","trees_url":"https://api.github.com/repos/aamedina/core.async/git/trees{/sha}","statuses_url":"https://api.github.com/repos/aamedina/core.async/statuses/{sha}","languages_url":"https://api.github.com/repos/aamedina/core.async/languages","stargazers_url":"https://api.github.com/repos/aamedina/core.async/stargazers","contributors_url":"https://api.github.com/repos/aamedina/core.async/contributors","subscribers_url":"https://api.github.com/repos/aamedina/core.async/subscribers","subscription_url":"https://api.github.com/repos/aamedina/core.async/subscription","commits_url":"https://api.github.com/repos/aamedina/core.async/commits{/sha}","git_commits_url":"https://api.github.com/repos/aamedina/core.async/git/commits{/sha}","comments_url":"https://api.github.com/repos/aamedina/core.async/comments{/number}","issue_comment_url":"https://api.github.com/repos/aamedina/core.async/issues/comments/
{number}","contents_url":"https://api.github.com/repos/aamedina/core.async/contents/{+path}","compare_url":"https://api.github.com/repos/aamedina/core.async/compare/{base}...{head}","merges_url":"https://api.github.com/repos/aamedina/core.async/merges","archive_url":"https://api.github.com/repos/aamedina/core.async/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/aamedina/core.async/downloads","issues_url":"https://api.github.com/repos/aamedina/core.async/issues{/number}","pulls_url":"https://api.github.com/repos/aamedina/core.async/pulls{/number}","milestones_url":"https://api.github.com/repos/aamedina/core.async/milestones{/number}","notifications_url":"https://api.github.com/repos/aamedina/core.async/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/aamedina/core.async/labels{/name}","releases_url":"https://api.github.com/repos/aamedina/core.async/releases{/id}","created_at":"2015-01-01T01:01:04Z","updated_at":"2014-12-29T21:26:26Z","pushed_at":"2014-10-15T00:42:26Z","git_url":"git://github.com/aamedina/core.async.git","ssh_url":"git@github.com:aamedina/core.async.git","clone_url":"https://github.com/aamedina/core.async.git","svn_url":"https://github.com/aamedina/core.async","homepage":null,"size":2570,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:01:04Z","org":{"id":317875,"login":"clojure","gravatar_id":"","url":"https://api.github.com/orgs/clojure","avatar_url":"https://avatars.githubusercontent.com/u/317875?"}}
{"id":"2489396375","type":"IssueCommentEvent","actor":{"id":2829600,"login":"GrahamCampbell","gravatar_id":"","url":"https://api.github.com/users/GrahamCampbell","avatar_url":"https://avatars.githubusercontent.com/u/2829600?"},"repo":{"id":26730195,"name":"cachethq/Cachet","url":"https://api.github.com/repos/cachethq/Cachet"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/cachethq/Cachet/issues/173","labels_url":"https://api.github.com/repos/cachethq/Cachet/issues/173/labels{/name}","comments_url":"https://api.github.com/repos/cachethq/Cachet/issues/173/comments","events_url":"https://api.github.com/repos/cachethq/Cachet/issues/173/events","html_url":"https://github.com/cachethq/Cachet/issues/173","id":53210024,"number":173,"title":"Bug: Forms let you submit multiple times","user":{"login":"Jamesking56","id":253237,"avatar_url":"https://avatars.githubusercontent.com/u/253237?v=3","gravatar_id":"","url":"https://api.github.com/users/Jamesking56","html_url":"https://github.com/Jamesking56","followers_url":"https://api.github.com/users/Jamesking56/followers","following_url":"https://api.github.com/users/Jamesking56/following{/other_user}","gists_url":"https://api.github.com/users/Jamesking56/gists{/gist_id}","starred_url":"https://api.github.com/users/Jamesking56/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Jamesking56/subscriptions","organizations_url":"https://api.github.com/users/Jamesking56/orgs","repos_url":"https://api.github.com/users/Jamesking56/repos","events_url":"https://api.github.com/users/Jamesking56/events{/privacy}","received_events_url":"https://api.github.com/users/Jamesking56/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":3,"created_at":"2015-01-01T00:52:06Z","updated_at":"2015-01-01T01:01:04Z","closed_at":null,"body":"When adding a new incident, I noticed a weird bug.\r\n\r\nIf you fill in the form as 
normal, then click the submit button twice really quickly, it'll create __TWO__ identical new incidents!\r\n\r\nThis could be a bit annoying, a simple fix is using a bit of JS that on submit, disables the submit button so that once clicked, it cannot be clicked again."},"comment":{"url":"https://api.github.com/repos/cachethq/Cachet/issues/comments/68477233","html_url":"https://github.com/cachethq/Cachet/issues/173#issuecomment-68477233","issue_url":"https://api.github.com/repos/cachethq/Cachet/issues/173","id":68477233,"user":{"login":"GrahamCampbell","id":2829600,"avatar_url":"https://avatars.githubusercontent.com/u/2829600?v=3","gravatar_id":"","url":"https://api.github.com/users/GrahamCampbell","html_url":"https://github.com/GrahamCampbell","followers_url":"https://api.github.com/users/GrahamCampbell/followers","following_url":"https://api.github.com/users/GrahamCampbell/following{/other_user}","gists_url":"https://api.github.com/users/GrahamCampbell/gists{/gist_id}","starred_url":"https://api.github.com/users/GrahamCampbell/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/GrahamCampbell/subscriptions","organizations_url":"https://api.github.com/users/GrahamCampbell/orgs","repos_url":"https://api.github.com/users/GrahamCampbell/repos","events_url":"https://api.github.com/users/GrahamCampbell/events{/privacy}","received_events_url":"https://api.github.com/users/GrahamCampbell/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:01:04Z","updated_at":"2015-01-01T01:01:04Z","body":"Provide a unique code as a hidden field that invalides once submitted."}},"public":true,"created_at":"2015-01-01T01:01:04Z","org":{"id":9951502,"login":"cachethq","gravatar_id":"","url":"https://api.github.com/orgs/cachethq","avatar_url":"https://avatars.githubusercontent.com/u/9951502?"}}
{"id":"2489396376","type":"PushEvent","actor":{"id":876467,"login":"flasheater","gravatar_id":"","url":"https://api.github.com/users/flasheater","avatar_url":"https://avatars.githubusercontent.com/u/876467?"},"repo":{"id":28678036,"name":"flasheater/fresh","url":"https://api.github.com/repos/flasheater/fresh"},"payload":{"push_id":536752458,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"36b46027ec5e7e97db30e05215d0bec5eeb0d138","before":"a38d020b7c78470cd59382245933e0ef62db5712","commits":[{"sha":"c0a0b02fe479a282199fbaec6e8530ad6c48379a","author":{"email":"51e5422d9fa86e2bc865774c76fbbdc9939f4d14@gmail.com","name":"Oliver Jan Krylow"},"message":"Inroduced variable FRESH_REPO to install.sh so that forks of fresh can use this script. Furthermore, begun adding fish\nsupport.","distinct":true,"url":"https://api.github.com/repos/flasheater/fresh/commits/c0a0b02fe479a282199fbaec6e8530ad6c48379a"},{"sha":"36b46027ec5e7e97db30e05215d0bec5eeb0d138","author":{"email":"51e5422d9fa86e2bc865774c76fbbdc9939f4d14@gmail.com","name":"Oliver Jan Krylow"},"message":"Push to repo to test vagrant support.","distinct":true,"url":"https://api.github.com/repos/flasheater/fresh/commits/36b46027ec5e7e97db30e05215d0bec5eeb0d138"}]},"public":true,"created_at":"2015-01-01T01:01:04Z"}
{"id":"2489396379","type":"PushEvent","actor":{"id":4809376,"login":"guavuslabs-builder","gravatar_id":"","url":"https://api.github.com/users/guavuslabs-builder","avatar_url":"https://avatars.githubusercontent.com/u/4809376?"},"repo":{"id":17457530,"name":"Guavus/spark","url":"https://api.github.com/repos/Guavus/spark"},"payload":{"push_id":536752459,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"4bb12488d56ea651c56d9688996b464b99095582","before":"fe6efacc0b865e9e827a1565877077000e63976e","commits":[{"sha":"4bb12488d56ea651c56d9688996b464b99095582","author":{"email":"291c18f3fb7528c712d9098b0e50a515ea0b91d5@cloudera.com","name":"Sean Owen"},"message":"SPARK-2757 [BUILD] [STREAMING] Add Mima test for Spark Sink after 1.10 is released\n\nRe-enable MiMa for Streaming Flume Sink module, now that 1.1.0 is released, per the JIRA TO-DO. That's pretty much all there is to this.\n\nAuthor: Sean Owen <sowen@cloudera.com>\n\nCloses #3842 from srowen/SPARK-2757 and squashes the following commits:\n\n50ff80e [Sean Owen] Exclude apparent false positive turned up by re-enabling MiMa checks for Streaming Flume Sink\n0e5ba5c [Sean Owen] Re-enable MiMa for Streaming Flume Sink module","distinct":true,"url":"https://api.github.com/repos/Guavus/spark/commits/4bb12488d56ea651c56d9688996b464b99095582"}]},"public":true,"created_at":"2015-01-01T01:01:04Z","org":{"id":3741861,"login":"Guavus","gravatar_id":"","url":"https://api.github.com/orgs/Guavus","avatar_url":"https://avatars.githubusercontent.com/u/3741861?"}}
{"id":"2489396385","type":"IssueCommentEvent","actor":{"id":228410,"login":"kitak","gravatar_id":"","url":"https://api.github.com/users/kitak","avatar_url":"https://avatars.githubusercontent.com/u/228410?"},"repo":{"id":11133793,"name":"mamebro/mameblo","url":"https://api.github.com/repos/mamebro/mameblo"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/mamebro/mameblo/issues/249","labels_url":"https://api.github.com/repos/mamebro/mameblo/issues/249/labels{/name}","comments_url":"https://api.github.com/repos/mamebro/mameblo/issues/249/comments","events_url":"https://api.github.com/repos/mamebro/mameblo/issues/249/events","html_url":"https://github.com/mamebro/mameblo/pull/249","id":53185061,"number":249,"title":"!!! あけましておめでとうございます !!!","user":{"login":"shikakun","id":1396953,"avatar_url":"https://avatars.githubusercontent.com/u/1396953?v=3","gravatar_id":"","url":"https://api.github.com/users/shikakun","html_url":"https://github.com/shikakun","followers_url":"https://api.github.com/users/shikakun/followers","following_url":"https://api.github.com/users/shikakun/following{/other_user}","gists_url":"https://api.github.com/users/shikakun/gists{/gist_id}","starred_url":"https://api.github.com/users/shikakun/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/shikakun/subscriptions","organizations_url":"https://api.github.com/users/shikakun/orgs","repos_url":"https://api.github.com/users/shikakun/repos","events_url":"https://api.github.com/users/shikakun/events{/privacy}","received_events_url":"https://api.github.com/users/shikakun/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2014-12-31T14:00:42Z","updated_at":"2015-01-01T01:01:05Z","closed_at":"2014-12-31T15:01:12Z","pull_request":{"url":"https://api.github.com/repos/mamebro/mameblo/pulls/249","html_url":"https://github.com/mamebro/mameblo/pull/249","diff_url":"h
ttps://github.com/mamebro/mameblo/pull/249.diff","patch_url":"https://github.com/mamebro/mameblo/pull/249.patch"},"body":"@mamebro/owners \r\n新年を迎えたのがめでたいので、背景が紅白にチカチカ点滅するようにしました。"},"comment":{"url":"https://api.github.com/repos/mamebro/mameblo/issues/comments/68477234","html_url":"https://github.com/mamebro/mameblo/pull/249#issuecomment-68477234","issue_url":"https://api.github.com/repos/mamebro/mameblo/issues/249","id":68477234,"user":{"login":"kitak","id":228410,"avatar_url":"https://avatars.githubusercontent.com/u/228410?v=3","gravatar_id":"","url":"https://api.github.com/users/kitak","html_url":"https://github.com/kitak","followers_url":"https://api.github.com/users/kitak/followers","following_url":"https://api.github.com/users/kitak/following{/other_user}","gists_url":"https://api.github.com/users/kitak/gists{/gist_id}","starred_url":"https://api.github.com/users/kitak/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/kitak/subscriptions","organizations_url":"https://api.github.com/users/kitak/orgs","repos_url":"https://api.github.com/users/kitak/repos","events_url":"https://api.github.com/users/kitak/events{/privacy}","received_events_url":"https://api.github.com/users/kitak/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:01:05Z","updated_at":"2015-01-01T01:01:05Z","body":"おめでとうございます！ :tada: "}},"public":true,"created_at":"2015-01-01T01:01:06Z","org":{"id":3763231,"login":"mamebro","gravatar_id":"","url":"https://api.github.com/orgs/mamebro","avatar_url":"https://avatars.githubusercontent.com/u/3763231?"}}
{"id":"2489396387","type":"PushEvent","actor":{"id":5869772,"login":"felixonmars-bot","gravatar_id":"","url":"https://api.github.com/users/felixonmars-bot","avatar_url":"https://avatars.githubusercontent.com/u/5869772?"},"repo":{"id":15896070,"name":"felixonmars/packages-mirror","url":"https://api.github.com/repos/felixonmars/packages-mirror"},"payload":{"push_id":536752460,"size":5,"distinct_size":5,"ref":"refs/heads/master","head":"259643a2baa03206b68bee1ab0291f4e5731ba7f","before":"9fe97687a1282a034b2cc8abbe659ed029920bbc","commits":[{"sha":"4a722a9a329fe751f7f1564d888a1167880bb079","author":{"email":"96f164ad4d9b2b0dacf8ebee2bb1eeb3aa69adf1@eb2447ed-0c53-47e4-bac8-5bc4a241df78","name":"eric"},"message":"archrelease: copy trunk to staging-i686\n\ngit-svn-id: file:///srv/repos/svn-packages/svn@228268 eb2447ed-0c53-47e4-bac8-5bc4a241df78","distinct":true,"url":"https://api.github.com/repos/felixonmars/packages-mirror/commits/4a722a9a329fe751f7f1564d888a1167880bb079"},{"sha":"9ecdfd1cbd1543c91db31222a939ec481c99b2f0","author":{"email":"96f164ad4d9b2b0dacf8ebee2bb1eeb3aa69adf1@eb2447ed-0c53-47e4-bac8-5bc4a241df78","name":"eric"},"message":"archrelease: copy trunk to staging-x86_64\n\ngit-svn-id: file:///srv/repos/svn-packages/svn@228269 eb2447ed-0c53-47e4-bac8-5bc4a241df78","distinct":true,"url":"https://api.github.com/repos/felixonmars/packages-mirror/commits/9ecdfd1cbd1543c91db31222a939ec481c99b2f0"},{"sha":"7d83daeb67690660c7b36adb258b907f9ec4004a","author":{"email":"96f164ad4d9b2b0dacf8ebee2bb1eeb3aa69adf1@eb2447ed-0c53-47e4-bac8-5bc4a241df78","name":"eric"},"message":"Add validpgpkeys array\n\ngit-svn-id: file:///srv/repos/svn-packages/svn@228270 
eb2447ed-0c53-47e4-bac8-5bc4a241df78","distinct":true,"url":"https://api.github.com/repos/felixonmars/packages-mirror/commits/7d83daeb67690660c7b36adb258b907f9ec4004a"},{"sha":"a9bd2311944899fdc40407321bf727615834b6cb","author":{"email":"96f164ad4d9b2b0dacf8ebee2bb1eeb3aa69adf1@eb2447ed-0c53-47e4-bac8-5bc4a241df78","name":"eric"},"message":"archrelease: copy trunk to extra-i686\n\ngit-svn-id: file:///srv/repos/svn-packages/svn@228271 eb2447ed-0c53-47e4-bac8-5bc4a241df78","distinct":true,"url":"https://api.github.com/repos/felixonmars/packages-mirror/commits/a9bd2311944899fdc40407321bf727615834b6cb"},{"sha":"259643a2baa03206b68bee1ab0291f4e5731ba7f","author":{"email":"96f164ad4d9b2b0dacf8ebee2bb1eeb3aa69adf1@eb2447ed-0c53-47e4-bac8-5bc4a241df78","name":"eric"},"message":"archrelease: copy trunk to extra-x86_64\n\ngit-svn-id: file:///srv/repos/svn-packages/svn@228272 eb2447ed-0c53-47e4-bac8-5bc4a241df78","distinct":true,"url":"https://api.github.com/repos/felixonmars/packages-mirror/commits/259643a2baa03206b68bee1ab0291f4e5731ba7f"}]},"public":true,"created_at":"2015-01-01T01:01:06Z"}
{"id":"2489396389","type":"PushEvent","actor":{"id":3487531,"login":"jl4282","gravatar_id":"","url":"https://api.github.com/users/jl4282","avatar_url":"https://avatars.githubusercontent.com/u/3487531?"},"repo":{"id":28677679,"name":"jl4282/swirlwebsite","url":"https://api.github.com/repos/jl4282/swirlwebsite"},"payload":{"push_id":536752462,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"bd278f438aba4582c30eb8d42e7b52740b739e5b","before":"78a50b06faa40c0fd632efd2f2f610652052a6c0","commits":[{"sha":"bd278f438aba4582c30eb8d42e7b52740b739e5b","author":{"email":"4068bf12e44880d7eec32c1ab3069b58d1acd33f@gmail.com","name":"jl4282"},"message":"started changing master","distinct":true,"url":"https://api.github.com/repos/jl4282/swirlwebsite/commits/bd278f438aba4582c30eb8d42e7b52740b739e5b"}]},"public":true,"created_at":"2015-01-01T01:01:06Z"}
{"id":"2489396392","type":"PushEvent","actor":{"id":8347069,"login":"williamtwilson","gravatar_id":"","url":"https://api.github.com/users/williamtwilson","avatar_url":"https://avatars.githubusercontent.com/u/8347069?"},"repo":{"id":28171448,"name":"williamtwilson/speedboard-frontend","url":"https://api.github.com/repos/williamtwilson/speedboard-frontend"},"payload":{"push_id":536752463,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"66d5fee55bda2c92031dcb9eb15cf02eeb7ecd90","before":"6138829ffa8274bce05eff607c5acf28fc880399","commits":[{"sha":"66d5fee55bda2c92031dcb9eb15cf02eeb7ecd90","author":{"email":"2ded4b346a572ccf57131801116a3edef4d9c258@gmail.com","name":"William Wilson"},"message":"Fixing again for heroku","distinct":true,"url":"https://api.github.com/repos/williamtwilson/speedboard-frontend/commits/66d5fee55bda2c92031dcb9eb15cf02eeb7ecd90"}]},"public":true,"created_at":"2015-01-01T01:01:06Z"}
{"id":"2489396393","type":"PushEvent","actor":{"id":6895040,"login":"codertradergambler","gravatar_id":"","url":"https://api.github.com/users/codertradergambler","avatar_url":"https://avatars.githubusercontent.com/u/6895040?"},"repo":{"id":18620619,"name":"chancecoin/chancecoinj","url":"https://api.github.com/repos/chancecoin/chancecoinj"},"payload":{"push_id":536752465,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d4ec65797e8faf2aac84c02007d2ebeb342babd3","before":"2f4f83b1efbd39bd5a66a9929baa1fcee177851b","commits":[{"sha":"d4ec65797e8faf2aac84c02007d2ebeb342babd3","author":{"email":"0ccf54d51d1a5240ad356feb30dfa4d1749f8844@gmail.com","name":"TraderCoderGambler"},"message":"auto-update balances","distinct":true,"url":"https://api.github.com/repos/chancecoin/chancecoinj/commits/d4ec65797e8faf2aac84c02007d2ebeb342babd3"}]},"public":true,"created_at":"2015-01-01T01:01:06Z"}
{"id":"2489396397","type":"PushEvent","actor":{"id":7336721,"login":"aow1980","gravatar_id":"","url":"https://api.github.com/users/aow1980","avatar_url":"https://avatars.githubusercontent.com/u/7336721?"},"repo":{"id":28112636,"name":"aow1980/frameworks_base","url":"https://api.github.com/repos/aow1980/frameworks_base"},"payload":{"push_id":536752467,"size":1,"distinct_size":1,"ref":"refs/heads/lp5.0","head":"162d74b56f030928c24d1d4cb5033586e9d319db","before":"ee02cebf037cb979511dc12688e99a1492faa47d","commits":[{"sha":"162d74b56f030928c24d1d4cb5033586e9d319db","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"base: fix battery stats wakelock crazyness\n\nUntil someone explains to me why google has killed the\nsince unplug stats for partitial and kernel wakelocks\nchange them from beeing screen off based to unplug based\n\nChange-Id: Id727d5d9e237eecb7e86d7dee3285f18a57f9723","distinct":true,"url":"https://api.github.com/repos/aow1980/frameworks_base/commits/162d74b56f030928c24d1d4cb5033586e9d319db"}]},"public":true,"created_at":"2015-01-01T01:01:07Z"}
{"id":"2489396399","type":"PushEvent","actor":{"id":3890972,"login":"timmmmyboy","gravatar_id":"","url":"https://api.github.com/users/timmmmyboy","avatar_url":"https://avatars.githubusercontent.com/u/3890972?"},"repo":{"id":26382386,"name":"reclaimhosting/federated-wiki","url":"https://api.github.com/repos/reclaimhosting/federated-wiki"},"payload":{"push_id":536752470,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"fdf80ab95eec8733946219b1a172269d3d802042","before":"fef0b8d914b47a72907042e8bdd4b631e331f1c4","commits":[{"sha":"fdf80ab95eec8733946219b1a172269d3d802042","author":{"email":"59bd0a3ff43b32849b319e645d4798d8a5d1e889@reclaimhosting.com","name":"Reclaim Hosting"},"message":"Recent Changes","distinct":true,"url":"https://api.github.com/repos/reclaimhosting/federated-wiki/commits/fdf80ab95eec8733946219b1a172269d3d802042"}]},"public":true,"created_at":"2015-01-01T01:01:07Z","org":{"id":6590468,"login":"reclaimhosting","gravatar_id":"","url":"https://api.github.com/orgs/reclaimhosting","avatar_url":"https://avatars.githubusercontent.com/u/6590468?"}}
{"id":"2489396405","type":"PushEvent","actor":{"id":1779595,"login":"dcbaker","gravatar_id":"","url":"https://api.github.com/users/dcbaker","avatar_url":"https://avatars.githubusercontent.com/u/1779595?"},"repo":{"id":8488437,"name":"dcbaker/piglit","url":"https://api.github.com/repos/dcbaker/piglit"},"payload":{"push_id":536752473,"size":2,"distinct_size":2,"ref":"refs/heads/wip/command-list-only-v5","head":"e81f4b28bf6ad78c7fb05257e77e42fe237a09ed","before":"2400271cda135b8077fd4a83254ef84edd92f6bd","commits":[{"sha":"cf5cf7224385c3c3d086762b5bc1d8f7df031ae7","author":{"email":"c26a678a04c601e0311b0d6006e67eee6ed19a8e@intel.com","name":"Dylan Baker"},"message":"fixup! all.py: Replace some string concatenation with str.format()","distinct":true,"url":"https://api.github.com/repos/dcbaker/piglit/commits/cf5cf7224385c3c3d086762b5bc1d8f7df031ae7"},{"sha":"e81f4b28bf6ad78c7fb05257e77e42fe237a09ed","author":{"email":"c26a678a04c601e0311b0d6006e67eee6ed19a8e@intel.com","name":"Dylan Baker"},"message":"all.py: Convert glean tests to list arguments\n\nThere aren't very many glean tests left, it was trivially easy to change\nthem with a simple vim macro and then one additional change.\n\nSigned-off-by: Dylan Baker <dylanx.c.baker@intel.com>","distinct":true,"url":"https://api.github.com/repos/dcbaker/piglit/commits/e81f4b28bf6ad78c7fb05257e77e42fe237a09ed"}]},"public":true,"created_at":"2015-01-01T01:01:08Z"}
{"id":"2489396406","type":"PushEvent","actor":{"id":41057,"login":"samv","gravatar_id":"","url":"https://api.github.com/users/samv","avatar_url":"https://avatars.githubusercontent.com/u/41057?"},"repo":{"id":16792286,"name":"hearsaycorp/normalize","url":"https://api.github.com/repos/hearsaycorp/normalize"},"payload":{"push_id":536752474,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"2f0df332bf4a1e963296f545802cf7497ac20ff8","before":"f0e473fa4a756b8c3b49a4f945845414f58bf9fb","commits":[{"sha":"2f0df332bf4a1e963296f545802cf7497ac20ff8","author":{"email":"f16bed56189e249fe4ca8ed10a1ecae60e8ceac0@vilain.net","name":"Sam Vilain"},"message":"Implement FieldSelector.delete\n\nAll 4 CRUD operations now supported :)","distinct":true,"url":"https://api.github.com/repos/hearsaycorp/normalize/commits/2f0df332bf4a1e963296f545802cf7497ac20ff8"}]},"public":true,"created_at":"2015-01-01T01:01:08Z","org":{"id":633032,"login":"hearsaycorp","gravatar_id":"","url":"https://api.github.com/orgs/hearsaycorp","avatar_url":"https://avatars.githubusercontent.com/u/633032?"}}
{"id":"2489396407","type":"WatchEvent","actor":{"id":5084309,"login":"Jorys-Paulin","gravatar_id":"","url":"https://api.github.com/users/Jorys-Paulin","avatar_url":"https://avatars.githubusercontent.com/u/5084309?"},"repo":{"id":28086817,"name":"Learn-Dev/Learn-Dev-Theme---Dashboard-partie-1","url":"https://api.github.com/repos/Learn-Dev/Learn-Dev-Theme---Dashboard-partie-1"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:01:08Z"}
{"id":"2489396408","type":"PushEvent","actor":{"id":9000293,"login":"diianita","gravatar_id":"","url":"https://api.github.com/users/diianita","avatar_url":"https://avatars.githubusercontent.com/u/9000293?"},"repo":{"id":27146993,"name":"cArLiiToX/dtstore","url":"https://api.github.com/repos/cArLiiToX/dtstore"},"payload":{"push_id":536752475,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"57150fe4e8e3dbd8707e8bec5efdcbd306696812","before":"080810e75308aaace0986bf99858aee08f79fe60","commits":[{"sha":"57150fe4e8e3dbd8707e8bec5efdcbd306696812","author":{"email":"ab5e2bca84933118bbc9d48ffaccce3bac4eeb64@xng.bz","name":"cArLiiToX"},"message":"correciones","distinct":true,"url":"https://api.github.com/repos/cArLiiToX/dtstore/commits/57150fe4e8e3dbd8707e8bec5efdcbd306696812"}]},"public":true,"created_at":"2015-01-01T01:01:09Z"}
{"id":"2489396409","type":"CreateEvent","actor":{"id":57162,"login":"wbyoung","gravatar_id":"","url":"https://api.github.com/users/wbyoung","avatar_url":"https://avatars.githubusercontent.com/u/57162?"},"repo":{"id":25276289,"name":"wbyoung/azul","url":"https://api.github.com/repos/wbyoung/azul"},"payload":{"ref":"travis-docs","ref_type":"branch","master_branch":"master","description":"Elegant Node.js ORM","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:01:09Z"}
{"id":"2489396413","type":"WatchEvent","actor":{"id":1015032,"login":"miketahani","gravatar_id":"","url":"https://api.github.com/users/miketahani","avatar_url":"https://avatars.githubusercontent.com/u/1015032?"},"repo":{"id":3253898,"name":"greggman/webgl-fundamentals","url":"https://api.github.com/repos/greggman/webgl-fundamentals"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:01:11Z"}
{"id":"2489396414","type":"PushEvent","actor":{"id":1514700,"login":"YoshikiShibata","gravatar_id":"","url":"https://api.github.com/users/YoshikiShibata","avatar_url":"https://avatars.githubusercontent.com/u/1514700?"},"repo":{"id":23509495,"name":"YoshikiShibata/js8ri","url":"https://api.github.com/repos/YoshikiShibata/js8ri"},"payload":{"push_id":536752478,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b17a952587b5f8accbf2451df75b97812402210f","before":"201f71f7ce532cf0ee666466ffa97d7003402328","commits":[{"sha":"b17a952587b5f8accbf2451df75b97812402210f","author":{"email":"fc4b8596386bb28ae34eb13b0bb8db8e7157ad6c@ca2.so-net.ne.jp","name":"Yoshiki Shibata"},"message":"ex07 done","distinct":true,"url":"https://api.github.com/repos/YoshikiShibata/js8ri/commits/b17a952587b5f8accbf2451df75b97812402210f"}]},"public":true,"created_at":"2015-01-01T01:01:11Z"}
{"id":"2489396415","type":"PushEvent","actor":{"id":1380844,"login":"lyricorpse","gravatar_id":"","url":"https://api.github.com/users/lyricorpse","avatar_url":"https://avatars.githubusercontent.com/u/1380844?"},"repo":{"id":28656760,"name":"lyricorpse/PyESG","url":"https://api.github.com/repos/lyricorpse/PyESG"},"payload":{"push_id":536752479,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"6f2430e5a35ddc873ff33e454ffe95d3754aab32","before":"14e8117e011afcadb8066ac8de75976359c7818f","commits":[{"sha":"6f2430e5a35ddc873ff33e454ffe95d3754aab32","author":{"email":"0a7b040fc4054c5d741bd0ad5ddf9a49e6d82d24@gmail.com","name":"Lyricorpse"},"message":"Fix a bug with Quadrangle search","distinct":true,"url":"https://api.github.com/repos/lyricorpse/PyESG/commits/6f2430e5a35ddc873ff33e454ffe95d3754aab32"}]},"public":true,"created_at":"2015-01-01T01:01:11Z"}
{"id":"2489396422","type":"PushEvent","actor":{"id":2287714,"login":"mchen804","gravatar_id":"","url":"https://api.github.com/users/mchen804","avatar_url":"https://avatars.githubusercontent.com/u/2287714?"},"repo":{"id":28678145,"name":"mchen804/LearnToGit","url":"https://api.github.com/repos/mchen804/LearnToGit"},"payload":{"push_id":536752481,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d81f2b2536eac12bec771117976723439102d999","before":"c25d99beb779acd54c083029bb51d94ec9e2bbe4","commits":[{"sha":"d81f2b2536eac12bec771117976723439102d999","author":{"email":"ce78b05c0afb1e03455d157070260213f45d7b80@osu.edu","name":"Michael Chen"},"message":"Create README.md","distinct":true,"url":"https://api.github.com/repos/mchen804/LearnToGit/commits/d81f2b2536eac12bec771117976723439102d999"}]},"public":true,"created_at":"2015-01-01T01:01:11Z"}
{"id":"2489396432","type":"IssueCommentEvent","actor":{"id":238759,"login":"chrisfilo","gravatar_id":"","url":"https://api.github.com/users/chrisfilo","avatar_url":"https://avatars.githubusercontent.com/u/238759?"},"repo":{"id":7963570,"name":"NeuroVault/NeuroVault","url":"https://api.github.com/repos/NeuroVault/NeuroVault"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/NeuroVault/NeuroVault/issues/90","labels_url":"https://api.github.com/repos/NeuroVault/NeuroVault/issues/90/labels{/name}","comments_url":"https://api.github.com/repos/NeuroVault/NeuroVault/issues/90/comments","events_url":"https://api.github.com/repos/NeuroVault/NeuroVault/issues/90/events","html_url":"https://github.com/NeuroVault/NeuroVault/pull/90","id":53209632,"number":90,"title":"Enh/nidm results [final]","user":{"login":"infocortex","id":7991256,"avatar_url":"https://avatars.githubusercontent.com/u/7991256?v=3","gravatar_id":"","url":"https://api.github.com/users/infocortex","html_url":"https://github.com/infocortex","followers_url":"https://api.github.com/users/infocortex/followers","following_url":"https://api.github.com/users/infocortex/following{/other_user}","gists_url":"https://api.github.com/users/infocortex/gists{/gist_id}","starred_url":"https://api.github.com/users/infocortex/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/infocortex/subscriptions","organizations_url":"https://api.github.com/users/infocortex/orgs","repos_url":"https://api.github.com/users/infocortex/repos","events_url":"https://api.github.com/users/infocortex/events{/privacy}","received_events_url":"https://api.github.com/users/infocortex/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2015-01-01T00:29:03Z","updated_at":"2015-01-01T01:01:13Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/NeuroVault/NeuroVault/pulls/90","html_url":"https
://github.com/NeuroVault/NeuroVault/pull/90","diff_url":"https://github.com/NeuroVault/NeuroVault/pull/90.diff","patch_url":"https://github.com/NeuroVault/NeuroVault/pull/90.patch"},"body":"feature complete\r\n\r\nstill todo:\r\n-migration test \r\n-addditional unit test(s)"},"comment":{"url":"https://api.github.com/repos/NeuroVault/NeuroVault/issues/comments/68477237","html_url":"https://github.com/NeuroVault/NeuroVault/pull/90#issuecomment-68477237","issue_url":"https://api.github.com/repos/NeuroVault/NeuroVault/issues/90","id":68477237,"user":{"login":"chrisfilo","id":238759,"avatar_url":"https://avatars.githubusercontent.com/u/238759?v=3","gravatar_id":"","url":"https://api.github.com/users/chrisfilo","html_url":"https://github.com/chrisfilo","followers_url":"https://api.github.com/users/chrisfilo/followers","following_url":"https://api.github.com/users/chrisfilo/following{/other_user}","gists_url":"https://api.github.com/users/chrisfilo/gists{/gist_id}","starred_url":"https://api.github.com/users/chrisfilo/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/chrisfilo/subscriptions","organizations_url":"https://api.github.com/users/chrisfilo/orgs","repos_url":"https://api.github.com/users/chrisfilo/repos","events_url":"https://api.github.com/users/chrisfilo/events{/privacy}","received_events_url":"https://api.github.com/users/chrisfilo/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:01:13Z","updated_at":"2015-01-01T01:01:13Z","body":"Migration went well, test pass. However edit images dialog does not work. Clicking on any of the images does not change anything. Neighter does clicking on the Add a new image button. 
JS console gives the following error:\r\n\r\n\tUncaught TypeError: Cannot read property 'slice' of nullj query-2.1.0.min.js:2"}},"public":true,"created_at":"2015-01-01T01:01:13Z","org":{"id":9168649,"login":"NeuroVault","gravatar_id":"","url":"https://api.github.com/orgs/NeuroVault","avatar_url":"https://avatars.githubusercontent.com/u/9168649?"}}
{"id":"2489396433","type":"PushEvent","actor":{"id":1745861,"login":"topaztee","gravatar_id":"","url":"https://api.github.com/users/topaztee","avatar_url":"https://avatars.githubusercontent.com/u/1745861?"},"repo":{"id":28677407,"name":"topaztee/topaztee.github.io","url":"https://api.github.com/repos/topaztee/topaztee.github.io"},"payload":{"push_id":536752485,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"a66e99dc9be241e6a513acfcc79ac27757a4a5bb","before":"e0ee4ea2c3198a01bf7f11096b6c35a05fa11ae1","commits":[{"sha":"a66e99dc9be241e6a513acfcc79ac27757a4a5bb","author":{"email":"f74c82d708bb42a372674042ebc8a1411fbc9344@192-168-1-2.tpgi.com.au","name":"topaztur@gmail.com"},"message":"Blog update at 2015-01-01 01:01:05","distinct":true,"url":"https://api.github.com/repos/topaztee/topaztee.github.io/commits/a66e99dc9be241e6a513acfcc79ac27757a4a5bb"}]},"public":true,"created_at":"2015-01-01T01:01:13Z"}
{"id":"2489396443","type":"PushEvent","actor":{"id":5863537,"login":"jimv39","gravatar_id":"","url":"https://api.github.com/users/jimv39","avatar_url":"https://avatars.githubusercontent.com/u/5863537?"},"repo":{"id":17339971,"name":"jimv39/qvcsos","url":"https://api.github.com/repos/jimv39/qvcsos"},"payload":{"push_id":536752489,"size":3,"distinct_size":3,"ref":"refs/heads/develop","head":"96ae99b1cb7c178ee7951befbe8bd9a9df12bda5","before":"ab423d835e445dcf8c3073753ae1b964e386dfdd","commits":[{"sha":"f673e524b862f0ee3ecc023d4f668282f07dd8ce","author":{"email":"9be38403eb58d3adbe34866aa881dcd238ac5d2e@comcast.net","name":"Jim Voris"},"message":"First pass at adding jmockit unit test to OperationGet. It really only provides code coverage, but it's better than nothing.","distinct":true,"url":"https://api.github.com/repos/jimv39/qvcsos/commits/f673e524b862f0ee3ecc023d4f668282f07dd8ce"},{"sha":"7b2e46db58499c257cb0d1740af53807c87d2b92","author":{"email":"9be38403eb58d3adbe34866aa881dcd238ac5d2e@comcast.net","name":"Jim Voris"},"message":"Fix some checkstyle problems.","distinct":true,"url":"https://api.github.com/repos/jimv39/qvcsos/commits/7b2e46db58499c257cb0d1740af53807c87d2b92"},{"sha":"96ae99b1cb7c178ee7951befbe8bd9a9df12bda5","author":{"email":"9be38403eb58d3adbe34866aa881dcd238ac5d2e@comcast.net","name":"Jim Voris"},"message":"Remove dead/commented-out plugin.","distinct":true,"url":"https://api.github.com/repos/jimv39/qvcsos/commits/96ae99b1cb7c178ee7951befbe8bd9a9df12bda5"}]},"public":true,"created_at":"2015-01-01T01:01:14Z"}
{"id":"2489396456","type":"WatchEvent","actor":{"id":5565906,"login":"WRuman","gravatar_id":"","url":"https://api.github.com/users/WRuman","avatar_url":"https://avatars.githubusercontent.com/u/5565906?"},"repo":{"id":14579010,"name":"suffick/Tearable-Cloth","url":"https://api.github.com/repos/suffick/Tearable-Cloth"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:01:16Z"}
{"id":"2489396458","type":"PushEvent","actor":{"id":6955349,"login":"rachidkada","gravatar_id":"","url":"https://api.github.com/users/rachidkada","avatar_url":"https://avatars.githubusercontent.com/u/6955349?"},"repo":{"id":27822066,"name":"ATS001/NEWCOMPTA","url":"https://api.github.com/repos/ATS001/NEWCOMPTA"},"payload":{"push_id":536752490,"size":1,"distinct_size":0,"ref":"refs/heads/gestion_depense_last","head":"8ed92a796d203fdc84e418d3f9ca725cccd0fec4","before":"890201ee3b26f2e7c383a1c8f4206ebf0015c3ee","commits":[{"sha":"8ed92a796d203fdc84e418d3f9ca725cccd0fec4","author":{"email":"af045d9e68f1279af589eff3a2682851ea4e8686@atelsolution.com","name":"id-rach"},"message":"fournisseur\n\nfournisseur","distinct":false,"url":"https://api.github.com/repos/ATS001/NEWCOMPTA/commits/8ed92a796d203fdc84e418d3f9ca725cccd0fec4"}]},"public":true,"created_at":"2015-01-01T01:01:16Z","org":{"id":8378855,"login":"ATS001","gravatar_id":"","url":"https://api.github.com/orgs/ATS001","avatar_url":"https://avatars.githubusercontent.com/u/8378855?"}}
{"id":"2489396459","type":"PushEvent","actor":{"id":280212,"login":"KenanSulayman","gravatar_id":"","url":"https://api.github.com/users/KenanSulayman","avatar_url":"https://avatars.githubusercontent.com/u/280212?"},"repo":{"id":21481110,"name":"KenanSulayman/heartbeat","url":"https://api.github.com/repos/KenanSulayman/heartbeat"},"payload":{"push_id":536752491,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f5fd8c9b5d99ba2f521c56658163b69c29eb1027","before":"9ceb5cdffe02cef186b379026ce6c2dc0d74b3d4","commits":[{"sha":"f5fd8c9b5d99ba2f521c56658163b69c29eb1027","author":{"email":"9176253dfc0bc82671a5e984646605f93319147a@sly.mn","name":"Kenan Sulayman"},"message":"1420074073410\n\nZl5biUHcnwVJiZ03vi7LUj1wLwVyyBgsRxOBQqS03lg=","distinct":true,"url":"https://api.github.com/repos/KenanSulayman/heartbeat/commits/f5fd8c9b5d99ba2f521c56658163b69c29eb1027"}]},"public":true,"created_at":"2015-01-01T01:01:16Z"}
{"id":"2489396460","type":"PushEvent","actor":{"id":2147137,"login":"xkyouchoux","gravatar_id":"","url":"https://api.github.com/users/xkyouchoux","avatar_url":"https://avatars.githubusercontent.com/u/2147137?"},"repo":{"id":28676642,"name":"xkyouchoux/dh","url":"https://api.github.com/repos/xkyouchoux/dh"},"payload":{"push_id":536752493,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b6d6c9c6e52c6a414626a870ee6179d8e3bdd437","before":"bcf6c520af9d96ed8d9c978d723b94191b4c7828","commits":[{"sha":"b6d6c9c6e52c6a414626a870ee6179d8e3bdd437","author":{"email":"fefcf3693656ff0c8f9b06efb68deae5a2d3a81a@hotmail.com","name":"xkyouchoux"},"message":"A General generated set","distinct":true,"url":"https://api.github.com/repos/xkyouchoux/dh/commits/b6d6c9c6e52c6a414626a870ee6179d8e3bdd437"}]},"public":true,"created_at":"2015-01-01T01:01:16Z"}
{"id":"2489396461","type":"PushEvent","actor":{"id":7751315,"login":"ApocalypticOctopus","gravatar_id":"","url":"https://api.github.com/users/ApocalypticOctopus","avatar_url":"https://avatars.githubusercontent.com/u/7751315?"},"repo":{"id":27552091,"name":"ApocalypticOctopus/Epic.Numbers","url":"https://api.github.com/repos/ApocalypticOctopus/Epic.Numbers"},"payload":{"push_id":536752492,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f8af8686554e318964193f2da13f486aabaeaf99","before":"dff9cb7b8c26a82657601a5365b5b92fd3317902","commits":[{"sha":"f8af8686554e318964193f2da13f486aabaeaf99","author":{"email":"60e80a2f6e90298c62ee9e963a3f42492975e450@gmail.com","name":"Apocalyptic Octopus"},"message":"Add a few basic generic number algorithms","distinct":true,"url":"https://api.github.com/repos/ApocalypticOctopus/Epic.Numbers/commits/f8af8686554e318964193f2da13f486aabaeaf99"}]},"public":true,"created_at":"2015-01-01T01:01:16Z"}
{"id":"2489396468","type":"PushEvent","actor":{"id":95203,"login":"bhaisaab","gravatar_id":"","url":"https://api.github.com/users/bhaisaab","avatar_url":"https://avatars.githubusercontent.com/u/95203?"},"repo":{"id":23222011,"name":"shapeblue/cloudstack","url":"https://api.github.com/repos/shapeblue/cloudstack"},"payload":{"push_id":536752498,"size":1,"distinct_size":1,"ref":"refs/heads/4.5","head":"85e88e9cbcba913fd9848e1daa42e21259c02a96","before":"94237a4c5b08356bb0a4950ce9fd7ec78f2168f9","commits":[{"sha":"85e88e9cbcba913fd9848e1daa42e21259c02a96","author":{"email":"908e82d1c152b24fc5de9371836b7f39094e3948@apache.org","name":"Jessica Wang"},"message":"CLOUDSTACK-8139: UI > create compute offering > server-side only supports one single host tag instead of multiple host tags. So, change UI to take in only one single host tag instead of multiple host tags in create compute dialog.","distinct":true,"url":"https://api.github.com/repos/shapeblue/cloudstack/commits/85e88e9cbcba913fd9848e1daa42e21259c02a96"}]},"public":true,"created_at":"2015-01-01T01:01:17Z","org":{"id":6001764,"login":"shapeblue","gravatar_id":"","url":"https://api.github.com/orgs/shapeblue","avatar_url":"https://avatars.githubusercontent.com/u/6001764?"}}
{"id":"2489396482","type":"ForkEvent","actor":{"id":31330,"login":"dwmorgan","gravatar_id":"","url":"https://api.github.com/users/dwmorgan","avatar_url":"https://avatars.githubusercontent.com/u/31330?"},"repo":{"id":289499,"name":"pezra/parallel-each","url":"https://api.github.com/repos/pezra/parallel-each"},"payload":{"forkee":{"id":28678226,"name":"parallel-each","full_name":"dwmorgan/parallel-each","owner":{"login":"dwmorgan","id":31330,"avatar_url":"https://avatars.githubusercontent.com/u/31330?v=3","gravatar_id":"","url":"https://api.github.com/users/dwmorgan","html_url":"https://github.com/dwmorgan","followers_url":"https://api.github.com/users/dwmorgan/followers","following_url":"https://api.github.com/users/dwmorgan/following{/other_user}","gists_url":"https://api.github.com/users/dwmorgan/gists{/gist_id}","starred_url":"https://api.github.com/users/dwmorgan/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/dwmorgan/subscriptions","organizations_url":"https://api.github.com/users/dwmorgan/orgs","repos_url":"https://api.github.com/users/dwmorgan/repos","events_url":"https://api.github.com/users/dwmorgan/events{/privacy}","received_events_url":"https://api.github.com/users/dwmorgan/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/dwmorgan/parallel-each","description":"A mechanism for concurrently iterating over the items in 
Enumerables","fork":true,"url":"https://api.github.com/repos/dwmorgan/parallel-each","forks_url":"https://api.github.com/repos/dwmorgan/parallel-each/forks","keys_url":"https://api.github.com/repos/dwmorgan/parallel-each/keys{/key_id}","collaborators_url":"https://api.github.com/repos/dwmorgan/parallel-each/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/dwmorgan/parallel-each/teams","hooks_url":"https://api.github.com/repos/dwmorgan/parallel-each/hooks","issue_events_url":"https://api.github.com/repos/dwmorgan/parallel-each/issues/events{/number}","events_url":"https://api.github.com/repos/dwmorgan/parallel-each/events","assignees_url":"https://api.github.com/repos/dwmorgan/parallel-each/assignees{/user}","branches_url":"https://api.github.com/repos/dwmorgan/parallel-each/branches{/branch}","tags_url":"https://api.github.com/repos/dwmorgan/parallel-each/tags","blobs_url":"https://api.github.com/repos/dwmorgan/parallel-each/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/dwmorgan/parallel-each/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/dwmorgan/parallel-each/git/refs{/sha}","trees_url":"https://api.github.com/repos/dwmorgan/parallel-each/git/trees{/sha}","statuses_url":"https://api.github.com/repos/dwmorgan/parallel-each/statuses/{sha}","languages_url":"https://api.github.com/repos/dwmorgan/parallel-each/languages","stargazers_url":"https://api.github.com/repos/dwmorgan/parallel-each/stargazers","contributors_url":"https://api.github.com/repos/dwmorgan/parallel-each/contributors","subscribers_url":"https://api.github.com/repos/dwmorgan/parallel-each/subscribers","subscription_url":"https://api.github.com/repos/dwmorgan/parallel-each/subscription","commits_url":"https://api.github.com/repos/dwmorgan/parallel-each/commits{/sha}","git_commits_url":"https://api.github.com/repos/dwmorgan/parallel-each/git/commits{/sha}","comments_url":"https://api.github.com/repos/dwmorgan/parallel-each/comments{/number}","issue_com
ment_url":"https://api.github.com/repos/dwmorgan/parallel-each/issues/comments/{number}","contents_url":"https://api.github.com/repos/dwmorgan/parallel-each/contents/{+path}","compare_url":"https://api.github.com/repos/dwmorgan/parallel-each/compare/{base}...{head}","merges_url":"https://api.github.com/repos/dwmorgan/parallel-each/merges","archive_url":"https://api.github.com/repos/dwmorgan/parallel-each/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/dwmorgan/parallel-each/downloads","issues_url":"https://api.github.com/repos/dwmorgan/parallel-each/issues{/number}","pulls_url":"https://api.github.com/repos/dwmorgan/parallel-each/pulls{/number}","milestones_url":"https://api.github.com/repos/dwmorgan/parallel-each/milestones{/number}","notifications_url":"https://api.github.com/repos/dwmorgan/parallel-each/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/dwmorgan/parallel-each/labels{/name}","releases_url":"https://api.github.com/repos/dwmorgan/parallel-each/releases{/id}","created_at":"2015-01-01T01:01:18Z","updated_at":"2014-08-09T03:47:03Z","pushed_at":"2009-09-14T23:08:58Z","git_url":"git://github.com/dwmorgan/parallel-each.git","ssh_url":"git@github.com:dwmorgan/parallel-each.git","clone_url":"https://github.com/dwmorgan/parallel-each.git","svn_url":"https://github.com/dwmorgan/parallel-each","homepage":"","size":87,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:01:19Z"}
{"id":"2489396489","type":"ForkEvent","actor":{"id":10361464,"login":"addisonep","gravatar_id":"","url":"https://api.github.com/users/addisonep","avatar_url":"https://avatars.githubusercontent.com/u/10361464?"},"repo":{"id":2293158,"name":"rapid7/metasploit-framework","url":"https://api.github.com/repos/rapid7/metasploit-framework"},"payload":{"forkee":{"id":28678227,"name":"metasploit-framework","full_name":"addisonep/metasploit-framework","owner":{"login":"addisonep","id":10361464,"avatar_url":"https://avatars.githubusercontent.com/u/10361464?v=3","gravatar_id":"","url":"https://api.github.com/users/addisonep","html_url":"https://github.com/addisonep","followers_url":"https://api.github.com/users/addisonep/followers","following_url":"https://api.github.com/users/addisonep/following{/other_user}","gists_url":"https://api.github.com/users/addisonep/gists{/gist_id}","starred_url":"https://api.github.com/users/addisonep/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/addisonep/subscriptions","organizations_url":"https://api.github.com/users/addisonep/orgs","repos_url":"https://api.github.com/users/addisonep/repos","events_url":"https://api.github.com/users/addisonep/events{/privacy}","received_events_url":"https://api.github.com/users/addisonep/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/addisonep/metasploit-framework","description":"Metasploit 
Framework","fork":true,"url":"https://api.github.com/repos/addisonep/metasploit-framework","forks_url":"https://api.github.com/repos/addisonep/metasploit-framework/forks","keys_url":"https://api.github.com/repos/addisonep/metasploit-framework/keys{/key_id}","collaborators_url":"https://api.github.com/repos/addisonep/metasploit-framework/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/addisonep/metasploit-framework/teams","hooks_url":"https://api.github.com/repos/addisonep/metasploit-framework/hooks","issue_events_url":"https://api.github.com/repos/addisonep/metasploit-framework/issues/events{/number}","events_url":"https://api.github.com/repos/addisonep/metasploit-framework/events","assignees_url":"https://api.github.com/repos/addisonep/metasploit-framework/assignees{/user}","branches_url":"https://api.github.com/repos/addisonep/metasploit-framework/branches{/branch}","tags_url":"https://api.github.com/repos/addisonep/metasploit-framework/tags","blobs_url":"https://api.github.com/repos/addisonep/metasploit-framework/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/addisonep/metasploit-framework/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/addisonep/metasploit-framework/git/refs{/sha}","trees_url":"https://api.github.com/repos/addisonep/metasploit-framework/git/trees{/sha}","statuses_url":"https://api.github.com/repos/addisonep/metasploit-framework/statuses/{sha}","languages_url":"https://api.github.com/repos/addisonep/metasploit-framework/languages","stargazers_url":"https://api.github.com/repos/addisonep/metasploit-framework/stargazers","contributors_url":"https://api.github.com/repos/addisonep/metasploit-framework/contributors","subscribers_url":"https://api.github.com/repos/addisonep/metasploit-framework/subscribers","subscription_url":"https://api.github.com/repos/addisonep/metasploit-framework/subscription","commits_url":"https://api.github.com/repos/addisonep/metasploit-framework/commits{/sha}","git_commits_
url":"https://api.github.com/repos/addisonep/metasploit-framework/git/commits{/sha}","comments_url":"https://api.github.com/repos/addisonep/metasploit-framework/comments{/number}","issue_comment_url":"https://api.github.com/repos/addisonep/metasploit-framework/issues/comments/{number}","contents_url":"https://api.github.com/repos/addisonep/metasploit-framework/contents/{+path}","compare_url":"https://api.github.com/repos/addisonep/metasploit-framework/compare/{base}...{head}","merges_url":"https://api.github.com/repos/addisonep/metasploit-framework/merges","archive_url":"https://api.github.com/repos/addisonep/metasploit-framework/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/addisonep/metasploit-framework/downloads","issues_url":"https://api.github.com/repos/addisonep/metasploit-framework/issues{/number}","pulls_url":"https://api.github.com/repos/addisonep/metasploit-framework/pulls{/number}","milestones_url":"https://api.github.com/repos/addisonep/metasploit-framework/milestones{/number}","notifications_url":"https://api.github.com/repos/addisonep/metasploit-framework/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/addisonep/metasploit-framework/labels{/name}","releases_url":"https://api.github.com/repos/addisonep/metasploit-framework/releases{/id}","created_at":"2015-01-01T01:01:19Z","updated_at":"2015-01-01T00:04:48Z","pushed_at":"2015-01-01T00:02:05Z","git_url":"git://github.com/addisonep/metasploit-framework.git","ssh_url":"git@github.com:addisonep/metasploit-framework.git","clone_url":"https://github.com/addisonep/metasploit-framework.git","svn_url":"https://github.com/addisonep/metasploit-framework","homepage":"http://www.metasploit.com/","size":1010071,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master",
"public":true}},"public":true,"created_at":"2015-01-01T01:01:20Z","org":{"id":1013671,"login":"rapid7","gravatar_id":"","url":"https://api.github.com/orgs/rapid7","avatar_url":"https://avatars.githubusercontent.com/u/1013671?"}}
{"id":"2489396501","type":"PushEvent","actor":{"id":1625941,"login":"nocarryr","gravatar_id":"","url":"https://api.github.com/users/nocarryr","avatar_url":"https://avatars.githubusercontent.com/u/1625941?"},"repo":{"id":26180933,"name":"nocarryr/node_mapper","url":"https://api.github.com/repos/nocarryr/node_mapper"},"payload":{"push_id":536752509,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"777997a518ce5e14439a4a91eef156531af3260e","before":"48c138a0ad0b1511492d63e5f1513a4726f831e9","commits":[{"sha":"d058ed5ac475b1287e513e1944ea4cc8276b000a","author":{"email":"1fa2ef4755a9226cb9a0a4840bd89b158ac71391@nomadic-recording.com","name":"nocarryr"},"message":"Squashed 'node_mapper/nomadic_recording_lib/' changes from 95ea390..fad5239\n\nfad5239 add prefs file for eric-ide v6\n1acd9f1 modified layout sizing for embed\n\ngit-subtree-dir: node_mapper/nomadic_recording_lib\ngit-subtree-split: fad5239c8a8ce199abc1e7d11c8d199b719e39df","distinct":true,"url":"https://api.github.com/repos/nocarryr/node_mapper/commits/d058ed5ac475b1287e513e1944ea4cc8276b000a"},{"sha":"777997a518ce5e14439a4a91eef156531af3260e","author":{"email":"1fa2ef4755a9226cb9a0a4840bd89b158ac71391@nomadic-recording.com","name":"nocarryr"},"message":"Merge commit 'd058ed5ac475b1287e513e1944ea4cc8276b000a'","distinct":true,"url":"https://api.github.com/repos/nocarryr/node_mapper/commits/777997a518ce5e14439a4a91eef156531af3260e"}]},"public":true,"created_at":"2015-01-01T01:01:21Z"}
{"id":"2489396503","type":"PushEvent","actor":{"id":6948206,"login":"JamesHutchison","gravatar_id":"","url":"https://api.github.com/users/JamesHutchison","avatar_url":"https://avatars.githubusercontent.com/u/6948206?"},"repo":{"id":24011719,"name":"JamesHutchison/brython","url":"https://api.github.com/repos/JamesHutchison/brython"},"payload":{"push_id":536752511,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"6364b4328ddb8e64ed9164f025196aaceaf830d3","before":"19eb5015b968d8c865423573fcae3afe805f2434","commits":[{"sha":"6364b4328ddb8e64ed9164f025196aaceaf830d3","author":{"email":"3ead6fdcf55e8f3c93103fc571861d43d648edff@microsoft.com","name":"James Hutchison"},"message":"Updated to latest copy of the repo","distinct":true,"url":"https://api.github.com/repos/JamesHutchison/brython/commits/6364b4328ddb8e64ed9164f025196aaceaf830d3"}]},"public":true,"created_at":"2015-01-01T01:01:22Z"}
{"id":"2489396511","type":"PushEvent","actor":{"id":1903079,"login":"krizvi","gravatar_id":"","url":"https://api.github.com/users/krizvi","avatar_url":"https://avatars.githubusercontent.com/u/1903079?"},"repo":{"id":20293030,"name":"VHAINNOVATIONS/Mental-Health-eScreening","url":"https://api.github.com/repos/VHAINNOVATIONS/Mental-Health-eScreening"},"payload":{"push_id":536752514,"size":2,"distinct_size":1,"ref":"refs/heads/resolved","head":"6af479cb61611efc8ce9449c28a3e0eaf6aa9fe0","before":"59f67bcf971fad269926139596d22cd4e1f03e05","commits":[{"sha":"df757ed8ad0c31af27c6099cc0c2d8818cb2ff6b","author":{"email":"e0c3a02e4102d2b5ed70e51bf9a27df65846d12e@gmail.com","name":"Khalid R. Rizvi"},"message":"t651 fixed json data response by plucking unncessary data and also Lint the section controller","distinct":false,"url":"https://api.github.com/repos/VHAINNOVATIONS/Mental-Health-eScreening/commits/df757ed8ad0c31af27c6099cc0c2d8818cb2ff6b"},{"sha":"6af479cb61611efc8ce9449c28a3e0eaf6aa9fe0","author":{"email":"e0c3a02e4102d2b5ed70e51bf9a27df65846d12e@gmail.com","name":"Khalid R. Rizvi"},"message":"Merge branch 't651' into resolved","distinct":true,"url":"https://api.github.com/repos/VHAINNOVATIONS/Mental-Health-eScreening/commits/6af479cb61611efc8ce9449c28a3e0eaf6aa9fe0"}]},"public":true,"created_at":"2015-01-01T01:01:24Z","org":{"id":1252476,"login":"VHAINNOVATIONS","gravatar_id":"","url":"https://api.github.com/orgs/VHAINNOVATIONS","avatar_url":"https://avatars.githubusercontent.com/u/1252476?"}}
{"id":"2489396514","type":"PushEvent","actor":{"id":1181205,"login":"malekbr","gravatar_id":"","url":"https://api.github.com/users/malekbr","avatar_url":"https://avatars.githubusercontent.com/u/1181205?"},"repo":{"id":28657751,"name":"malekbr/PeevedPenguinsTemplate-Spritebuilder","url":"https://api.github.com/repos/malekbr/PeevedPenguinsTemplate-Spritebuilder"},"payload":{"push_id":536752516,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"460a58f6adfc1f1b56a088c786717a53749f4cd7","before":"3084e78941af25cb8d49f4a9483e17ad41bcfd3e","commits":[{"sha":"460a58f6adfc1f1b56a088c786717a53749f4cd7","author":{"email":"73d3febb659ea118d8f1f9f1ff5f5ae09f3ca6d6@Mings-MacBook-Air.local","name":"Malek Ben Romdhane"},"message":"Automatically Committed for MakeGamesWithUs","distinct":true,"url":"https://api.github.com/repos/malekbr/PeevedPenguinsTemplate-Spritebuilder/commits/460a58f6adfc1f1b56a088c786717a53749f4cd7"}]},"public":true,"created_at":"2015-01-01T01:01:24Z"}
{"id":"2489396516","type":"PushEvent","actor":{"id":4444926,"login":"freeweibo","gravatar_id":"","url":"https://api.github.com/users/freeweibo","avatar_url":"https://avatars.githubusercontent.com/u/4444926?"},"repo":{"id":10095561,"name":"freeweibo/top","url":"https://api.github.com/repos/freeweibo/top"},"payload":{"push_id":536752517,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"83e98b10262f4a2ff93e33070453ab590be73eb2","before":"dc98fbebd53e1dbc0499aca11e5d293b3330ae2e","commits":[{"sha":"83e98b10262f4a2ff93e33070453ab590be73eb2","author":{"email":"24bf68e341ce0fbd9259a5d51feed79682ea4eba@ec2-us-web2.(none)","name":"Ubuntu"},"message":"auto","distinct":true,"url":"https://api.github.com/repos/freeweibo/top/commits/83e98b10262f4a2ff93e33070453ab590be73eb2"}]},"public":true,"created_at":"2015-01-01T01:01:24Z"}
{"id":"2489396517","type":"IssuesEvent","actor":{"id":6744175,"login":"antonioortegajr","gravatar_id":"","url":"https://api.github.com/users/antonioortegajr","avatar_url":"https://avatars.githubusercontent.com/u/6744175?"},"repo":{"id":28573267,"name":"antonioortegajr/beerfind.me","url":"https://api.github.com/repos/antonioortegajr/beerfind.me"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/antonioortegajr/beerfind.me/issues/13","labels_url":"https://api.github.com/repos/antonioortegajr/beerfind.me/issues/13/labels{/name}","comments_url":"https://api.github.com/repos/antonioortegajr/beerfind.me/issues/13/comments","events_url":"https://api.github.com/repos/antonioortegajr/beerfind.me/issues/13/events","html_url":"https://github.com/antonioortegajr/beerfind.me/issues/13","id":53210186,"number":13,"title":"search for six beers instead of five.","user":{"login":"antonioortegajr","id":6744175,"avatar_url":"https://avatars.githubusercontent.com/u/6744175?v=3","gravatar_id":"","url":"https://api.github.com/users/antonioortegajr","html_url":"https://github.com/antonioortegajr","followers_url":"https://api.github.com/users/antonioortegajr/followers","following_url":"https://api.github.com/users/antonioortegajr/following{/other_user}","gists_url":"https://api.github.com/users/antonioortegajr/gists{/gist_id}","starred_url":"https://api.github.com/users/antonioortegajr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/antonioortegajr/subscriptions","organizations_url":"https://api.github.com/users/antonioortegajr/orgs","repos_url":"https://api.github.com/users/antonioortegajr/repos","events_url":"https://api.github.com/users/antonioortegajr/events{/privacy}","received_events_url":"https://api.github.com/users/antonioortegajr/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:01:24Z","updated_at":"2015-01-01T01:0
1:24Z","closed_at":null,"body":"Currently 5 beers is the Max to  search for. This should be six and twelve after that."}},"public":true,"created_at":"2015-01-01T01:01:24Z"}
{"id":"2489396526","type":"IssueCommentEvent","actor":{"id":10334102,"login":"DaDominat0r","gravatar_id":"","url":"https://api.github.com/users/DaDominat0r","avatar_url":"https://avatars.githubusercontent.com/u/10334102?"},"repo":{"id":16182383,"name":"Wynncraft/Issues","url":"https://api.github.com/repos/Wynncraft/Issues"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/Wynncraft/Issues/issues/1409","labels_url":"https://api.github.com/repos/Wynncraft/Issues/issues/1409/labels{/name}","comments_url":"https://api.github.com/repos/Wynncraft/Issues/issues/1409/comments","events_url":"https://api.github.com/repos/Wynncraft/Issues/issues/1409/events","html_url":"https://github.com/Wynncraft/Issues/issues/1409","id":53013103,"number":1409,"title":"WynnExcavation Site A Broken","user":{"login":"DaDominat0r","id":10334102,"avatar_url":"https://avatars.githubusercontent.com/u/10334102?v=3","gravatar_id":"","url":"https://api.github.com/users/DaDominat0r","html_url":"https://github.com/DaDominat0r","followers_url":"https://api.github.com/users/DaDominat0r/followers","following_url":"https://api.github.com/users/DaDominat0r/following{/other_user}","gists_url":"https://api.github.com/users/DaDominat0r/gists{/gist_id}","starred_url":"https://api.github.com/users/DaDominat0r/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/DaDominat0r/subscriptions","organizations_url":"https://api.github.com/users/DaDominat0r/orgs","repos_url":"https://api.github.com/users/DaDominat0r/repos","events_url":"https://api.github.com/users/DaDominat0r/events{/privacy}","received_events_url":"https://api.github.com/users/DaDominat0r/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2014-12-28T23:56:03Z","updated_at":"2015-01-01T01:01:26Z","closed_at":"2014-12-29T18:08:12Z","body":"I cannot finish the WynnExcavation Site A quest. 
First I got the message to translate from Vade. I brought it to Tesha and she translated it. I then gave it back to Vade but I disconnected. I came back on with no translated paper and I could not finish the quest. I was also not able to use /fixquests to help me."},"comment":{"url":"https://api.github.com/repos/Wynncraft/Issues/issues/comments/68477243","html_url":"https://github.com/Wynncraft/Issues/issues/1409#issuecomment-68477243","issue_url":"https://api.github.com/repos/Wynncraft/Issues/issues/1409","id":68477243,"user":{"login":"DaDominat0r","id":10334102,"avatar_url":"https://avatars.githubusercontent.com/u/10334102?v=3","gravatar_id":"","url":"https://api.github.com/users/DaDominat0r","html_url":"https://github.com/DaDominat0r","followers_url":"https://api.github.com/users/DaDominat0r/followers","following_url":"https://api.github.com/users/DaDominat0r/following{/other_user}","gists_url":"https://api.github.com/users/DaDominat0r/gists{/gist_id}","starred_url":"https://api.github.com/users/DaDominat0r/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/DaDominat0r/subscriptions","organizations_url":"https://api.github.com/users/DaDominat0r/orgs","repos_url":"https://api.github.com/users/DaDominat0r/repos","events_url":"https://api.github.com/users/DaDominat0r/events{/privacy}","received_events_url":"https://api.github.com/users/DaDominat0r/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:01:26Z","updated_at":"2015-01-01T01:01:26Z","body":"So.. Can I get help on this or what?"}},"public":true,"created_at":"2015-01-01T01:01:26Z","org":{"id":5337644,"login":"Wynncraft","gravatar_id":"","url":"https://api.github.com/orgs/Wynncraft","avatar_url":"https://avatars.githubusercontent.com/u/5337644?"}}
{"id":"2489396528","type":"WatchEvent","actor":{"id":2519036,"login":"scidom","gravatar_id":"","url":"https://api.github.com/users/scidom","avatar_url":"https://avatars.githubusercontent.com/u/2519036?"},"repo":{"id":6201939,"name":"mlemerre/l-lang","url":"https://api.github.com/repos/mlemerre/l-lang"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:01:26Z"}
{"id":"2489396531","type":"PushEvent","actor":{"id":6232704,"login":"nashpitre","gravatar_id":"","url":"https://api.github.com/users/nashpitre","avatar_url":"https://avatars.githubusercontent.com/u/6232704?"},"repo":{"id":28620312,"name":"nashpitre/nashpitre.github.io","url":"https://api.github.com/repos/nashpitre/nashpitre.github.io"},"payload":{"push_id":536752519,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"51b30814df5685fd473d136c26735a17cf577361","before":"c819b12361e14ee82463ecd628fb30cfcbade895","commits":[{"sha":"51b30814df5685fd473d136c26735a17cf577361","author":{"email":"be30e9ada7478b999c213bbb3535884788d4bb46@me.com","name":"nashpitre"},"message":"short","distinct":true,"url":"https://api.github.com/repos/nashpitre/nashpitre.github.io/commits/51b30814df5685fd473d136c26735a17cf577361"}]},"public":true,"created_at":"2015-01-01T01:01:26Z"}
{"id":"2489396532","type":"PushEvent","actor":{"id":171072,"login":"floydpink","gravatar_id":"","url":"https://api.github.com/users/floydpink","avatar_url":"https://avatars.githubusercontent.com/u/171072?"},"repo":{"id":28069452,"name":"floydpink/BhagavadGita-ios","url":"https://api.github.com/repos/floydpink/BhagavadGita-ios"},"payload":{"push_id":536752520,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"5a83c1baf8fb498f94821ee6c946cb6e9e2b9045","before":"aac807139c1fdd163e6ca29e937d1c684c6db953","commits":[{"sha":"be50a575a875bc3f19cf04fb114509a0ebf4f677","author":{"email":"5f2a1115638e65cf53a275a1d015ff80305829a3@googlemail.com","name":"Floyd Pink"},"message":"section detail is much better","distinct":true,"url":"https://api.github.com/repos/floydpink/BhagavadGita-ios/commits/be50a575a875bc3f19cf04fb114509a0ebf4f677"},{"sha":"5a83c1baf8fb498f94821ee6c946cb6e9e2b9045","author":{"email":"5f2a1115638e65cf53a275a1d015ff80305829a3@googlemail.com","name":"Floyd Pink"},"message":"updated gita.json with sloka number","distinct":true,"url":"https://api.github.com/repos/floydpink/BhagavadGita-ios/commits/5a83c1baf8fb498f94821ee6c946cb6e9e2b9045"}]},"public":true,"created_at":"2015-01-01T01:01:27Z"}
{"id":"2489396534","type":"PushEvent","actor":{"id":8017734,"login":"mikebutts","gravatar_id":"","url":"https://api.github.com/users/mikebutts","avatar_url":"https://avatars.githubusercontent.com/u/8017734?"},"repo":{"id":27460929,"name":"mikebutts/rgs","url":"https://api.github.com/repos/mikebutts/rgs"},"payload":{"push_id":536752521,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"15b9c4283de821b7f69199886593ebd231a11c41","before":"99cbde7783ed2cf0ea1db35f8c2ca1bffadcac5f","commits":[{"sha":"15b9c4283de821b7f69199886593ebd231a11c41","author":{"email":"1cf700477a4cf35c86434038dff20d0fc84c9161@gmail.com","name":"mikebutts"},"message":"Customized the views","distinct":true,"url":"https://api.github.com/repos/mikebutts/rgs/commits/15b9c4283de821b7f69199886593ebd231a11c41"}]},"public":true,"created_at":"2015-01-01T01:01:27Z"}
{"id":"2489396538","type":"PushEvent","actor":{"id":8703251,"login":"ameliamarie","gravatar_id":"","url":"https://api.github.com/users/ameliamarie","avatar_url":"https://avatars.githubusercontent.com/u/8703251?"},"repo":{"id":23813546,"name":"thearrow/ameliamarie","url":"https://api.github.com/repos/thearrow/ameliamarie"},"payload":{"push_id":536752526,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"0229ea3cce319f0d61433d352c2b900c77a4762a","before":"3471f07be1e4b322e72c7e1ede88a521139462cc","commits":[{"sha":"0229ea3cce319f0d61433d352c2b900c77a4762a","author":{"email":"54048cf8a75c1b0abf0231a8f9808799724944c4@gmail.com","name":"Amelia Schumacher"},"message":"Added logo, decreased top margin","distinct":true,"url":"https://api.github.com/repos/thearrow/ameliamarie/commits/0229ea3cce319f0d61433d352c2b900c77a4762a"}]},"public":true,"created_at":"2015-01-01T01:01:28Z"}
{"id":"2489396539","type":"PushEvent","actor":{"id":6154548,"login":"chrisanthropic","gravatar_id":"","url":"https://api.github.com/users/chrisanthropic","avatar_url":"https://avatars.githubusercontent.com/u/6154548?"},"repo":{"id":28470344,"name":"chrisanthropic/comical-jekyll-theme","url":"https://api.github.com/repos/chrisanthropic/comical-jekyll-theme"},"payload":{"push_id":536752527,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"16fe2da04c5558db261f6c5eb49bb07d805ebefc","before":"ad3cceedf0f2687257655fc606f863da4639b4f9","commits":[{"sha":"16fe2da04c5558db261f6c5eb49bb07d805ebefc","author":{"email":"a9c72f90f6fdaaea784cb28e2da787f981b8fb43@gmail.com","name":"Christopher Tarwater"},"message":"fix banner image url on banner documentation page","distinct":true,"url":"https://api.github.com/repos/chrisanthropic/comical-jekyll-theme/commits/16fe2da04c5558db261f6c5eb49bb07d805ebefc"}]},"public":true,"created_at":"2015-01-01T01:01:28Z"}
{"id":"2489396540","type":"PushEvent","actor":{"id":5784044,"login":"Guad","gravatar_id":"","url":"https://api.github.com/users/Guad","avatar_url":"https://avatars.githubusercontent.com/u/5784044?"},"repo":{"id":28678140,"name":"Guad/pydeo","url":"https://api.github.com/repos/Guad/pydeo"},"payload":{"push_id":536752528,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e19a124b7d16dfc2bb3c53a25f6bed3d41df5dc0","before":"286c1baf59bad94aa73e3e60bd63ad4646727022","commits":[{"sha":"e19a124b7d16dfc2bb3c53a25f6bed3d41df5dc0","author":{"email":"45325f93c3023a3d37b7fdabaeabd7a663a476f8@gmail.com","name":"Phil"},"message":"Added starting files","distinct":true,"url":"https://api.github.com/repos/Guad/pydeo/commits/e19a124b7d16dfc2bb3c53a25f6bed3d41df5dc0"}]},"public":true,"created_at":"2015-01-01T01:01:28Z"}
{"id":"2489396542","type":"PushEvent","actor":{"id":10176820,"login":"chalavadivishnu","gravatar_id":"","url":"https://api.github.com/users/chalavadivishnu","avatar_url":"https://avatars.githubusercontent.com/u/10176820?"},"repo":{"id":28678150,"name":"chalavadivishnu/Face-Detection","url":"https://api.github.com/repos/chalavadivishnu/Face-Detection"},"payload":{"push_id":536752529,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"22a9bd6584d30cc259b5b0055cb6a8bff31d8d9e","before":"9b5858f96f8d101afa8e568dbe8424c32d010166","commits":[{"sha":"22a9bd6584d30cc259b5b0055cb6a8bff31d8d9e","author":{"email":"ce8044f02eb2a26b631671f5297317036d398e79@gmail.com","name":"Chalavadi Vishnu"},"message":"gabor function","distinct":true,"url":"https://api.github.com/repos/chalavadivishnu/Face-Detection/commits/22a9bd6584d30cc259b5b0055cb6a8bff31d8d9e"}]},"public":true,"created_at":"2015-01-01T01:01:29Z"}
{"id":"2489396543","type":"PushEvent","actor":{"id":1967266,"login":"ogupte","gravatar_id":"","url":"https://api.github.com/users/ogupte","avatar_url":"https://avatars.githubusercontent.com/u/1967266?"},"repo":{"id":28677997,"name":"ogupte/trope","url":"https://api.github.com/repos/ogupte/trope"},"payload":{"push_id":536752531,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"481e49afd08fbfd366fc7a88674b3a1d669c96ce","before":"e9e440aaa8897bbc0de676772f236f89c53c9ecb","commits":[{"sha":"481e49afd08fbfd366fc7a88674b3a1d669c96ce","author":{"email":"bd02fa4a4ee63436bd157864cccdf8b3a026562b@appnexus.com","name":"Oliver Gupte"},"message":"fixed README formatting to conform with github markdown standards","distinct":true,"url":"https://api.github.com/repos/ogupte/trope/commits/481e49afd08fbfd366fc7a88674b3a1d669c96ce"}]},"public":true,"created_at":"2015-01-01T01:01:29Z"}
{"id":"2489396545","type":"PushEvent","actor":{"id":6436073,"login":"523860169","gravatar_id":"","url":"https://api.github.com/users/523860169","avatar_url":"https://avatars.githubusercontent.com/u/6436073?"},"repo":{"id":23783874,"name":"523860169/list","url":"https://api.github.com/repos/523860169/list"},"payload":{"push_id":536752532,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f27f319fd966f774f9a14aad012414686f2285f2","before":"639e5ab48e2bb80c20c195c456783b0e29c97838","commits":[{"sha":"f27f319fd966f774f9a14aad012414686f2285f2","author":{"email":"10f258ee912bdd79d094034bf50cfe8c68b73bc7@gmail.com","name":"523860169"},"message":"update","distinct":true,"url":"https://api.github.com/repos/523860169/list/commits/f27f319fd966f774f9a14aad012414686f2285f2"}]},"public":true,"created_at":"2015-01-01T01:01:29Z"}
{"id":"2489396549","type":"IssuesEvent","actor":{"id":541713,"login":"aaronpeterson","gravatar_id":"","url":"https://api.github.com/users/aaronpeterson","avatar_url":"https://avatars.githubusercontent.com/u/541713?"},"repo":{"id":15320781,"name":"paulyoder/angular-bootstrap-show-errors","url":"https://api.github.com/repos/paulyoder/angular-bootstrap-show-errors"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/paulyoder/angular-bootstrap-show-errors/issues/30","labels_url":"https://api.github.com/repos/paulyoder/angular-bootstrap-show-errors/issues/30/labels{/name}","comments_url":"https://api.github.com/repos/paulyoder/angular-bootstrap-show-errors/issues/30/comments","events_url":"https://api.github.com/repos/paulyoder/angular-bootstrap-show-errors/issues/30/events","html_url":"https://github.com/paulyoder/angular-bootstrap-show-errors/issues/30","id":53210190,"number":30,"title":"Using inside of a directive","user":{"login":"aaronpeterson","id":541713,"avatar_url":"https://avatars.githubusercontent.com/u/541713?v=3","gravatar_id":"","url":"https://api.github.com/users/aaronpeterson","html_url":"https://github.com/aaronpeterson","followers_url":"https://api.github.com/users/aaronpeterson/followers","following_url":"https://api.github.com/users/aaronpeterson/following{/other_user}","gists_url":"https://api.github.com/users/aaronpeterson/gists{/gist_id}","starred_url":"https://api.github.com/users/aaronpeterson/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/aaronpeterson/subscriptions","organizations_url":"https://api.github.com/users/aaronpeterson/orgs","repos_url":"https://api.github.com/users/aaronpeterson/repos","events_url":"https://api.github.com/users/aaronpeterson/events{/privacy}","received_events_url":"https://api.github.com/users/aaronpeterson/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-0
1T01:01:29Z","updated_at":"2015-01-01T01:01:29Z","closed_at":null,"body":"Should show-errors work inside of another (parent) directive's template?  I see 'formCtrl' being injected as a result of require: '^form' but the instance of formCtrl is missing fields.  This results in formCtrl[inputName] being undefined on [line 39](https://github.com/paulyoder/angular-bootstrap-show-errors/blob/master/src/showErrors.js#L39) when the event is triggered.  \r\n\r\nMy parent directive uses templateUrl, so not sure if related to [this issue](http://stackoverflow.com/questions/22535317/using-directive-inside-a-templateurl-attribute).  Still digging."}},"public":true,"created_at":"2015-01-01T01:01:29Z"}
{"id":"2489396550","type":"PushEvent","actor":{"id":3949826,"login":"tschudin","gravatar_id":"","url":"https://api.github.com/users/tschudin","avatar_url":"https://avatars.githubusercontent.com/u/3949826?"},"repo":{"id":8971938,"name":"cn-uofbasel/ccn-lite","url":"https://api.github.com/repos/cn-uofbasel/ccn-lite"},"payload":{"push_id":536752533,"size":1,"distinct_size":1,"ref":"refs/heads/forwarder","head":"21284a42e4588d65ec5b763cee8e728d9d398e16","before":"3380f880670b473df5069028a4622e9aedcd5521","commits":[{"sha":"21284a42e4588d65ec5b763cee8e728d9d398e16","author":{"email":"53311a286a42748871239dcb38bda6322d2809ef@l2apps.com","name":"Christian F. Tschudin"},"message":"purged all duplicate fields in ccnl_content_s, ccnl_interest_s still pending","distinct":true,"url":"https://api.github.com/repos/cn-uofbasel/ccn-lite/commits/21284a42e4588d65ec5b763cee8e728d9d398e16"}]},"public":true,"created_at":"2015-01-01T01:01:29Z","org":{"id":3949801,"login":"cn-uofbasel","gravatar_id":"","url":"https://api.github.com/orgs/cn-uofbasel","avatar_url":"https://avatars.githubusercontent.com/u/3949801?"}}
{"id":"2489396557","type":"PushEvent","actor":{"id":2099320,"login":"cindyker","gravatar_id":"","url":"https://api.github.com/users/cindyker","avatar_url":"https://avatars.githubusercontent.com/u/2099320?"},"repo":{"id":28552874,"name":"cindyker/Crafty","url":"https://api.github.com/repos/cindyker/Crafty"},"payload":{"push_id":536752535,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"cd304b11129fa0888ead7673b3d83336033585c5","before":"93fd373cb7d26ac0e201680ac33cfc831ac6686e","commits":[{"sha":"cd304b11129fa0888ead7673b3d83336033585c5","author":{"email":"3a89c3a4a263b82f3475f9f2af701d5c4dba9e08@hotmail.com","name":"cindyker"},"message":"pom update for heroes","distinct":true,"url":"https://api.github.com/repos/cindyker/Crafty/commits/cd304b11129fa0888ead7673b3d83336033585c5"}]},"public":true,"created_at":"2015-01-01T01:01:32Z"}
{"id":"2489396558","type":"PushEvent","actor":{"id":735008,"login":"kragniz","gravatar_id":"","url":"https://api.github.com/users/kragniz","avatar_url":"https://avatars.githubusercontent.com/u/735008?"},"repo":{"id":28620211,"name":"kragniz/json-sempai","url":"https://api.github.com/repos/kragniz/json-sempai"},"payload":{"push_id":536752536,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b96375864c7b6e5868a18833a2bc226d8dbbf275","before":"bdf617ecb4a1465ce5d392c65d98165e6652c7e2","commits":[{"sha":"b96375864c7b6e5868a18833a2bc226d8dbbf275","author":{"email":"c6a2862a65fb525f43531512880f69e2460922c9@gmail.com","name":"Louis Taylor"},"message":"Update description in setup.py","distinct":true,"url":"https://api.github.com/repos/kragniz/json-sempai/commits/b96375864c7b6e5868a18833a2bc226d8dbbf275"}]},"public":true,"created_at":"2015-01-01T01:01:32Z"}
{"id":"2489396565","type":"PushEvent","actor":{"id":3781771,"login":"hwchen","gravatar_id":"","url":"https://api.github.com/users/hwchen","avatar_url":"https://avatars.githubusercontent.com/u/3781771?"},"repo":{"id":26837590,"name":"hwchen/euler-hs","url":"https://api.github.com/repos/hwchen/euler-hs"},"payload":{"push_id":536752541,"size":3,"distinct_size":3,"ref":"refs/heads/master","head":"f03bbb2e8b1ea9c47bbc4b16db55ce9c3c55ae12","before":"5e8b1b964b46fff4d9c16f073dded632719d044d","commits":[{"sha":"ef089e1f30c63552f274a6bbb7da24584f464045","author":{"email":"731c5ac76cbb5cd3515a328d1315fcf27dc3a4f9@gmail.com","name":"hwchen"},"message":"finished euler 50","distinct":true,"url":"https://api.github.com/repos/hwchen/euler-hs/commits/ef089e1f30c63552f274a6bbb7da24584f464045"},{"sha":"8378498984bf415a4ed61877babcaa2cc4cc9f13","author":{"email":"731c5ac76cbb5cd3515a328d1315fcf27dc3a4f9@gmail.com","name":"hwchen"},"message":"finished euler 57","distinct":true,"url":"https://api.github.com/repos/hwchen/euler-hs/commits/8378498984bf415a4ed61877babcaa2cc4cc9f13"},{"sha":"f03bbb2e8b1ea9c47bbc4b16db55ce9c3c55ae12","author":{"email":"731c5ac76cbb5cd3515a328d1315fcf27dc3a4f9@gmail.com","name":"hwchen"},"message":"finished euler 62","distinct":true,"url":"https://api.github.com/repos/hwchen/euler-hs/commits/f03bbb2e8b1ea9c47bbc4b16db55ce9c3c55ae12"}]},"public":true,"created_at":"2015-01-01T01:01:32Z"}
{"id":"2489396567","type":"IssueCommentEvent","actor":{"id":913757,"login":"adarsh","gravatar_id":"","url":"https://api.github.com/users/adarsh","avatar_url":"https://avatars.githubusercontent.com/u/913757?"},"repo":{"id":7411076,"name":"thoughtbot/hound","url":"https://api.github.com/repos/thoughtbot/hound"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/thoughtbot/hound/issues/527","labels_url":"https://api.github.com/repos/thoughtbot/hound/issues/527/labels{/name}","comments_url":"https://api.github.com/repos/thoughtbot/hound/issues/527/comments","events_url":"https://api.github.com/repos/thoughtbot/hound/issues/527/events","html_url":"https://github.com/thoughtbot/hound/pull/527","id":52546556,"number":527,"title":"Handle repos with inadequate information","user":{"login":"adarsh","id":913757,"avatar_url":"https://avatars.githubusercontent.com/u/913757?v=3","gravatar_id":"","url":"https://api.github.com/users/adarsh","html_url":"https://github.com/adarsh","followers_url":"https://api.github.com/users/adarsh/followers","following_url":"https://api.github.com/users/adarsh/following{/other_user}","gists_url":"https://api.github.com/users/adarsh/gists{/gist_id}","starred_url":"https://api.github.com/users/adarsh/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/adarsh/subscriptions","organizations_url":"https://api.github.com/users/adarsh/orgs","repos_url":"https://api.github.com/users/adarsh/repos","events_url":"https://api.github.com/users/adarsh/events{/privacy}","received_events_url":"https://api.github.com/users/adarsh/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":3,"created_at":"2014-12-20T01:24:36Z","updated_at":"2015-01-01T01:01:32Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/thoughtbot/hound/pulls/527","html_url":"https://github.com/thoughtbot/hound/pull/527","diff_url":"https://github.com/t
houghtbot/hound/pull/527.diff","patch_url":"https://github.com/thoughtbot/hound/pull/527.patch"},"body":"* Inactivate repositories which lack privacy or org information\n* Add rake task to update repo information\n\nhttps://trello.com/c/oPFtmreZ/393-builds-are-being-run-for-active-repos-missing-privacy-and-organization-information"},"comment":{"url":"https://api.github.com/repos/thoughtbot/hound/issues/comments/68477246","html_url":"https://github.com/thoughtbot/hound/pull/527#issuecomment-68477246","issue_url":"https://api.github.com/repos/thoughtbot/hound/issues/527","id":68477246,"user":{"login":"adarsh","id":913757,"avatar_url":"https://avatars.githubusercontent.com/u/913757?v=3","gravatar_id":"","url":"https://api.github.com/users/adarsh","html_url":"https://github.com/adarsh","followers_url":"https://api.github.com/users/adarsh/followers","following_url":"https://api.github.com/users/adarsh/following{/other_user}","gists_url":"https://api.github.com/users/adarsh/gists{/gist_id}","starred_url":"https://api.github.com/users/adarsh/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/adarsh/subscriptions","organizations_url":"https://api.github.com/users/adarsh/orgs","repos_url":"https://api.github.com/users/adarsh/repos","events_url":"https://api.github.com/users/adarsh/events{/privacy}","received_events_url":"https://api.github.com/users/adarsh/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:01:32Z","updated_at":"2015-01-01T01:01:32Z","body":"@gylaz Note that I had to add the new `schema.rb` file. Please doublecheck before I merge. 707b26b"}},"public":true,"created_at":"2015-01-01T01:01:32Z","org":{"id":6183,"login":"thoughtbot","gravatar_id":"","url":"https://api.github.com/orgs/thoughtbot","avatar_url":"https://avatars.githubusercontent.com/u/6183?"}}
{"id":"2489396576","type":"PushEvent","actor":{"id":376230,"login":"tiandavis","gravatar_id":"","url":"https://api.github.com/users/tiandavis","avatar_url":"https://avatars.githubusercontent.com/u/376230?"},"repo":{"id":28674331,"name":"tiandavis/caramel","url":"https://api.github.com/repos/tiandavis/caramel"},"payload":{"push_id":536752546,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"70b984b9789c97a222fb2a1cca637243f31dd977","before":"975b81e7e10ead6dc0078fde03cf3f30079f2adf","commits":[{"sha":"70b984b9789c97a222fb2a1cca637243f31dd977","author":{"email":"e9142163b8d26080ab61ec5db295a45dad55c70e@gmail.com","name":"Tian Davis"},"message":"Updated project readme.","distinct":true,"url":"https://api.github.com/repos/tiandavis/caramel/commits/70b984b9789c97a222fb2a1cca637243f31dd977"}]},"public":true,"created_at":"2015-01-01T01:01:33Z"}
{"id":"2489396577","type":"PushEvent","actor":{"id":814471,"login":"swegener","gravatar_id":"","url":"https://api.github.com/users/swegener","avatar_url":"https://avatars.githubusercontent.com/u/814471?"},"repo":{"id":17971324,"name":"swegener/gentoo-portage","url":"https://api.github.com/repos/swegener/gentoo-portage"},"payload":{"push_id":536752547,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d2d7b600bdf168a351eae73f0df0d6c6feebc174","before":"93c6eace483ddf68d6707b005bed915724da00b2","commits":[{"sha":"d2d7b600bdf168a351eae73f0df0d6c6feebc174","author":{"email":"18dc2ed701c57df81c0b5498c13767c232eb398f@stealer.net","name":"Sven Wegener"},"message":"2015-01-01 00:36:52+00:00","distinct":true,"url":"https://api.github.com/repos/swegener/gentoo-portage/commits/d2d7b600bdf168a351eae73f0df0d6c6feebc174"}]},"public":true,"created_at":"2015-01-01T01:01:33Z"}
{"id":"2489396581","type":"WatchEvent","actor":{"id":8263721,"login":"akatray","gravatar_id":"","url":"https://api.github.com/users/akatray","avatar_url":"https://avatars.githubusercontent.com/u/8263721?"},"repo":{"id":9524997,"name":"glfw/glfw","url":"https://api.github.com/repos/glfw/glfw"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:01:35Z","org":{"id":3905364,"login":"glfw","gravatar_id":"","url":"https://api.github.com/orgs/glfw","avatar_url":"https://avatars.githubusercontent.com/u/3905364?"}}
{"id":"2489396582","type":"IssueCommentEvent","actor":{"id":874715,"login":"jenkinsadmin","gravatar_id":"","url":"https://api.github.com/users/jenkinsadmin","avatar_url":"https://avatars.githubusercontent.com/u/874715?"},"repo":{"id":1488959,"name":"jenkinsci/periodicbackup-plugin","url":"https://api.github.com/repos/jenkinsci/periodicbackup-plugin"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/jenkinsci/periodicbackup-plugin/issues/9","labels_url":"https://api.github.com/repos/jenkinsci/periodicbackup-plugin/issues/9/labels{/name}","comments_url":"https://api.github.com/repos/jenkinsci/periodicbackup-plugin/issues/9/comments","events_url":"https://api.github.com/repos/jenkinsci/periodicbackup-plugin/issues/9/events","html_url":"https://github.com/jenkinsci/periodicbackup-plugin/pull/9","id":53200776,"number":9,"title":"Don't follow symlinks.","user":{"login":"jikamens","id":1598067,"avatar_url":"https://avatars.githubusercontent.com/u/1598067?v=3","gravatar_id":"","url":"https://api.github.com/users/jikamens","html_url":"https://github.com/jikamens","followers_url":"https://api.github.com/users/jikamens/followers","following_url":"https://api.github.com/users/jikamens/following{/other_user}","gists_url":"https://api.github.com/users/jikamens/gists{/gist_id}","starred_url":"https://api.github.com/users/jikamens/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jikamens/subscriptions","organizations_url":"https://api.github.com/users/jikamens/orgs","repos_url":"https://api.github.com/users/jikamens/repos","events_url":"https://api.github.com/users/jikamens/events{/privacy}","received_events_url":"https://api.github.com/users/jikamens/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2014-12-31T19:57:13Z","updated_at":"2015-01-01T01:01:34Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/jenki
nsci/periodicbackup-plugin/pulls/9","html_url":"https://github.com/jenkinsci/periodicbackup-plugin/pull/9","diff_url":"https://github.com/jenkinsci/periodicbackup-plugin/pull/9.diff","patch_url":"https://github.com/jenkinsci/periodicbackup-plugin/pull/9.patch"},"body":"Backups shouldn't follow symbolic links.\r\n\r\nI haven't been able to actually compile and test this change, because it uses out-of-date packages, and my various efforts to update various packages all ended in failure, when I discovered that the latest versions of some of the required packages use google-collections (which is obsolete and no longer maintained), and this package itself uses guava instead, and google-collections and guava are incompatible.\r\n\r\nI don't know if anybody is maintaining this anymore. If so, then I think it needs some work to be compilable with an up-to-date java. My java mojo is not strong enough to get it done.\r\n"},"comment":{"url":"https://api.github.com/repos/jenkinsci/periodicbackup-plugin/issues/comments/68477247","html_url":"https://github.com/jenkinsci/periodicbackup-plugin/pull/9#issuecomment-68477247","issue_url":"https://api.github.com/repos/jenkinsci/periodicbackup-plugin/issues/9","id":68477247,"user":{"login":"jenkinsadmin","id":874715,"avatar_url":"https://avatars.githubusercontent.com/u/874715?v=3","gravatar_id":"","url":"https://api.github.com/users/jenkinsadmin","html_url":"https://github.com/jenkinsadmin","followers_url":"https://api.github.com/users/jenkinsadmin/followers","following_url":"https://api.github.com/users/jenkinsadmin/following{/other_user}","gists_url":"https://api.github.com/users/jenkinsadmin/gists{/gist_id}","starred_url":"https://api.github.com/users/jenkinsadmin/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jenkinsadmin/subscriptions","organizations_url":"https://api.github.com/users/jenkinsadmin/orgs","repos_url":"https://api.github.com/users/jenkinsadmin/repos","events_url":"https://api.github.com/user
s/jenkinsadmin/events{/privacy}","received_events_url":"https://api.github.com/users/jenkinsadmin/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:01:34Z","updated_at":"2015-01-01T01:01:34Z","body":"Thank you for a pull request! Please check [this document](http://jenkins-ci.org/pull-request-greeting) for how the Jenkins project handles pull requests"}},"public":true,"created_at":"2015-01-01T01:01:35Z","org":{"id":107424,"login":"jenkinsci","gravatar_id":"","url":"https://api.github.com/orgs/jenkinsci","avatar_url":"https://avatars.githubusercontent.com/u/107424?"}}
{"id":"2489396583","type":"CreateEvent","actor":{"id":8005041,"login":"quynk94","gravatar_id":"","url":"https://api.github.com/users/quynk94","avatar_url":"https://avatars.githubusercontent.com/u/8005041?"},"repo":{"id":28678228,"name":"quynk94/fedora-WP-Theme-","url":"https://api.github.com/repos/quynk94/fedora-WP-Theme-"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:01:36Z"}
{"id":"2489396585","type":"PushEvent","actor":{"id":10225575,"login":"ExclusiveOrange","gravatar_id":"","url":"https://api.github.com/users/ExclusiveOrange","avatar_url":"https://avatars.githubusercontent.com/u/10225575?"},"repo":{"id":28677579,"name":"ExclusiveOrange/synthesizer","url":"https://api.github.com/repos/ExclusiveOrange/synthesizer"},"payload":{"push_id":536752550,"size":0,"distinct_size":0,"ref":"refs/heads/master","head":"0e64036d5ac0d9c24b4cbe39bb778570db49caba","before":"0e64036d5ac0d9c24b4cbe39bb778570db49caba","commits":[]},"public":true,"created_at":"2015-01-01T01:01:36Z"}
{"id":"2489396597","type":"PushEvent","actor":{"id":433707,"login":"ile","gravatar_id":"","url":"https://api.github.com/users/ile","avatar_url":"https://avatars.githubusercontent.com/u/433707?"},"repo":{"id":26847132,"name":"kantele/k-templates","url":"https://api.github.com/repos/kantele/k-templates"},"payload":{"push_id":536752555,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d989a60a4e050573d9ba85048499d9a0a7e8117e","before":"263e28e0e1c63e70b3ba9fd7b157945a394c6d14","commits":[{"sha":"d989a60a4e050573d9ba85048499d9a0a7e8117e","author":{"email":"4f3407de78bccc8cc160ee4d278d5efe7162e6b5@nateps.com","name":"Nate Smith"},"message":"fix bug with attribute bindings because forInnerPath wasn't being passed","distinct":true,"url":"https://api.github.com/repos/kantele/k-templates/commits/d989a60a4e050573d9ba85048499d9a0a7e8117e"}]},"public":true,"created_at":"2015-01-01T01:01:37Z","org":{"id":5687585,"login":"kantele","gravatar_id":"","url":"https://api.github.com/orgs/kantele","avatar_url":"https://avatars.githubusercontent.com/u/5687585?"}}
{"id":"2489396602","type":"IssuesEvent","actor":{"id":1432632,"login":"ajubbal","gravatar_id":"","url":"https://api.github.com/users/ajubbal","avatar_url":"https://avatars.githubusercontent.com/u/1432632?"},"repo":{"id":629921,"name":"bobthecow/git-flow-completion","url":"https://api.github.com/repos/bobthecow/git-flow-completion"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/bobthecow/git-flow-completion/issues/37","labels_url":"https://api.github.com/repos/bobthecow/git-flow-completion/issues/37/labels{/name}","comments_url":"https://api.github.com/repos/bobthecow/git-flow-completion/issues/37/comments","events_url":"https://api.github.com/repos/bobthecow/git-flow-completion/issues/37/events","html_url":"https://github.com/bobthecow/git-flow-completion/issues/37","id":53210191,"number":37,"title":"Git Completion No Longer Working After Migration Between Computers","user":{"login":"ajubbal","id":1432632,"avatar_url":"https://avatars.githubusercontent.com/u/1432632?v=3","gravatar_id":"","url":"https://api.github.com/users/ajubbal","html_url":"https://github.com/ajubbal","followers_url":"https://api.github.com/users/ajubbal/followers","following_url":"https://api.github.com/users/ajubbal/following{/other_user}","gists_url":"https://api.github.com/users/ajubbal/gists{/gist_id}","starred_url":"https://api.github.com/users/ajubbal/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ajubbal/subscriptions","organizations_url":"https://api.github.com/users/ajubbal/orgs","repos_url":"https://api.github.com/users/ajubbal/repos","events_url":"https://api.github.com/users/ajubbal/events{/privacy}","received_events_url":"https://api.github.com/users/ajubbal/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:01:38Z","updated_at":"2015-01-01T01:01:38Z","closed_at":null,"body":"Everything is intact as I used the 
migration assistant, unless there is a requirement for Xcode command line tools or something of that nature? I installed this through Homebrew and it was working fine on my initial computer (running Mac OS 10.9.5) but ceases to work with my new machine (same OS version). Some help would be greatly appreciated."}},"public":true,"created_at":"2015-01-01T01:01:38Z"}
{"id":"2489396606","type":"WatchEvent","actor":{"id":5061849,"login":"newbin","gravatar_id":"","url":"https://api.github.com/users/newbin","avatar_url":"https://avatars.githubusercontent.com/u/5061849?"},"repo":{"id":661420,"name":"simplegeo/python-geohash","url":"https://api.github.com/repos/simplegeo/python-geohash"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:01:39Z","org":{"id":93415,"login":"simplegeo","gravatar_id":"","url":"https://api.github.com/orgs/simplegeo","avatar_url":"https://avatars.githubusercontent.com/u/93415?"}}
{"id":"2489396609","type":"PushEvent","actor":{"id":8933459,"login":"lmontopo","gravatar_id":"","url":"https://api.github.com/users/lmontopo","avatar_url":"https://avatars.githubusercontent.com/u/8933459?"},"repo":{"id":24911711,"name":"lmontopo/lmontopo.github.io","url":"https://api.github.com/repos/lmontopo/lmontopo.github.io"},"payload":{"push_id":536752559,"size":1,"distinct_size":1,"ref":"refs/heads/source","head":"7812248ef9626c3f04dcb73f41eab673e6cb3691","before":"5f6068e7c82948857bb919d278793bed517d069f","commits":[{"sha":"7812248ef9626c3f04dcb73f41eab673e6cb3691","author":{"email":"6beaeb38ccda0977b766148789e916197124dfed@gmail.com","name":"Leta Montopoli"},"message":"edited lessons.md","distinct":true,"url":"https://api.github.com/repos/lmontopo/lmontopo.github.io/commits/7812248ef9626c3f04dcb73f41eab673e6cb3691"}]},"public":true,"created_at":"2015-01-01T01:01:39Z"}
{"id":"2489396616","type":"CreateEvent","actor":{"id":3489773,"login":"captainkirkby","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","avatar_url":"https://avatars.githubusercontent.com/u/3489773?"},"repo":{"id":15461243,"name":"captainkirkby/Gears","url":"https://api.github.com/repos/captainkirkby/Gears"},"payload":{"ref":"#30","ref_type":"branch","master_branch":"master","description":"Set of packages used to measure a mechanical clock.","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:01:40Z"}
{"id":"2489396617","type":"PushEvent","actor":{"id":4390732,"login":"iamchairs","gravatar_id":"","url":"https://api.github.com/users/iamchairs","avatar_url":"https://avatars.githubusercontent.com/u/4390732?"},"repo":{"id":20004313,"name":"iamchairs/snooze","url":"https://api.github.com/repos/iamchairs/snooze"},"payload":{"push_id":536752563,"size":1,"distinct_size":1,"ref":"refs/heads/1.0.0-alpha.1","head":"9f289c1a6fd9b85e213e0a7104b2a2bfe6ee4104","before":"f9f2212d389e344e61c32f961ef77adbdef23bb3","commits":[{"sha":"9f289c1a6fd9b85e213e0a7104b2a2bfe6ee4104","author":{"email":"1de9ff26e599b349bd443b5cc72b005ab8ff1e50@gmail.com","name":"Micah Williamson"},"message":"return this on everything","distinct":true,"url":"https://api.github.com/repos/iamchairs/snooze/commits/9f289c1a6fd9b85e213e0a7104b2a2bfe6ee4104"}]},"public":true,"created_at":"2015-01-01T01:01:40Z"}
{"id":"2489396620","type":"PushEvent","actor":{"id":4115801,"login":"afeinland","gravatar_id":"","url":"https://api.github.com/users/afeinland","avatar_url":"https://avatars.githubusercontent.com/u/4115801?"},"repo":{"id":16446548,"name":"afeinland/vimrc","url":"https://api.github.com/repos/afeinland/vimrc"},"payload":{"push_id":536752565,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"dc3aa0c350eb43be8cd66bc83b053bf84ed4364a","before":"ed20c634809a7a3375a41b819143f5bf64389bd9","commits":[{"sha":"dc3aa0c350eb43be8cd66bc83b053bf84ed4364a","author":{"email":"de080937e87a3fc5b57c1b6f90bb5aded8f69508@ucr.edu","name":"Alex Feinland"},"message":"added set ruler rule","distinct":true,"url":"https://api.github.com/repos/afeinland/vimrc/commits/dc3aa0c350eb43be8cd66bc83b053bf84ed4364a"}]},"public":true,"created_at":"2015-01-01T01:01:41Z"}
{"id":"2489396621","type":"PushEvent","actor":{"id":8699738,"login":"harryganz","gravatar_id":"","url":"https://api.github.com/users/harryganz","avatar_url":"https://avatars.githubusercontent.com/u/8699738?"},"repo":{"id":28651515,"name":"harryganz/ganzfacts","url":"https://api.github.com/repos/harryganz/ganzfacts"},"payload":{"push_id":536752566,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"df578268ecc281cfadd96b2f884d19b3562c70e1","before":"0ffe15d38852b93efab774b6d51442c6fd9633e4","commits":[{"sha":"df578268ecc281cfadd96b2f884d19b3562c70e1","author":{"email":"8e8abe39cdbc49fc743305288c23722c02c5f1c2@rsmas.miami.edu","name":"Harry Ganz"},"message":"Added controllers\n\nAdded controllers for access, admin, fact, photo, post","distinct":true,"url":"https://api.github.com/repos/harryganz/ganzfacts/commits/df578268ecc281cfadd96b2f884d19b3562c70e1"}]},"public":true,"created_at":"2015-01-01T01:01:41Z"}
{"id":"2489396622","type":"PushEvent","actor":{"id":4153853,"login":"jlumijarvi","gravatar_id":"","url":"https://api.github.com/users/jlumijarvi","avatar_url":"https://avatars.githubusercontent.com/u/4153853?"},"repo":{"id":28678176,"name":"jlumijarvi/csv2xml","url":"https://api.github.com/repos/jlumijarvi/csv2xml"},"payload":{"push_id":536752567,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"c64c0c7b60fea3b7a191f3b8b39aa144d281ceba","before":"8c339f97ba859406034a4b4803ff9f10986c16ea","commits":[{"sha":"c64c0c7b60fea3b7a191f3b8b39aa144d281ceba","author":{"email":"40e6fc59d2535c98bfd5d19357e20df6e95cef64@gmail.com","name":"jlumijarvi"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/jlumijarvi/csv2xml/commits/c64c0c7b60fea3b7a191f3b8b39aa144d281ceba"}]},"public":true,"created_at":"2015-01-01T01:01:42Z"}
{"id":"2489396624","type":"PushEvent","actor":{"id":3124267,"login":"acprimer","gravatar_id":"","url":"https://api.github.com/users/acprimer","avatar_url":"https://avatars.githubusercontent.com/u/3124267?"},"repo":{"id":28179725,"name":"acprimer/Beauty-of-Programming","url":"https://api.github.com/repos/acprimer/Beauty-of-Programming"},"payload":{"push_id":536752568,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"8d605c3d782cf051a9b03b55b619a9525c3d5add","before":"a10e8208f5e136f1ba4c2ae16f56cee76f0e563d","commits":[{"sha":"8d605c3d782cf051a9b03b55b619a9525c3d5add","author":{"email":"621c6ca061921149bf4dbea85ceffd5a4497c1dc@qq.com","name":"Dahai Yao"},"message":"chap2.17","distinct":true,"url":"https://api.github.com/repos/acprimer/Beauty-of-Programming/commits/8d605c3d782cf051a9b03b55b619a9525c3d5add"}]},"public":true,"created_at":"2015-01-01T01:01:42Z"}
{"id":"2489396625","type":"PushEvent","actor":{"id":1221092,"login":"vuolter","gravatar_id":"","url":"https://api.github.com/users/vuolter","avatar_url":"https://avatars.githubusercontent.com/u/1221092?"},"repo":{"id":8122790,"name":"pyload/pyload","url":"https://api.github.com/repos/pyload/pyload"},"payload":{"push_id":536752569,"size":1,"distinct_size":1,"ref":"refs/heads/stable","head":"1f1e5cd57b08353c5f42add8f9b842c4926ba8ed","before":"60e9c46f32d97d01d728c8515985b58ba33fdafd","commits":[{"sha":"1f1e5cd57b08353c5f42add8f9b842c4926ba8ed","author":{"email":"5cc667be46e22897a880e49707c8ded7041bc0f9@gmail.com","name":"Walter Purcaro"},"message":"[RapiduNet] Fixup","distinct":true,"url":"https://api.github.com/repos/pyload/pyload/commits/1f1e5cd57b08353c5f42add8f9b842c4926ba8ed"}]},"public":true,"created_at":"2015-01-01T01:01:42Z","org":{"id":3521496,"login":"pyload","gravatar_id":"","url":"https://api.github.com/orgs/pyload","avatar_url":"https://avatars.githubusercontent.com/u/3521496?"}}
{"id":"2489396626","type":"PushEvent","actor":{"id":935160,"login":"thenomain","gravatar_id":"","url":"https://api.github.com/users/thenomain","avatar_url":"https://avatars.githubusercontent.com/u/935160?"},"repo":{"id":26726490,"name":"thenomain/GMCCG","url":"https://api.github.com/repos/thenomain/GMCCG"},"payload":{"push_id":536752570,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"32a8000020397a3c786d167233dfab8397cf2735","before":"265550d7fa10002cee34e64effe1dff2f0461287","commits":[{"sha":"5ef5e29232c7bfb607eef378bb9f9e18e0929819","author":{"email":"f2f79094bfbbb4cfcb0b5f9d1737b6d1f43b0201@gmail.com","name":"Kent Jenkins"},"message":"more class-system overhaul","distinct":true,"url":"https://api.github.com/repos/thenomain/GMCCG/commits/5ef5e29232c7bfb607eef378bb9f9e18e0929819"},{"sha":"32a8000020397a3c786d167233dfab8397cf2735","author":{"email":"f2f79094bfbbb4cfcb0b5f9d1737b6d1f43b0201@gmail.com","name":"Kent Jenkins"},"message":"separate tags out to own object\n\nTags are a huge portion of our lookup information, so I'm hoping that by taking them out of the main Data Dictionary and to their own object (Data Tags) that they will make lookup of most things quicker.\n\nThis paves the way in case Prerequisites, Book Reference, and Notes needs to do the same.","distinct":true,"url":"https://api.github.com/repos/thenomain/GMCCG/commits/32a8000020397a3c786d167233dfab8397cf2735"}]},"public":true,"created_at":"2015-01-01T01:01:42Z"}
{"id":"2489396630","type":"PushEvent","actor":{"id":6436073,"login":"523860169","gravatar_id":"","url":"https://api.github.com/users/523860169","avatar_url":"https://avatars.githubusercontent.com/u/6436073?"},"repo":{"id":27432101,"name":"523860169/sh","url":"https://api.github.com/repos/523860169/sh"},"payload":{"push_id":536752572,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f5565a7f3a75c7fca3b11480b24c02b70dd64f72","before":"55d430ff46d9023d0cdc935212ffa50328920a11","commits":[{"sha":"f5565a7f3a75c7fca3b11480b24c02b70dd64f72","author":{"email":"10f258ee912bdd79d094034bf50cfe8c68b73bc7@gmail.com","name":"523860169"},"message":"update","distinct":true,"url":"https://api.github.com/repos/523860169/sh/commits/f5565a7f3a75c7fca3b11480b24c02b70dd64f72"}]},"public":true,"created_at":"2015-01-01T01:01:43Z"}
{"id":"2489396631","type":"PushEvent","actor":{"id":367618,"login":"cm-gerrit","gravatar_id":"","url":"https://api.github.com/users/cm-gerrit","avatar_url":"https://avatars.githubusercontent.com/u/367618?"},"repo":{"id":26532168,"name":"CyanogenMod/android_device_qcom_sepolicy","url":"https://api.github.com/repos/CyanogenMod/android_device_qcom_sepolicy"},"payload":{"push_id":536752573,"size":1,"distinct_size":1,"ref":"refs/heads/cm-12.0","head":"77bb91189b6200c7743acad40b8cc1fb6fe32bc0","before":"233406f509e344c11d9a39a647cd6381afa42304","commits":[{"sha":"77bb91189b6200c7743acad40b8cc1fb6fe32bc0","author":{"email":"9ce5770b3bb4b2a1d59be2d97e34379cd192299f@cyngn.com","name":"Steve Kondik"},"message":"sepolicy: Allow apps to read battery status\n\n * Various apps do this to monitor the battery. No harm there.\n\nChange-Id: Id1b843ca509747ed963b89d025a39b5b1fcc7ddb","distinct":true,"url":"https://api.github.com/repos/CyanogenMod/android_device_qcom_sepolicy/commits/77bb91189b6200c7743acad40b8cc1fb6fe32bc0"}]},"public":true,"created_at":"2015-01-01T01:01:43Z","org":{"id":317721,"login":"CyanogenMod","gravatar_id":"","url":"https://api.github.com/orgs/CyanogenMod","avatar_url":"https://avatars.githubusercontent.com/u/317721?"}}
{"id":"2489396635","type":"PushEvent","actor":{"id":5975070,"login":"marcellodibello","gravatar_id":"","url":"https://api.github.com/users/marcellodibello","avatar_url":"https://avatars.githubusercontent.com/u/5975070?"},"repo":{"id":17580814,"name":"marcellodibello/marcellodibello.github.io","url":"https://api.github.com/repos/marcellodibello/marcellodibello.github.io"},"payload":{"push_id":536752575,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"7995cfd2d91a5b11eff75239ac124fae9af80d6d","before":"b5fdeaa9282cb3b94536ea0a2485e7b154c33d0a","commits":[{"sha":"7995cfd2d91a5b11eff75239ac124fae9af80d6d","author":{"email":"babd00909fb78351e79d40af26c77fc37bb4ed59@gmail.com","name":"marcellodibello"},"message":"Update index.html","distinct":true,"url":"https://api.github.com/repos/marcellodibello/marcellodibello.github.io/commits/7995cfd2d91a5b11eff75239ac124fae9af80d6d"}]},"public":true,"created_at":"2015-01-01T01:01:43Z"}
{"id":"2489396636","type":"PushEvent","actor":{"id":8819701,"login":"r-ggraham","gravatar_id":"","url":"https://api.github.com/users/r-ggraham","avatar_url":"https://avatars.githubusercontent.com/u/8819701?"},"repo":{"id":28678173,"name":"r-ggraham/Crumpet_Bot","url":"https://api.github.com/repos/r-ggraham/Crumpet_Bot"},"payload":{"push_id":536752576,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"332746658edcc60bca17720fce153357a2cd9dfb","before":"63b341a1c133b56bfaf703a2fed167478e1e4ed3","commits":[{"sha":"332746658edcc60bca17720fce153357a2cd9dfb","author":{"email":"f2f9dd43aa4244d32208a2ccfa0c7c9e9c48f7e7@uni.worc.ac.uk","name":"Rob G"},"message":"Credits\n\nAdded comment credits","distinct":true,"url":"https://api.github.com/repos/r-ggraham/Crumpet_Bot/commits/332746658edcc60bca17720fce153357a2cd9dfb"}]},"public":true,"created_at":"2015-01-01T01:01:43Z"}
{"id":"2489396639","type":"PushEvent","actor":{"id":869882,"login":"dpt","gravatar_id":"","url":"https://api.github.com/users/dpt","avatar_url":"https://avatars.githubusercontent.com/u/869882?"},"repo":{"id":27767031,"name":"dpt/DPTLib","url":"https://api.github.com/repos/dpt/DPTLib"},"payload":{"push_id":536752579,"size":4,"distinct_size":4,"ref":"refs/heads/master","head":"4517cde2c28d1ace039a16ed0d5e08859768602a","before":"e43b8c4ccd99f455062cce4952f013bcf986482a","commits":[{"sha":"88577c3778df7df077f6dd4323e59b8b9b41b688","author":{"email":"bfcdf3e6ca6cef45543bfbb57509c92aec9a39fb@davespace.co.uk","name":"David Thomas"},"message":"datastruct/vector: Add vector_insert, vector_ensure.","distinct":true,"url":"https://api.github.com/repos/dpt/DPTLib/commits/88577c3778df7df077f6dd4323e59b8b9b41b688"},{"sha":"b93b96d5db4bd7265a141337c0ac6979f4d8398c","author":{"email":"bfcdf3e6ca6cef45543bfbb57509c92aec9a39fb@davespace.co.uk","name":"David Thomas"},"message":"datastruct/vector: vector_insert()'s element to insert can be const *.","distinct":true,"url":"https://api.github.com/repos/dpt/DPTLib/commits/b93b96d5db4bd7265a141337c0ac6979f4d8398c"},{"sha":"51a8c9129b2983ac5486eda95484ac549f84e60d","author":{"email":"bfcdf3e6ca6cef45543bfbb57509c92aec9a39fb@davespace.co.uk","name":"David Thomas"},"message":"databases/digest-db: Mild rewrite of header prologue.","distinct":true,"url":"https://api.github.com/repos/dpt/DPTLib/commits/51a8c9129b2983ac5486eda95484ac549f84e60d"},{"sha":"4517cde2c28d1ace039a16ed0d5e08859768602a","author":{"email":"bfcdf3e6ca6cef45543bfbb57509c92aec9a39fb@davespace.co.uk","name":"David Thomas"},"message":"DPTLib.xccheckout: Remove stale repo refs.","distinct":true,"url":"https://api.github.com/repos/dpt/DPTLib/commits/4517cde2c28d1ace039a16ed0d5e08859768602a"}]},"public":true,"created_at":"2015-01-01T01:01:45Z"}
{"id":"2489396640","type":"CreateEvent","actor":{"id":790511,"login":"rizumita","gravatar_id":"","url":"https://api.github.com/users/rizumita","avatar_url":"https://avatars.githubusercontent.com/u/790511?"},"repo":{"id":28678229,"name":"rizumita/Ptarmigan","url":"https://api.github.com/repos/rizumita/Ptarmigan"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"CoreData functions for Swift","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:01:45Z"}
{"id":"2489396645","type":"PushEvent","actor":{"id":904370,"login":"helhum","gravatar_id":"","url":"https://api.github.com/users/helhum","avatar_url":"https://avatars.githubusercontent.com/u/904370?"},"repo":{"id":21070637,"name":"TYPO3-Surf-CMS/TYPO3SurfCms.SurfTools","url":"https://api.github.com/repos/TYPO3-Surf-CMS/TYPO3SurfCms.SurfTools"},"payload":{"push_id":536752582,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"03ce16ec5d355a60057fb57f8d27d7116422f722","before":"e74bb4aec4a873f3a9ed58e829b7f9f908cfa544","commits":[{"sha":"03ce16ec5d355a60057fb57f8d27d7116422f722","author":{"email":"6bf857ca7de026fbed4ae790a809a0ea640901f4@helmuthummel.de","name":"Helmut Hummel"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/TYPO3-Surf-CMS/TYPO3SurfCms.SurfTools/commits/03ce16ec5d355a60057fb57f8d27d7116422f722"}]},"public":true,"created_at":"2015-01-01T01:01:46Z","org":{"id":7921669,"login":"TYPO3-Surf-CMS","gravatar_id":"","url":"https://api.github.com/orgs/TYPO3-Surf-CMS","avatar_url":"https://avatars.githubusercontent.com/u/7921669?"}}
{"id":"2489396647","type":"PushEvent","actor":{"id":4359301,"login":"inmWill","gravatar_id":"","url":"https://api.github.com/users/inmWill","avatar_url":"https://avatars.githubusercontent.com/u/4359301?"},"repo":{"id":27058289,"name":"inmWill/inmNgLayouts","url":"https://api.github.com/repos/inmWill/inmNgLayouts"},"payload":{"push_id":536752584,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1b30dcdd5a034183a7b2da4c8abc8b4736ce144a","before":"38d6079b791807f692845a7e665ff146cce78b2f","commits":[{"sha":"1b30dcdd5a034183a7b2da4c8abc8b4736ce144a","author":{"email":"b8d2c4785179c9d0f40139a5951d8a653241c7ef@inmerge.com","name":"Farang"},"message":"removed test","distinct":true,"url":"https://api.github.com/repos/inmWill/inmNgLayouts/commits/1b30dcdd5a034183a7b2da4c8abc8b4736ce144a"}]},"public":true,"created_at":"2015-01-01T01:01:47Z"}
{"id":"2489396656","type":"PushEvent","actor":{"id":2501598,"login":"paciorek","gravatar_id":"","url":"https://api.github.com/users/paciorek","avatar_url":"https://avatars.githubusercontent.com/u/2501598?"},"repo":{"id":17234057,"name":"PalEON-Project/composition","url":"https://api.github.com/repos/PalEON-Project/composition"},"payload":{"push_id":536752590,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f355f83b85994252322ee2194d54576077d38c88","before":"0cdff15a8f0387fe76196a3f05528b3128083d11","commits":[{"sha":"f355f83b85994252322ee2194d54576077d38c88","author":{"email":"cd2303627620d42aea1f002984decb2f80e8de9b@scf.Berkeley.EDU","name":"Christopher Paciorek"},"message":"more cleaning of files/paths in R files;\nadded packrat to repo","distinct":true,"url":"https://api.github.com/repos/PalEON-Project/composition/commits/f355f83b85994252322ee2194d54576077d38c88"}]},"public":true,"created_at":"2015-01-01T01:01:47Z","org":{"id":5016491,"login":"PalEON-Project","gravatar_id":"","url":"https://api.github.com/orgs/PalEON-Project","avatar_url":"https://avatars.githubusercontent.com/u/5016491?"}}
{"id":"2489396657","type":"PushEvent","actor":{"id":3495129,"login":"sundaymtn","gravatar_id":"","url":"https://api.github.com/users/sundaymtn","avatar_url":"https://avatars.githubusercontent.com/u/3495129?"},"repo":{"id":24147122,"name":"sundaymtn/waterline","url":"https://api.github.com/repos/sundaymtn/waterline"},"payload":{"push_id":536752591,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b0598d6ba34d42ad8cfe6b10a7567951ede389a0","before":"44753191dc8f615ccda4f0afe31a09342172cfe4","commits":[{"sha":"b0598d6ba34d42ad8cfe6b10a7567951ede389a0","author":{"email":"7fbc091194a9488bfb16868527a7c3a8ba469dba@gmail.com","name":"Seth Carter"},"message":"[skip ci] updated waterline data","distinct":true,"url":"https://api.github.com/repos/sundaymtn/waterline/commits/b0598d6ba34d42ad8cfe6b10a7567951ede389a0"}]},"public":true,"created_at":"2015-01-01T01:01:48Z"}
{"id":"2489396659","type":"PushEvent","actor":{"id":10345916,"login":"robelgeda","gravatar_id":"","url":"https://api.github.com/users/robelgeda","avatar_url":"https://avatars.githubusercontent.com/u/10345916?"},"repo":{"id":28621069,"name":"robelgeda/robelgeda","url":"https://api.github.com/repos/robelgeda/robelgeda"},"payload":{"push_id":536752593,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"e454e00c6264adc11f7f0099e438399d8a5a88c8","before":"86b6e2201b0f4fc2256234b9bfea74873e21ed90","commits":[{"sha":"e454e00c6264adc11f7f0099e438399d8a5a88c8","author":{"email":"26dc263e33784ddd01201ac6953f5dcb1af40498@yahoo.com","name":"robelgeda"},"message":"New stuff","distinct":true,"url":"https://api.github.com/repos/robelgeda/robelgeda/commits/e454e00c6264adc11f7f0099e438399d8a5a88c8"}]},"public":true,"created_at":"2015-01-01T01:01:49Z"}
{"id":"2489396663","type":"WatchEvent","actor":{"id":9970148,"login":"bchoomnuan","gravatar_id":"","url":"https://api.github.com/users/bchoomnuan","avatar_url":"https://avatars.githubusercontent.com/u/9970148?"},"repo":{"id":21827146,"name":"chrislusf/weed-fs","url":"https://api.github.com/repos/chrislusf/weed-fs"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:01:50Z"}
{"id":"2489396669","type":"PushEvent","actor":{"id":7950744,"login":"dmen555","gravatar_id":"","url":"https://api.github.com/users/dmen555","avatar_url":"https://avatars.githubusercontent.com/u/7950744?"},"repo":{"id":28383621,"name":"dmen555/SleepManager","url":"https://api.github.com/repos/dmen555/SleepManager"},"payload":{"push_id":536752597,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"689e3b010ca618cbb854cfc86f1f7763c3278569","before":"867bc6099ada213768c16ab01bc3627da7b04ead","commits":[{"sha":"689e3b010ca618cbb854cfc86f1f7763c3278569","author":{"email":"d1512ec681e77465d7ece3f74330967627c1d339@gmail.com","name":"David Qian"},"message":"Patch 7.1: Completed music timer except the graphs\n\n-successfully implemented the four different types of decay functions\n-successfully implemented services\n-successfully implemented sharedpreferences","distinct":true,"url":"https://api.github.com/repos/dmen555/SleepManager/commits/689e3b010ca618cbb854cfc86f1f7763c3278569"}]},"public":true,"created_at":"2015-01-01T01:01:50Z"}
{"id":"2489396676","type":"PushEvent","actor":{"id":8548034,"login":"Mortifica","gravatar_id":"","url":"https://api.github.com/users/Mortifica","avatar_url":"https://avatars.githubusercontent.com/u/8548034?"},"repo":{"id":28653599,"name":"Mortifica/DungeonTestArea","url":"https://api.github.com/repos/Mortifica/DungeonTestArea"},"payload":{"push_id":536752599,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"24beef29c0a3c297ab998b41726b048ec4bcaf08","before":"e27d2f3c9eb7716c52e2dd8325e8d22bd5733560","commits":[{"sha":"24beef29c0a3c297ab998b41726b048ec4bcaf08","author":{"email":"c4d9a55a62f361685d2115e4dff82e20462062f9@gmail.com","name":"Josh Hanke"},"message":"update","distinct":true,"url":"https://api.github.com/repos/Mortifica/DungeonTestArea/commits/24beef29c0a3c297ab998b41726b048ec4bcaf08"}]},"public":true,"created_at":"2015-01-01T01:01:52Z"}
{"id":"2489396678","type":"PushEvent","actor":{"id":2230058,"login":"CrazyAlvaro","gravatar_id":"","url":"https://api.github.com/users/CrazyAlvaro","avatar_url":"https://avatars.githubusercontent.com/u/2230058?"},"repo":{"id":28671592,"name":"CrazyAlvaro/Coursera-Cryptography-I","url":"https://api.github.com/repos/CrazyAlvaro/Coursera-Cryptography-I"},"payload":{"push_id":536752601,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"76e0858cb983271caedcbefe194ec462269d958c","before":"6112537f4a7b0b5d0792580d8a40a7998bacbea4","commits":[{"sha":"76e0858cb983271caedcbefe194ec462269d958c","author":{"email":"dad06db06a260749086cfe9a867182e7a593fa69@gmail.com","name":"Yechen Huang"},"message":"[#85323898] Add Calendar schedule","distinct":true,"url":"https://api.github.com/repos/CrazyAlvaro/Coursera-Cryptography-I/commits/76e0858cb983271caedcbefe194ec462269d958c"}]},"public":true,"created_at":"2015-01-01T01:01:52Z"}
{"id":"2489396682","type":"PushEvent","actor":{"id":4153853,"login":"jlumijarvi","gravatar_id":"","url":"https://api.github.com/users/jlumijarvi","avatar_url":"https://avatars.githubusercontent.com/u/4153853?"},"repo":{"id":28678176,"name":"jlumijarvi/csv2xml","url":"https://api.github.com/repos/jlumijarvi/csv2xml"},"payload":{"push_id":536752605,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b3500640ddd547415a82cbc026d91be7f76ff14f","before":"c64c0c7b60fea3b7a191f3b8b39aa144d281ceba","commits":[{"sha":"b3500640ddd547415a82cbc026d91be7f76ff14f","author":{"email":"40e6fc59d2535c98bfd5d19357e20df6e95cef64@gmail.com","name":"jlumijarvi"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/jlumijarvi/csv2xml/commits/b3500640ddd547415a82cbc026d91be7f76ff14f"}]},"public":true,"created_at":"2015-01-01T01:01:53Z"}
{"id":"2489396684","type":"PushEvent","actor":{"id":3964764,"login":"elliekimpot","gravatar_id":"","url":"https://api.github.com/users/elliekimpot","avatar_url":"https://avatars.githubusercontent.com/u/3964764?"},"repo":{"id":28625867,"name":"elliekimpot/msm","url":"https://api.github.com/repos/elliekimpot/msm"},"payload":{"push_id":536752606,"size":5,"distinct_size":5,"ref":"refs/heads/feature/removed","head":"2c854302b53eef234eae379576a870f9ef9aa3bd","before":"b02f898e373a3b228ac7b5f815ffadb9a821e8f9","commits":[{"sha":"8ae5cba2d0c6e13cdbb3682fa7cc70960cd95246","author":{"email":"c6c610d4ed4672366596341ac49b62c9256ebf55@gmail.com","name":"Ellie"},"message":"pantech/debug: Drop PANTECH_MORE_DEBUGGING_INFO_ON_KERNEL\n\nSigned-off-by: Ellie <elliekimpot@gmail.com>","distinct":true,"url":"https://api.github.com/repos/elliekimpot/msm/commits/8ae5cba2d0c6e13cdbb3682fa7cc70960cd95246"},{"sha":"1fae68014e73cfc3a32fa5eca33505b011ebb7b4","author":{"email":"c6c610d4ed4672366596341ac49b62c9256ebf55@gmail.com","name":"Ellie"},"message":"Revert \"add basic CFLAGS for Krait\"\n\nThis reverts commit 0011b847c3b6a0082306b3b29077bdc9550c6dda.","distinct":true,"url":"https://api.github.com/repos/elliekimpot/msm/commits/1fae68014e73cfc3a32fa5eca33505b011ebb7b4"},{"sha":"ff109d56f2b1b87aada770208ba471ef9d085a70","author":{"email":"c6c610d4ed4672366596341ac49b62c9256ebf55@gmail.com","name":"Ellie"},"message":"pantech/debug: Drop PANTECH_DEBUG\n\nDrop following features\n* PANTECH_DEBUG_ON\n* PANTECH_DEBUG\n* PANTECH_DEBUG_SCHED_LOG\n* PANTECH_DEBUG_IRQ_LOG\n* PANTECH_DEBUG_DCVS_LOG\n* PANTECH_DEBUG_RPM_LOG\n\nSigned-off-by: Ellie <elliekimpot@gmail.com>","distinct":true,"url":"https://api.github.com/repos/elliekimpot/msm/commits/ff109d56f2b1b87aada770208ba471ef9d085a70"},{"sha":"c3d59ecafe5fda8c6776139e45c6c76eecbf046d","author":{"email":"c6c610d4ed4672366596341ac49b62c9256ebf55@gmail.com","name":"Ellie"},"message":"pantech/debug: Drop PANTECH_FS_AUTO_REPAIR\n\nSigned-off-by: Ellie 
<elliekimpot@gmail.com>","distinct":true,"url":"https://api.github.com/repos/elliekimpot/msm/commits/c3d59ecafe5fda8c6776139e45c6c76eecbf046d"},{"sha":"2c854302b53eef234eae379576a870f9ef9aa3bd","author":{"email":"c6c610d4ed4672366596341ac49b62c9256ebf55@gmail.com","name":"Ellie"},"message":"pantech/debug: Drop PANTECH_ERR_CRASH_LOGGING\n\nDop PANTECH_ERR_CRASH_LOGGING and introduce PANTECH_SYS\ndue to proper build (Solve error/mipi_sony_incell.c).\n\nSigned-off-by: Ellie <elliekimpot@gmail.com>","distinct":true,"url":"https://api.github.com/repos/elliekimpot/msm/commits/2c854302b53eef234eae379576a870f9ef9aa3bd"}]},"public":true,"created_at":"2015-01-01T01:01:53Z"}
{"id":"2489396685","type":"PushEvent","actor":{"id":8908145,"login":"jburgos1","gravatar_id":"","url":"https://api.github.com/users/jburgos1","avatar_url":"https://avatars.githubusercontent.com/u/8908145?"},"repo":{"id":25492727,"name":"jburgos1/fls1lambdas","url":"https://api.github.com/repos/jburgos1/fls1lambdas"},"payload":{"push_id":536752607,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"ffc8f8f329910df1b92686097a402204a1c6a148","before":"3b4244d64d7fe1637440dbefabfd907bbc45f696","commits":[{"sha":"ffc8f8f329910df1b92686097a402204a1c6a148","author":{"email":"a6f8acae3f5fd51a4ab59395a7512c8c769df47e@live.com","name":"Juan Burgos"},"message":"CSS Changes\n\nNo more text/box shadow\n\nyuck.","distinct":true,"url":"https://api.github.com/repos/jburgos1/fls1lambdas/commits/ffc8f8f329910df1b92686097a402204a1c6a148"}]},"public":true,"created_at":"2015-01-01T01:01:53Z"}
{"id":"2489396689","type":"ForkEvent","actor":{"id":1380147,"login":"arathael","gravatar_id":"","url":"https://api.github.com/users/arathael","avatar_url":"https://avatars.githubusercontent.com/u/1380147?"},"repo":{"id":27724993,"name":"homerjam/angular-ui-sref-fastclick","url":"https://api.github.com/repos/homerjam/angular-ui-sref-fastclick"},"payload":{"forkee":{"id":28678230,"name":"angular-ui-sref-fastclick","full_name":"arathael/angular-ui-sref-fastclick","owner":{"login":"arathael","id":1380147,"avatar_url":"https://avatars.githubusercontent.com/u/1380147?v=3","gravatar_id":"","url":"https://api.github.com/users/arathael","html_url":"https://github.com/arathael","followers_url":"https://api.github.com/users/arathael/followers","following_url":"https://api.github.com/users/arathael/following{/other_user}","gists_url":"https://api.github.com/users/arathael/gists{/gist_id}","starred_url":"https://api.github.com/users/arathael/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/arathael/subscriptions","organizations_url":"https://api.github.com/users/arathael/orgs","repos_url":"https://api.github.com/users/arathael/repos","events_url":"https://api.github.com/users/arathael/events{/privacy}","received_events_url":"https://api.github.com/users/arathael/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/arathael/angular-ui-sref-fastclick","description":"Extends ui-sref directive (part of angular-ui-router) to add fastclick style 
behaviour","fork":true,"url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick","forks_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/forks","keys_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/keys{/key_id}","collaborators_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/teams","hooks_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/hooks","issue_events_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/issues/events{/number}","events_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/events","assignees_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/assignees{/user}","branches_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/branches{/branch}","tags_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/tags","blobs_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/git/refs{/sha}","trees_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/git/trees{/sha}","statuses_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/statuses/{sha}","languages_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/languages","stargazers_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/stargazers","contributors_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/contributors","subscribers_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/subscribers","subscription_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/subscription","commits_url":"http
s://api.github.com/repos/arathael/angular-ui-sref-fastclick/commits{/sha}","git_commits_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/git/commits{/sha}","comments_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/comments{/number}","issue_comment_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/issues/comments/{number}","contents_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/contents/{+path}","compare_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/compare/{base}...{head}","merges_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/merges","archive_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/downloads","issues_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/issues{/number}","pulls_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/pulls{/number}","milestones_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/milestones{/number}","notifications_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/labels{/name}","releases_url":"https://api.github.com/repos/arathael/angular-ui-sref-fastclick/releases{/id}","created_at":"2015-01-01T01:01:53Z","updated_at":"2015-01-01T00:56:57Z","pushed_at":"2014-12-08T16:59:03Z","git_url":"git://github.com/arathael/angular-ui-sref-fastclick.git","ssh_url":"git@github.com:arathael/angular-ui-sref-fastclick.git","clone_url":"https://github.com/arathael/angular-ui-sref-fastclick.git","svn_url":"https://github.com/arathael/angular-ui-sref-fastclick","homepage":"","size":116,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_page
s":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:01:54Z"}
{"id":"2489396690","type":"IssuesEvent","actor":{"id":305455,"login":"mykmelez","gravatar_id":"","url":"https://api.github.com/users/mykmelez","avatar_url":"https://avatars.githubusercontent.com/u/305455?"},"repo":{"id":15485479,"name":"facelessuser/TabsExtra","url":"https://api.github.com/repos/facelessuser/TabsExtra"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/facelessuser/TabsExtra/issues/21","labels_url":"https://api.github.com/repos/facelessuser/TabsExtra/issues/21/labels{/name}","comments_url":"https://api.github.com/repos/facelessuser/TabsExtra/issues/21/comments","events_url":"https://api.github.com/repos/facelessuser/TabsExtra/issues/21/events","html_url":"https://github.com/facelessuser/TabsExtra/issues/21","id":53210194,"number":21,"title":"\"reopen closed file\" moves reopened tab to the right of its previous location","user":{"login":"mykmelez","id":305455,"avatar_url":"https://avatars.githubusercontent.com/u/305455?v=3","gravatar_id":"","url":"https://api.github.com/users/mykmelez","html_url":"https://github.com/mykmelez","followers_url":"https://api.github.com/users/mykmelez/followers","following_url":"https://api.github.com/users/mykmelez/following{/other_user}","gists_url":"https://api.github.com/users/mykmelez/gists{/gist_id}","starred_url":"https://api.github.com/users/mykmelez/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/mykmelez/subscriptions","organizations_url":"https://api.github.com/users/mykmelez/orgs","repos_url":"https://api.github.com/users/mykmelez/repos","events_url":"https://api.github.com/users/mykmelez/events{/privacy}","received_events_url":"https://api.github.com/users/mykmelez/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:01:54Z","updated_at":"2015-01-01T01:01:54Z","closed_at":null,"body":"I like *fallback_focus* set to `right`, which is why I found 
and installed TabsExtra! But there's an issue with it: if you \"reopen closed file\", the reopened tab doesn't go back to its previous position on the tab bar. Instead, it jumps one position to the right.\r\n\r\nSteps to Reproduce:\r\n\r\n1. Open three tabs, A, B, and C, in that order.\r\n2. Activate tab B (the middle tab) and then close it (Cmd-W on my Mac).\r\n3. Reopen it (Cmd-Shift-T).\r\n\r\nB should reopen between A and C, which is where it was before; but instead it reopens to the right of C!\r\n"}},"public":true,"created_at":"2015-01-01T01:01:54Z"}
{"id":"2489396699","type":"PushEvent","actor":{"id":458272,"login":"tomalexander","gravatar_id":"","url":"https://api.github.com/users/tomalexander","avatar_url":"https://avatars.githubusercontent.com/u/458272?"},"repo":{"id":28367645,"name":"tomalexander/basic_multi_bot","url":"https://api.github.com/repos/tomalexander/basic_multi_bot"},"payload":{"push_id":536752612,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"bcc7dd7ee5550ef6d71e14b4d4c587477f71a3dc","before":"d299ad2b913fffa66512180cd642e89cca3db789","commits":[{"sha":"bcc7dd7ee5550ef6d71e14b4d4c587477f71a3dc","author":{"email":"a09a620e88c0ebee24434030b77c3b58d8242b71@gmail.com","name":"Tom Alexander"},"message":"switched to single instances of delegates and delegates determining rooms","distinct":true,"url":"https://api.github.com/repos/tomalexander/basic_multi_bot/commits/bcc7dd7ee5550ef6d71e14b4d4c587477f71a3dc"}]},"public":true,"created_at":"2015-01-01T01:01:55Z"}
{"id":"2489396700","type":"IssuesEvent","actor":{"id":640745,"login":"bchurchill","gravatar_id":"","url":"https://api.github.com/users/bchurchill","avatar_url":"https://avatars.githubusercontent.com/u/640745?"},"repo":{"id":2747319,"name":"eschkufz/cpputil","url":"https://api.github.com/repos/eschkufz/cpputil"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/eschkufz/cpputil/issues/21","labels_url":"https://api.github.com/repos/eschkufz/cpputil/issues/21/labels{/name}","comments_url":"https://api.github.com/repos/eschkufz/cpputil/issues/21/comments","events_url":"https://api.github.com/repos/eschkufz/cpputil/issues/21/events","html_url":"https://github.com/eschkufz/cpputil/issues/21","id":52613427,"number":21,"title":"Get string representation of bitstring","user":{"login":"bchurchill","id":640745,"avatar_url":"https://avatars.githubusercontent.com/u/640745?v=3","gravatar_id":"","url":"https://api.github.com/users/bchurchill","html_url":"https://github.com/bchurchill","followers_url":"https://api.github.com/users/bchurchill/followers","following_url":"https://api.github.com/users/bchurchill/following{/other_user}","gists_url":"https://api.github.com/users/bchurchill/gists{/gist_id}","starred_url":"https://api.github.com/users/bchurchill/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/bchurchill/subscriptions","organizations_url":"https://api.github.com/users/bchurchill/orgs","repos_url":"https://api.github.com/users/bchurchill/repos","events_url":"https://api.github.com/users/bchurchill/events{/privacy}","received_events_url":"https://api.github.com/users/bchurchill/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":{"login":"bchurchill","id":640745,"avatar_url":"https://avatars.githubusercontent.com/u/640745?v=3","gravatar_id":"","url":"https://api.github.com/users/bchurchill","html_url":"https://github.com/bchurchill","followers_url":"https://api.github.com/u
sers/bchurchill/followers","following_url":"https://api.github.com/users/bchurchill/following{/other_user}","gists_url":"https://api.github.com/users/bchurchill/gists{/gist_id}","starred_url":"https://api.github.com/users/bchurchill/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/bchurchill/subscriptions","organizations_url":"https://api.github.com/users/bchurchill/orgs","repos_url":"https://api.github.com/users/bchurchill/repos","events_url":"https://api.github.com/users/bchurchill/events{/privacy}","received_events_url":"https://api.github.com/users/bchurchill/received_events","type":"User","site_admin":false},"milestone":null,"comments":2,"created_at":"2014-12-22T01:47:57Z","updated_at":"2015-01-01T01:01:55Z","closed_at":"2015-01-01T01:01:55Z","body":"It would be nice to have a way to get a base-16 string representation of the contents of a bitstring."}},"public":true,"created_at":"2015-01-01T01:01:56Z"}
{"id":"2489396702","type":"CreateEvent","actor":{"id":543483,"login":"rockdragon","gravatar_id":"","url":"https://api.github.com/users/rockdragon","avatar_url":"https://avatars.githubusercontent.com/u/543483?"},"repo":{"id":28678231,"name":"rockdragon/SocketChat","url":"https://api.github.com/repos/rockdragon/SocketChat"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"Chat room scaffolding","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:01:56Z"}
{"id":"2489396701","type":"IssueCommentEvent","actor":{"id":640745,"login":"bchurchill","gravatar_id":"","url":"https://api.github.com/users/bchurchill","avatar_url":"https://avatars.githubusercontent.com/u/640745?"},"repo":{"id":2747319,"name":"eschkufz/cpputil","url":"https://api.github.com/repos/eschkufz/cpputil"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/eschkufz/cpputil/issues/21","labels_url":"https://api.github.com/repos/eschkufz/cpputil/issues/21/labels{/name}","comments_url":"https://api.github.com/repos/eschkufz/cpputil/issues/21/comments","events_url":"https://api.github.com/repos/eschkufz/cpputil/issues/21/events","html_url":"https://github.com/eschkufz/cpputil/issues/21","id":52613427,"number":21,"title":"Get string representation of bitstring","user":{"login":"bchurchill","id":640745,"avatar_url":"https://avatars.githubusercontent.com/u/640745?v=3","gravatar_id":"","url":"https://api.github.com/users/bchurchill","html_url":"https://github.com/bchurchill","followers_url":"https://api.github.com/users/bchurchill/followers","following_url":"https://api.github.com/users/bchurchill/following{/other_user}","gists_url":"https://api.github.com/users/bchurchill/gists{/gist_id}","starred_url":"https://api.github.com/users/bchurchill/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/bchurchill/subscriptions","organizations_url":"https://api.github.com/users/bchurchill/orgs","repos_url":"https://api.github.com/users/bchurchill/repos","events_url":"https://api.github.com/users/bchurchill/events{/privacy}","received_events_url":"https://api.github.com/users/bchurchill/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":{"login":"bchurchill","id":640745,"avatar_url":"https://avatars.githubusercontent.com/u/640745?v=3","gravatar_id":"","url":"https://api.github.com/users/bchurchill","html_url":"https://github.com/bchurchill","followers_url":"https://api.githu
b.com/users/bchurchill/followers","following_url":"https://api.github.com/users/bchurchill/following{/other_user}","gists_url":"https://api.github.com/users/bchurchill/gists{/gist_id}","starred_url":"https://api.github.com/users/bchurchill/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/bchurchill/subscriptions","organizations_url":"https://api.github.com/users/bchurchill/orgs","repos_url":"https://api.github.com/users/bchurchill/repos","events_url":"https://api.github.com/users/bchurchill/events{/privacy}","received_events_url":"https://api.github.com/users/bchurchill/received_events","type":"User","site_admin":false},"milestone":null,"comments":2,"created_at":"2014-12-22T01:47:57Z","updated_at":"2015-01-01T01:01:55Z","closed_at":"2015-01-01T01:01:55Z","body":"It would be nice to have a way to get a base-16 string representation of the contents of a bitstring."},"comment":{"url":"https://api.github.com/repos/eschkufz/cpputil/issues/comments/68477253","html_url":"https://github.com/eschkufz/cpputil/issues/21#issuecomment-68477253","issue_url":"https://api.github.com/repos/eschkufz/cpputil/issues/21","id":68477253,"user":{"login":"bchurchill","id":640745,"avatar_url":"https://avatars.githubusercontent.com/u/640745?v=3","gravatar_id":"","url":"https://api.github.com/users/bchurchill","html_url":"https://github.com/bchurchill","followers_url":"https://api.github.com/users/bchurchill/followers","following_url":"https://api.github.com/users/bchurchill/following{/other_user}","gists_url":"https://api.github.com/users/bchurchill/gists{/gist_id}","starred_url":"https://api.github.com/users/bchurchill/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/bchurchill/subscriptions","organizations_url":"https://api.github.com/users/bchurchill/orgs","repos_url":"https://api.github.com/users/bchurchill/repos","events_url":"https://api.github.com/users/bchurchill/events{/privacy}","received_events_url":"https://api.github.com/users/bch
urchill/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:01:55Z","updated_at":"2015-01-01T01:01:55Z","body":"That's slick.  But I don't need this anymore because I'm not using these for constant SymBitVectors.  Closing."}},"public":true,"created_at":"2015-01-01T01:01:56Z"}
{"id":"2489396705","type":"DeleteEvent","actor":{"id":10263666,"login":"katiekroik","gravatar_id":"","url":"https://api.github.com/users/katiekroik","avatar_url":"https://avatars.githubusercontent.com/u/10263666?"},"repo":{"id":28677679,"name":"jl4282/swirlwebsite","url":"https://api.github.com/repos/jl4282/swirlwebsite"},"payload":{"ref":"Develop","ref_type":"branch","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:01:57Z"}
{"id":"2489396707","type":"PushEvent","actor":{"id":8962953,"login":"kutlass","gravatar_id":"","url":"https://api.github.com/users/kutlass","avatar_url":"https://avatars.githubusercontent.com/u/8962953?"},"repo":{"id":24609481,"name":"kutlass/YogaFrame","url":"https://api.github.com/repos/kutlass/YogaFrame"},"payload":{"push_id":536752614,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"84fb78bea76b0c5933953a897540a10122b3fba6","before":"38aff9c324f9ad1e211195a00bf70ca0c84cb2d9","commits":[{"sha":"84fb78bea76b0c5933953a897540a10122b3fba6","author":{"email":"f1f30ec1cfc7458c34a4cc74fc6809cf46b6b758@yogaframe.net","name":"Karl Flores"},"message":"Change return type from Dispatch to a JSession for WebPostJSession API.","distinct":true,"url":"https://api.github.com/repos/kutlass/YogaFrame/commits/84fb78bea76b0c5933953a897540a10122b3fba6"}]},"public":true,"created_at":"2015-01-01T01:01:57Z"}
{"id":"2489396710","type":"PushEvent","actor":{"id":3386273,"login":"david-ragazzi","gravatar_id":"","url":"https://api.github.com/users/david-ragazzi","avatar_url":"https://avatars.githubusercontent.com/u/3386273?"},"repo":{"id":18156369,"name":"david-ragazzi/nupic","url":"https://api.github.com/repos/david-ragazzi/nupic"},"payload":{"push_id":536752616,"size":1,"distinct_size":1,"ref":"refs/heads/move_testpyhtm_to_nupiccore","head":"61cd06671a19147d11da4c23d5d9fbe811e73124","before":"f64e0e47e581048266793e22ff005600cc5a5f9f","commits":[{"sha":"61cd06671a19147d11da4c23d5d9fbe811e73124","author":{"email":"9f810c70f0453cb6f7cc60219cf23ba543fb72b1@hotmail.com","name":"DavidRagazzi"},"message":"Remove HtmTest and call it from nupic.core binaries","distinct":true,"url":"https://api.github.com/repos/david-ragazzi/nupic/commits/61cd06671a19147d11da4c23d5d9fbe811e73124"}]},"public":true,"created_at":"2015-01-01T01:01:57Z"}
{"id":"2489396712","type":"PushEvent","actor":{"id":226950,"login":"chotchki","gravatar_id":"","url":"https://api.github.com/users/chotchki","avatar_url":"https://avatars.githubusercontent.com/u/226950?"},"repo":{"id":28649464,"name":"chotchki/Henge","url":"https://api.github.com/repos/chotchki/Henge"},"payload":{"push_id":536752617,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"60a6ee7b0f57de246ed67a5e8d3f18bfd353d43a","before":"0b6b908abb4f0380f136ebd5f5a2cafb76364ad5","commits":[{"sha":"95124fea28815ccfa0300470d3ac447ff351f8a2","author":{"email":"4cb429e61173bad4e4892a8806f74a746a9d9e4a@gmail.com","name":"Christopher Hotchkiss"},"message":"Adding skeleton classes for startup","distinct":true,"url":"https://api.github.com/repos/chotchki/Henge/commits/95124fea28815ccfa0300470d3ac447ff351f8a2"},{"sha":"60a6ee7b0f57de246ed67a5e8d3f18bfd353d43a","author":{"email":"4cb429e61173bad4e4892a8806f74a746a9d9e4a@gmail.com","name":"Christopher Hotchkiss"},"message":"Merge branch 'master' of ssh://git@github.com/chotchki/Henge.git","distinct":true,"url":"https://api.github.com/repos/chotchki/Henge/commits/60a6ee7b0f57de246ed67a5e8d3f18bfd353d43a"}]},"public":true,"created_at":"2015-01-01T01:01:57Z"}
{"id":"2489396713","type":"IssueCommentEvent","actor":{"id":8903402,"login":"oncomangus","gravatar_id":"","url":"https://api.github.com/users/oncomangus","avatar_url":"https://avatars.githubusercontent.com/u/8903402?"},"repo":{"id":26731988,"name":"badrsony/icloudin-support-","url":"https://api.github.com/repos/badrsony/icloudin-support-"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/4","labels_url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/4/labels{/name}","comments_url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/4/comments","events_url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/4/events","html_url":"https://github.com/badrsony/icloudin-support-/issues/4","id":50920400,"number":4,"title":"icloudin support ","user":{"login":"badrsony","id":7895050,"avatar_url":"https://avatars.githubusercontent.com/u/7895050?v=3","gravatar_id":"","url":"https://api.github.com/users/badrsony","html_url":"https://github.com/badrsony","followers_url":"https://api.github.com/users/badrsony/followers","following_url":"https://api.github.com/users/badrsony/following{/other_user}","gists_url":"https://api.github.com/users/badrsony/gists{/gist_id}","starred_url":"https://api.github.com/users/badrsony/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/badrsony/subscriptions","organizations_url":"https://api.github.com/users/badrsony/orgs","repos_url":"https://api.github.com/users/badrsony/repos","events_url":"https://api.github.com/users/badrsony/events{/privacy}","received_events_url":"https://api.github.com/users/badrsony/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":996,"created_at":"2014-12-04T02:13:39Z","updated_at":"2015-01-01T01:01:58Z","closed_at":"2015-01-01T00:00:32Z","body":"Originally written by @TTMTT. 
That we hope for him safery and peace\r\n.\r\n\r\nWow, ipod touch 5G (8.1) - iCL0udin v1.0 bypass activation (icloud)\r\n\r\nhttp://youtu.be/tZmEdlDGNu4\r\n\r\niCL0udin v1.0 bypass activation (icloud) - ipad mini 2G (7.1.1)\r\n\r\nhttp://youtu.be/tevYyBN2QCQ\r\n\r\nVideo for bypass icloud (iCL0udin v1.0) for iphone 4 CDMA ..\r\n\r\nhttp://youtu.be/i85-D6N2YLk\r\n\r\nNew video for iCL0udin v1.0 bypass icloud (3 iphones 7.1.2):\r\n\r\nhttp://youtu.be/p51TNlCr7ug\r\n\r\niCL0udin v1.0 -> %98\r\n\r\nRemaining: %2 testing with some people..\r\n\r\nLast Method:\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any ios)\r\nmethod 3 : via (change some string by hex on ELF file << some times i got error)\r\nmethod 4 : via (use apple ssl cert or real ssl in server and change some string in iphone)\r\n\r\niCL0udin v1.0 have this method:\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any 
ios)"},"comment":{"url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/comments/68477255","html_url":"https://github.com/badrsony/icloudin-support-/issues/4#issuecomment-68477255","issue_url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/4","id":68477255,"user":{"login":"oncomangus","id":8903402,"avatar_url":"https://avatars.githubusercontent.com/u/8903402?v=3","gravatar_id":"","url":"https://api.github.com/users/oncomangus","html_url":"https://github.com/oncomangus","followers_url":"https://api.github.com/users/oncomangus/followers","following_url":"https://api.github.com/users/oncomangus/following{/other_user}","gists_url":"https://api.github.com/users/oncomangus/gists{/gist_id}","starred_url":"https://api.github.com/users/oncomangus/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/oncomangus/subscriptions","organizations_url":"https://api.github.com/users/oncomangus/orgs","repos_url":"https://api.github.com/users/oncomangus/repos","events_url":"https://api.github.com/users/oncomangus/events{/privacy}","received_events_url":"https://api.github.com/users/oncomangus/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:01:58Z","updated_at":"2015-01-01T01:01:58Z","body":"@All HAPPY NEW ICLOUD YEAR #cheers #coffee"}},"public":true,"created_at":"2015-01-01T01:01:58Z"}
{"id":"2489396720","type":"PushEvent","actor":{"id":41057,"login":"samv","gravatar_id":"","url":"https://api.github.com/users/samv","avatar_url":"https://avatars.githubusercontent.com/u/41057?"},"repo":{"id":16792286,"name":"hearsaycorp/normalize","url":"https://api.github.com/repos/hearsaycorp/normalize"},"payload":{"push_id":536752624,"size":2,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"20f0f9bbc6dd3bc111019fb985fc42d28a9814ee","before":"3e040e2c4d617beb145074a21cac1402edcea35c","commits":[{"sha":"2f0df332bf4a1e963296f545802cf7497ac20ff8","author":{"email":"f16bed56189e249fe4ca8ed10a1ecae60e8ceac0@vilain.net","name":"Sam Vilain"},"message":"Implement FieldSelector.delete\n\nAll 4 CRUD operations now supported :)","distinct":false,"url":"https://api.github.com/repos/hearsaycorp/normalize/commits/2f0df332bf4a1e963296f545802cf7497ac20ff8"},{"sha":"20f0f9bbc6dd3bc111019fb985fc42d28a9814ee","author":{"email":"f16bed56189e249fe4ca8ed10a1ecae60e8ceac0@vilain.net","name":"Sam Vilain"},"message":"Update sphinx docs to commit 0.6.3-1-g2f0df33","distinct":true,"url":"https://api.github.com/repos/hearsaycorp/normalize/commits/20f0f9bbc6dd3bc111019fb985fc42d28a9814ee"}]},"public":true,"created_at":"2015-01-01T01:01:59Z","org":{"id":633032,"login":"hearsaycorp","gravatar_id":"","url":"https://api.github.com/orgs/hearsaycorp","avatar_url":"https://avatars.githubusercontent.com/u/633032?"}}
{"id":"2489396721","type":"PullRequestReviewCommentEvent","actor":{"id":3103764,"login":"carymrobbins","gravatar_id":"","url":"https://api.github.com/users/carymrobbins","avatar_url":"https://avatars.githubusercontent.com/u/3103764?"},"repo":{"id":15573192,"name":"carymrobbins/intellij-haskforce","url":"https://api.github.com/repos/carymrobbins/intellij-haskforce"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/comments/22397260","id":22397260,"diff_hunk":"@@ -0,0 +1,53 @@\n+package com.haskforce.highlighting.annotation.external;\n+\n+import com.intellij.openapi.editor.LogicalPosition;\n+import com.intellij.openapi.editor.VisualPosition;\n+import org.junit.Assert;\n+import org.junit.Test;\n+\n+/**\n+ * Created by kasper on 12/24/14.\n+ */\n+public class GhcUtilTest {","path":"tests/com/haskforce/highlighting/annotation/external/GhcUtilTest.java","position":11,"original_position":11,"commit_id":"73ec576f11ba5aa0906e1ca03bc9390ca94b40e2","original_commit_id":"73ec576f11ba5aa0906e1ca03bc9390ca94b40e2","user":{"login":"carymrobbins","id":3103764,"avatar_url":"https://avatars.githubusercontent.com/u/3103764?v=3","gravatar_id":"","url":"https://api.github.com/users/carymrobbins","html_url":"https://github.com/carymrobbins","followers_url":"https://api.github.com/users/carymrobbins/followers","following_url":"https://api.github.com/users/carymrobbins/following{/other_user}","gists_url":"https://api.github.com/users/carymrobbins/gists{/gist_id}","starred_url":"https://api.github.com/users/carymrobbins/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/carymrobbins/subscriptions","organizations_url":"https://api.github.com/users/carymrobbins/orgs","repos_url":"https://api.github.com/users/carymrobbins/repos","events_url":"https://api.github.com/users/carymrobbins/events{/privacy}","received_events_url":"https://api.github.com/users/carymrobbins/received_events","type":"User","site_admi
n":false},"body":"Nice!  Thanks for adding tests.  Be sure to add this class to **tests/com/haskforce/HaskellTestCase.java**","created_at":"2015-01-01T01:02:00Z","updated_at":"2015-01-01T01:02:00Z","html_url":"https://github.com/carymrobbins/intellij-haskforce/pull/105#discussion_r22397260","pull_request_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105","_links":{"self":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/comments/22397260"},"html":{"href":"https://github.com/carymrobbins/intellij-haskforce/pull/105#discussion_r22397260"},"pull_request":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105"}}},"pull_request":{"url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105","id":26615813,"html_url":"https://github.com/carymrobbins/intellij-haskforce/pull/105","diff_url":"https://github.com/carymrobbins/intellij-haskforce/pull/105.diff","patch_url":"https://github.com/carymrobbins/intellij-haskforce/pull/105.patch","issue_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/105","number":105,"state":"open","locked":false,"title":"Issue90 type 
information","user":{"login":"KasperJanssens","id":5415995,"avatar_url":"https://avatars.githubusercontent.com/u/5415995?v=3","gravatar_id":"","url":"https://api.github.com/users/KasperJanssens","html_url":"https://github.com/KasperJanssens","followers_url":"https://api.github.com/users/KasperJanssens/followers","following_url":"https://api.github.com/users/KasperJanssens/following{/other_user}","gists_url":"https://api.github.com/users/KasperJanssens/gists{/gist_id}","starred_url":"https://api.github.com/users/KasperJanssens/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/KasperJanssens/subscriptions","organizations_url":"https://api.github.com/users/KasperJanssens/orgs","repos_url":"https://api.github.com/users/KasperJanssens/repos","events_url":"https://api.github.com/users/KasperJanssens/events{/privacy}","received_events_url":"https://api.github.com/users/KasperJanssens/received_events","type":"User","site_admin":false},"body":"Cary,\r\n\r\nFirst try of the type information. It seems quite stable, been using it for a few days (provided the configuration is correct, I suppose, didn't test what happens when ghc-modi is not correctly configured).\r\n\r\nI bound the type info call to the DocumentationProvider as well as to an action (alt - equals, like scala). I prefer the action, I think the documentation provider doesn't work so well. There are tests of the parsing of the output of ghc-modi, but not really of the documentationprovider, basically because of the abundance of static calls and the fact that I think they can only be mocked while testing, and statics can only be mocked through Powermock if I recall correctly, which would mean an extra test dependency and so on and so forth, so I left that to be your call.\r\n\r\nAlso, there is a weird behaviour that getting the editor creates a stack trace of around 5 kilometers long, something that seems like a threading issue, but the function seems to work. 
I don't really know why the stack trace happens, all the more because it only happens when calling the type information through the documentation provider (same code path is used when the action is called, but no stack trace). Maybe you know more what could go wrong, it looks like something intellij-related.\r\n\r\nSo, consider this a \"request for comment\" more than a pull request ;-)\r\n\r\nKasper","created_at":"2014-12-27T16:19:07Z","updated_at":"2015-01-01T01:02:00Z","closed_at":null,"merged_at":null,"merge_commit_sha":"b32a5f3ef0bc14eebea4baa946ec2e66008086dd","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105/commits","review_comments_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105/comments","review_comment_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/comments/{number}","comments_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/105/comments","statuses_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/statuses/73ec576f11ba5aa0906e1ca03bc9390ca94b40e2","head":{"label":"KasperJanssens:issue90TypeInformation","ref":"issue90TypeInformation","sha":"73ec576f11ba5aa0906e1ca03bc9390ca94b40e2","user":{"login":"KasperJanssens","id":5415995,"avatar_url":"https://avatars.githubusercontent.com/u/5415995?v=3","gravatar_id":"","url":"https://api.github.com/users/KasperJanssens","html_url":"https://github.com/KasperJanssens","followers_url":"https://api.github.com/users/KasperJanssens/followers","following_url":"https://api.github.com/users/KasperJanssens/following{/other_user}","gists_url":"https://api.github.com/users/KasperJanssens/gists{/gist_id}","starred_url":"https://api.github.com/users/KasperJanssens/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/KasperJanssens/subscriptions","organizations_url":"https://api.github.com/users/KasperJanssens/orgs","repos_url":"https://api.github
.com/users/KasperJanssens/repos","events_url":"https://api.github.com/users/KasperJanssens/events{/privacy}","received_events_url":"https://api.github.com/users/KasperJanssens/received_events","type":"User","site_admin":false},"repo":{"id":28540684,"name":"intellij-haskforce","full_name":"KasperJanssens/intellij-haskforce","owner":{"login":"KasperJanssens","id":5415995,"avatar_url":"https://avatars.githubusercontent.com/u/5415995?v=3","gravatar_id":"","url":"https://api.github.com/users/KasperJanssens","html_url":"https://github.com/KasperJanssens","followers_url":"https://api.github.com/users/KasperJanssens/followers","following_url":"https://api.github.com/users/KasperJanssens/following{/other_user}","gists_url":"https://api.github.com/users/KasperJanssens/gists{/gist_id}","starred_url":"https://api.github.com/users/KasperJanssens/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/KasperJanssens/subscriptions","organizations_url":"https://api.github.com/users/KasperJanssens/orgs","repos_url":"https://api.github.com/users/KasperJanssens/repos","events_url":"https://api.github.com/users/KasperJanssens/events{/privacy}","received_events_url":"https://api.github.com/users/KasperJanssens/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/KasperJanssens/intellij-haskforce","description":"Haskell plugin for IntelliJ IDEA Community 
Edition","fork":true,"url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce","forks_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/forks","keys_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/keys{/key_id}","collaborators_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/teams","hooks_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/hooks","issue_events_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/issues/events{/number}","events_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/events","assignees_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/assignees{/user}","branches_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/branches{/branch}","tags_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/tags","blobs_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/git/refs{/sha}","trees_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/git/trees{/sha}","statuses_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/statuses/{sha}","languages_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/languages","stargazers_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/stargazers","contributors_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/contributors","subscribers_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/subscribers","subscription_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/subscription","commits_url":"https://api.github.com/repo
s/KasperJanssens/intellij-haskforce/commits{/sha}","git_commits_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/git/commits{/sha}","comments_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/comments{/number}","issue_comment_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/issues/comments/{number}","contents_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/contents/{+path}","compare_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/compare/{base}...{head}","merges_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/merges","archive_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/downloads","issues_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/issues{/number}","pulls_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/pulls{/number}","milestones_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/milestones{/number}","notifications_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/labels{/name}","releases_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/releases{/id}","created_at":"2014-12-27T16:11:01Z","updated_at":"2014-12-27T16:11:03Z","pushed_at":"2014-12-31T15:44:48Z","git_url":"git://github.com/KasperJanssens/intellij-haskforce.git","ssh_url":"git@github.com:KasperJanssens/intellij-haskforce.git","clone_url":"https://github.com/KasperJanssens/intellij-haskforce.git","svn_url":"https://github.com/KasperJanssens/intellij-haskforce","homepage":"http://carymrobbins.github.io/intellij-haskforce/","size":7553,"stargazers_count":0,"watchers_count":0,"language":"Java","has_issues":false,"has_downloads":true,"has_wiki":true
,"has_pages":true,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"carymrobbins:master","ref":"master","sha":"19442eb58293650dc699e30ccf2d5482e1c688d8","user":{"login":"carymrobbins","id":3103764,"avatar_url":"https://avatars.githubusercontent.com/u/3103764?v=3","gravatar_id":"","url":"https://api.github.com/users/carymrobbins","html_url":"https://github.com/carymrobbins","followers_url":"https://api.github.com/users/carymrobbins/followers","following_url":"https://api.github.com/users/carymrobbins/following{/other_user}","gists_url":"https://api.github.com/users/carymrobbins/gists{/gist_id}","starred_url":"https://api.github.com/users/carymrobbins/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/carymrobbins/subscriptions","organizations_url":"https://api.github.com/users/carymrobbins/orgs","repos_url":"https://api.github.com/users/carymrobbins/repos","events_url":"https://api.github.com/users/carymrobbins/events{/privacy}","received_events_url":"https://api.github.com/users/carymrobbins/received_events","type":"User","site_admin":false},"repo":{"id":15573192,"name":"intellij-haskforce","full_name":"carymrobbins/intellij-haskforce","owner":{"login":"carymrobbins","id":3103764,"avatar_url":"https://avatars.githubusercontent.com/u/3103764?v=3","gravatar_id":"","url":"https://api.github.com/users/carymrobbins","html_url":"https://github.com/carymrobbins","followers_url":"https://api.github.com/users/carymrobbins/followers","following_url":"https://api.github.com/users/carymrobbins/following{/other_user}","gists_url":"https://api.github.com/users/carymrobbins/gists{/gist_id}","starred_url":"https://api.github.com/users/carymrobbins/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/carymrobbins/subscriptions","organizations_url":"https://api.github.com/users/carymrobbins/orgs","repos_url":"https://api.github.com/users/carymrobbins/r
epos","events_url":"https://api.github.com/users/carymrobbins/events{/privacy}","received_events_url":"https://api.github.com/users/carymrobbins/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/carymrobbins/intellij-haskforce","description":"Haskell plugin for IntelliJ IDEA Community Edition","fork":false,"url":"https://api.github.com/repos/carymrobbins/intellij-haskforce","forks_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/forks","keys_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/keys{/key_id}","collaborators_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/teams","hooks_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/hooks","issue_events_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/events{/number}","events_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/events","assignees_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/assignees{/user}","branches_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/branches{/branch}","tags_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/tags","blobs_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/git/refs{/sha}","trees_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/git/trees{/sha}","statuses_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/statuses/{sha}","languages_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/languages","stargazers_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/stargazers","contributors_url":"https://api.
github.com/repos/carymrobbins/intellij-haskforce/contributors","subscribers_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/subscribers","subscription_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/subscription","commits_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/commits{/sha}","git_commits_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/git/commits{/sha}","comments_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/comments{/number}","issue_comment_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/comments/{number}","contents_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/contents/{+path}","compare_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/compare/{base}...{head}","merges_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/merges","archive_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/downloads","issues_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues{/number}","pulls_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls{/number}","milestones_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/milestones{/number}","notifications_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/labels{/name}","releases_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/releases{/id}","created_at":"2014-01-02T01:28:54Z","updated_at":"2014-12-30T16:15:50Z","pushed_at":"2014-12-27T04:28:50Z","git_url":"git://github.com/carymrobbins/intellij-haskforce.git","ssh_url":"git@github.com:carymrobbins/intellij-haskforce.git","clone_url":"https://github.com/carymrobbins/intellij-haskforce.g
it","svn_url":"https://github.com/carymrobbins/intellij-haskforce","homepage":"http://carymrobbins.github.io/intellij-haskforce/","size":11390,"stargazers_count":159,"watchers_count":159,"language":"Java","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":9,"mirror_url":null,"open_issues_count":30,"forks":9,"open_issues":30,"watchers":159,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105"},"html":{"href":"https://github.com/carymrobbins/intellij-haskforce/pull/105"},"issue":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/105"},"comments":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/105/comments"},"review_comments":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105/comments"},"review_comment":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105/commits"},"statuses":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/statuses/73ec576f11ba5aa0906e1ca03bc9390ca94b40e2"}}}},"public":true,"created_at":"2015-01-01T01:02:00Z"}
{"id":"2489396724","type":"PushEvent","actor":{"id":280212,"login":"KenanSulayman","gravatar_id":"","url":"https://api.github.com/users/KenanSulayman","avatar_url":"https://avatars.githubusercontent.com/u/280212?"},"repo":{"id":21481110,"name":"KenanSulayman/heartbeat","url":"https://api.github.com/repos/KenanSulayman/heartbeat"},"payload":{"push_id":536752626,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1ac37b74ae21d946dc3826883204811da6d06852","before":"f5fd8c9b5d99ba2f521c56658163b69c29eb1027","commits":[{"sha":"1ac37b74ae21d946dc3826883204811da6d06852","author":{"email":"9176253dfc0bc82671a5e984646605f93319147a@sly.mn","name":"Kenan Sulayman"},"message":"1420074118714\n\noJhRtiHmitwAmvo7xDna+E9mim307BW3xojcjXsX+6M=","distinct":true,"url":"https://api.github.com/repos/KenanSulayman/heartbeat/commits/1ac37b74ae21d946dc3826883204811da6d06852"}]},"public":true,"created_at":"2015-01-01T01:02:00Z"}
{"id":"2489396725","type":"PushEvent","actor":{"id":9515067,"login":"freundTech","gravatar_id":"","url":"https://api.github.com/users/freundTech","avatar_url":"https://avatars.githubusercontent.com/u/9515067?"},"repo":{"id":27674403,"name":"freundTech/lightDMX","url":"https://api.github.com/repos/freundTech/lightDMX"},"payload":{"push_id":536752627,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1949bbb851b79b526154c7cec6a0e7e00f1420a6","before":"def97c029096a9b41b592ae7070a651b78edcac3","commits":[{"sha":"1949bbb851b79b526154c7cec6a0e7e00f1420a6","author":{"email":"d6643dd9a6fe6114980ecaf6d787b2a0da7fc377@gmail.com","name":"Adrian"},"message":"Finished connections and made connectors their own class.","distinct":true,"url":"https://api.github.com/repos/freundTech/lightDMX/commits/1949bbb851b79b526154c7cec6a0e7e00f1420a6"}]},"public":true,"created_at":"2015-01-01T01:02:00Z"}
{"id":"2489396728","type":"PushEvent","actor":{"id":66897,"login":"asad","gravatar_id":"","url":"https://api.github.com/users/asad","avatar_url":"https://avatars.githubusercontent.com/u/66897?"},"repo":{"id":28622285,"name":"asad/ChemBLAST","url":"https://api.github.com/repos/asad/ChemBLAST"},"payload":{"push_id":536752629,"size":3,"distinct_size":3,"ref":"refs/heads/master","head":"4fd33b8625d56ca7dcda0acc38f6f51ec1358c87","before":"b41b8269e88a699180c115deb6c7ec8df44cf263","commits":[{"sha":"1f8049a2b5c2b640dc0c3577bdbbaa075c8d7827","author":{"email":"09eb4ce7c91ecff4eff21da1532c566afe7cb66c@gmail.com","name":"Syed Asad Rahman"},"message":"parallel java search implemented","distinct":true,"url":"https://api.github.com/repos/asad/ChemBLAST/commits/1f8049a2b5c2b640dc0c3577bdbbaa075c8d7827"},{"sha":"ebdea677d4adff3460a744e5c4499c42022eeca3","author":{"email":"09eb4ce7c91ecff4eff21da1532c566afe7cb66c@gmail.com","name":"Syed Asad Rahman"},"message":"parallel java search implemented","distinct":true,"url":"https://api.github.com/repos/asad/ChemBLAST/commits/ebdea677d4adff3460a744e5c4499c42022eeca3"},{"sha":"4fd33b8625d56ca7dcda0acc38f6f51ec1358c87","author":{"email":"09eb4ce7c91ecff4eff21da1532c566afe7cb66c@gmail.com","name":"Syed Asad Rahman"},"message":"4X speed up obtained with join and fork search implementation.","distinct":true,"url":"https://api.github.com/repos/asad/ChemBLAST/commits/4fd33b8625d56ca7dcda0acc38f6f51ec1358c87"}]},"public":true,"created_at":"2015-01-01T01:02:01Z"}
{"id":"2489396733","type":"PushEvent","actor":{"id":7886751,"login":"harrison0723","gravatar_id":"","url":"https://api.github.com/users/harrison0723","avatar_url":"https://avatars.githubusercontent.com/u/7886751?"},"repo":{"id":28653649,"name":"harrison0723/bloccit","url":"https://api.github.com/repos/harrison0723/bloccit"},"payload":{"push_id":536752633,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1294ea64e75c5da49f0239c796445374870a0eae","before":"63a17d0ec4d8e6a4e143fe5775b5fcc25a765b05","commits":[{"sha":"1294ea64e75c5da49f0239c796445374870a0eae","author":{"email":"cf9e7917eadcf4e1a3e8784c7f4ca5d67be0f8ad@gmail.com","name":"HarrisonLo"},"message":"Updated add layout and welcome views","distinct":true,"url":"https://api.github.com/repos/harrison0723/bloccit/commits/1294ea64e75c5da49f0239c796445374870a0eae"}]},"public":true,"created_at":"2015-01-01T01:02:02Z"}
{"id":"2489396734","type":"PushEvent","actor":{"id":5728403,"login":"patrick-hudson","gravatar_id":"","url":"https://api.github.com/users/patrick-hudson","avatar_url":"https://avatars.githubusercontent.com/u/5728403?"},"repo":{"id":25392255,"name":"patrick-hudson/EggDrop","url":"https://api.github.com/repos/patrick-hudson/EggDrop"},"payload":{"push_id":536752634,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"cb11cf77a4d9d7625c14e50c27fe61d387d2c95e","before":"6336938241e7f58f06585498f1e07b6645b86630","commits":[{"sha":"cb11cf77a4d9d7625c14e50c27fe61d387d2c95e","author":{"email":"cbb7353e6d953ef360baf960c122346276c6e320@hudson.bz","name":"Patrick Hudson"},"message":"Scripted auto-commit on change (2014-12-31 20:02:00) by gitwatch.sh","distinct":true,"url":"https://api.github.com/repos/patrick-hudson/EggDrop/commits/cb11cf77a4d9d7625c14e50c27fe61d387d2c95e"}]},"public":true,"created_at":"2015-01-01T01:02:02Z"}
{"id":"2489396740","type":"CreateEvent","actor":{"id":7989982,"login":"wxv","gravatar_id":"","url":"https://api.github.com/users/wxv","avatar_url":"https://avatars.githubusercontent.com/u/7989982?"},"repo":{"id":28678232,"name":"wxv/Items-Index","url":"https://api.github.com/repos/wxv/Items-Index"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"Historical item prices","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:02:03Z"}
{"id":"2489396741","type":"PushEvent","actor":{"id":1981539,"login":"harshiet","gravatar_id":"","url":"https://api.github.com/users/harshiet","avatar_url":"https://avatars.githubusercontent.com/u/1981539?"},"repo":{"id":28192167,"name":"harshiet/jira-reports-pro","url":"https://api.github.com/repos/harshiet/jira-reports-pro"},"payload":{"push_id":536752637,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"3f51d07d0517bbbc9fdc9ff27d615b175fd3084a","before":"8e111512bd19a9db1e99ed05e0290dbfea5de705","commits":[{"sha":"3f51d07d0517bbbc9fdc9ff27d615b175fd3084a","author":{"email":"ed07a1efef8aa439ec830948475d9a155b709cf5@gmail.com","name":"harshiet"},"message":"1","distinct":true,"url":"https://api.github.com/repos/harshiet/jira-reports-pro/commits/3f51d07d0517bbbc9fdc9ff27d615b175fd3084a"}]},"public":true,"created_at":"2015-01-01T01:02:03Z"}
{"id":"2489396747","type":"PushEvent","actor":{"id":1640798,"login":"langorn","gravatar_id":"","url":"https://api.github.com/users/langorn","avatar_url":"https://avatars.githubusercontent.com/u/1640798?"},"repo":{"id":28678190,"name":"langorn/crm","url":"https://api.github.com/repos/langorn/crm"},"payload":{"push_id":536752639,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"408cbaf7c4cc00d021d00dc14dacb8f2095c6fa3","before":"95907808683f55c40c7ce5552330d0c276921cb1","commits":[{"sha":"408cbaf7c4cc00d021d00dc14dacb8f2095c6fa3","author":{"email":"ba36a5a19299fe08d08975c8488c56bf95772e2d@gmail.com","name":"Mark"},"message":"first commit","distinct":true,"url":"https://api.github.com/repos/langorn/crm/commits/408cbaf7c4cc00d021d00dc14dacb8f2095c6fa3"}]},"public":true,"created_at":"2015-01-01T01:02:04Z"}
{"id":"2489396754","type":"CreateEvent","actor":{"id":1253444,"login":"nathan-osman","gravatar_id":"","url":"https://api.github.com/users/nathan-osman","avatar_url":"https://avatars.githubusercontent.com/u/1253444?"},"repo":{"id":28151446,"name":"nathan-osman/django-archive","url":"https://api.github.com/repos/nathan-osman/django-archive"},"payload":{"ref":"0.1.2","ref_type":"tag","master_branch":"master","description":"Management command for creating compressed archives of Django projects, including database tables and uploaded media.","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:02:06Z"}
{"id":"2489396756","type":"PushEvent","actor":{"id":9201970,"login":"qdm","gravatar_id":"","url":"https://api.github.com/users/qdm","avatar_url":"https://avatars.githubusercontent.com/u/9201970?"},"repo":{"id":25173910,"name":"qdm/qdm.github.io","url":"https://api.github.com/repos/qdm/qdm.github.io"},"payload":{"push_id":536752642,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"94683ca14e320a286452e2f2e873ff5d603f1a98","before":"05438aee0e5572a6e4adf91d7eef32917812d9e9","commits":[{"sha":"94683ca14e320a286452e2f2e873ff5d603f1a98","author":{"email":"de163e90d3aeef9f404d1de71c48e234a211e3c3@gmail.com","name":"KT"},"message":"Update","distinct":true,"url":"https://api.github.com/repos/qdm/qdm.github.io/commits/94683ca14e320a286452e2f2e873ff5d603f1a98"}]},"public":true,"created_at":"2015-01-01T01:02:06Z"}
{"id":"2489396757","type":"PushEvent","actor":{"id":31338,"login":"gak","gravatar_id":"","url":"https://api.github.com/users/gak","avatar_url":"https://avatars.githubusercontent.com/u/31338?"},"repo":{"id":28615761,"name":"PayGroove/fig","url":"https://api.github.com/repos/PayGroove/fig"},"payload":{"push_id":536752643,"size":2,"distinct_size":2,"ref":"refs/heads/templates","head":"1614c4c666c85d5447e1ae10ad81f9ece1852062","before":"c10351e1f8f17f6733a0db29aedf3b377b96fcf2","commits":[{"sha":"b91fe46a080165aa154a2b17bf0699c67010fea3","author":{"email":"bee25f9566f14bcc1d385b4a10d34d2cb725465a@gak0.com","name":"Gerald Kaszuba"},"message":"docker/fig#761 Additional template checks and bug fixes\n\nThere were a few bugs in my initial implementation:\n - Infinite recursion when referring to the same template file.\n   Implementing a class and caching previously loaded yml files handles\n   that problem.\n - Dictionaries that were updated in place where left \"dirty\". The\n   copy.copy fixes that.\n - Incorrectly configured template yml files were not throwing fig\n   exceptions.\n\nSigned-off-by: Gerald Kaszuba <gak@gak0.com>","distinct":true,"url":"https://api.github.com/repos/PayGroove/fig/commits/b91fe46a080165aa154a2b17bf0699c67010fea3"},{"sha":"1614c4c666c85d5447e1ae10ad81f9ece1852062","author":{"email":"bee25f9566f14bcc1d385b4a10d34d2cb725465a@gak0.com","name":"Gerald Kaszuba"},"message":"docker/fig#761 Added some docs for template in yml.md\n\nSigned-off-by: Gerald Kaszuba <gak@gak0.com>","distinct":true,"url":"https://api.github.com/repos/PayGroove/fig/commits/1614c4c666c85d5447e1ae10ad81f9ece1852062"}]},"public":true,"created_at":"2015-01-01T01:02:06Z","org":{"id":10135493,"login":"PayGroove","gravatar_id":"","url":"https://api.github.com/orgs/PayGroove","avatar_url":"https://avatars.githubusercontent.com/u/10135493?"}}
{"id":"2489396764","type":"PushEvent","actor":{"id":8404840,"login":"orionmelt","gravatar_id":"","url":"https://api.github.com/users/orionmelt","avatar_url":"https://avatars.githubusercontent.com/u/8404840?"},"repo":{"id":23653249,"name":"orionmelt/sherlock","url":"https://api.github.com/repos/orionmelt/sherlock"},"payload":{"push_id":536752649,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"8d16004c2185415f95881976b8245083e3b0bf1d","before":"a11d423101ce2b72d54a79e82ea92805b3590098","commits":[{"sha":"8d16004c2185415f95881976b8245083e3b0bf1d","author":{"email":"d987d5b2320ab4566c87c2023d39457639743791@gmail.com","name":"Raj"},"message":"Docstrings, comments and some renaming updates.","distinct":true,"url":"https://api.github.com/repos/orionmelt/sherlock/commits/8d16004c2185415f95881976b8245083e3b0bf1d"}]},"public":true,"created_at":"2015-01-01T01:02:07Z"}
{"id":"2489396765","type":"PushEvent","actor":{"id":1456047,"login":"kyokomi","gravatar_id":"","url":"https://api.github.com/users/kyokomi","avatar_url":"https://avatars.githubusercontent.com/u/1456047?"},"repo":{"id":25506232,"name":"kyokomi/gomajan","url":"https://api.github.com/repos/kyokomi/gomajan"},"payload":{"push_id":536752650,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"0dc0e50eb584a0f312f5f6ce1c3a85d4ddb3f62e","before":"33d7ed3c98a7cfb19ce924735a7420de0ca57ef7","commits":[{"sha":"0dc0e50eb584a0f312f5f6ce1c3a85d4ddb3f62e","author":{"email":"2ea0042be6760fbcd1e13c4e2076e1e54e82d1d5@gmail.com","name":"kyokomi"},"message":"test: 混全帯么九","distinct":true,"url":"https://api.github.com/repos/kyokomi/gomajan/commits/0dc0e50eb584a0f312f5f6ce1c3a85d4ddb3f62e"}]},"public":true,"created_at":"2015-01-01T01:02:07Z"}
{"id":"2489396766","type":"WatchEvent","actor":{"id":3344033,"login":"neverfox","gravatar_id":"","url":"https://api.github.com/users/neverfox","avatar_url":"https://avatars.githubusercontent.com/u/3344033?"},"repo":{"id":11744114,"name":"eviltrout/ember-renderspeed","url":"https://api.github.com/repos/eviltrout/ember-renderspeed"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:02:07Z"}
{"id":"2489396770","type":"PushEvent","actor":{"id":7050164,"login":"marvalgames","gravatar_id":"","url":"https://api.github.com/users/marvalgames","avatar_url":"https://avatars.githubusercontent.com/u/7050164?"},"repo":{"id":28167953,"name":"marvalgames/dead-pixels","url":"https://api.github.com/repos/marvalgames/dead-pixels"},"payload":{"push_id":536752653,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d4f2a4466aceef8bc6db2232451ba31fcd431a0a","before":"5ff63a7b9f29739457db94f530b83e6f46afb85e","commits":[{"sha":"d4f2a4466aceef8bc6db2232451ba31fcd431a0a","author":{"email":"6c18ea4526e2e66416491c4bc60d3d5a42aaebd8@gmail.com","name":"marvalgames"},"message":".28","distinct":true,"url":"https://api.github.com/repos/marvalgames/dead-pixels/commits/d4f2a4466aceef8bc6db2232451ba31fcd431a0a"}]},"public":true,"created_at":"2015-01-01T01:02:07Z"}
{"id":"2489396775","type":"PushEvent","actor":{"id":7391433,"login":"StevenXL","gravatar_id":"","url":"https://api.github.com/users/StevenXL","avatar_url":"https://avatars.githubusercontent.com/u/7391433?"},"repo":{"id":28642919,"name":"StevenXL/learntoprogram","url":"https://api.github.com/repos/StevenXL/learntoprogram"},"payload":{"push_id":536752654,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"85f31e3ddb605fe4a1bde3ddb537ab3302d4c59d","before":"5cb1eace288863132472638e17792604cbdc5443","commits":[{"sha":"85f31e3ddb605fe4a1bde3ddb537ab3302d4c59d","author":{"email":"2a2c33fb7ea332dc4f943c4fb28454a257783aab@gmail.com","name":"StevenXL"},"message":"Finished Chapter 7","distinct":true,"url":"https://api.github.com/repos/StevenXL/learntoprogram/commits/85f31e3ddb605fe4a1bde3ddb537ab3302d4c59d"}]},"public":true,"created_at":"2015-01-01T01:02:08Z"}
{"id":"2489396778","type":"CreateEvent","actor":{"id":7989982,"login":"wxv","gravatar_id":"","url":"https://api.github.com/users/wxv","avatar_url":"https://avatars.githubusercontent.com/u/7989982?"},"repo":{"id":28678232,"name":"wxv/Items-Index","url":"https://api.github.com/repos/wxv/Items-Index"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"Historical item prices","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:02:08Z"}
{"id":"2489396781","type":"PushEvent","actor":{"id":3489773,"login":"captainkirkby","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","avatar_url":"https://avatars.githubusercontent.com/u/3489773?"},"repo":{"id":15461243,"name":"captainkirkby/Gears","url":"https://api.github.com/repos/captainkirkby/Gears"},"payload":{"push_id":536752657,"size":1,"distinct_size":1,"ref":"refs/heads/#30","head":"0ce69fa19d81de656dd6a74629099a7fa9261d1c","before":"b838f0c36403eab209f3565eeb7a10375911d228","commits":[{"sha":"0ce69fa19d81de656dd6a74629099a7fa9261d1c","author":{"email":"4d1902cf1aefa3df01c59cbb9ae7db3045be42ae@gmail.com","name":"Dylan Kirkby"},"message":"Add simple C program to replay binary file","distinct":true,"url":"https://api.github.com/repos/captainkirkby/Gears/commits/0ce69fa19d81de656dd6a74629099a7fa9261d1c"}]},"public":true,"created_at":"2015-01-01T01:02:09Z"}
{"id":"2489396783","type":"PushEvent","actor":{"id":1017605,"login":"wangshan","gravatar_id":"","url":"https://api.github.com/users/wangshan","avatar_url":"https://avatars.githubusercontent.com/u/1017605?"},"repo":{"id":28666633,"name":"wangshan/wangshan.github.io","url":"https://api.github.com/repos/wangshan/wangshan.github.io"},"payload":{"push_id":536752658,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"92d20ac01b4767280cccaf71ee20f173529877a0","before":"3a5b62221723e1a468813feef26cb122942c53b1","commits":[{"sha":"92d20ac01b4767280cccaf71ee20f173529877a0","author":{"email":"e3e97680eb29c788f35181af31eb442b3251e18f@gmail.com","name":"Shan"},"message":"Update 2012-03-03-mac-development-environment-setup.md","distinct":true,"url":"https://api.github.com/repos/wangshan/wangshan.github.io/commits/92d20ac01b4767280cccaf71ee20f173529877a0"}]},"public":true,"created_at":"2015-01-01T01:02:09Z"}
{"id":"2489396785","type":"PushEvent","actor":{"id":72326,"login":"Lexikos","gravatar_id":"","url":"https://api.github.com/users/Lexikos","avatar_url":"https://avatars.githubusercontent.com/u/72326?"},"repo":{"id":28678134,"name":"Lexikos/xHotkey.ahk","url":"https://api.github.com/repos/Lexikos/xHotkey.ahk"},"payload":{"push_id":536752659,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f117c07dcb8ff33133d2da0476dfbaf70644b476","before":"8f491d820da9469ab89fe548aadc82a11f8af250","commits":[{"sha":"f117c07dcb8ff33133d2da0476dfbaf70644b476","author":{"email":"e144dba3b863bfb4ca42790332b351be659b9c7e@gmail.com","name":"Lexikos"},"message":"Fix readme","distinct":true,"url":"https://api.github.com/repos/Lexikos/xHotkey.ahk/commits/f117c07dcb8ff33133d2da0476dfbaf70644b476"}]},"public":true,"created_at":"2015-01-01T01:02:09Z"}
{"id":"2489396786","type":"IssueCommentEvent","actor":{"id":253237,"login":"Jamesking56","gravatar_id":"","url":"https://api.github.com/users/Jamesking56","avatar_url":"https://avatars.githubusercontent.com/u/253237?"},"repo":{"id":26730195,"name":"cachethq/Cachet","url":"https://api.github.com/repos/cachethq/Cachet"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/cachethq/Cachet/issues/173","labels_url":"https://api.github.com/repos/cachethq/Cachet/issues/173/labels{/name}","comments_url":"https://api.github.com/repos/cachethq/Cachet/issues/173/comments","events_url":"https://api.github.com/repos/cachethq/Cachet/issues/173/events","html_url":"https://github.com/cachethq/Cachet/issues/173","id":53210024,"number":173,"title":"Bug: Forms let you submit multiple times","user":{"login":"Jamesking56","id":253237,"avatar_url":"https://avatars.githubusercontent.com/u/253237?v=3","gravatar_id":"","url":"https://api.github.com/users/Jamesking56","html_url":"https://github.com/Jamesking56","followers_url":"https://api.github.com/users/Jamesking56/followers","following_url":"https://api.github.com/users/Jamesking56/following{/other_user}","gists_url":"https://api.github.com/users/Jamesking56/gists{/gist_id}","starred_url":"https://api.github.com/users/Jamesking56/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Jamesking56/subscriptions","organizations_url":"https://api.github.com/users/Jamesking56/orgs","repos_url":"https://api.github.com/users/Jamesking56/repos","events_url":"https://api.github.com/users/Jamesking56/events{/privacy}","received_events_url":"https://api.github.com/users/Jamesking56/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":4,"created_at":"2015-01-01T00:52:06Z","updated_at":"2015-01-01T01:02:10Z","closed_at":null,"body":"When adding a new incident, I noticed a weird bug.\r\n\r\nIf you fill in the form as normal, 
then click the submit button twice really quickly, it'll create __TWO__ identical new incidents!\r\n\r\nThis could be a bit annoying, a simple fix is using a bit of JS that on submit, disables the submit button so that once clicked, it cannot be clicked again."},"comment":{"url":"https://api.github.com/repos/cachethq/Cachet/issues/comments/68477258","html_url":"https://github.com/cachethq/Cachet/issues/173#issuecomment-68477258","issue_url":"https://api.github.com/repos/cachethq/Cachet/issues/173","id":68477258,"user":{"login":"Jamesking56","id":253237,"avatar_url":"https://avatars.githubusercontent.com/u/253237?v=3","gravatar_id":"","url":"https://api.github.com/users/Jamesking56","html_url":"https://github.com/Jamesking56","followers_url":"https://api.github.com/users/Jamesking56/followers","following_url":"https://api.github.com/users/Jamesking56/following{/other_user}","gists_url":"https://api.github.com/users/Jamesking56/gists{/gist_id}","starred_url":"https://api.github.com/users/Jamesking56/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Jamesking56/subscriptions","organizations_url":"https://api.github.com/users/Jamesking56/orgs","repos_url":"https://api.github.com/users/Jamesking56/repos","events_url":"https://api.github.com/users/Jamesking56/events{/privacy}","received_events_url":"https://api.github.com/users/Jamesking56/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:02:10Z","updated_at":"2015-01-01T01:02:10Z","body":"Doesn't Laravel have that already?\r\n\r\nhttp://laravel.com/docs/4.2/security#protecting-routes\r\n\r\nDoesn't Laravel's CSRF Protection offer this?"}},"public":true,"created_at":"2015-01-01T01:02:11Z","org":{"id":9951502,"login":"cachethq","gravatar_id":"","url":"https://api.github.com/orgs/cachethq","avatar_url":"https://avatars.githubusercontent.com/u/9951502?"}}
{"id":"2489396788","type":"CreateEvent","actor":{"id":2851221,"login":"alkass","gravatar_id":"","url":"https://api.github.com/users/alkass","avatar_url":"https://avatars.githubusercontent.com/u/2851221?"},"repo":{"id":28678233,"name":"alkass/seQre","url":"https://api.github.com/repos/alkass/seQre"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:02:11Z"}
{"id":"2489396795","type":"PushEvent","actor":{"id":3414800,"login":"Jyang772","gravatar_id":"","url":"https://api.github.com/users/Jyang772","avatar_url":"https://avatars.githubusercontent.com/u/3414800?"},"repo":{"id":28655798,"name":"Jyang772/MacSpoof","url":"https://api.github.com/repos/Jyang772/MacSpoof"},"payload":{"push_id":536752661,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"8ec327a2306084297e54415c994eae67a75df167","before":"633d4b381b6272a89070428ea1ef67600b934eac","commits":[{"sha":"8ec327a2306084297e54415c994eae67a75df167","author":{"email":"6c73cfbdcadf6d6f6fd0a03108daf8b6f1dd8164@gmail.com","name":"Justin"},"message":"Update lol.sh\n\nBug with wpa_cli reassociate. \r\nDoes not seem to work on secured networks. Might be driver issue.","distinct":true,"url":"https://api.github.com/repos/Jyang772/MacSpoof/commits/8ec327a2306084297e54415c994eae67a75df167"}]},"public":true,"created_at":"2015-01-01T01:02:11Z"}
{"id":"2489396796","type":"PushEvent","actor":{"id":10298641,"login":"lucachr","gravatar_id":"","url":"https://api.github.com/users/lucachr","avatar_url":"https://avatars.githubusercontent.com/u/10298641?"},"repo":{"id":28611069,"name":"lucachr/lucachr.github.io","url":"https://api.github.com/repos/lucachr/lucachr.github.io"},"payload":{"push_id":536752662,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"7ff7b895ca4968b985f29cf50ee59fe249a50471","before":"144530b760f22ed18330baeefc89d8f4eb8bbac8","commits":[{"sha":"7ff7b895ca4968b985f29cf50ee59fe249a50471","author":{"email":"3a92d5230cd572ed7ca38353f6e589037a70deaa@gmail.com","name":"Luca Chiricozzi"},"message":"Generate Pelican site","distinct":true,"url":"https://api.github.com/repos/lucachr/lucachr.github.io/commits/7ff7b895ca4968b985f29cf50ee59fe249a50471"}]},"public":true,"created_at":"2015-01-01T01:02:11Z"}
{"id":"2489396797","type":"PushEvent","actor":{"id":10176820,"login":"chalavadivishnu","gravatar_id":"","url":"https://api.github.com/users/chalavadivishnu","avatar_url":"https://avatars.githubusercontent.com/u/10176820?"},"repo":{"id":28678150,"name":"chalavadivishnu/Face-Detection","url":"https://api.github.com/repos/chalavadivishnu/Face-Detection"},"payload":{"push_id":536752663,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b956bef865580106b571e412e35308b3e7ab708e","before":"22a9bd6584d30cc259b5b0055cb6a8bff31d8d9e","commits":[{"sha":"b956bef865580106b571e412e35308b3e7ab708e","author":{"email":"ce8044f02eb2a26b631671f5297317036d398e79@gmail.com","name":"Chalavadi Vishnu"},"message":"image to vector function","distinct":true,"url":"https://api.github.com/repos/chalavadivishnu/Face-Detection/commits/b956bef865580106b571e412e35308b3e7ab708e"}]},"public":true,"created_at":"2015-01-01T01:02:11Z"}
{"id":"2489396802","type":"CreateEvent","actor":{"id":2624357,"login":"mike-spainhower","gravatar_id":"","url":"https://api.github.com/users/mike-spainhower","avatar_url":"https://avatars.githubusercontent.com/u/2624357?"},"repo":{"id":27418269,"name":"LiveSafe/lvsf-opsworks-php-cookbook","url":"https://api.github.com/repos/LiveSafe/lvsf-opsworks-php-cookbook"},"payload":{"ref":"1.0.7","ref_type":"tag","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:02:12Z","org":{"id":9778464,"login":"LiveSafe","gravatar_id":"","url":"https://api.github.com/orgs/LiveSafe","avatar_url":"https://avatars.githubusercontent.com/u/9778464?"}}
{"id":"2489396804","type":"PushEvent","actor":{"id":7809663,"login":"TheRingMaster","gravatar_id":"","url":"https://api.github.com/users/TheRingMaster","avatar_url":"https://avatars.githubusercontent.com/u/7809663?"},"repo":{"id":28453562,"name":"Team-Validus/packages_apps_Settings","url":"https://api.github.com/repos/Team-Validus/packages_apps_Settings"},"payload":{"push_id":536752666,"size":1,"distinct_size":1,"ref":"refs/heads/lp5.0","head":"e7a56745d952f34256729857ef14d4653a239e80","before":"879f03889afd8fa8b52f57a24f8a354060cbeea8","commits":[{"sha":"e7a56745d952f34256729857ef14d4653a239e80","author":{"email":"a2771a13522a1cd683d518d8a964b5d8d1f00d68@hotmail.com","name":"John Brewer"},"message":"derpp","distinct":true,"url":"https://api.github.com/repos/Team-Validus/packages_apps_Settings/commits/e7a56745d952f34256729857ef14d4653a239e80"}]},"public":true,"created_at":"2015-01-01T01:02:12Z","org":{"id":10274350,"login":"Team-Validus","gravatar_id":"","url":"https://api.github.com/orgs/Team-Validus","avatar_url":"https://avatars.githubusercontent.com/u/10274350?"}}
{"id":"2489396808","type":"GollumEvent","actor":{"id":7797609,"login":"ivanwfr","gravatar_id":"","url":"https://api.github.com/users/ivanwfr","avatar_url":"https://avatars.githubusercontent.com/u/7797609?"},"repo":{"id":808316,"name":"cswetenham/tabspace2.1","url":"https://api.github.com/repos/cswetenham/tabspace2.1"},"payload":{"pages":[{"page_name":"Brandon-Craig-Rhodes-TabSpace-Chords-Colored","title":"Brandon Craig Rhodes TabSpace Chords Colored","summary":null,"action":"edited","sha":"bcca6468cba9dd67ac2605d00e9c0a6ce3fb9dbc","html_url":"https://github.com/cswetenham/tabspace2.1/wiki/Brandon-Craig-Rhodes-TabSpace-Chords-Colored"}]},"public":true,"created_at":"2015-01-01T01:02:13Z"}
{"id":"2489396817","type":"PushEvent","actor":{"id":720376,"login":"picodotdev","gravatar_id":"","url":"https://api.github.com/users/picodotdev","avatar_url":"https://avatars.githubusercontent.com/u/720376?"},"repo":{"id":18271108,"name":"picodotdev/blog-stack","url":"https://api.github.com/repos/picodotdev/blog-stack"},"payload":{"push_id":536752673,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"fbe0d7491c42bdac571af3a587319e78ffb19516","before":"cd288dc8c7adb8b8c3049ad3b8956472d3e5e450","commits":[{"sha":"fbe0d7491c42bdac571af3a587319e78ffb19516","author":{"email":"82119ca92ec3f303155279e5d516019ee5c15a97@gmail.com","name":"pico.dev"},"message":"Site updated Wednesday, 31-12-2014 20:02","distinct":true,"url":"https://api.github.com/repos/picodotdev/blog-stack/commits/fbe0d7491c42bdac571af3a587319e78ffb19516"}]},"public":true,"created_at":"2015-01-01T01:02:14Z"}
{"id":"2489396819","type":"PushEvent","actor":{"id":7825844,"login":"praashie","gravatar_id":"","url":"https://api.github.com/users/praashie","avatar_url":"https://avatars.githubusercontent.com/u/7825844?"},"repo":{"id":25791959,"name":"praashie/launchpad-visualizer","url":"https://api.github.com/repos/praashie/launchpad-visualizer"},"payload":{"push_id":536752675,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e01d22445a2098bcf6c73997bcc20afa9a5e926e","before":"c4fdda6869f1e2ab3926d26efe7362c7a630068c","commits":[{"sha":"e01d22445a2098bcf6c73997bcc20afa9a5e926e","author":{"email":"3b921b218ce02163a39d90caa7b3b815b7e415aa@users.noreply.github.com","name":"Praashie"},"message":"Added color palette, prettified code","distinct":true,"url":"https://api.github.com/repos/praashie/launchpad-visualizer/commits/e01d22445a2098bcf6c73997bcc20afa9a5e926e"}]},"public":true,"created_at":"2015-01-01T01:02:14Z"}
{"id":"2489396828","type":"WatchEvent","actor":{"id":3129699,"login":"2xtreme","gravatar_id":"","url":"https://api.github.com/users/2xtreme","avatar_url":"https://avatars.githubusercontent.com/u/3129699?"},"repo":{"id":10263553,"name":"ejurgensen/forked-daapd","url":"https://api.github.com/repos/ejurgensen/forked-daapd"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:02:17Z"}
{"id":"2489396829","type":"CreateEvent","actor":{"id":1265899,"login":"lynas","gravatar_id":"","url":"https://api.github.com/users/lynas","avatar_url":"https://avatars.githubusercontent.com/u/1265899?"},"repo":{"id":28678234,"name":"lynas/springsecurity3.2","url":"https://api.github.com/repos/lynas/springsecurity3.2"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:02:17Z"}
{"id":"2489396831","type":"GollumEvent","actor":{"id":46323,"login":"paulcon","gravatar_id":"","url":"https://api.github.com/users/paulcon","avatar_url":"https://avatars.githubusercontent.com/u/46323?"},"repo":{"id":28157780,"name":"paulcon/active_subspaces","url":"https://api.github.com/repos/paulcon/active_subspaces"},"payload":{"pages":[{"page_name":"_Footer","title":"_Footer","summary":null,"action":"created","sha":"6f09c11d8614aa5c5b996a528905b2a8ae78d59f","html_url":"https://github.com/paulcon/active_subspaces/wiki/_Footer"}]},"public":true,"created_at":"2015-01-01T01:02:17Z"}
{"id":"2489396835","type":"PushEvent","actor":{"id":506010,"login":"gabeshaughnessy","gravatar_id":"","url":"https://api.github.com/users/gabeshaughnessy","avatar_url":"https://avatars.githubusercontent.com/u/506010?"},"repo":{"id":13913264,"name":"gabeshaughnessy/augmentedart","url":"https://api.github.com/repos/gabeshaughnessy/augmentedart"},"payload":{"push_id":536752682,"size":1,"distinct_size":1,"ref":"refs/heads/dungeon-hacker","head":"070da10a642c004ef5bc428b8ce1bf88e410e7b4","before":"49cd4f7ff271d91fedc4c45a85e590295ae59629","commits":[{"sha":"070da10a642c004ef5bc428b8ce1bf88e410e7b4","author":{"email":"a2b2bb6e7f1b10ac88b326d5c10e33af6a8546bc@gmail.com","name":"gabeshaughnessy"},"message":"readme overview","distinct":true,"url":"https://api.github.com/repos/gabeshaughnessy/augmentedart/commits/070da10a642c004ef5bc428b8ce1bf88e410e7b4"}]},"public":true,"created_at":"2015-01-01T01:02:17Z"}
{"id":"2489396843","type":"PushEvent","actor":{"id":2048268,"login":"unzan","gravatar_id":"","url":"https://api.github.com/users/unzan","avatar_url":"https://avatars.githubusercontent.com/u/2048268?"},"repo":{"id":19362226,"name":"unzan/TerribleName","url":"https://api.github.com/repos/unzan/TerribleName"},"payload":{"push_id":536752684,"size":1,"distinct_size":1,"ref":"refs/heads/alternate-version","head":"81fee9bd4bb72b559e86b984dd75a52b29f7123b","before":"048e306634e1334934b62dd234ae1a6a8daaef65","commits":[{"sha":"81fee9bd4bb72b559e86b984dd75a52b29f7123b","author":{"email":"10ccfcfbdc2deb68576e3809f6b38b3d0b355b5a@yahoo.com","name":"unzan"},"message":"cleaned up some codes for buttons and texts\n\n- use `!important` on some button's properties. it's much shorter than the\n  massive wall of selectors caused by abusing `&`\n- removed gradient from disabled submit button\n- fixed mod button when the only visible button is \"ignore reports\"\n- removed `%tn-engraved-box` and `%tn-raised-box`. they're not needed\n  anymore\n- added `%tn-simple-text-container` used by wiki text, self post text\n  and comment/message boxes.","distinct":true,"url":"https://api.github.com/repos/unzan/TerribleName/commits/81fee9bd4bb72b559e86b984dd75a52b29f7123b"}]},"public":true,"created_at":"2015-01-01T01:02:17Z"}
{"id":"2489396856","type":"IssueCommentEvent","actor":{"id":597617,"login":"soniktrooth","gravatar_id":"","url":"https://api.github.com/users/soniktrooth","avatar_url":"https://avatars.githubusercontent.com/u/597617?"},"repo":{"id":28677072,"name":"kalamuna/kalastatic","url":"https://api.github.com/repos/kalamuna/kalastatic"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/kalamuna/kalastatic/issues/3","labels_url":"https://api.github.com/repos/kalamuna/kalastatic/issues/3/labels{/name}","comments_url":"https://api.github.com/repos/kalamuna/kalastatic/issues/3/comments","events_url":"https://api.github.com/repos/kalamuna/kalastatic/issues/3/events","html_url":"https://github.com/kalamuna/kalastatic/issues/3","id":53209605,"number":3,"title":"bash variable","user":{"login":"soniktrooth","id":597617,"avatar_url":"https://avatars.githubusercontent.com/u/597617?v=3","gravatar_id":"","url":"https://api.github.com/users/soniktrooth","html_url":"https://github.com/soniktrooth","followers_url":"https://api.github.com/users/soniktrooth/followers","following_url":"https://api.github.com/users/soniktrooth/following{/other_user}","gists_url":"https://api.github.com/users/soniktrooth/gists{/gist_id}","starred_url":"https://api.github.com/users/soniktrooth/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/soniktrooth/subscriptions","organizations_url":"https://api.github.com/users/soniktrooth/orgs","repos_url":"https://api.github.com/users/soniktrooth/repos","events_url":"https://api.github.com/users/soniktrooth/events{/privacy}","received_events_url":"https://api.github.com/users/soniktrooth/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2015-01-01T00:28:01Z","updated_at":"2015-01-01T01:02:19Z","closed_at":null,"body":"My bash foo is weak. 
Can someone check what I've done with moving the repo address in travis-ci.sh into a variable? Unsure if it's a @RobLoach thing or a @andrewmallis thing. I will update this with a line number when I've pushed the initial code up."},"comment":{"url":"https://api.github.com/repos/kalamuna/kalastatic/issues/comments/68477261","html_url":"https://github.com/kalamuna/kalastatic/issues/3#issuecomment-68477261","issue_url":"https://api.github.com/repos/kalamuna/kalastatic/issues/3","id":68477261,"user":{"login":"soniktrooth","id":597617,"avatar_url":"https://avatars.githubusercontent.com/u/597617?v=3","gravatar_id":"","url":"https://api.github.com/users/soniktrooth","html_url":"https://github.com/soniktrooth","followers_url":"https://api.github.com/users/soniktrooth/followers","following_url":"https://api.github.com/users/soniktrooth/following{/other_user}","gists_url":"https://api.github.com/users/soniktrooth/gists{/gist_id}","starred_url":"https://api.github.com/users/soniktrooth/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/soniktrooth/subscriptions","organizations_url":"https://api.github.com/users/soniktrooth/orgs","repos_url":"https://api.github.com/users/soniktrooth/repos","events_url":"https://api.github.com/users/soniktrooth/events{/privacy}","received_events_url":"https://api.github.com/users/soniktrooth/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:02:19Z","updated_at":"2015-01-01T01:02:19Z","body":"Ok, line [47](https://github.com/kalamuna/kalastatic/blob/master/ci/travis-ci.sh#L47) is where I set up the var and [67](https://github.com/kalamuna/kalastatic/blob/master/ci/travis-ci.sh#L67) is where I used it.\r\n\r\nI also noticed just now that the check for $TRAVIS_REPO_SLUG is looking for \"kalamuna/pinnacle\" on line [50](https://github.com/kalamuna/kalastatic/blob/master/ci/travis-ci.sh#L50). 
I guess that will need to be a variable that can be set per project too but I'm unsure how that would have to be as it relates to Travis of which my foo is also weak. "}},"public":true,"created_at":"2015-01-01T01:02:19Z","org":{"id":2373705,"login":"kalamuna","gravatar_id":"","url":"https://api.github.com/orgs/kalamuna","avatar_url":"https://avatars.githubusercontent.com/u/2373705?"}}
{"id":"2489396859","type":"WatchEvent","actor":{"id":681965,"login":"wonbyte","gravatar_id":"","url":"https://api.github.com/users/wonbyte","avatar_url":"https://avatars.githubusercontent.com/u/681965?"},"repo":{"id":13324424,"name":"idris-hackers/idris-vim","url":"https://api.github.com/repos/idris-hackers/idris-vim"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:02:19Z","org":{"id":3963683,"login":"idris-hackers","gravatar_id":"","url":"https://api.github.com/orgs/idris-hackers","avatar_url":"https://avatars.githubusercontent.com/u/3963683?"}}
{"id":"2489396862","type":"PushEvent","actor":{"id":1684950,"login":"naijaping","gravatar_id":"","url":"https://api.github.com/users/naijaping","avatar_url":"https://avatars.githubusercontent.com/u/1684950?"},"repo":{"id":28650038,"name":"naijaping/awonlist","url":"https://api.github.com/repos/naijaping/awonlist"},"payload":{"push_id":536752689,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e80946e9abd94a00ce15b06ad502211a518e2ffd","before":"5286c7f80658d4fa04dc7a13901fe3b7ceefa3a4","commits":[{"sha":"e80946e9abd94a00ce15b06ad502211a518e2ffd","author":{"email":"8a1440b218d23a283d388025f7c9dc3555009ec5@gmail.com","name":"naijaping"},"message":"Update uk","distinct":true,"url":"https://api.github.com/repos/naijaping/awonlist/commits/e80946e9abd94a00ce15b06ad502211a518e2ffd"}]},"public":true,"created_at":"2015-01-01T01:02:20Z"}
{"id":"2489396864","type":"PushEvent","actor":{"id":4153853,"login":"jlumijarvi","gravatar_id":"","url":"https://api.github.com/users/jlumijarvi","avatar_url":"https://avatars.githubusercontent.com/u/4153853?"},"repo":{"id":24660234,"name":"jlumijarvi/excelimporter","url":"https://api.github.com/repos/jlumijarvi/excelimporter"},"payload":{"push_id":536752691,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"0c317517b4de211b349b78609a2eb9a6872607da","before":"be0ee8ea1d35abc029e24aecbbe2c0a68c8e1387","commits":[{"sha":"0c317517b4de211b349b78609a2eb9a6872607da","author":{"email":"40e6fc59d2535c98bfd5d19357e20df6e95cef64@gmail.com","name":"jlumijarvi"},"message":"Create LICENSE.md","distinct":true,"url":"https://api.github.com/repos/jlumijarvi/excelimporter/commits/0c317517b4de211b349b78609a2eb9a6872607da"}]},"public":true,"created_at":"2015-01-01T01:02:20Z"}
{"id":"2489396867","type":"CreateEvent","actor":{"id":6863829,"login":"essemfly","gravatar_id":"","url":"https://api.github.com/users/essemfly","avatar_url":"https://avatars.githubusercontent.com/u/6863829?"},"repo":{"id":28678193,"name":"essemfly/myVirtualHome","url":"https://api.github.com/repos/essemfly/myVirtualHome"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"laboratory","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:02:22Z"}
{"id":"2489396868","type":"IssueCommentEvent","actor":{"id":7058721,"login":"alextegelid","gravatar_id":"","url":"https://api.github.com/users/alextegelid","avatar_url":"https://avatars.githubusercontent.com/u/7058721?"},"repo":{"id":2469037,"name":"kemayo/sublime-text-git","url":"https://api.github.com/repos/kemayo/sublime-text-git"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/kemayo/sublime-text-git/issues/371","labels_url":"https://api.github.com/repos/kemayo/sublime-text-git/issues/371/labels{/name}","comments_url":"https://api.github.com/repos/kemayo/sublime-text-git/issues/371/comments","events_url":"https://api.github.com/repos/kemayo/sublime-text-git/issues/371/events","html_url":"https://github.com/kemayo/sublime-text-git/issues/371","id":48203601,"number":371,"title":"Cannot commit","user":{"login":"evenfrost","id":3055750,"avatar_url":"https://avatars.githubusercontent.com/u/3055750?v=3","gravatar_id":"","url":"https://api.github.com/users/evenfrost","html_url":"https://github.com/evenfrost","followers_url":"https://api.github.com/users/evenfrost/followers","following_url":"https://api.github.com/users/evenfrost/following{/other_user}","gists_url":"https://api.github.com/users/evenfrost/gists{/gist_id}","starred_url":"https://api.github.com/users/evenfrost/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/evenfrost/subscriptions","organizations_url":"https://api.github.com/users/evenfrost/orgs","repos_url":"https://api.github.com/users/evenfrost/repos","events_url":"https://api.github.com/users/evenfrost/events{/privacy}","received_events_url":"https://api.github.com/users/evenfrost/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":9,"created_at":"2014-11-09T15:06:06Z","updated_at":"2015-01-01T01:02:21Z","closed_at":null,"body":"Every time I try to do git commit, I get this error: \"fatal: Unable to create 
'/home/evenfrost/work/projects/aword/.git/index.lock': File exists.\". There is no such file though. I believe this is somehow related to the fact that I've upgraded git to 2.1.0, cause guys from SO had similar problems with the plugin and newer versions of git."},"comment":{"url":"https://api.github.com/repos/kemayo/sublime-text-git/issues/comments/68477262","html_url":"https://github.com/kemayo/sublime-text-git/issues/371#issuecomment-68477262","issue_url":"https://api.github.com/repos/kemayo/sublime-text-git/issues/371","id":68477262,"user":{"login":"alextegelid","id":7058721,"avatar_url":"https://avatars.githubusercontent.com/u/7058721?v=3","gravatar_id":"","url":"https://api.github.com/users/alextegelid","html_url":"https://github.com/alextegelid","followers_url":"https://api.github.com/users/alextegelid/followers","following_url":"https://api.github.com/users/alextegelid/following{/other_user}","gists_url":"https://api.github.com/users/alextegelid/gists{/gist_id}","starred_url":"https://api.github.com/users/alextegelid/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/alextegelid/subscriptions","organizations_url":"https://api.github.com/users/alextegelid/orgs","repos_url":"https://api.github.com/users/alextegelid/repos","events_url":"https://api.github.com/users/alextegelid/events{/privacy}","received_events_url":"https://api.github.com/users/alextegelid/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:02:21Z","updated_at":"2015-01-01T01:02:21Z","body":"I can confirm that the problem I experienced only occurred on a large repo aswell. All other repos were/are still working fine\r\n\r\n—\r\nAlexander Tegelid\r\n070-508 49 90\r\nalex@tegelid.se\r\n—\r\nSent from Mailbox App on iPhone.\r\n\r\nOn Thu, Jan 1, 2015 at 12:54 AM, John Watson <notifications@github.com>\r\nwrote:\r\n\r\n> I've only started experiencing this issue with larger repos (10k+ files) (st3, python3 branch). 
I did some experimenting and added print statements to `CommandThread` so I could see when threads were starting and finishing. Here's what I think is happening:\r\n> - When a commit is started, the plugin collects history and diffs and shows the commit buffer allowing the user to enter a commit message.\r\n> - The user then closes the buffer, starting the commit.\r\n> - At that moment, another buffer is activated (because the commit message buffer was closed) causing the GitBranchStatusCommand to run (statusbar.py)\r\n> - On these large repos, `git status --porcelain` does not finish until AFTER the `git commit` thread starts. `git status --porcelain` creates an index.lock file\r\n> The threads are running like this:\r\n> 1. Start status thread\r\n> 2. Start commit thread\r\n> 3. Finish commit (fails because status is still running)\r\n> 4. Finish status\r\n> Because `git status` creates an index.lock file, the commit fails. This doesn't affect me on small repos, I assume because `git status` runs much faster there. Sometimes `git status` runs fast enough even on large repos for this not to happen. I don't know what git is doing or why it's creating the lock file for a status.\r\n> I'm not sure how to resolve the issue. Perhaps just temporarily disable the GitBranchStatusListener listener during a commit (and then update the statusbar when the commit is finished). Or queue the commands. A workaround is to add `\"statusbar_status\": false` to the user settings.\r\n> ---\r\n> Reply to this email directly or view it on GitHub:\r\n> https://github.com/kemayo/sublime-text-git/issues/371#issuecomment-68475631"}},"public":true,"created_at":"2015-01-01T01:02:22Z"}
{"id":"2489396870","type":"PushEvent","actor":{"id":170161,"login":"mebigfatguy","gravatar_id":"","url":"https://api.github.com/users/mebigfatguy","avatar_url":"https://avatars.githubusercontent.com/u/170161?"},"repo":{"id":21152272,"name":"mebigfatguy/fbaas","url":"https://api.github.com/repos/mebigfatguy/fbaas"},"payload":{"push_id":536752694,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"3eb098edd4b8287fbf779bfe19f1b786c18996cb","before":"3a78ece9dce4562acbf24e05d4c1f79e5b8814b3","commits":[{"sha":"3eb098edd4b8287fbf779bfe19f1b786c18996cb","author":{"email":"daf9f6e8320e49c5c7007b0c59aaad531fc83397@mebigfatguy.com","name":"Dave Brosius"},"message":"differentiate different status","distinct":true,"url":"https://api.github.com/repos/mebigfatguy/fbaas/commits/3eb098edd4b8287fbf779bfe19f1b786c18996cb"}]},"public":true,"created_at":"2015-01-01T01:02:22Z"}
{"id":"2489396871","type":"PushEvent","actor":{"id":4482745,"login":"thedax","gravatar_id":"","url":"https://api.github.com/users/thedax","avatar_url":"https://avatars.githubusercontent.com/u/4482745?"},"repo":{"id":19226700,"name":"thedax/nintendont-mirror","url":"https://api.github.com/repos/thedax/nintendont-mirror"},"payload":{"push_id":536752695,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"110d802334f7f4d1b01b43639585bfdad9f68bf5","before":"e46036d65d64c9fb27c14e22872fd047aed65cf7","commits":[{"sha":"110d802334f7f4d1b01b43639585bfdad9f68bf5","author":{"email":"292e5fdbe23a481a99bcd6ac5ca3dd0ad2d7d447@yahoo.com","name":"Howard"},"message":"-Added Trio Linker Plus II controller.ini (Thanks gillhaj02)","distinct":true,"url":"https://api.github.com/repos/thedax/nintendont-mirror/commits/110d802334f7f4d1b01b43639585bfdad9f68bf5"}]},"public":true,"created_at":"2015-01-01T01:02:22Z"}
{"id":"2489396873","type":"PushEvent","actor":{"id":6529689,"login":"Conutant","gravatar_id":"","url":"https://api.github.com/users/Conutant","avatar_url":"https://avatars.githubusercontent.com/u/6529689?"},"repo":{"id":28280392,"name":"Conutant/TESSERACT","url":"https://api.github.com/repos/Conutant/TESSERACT"},"payload":{"push_id":536752697,"size":1,"distinct_size":1,"ref":"refs/heads/dev_andrei","head":"cf3ff97c0ea2d16063914756cb392679d53ee5c8","before":"eb99354eb7062b40f28369958e4b3a38757e46b5","commits":[{"sha":"cf3ff97c0ea2d16063914756cb392679d53ee5c8","author":{"email":"f7be974c25647e34f805d7b31d9b10b18614a452@gmail.com","name":"Conutant"},"message":"Displaying comments, adding  padding","distinct":true,"url":"https://api.github.com/repos/Conutant/TESSERACT/commits/cf3ff97c0ea2d16063914756cb392679d53ee5c8"}]},"public":true,"created_at":"2015-01-01T01:02:22Z"}
{"id":"2489396880","type":"PushEvent","actor":{"id":429706,"login":"podviaznikov","gravatar_id":"","url":"https://api.github.com/users/podviaznikov","avatar_url":"https://avatars.githubusercontent.com/u/429706?"},"repo":{"id":28254077,"name":"podviaznikov/hellonode","url":"https://api.github.com/repos/podviaznikov/hellonode"},"payload":{"push_id":536752700,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b1e60af7541bcba479a2adc7b4e892219371dc4e","before":"7edf6f05533eafe99dfffbb67bda921e6e341f61","commits":[{"sha":"b1e60af7541bcba479a2adc7b4e892219371dc4e","author":{"email":"9f35d6cbd99efe2457db40f739c2a082624247fb@gmail.com","name":"Anton Podviaznikov"},"message":"Update server.js","distinct":true,"url":"https://api.github.com/repos/podviaznikov/hellonode/commits/b1e60af7541bcba479a2adc7b4e892219371dc4e"}]},"public":true,"created_at":"2015-01-01T01:02:22Z"}
{"id":"2489396885","type":"PushEvent","actor":{"id":1558638,"login":"trm36","gravatar_id":"","url":"https://api.github.com/users/trm36","avatar_url":"https://avatars.githubusercontent.com/u/1558638?"},"repo":{"id":28282084,"name":"trm36/finalGrade","url":"https://api.github.com/repos/trm36/finalGrade"},"payload":{"push_id":536752706,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"cacd357c0cb98995763482eeae7d98627a226048","before":"a9cce18b4d22234ab644c4cf9daa27d32eff83ab","commits":[{"sha":"cacd357c0cb98995763482eeae7d98627a226048","author":{"email":"514b3b67f3b99c0e9708fdb5f8805e588c97ad00@humboldt.edu","name":"Taylor Mott"},"message":"Adds user instructions\n\nSigned-off-by: Taylor Mott <trm36@humboldt.edu>","distinct":true,"url":"https://api.github.com/repos/trm36/finalGrade/commits/cacd357c0cb98995763482eeae7d98627a226048"}]},"public":true,"created_at":"2015-01-01T01:02:23Z"}
{"id":"2489396886","type":"PushEvent","actor":{"id":94782,"login":"ixti","gravatar_id":"","url":"https://api.github.com/users/ixti","avatar_url":"https://avatars.githubusercontent.com/u/94782?"},"repo":{"id":2524005,"name":"tarcieri/http.rb","url":"https://api.github.com/repos/tarcieri/http.rb"},"payload":{"push_id":536752705,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b144b32f7b148df242604fdb7752c76f6053cb24","before":"bbe9fe50b6ebe907a1cea8d2da00d2eacb9e06dd","commits":[{"sha":"b144b32f7b148df242604fdb7752c76f6053cb24","author":{"email":"e6e135d16927e8bca193effa00241a85121e93df@member.fsf.org","name":"Aleksey V Zapparov"},"message":"Cleanup HTTP::Request spec","distinct":true,"url":"https://api.github.com/repos/tarcieri/http.rb/commits/b144b32f7b148df242604fdb7752c76f6053cb24"}]},"public":true,"created_at":"2015-01-01T01:02:23Z"}
{"id":"2489396891","type":"WatchEvent","actor":{"id":10254377,"login":"majache","gravatar_id":"","url":"https://api.github.com/users/majache","avatar_url":"https://avatars.githubusercontent.com/u/10254377?"},"repo":{"id":16190750,"name":"evanbrooks/syntax-highlight","url":"https://api.github.com/repos/evanbrooks/syntax-highlight"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:02:23Z"}
{"id":"2489396892","type":"PushEvent","actor":{"id":1221156,"login":"fyfe","gravatar_id":"","url":"https://api.github.com/users/fyfe","avatar_url":"https://avatars.githubusercontent.com/u/1221156?"},"repo":{"id":28673837,"name":"fyfe/git-test","url":"https://api.github.com/repos/fyfe/git-test"},"payload":{"push_id":536752708,"size":0,"distinct_size":0,"ref":"refs/heads/master","head":"aeffe262b4f19a801509f8dcc9611a2e8b1c9c5f","before":"25430ccc1c5249741feb237b0d0f1db055fe4b55","commits":[]},"public":true,"created_at":"2015-01-01T01:02:23Z"}
{"id":"2489396895","type":"PushEvent","actor":{"id":9831378,"login":"Amit-P-Amin","gravatar_id":"","url":"https://api.github.com/users/Amit-P-Amin","avatar_url":"https://avatars.githubusercontent.com/u/9831378?"},"repo":{"id":28678217,"name":"Amit-P-Amin/active_record_lite","url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite"},"payload":{"push_id":536752710,"size":1,"distinct_size":1,"ref":"refs/heads/patch-1","head":"b5ac327b20f2041652e3228ce4612880aae97beb","before":"ca4e169591deec6c4b30b611e8ed5bdf89b3386a","commits":[{"sha":"b5ac327b20f2041652e3228ce4612880aae97beb","author":{"email":"b5bfea0f6fb804e6f8331851ae8acd4de4a8dcf9@gmail.com","name":"Amit-P-Amin"},"message":"Update 03_associatable_spec.rb\n\nWas confused for a while because \"AssocOptions #model_class returns class of associated object\" was failing. This is because that spec tests 2 methods, but the description just mentions 1 (only model class, instead of model class and table name).","distinct":true,"url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/commits/b5ac327b20f2041652e3228ce4612880aae97beb"}]},"public":true,"created_at":"2015-01-01T01:02:24Z"}
{"id":"2489396899","type":"IssuesEvent","actor":{"id":894251,"login":"oubiwann","gravatar_id":"","url":"https://api.github.com/users/oubiwann","avatar_url":"https://avatars.githubusercontent.com/u/894251?"},"repo":{"id":27462056,"name":"lfex/lsci","url":"https://api.github.com/repos/lfex/lsci"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/lfex/lsci/issues/36","labels_url":"https://api.github.com/repos/lfex/lsci/issues/36/labels{/name}","comments_url":"https://api.github.com/repos/lfex/lsci/issues/36/comments","events_url":"https://api.github.com/repos/lfex/lsci/issues/36/events","html_url":"https://github.com/lfex/lsci/issues/36","id":53210200,"number":36,"title":"NaN and Infinity from NumPy crashes ErlPort","user":{"login":"oubiwann","id":894251,"avatar_url":"https://avatars.githubusercontent.com/u/894251?v=3","gravatar_id":"","url":"https://api.github.com/users/oubiwann","html_url":"https://github.com/oubiwann","followers_url":"https://api.github.com/users/oubiwann/followers","following_url":"https://api.github.com/users/oubiwann/following{/other_user}","gists_url":"https://api.github.com/users/oubiwann/gists{/gist_id}","starred_url":"https://api.github.com/users/oubiwann/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/oubiwann/subscriptions","organizations_url":"https://api.github.com/users/oubiwann/orgs","repos_url":"https://api.github.com/users/oubiwann/repos","events_url":"https://api.github.com/users/oubiwann/events{/privacy}","received_events_url":"https://api.github.com/users/oubiwann/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/lfex/lsci/labels/bug","name":"bug","color":"fc2929"}],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:02:24Z","updated_at":"2015-01-01T01:02:24Z","closed_at":null,"body":"Need to figure out how to properly pickle these for ErlPort's improved digestion 
..."}},"public":true,"created_at":"2015-01-01T01:02:24Z","org":{"id":7939791,"login":"lfex","gravatar_id":"","url":"https://api.github.com/orgs/lfex","avatar_url":"https://avatars.githubusercontent.com/u/7939791?"}}
{"id":"2489396902","type":"PushEvent","actor":{"id":753926,"login":"egisatoshi","gravatar_id":"","url":"https://api.github.com/users/egisatoshi","avatar_url":"https://avatars.githubusercontent.com/u/753926?"},"repo":{"id":8212790,"name":"egison/egison","url":"https://api.github.com/repos/egison/egison"},"payload":{"push_id":536752712,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"80dae4e133a2d4645a6105eeffddbcd1e22eed99","before":"a6e78dde839fe67e410946bd8c168771e58cbbe1","commits":[{"sha":"80dae4e133a2d4645a6105eeffddbcd1e22eed99","author":{"email":"71e7d9a5a106c46ef4ccb3a433d905fea747e8cc@egison.org","name":"Satoshi Egi"},"message":"update","distinct":true,"url":"https://api.github.com/repos/egison/egison/commits/80dae4e133a2d4645a6105eeffddbcd1e22eed99"}]},"public":true,"created_at":"2015-01-01T01:02:25Z","org":{"id":6812884,"login":"egison","gravatar_id":"","url":"https://api.github.com/orgs/egison","avatar_url":"https://avatars.githubusercontent.com/u/6812884?"}}
{"id":"2489396903","type":"CreateEvent","actor":{"id":8918426,"login":"Spekular","gravatar_id":"","url":"https://api.github.com/users/Spekular","avatar_url":"https://avatars.githubusercontent.com/u/8918426?"},"repo":{"id":28678100,"name":"Spekular/Project-Version","url":"https://api.github.com/repos/Spekular/Project-Version"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"Adds Information popup when projects created with older or newer LMMS versions.","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:02:25Z"}
{"id":"2489396913","type":"PushEvent","actor":{"id":4858543,"login":"mtklr","gravatar_id":"","url":"https://api.github.com/users/mtklr","avatar_url":"https://avatars.githubusercontent.com/u/4858543?"},"repo":{"id":28118151,"name":"mtklr/howard","url":"https://api.github.com/repos/mtklr/howard"},"payload":{"push_id":536752715,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"756c131344998885363d26d74a5698f910a2dcb1","before":"d5b4d89f63a7fedf51ac911b6df897b21466189a","commits":[{"sha":"756c131344998885363d26d74a5698f910a2dcb1","author":{"email":"b9663e167dc762614bed337db2d0a7492d0ce96b@gmail.com","name":"Matt Keller"},"message":"add #202 title","distinct":true,"url":"https://api.github.com/repos/mtklr/howard/commits/756c131344998885363d26d74a5698f910a2dcb1"}]},"public":true,"created_at":"2015-01-01T01:02:27Z"}
{"id":"2489396915","type":"PushEvent","actor":{"id":542045,"login":"apipe-tester","gravatar_id":"","url":"https://api.github.com/users/apipe-tester","avatar_url":"https://avatars.githubusercontent.com/u/542045?"},"repo":{"id":23442737,"name":"genome/genome","url":"https://api.github.com/repos/genome/genome"},"payload":{"push_id":536752716,"size":30,"distinct_size":0,"ref":"refs/heads/snapshot","head":"65a175d735f2507c7ce46239fc8192f7b1fabcfd","before":"7184935531d3758833760b60be75a69fc2100afa","commits":[{"sha":"02256b48b155180783a99a0ef318da86a1e2d178","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"New way to read a bam-readcount file\n\nAssuming that the file is sorted by position, this allows you to\nget entries by position.  You have to read the positions almost in\norder, although you can look back into a buffer of one entry.\nWe need this because vcf entries can look at multiple bam-readcount\nentries, depending on whether they have deletion alternate alleles.","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/02256b48b155180783a99a0ef318da86a1e2d178"},{"sha":"942b44ab8ef5628e72985d11006aef09924028db","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Move bam-readcount vcf-safe encode and decode to a separate class","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/942b44ab8ef5628e72985d11006aef09924028db"},{"sha":"a40e73ea13267236ab8499cd095a87c77f0b25e1","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Factor out is_deletion","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/a40e73ea13267236ab8499cd095a87c77f0b25e1"},{"sha":"a7bfeb1898edda953544ff65722679cbf750b0d3","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"create_deletion_entry is always 
called with bam_readcount_line_deletion\n\nDon't need to pass it as a param or export/import it","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/a7bfeb1898edda953544ff65722679cbf750b0d3"},{"sha":"79b180206258cb3120ac57b6277147544aace88a","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Bam readcount test helper gets entries from vcf files","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/79b180206258cb3120ac57b6277147544aace88a"},{"sha":"6f0eb821ca4cc346c332903abd909d98f0a9cad8","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Add a bam readcount parser that can encode and decode bam-readcount lines in vcf\n\nLines from bam-readcount are stored in a sample format field as json.\nThe json contains a hash with two types of keys:\n-alternate alleles.  The values of these entries point to which offset key\nshould be checked to find the bam-readcount line for that allele.\n-offsets.  The key is the offset from the vcf position on this line (since\nbam readcount interprets deletion start positions differently, they will be 1; all\nother types of normalized vcf alleles will be 0).  
The value is the bam-readcount line.\n\nThe json is made vcf sample field safe using the encode function","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/6f0eb821ca4cc346c332903abd909d98f0a9cad8"},{"sha":"913c134a75265a5f5c083f767d0d3bfbd3b74efa","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Correctly mock up test data\n\nThe single-bam (\"normal\") build should return the alignment\nresult from the normal sample as its merged_aligned_bam_result","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/913c134a75265a5f5c083f767d0d3bfbd3b74efa"},{"sha":"39c9a2bcf9dead867f16fbc9c89f0b602a8840e3","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Use the new BamReadcountParser to get allele-specific bam-readcounts from vcf\n\n-gmt annotate-with-readcounts now uses BamReadcountParser\n-update all of the interpreters and filters that use bam-readcount to\nhandle bam-readcount entries on a per-allele and per-sample basis rather than on a\nstrictly per-sample basis.","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/39c9a2bcf9dead867f16fbc9c89f0b602a8840e3"},{"sha":"d0d1a46075772341a6a627530b6346354f602c35","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Test doesn't actually depend on bam-readcount\n\nSince the test is just using the bam-readcount test helper\nas a convenient way to make a vcf entry, use the simpler\nentry that doesn't actually contain bam-readcount output","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/d0d1a46075772341a6a627530b6346354f602c35"},{"sha":"0bd03ea587b5d6cc2cdf83aa5356c9d170d15505","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Variant callers interpreter takes a list of valid 
callers","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/0bd03ea587b5d6cc2cdf83aa5356c9d170d15505"},{"sha":"794dad92553ad30f03c6c539647b743aeb64cdf1","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Enforce no duplicate entries in bam-readcount file","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/794dad92553ad30f03c6c539647b743aeb64cdf1"},{"sha":"14099eee5b5c68fd647a4669b274ce6c256f6634","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Rename some variables to make them easier to read","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/14099eee5b5c68fd647a4669b274ce6c256f6634"},{"sha":"b9655006e621a59f1f4e8e3529889dbe1b4f37f1","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Fix bam-readcount reader","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/b9655006e621a59f1f4e8e3529889dbe1b4f37f1"},{"sha":"be1d571a7149b25d16228578a84327c8458652c9","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Handle vcf entries with no alternate alleles","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/be1d571a7149b25d16228578a84327c8458652c9"},{"sha":"64306ea12dd8d3dc538f7eb5637ff36dba750567","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Regions list for bam readcount should be de-duplicated\n\nKeep the sort order of the chromosomes the same as in the vcf file","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/64306ea12dd8d3dc538f7eb5637ff36dba750567"},{"sha":"20228e5869e518eafc7e71c3345b2f650de5412a","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Add missing use 
statement","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/20228e5869e518eafc7e71c3345b2f650de5412a"},{"sha":"cbcf18f5553082355415acac0a2db31f71232fee","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Rename class","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/cbcf18f5553082355415acac0a2db31f71232fee"},{"sha":"dedc88e580410e57d7c4c417d520cb806fc322e8","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Remove unnecessary conditional","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/dedc88e580410e57d7c4c417d520cb806fc322e8"},{"sha":"aaa4cd72a8690ac5cd916c5be748c782cd00d510","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Make the buffered reader more robust","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/aaa4cd72a8690ac5cd916c5be748c782cd00d510"},{"sha":"81c8d713309c76520ae1766e79ca3d5628ed95eb","author":{"email":"ee527c7899460c7ad6b19d12059ad61f80cf4acd@genome.wustl.edu","name":"apregier"},"message":"Simplify function","distinct":false,"url":"https://api.github.com/repos/genome/genome/commits/81c8d713309c76520ae1766e79ca3d5628ed95eb"}]},"public":true,"created_at":"2015-01-01T01:02:27Z","org":{"id":318108,"login":"genome","gravatar_id":"","url":"https://api.github.com/orgs/genome","avatar_url":"https://avatars.githubusercontent.com/u/318108?"}}
{"id":"2489396917","type":"IssueCommentEvent","actor":{"id":3117019,"login":"robotbrain","gravatar_id":"","url":"https://api.github.com/users/robotbrain","avatar_url":"https://avatars.githubusercontent.com/u/3117019?"},"repo":{"id":12682212,"name":"MultiMC/MultiMC5","url":"https://api.github.com/repos/MultiMC/MultiMC5"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/MultiMC/MultiMC5/issues/704","labels_url":"https://api.github.com/repos/MultiMC/MultiMC5/issues/704/labels{/name}","comments_url":"https://api.github.com/repos/MultiMC/MultiMC5/issues/704/comments","events_url":"https://api.github.com/repos/MultiMC/MultiMC5/issues/704/events","html_url":"https://github.com/MultiMC/MultiMC5/issues/704","id":53210008,"number":704,"title":"Development optin","user":{"login":"bl968","id":4886192,"avatar_url":"https://avatars.githubusercontent.com/u/4886192?v=3","gravatar_id":"","url":"https://api.github.com/users/bl968","html_url":"https://github.com/bl968","followers_url":"https://api.github.com/users/bl968/followers","following_url":"https://api.github.com/users/bl968/following{/other_user}","gists_url":"https://api.github.com/users/bl968/gists{/gist_id}","starred_url":"https://api.github.com/users/bl968/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/bl968/subscriptions","organizations_url":"https://api.github.com/users/bl968/orgs","repos_url":"https://api.github.com/users/bl968/repos","events_url":"https://api.github.com/users/bl968/events{/privacy}","received_events_url":"https://api.github.com/users/bl968/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2015-01-01T00:51:03Z","updated_at":"2015-01-01T01:02:27Z","closed_at":null,"body":"Give us a checkbox to allow installation of development versions of forge and liteloader for the 
client"},"comment":{"url":"https://api.github.com/repos/MultiMC/MultiMC5/issues/comments/68477263","html_url":"https://github.com/MultiMC/MultiMC5/issues/704#issuecomment-68477263","issue_url":"https://api.github.com/repos/MultiMC/MultiMC5/issues/704","id":68477263,"user":{"login":"robotbrain","id":3117019,"avatar_url":"https://avatars.githubusercontent.com/u/3117019?v=3","gravatar_id":"","url":"https://api.github.com/users/robotbrain","html_url":"https://github.com/robotbrain","followers_url":"https://api.github.com/users/robotbrain/followers","following_url":"https://api.github.com/users/robotbrain/following{/other_user}","gists_url":"https://api.github.com/users/robotbrain/gists{/gist_id}","starred_url":"https://api.github.com/users/robotbrain/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/robotbrain/subscriptions","organizations_url":"https://api.github.com/users/robotbrain/orgs","repos_url":"https://api.github.com/users/robotbrain/repos","events_url":"https://api.github.com/users/robotbrain/events{/privacy}","received_events_url":"https://api.github.com/users/robotbrain/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:02:27Z","updated_at":"2015-01-01T01:02:27Z","body":"liteloader: no, mumfrey doesnt give us a way to do that\r\nforge: already supported for actual forge, just not fml by itself"}},"public":true,"created_at":"2015-01-01T01:02:27Z","org":{"id":5411890,"login":"MultiMC","gravatar_id":"","url":"https://api.github.com/orgs/MultiMC","avatar_url":"https://avatars.githubusercontent.com/u/5411890?"}}
{"id":"2489396923","type":"WatchEvent","actor":{"id":3087225,"login":"zephraph","gravatar_id":"","url":"https://api.github.com/users/zephraph","avatar_url":"https://avatars.githubusercontent.com/u/3087225?"},"repo":{"id":6794407,"name":"jpsarda/Pixel-based-destructible-ground-with-Cocos2d-iPhone","url":"https://api.github.com/repos/jpsarda/Pixel-based-destructible-ground-with-Cocos2d-iPhone"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:02:28Z"}
{"id":"2489396925","type":"IssuesEvent","actor":{"id":1778966,"login":"emage","gravatar_id":"","url":"https://api.github.com/users/emage","avatar_url":"https://avatars.githubusercontent.com/u/1778966?"},"repo":{"id":1653882,"name":"thoughtbot/bourbon","url":"https://api.github.com/repos/thoughtbot/bourbon"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/thoughtbot/bourbon/issues/605","labels_url":"https://api.github.com/repos/thoughtbot/bourbon/issues/605/labels{/name}","comments_url":"https://api.github.com/repos/thoughtbot/bourbon/issues/605/comments","events_url":"https://api.github.com/repos/thoughtbot/bourbon/issues/605/events","html_url":"https://github.com/thoughtbot/bourbon/issues/605","id":53210202,"number":605,"title":"Bourbon CSS error using Scout compiler on Windows","user":{"login":"emage","id":1778966,"avatar_url":"https://avatars.githubusercontent.com/u/1778966?v=3","gravatar_id":"","url":"https://api.github.com/users/emage","html_url":"https://github.com/emage","followers_url":"https://api.github.com/users/emage/followers","following_url":"https://api.github.com/users/emage/following{/other_user}","gists_url":"https://api.github.com/users/emage/gists{/gist_id}","starred_url":"https://api.github.com/users/emage/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/emage/subscriptions","organizations_url":"https://api.github.com/users/emage/orgs","repos_url":"https://api.github.com/users/emage/repos","events_url":"https://api.github.com/users/emage/events{/privacy}","received_events_url":"https://api.github.com/users/emage/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:02:28Z","updated_at":"2015-01-01T01:02:28Z","closed_at":null,"body":"I am just starting to get into SASS.  I recently installed Ruby and Bourbon on my window machine and using Scout to compile.  
Everything is going well until i import the bourbon files using:\r\n\r\n@import \"bourbon/bourbon\";\r\n\r\nI am not sure if its the Scout Compile output error or Bourbon.\r\n\r\nCompile Error:\r\n\r\nCommon error is the Invalid CSS:\r\n-------------------------------------------\r\n>>> Change detected at 16:48:33 to: main.scss\r\nerror main.scss (Line 22 of _font-source-declaration.scss: Invalid CSS after \" eot\": expected \")\", was \": $font-url +...\")\r\noverwrite main.css \r\n>>> Change detected at 16:50:46 to: bourbon/_bourbon.scss\r\nerror main.scss (Line 21 of _linear-angle-parser.scss: Invalid CSS after \" webkit-image\": expected \")\", was \": -webkit- + $p...\")\r\noverwrite main.css \r\n>>> Change detected at 16:51:01 to: main.scss\r\nerror main.scss (Line 21 of _linear-angle-parser.scss: Invalid CSS after \" webkit-image\": expected \")\", was \": -webkit- + $p...\")\r\nidentical main.css \r\n----------------------------------------------------\r\n\r\nI went into the bourbon.scss to remove the said error imported file, it just goes to the next import file and output the same error.\r\n\r\nAny thought or suggestion?\r\n\r\nThanks\r\n\r\n\r\n\r\n\r\n\r\n\r\n\r\n\r\n"}},"public":true,"created_at":"2015-01-01T01:02:28Z","org":{"id":6183,"login":"thoughtbot","gravatar_id":"","url":"https://api.github.com/orgs/thoughtbot","avatar_url":"https://avatars.githubusercontent.com/u/6183?"}}
{"id":"2489396932","type":"IssuesEvent","actor":{"id":703007,"login":"r4j4h","gravatar_id":"","url":"https://api.github.com/users/r4j4h","avatar_url":"https://avatars.githubusercontent.com/u/703007?"},"repo":{"id":14075249,"name":"zhanghuancs/D3.js-Link-Filter","url":"https://api.github.com/repos/zhanghuancs/D3.js-Link-Filter"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/zhanghuancs/D3.js-Link-Filter/issues/1","labels_url":"https://api.github.com/repos/zhanghuancs/D3.js-Link-Filter/issues/1/labels{/name}","comments_url":"https://api.github.com/repos/zhanghuancs/D3.js-Link-Filter/issues/1/comments","events_url":"https://api.github.com/repos/zhanghuancs/D3.js-Link-Filter/issues/1/events","html_url":"https://github.com/zhanghuancs/D3.js-Link-Filter/issues/1","id":53210203,"number":1,"title":"Sometimes labels get clipped","user":{"login":"r4j4h","id":703007,"avatar_url":"https://avatars.githubusercontent.com/u/703007?v=3","gravatar_id":"","url":"https://api.github.com/users/r4j4h","html_url":"https://github.com/r4j4h","followers_url":"https://api.github.com/users/r4j4h/followers","following_url":"https://api.github.com/users/r4j4h/following{/other_user}","gists_url":"https://api.github.com/users/r4j4h/gists{/gist_id}","starred_url":"https://api.github.com/users/r4j4h/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/r4j4h/subscriptions","organizations_url":"https://api.github.com/users/r4j4h/orgs","repos_url":"https://api.github.com/users/r4j4h/repos","events_url":"https://api.github.com/users/r4j4h/events{/privacy}","received_events_url":"https://api.github.com/users/r4j4h/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:02:29Z","updated_at":"2015-01-01T01:02:29Z","closed_at":null,"body":"Great work! 
I found one issue I want to raise awareness around.\r\n\r\nTo recreate, go to demo page at `http://jsfiddle.net/zhanghuancs/cuYu8/`\r\n\r\nand then\r\n\r\n1. Uncheck licensing\r\n2. Uncheck suit\r\n3. Uncheck resolved\r\n4. Recheck resolved\r\n\r\n_Notice the bottom strand has only the LG label._\r\n\r\n1. Recheck suit\r\n2. Uncheck suit\r\n\r\n_Notice how Samsung and Kodak labels are now present._\r\n\r\n"}},"public":true,"created_at":"2015-01-01T01:02:29Z"}
{"id":"2489396936","type":"PushEvent","actor":{"id":1727112,"login":"nucleardreamer","gravatar_id":"","url":"https://api.github.com/users/nucleardreamer","avatar_url":"https://avatars.githubusercontent.com/u/1727112?"},"repo":{"id":28675721,"name":"nucleardreamer/tdc","url":"https://api.github.com/repos/nucleardreamer/tdc"},"payload":{"push_id":536752725,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"07a6ae5cdb39596d5aed1b3794229968810bce1f","before":"dca862ebee0ce9425e5e9a00ab856d32f5e178e9","commits":[{"sha":"07a6ae5cdb39596d5aed1b3794229968810bce1f","author":{"email":"61996574b2cb2f66e0c7dcf5a13359213bfaba5a@gmail.com","name":"nucleardreamer"},"message":"repeating background movie","distinct":true,"url":"https://api.github.com/repos/nucleardreamer/tdc/commits/07a6ae5cdb39596d5aed1b3794229968810bce1f"}]},"public":true,"created_at":"2015-01-01T01:02:30Z"}
{"id":"2489396940","type":"CreateEvent","actor":{"id":2829718,"login":"phister","gravatar_id":"","url":"https://api.github.com/users/phister","avatar_url":"https://avatars.githubusercontent.com/u/2829718?"},"repo":{"id":28678235,"name":"phister/Cfb","url":"https://api.github.com/repos/phister/Cfb"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"College football playoffs","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:02:32Z"}
{"id":"2489396941","type":"WatchEvent","actor":{"id":5317,"login":"textgoeshere","gravatar_id":"","url":"https://api.github.com/users/textgoeshere","avatar_url":"https://avatars.githubusercontent.com/u/5317?"},"repo":{"id":146167,"name":"tyler/trie","url":"https://api.github.com/repos/tyler/trie"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:02:32Z"}
{"id":"2489396946","type":"PushEvent","actor":{"id":1031119,"login":"wavewave","gravatar_id":"","url":"https://api.github.com/users/wavewave","avatar_url":"https://avatars.githubusercontent.com/u/1031119?"},"repo":{"id":4619831,"name":"wavewave/hoodle","url":"https://api.github.com/repos/wavewave/hoodle"},"payload":{"push_id":536752730,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1fffe5741ea097ea926cf8693061f2f741da71c8","before":"482d9eb8ea9fbdbb2f39d27779dbf7dcd749db8d","commits":[{"sha":"1fffe5741ea097ea926cf8693061f2f741da71c8","author":{"email":"0a0eb067dd98769f500dabe6a55682ac6cdd3c08@gmail.com","name":"Ian-Woo Kim"},"message":"introduce RendererState in Renderer monad (simply Reader.) renderCache -> renderCacheVar using TVar for asynchronous update","distinct":true,"url":"https://api.github.com/repos/wavewave/hoodle/commits/1fffe5741ea097ea926cf8693061f2f741da71c8"}]},"public":true,"created_at":"2015-01-01T01:02:32Z"}
{"id":"2489396949","type":"PushEvent","actor":{"id":7725188,"login":"hellerve","gravatar_id":"","url":"https://api.github.com/users/hellerve","avatar_url":"https://avatars.githubusercontent.com/u/7725188?"},"repo":{"id":27544900,"name":"hellerve/hiss","url":"https://api.github.com/repos/hellerve/hiss"},"payload":{"push_id":536752732,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"55772d134ab1da7db17da6350549eee504666acb","before":"a791dd0816d3a263e215334f3f0ba936642a2251","commits":[{"sha":"55772d134ab1da7db17da6350549eee504666acb","author":{"email":"9f918abde07a882492d318338ec4304e4a124b0a@student.htw-berlin.de","name":"Veit Heller"},"message":"Removed unnecessary enum","distinct":true,"url":"https://api.github.com/repos/hellerve/hiss/commits/55772d134ab1da7db17da6350549eee504666acb"}]},"public":true,"created_at":"2015-01-01T01:02:32Z"}
{"id":"2489396950","type":"PushEvent","actor":{"id":8620186,"login":"hoorayhu","gravatar_id":"","url":"https://api.github.com/users/hoorayhu","avatar_url":"https://avatars.githubusercontent.com/u/8620186?"},"repo":{"id":28647744,"name":"hoorayhu/sodoku-cc","url":"https://api.github.com/repos/hoorayhu/sodoku-cc"},"payload":{"push_id":536752733,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"16cb1762122432f441586c990a14c948874366f7","before":"35cdf012648c32078ee0a310e39875fed02f68e0","commits":[{"sha":"16cb1762122432f441586c990a14c948874366f7","author":{"email":"042dc4512fa3d391c5170cf3aa61e6a638f84342@hoorayhu.com","name":"Hooray Hu"},"message":"Applying MVC, making it playable for alpha testing","distinct":true,"url":"https://api.github.com/repos/hoorayhu/sodoku-cc/commits/16cb1762122432f441586c990a14c948874366f7"}]},"public":true,"created_at":"2015-01-01T01:02:32Z"}
{"id":"2489396966","type":"PushEvent","actor":{"id":6565577,"login":"CurrentResident","gravatar_id":"","url":"https://api.github.com/users/CurrentResident","avatar_url":"https://avatars.githubusercontent.com/u/6565577?"},"repo":{"id":27690802,"name":"CurrentResident/MendifactQuake","url":"https://api.github.com/repos/CurrentResident/MendifactQuake"},"payload":{"push_id":536752743,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"4769846610c03ef389d6c7345e67dcf1fb4069d8","before":"42db2228115b4098670d851ab3823ac59fa890e0","commits":[{"sha":"4769846610c03ef389d6c7345e67dcf1fb4069d8","author":{"email":"828e27bdf506438b277b61a8f22de5998c7b8e91@gmail.com","name":"Jim Thoenen"},"message":"Remove some unused globals and commented-out original id code","distinct":true,"url":"https://api.github.com/repos/CurrentResident/MendifactQuake/commits/4769846610c03ef389d6c7345e67dcf1fb4069d8"}]},"public":true,"created_at":"2015-01-01T01:02:33Z"}
{"id":"2489396972","type":"IssuesEvent","actor":{"id":6964047,"login":"TTMTT","gravatar_id":"","url":"https://api.github.com/users/TTMTT","avatar_url":"https://avatars.githubusercontent.com/u/6964047?"},"repo":{"id":28678195,"name":"TTMTT/iCL0udin","url":"https://api.github.com/repos/TTMTT/iCL0udin"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1","labels_url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1/labels{/name}","comments_url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1/comments","events_url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1/events","html_url":"https://github.com/TTMTT/iCL0udin/issues/1","id":53210206,"number":1,"title":"Discuss1","user":{"login":"TTMTT","id":6964047,"avatar_url":"https://avatars.githubusercontent.com/u/6964047?v=3","gravatar_id":"","url":"https://api.github.com/users/TTMTT","html_url":"https://github.com/TTMTT","followers_url":"https://api.github.com/users/TTMTT/followers","following_url":"https://api.github.com/users/TTMTT/following{/other_user}","gists_url":"https://api.github.com/users/TTMTT/gists{/gist_id}","starred_url":"https://api.github.com/users/TTMTT/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/TTMTT/subscriptions","organizations_url":"https://api.github.com/users/TTMTT/orgs","repos_url":"https://api.github.com/users/TTMTT/repos","events_url":"https://api.github.com/users/TTMTT/events{/privacy}","received_events_url":"https://api.github.com/users/TTMTT/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:02:34Z","updated_at":"2015-01-01T01:02:34Z","closed_at":null,"body":"Now you can download vresion 1.0 from :\r\n---------------------------------------------------\r\nhttp://www.icloudin.net\r\n-----------------------------\r\nWow, ipod touch 5G (8.1) - iCL0udin v1.0 bypass activation 
(icloud)\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/tZmEdlDGNu4\r\n--------------------------------------\r\niCL0udin v1.0 bypass activation (icloud) - ipad mini 2G (7.1.1)\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/tevYyBN2QCQ\r\n---------------------------------------\r\nVideo for bypass icloud (iCL0udin v1.0) for iphone 4 CDMA ..\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/i85-D6N2YLk\r\n-------------------------------------\r\nNew video for iCL0udin v1.0 bypass icloud (3 iphones 7.1.2):\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/p51TNlCr7ug\r\n-------------------------------------\r\niCL0udin v1.0 -> %100\r\n----------------------------\r\nRemaining: %3 testing with some people..\r\n-----------------------------------------------------\r\nLast Method:\r\n-----------------\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any ios)\r\nmethod 3 : via (change some string by hex on ELF file << some times i got error)\r\nmethod 4 : via (use apple ssl cert or real ssl in server and change some string in iphone)\r\niCL0udin v1.0 have this method:\r\n-----------------------------------------\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any ios)"}},"public":true,"created_at":"2015-01-01T01:02:34Z"}
{"id":"2489396976","type":"PushEvent","actor":{"id":369807,"login":"tarr11","gravatar_id":"","url":"https://api.github.com/users/tarr11","avatar_url":"https://avatars.githubusercontent.com/u/369807?"},"repo":{"id":28670957,"name":"tarr11/wizbang","url":"https://api.github.com/repos/tarr11/wizbang"},"payload":{"push_id":536752748,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"bc001c10242651bd44db229260e70b9fa810d12e","before":"63e6a6e27a5f3ec455f526bb18c453e8cafb9854","commits":[{"sha":"bc001c10242651bd44db229260e70b9fa810d12e","author":{"email":"25c75c966e2ccc8083891108da2f841d165bf0eb@gmail.com","name":"Douglas Tarr"},"message":"Update and rename README.rdoc to README.md","distinct":true,"url":"https://api.github.com/repos/tarr11/wizbang/commits/bc001c10242651bd44db229260e70b9fa810d12e"}]},"public":true,"created_at":"2015-01-01T01:02:35Z"}
{"id":"2489396978","type":"IssuesEvent","actor":{"id":447792,"login":"nathanjsweet","gravatar_id":"","url":"https://api.github.com/users/nathanjsweet","avatar_url":"https://avatars.githubusercontent.com/u/447792?"},"repo":{"id":15714889,"name":"nathanjsweet/nodehun","url":"https://api.github.com/repos/nathanjsweet/nodehun"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/nathanjsweet/nodehun/issues/13","labels_url":"https://api.github.com/repos/nathanjsweet/nodehun/issues/13/labels{/name}","comments_url":"https://api.github.com/repos/nathanjsweet/nodehun/issues/13/comments","events_url":"https://api.github.com/repos/nathanjsweet/nodehun/issues/13/events","html_url":"https://github.com/nathanjsweet/nodehun/issues/13","id":51903837,"number":13,"title":"Memory Releasing issue","user":{"login":"nathanjsweet","id":447792,"avatar_url":"https://avatars.githubusercontent.com/u/447792?v=3","gravatar_id":"","url":"https://api.github.com/users/nathanjsweet","html_url":"https://github.com/nathanjsweet","followers_url":"https://api.github.com/users/nathanjsweet/followers","following_url":"https://api.github.com/users/nathanjsweet/following{/other_user}","gists_url":"https://api.github.com/users/nathanjsweet/gists{/gist_id}","starred_url":"https://api.github.com/users/nathanjsweet/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/nathanjsweet/subscriptions","organizations_url":"https://api.github.com/users/nathanjsweet/orgs","repos_url":"https://api.github.com/users/nathanjsweet/repos","events_url":"https://api.github.com/users/nathanjsweet/events{/privacy}","received_events_url":"https://api.github.com/users/nathanjsweet/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":{"login":"nathanjsweet","id":447792,"avatar_url":"https://avatars.githubusercontent.com/u/447792?v=3","gravatar_id":"","url":"https://api.github.com/users/nathanjsweet","html_url":"https://github.com/nathanjs
weet","followers_url":"https://api.github.com/users/nathanjsweet/followers","following_url":"https://api.github.com/users/nathanjsweet/following{/other_user}","gists_url":"https://api.github.com/users/nathanjsweet/gists{/gist_id}","starred_url":"https://api.github.com/users/nathanjsweet/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/nathanjsweet/subscriptions","organizations_url":"https://api.github.com/users/nathanjsweet/orgs","repos_url":"https://api.github.com/users/nathanjsweet/repos","events_url":"https://api.github.com/users/nathanjsweet/events{/privacy}","received_events_url":"https://api.github.com/users/nathanjsweet/received_events","type":"User","site_admin":false},"milestone":null,"comments":5,"created_at":"2014-12-14T00:03:14Z","updated_at":"2015-01-01T01:02:35Z","closed_at":"2015-01-01T01:02:35Z","body":"For Someone named Matt:\r\n\r\nHi, Nathan,\r\n\r\nI'm working on a node.js-based spell-checking service and was delighted to stumble upon [1]. Thanks for creating/maintaining this hunspell binding.\r\n\r\nI'm running into an issue, on my Mac (OSX Yosemite) where the node.js process crashes with 'Segmentation fault: 11' randomly after as few as 11 HTTP requests and up to ~100 HTTP requests.\r\n\r\nIf I cache a single nodehun instance and reuse that, I can run my test suite (contains ~5500 inputs) repeatedly.\r\n\r\nAlas, the requirement of the service is that it can accept requests for various combinations of dictionaries and word lists, so I'll likely need to create a custom instance for many requests (I can probably employ some caching).\r\n\r\nMy pattern for instantiating nodehun which produces the results above was that shown in examples/a_init.js (new nodehun(aff, dict)).\r\n\r\nI modified the code to use the pattern in g_asyncinvoke.js, and that's producing the following:\r\n\r\nnode(10787,0x103c8d000) malloc: *** error for object 0x104039008: incorrect checksum for freed object - object was probably modified after being 
freed.\r\n*** set a breakpoint in malloc_error_break to debug\r\n\r\nIn an attempt to simplify / make the problem more easy to repo, I've attached a modified version of the g_asyncinvoke.js example. It looks like the issue (hopefully equivalent to what I'm seeing in my service) can be reproduced after ~35 iterations.\r\n\r\nFWIW, I'm using 64-bit node v0.10.33.\r\n\r\nPlease let me know if I can provide additional info. I can also take this to [2] if you prefer.\r\n\r\nRegards,\r\nMatt\r\n\r\nRelevant file: https://docs.google.com/document/d/1qamzmStKEogJI3ybaJKNgT8xLiSCc2JdWAnJ-3CFk-c/edit?usp=sharing\r\n"}},"public":true,"created_at":"2015-01-01T01:02:37Z"}
{"id":"2489396977","type":"IssueCommentEvent","actor":{"id":447792,"login":"nathanjsweet","gravatar_id":"","url":"https://api.github.com/users/nathanjsweet","avatar_url":"https://avatars.githubusercontent.com/u/447792?"},"repo":{"id":15714889,"name":"nathanjsweet/nodehun","url":"https://api.github.com/repos/nathanjsweet/nodehun"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/nathanjsweet/nodehun/issues/13","labels_url":"https://api.github.com/repos/nathanjsweet/nodehun/issues/13/labels{/name}","comments_url":"https://api.github.com/repos/nathanjsweet/nodehun/issues/13/comments","events_url":"https://api.github.com/repos/nathanjsweet/nodehun/issues/13/events","html_url":"https://github.com/nathanjsweet/nodehun/issues/13","id":51903837,"number":13,"title":"Memory Releasing issue","user":{"login":"nathanjsweet","id":447792,"avatar_url":"https://avatars.githubusercontent.com/u/447792?v=3","gravatar_id":"","url":"https://api.github.com/users/nathanjsweet","html_url":"https://github.com/nathanjsweet","followers_url":"https://api.github.com/users/nathanjsweet/followers","following_url":"https://api.github.com/users/nathanjsweet/following{/other_user}","gists_url":"https://api.github.com/users/nathanjsweet/gists{/gist_id}","starred_url":"https://api.github.com/users/nathanjsweet/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/nathanjsweet/subscriptions","organizations_url":"https://api.github.com/users/nathanjsweet/orgs","repos_url":"https://api.github.com/users/nathanjsweet/repos","events_url":"https://api.github.com/users/nathanjsweet/events{/privacy}","received_events_url":"https://api.github.com/users/nathanjsweet/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":{"login":"nathanjsweet","id":447792,"avatar_url":"https://avatars.githubusercontent.com/u/447792?v=3","gravatar_id":"","url":"https://api.github.com/users/nathanjsweet","html_url":"https://github.com/n
athanjsweet","followers_url":"https://api.github.com/users/nathanjsweet/followers","following_url":"https://api.github.com/users/nathanjsweet/following{/other_user}","gists_url":"https://api.github.com/users/nathanjsweet/gists{/gist_id}","starred_url":"https://api.github.com/users/nathanjsweet/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/nathanjsweet/subscriptions","organizations_url":"https://api.github.com/users/nathanjsweet/orgs","repos_url":"https://api.github.com/users/nathanjsweet/repos","events_url":"https://api.github.com/users/nathanjsweet/events{/privacy}","received_events_url":"https://api.github.com/users/nathanjsweet/received_events","type":"User","site_admin":false},"milestone":null,"comments":5,"created_at":"2014-12-14T00:03:14Z","updated_at":"2015-01-01T01:02:35Z","closed_at":"2015-01-01T01:02:35Z","body":"For Someone named Matt:\r\n\r\nHi, Nathan,\r\n\r\nI'm working on a node.js-based spell-checking service and was delighted to stumble upon [1]. 
Thanks for creating/maintaining this hunspell binding.\r\n\r\nI'm running into an issue, on my Mac (OSX Yosemite) where the node.js process crashes with 'Segmentation fault: 11' randomly after as few as 11 HTTP requests and up to ~100 HTTP requests.\r\n\r\nIf I cache a single nodehun instance and reuse that, I can run my test suite (contains ~5500 inputs) repeatedly.\r\n\r\nAlas, the requirement of the service is that it can accept requests for various combinations of dictionaries and word lists, so I'll likely need to create a custom instance for many requests (I can probably employ some caching).\r\n\r\nMy pattern for instantiating nodehun which produces the results above was that shown in examples/a_init.js (new nodehun(aff, dict)).\r\n\r\nI modified the code to use the pattern in g_asyncinvoke.js, and that's producing the following:\r\n\r\nnode(10787,0x103c8d000) malloc: *** error for object 0x104039008: incorrect checksum for freed object - object was probably modified after being freed.\r\n*** set a breakpoint in malloc_error_break to debug\r\n\r\nIn an attempt to simplify / make the problem more easy to repo, I've attached a modified version of the g_asyncinvoke.js example. It looks like the issue (hopefully equivalent to what I'm seeing in my service) can be reproduced after ~35 iterations.\r\n\r\nFWIW, I'm using 64-bit node v0.10.33.\r\n\r\nPlease let me know if I can provide additional info. 
I can also take this to [2] if you prefer.\r\n\r\nRegards,\r\nMatt\r\n\r\nRelevant file: https://docs.google.com/document/d/1qamzmStKEogJI3ybaJKNgT8xLiSCc2JdWAnJ-3CFk-c/edit?usp=sharing\r\n"},"comment":{"url":"https://api.github.com/repos/nathanjsweet/nodehun/issues/comments/68477264","html_url":"https://github.com/nathanjsweet/nodehun/issues/13#issuecomment-68477264","issue_url":"https://api.github.com/repos/nathanjsweet/nodehun/issues/13","id":68477264,"user":{"login":"nathanjsweet","id":447792,"avatar_url":"https://avatars.githubusercontent.com/u/447792?v=3","gravatar_id":"","url":"https://api.github.com/users/nathanjsweet","html_url":"https://github.com/nathanjsweet","followers_url":"https://api.github.com/users/nathanjsweet/followers","following_url":"https://api.github.com/users/nathanjsweet/following{/other_user}","gists_url":"https://api.github.com/users/nathanjsweet/gists{/gist_id}","starred_url":"https://api.github.com/users/nathanjsweet/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/nathanjsweet/subscriptions","organizations_url":"https://api.github.com/users/nathanjsweet/orgs","repos_url":"https://api.github.com/users/nathanjsweet/repos","events_url":"https://api.github.com/users/nathanjsweet/events{/privacy}","received_events_url":"https://api.github.com/users/nathanjsweet/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:02:35Z","updated_at":"2015-01-01T01:02:35Z","body":"Matt,\r\nI'm not on Yosemite, yet, I will update later to check this out. I'm hoping that you plan on deploying on a linux server. If that's the case, then I would say you shouldn't have to worry about this issue (I've tested this script on several linux boxes and they all worked fine).\r\n\r\nThis is going to sound like a cop out, but OSX sucks. I run into all sorts of memory and segmentation issues that just don't crop up on linux (32 bit or 64) or even windows (again 32/64). 
I have personally played around a lot with libuv on my macbook and my impression of the teams for it, v8, and nodeJS is that apple is an afterthought for them.\r\n\r\nFor example, there are many hacks out there to get node to work around the 256 file-descriptor per process limit on OSX, but nobody has bothered to include any of these into libuv or node.\r\n\r\nI'm going to mark this issue as closed for now. If this ever becomes an issue on linux or windows let me know.\r\nThanks,\r\nNate"}},"public":true,"created_at":"2015-01-01T01:02:37Z"}
{"id":"2489396985","type":"PushEvent","actor":{"id":433707,"login":"ile","gravatar_id":"","url":"https://api.github.com/users/ile","avatar_url":"https://avatars.githubusercontent.com/u/433707?"},"repo":{"id":26847132,"name":"kantele/k-templates","url":"https://api.github.com/repos/kantele/k-templates"},"payload":{"push_id":536752750,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"53ba5e0e3194a42192f5aa9f9cd3fd2d79281ce4","before":"d989a60a4e050573d9ba85048499d9a0a7e8117e","commits":[{"sha":"53ba5e0e3194a42192f5aa9f9cd3fd2d79281ce4","author":{"email":"4f3407de78bccc8cc160ee4d278d5efe7162e6b5@nateps.com","name":"Nate Smith"},"message":"fix binding issues with relative paths etc; don't add bindings for each items or with blocks\n\nConflicts:\n\tpackage.json","distinct":true,"url":"https://api.github.com/repos/kantele/k-templates/commits/53ba5e0e3194a42192f5aa9f9cd3fd2d79281ce4"}]},"public":true,"created_at":"2015-01-01T01:02:37Z","org":{"id":5687585,"login":"kantele","gravatar_id":"","url":"https://api.github.com/orgs/kantele","avatar_url":"https://avatars.githubusercontent.com/u/5687585?"}}
{"id":"2489396987","type":"PushEvent","actor":{"id":6287026,"login":"unixabg","gravatar_id":"","url":"https://api.github.com/users/unixabg","avatar_url":"https://avatars.githubusercontent.com/u/6287026?"},"repo":{"id":23363281,"name":"unixabg/ts-yt-dl","url":"https://api.github.com/repos/unixabg/ts-yt-dl"},"payload":{"push_id":536752753,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"cc14de8e1f3c8402100c787405c1b8ef420978af","before":"d4fd67f93ff9f5ba614b0df495f67843f96c3b6c","commits":[{"sha":"cc14de8e1f3c8402100c787405c1b8ef420978af","author":{"email":"82b6c79a2ca714d2dcf70b1e2e7c5fc1711a4b07@gmail.com","name":"Richard Nelson"},"message":"Added youtube-dl version to scripts/support.php.","distinct":true,"url":"https://api.github.com/repos/unixabg/ts-yt-dl/commits/cc14de8e1f3c8402100c787405c1b8ef420978af"}]},"public":true,"created_at":"2015-01-01T01:02:37Z"}
{"id":"2489396988","type":"IssueCommentEvent","actor":{"id":2188638,"login":"manuel-rubio","gravatar_id":"","url":"https://api.github.com/users/manuel-rubio","avatar_url":"https://avatars.githubusercontent.com/u/2188638?"},"repo":{"id":1035547,"name":"inaka/apns4erl","url":"https://api.github.com/repos/inaka/apns4erl"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/inaka/apns4erl/issues/39","labels_url":"https://api.github.com/repos/inaka/apns4erl/issues/39/labels{/name}","comments_url":"https://api.github.com/repos/inaka/apns4erl/issues/39/comments","events_url":"https://api.github.com/repos/inaka/apns4erl/issues/39/events","html_url":"https://github.com/inaka/apns4erl/pull/39","id":53184390,"number":39,"title":"APNS resend queue","user":{"login":"alexdruzhilov","id":490425,"avatar_url":"https://avatars.githubusercontent.com/u/490425?v=3","gravatar_id":"","url":"https://api.github.com/users/alexdruzhilov","html_url":"https://github.com/alexdruzhilov","followers_url":"https://api.github.com/users/alexdruzhilov/followers","following_url":"https://api.github.com/users/alexdruzhilov/following{/other_user}","gists_url":"https://api.github.com/users/alexdruzhilov/gists{/gist_id}","starred_url":"https://api.github.com/users/alexdruzhilov/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/alexdruzhilov/subscriptions","organizations_url":"https://api.github.com/users/alexdruzhilov/orgs","repos_url":"https://api.github.com/users/alexdruzhilov/repos","events_url":"https://api.github.com/users/alexdruzhilov/events{/privacy}","received_events_url":"https://api.github.com/users/alexdruzhilov/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2014-12-31T13:40:31Z","updated_at":"2015-01-01T01:02:37Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/inaka/apns4erl/pulls/39","html_url":"https://github.com/inaka/a
pns4erl/pull/39","diff_url":"https://github.com/inaka/apns4erl/pull/39.diff","patch_url":"https://github.com/inaka/apns4erl/pull/39.patch"},"body":"Fix for issue https://github.com/inaka/apns4erl/issues/17\r\n\r\nCommit is adopted for version 1.0.2 from two commits:\r\nhttps://github.com/altenwald/apns4erl/commit/06431ef47ce3593ce0635375f0ba786cea9fecae\r\nhttps://github.com/altenwald/apns4erl/commit/618e52cb350742f4391d35768f20c4e1619061d0"},"comment":{"url":"https://api.github.com/repos/inaka/apns4erl/issues/comments/68477265","html_url":"https://github.com/inaka/apns4erl/pull/39#issuecomment-68477265","issue_url":"https://api.github.com/repos/inaka/apns4erl/issues/39","id":68477265,"user":{"login":"manuel-rubio","id":2188638,"avatar_url":"https://avatars.githubusercontent.com/u/2188638?v=3","gravatar_id":"","url":"https://api.github.com/users/manuel-rubio","html_url":"https://github.com/manuel-rubio","followers_url":"https://api.github.com/users/manuel-rubio/followers","following_url":"https://api.github.com/users/manuel-rubio/following{/other_user}","gists_url":"https://api.github.com/users/manuel-rubio/gists{/gist_id}","starred_url":"https://api.github.com/users/manuel-rubio/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/manuel-rubio/subscriptions","organizations_url":"https://api.github.com/users/manuel-rubio/orgs","repos_url":"https://api.github.com/users/manuel-rubio/repos","events_url":"https://api.github.com/users/manuel-rubio/events{/privacy}","received_events_url":"https://api.github.com/users/manuel-rubio/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:02:37Z","updated_at":"2015-01-01T01:02:37Z","body":"Fixed: altenwald/apns4erl@b59e7a0"}},"public":true,"created_at":"2015-01-01T01:02:37Z","org":{"id":867053,"login":"inaka","gravatar_id":"","url":"https://api.github.com/orgs/inaka","avatar_url":"https://avatars.githubusercontent.com/u/867053?"}}
{"id":"2489396992","type":"PushEvent","actor":{"id":3960243,"login":"wp-plugins-user","gravatar_id":"","url":"https://api.github.com/users/wp-plugins-user","avatar_url":"https://avatars.githubusercontent.com/u/3960243?"},"repo":{"id":19549672,"name":"wp-plugins/facebook-secret-meta","url":"https://api.github.com/repos/wp-plugins/facebook-secret-meta"},"payload":{"push_id":536752756,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"4302987080a9f480e078903f1fb948b025beed8c","before":"8623e15f41d0186a6ce8cd402c06ba3299a96577","commits":[{"sha":"4302987080a9f480e078903f1fb948b025beed8c","author":{"email":"c84fcc9b3d1ea987f4c82b2df8285ca158ac8f6b@b8457f37-d9ea-0310-8a92-e5e31aec5664","name":"Asif2BD"},"message":"4.1 version compatible\n\ngit-svn-id: https://plugins.svn.wordpress.org/facebook-secret-meta/trunk@1057713 b8457f37-d9ea-0310-8a92-e5e31aec5664","distinct":true,"url":"https://api.github.com/repos/wp-plugins/facebook-secret-meta/commits/4302987080a9f480e078903f1fb948b025beed8c"}]},"public":true,"created_at":"2015-01-01T01:02:37Z","org":{"id":2996849,"login":"wp-plugins","gravatar_id":"","url":"https://api.github.com/orgs/wp-plugins","avatar_url":"https://avatars.githubusercontent.com/u/2996849?"}}
{"id":"2489396995","type":"IssueCommentEvent","actor":{"id":1238621,"login":"Corosauce","gravatar_id":"","url":"https://api.github.com/users/Corosauce","avatar_url":"https://avatars.githubusercontent.com/u/1238621?"},"repo":{"id":19960516,"name":"Corosauce/weather2","url":"https://api.github.com/repos/Corosauce/weather2"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/Corosauce/weather2/issues/2","labels_url":"https://api.github.com/repos/Corosauce/weather2/issues/2/labels{/name}","comments_url":"https://api.github.com/repos/Corosauce/weather2/issues/2/comments","events_url":"https://api.github.com/repos/Corosauce/weather2/issues/2/events","html_url":"https://github.com/Corosauce/weather2/issues/2","id":52972104,"number":2,"title":"Support for snow from other mods","user":{"login":"dexman545","id":4873274,"avatar_url":"https://avatars.githubusercontent.com/u/4873274?v=3","gravatar_id":"","url":"https://api.github.com/users/dexman545","html_url":"https://github.com/dexman545","followers_url":"https://api.github.com/users/dexman545/followers","following_url":"https://api.github.com/users/dexman545/following{/other_user}","gists_url":"https://api.github.com/users/dexman545/gists{/gist_id}","starred_url":"https://api.github.com/users/dexman545/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/dexman545/subscriptions","organizations_url":"https://api.github.com/users/dexman545/orgs","repos_url":"https://api.github.com/users/dexman545/repos","events_url":"https://api.github.com/users/dexman545/events{/privacy}","received_events_url":"https://api.github.com/users/dexman545/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":3,"created_at":"2014-12-28T03:55:02Z","updated_at":"2015-01-01T01:02:37Z","closed_at":"2015-01-01T01:02:37Z","body":"Would it be possible to change Blocks.snow in StormObject.java to Material.snow so that mods that 
add their own snow will be populated on the ground? In a discussion with one of the TFC devs, this was theorized as a possible solution to Weather 2's storms not placing snow.\r\n\r\n(http://terrafirmacraft.com/f/topic/6945-1710-technofirma-mod-pack/page-5#entry101107)\r\n\r\nThank you, \r\ndex"},"comment":{"url":"https://api.github.com/repos/Corosauce/weather2/issues/comments/68477266","html_url":"https://github.com/Corosauce/weather2/issues/2#issuecomment-68477266","issue_url":"https://api.github.com/repos/Corosauce/weather2/issues/2","id":68477266,"user":{"login":"Corosauce","id":1238621,"avatar_url":"https://avatars.githubusercontent.com/u/1238621?v=3","gravatar_id":"","url":"https://api.github.com/users/Corosauce","html_url":"https://github.com/Corosauce","followers_url":"https://api.github.com/users/Corosauce/followers","following_url":"https://api.github.com/users/Corosauce/following{/other_user}","gists_url":"https://api.github.com/users/Corosauce/gists{/gist_id}","starred_url":"https://api.github.com/users/Corosauce/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Corosauce/subscriptions","organizations_url":"https://api.github.com/users/Corosauce/orgs","repos_url":"https://api.github.com/users/Corosauce/repos","events_url":"https://api.github.com/users/Corosauce/events{/privacy}","received_events_url":"https://api.github.com/users/Corosauce/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:02:37Z","updated_at":"2015-01-01T01:02:37Z","body":"Hmm yeah, still sounds better than the current situation so I'll do what I can on my part with checking against material type instead of block and we'll see how it plays together in the future."}},"public":true,"created_at":"2015-01-01T01:02:37Z"}
{"id":"2489396996","type":"IssuesEvent","actor":{"id":1238621,"login":"Corosauce","gravatar_id":"","url":"https://api.github.com/users/Corosauce","avatar_url":"https://avatars.githubusercontent.com/u/1238621?"},"repo":{"id":19960516,"name":"Corosauce/weather2","url":"https://api.github.com/repos/Corosauce/weather2"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/Corosauce/weather2/issues/2","labels_url":"https://api.github.com/repos/Corosauce/weather2/issues/2/labels{/name}","comments_url":"https://api.github.com/repos/Corosauce/weather2/issues/2/comments","events_url":"https://api.github.com/repos/Corosauce/weather2/issues/2/events","html_url":"https://github.com/Corosauce/weather2/issues/2","id":52972104,"number":2,"title":"Support for snow from other mods","user":{"login":"dexman545","id":4873274,"avatar_url":"https://avatars.githubusercontent.com/u/4873274?v=3","gravatar_id":"","url":"https://api.github.com/users/dexman545","html_url":"https://github.com/dexman545","followers_url":"https://api.github.com/users/dexman545/followers","following_url":"https://api.github.com/users/dexman545/following{/other_user}","gists_url":"https://api.github.com/users/dexman545/gists{/gist_id}","starred_url":"https://api.github.com/users/dexman545/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/dexman545/subscriptions","organizations_url":"https://api.github.com/users/dexman545/orgs","repos_url":"https://api.github.com/users/dexman545/repos","events_url":"https://api.github.com/users/dexman545/events{/privacy}","received_events_url":"https://api.github.com/users/dexman545/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":3,"created_at":"2014-12-28T03:55:02Z","updated_at":"2015-01-01T01:02:37Z","closed_at":"2015-01-01T01:02:37Z","body":"Would it be possible to change Blocks.snow in StormObject.java to Material.snow so that mods that add 
their own snow will be populated on the ground? In a discussion with one of the TFC devs, this was theorized as a possible solution to Weather 2's storms not placing snow.\r\n\r\n(http://terrafirmacraft.com/f/topic/6945-1710-technofirma-mod-pack/page-5#entry101107)\r\n\r\nThank you, \r\ndex"}},"public":true,"created_at":"2015-01-01T01:02:37Z"}
{"id":"2489396997","type":"PushEvent","actor":{"id":498666,"login":"yaboyanees","gravatar_id":"","url":"https://api.github.com/users/yaboyanees","avatar_url":"https://avatars.githubusercontent.com/u/498666?"},"repo":{"id":28573192,"name":"yaboyanees/audibleDSS","url":"https://api.github.com/repos/yaboyanees/audibleDSS"},"payload":{"push_id":536752758,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"7213655448351edf7420c7ffc675bf9fe08348b3","before":"5f3e41d9a87b429dbf00877aba66f68b99664803","commits":[{"sha":"7213655448351edf7420c7ffc675bf9fe08348b3","author":{"email":"26e9cab5de48070b64acff125a9ff6569947913f@yahoo.com","name":"yaboyanees"},"message":"cleaning up views with css and small form formatting","distinct":true,"url":"https://api.github.com/repos/yaboyanees/audibleDSS/commits/7213655448351edf7420c7ffc675bf9fe08348b3"}]},"public":true,"created_at":"2015-01-01T01:02:37Z"}
{"id":"2489397003","type":"WatchEvent","actor":{"id":630099,"login":"Nevyn357","gravatar_id":"","url":"https://api.github.com/users/Nevyn357","avatar_url":"https://avatars.githubusercontent.com/u/630099?"},"repo":{"id":8668792,"name":"ilirb/ahk-scripts","url":"https://api.github.com/repos/ilirb/ahk-scripts"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:02:39Z"}
{"id":"2489397005","type":"PushEvent","actor":{"id":7046289,"login":"ValentinGabriel","gravatar_id":"","url":"https://api.github.com/users/ValentinGabriel","avatar_url":"https://avatars.githubusercontent.com/u/7046289?"},"repo":{"id":28188264,"name":"Jeremj0/RebootFactory","url":"https://api.github.com/repos/Jeremj0/RebootFactory"},"payload":{"push_id":536752759,"size":1,"distinct_size":1,"ref":"refs/heads/Master","head":"966dfc06ccc1c565f5a91f6ae9b5b71501d8d6cb","before":"4eaaa79af7f99f45c706c3745f5c56b46ba14a4b","commits":[{"sha":"966dfc06ccc1c565f5a91f6ae9b5b71501d8d6cb","author":{"email":"40615740715968d1630b9e998e85827713fc82bb@hotmail.fr","name":"ValentinGabriel"},"message":"Etude de cas\n\nhtml et css quasi vierge, à compléter.","distinct":true,"url":"https://api.github.com/repos/Jeremj0/RebootFactory/commits/966dfc06ccc1c565f5a91f6ae9b5b71501d8d6cb"}]},"public":true,"created_at":"2015-01-01T01:02:40Z"}
{"id":"2489397007","type":"PushEvent","actor":{"id":8819701,"login":"r-ggraham","gravatar_id":"","url":"https://api.github.com/users/r-ggraham","avatar_url":"https://avatars.githubusercontent.com/u/8819701?"},"repo":{"id":28678173,"name":"r-ggraham/Crumpet_Bot","url":"https://api.github.com/repos/r-ggraham/Crumpet_Bot"},"payload":{"push_id":536752761,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"51951542e9d518f59ff62753725e5186d4111822","before":"332746658edcc60bca17720fce153357a2cd9dfb","commits":[{"sha":"51951542e9d518f59ff62753725e5186d4111822","author":{"email":"f2f9dd43aa4244d32208a2ccfa0c7c9e9c48f7e7@uni.worc.ac.uk","name":"Rob G"},"message":"Remove .gitFiles","distinct":true,"url":"https://api.github.com/repos/r-ggraham/Crumpet_Bot/commits/51951542e9d518f59ff62753725e5186d4111822"}]},"public":true,"created_at":"2015-01-01T01:02:40Z"}
{"id":"2489397015","type":"PushEvent","actor":{"id":3960243,"login":"wp-plugins-user","gravatar_id":"","url":"https://api.github.com/users/wp-plugins-user","avatar_url":"https://avatars.githubusercontent.com/u/3960243?"},"repo":{"id":27287679,"name":"wp-plugins/woocommerce-eu-vat-compliance","url":"https://api.github.com/repos/wp-plugins/woocommerce-eu-vat-compliance"},"payload":{"push_id":536752764,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"af0132f4527cc3eaa4838c86c7280d4a304ad9f8","before":"4d08fb010b86a14f694d7ae6ebe0e169379072be","commits":[{"sha":"af0132f4527cc3eaa4838c86c7280d4a304ad9f8","author":{"email":"77d7830c4a7293f46a95bf3929d24b006a29ede7@b8457f37-d9ea-0310-8a92-e5e31aec5664","name":"DavidAnderson"},"message":"1.6.7\n\ngit-svn-id: https://plugins.svn.wordpress.org/woocommerce-eu-vat-compliance/trunk@1057712 b8457f37-d9ea-0310-8a92-e5e31aec5664","distinct":true,"url":"https://api.github.com/repos/wp-plugins/woocommerce-eu-vat-compliance/commits/af0132f4527cc3eaa4838c86c7280d4a304ad9f8"}]},"public":true,"created_at":"2015-01-01T01:02:41Z","org":{"id":2996849,"login":"wp-plugins","gravatar_id":"","url":"https://api.github.com/orgs/wp-plugins","avatar_url":"https://avatars.githubusercontent.com/u/2996849?"}}
{"id":"2489397016","type":"IssueCommentEvent","actor":{"id":2829600,"login":"GrahamCampbell","gravatar_id":"","url":"https://api.github.com/users/GrahamCampbell","avatar_url":"https://avatars.githubusercontent.com/u/2829600?"},"repo":{"id":26730195,"name":"cachethq/Cachet","url":"https://api.github.com/repos/cachethq/Cachet"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/cachethq/Cachet/issues/173","labels_url":"https://api.github.com/repos/cachethq/Cachet/issues/173/labels{/name}","comments_url":"https://api.github.com/repos/cachethq/Cachet/issues/173/comments","events_url":"https://api.github.com/repos/cachethq/Cachet/issues/173/events","html_url":"https://github.com/cachethq/Cachet/issues/173","id":53210024,"number":173,"title":"Bug: Forms let you submit multiple times","user":{"login":"Jamesking56","id":253237,"avatar_url":"https://avatars.githubusercontent.com/u/253237?v=3","gravatar_id":"","url":"https://api.github.com/users/Jamesking56","html_url":"https://github.com/Jamesking56","followers_url":"https://api.github.com/users/Jamesking56/followers","following_url":"https://api.github.com/users/Jamesking56/following{/other_user}","gists_url":"https://api.github.com/users/Jamesking56/gists{/gist_id}","starred_url":"https://api.github.com/users/Jamesking56/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Jamesking56/subscriptions","organizations_url":"https://api.github.com/users/Jamesking56/orgs","repos_url":"https://api.github.com/users/Jamesking56/repos","events_url":"https://api.github.com/users/Jamesking56/events{/privacy}","received_events_url":"https://api.github.com/users/Jamesking56/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":5,"created_at":"2015-01-01T00:52:06Z","updated_at":"2015-01-01T01:02:40Z","closed_at":null,"body":"When adding a new incident, I noticed a weird bug.\r\n\r\nIf you fill in the form as 
normal, then click the submit button twice really quickly, it'll create __TWO__ identical new incidents!\r\n\r\nThis could be a bit annoying, a simple fix is using a bit of JS that on submit, disables the submit button so that once clicked, it cannot be clicked again."},"comment":{"url":"https://api.github.com/repos/cachethq/Cachet/issues/comments/68477269","html_url":"https://github.com/cachethq/Cachet/issues/173#issuecomment-68477269","issue_url":"https://api.github.com/repos/cachethq/Cachet/issues/173","id":68477269,"user":{"login":"GrahamCampbell","id":2829600,"avatar_url":"https://avatars.githubusercontent.com/u/2829600?v=3","gravatar_id":"","url":"https://api.github.com/users/GrahamCampbell","html_url":"https://github.com/GrahamCampbell","followers_url":"https://api.github.com/users/GrahamCampbell/followers","following_url":"https://api.github.com/users/GrahamCampbell/following{/other_user}","gists_url":"https://api.github.com/users/GrahamCampbell/gists{/gist_id}","starred_url":"https://api.github.com/users/GrahamCampbell/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/GrahamCampbell/subscriptions","organizations_url":"https://api.github.com/users/GrahamCampbell/orgs","repos_url":"https://api.github.com/users/GrahamCampbell/repos","events_url":"https://api.github.com/users/GrahamCampbell/events{/privacy}","received_events_url":"https://api.github.com/users/GrahamCampbell/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:02:40Z","updated_at":"2015-01-01T01:02:40Z","body":"No, it doesn't. That's something different. It doesn't prevent multiple submissions of a form."}},"public":true,"created_at":"2015-01-01T01:02:41Z","org":{"id":9951502,"login":"cachethq","gravatar_id":"","url":"https://api.github.com/orgs/cachethq","avatar_url":"https://avatars.githubusercontent.com/u/9951502?"}}
{"id":"2489397020","type":"PullRequestEvent","actor":{"id":5573038,"login":"CorruptComputer","gravatar_id":"","url":"https://api.github.com/users/CorruptComputer","avatar_url":"https://avatars.githubusercontent.com/u/5573038?"},"repo":{"id":28371640,"name":"AsteroidStation/-tg-station","url":"https://api.github.com/repos/AsteroidStation/-tg-station"},"payload":{"action":"opened","number":8,"pull_request":{"url":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/8","id":26739422,"html_url":"https://github.com/AsteroidStation/-tg-station/pull/8","diff_url":"https://github.com/AsteroidStation/-tg-station/pull/8.diff","patch_url":"https://github.com/AsteroidStation/-tg-station/pull/8.patch","issue_url":"https://api.github.com/repos/AsteroidStation/-tg-station/issues/8","number":8,"state":"open","locked":false,"title":"tg update","user":{"login":"CorruptComputer","id":5573038,"avatar_url":"https://avatars.githubusercontent.com/u/5573038?v=3","gravatar_id":"","url":"https://api.github.com/users/CorruptComputer","html_url":"https://github.com/CorruptComputer","followers_url":"https://api.github.com/users/CorruptComputer/followers","following_url":"https://api.github.com/users/CorruptComputer/following{/other_user}","gists_url":"https://api.github.com/users/CorruptComputer/gists{/gist_id}","starred_url":"https://api.github.com/users/CorruptComputer/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/CorruptComputer/subscriptions","organizations_url":"https://api.github.com/users/CorruptComputer/orgs","repos_url":"https://api.github.com/users/CorruptComputer/repos","events_url":"https://api.github.com/users/CorruptComputer/events{/privacy}","received_events_url":"https://api.github.com/users/CorruptComputer/received_events","type":"User","site_admin":false},"body":"","created_at":"2015-01-01T01:02:41Z","updated_at":"2015-01-01T01:02:41Z","closed_at":null,"merged_at":null,"merge_commit_sha":null,"assignee":null,"milestone":null,"commits_url"
:"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/8/commits","review_comments_url":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/8/comments","review_comment_url":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/comments/{number}","comments_url":"https://api.github.com/repos/AsteroidStation/-tg-station/issues/8/comments","statuses_url":"https://api.github.com/repos/AsteroidStation/-tg-station/statuses/34c4c027770518e2087db44a89cad07cd91ceb84","head":{"label":"tgstation:master","ref":"master","sha":"34c4c027770518e2087db44a89cad07cd91ceb84","user":{"login":"tgstation","id":1363778,"avatar_url":"https://avatars.githubusercontent.com/u/1363778?v=3","gravatar_id":"","url":"https://api.github.com/users/tgstation","html_url":"https://github.com/tgstation","followers_url":"https://api.github.com/users/tgstation/followers","following_url":"https://api.github.com/users/tgstation/following{/other_user}","gists_url":"https://api.github.com/users/tgstation/gists{/gist_id}","starred_url":"https://api.github.com/users/tgstation/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/tgstation/subscriptions","organizations_url":"https://api.github.com/users/tgstation/orgs","repos_url":"https://api.github.com/users/tgstation/repos","events_url":"https://api.github.com/users/tgstation/events{/privacy}","received_events_url":"https://api.github.com/users/tgstation/received_events","type":"Organization","site_admin":false},"repo":{"id":3234987,"name":"-tg-station","full_name":"tgstation/-tg-station","owner":{"login":"tgstation","id":1363778,"avatar_url":"https://avatars.githubusercontent.com/u/1363778?v=3","gravatar_id":"","url":"https://api.github.com/users/tgstation","html_url":"https://github.com/tgstation","followers_url":"https://api.github.com/users/tgstation/followers","following_url":"https://api.github.com/users/tgstation/following{/other_user}","gists_url":"https://api.github.com/users/tgstation/gists{/gist_id}
","starred_url":"https://api.github.com/users/tgstation/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/tgstation/subscriptions","organizations_url":"https://api.github.com/users/tgstation/orgs","repos_url":"https://api.github.com/users/tgstation/repos","events_url":"https://api.github.com/users/tgstation/events{/privacy}","received_events_url":"https://api.github.com/users/tgstation/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/tgstation/-tg-station","description":"/tg/'s SS13 branch","fork":false,"url":"https://api.github.com/repos/tgstation/-tg-station","forks_url":"https://api.github.com/repos/tgstation/-tg-station/forks","keys_url":"https://api.github.com/repos/tgstation/-tg-station/keys{/key_id}","collaborators_url":"https://api.github.com/repos/tgstation/-tg-station/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/tgstation/-tg-station/teams","hooks_url":"https://api.github.com/repos/tgstation/-tg-station/hooks","issue_events_url":"https://api.github.com/repos/tgstation/-tg-station/issues/events{/number}","events_url":"https://api.github.com/repos/tgstation/-tg-station/events","assignees_url":"https://api.github.com/repos/tgstation/-tg-station/assignees{/user}","branches_url":"https://api.github.com/repos/tgstation/-tg-station/branches{/branch}","tags_url":"https://api.github.com/repos/tgstation/-tg-station/tags","blobs_url":"https://api.github.com/repos/tgstation/-tg-station/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/tgstation/-tg-station/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/tgstation/-tg-station/git/refs{/sha}","trees_url":"https://api.github.com/repos/tgstation/-tg-station/git/trees{/sha}","statuses_url":"https://api.github.com/repos/tgstation/-tg-station/statuses/{sha}","languages_url":"https://api.github.com/repos/tgstation/-tg-station/languages","stargazers_url":"https://api.github.com/repos/tgstation/-t
g-station/stargazers","contributors_url":"https://api.github.com/repos/tgstation/-tg-station/contributors","subscribers_url":"https://api.github.com/repos/tgstation/-tg-station/subscribers","subscription_url":"https://api.github.com/repos/tgstation/-tg-station/subscription","commits_url":"https://api.github.com/repos/tgstation/-tg-station/commits{/sha}","git_commits_url":"https://api.github.com/repos/tgstation/-tg-station/git/commits{/sha}","comments_url":"https://api.github.com/repos/tgstation/-tg-station/comments{/number}","issue_comment_url":"https://api.github.com/repos/tgstation/-tg-station/issues/comments/{number}","contents_url":"https://api.github.com/repos/tgstation/-tg-station/contents/{+path}","compare_url":"https://api.github.com/repos/tgstation/-tg-station/compare/{base}...{head}","merges_url":"https://api.github.com/repos/tgstation/-tg-station/merges","archive_url":"https://api.github.com/repos/tgstation/-tg-station/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/tgstation/-tg-station/downloads","issues_url":"https://api.github.com/repos/tgstation/-tg-station/issues{/number}","pulls_url":"https://api.github.com/repos/tgstation/-tg-station/pulls{/number}","milestones_url":"https://api.github.com/repos/tgstation/-tg-station/milestones{/number}","notifications_url":"https://api.github.com/repos/tgstation/-tg-station/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/tgstation/-tg-station/labels{/name}","releases_url":"https://api.github.com/repos/tgstation/-tg-station/releases{/id}","created_at":"2012-01-21T17:32:47Z","updated_at":"2015-01-01T00:47:49Z","pushed_at":"2015-01-01T00:47:48Z","git_url":"git://github.com/tgstation/-tg-station.git","ssh_url":"git@github.com:tgstation/-tg-station.git","clone_url":"https://github.com/tgstation/-tg-station.git","svn_url":"https://github.com/tgstation/-tg-station","homepage":"http://www.tgstation13.org/","size":550715,"stargazers_count":172,"watchers_count":172,
"language":"DM","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":609,"mirror_url":null,"open_issues_count":618,"forks":609,"open_issues":618,"watchers":172,"default_branch":"master"}},"base":{"label":"AsteroidStation:master","ref":"master","sha":"d98abaabaa971c9092a200961915c9e60015ab20","user":{"login":"AsteroidStation","id":9313156,"avatar_url":"https://avatars.githubusercontent.com/u/9313156?v=3","gravatar_id":"","url":"https://api.github.com/users/AsteroidStation","html_url":"https://github.com/AsteroidStation","followers_url":"https://api.github.com/users/AsteroidStation/followers","following_url":"https://api.github.com/users/AsteroidStation/following{/other_user}","gists_url":"https://api.github.com/users/AsteroidStation/gists{/gist_id}","starred_url":"https://api.github.com/users/AsteroidStation/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/AsteroidStation/subscriptions","organizations_url":"https://api.github.com/users/AsteroidStation/orgs","repos_url":"https://api.github.com/users/AsteroidStation/repos","events_url":"https://api.github.com/users/AsteroidStation/events{/privacy}","received_events_url":"https://api.github.com/users/AsteroidStation/received_events","type":"Organization","site_admin":false},"repo":{"id":28371640,"name":"-tg-station","full_name":"AsteroidStation/-tg-station","owner":{"login":"AsteroidStation","id":9313156,"avatar_url":"https://avatars.githubusercontent.com/u/9313156?v=3","gravatar_id":"","url":"https://api.github.com/users/AsteroidStation","html_url":"https://github.com/AsteroidStation","followers_url":"https://api.github.com/users/AsteroidStation/followers","following_url":"https://api.github.com/users/AsteroidStation/following{/other_user}","gists_url":"https://api.github.com/users/AsteroidStation/gists{/gist_id}","starred_url":"https://api.github.com/users/AsteroidStation/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/AsteroidStation
/subscriptions","organizations_url":"https://api.github.com/users/AsteroidStation/orgs","repos_url":"https://api.github.com/users/AsteroidStation/repos","events_url":"https://api.github.com/users/AsteroidStation/events{/privacy}","received_events_url":"https://api.github.com/users/AsteroidStation/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/AsteroidStation/-tg-station","description":"/tg/'s SS13 branch","fork":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station","forks_url":"https://api.github.com/repos/AsteroidStation/-tg-station/forks","keys_url":"https://api.github.com/repos/AsteroidStation/-tg-station/keys{/key_id}","collaborators_url":"https://api.github.com/repos/AsteroidStation/-tg-station/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/AsteroidStation/-tg-station/teams","hooks_url":"https://api.github.com/repos/AsteroidStation/-tg-station/hooks","issue_events_url":"https://api.github.com/repos/AsteroidStation/-tg-station/issues/events{/number}","events_url":"https://api.github.com/repos/AsteroidStation/-tg-station/events","assignees_url":"https://api.github.com/repos/AsteroidStation/-tg-station/assignees{/user}","branches_url":"https://api.github.com/repos/AsteroidStation/-tg-station/branches{/branch}","tags_url":"https://api.github.com/repos/AsteroidStation/-tg-station/tags","blobs_url":"https://api.github.com/repos/AsteroidStation/-tg-station/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/AsteroidStation/-tg-station/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/AsteroidStation/-tg-station/git/refs{/sha}","trees_url":"https://api.github.com/repos/AsteroidStation/-tg-station/git/trees{/sha}","statuses_url":"https://api.github.com/repos/AsteroidStation/-tg-station/statuses/{sha}","languages_url":"https://api.github.com/repos/AsteroidStation/-tg-station/languages","stargazers_url":"https://api.github.com/repos/AsteroidStation/-tg-
station/stargazers","contributors_url":"https://api.github.com/repos/AsteroidStation/-tg-station/contributors","subscribers_url":"https://api.github.com/repos/AsteroidStation/-tg-station/subscribers","subscription_url":"https://api.github.com/repos/AsteroidStation/-tg-station/subscription","commits_url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits{/sha}","git_commits_url":"https://api.github.com/repos/AsteroidStation/-tg-station/git/commits{/sha}","comments_url":"https://api.github.com/repos/AsteroidStation/-tg-station/comments{/number}","issue_comment_url":"https://api.github.com/repos/AsteroidStation/-tg-station/issues/comments/{number}","contents_url":"https://api.github.com/repos/AsteroidStation/-tg-station/contents/{+path}","compare_url":"https://api.github.com/repos/AsteroidStation/-tg-station/compare/{base}...{head}","merges_url":"https://api.github.com/repos/AsteroidStation/-tg-station/merges","archive_url":"https://api.github.com/repos/AsteroidStation/-tg-station/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/AsteroidStation/-tg-station/downloads","issues_url":"https://api.github.com/repos/AsteroidStation/-tg-station/issues{/number}","pulls_url":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls{/number}","milestones_url":"https://api.github.com/repos/AsteroidStation/-tg-station/milestones{/number}","notifications_url":"https://api.github.com/repos/AsteroidStation/-tg-station/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/AsteroidStation/-tg-station/labels{/name}","releases_url":"https://api.github.com/repos/AsteroidStation/-tg-station/releases{/id}","created_at":"2014-12-23T02:11:11Z","updated_at":"2014-12-31T02:35:57Z","pushed_at":"2014-12-31T02:35:56Z","git_url":"git://github.com/AsteroidStation/-tg-station.git","ssh_url":"git@github.com:AsteroidStation/-tg-station.git","clone_url":"https://github.com/AsteroidStation/-tg-station.git","svn_url":"https://github.co
m/AsteroidStation/-tg-station","homepage":"http://www.tgstation13.org/","size":414377,"stargazers_count":0,"watchers_count":0,"language":"DM","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":1,"forks":0,"open_issues":1,"watchers":0,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/8"},"html":{"href":"https://github.com/AsteroidStation/-tg-station/pull/8"},"issue":{"href":"https://api.github.com/repos/AsteroidStation/-tg-station/issues/8"},"comments":{"href":"https://api.github.com/repos/AsteroidStation/-tg-station/issues/8/comments"},"review_comments":{"href":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/8/comments"},"review_comment":{"href":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/8/commits"},"statuses":{"href":"https://api.github.com/repos/AsteroidStation/-tg-station/statuses/34c4c027770518e2087db44a89cad07cd91ceb84"}},"merged":false,"mergeable":null,"mergeable_state":"unknown","merged_by":null,"comments":0,"review_comments":0,"commits":55,"additions":1841,"deletions":1195,"changed_files":145}},"public":true,"created_at":"2015-01-01T01:02:41Z","org":{"id":9313156,"login":"AsteroidStation","gravatar_id":"","url":"https://api.github.com/orgs/AsteroidStation","avatar_url":"https://avatars.githubusercontent.com/u/9313156?"}}
{"id":"2489397024","type":"CreateEvent","actor":{"id":2684528,"login":"pAs2aL","gravatar_id":"","url":"https://api.github.com/users/pAs2aL","avatar_url":"https://avatars.githubusercontent.com/u/2684528?"},"repo":{"id":28649619,"name":"pAs2aL/nightjar","url":"https://api.github.com/repos/pAs2aL/nightjar"},"payload":{"ref":"gh-pages","ref_type":"branch","master_branch":"master","description":"A 2D cooperative role playing game","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:02:41Z"}
{"id":"2489397025","type":"PushEvent","actor":{"id":5043639,"login":"akbar-sh","gravatar_id":"","url":"https://api.github.com/users/akbar-sh","avatar_url":"https://avatars.githubusercontent.com/u/5043639?"},"repo":{"id":28675338,"name":"akbar-sh/tracker","url":"https://api.github.com/repos/akbar-sh/tracker"},"payload":{"push_id":536752768,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"88fede14a8bc23b1e9654a297922a0791f7522d1","before":"c45885fad735da88cd6dc0fbabd83a647a7c0289","commits":[{"sha":"87bc2f0f2b96ef7847dfd4d65bcaeef8182e1711","author":{"email":"7eb7e51160615686946d5e19147edf697a6d53a2@MacBook.local","name":"Akbar Sharifi"},"message":"Removing facebook keys.","distinct":true,"url":"https://api.github.com/repos/akbar-sh/tracker/commits/87bc2f0f2b96ef7847dfd4d65bcaeef8182e1711"},{"sha":"88fede14a8bc23b1e9654a297922a0791f7522d1","author":{"email":"7eb7e51160615686946d5e19147edf697a6d53a2@MacBook.local","name":"Akbar Sharifi"},"message":"Merge branch 'master' of https://github.com/akbar-sh/tracker","distinct":true,"url":"https://api.github.com/repos/akbar-sh/tracker/commits/88fede14a8bc23b1e9654a297922a0791f7522d1"}]},"public":true,"created_at":"2015-01-01T01:02:41Z"}
{"id":"2489397036","type":"PushEvent","actor":{"id":6241554,"login":"leo-yuriev","gravatar_id":"","url":"https://api.github.com/users/leo-yuriev","avatar_url":"https://avatars.githubusercontent.com/u/6241554?"},"repo":{"id":23696666,"name":"leo-yuriev/openldap-lmdb-challenge","url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge"},"payload":{"push_id":536752772,"size":14,"distinct_size":14,"ref":"refs/heads/2.4-devel","head":"f705475af08e6b50420a8ff22b71cfbe45cea409","before":"6dc7947be776bbce629aac14e588307e2889740b","commits":[{"sha":"d99cbb501031c413632e403be0ea63281270e47b","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"ps-build.sh","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/d99cbb501031c413632e403be0ea63281270e47b"},{"sha":"758e5973787cc5cdf089dc860a05393594a88410","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"qt-creator project","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/758e5973787cc5cdf089dc860a05393594a88410"},{"sha":"e79179f8971b6f5bd0b2de68fc52911644be5099","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix debug marco","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/e79179f8971b6f5bd0b2de68fc52911644be5099"},{"sha":"251d0e76442dfd449eb60fa95c3512b88f7d2c28","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: using strerror_r()","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/251d0e76442dfd449eb60fa95c3512b88f7d2c28"},{"sha":"dea8bab3a83841845cbd5e7eaae856a00b944c9e","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: read/write ignored 
result.","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/dea8bab3a83841845cbd5e7eaae856a00b944c9e"},{"sha":"ae9384015ad55a10cdc94ce4e0d7db629345342a","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: check getcmd() result","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/ae9384015ad55a10cdc94ce4e0d7db629345342a"},{"sha":"1c6e1547e8a51177bedca0296288c38745161afe","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: printf unused agrv[0] in main()","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/1c6e1547e8a51177bedca0296288c38745161afe"},{"sha":"5b8dc917757526f0290c2bb7dda9f06dbd621ab6","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: printf %d without arg in main()","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/5b8dc917757526f0290c2bb7dda9f06dbd621ab6"},{"sha":"28182c76f57c5c328a302b4867a3dda600b99b7d","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: warning-errors for configure","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/28182c76f57c5c328a302b4867a3dda600b99b7d"},{"sha":"64725efd6f4369f3985d6785ef3c1c9f9452be4e","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: build-warnings (most 'unused')","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/64725efd6f4369f3985d6785ef3c1c9f9452be4e"},{"sha":"9011ed6d444ae30acd17fb3b335ae901e5927bd7","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: 
const","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/9011ed6d444ae30acd17fb3b335ae901e5927bd7"},{"sha":"72a7cc8702ce5394b1c78c976064f37fd75920f9","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: warnings (uninitialized)","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/72a7cc8702ce5394b1c78c976064f37fd75920f9"},{"sha":"26d527311aec553be799e2ab27a407be58c79ec6","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"sasl callback's typecast","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/26d527311aec553be799e2ab27a407be58c79ec6"},{"sha":"f705475af08e6b50420a8ff22b71cfbe45cea409","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix warnings (unused, uninitialized, misc);","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/f705475af08e6b50420a8ff22b71cfbe45cea409"}]},"public":true,"created_at":"2015-01-01T01:02:43Z"}
{"id":"2489397037","type":"PushEvent","actor":{"id":1932804,"login":"coldmind","gravatar_id":"","url":"https://api.github.com/users/coldmind","avatar_url":"https://avatars.githubusercontent.com/u/1932804?"},"repo":{"id":18882135,"name":"coldmind/django","url":"https://api.github.com/repos/coldmind/django"},"payload":{"push_id":536752773,"size":1,"distinct_size":1,"ref":"refs/heads/ticket_24064","head":"f1231658677318fd416661219e1480a46fba4b71","before":"7cec2b4d707716d83aad641e84b1daf064811ca8","commits":[{"sha":"f1231658677318fd416661219e1480a46fba4b71","author":{"email":"1f135da694de981cc7e3d5bc8ed1049495ca7439@yandex.ru","name":"Andriy Sokolovskiy"},"message":"Fixed #24064 - Prevented database access in compile time in spatialite models","distinct":true,"url":"https://api.github.com/repos/coldmind/django/commits/f1231658677318fd416661219e1480a46fba4b71"}]},"public":true,"created_at":"2015-01-01T01:02:43Z"}
{"id":"2489397039","type":"IssuesEvent","actor":{"id":1742369,"login":"gbathree","gravatar_id":"","url":"https://api.github.com/users/gbathree","avatar_url":"https://avatars.githubusercontent.com/u/1742369?"},"repo":{"id":20705156,"name":"Photosynq/PhotosynQ-ChromeApp","url":"https://api.github.com/repos/Photosynq/PhotosynQ-ChromeApp"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/Photosynq/PhotosynQ-ChromeApp/issues/14","labels_url":"https://api.github.com/repos/Photosynq/PhotosynQ-ChromeApp/issues/14/labels{/name}","comments_url":"https://api.github.com/repos/Photosynq/PhotosynQ-ChromeApp/issues/14/comments","events_url":"https://api.github.com/repos/Photosynq/PhotosynQ-ChromeApp/issues/14/events","html_url":"https://github.com/Photosynq/PhotosynQ-ChromeApp/issues/14","id":53210212,"number":14,"title":"get rid of 'get_offset' function from protocol creator - it's not used anymore","user":{"login":"gbathree","id":1742369,"avatar_url":"https://avatars.githubusercontent.com/u/1742369?v=3","gravatar_id":"","url":"https://api.github.com/users/gbathree","html_url":"https://github.com/gbathree","followers_url":"https://api.github.com/users/gbathree/followers","following_url":"https://api.github.com/users/gbathree/following{/other_user}","gists_url":"https://api.github.com/users/gbathree/gists{/gist_id}","starred_url":"https://api.github.com/users/gbathree/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/gbathree/subscriptions","organizations_url":"https://api.github.com/users/gbathree/orgs","repos_url":"https://api.github.com/users/gbathree/repos","events_url":"https://api.github.com/users/gbathree/events{/privacy}","received_events_url":"https://api.github.com/users/gbathree/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:02:43Z","updated_at":"2015-01-01T01:02:43Z","closed_at":null,"body":""}},"public
":true,"created_at":"2015-01-01T01:02:43Z","org":{"id":5068236,"login":"Photosynq","gravatar_id":"","url":"https://api.github.com/orgs/Photosynq","avatar_url":"https://avatars.githubusercontent.com/u/5068236?"}}
{"id":"2489397043","type":"PushEvent","actor":{"id":3964764,"login":"elliekimpot","gravatar_id":"","url":"https://api.github.com/users/elliekimpot","avatar_url":"https://avatars.githubusercontent.com/u/3964764?"},"repo":{"id":28625867,"name":"elliekimpot/msm","url":"https://api.github.com/repos/elliekimpot/msm"},"payload":{"push_id":536752776,"size":1,"distinct_size":1,"ref":"refs/heads/feature/removed","head":"6393887f2296f3e7d7820ceefa0177003261ec68","before":"2c854302b53eef234eae379576a870f9ef9aa3bd","commits":[{"sha":"6393887f2296f3e7d7820ceefa0177003261ec68","author":{"email":"c6c610d4ed4672366596341ac49b62c9256ebf55@gmail.com","name":"Ellie"},"message":"pantech/debug: Drop PANTECH_ERR_CRASH_LOGGING\n\nDrop PANTECH_ERR_CRASH_LOGGING and introduce PANTECH_SYS\ndue to proper build (Solve error/mipi_sony_incell.c).\n\nSigned-off-by: Ellie <elliekimpot@gmail.com>","distinct":true,"url":"https://api.github.com/repos/elliekimpot/msm/commits/6393887f2296f3e7d7820ceefa0177003261ec68"}]},"public":true,"created_at":"2015-01-01T01:02:44Z"}
{"id":"2489397046","type":"PushEvent","actor":{"id":10176820,"login":"chalavadivishnu","gravatar_id":"","url":"https://api.github.com/users/chalavadivishnu","avatar_url":"https://avatars.githubusercontent.com/u/10176820?"},"repo":{"id":28678150,"name":"chalavadivishnu/Face-Detection","url":"https://api.github.com/repos/chalavadivishnu/Face-Detection"},"payload":{"push_id":536752778,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"74e68efacee23b35716fa9b2b46d0926e552250b","before":"b956bef865580106b571e412e35308b3e7ab708e","commits":[{"sha":"74e68efacee23b35716fa9b2b46d0926e552250b","author":{"email":"ce8044f02eb2a26b631671f5297317036d398e79@gmail.com","name":"Chalavadi Vishnu"},"message":"image scan","distinct":true,"url":"https://api.github.com/repos/chalavadivishnu/Face-Detection/commits/74e68efacee23b35716fa9b2b46d0926e552250b"}]},"public":true,"created_at":"2015-01-01T01:02:44Z"}
{"id":"2489397047","type":"PushEvent","actor":{"id":904370,"login":"helhum","gravatar_id":"","url":"https://api.github.com/users/helhum","avatar_url":"https://avatars.githubusercontent.com/u/904370?"},"repo":{"id":20956969,"name":"TYPO3-Surf-CMS/Distribution","url":"https://api.github.com/repos/TYPO3-Surf-CMS/Distribution"},"payload":{"push_id":536752779,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f566d43f3b6ada009c3f571fac56f51b35110a46","before":"241f31bdc19c49919632933ff22e01b4f73220ad","commits":[{"sha":"f566d43f3b6ada009c3f571fac56f51b35110a46","author":{"email":"6bf857ca7de026fbed4ae790a809a0ea640901f4@helmuthummel.de","name":"Helmut Hummel"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/TYPO3-Surf-CMS/Distribution/commits/f566d43f3b6ada009c3f571fac56f51b35110a46"}]},"public":true,"created_at":"2015-01-01T01:02:44Z","org":{"id":7921669,"login":"TYPO3-Surf-CMS","gravatar_id":"","url":"https://api.github.com/orgs/TYPO3-Surf-CMS","avatar_url":"https://avatars.githubusercontent.com/u/7921669?"}}
{"id":"2489397049","type":"PushEvent","actor":{"id":9000293,"login":"diianita","gravatar_id":"","url":"https://api.github.com/users/diianita","avatar_url":"https://avatars.githubusercontent.com/u/9000293?"},"repo":{"id":27146993,"name":"cArLiiToX/dtstore","url":"https://api.github.com/repos/cArLiiToX/dtstore"},"payload":{"push_id":536752780,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"8cacad9b34f30388789700e5bb81deaa4471de12","before":"57150fe4e8e3dbd8707e8bec5efdcbd306696812","commits":[{"sha":"8cacad9b34f30388789700e5bb81deaa4471de12","author":{"email":"ab5e2bca84933118bbc9d48ffaccce3bac4eeb64@xng.bz","name":"cArLiiToX"},"message":"correciones","distinct":true,"url":"https://api.github.com/repos/cArLiiToX/dtstore/commits/8cacad9b34f30388789700e5bb81deaa4471de12"}]},"public":true,"created_at":"2015-01-01T01:02:44Z"}
{"id":"2489397053","type":"PushEvent","actor":{"id":280212,"login":"KenanSulayman","gravatar_id":"","url":"https://api.github.com/users/KenanSulayman","avatar_url":"https://avatars.githubusercontent.com/u/280212?"},"repo":{"id":21481110,"name":"KenanSulayman/heartbeat","url":"https://api.github.com/repos/KenanSulayman/heartbeat"},"payload":{"push_id":536752782,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d3f1564c71b9e115435146f52c4c7c5771f819c7","before":"1ac37b74ae21d946dc3826883204811da6d06852","commits":[{"sha":"d3f1564c71b9e115435146f52c4c7c5771f819c7","author":{"email":"9176253dfc0bc82671a5e984646605f93319147a@sly.mn","name":"Kenan Sulayman"},"message":"1420074163829\n\nXtUeXIlAxXGaVujlvuXtkkZObuk/+aeIggSf/No53Io=","distinct":true,"url":"https://api.github.com/repos/KenanSulayman/heartbeat/commits/d3f1564c71b9e115435146f52c4c7c5771f819c7"}]},"public":true,"created_at":"2015-01-01T01:02:45Z"}
{"id":"2489397054","type":"PushEvent","actor":{"id":3520402,"login":"GGGGGGGG","gravatar_id":"","url":"https://api.github.com/users/GGGGGGGG","avatar_url":"https://avatars.githubusercontent.com/u/3520402?"},"repo":{"id":18301597,"name":"GGGGGGGG/s2wrapper","url":"https://api.github.com/repos/GGGGGGGG/s2wrapper"},"payload":{"push_id":536752783,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"cdb993c4bc1f95f25298c1676aa2b054c7887156","before":"20f7e6744e1589aab24b558e51e81511417673bc","commits":[{"sha":"cdb993c4bc1f95f25298c1676aa2b054c7887156","author":{"email":"f2a2448977df35866ec00b7ed7fec9e564d96bb3@fallenwow.net","name":"Cedeqien"},"message":"fix for sudo","distinct":true,"url":"https://api.github.com/repos/GGGGGGGG/s2wrapper/commits/cdb993c4bc1f95f25298c1676aa2b054c7887156"}]},"public":true,"created_at":"2015-01-01T01:02:45Z"}
{"id":"2489397064","type":"PullRequestReviewCommentEvent","actor":{"id":706947,"login":"d3athrow","gravatar_id":"","url":"https://api.github.com/users/d3athrow","avatar_url":"https://avatars.githubusercontent.com/u/706947?"},"repo":{"id":10441188,"name":"d3athrow/vgstation13","url":"https://api.github.com/repos/d3athrow/vgstation13"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/comments/22397265","id":22397265,"diff_hunk":"@@ -476,6 +476,8 @@ var/global/list/RPD_recipes=list(\n \t\treturn 0\n \tif(istype(A,/area/shuttle)||istype(A,/turf/space/transit))\n \t\treturn 0\n+\tif(istype(A, /obj/structure/lattice))","path":"code/game/objects/items/weapons/RPD.dm","position":4,"original_position":4,"commit_id":"a360358fdff0ce9979647f10ddc1a5364d33f229","original_commit_id":"a360358fdff0ce9979647f10ddc1a5364d33f229","user":{"login":"d3athrow","id":706947,"avatar_url":"https://avatars.githubusercontent.com/u/706947?v=3","gravatar_id":"","url":"https://api.github.com/users/d3athrow","html_url":"https://github.com/d3athrow","followers_url":"https://api.github.com/users/d3athrow/followers","following_url":"https://api.github.com/users/d3athrow/following{/other_user}","gists_url":"https://api.github.com/users/d3athrow/gists{/gist_id}","starred_url":"https://api.github.com/users/d3athrow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/d3athrow/subscriptions","organizations_url":"https://api.github.com/users/d3athrow/orgs","repos_url":"https://api.github.com/users/d3athrow/repos","events_url":"https://api.github.com/users/d3athrow/events{/privacy}","received_events_url":"https://api.github.com/users/d3athrow/received_events","type":"User","site_admin":false},"body":"consider checking for lattice on space turf click as 
well.","created_at":"2015-01-01T01:02:46Z","updated_at":"2015-01-01T01:02:46Z","html_url":"https://github.com/d3athrow/vgstation13/pull/2418#discussion_r22397265","pull_request_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2418","_links":{"self":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/comments/22397265"},"html":{"href":"https://github.com/d3athrow/vgstation13/pull/2418#discussion_r22397265"},"pull_request":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2418"}}},"pull_request":{"url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2418","id":26731379,"html_url":"https://github.com/d3athrow/vgstation13/pull/2418","diff_url":"https://github.com/d3athrow/vgstation13/pull/2418.diff","patch_url":"https://github.com/d3athrow/vgstation13/pull/2418.patch","issue_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/2418","number":2418,"state":"open","locked":false,"title":"Nightvision Goggles update + RPD on lattices","user":{"login":"clusterfack","id":8516830,"avatar_url":"https://avatars.githubusercontent.com/u/8516830?v=3","gravatar_id":"","url":"https://api.github.com/users/clusterfack","html_url":"https://github.com/clusterfack","followers_url":"https://api.github.com/users/clusterfack/followers","following_url":"https://api.github.com/users/clusterfack/following{/other_user}","gists_url":"https://api.github.com/users/clusterfack/gists{/gist_id}","starred_url":"https://api.github.com/users/clusterfack/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/clusterfack/subscriptions","organizations_url":"https://api.github.com/users/clusterfack/orgs","repos_url":"https://api.github.com/users/clusterfack/repos","events_url":"https://api.github.com/users/clusterfack/events{/privacy}","received_events_url":"https://api.github.com/users/clusterfack/received_events","type":"User","site_admin":false},"body":"Night vision goggles work like night vision goggles, they let you see 
through the dark, they dont let you see through walls, and they illuminate all darkness.\r\n\r\nRPDs can now build on lattice when you click on them.","created_at":"2014-12-31T18:20:37Z","updated_at":"2015-01-01T01:02:46Z","closed_at":null,"merged_at":null,"merge_commit_sha":"77cf984c1f278d4fe6f04974b19d5837b4c3b353","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2418/commits","review_comments_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2418/comments","review_comment_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/comments/{number}","comments_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/2418/comments","statuses_url":"https://api.github.com/repos/d3athrow/vgstation13/statuses/a360358fdff0ce9979647f10ddc1a5364d33f229","head":{"label":"clusterfack:NVG","ref":"NVG","sha":"a360358fdff0ce9979647f10ddc1a5364d33f229","user":{"login":"clusterfack","id":8516830,"avatar_url":"https://avatars.githubusercontent.com/u/8516830?v=3","gravatar_id":"","url":"https://api.github.com/users/clusterfack","html_url":"https://github.com/clusterfack","followers_url":"https://api.github.com/users/clusterfack/followers","following_url":"https://api.github.com/users/clusterfack/following{/other_user}","gists_url":"https://api.github.com/users/clusterfack/gists{/gist_id}","starred_url":"https://api.github.com/users/clusterfack/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/clusterfack/subscriptions","organizations_url":"https://api.github.com/users/clusterfack/orgs","repos_url":"https://api.github.com/users/clusterfack/repos","events_url":"https://api.github.com/users/clusterfack/events{/privacy}","received_events_url":"https://api.github.com/users/clusterfack/received_events","type":"User","site_admin":false},"repo":{"id":28336888,"name":"bugfixstation13","full_name":"clusterfack/bugfixstation13","owner":{"login":"clusterfack","id":8516830,"avatar_url":"https://a
vatars.githubusercontent.com/u/8516830?v=3","gravatar_id":"","url":"https://api.github.com/users/clusterfack","html_url":"https://github.com/clusterfack","followers_url":"https://api.github.com/users/clusterfack/followers","following_url":"https://api.github.com/users/clusterfack/following{/other_user}","gists_url":"https://api.github.com/users/clusterfack/gists{/gist_id}","starred_url":"https://api.github.com/users/clusterfack/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/clusterfack/subscriptions","organizations_url":"https://api.github.com/users/clusterfack/orgs","repos_url":"https://api.github.com/users/clusterfack/repos","events_url":"https://api.github.com/users/clusterfack/events{/privacy}","received_events_url":"https://api.github.com/users/clusterfack/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/clusterfack/bugfixstation13","description":"This is the vgstation's fork of baystation12's code.","fork":true,"url":"https://api.github.com/repos/clusterfack/bugfixstation13","forks_url":"https://api.github.com/repos/clusterfack/bugfixstation13/forks","keys_url":"https://api.github.com/repos/clusterfack/bugfixstation13/keys{/key_id}","collaborators_url":"https://api.github.com/repos/clusterfack/bugfixstation13/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/clusterfack/bugfixstation13/teams","hooks_url":"https://api.github.com/repos/clusterfack/bugfixstation13/hooks","issue_events_url":"https://api.github.com/repos/clusterfack/bugfixstation13/issues/events{/number}","events_url":"https://api.github.com/repos/clusterfack/bugfixstation13/events","assignees_url":"https://api.github.com/repos/clusterfack/bugfixstation13/assignees{/user}","branches_url":"https://api.github.com/repos/clusterfack/bugfixstation13/branches{/branch}","tags_url":"https://api.github.com/repos/clusterfack/bugfixstation13/tags","blobs_url":"https://api.github.com/repos/clusterfack/bugfixstatio
n13/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/clusterfack/bugfixstation13/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/clusterfack/bugfixstation13/git/refs{/sha}","trees_url":"https://api.github.com/repos/clusterfack/bugfixstation13/git/trees{/sha}","statuses_url":"https://api.github.com/repos/clusterfack/bugfixstation13/statuses/{sha}","languages_url":"https://api.github.com/repos/clusterfack/bugfixstation13/languages","stargazers_url":"https://api.github.com/repos/clusterfack/bugfixstation13/stargazers","contributors_url":"https://api.github.com/repos/clusterfack/bugfixstation13/contributors","subscribers_url":"https://api.github.com/repos/clusterfack/bugfixstation13/subscribers","subscription_url":"https://api.github.com/repos/clusterfack/bugfixstation13/subscription","commits_url":"https://api.github.com/repos/clusterfack/bugfixstation13/commits{/sha}","git_commits_url":"https://api.github.com/repos/clusterfack/bugfixstation13/git/commits{/sha}","comments_url":"https://api.github.com/repos/clusterfack/bugfixstation13/comments{/number}","issue_comment_url":"https://api.github.com/repos/clusterfack/bugfixstation13/issues/comments/{number}","contents_url":"https://api.github.com/repos/clusterfack/bugfixstation13/contents/{+path}","compare_url":"https://api.github.com/repos/clusterfack/bugfixstation13/compare/{base}...{head}","merges_url":"https://api.github.com/repos/clusterfack/bugfixstation13/merges","archive_url":"https://api.github.com/repos/clusterfack/bugfixstation13/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/clusterfack/bugfixstation13/downloads","issues_url":"https://api.github.com/repos/clusterfack/bugfixstation13/issues{/number}","pulls_url":"https://api.github.com/repos/clusterfack/bugfixstation13/pulls{/number}","milestones_url":"https://api.github.com/repos/clusterfack/bugfixstation13/milestones{/number}","notifications_url":"https://api.github.com/repos/clusterfack/bugfixstation13/notifica
tions{?since,all,participating}","labels_url":"https://api.github.com/repos/clusterfack/bugfixstation13/labels{/name}","releases_url":"https://api.github.com/repos/clusterfack/bugfixstation13/releases{/id}","created_at":"2014-12-22T11:57:24Z","updated_at":"2014-12-31T18:43:55Z","pushed_at":"2014-12-31T18:47:03Z","git_url":"git://github.com/clusterfack/bugfixstation13.git","ssh_url":"git@github.com:clusterfack/bugfixstation13.git","clone_url":"https://github.com/clusterfack/bugfixstation13.git","svn_url":"https://github.com/clusterfack/bugfixstation13","homepage":"","size":760194,"stargazers_count":0,"watchers_count":0,"language":"DM","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"Bleeding-Edge"}},"base":{"label":"d3athrow:Bleeding-Edge","ref":"Bleeding-Edge","sha":"5e8624143efbf348ed553421b76293ef84acac57","user":{"login":"d3athrow","id":706947,"avatar_url":"https://avatars.githubusercontent.com/u/706947?v=3","gravatar_id":"","url":"https://api.github.com/users/d3athrow","html_url":"https://github.com/d3athrow","followers_url":"https://api.github.com/users/d3athrow/followers","following_url":"https://api.github.com/users/d3athrow/following{/other_user}","gists_url":"https://api.github.com/users/d3athrow/gists{/gist_id}","starred_url":"https://api.github.com/users/d3athrow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/d3athrow/subscriptions","organizations_url":"https://api.github.com/users/d3athrow/orgs","repos_url":"https://api.github.com/users/d3athrow/repos","events_url":"https://api.github.com/users/d3athrow/events{/privacy}","received_events_url":"https://api.github.com/users/d3athrow/received_events","type":"User","site_admin":false},"repo":{"id":10441188,"name":"vgstation13","full_name":"d3athrow/vgstation13","owner":{"login":"d3athrow","id":706947,"avatar_url":"https://avatars.githubuserconten
t.com/u/706947?v=3","gravatar_id":"","url":"https://api.github.com/users/d3athrow","html_url":"https://github.com/d3athrow","followers_url":"https://api.github.com/users/d3athrow/followers","following_url":"https://api.github.com/users/d3athrow/following{/other_user}","gists_url":"https://api.github.com/users/d3athrow/gists{/gist_id}","starred_url":"https://api.github.com/users/d3athrow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/d3athrow/subscriptions","organizations_url":"https://api.github.com/users/d3athrow/orgs","repos_url":"https://api.github.com/users/d3athrow/repos","events_url":"https://api.github.com/users/d3athrow/events{/privacy}","received_events_url":"https://api.github.com/users/d3athrow/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/d3athrow/vgstation13","description":"This is the vgstation's fork of baystation12's code.","fork":true,"url":"https://api.github.com/repos/d3athrow/vgstation13","forks_url":"https://api.github.com/repos/d3athrow/vgstation13/forks","keys_url":"https://api.github.com/repos/d3athrow/vgstation13/keys{/key_id}","collaborators_url":"https://api.github.com/repos/d3athrow/vgstation13/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/d3athrow/vgstation13/teams","hooks_url":"https://api.github.com/repos/d3athrow/vgstation13/hooks","issue_events_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/events{/number}","events_url":"https://api.github.com/repos/d3athrow/vgstation13/events","assignees_url":"https://api.github.com/repos/d3athrow/vgstation13/assignees{/user}","branches_url":"https://api.github.com/repos/d3athrow/vgstation13/branches{/branch}","tags_url":"https://api.github.com/repos/d3athrow/vgstation13/tags","blobs_url":"https://api.github.com/repos/d3athrow/vgstation13/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/d3athrow/vgstation13/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/
d3athrow/vgstation13/git/refs{/sha}","trees_url":"https://api.github.com/repos/d3athrow/vgstation13/git/trees{/sha}","statuses_url":"https://api.github.com/repos/d3athrow/vgstation13/statuses/{sha}","languages_url":"https://api.github.com/repos/d3athrow/vgstation13/languages","stargazers_url":"https://api.github.com/repos/d3athrow/vgstation13/stargazers","contributors_url":"https://api.github.com/repos/d3athrow/vgstation13/contributors","subscribers_url":"https://api.github.com/repos/d3athrow/vgstation13/subscribers","subscription_url":"https://api.github.com/repos/d3athrow/vgstation13/subscription","commits_url":"https://api.github.com/repos/d3athrow/vgstation13/commits{/sha}","git_commits_url":"https://api.github.com/repos/d3athrow/vgstation13/git/commits{/sha}","comments_url":"https://api.github.com/repos/d3athrow/vgstation13/comments{/number}","issue_comment_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/comments/{number}","contents_url":"https://api.github.com/repos/d3athrow/vgstation13/contents/{+path}","compare_url":"https://api.github.com/repos/d3athrow/vgstation13/compare/{base}...{head}","merges_url":"https://api.github.com/repos/d3athrow/vgstation13/merges","archive_url":"https://api.github.com/repos/d3athrow/vgstation13/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/d3athrow/vgstation13/downloads","issues_url":"https://api.github.com/repos/d3athrow/vgstation13/issues{/number}","pulls_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls{/number}","milestones_url":"https://api.github.com/repos/d3athrow/vgstation13/milestones{/number}","notifications_url":"https://api.github.com/repos/d3athrow/vgstation13/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/d3athrow/vgstation13/labels{/name}","releases_url":"https://api.github.com/repos/d3athrow/vgstation13/releases{/id}","created_at":"2013-06-02T19:39:54Z","updated_at":"2014-12-31T20:06:46Z","pushed_at":"2014-12-31T23:06:06Z","g
it_url":"git://github.com/d3athrow/vgstation13.git","ssh_url":"git@github.com:d3athrow/vgstation13.git","clone_url":"https://github.com/d3athrow/vgstation13.git","svn_url":"https://github.com/d3athrow/vgstation13","homepage":"","size":937605,"stargazers_count":45,"watchers_count":45,"language":"DM","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":135,"mirror_url":null,"open_issues_count":260,"forks":135,"open_issues":260,"watchers":45,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2418"},"html":{"href":"https://github.com/d3athrow/vgstation13/pull/2418"},"issue":{"href":"https://api.github.com/repos/d3athrow/vgstation13/issues/2418"},"comments":{"href":"https://api.github.com/repos/d3athrow/vgstation13/issues/2418/comments"},"review_comments":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2418/comments"},"review_comment":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2418/commits"},"statuses":{"href":"https://api.github.com/repos/d3athrow/vgstation13/statuses/a360358fdff0ce9979647f10ddc1a5364d33f229"}}}},"public":true,"created_at":"2015-01-01T01:02:46Z"}
{"id":"2489397070","type":"PushEvent","actor":{"id":2226434,"login":"andschwa","gravatar_id":"","url":"https://api.github.com/users/andschwa","avatar_url":"https://avatars.githubusercontent.com/u/2226434?"},"repo":{"id":6480901,"name":"andschwa/dotfiles","url":"https://api.github.com/repos/andschwa/dotfiles"},"payload":{"push_id":536752785,"size":3,"distinct_size":3,"ref":"refs/heads/master","head":"6141ae1ad24a045ceb531541f2ee6d242c8d6501","before":"677ba270bf789af52a4df9dbc07af6dbca96295b","commits":[{"sha":"06b1e8dbfecb03fe23ce6b8bf1b13fe4567e1152","author":{"email":"02e0a999c50b1f88df7a8f5a04e1b76b35ea6a88@schwartzmeyer.com","name":"Andrew Schwartzmeyer"},"message":"Updating mrconfig","distinct":true,"url":"https://api.github.com/repos/andschwa/dotfiles/commits/06b1e8dbfecb03fe23ce6b8bf1b13fe4567e1152"},{"sha":"bdc7c21ecfb664b32305747d3a4c525c33df9d5a","author":{"email":"02e0a999c50b1f88df7a8f5a04e1b76b35ea6a88@schwartzmeyer.com","name":"Andrew Schwartzmeyer"},"message":"Fixing mr repo","distinct":true,"url":"https://api.github.com/repos/andschwa/dotfiles/commits/bdc7c21ecfb664b32305747d3a4c525c33df9d5a"},{"sha":"6141ae1ad24a045ceb531541f2ee6d242c8d6501","author":{"email":"02e0a999c50b1f88df7a8f5a04e1b76b35ea6a88@schwartzmeyer.com","name":"Andrew Schwartzmeyer"},"message":"Don't repeat myself","distinct":true,"url":"https://api.github.com/repos/andschwa/dotfiles/commits/6141ae1ad24a045ceb531541f2ee6d242c8d6501"}]},"public":true,"created_at":"2015-01-01T01:02:47Z"}
{"id":"2489397071","type":"PushEvent","actor":{"id":227068,"login":"radix","gravatar_id":"","url":"https://api.github.com/users/radix","avatar_url":"https://avatars.githubusercontent.com/u/227068?"},"repo":{"id":20022094,"name":"radix/effect","url":"https://api.github.com/repos/radix/effect"},"payload":{"push_id":536752786,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1d1a8441574438befa1731113e960e12b24258c3","before":"defdbe78db98ad69d72f42b09194309f47616592","commits":[{"sha":"1d1a8441574438befa1731113e960e12b24258c3","author":{"email":"5f33e8ddd36b0c849687df732835b9abbe9b347b@twistedmatrix.com","name":"Christopher Armstrong"},"message":"add the one-line description to the top of the sphinx doc","distinct":true,"url":"https://api.github.com/repos/radix/effect/commits/1d1a8441574438befa1731113e960e12b24258c3"}]},"public":true,"created_at":"2015-01-01T01:02:47Z"}
{"id":"2489397083","type":"PushEvent","actor":{"id":906529,"login":"dpwolfe","gravatar_id":"","url":"https://api.github.com/users/dpwolfe","avatar_url":"https://avatars.githubusercontent.com/u/906529?"},"repo":{"id":26579311,"name":"dpwolfe/otucha","url":"https://api.github.com/repos/dpwolfe/otucha"},"payload":{"push_id":536752791,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"a9a695f1f7a3395f7394ae668feab71f35a5f622","before":"a8f720680aef094515b09c16aff3a59a4d6b2baa","commits":[{"sha":"a9a695f1f7a3395f7394ae668feab71f35a5f622","author":{"email":"b7dfe270ecb2603aba704ea15b776485da19da15@gmail.com","name":"David Wolfe"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/dpwolfe/otucha/commits/a9a695f1f7a3395f7394ae668feab71f35a5f622"}]},"public":true,"created_at":"2015-01-01T01:02:48Z"}
{"id":"2489397084","type":"ReleaseEvent","actor":{"id":99359,"login":"llinder","gravatar_id":"","url":"https://api.github.com/users/llinder","avatar_url":"https://avatars.githubusercontent.com/u/99359?"},"repo":{"id":28669941,"name":"llinder/salt","url":"https://api.github.com/repos/llinder/salt"},"payload":{"action":"published","release":{"url":"https://api.github.com/repos/llinder/salt/releases/818219","assets_url":"https://api.github.com/repos/llinder/salt/releases/818219/assets","upload_url":"https://uploads.github.com/repos/llinder/salt/releases/818219/assets{?name}","html_url":"https://github.com/llinder/salt/releases/tag/v2014.7.0_1","id":818219,"tag_name":"v2014.7.0_1","target_commitish":"2014.7","name":"","draft":false,"author":{"login":"llinder","id":99359,"avatar_url":"https://avatars.githubusercontent.com/u/99359?v=3","gravatar_id":"","url":"https://api.github.com/users/llinder","html_url":"https://github.com/llinder","followers_url":"https://api.github.com/users/llinder/followers","following_url":"https://api.github.com/users/llinder/following{/other_user}","gists_url":"https://api.github.com/users/llinder/gists{/gist_id}","starred_url":"https://api.github.com/users/llinder/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/llinder/subscriptions","organizations_url":"https://api.github.com/users/llinder/orgs","repos_url":"https://api.github.com/users/llinder/repos","events_url":"https://api.github.com/users/llinder/events{/privacy}","received_events_url":"https://api.github.com/users/llinder/received_events","type":"User","site_admin":false},"prerelease":false,"created_at":"2014-12-31T17:03:50Z","published_at":"2015-01-01T01:02:48Z","assets":[],"tarball_url":"https://api.github.com/repos/llinder/salt/tarball/v2014.7.0_1","zipball_url":"https://api.github.com/repos/llinder/salt/zipball/v2014.7.0_1","body":""}},"public":true,"created_at":"2015-01-01T01:02:48Z"}
{"id":"2489397087","type":"PullRequestEvent","actor":{"id":5573038,"login":"CorruptComputer","gravatar_id":"","url":"https://api.github.com/users/CorruptComputer","avatar_url":"https://avatars.githubusercontent.com/u/5573038?"},"repo":{"id":28371640,"name":"AsteroidStation/-tg-station","url":"https://api.github.com/repos/AsteroidStation/-tg-station"},"payload":{"action":"closed","number":8,"pull_request":{"url":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/8","id":26739422,"html_url":"https://github.com/AsteroidStation/-tg-station/pull/8","diff_url":"https://github.com/AsteroidStation/-tg-station/pull/8.diff","patch_url":"https://github.com/AsteroidStation/-tg-station/pull/8.patch","issue_url":"https://api.github.com/repos/AsteroidStation/-tg-station/issues/8","number":8,"state":"closed","locked":false,"title":"tg update","user":{"login":"CorruptComputer","id":5573038,"avatar_url":"https://avatars.githubusercontent.com/u/5573038?v=3","gravatar_id":"","url":"https://api.github.com/users/CorruptComputer","html_url":"https://github.com/CorruptComputer","followers_url":"https://api.github.com/users/CorruptComputer/followers","following_url":"https://api.github.com/users/CorruptComputer/following{/other_user}","gists_url":"https://api.github.com/users/CorruptComputer/gists{/gist_id}","starred_url":"https://api.github.com/users/CorruptComputer/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/CorruptComputer/subscriptions","organizations_url":"https://api.github.com/users/CorruptComputer/orgs","repos_url":"https://api.github.com/users/CorruptComputer/repos","events_url":"https://api.github.com/users/CorruptComputer/events{/privacy}","received_events_url":"https://api.github.com/users/CorruptComputer/received_events","type":"User","site_admin":false},"body":"","created_at":"2015-01-01T01:02:41Z","updated_at":"2015-01-01T01:02:48Z","closed_at":"2015-01-01T01:02:48Z","merged_at":"2015-01-01T01:02:48Z","merge_commit_sha":"9a329cfe57a5
87090aecaa6410a370ee062046a9","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/8/commits","review_comments_url":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/8/comments","review_comment_url":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/comments/{number}","comments_url":"https://api.github.com/repos/AsteroidStation/-tg-station/issues/8/comments","statuses_url":"https://api.github.com/repos/AsteroidStation/-tg-station/statuses/34c4c027770518e2087db44a89cad07cd91ceb84","head":{"label":"tgstation:master","ref":"master","sha":"34c4c027770518e2087db44a89cad07cd91ceb84","user":{"login":"tgstation","id":1363778,"avatar_url":"https://avatars.githubusercontent.com/u/1363778?v=3","gravatar_id":"","url":"https://api.github.com/users/tgstation","html_url":"https://github.com/tgstation","followers_url":"https://api.github.com/users/tgstation/followers","following_url":"https://api.github.com/users/tgstation/following{/other_user}","gists_url":"https://api.github.com/users/tgstation/gists{/gist_id}","starred_url":"https://api.github.com/users/tgstation/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/tgstation/subscriptions","organizations_url":"https://api.github.com/users/tgstation/orgs","repos_url":"https://api.github.com/users/tgstation/repos","events_url":"https://api.github.com/users/tgstation/events{/privacy}","received_events_url":"https://api.github.com/users/tgstation/received_events","type":"Organization","site_admin":false},"repo":{"id":3234987,"name":"-tg-station","full_name":"tgstation/-tg-station","owner":{"login":"tgstation","id":1363778,"avatar_url":"https://avatars.githubusercontent.com/u/1363778?v=3","gravatar_id":"","url":"https://api.github.com/users/tgstation","html_url":"https://github.com/tgstation","followers_url":"https://api.github.com/users/tgstation/followers","following_url":"https://api.github.com/users/tgstation/following{/othe
r_user}","gists_url":"https://api.github.com/users/tgstation/gists{/gist_id}","starred_url":"https://api.github.com/users/tgstation/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/tgstation/subscriptions","organizations_url":"https://api.github.com/users/tgstation/orgs","repos_url":"https://api.github.com/users/tgstation/repos","events_url":"https://api.github.com/users/tgstation/events{/privacy}","received_events_url":"https://api.github.com/users/tgstation/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/tgstation/-tg-station","description":"/tg/'s SS13 branch","fork":false,"url":"https://api.github.com/repos/tgstation/-tg-station","forks_url":"https://api.github.com/repos/tgstation/-tg-station/forks","keys_url":"https://api.github.com/repos/tgstation/-tg-station/keys{/key_id}","collaborators_url":"https://api.github.com/repos/tgstation/-tg-station/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/tgstation/-tg-station/teams","hooks_url":"https://api.github.com/repos/tgstation/-tg-station/hooks","issue_events_url":"https://api.github.com/repos/tgstation/-tg-station/issues/events{/number}","events_url":"https://api.github.com/repos/tgstation/-tg-station/events","assignees_url":"https://api.github.com/repos/tgstation/-tg-station/assignees{/user}","branches_url":"https://api.github.com/repos/tgstation/-tg-station/branches{/branch}","tags_url":"https://api.github.com/repos/tgstation/-tg-station/tags","blobs_url":"https://api.github.com/repos/tgstation/-tg-station/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/tgstation/-tg-station/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/tgstation/-tg-station/git/refs{/sha}","trees_url":"https://api.github.com/repos/tgstation/-tg-station/git/trees{/sha}","statuses_url":"https://api.github.com/repos/tgstation/-tg-station/statuses/{sha}","languages_url":"https://api.github.com/repos/tgstation/-tg-st
ation/languages","stargazers_url":"https://api.github.com/repos/tgstation/-tg-station/stargazers","contributors_url":"https://api.github.com/repos/tgstation/-tg-station/contributors","subscribers_url":"https://api.github.com/repos/tgstation/-tg-station/subscribers","subscription_url":"https://api.github.com/repos/tgstation/-tg-station/subscription","commits_url":"https://api.github.com/repos/tgstation/-tg-station/commits{/sha}","git_commits_url":"https://api.github.com/repos/tgstation/-tg-station/git/commits{/sha}","comments_url":"https://api.github.com/repos/tgstation/-tg-station/comments{/number}","issue_comment_url":"https://api.github.com/repos/tgstation/-tg-station/issues/comments/{number}","contents_url":"https://api.github.com/repos/tgstation/-tg-station/contents/{+path}","compare_url":"https://api.github.com/repos/tgstation/-tg-station/compare/{base}...{head}","merges_url":"https://api.github.com/repos/tgstation/-tg-station/merges","archive_url":"https://api.github.com/repos/tgstation/-tg-station/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/tgstation/-tg-station/downloads","issues_url":"https://api.github.com/repos/tgstation/-tg-station/issues{/number}","pulls_url":"https://api.github.com/repos/tgstation/-tg-station/pulls{/number}","milestones_url":"https://api.github.com/repos/tgstation/-tg-station/milestones{/number}","notifications_url":"https://api.github.com/repos/tgstation/-tg-station/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/tgstation/-tg-station/labels{/name}","releases_url":"https://api.github.com/repos/tgstation/-tg-station/releases{/id}","created_at":"2012-01-21T17:32:47Z","updated_at":"2015-01-01T00:47:49Z","pushed_at":"2015-01-01T00:47:48Z","git_url":"git://github.com/tgstation/-tg-station.git","ssh_url":"git@github.com:tgstation/-tg-station.git","clone_url":"https://github.com/tgstation/-tg-station.git","svn_url":"https://github.com/tgstation/-tg-station","homepage":"http://www.
tgstation13.org/","size":550715,"stargazers_count":172,"watchers_count":172,"language":"DM","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":609,"mirror_url":null,"open_issues_count":618,"forks":609,"open_issues":618,"watchers":172,"default_branch":"master"}},"base":{"label":"AsteroidStation:master","ref":"master","sha":"d98abaabaa971c9092a200961915c9e60015ab20","user":{"login":"AsteroidStation","id":9313156,"avatar_url":"https://avatars.githubusercontent.com/u/9313156?v=3","gravatar_id":"","url":"https://api.github.com/users/AsteroidStation","html_url":"https://github.com/AsteroidStation","followers_url":"https://api.github.com/users/AsteroidStation/followers","following_url":"https://api.github.com/users/AsteroidStation/following{/other_user}","gists_url":"https://api.github.com/users/AsteroidStation/gists{/gist_id}","starred_url":"https://api.github.com/users/AsteroidStation/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/AsteroidStation/subscriptions","organizations_url":"https://api.github.com/users/AsteroidStation/orgs","repos_url":"https://api.github.com/users/AsteroidStation/repos","events_url":"https://api.github.com/users/AsteroidStation/events{/privacy}","received_events_url":"https://api.github.com/users/AsteroidStation/received_events","type":"Organization","site_admin":false},"repo":{"id":28371640,"name":"-tg-station","full_name":"AsteroidStation/-tg-station","owner":{"login":"AsteroidStation","id":9313156,"avatar_url":"https://avatars.githubusercontent.com/u/9313156?v=3","gravatar_id":"","url":"https://api.github.com/users/AsteroidStation","html_url":"https://github.com/AsteroidStation","followers_url":"https://api.github.com/users/AsteroidStation/followers","following_url":"https://api.github.com/users/AsteroidStation/following{/other_user}","gists_url":"https://api.github.com/users/AsteroidStation/gists{/gist_id}","starred_url":"https://api.github.com/users/AsteroidStation/starred{/owne
r}{/repo}","subscriptions_url":"https://api.github.com/users/AsteroidStation/subscriptions","organizations_url":"https://api.github.com/users/AsteroidStation/orgs","repos_url":"https://api.github.com/users/AsteroidStation/repos","events_url":"https://api.github.com/users/AsteroidStation/events{/privacy}","received_events_url":"https://api.github.com/users/AsteroidStation/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/AsteroidStation/-tg-station","description":"/tg/'s SS13 branch","fork":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station","forks_url":"https://api.github.com/repos/AsteroidStation/-tg-station/forks","keys_url":"https://api.github.com/repos/AsteroidStation/-tg-station/keys{/key_id}","collaborators_url":"https://api.github.com/repos/AsteroidStation/-tg-station/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/AsteroidStation/-tg-station/teams","hooks_url":"https://api.github.com/repos/AsteroidStation/-tg-station/hooks","issue_events_url":"https://api.github.com/repos/AsteroidStation/-tg-station/issues/events{/number}","events_url":"https://api.github.com/repos/AsteroidStation/-tg-station/events","assignees_url":"https://api.github.com/repos/AsteroidStation/-tg-station/assignees{/user}","branches_url":"https://api.github.com/repos/AsteroidStation/-tg-station/branches{/branch}","tags_url":"https://api.github.com/repos/AsteroidStation/-tg-station/tags","blobs_url":"https://api.github.com/repos/AsteroidStation/-tg-station/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/AsteroidStation/-tg-station/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/AsteroidStation/-tg-station/git/refs{/sha}","trees_url":"https://api.github.com/repos/AsteroidStation/-tg-station/git/trees{/sha}","statuses_url":"https://api.github.com/repos/AsteroidStation/-tg-station/statuses/{sha}","languages_url":"https://api.github.com/repos/AsteroidStation/-tg-station/la
nguages","stargazers_url":"https://api.github.com/repos/AsteroidStation/-tg-station/stargazers","contributors_url":"https://api.github.com/repos/AsteroidStation/-tg-station/contributors","subscribers_url":"https://api.github.com/repos/AsteroidStation/-tg-station/subscribers","subscription_url":"https://api.github.com/repos/AsteroidStation/-tg-station/subscription","commits_url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits{/sha}","git_commits_url":"https://api.github.com/repos/AsteroidStation/-tg-station/git/commits{/sha}","comments_url":"https://api.github.com/repos/AsteroidStation/-tg-station/comments{/number}","issue_comment_url":"https://api.github.com/repos/AsteroidStation/-tg-station/issues/comments/{number}","contents_url":"https://api.github.com/repos/AsteroidStation/-tg-station/contents/{+path}","compare_url":"https://api.github.com/repos/AsteroidStation/-tg-station/compare/{base}...{head}","merges_url":"https://api.github.com/repos/AsteroidStation/-tg-station/merges","archive_url":"https://api.github.com/repos/AsteroidStation/-tg-station/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/AsteroidStation/-tg-station/downloads","issues_url":"https://api.github.com/repos/AsteroidStation/-tg-station/issues{/number}","pulls_url":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls{/number}","milestones_url":"https://api.github.com/repos/AsteroidStation/-tg-station/milestones{/number}","notifications_url":"https://api.github.com/repos/AsteroidStation/-tg-station/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/AsteroidStation/-tg-station/labels{/name}","releases_url":"https://api.github.com/repos/AsteroidStation/-tg-station/releases{/id}","created_at":"2014-12-23T02:11:11Z","updated_at":"2014-12-31T02:35:57Z","pushed_at":"2015-01-01T01:02:48Z","git_url":"git://github.com/AsteroidStation/-tg-station.git","ssh_url":"git@github.com:AsteroidStation/-tg-station.git","clone_url":"http
s://github.com/AsteroidStation/-tg-station.git","svn_url":"https://github.com/AsteroidStation/-tg-station","homepage":"http://www.tgstation13.org/","size":414377,"stargazers_count":0,"watchers_count":0,"language":"DM","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/8"},"html":{"href":"https://github.com/AsteroidStation/-tg-station/pull/8"},"issue":{"href":"https://api.github.com/repos/AsteroidStation/-tg-station/issues/8"},"comments":{"href":"https://api.github.com/repos/AsteroidStation/-tg-station/issues/8/comments"},"review_comments":{"href":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/8/comments"},"review_comment":{"href":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/AsteroidStation/-tg-station/pulls/8/commits"},"statuses":{"href":"https://api.github.com/repos/AsteroidStation/-tg-station/statuses/34c4c027770518e2087db44a89cad07cd91ceb84"}},"merged":true,"mergeable":null,"mergeable_state":"unknown","merged_by":{"login":"CorruptComputer","id":5573038,"avatar_url":"https://avatars.githubusercontent.com/u/5573038?v=3","gravatar_id":"","url":"https://api.github.com/users/CorruptComputer","html_url":"https://github.com/CorruptComputer","followers_url":"https://api.github.com/users/CorruptComputer/followers","following_url":"https://api.github.com/users/CorruptComputer/following{/other_user}","gists_url":"https://api.github.com/users/CorruptComputer/gists{/gist_id}","starred_url":"https://api.github.com/users/CorruptComputer/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/CorruptComputer/subscriptions","organizations_url":"https://api.github.com/users/CorruptComputer/orgs","repos_url":"https://api.github.com
/users/CorruptComputer/repos","events_url":"https://api.github.com/users/CorruptComputer/events{/privacy}","received_events_url":"https://api.github.com/users/CorruptComputer/received_events","type":"User","site_admin":false},"comments":0,"review_comments":0,"commits":55,"additions":1841,"deletions":1195,"changed_files":145}},"public":true,"created_at":"2015-01-01T01:02:48Z","org":{"id":9313156,"login":"AsteroidStation","gravatar_id":"","url":"https://api.github.com/orgs/AsteroidStation","avatar_url":"https://avatars.githubusercontent.com/u/9313156?"}}
{"id":"2489397088","type":"CreateEvent","actor":{"id":99359,"login":"llinder","gravatar_id":"","url":"https://api.github.com/users/llinder","avatar_url":"https://avatars.githubusercontent.com/u/99359?"},"repo":{"id":28669941,"name":"llinder/salt","url":"https://api.github.com/repos/llinder/salt"},"payload":{"ref":"v2014.7.0_1","ref_type":"tag","master_branch":"develop","description":"Infrastructure automation and management system","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:02:48Z"}
{"id":"2489397095","type":"PushEvent","actor":{"id":5573038,"login":"CorruptComputer","gravatar_id":"","url":"https://api.github.com/users/CorruptComputer","avatar_url":"https://avatars.githubusercontent.com/u/5573038?"},"repo":{"id":28371640,"name":"AsteroidStation/-tg-station","url":"https://api.github.com/repos/AsteroidStation/-tg-station"},"payload":{"push_id":536752794,"size":56,"distinct_size":56,"ref":"refs/heads/master","head":"4352171f2ac3e6930e2b4b0b5c384779b2908eae","before":"d98abaabaa971c9092a200961915c9e60015ab20","commits":[{"sha":"0921aa201f3ee3894dfad2d400023c39fe1d1e01","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Added datum mutations\n\nAlso removed some mob vars like sdisabilities and merged the usability\nwith disabilities\nRemoved need for mutations var, they are not handled in dna\nRemoved blinded var, now its handled by eye_blind being bigger than zero\nAnds lots, lots of other shit in files that used mutations","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/0921aa201f3ee3894dfad2d400023c39fe1d1e01"},{"sha":"11f6c7c40148a6c8be2abc5ebb7cc9b967a20950","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Merge branch 'master' of https://github.com/tgstation/-tg-station into GenShit","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/11f6c7c40148a6c8be2abc5ebb7cc9b967a20950"},{"sha":"8d110ee49639b4d3163529868339ea993330b2cf","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Tiny clean up, still lots of work to do\n\nOnly compiletested, these changes were never tested in the game 
yet","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/8d110ee49639b4d3163529868339ea993330b2cf"},{"sha":"861072596873d47ea851480df74854a78a28f948","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Monkifying change and some mutations fixes\n\nIt approaches playable level of working, hurray!","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/861072596873d47ea851480df74854a78a28f948"},{"sha":"44cc6c6d97543b63d277f1d6eb980d56d90b4d1e","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Merge branch 'master' of https://github.com/tgstation/-tg-station into GenShit","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/44cc6c6d97543b63d277f1d6eb980d56d90b4d1e"},{"sha":"21a2c2d21eccd62394113a0ac6395397aa9d80a8","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Made clumsiness into disability\n\nI really dont want to make clumsy_act()","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/21a2c2d21eccd62394113a0ac6395397aa9d80a8"},{"sha":"570783d2c776ad6b2106440a1afbab38af6f8c88","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Added comments for RR for future","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/570783d2c776ad6b2106440a1afbab38af6f8c88"},{"sha":"f0c8f2eeacc3e59d9c9f0942d7bfad5daabcacff","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Merge branch 'master' of https://github.com/tgstation/-tg-station into GenShit\n\nConflicts:\n\tcode/modules/reagents/Chemistry-Reagents.dm\n\nconflicts 
resolution","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/f0c8f2eeacc3e59d9c9f0942d7bfad5daabcacff"},{"sha":"b12472e0bb1845d312386e96f953b4ae9ab07de2","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Made shit compilable, probably broke new hunger\n\nWhoever made it: tough luck bro","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/b12472e0bb1845d312386e96f953b4ae9ab07de2"},{"sha":"9a27fe7c8dc9fe426723fd0f8c97160a51037dd6","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Conflict fix\n\nYeah makes it all work","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/9a27fe7c8dc9fe426723fd0f8c97160a51037dd6"},{"sha":"57b41dce0d954580aa4531310ac1f0a2ee255814","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Fixed some shiet\n\nRedone how injectors handle mutations(now it doesnt copy the SE but\nmanipulates mutations directly)\nRemoved sole leftovers\nFixed humanizing\nFixed grammer","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/57b41dce0d954580aa4531310ac1f0a2ee255814"},{"sha":"92fc9b5d1b4a91317143e1db1a6c22af59f1f6a3","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"And some more little fixes\n\nReturn of the prob to foam smashing\nCorrect laserpointer check\nCorrect wield behaviour with hulk","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/92fc9b5d1b4a91317143e1db1a6c22af59f1f6a3"},{"sha":"1b45752b05bbc5cd285d6432d22510cbba86840d","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Fixed conflicts\n\nYe again and again and again and again\nDo it again, do it 
again~","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/1b45752b05bbc5cd285d6432d22510cbba86840d"},{"sha":"208b59c30ef5a597545a49a46fe3983dde1f01f6","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Fixed stuff tkdrg pointed out\n\nAdded comment to dualsaber and hulk checks to explain whats going on\nAdded defines that converts to mutation names\nFixed grammer again","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/208b59c30ef5a597545a49a46fe3983dde1f01f6"},{"sha":"76a21883a8d70c71d30b9acb3162cc21e80b2ca9","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Merge branch 'master' of https://github.com/tgstation/-tg-station into GenShit\n\nConflicts:\n\tcode/game/mecha/mecha.dm\n\tcode/game/objects/structures/tables_racks.dm\n\tcode/modules/mob/living/silicon/silicon.dm\n\tcode/modules/projectiles/gun.dm\n\nFixes dem conflicts","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/76a21883a8d70c71d30b9acb3162cc21e80b2ca9"},{"sha":"4c3f83d085ccae384a33db2498de970cf0918df5","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"This shall fix the hunger system\n\nI really really hope it does","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/4c3f83d085ccae384a33db2498de970cf0918df5"},{"sha":"418e3a061364d97a01321d023b9a418881896984","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"General cleanup\n\nFixed the magic text failing in monkey injectors\nRemoved lots of comments\nDidnt fix mysterious list bounds runtime in 
tourettes","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/418e3a061364d97a01321d023b9a418881896984"},{"sha":"10b21b20ab801fbc5ce469964c322fc2ccca0138","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Conflicts resolution\n\nIn items weapons melee misc","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/10b21b20ab801fbc5ce469964c322fc2ccca0138"},{"sha":"501a120cca348b88447f1d90b25fbf888fdababa","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Fixes the defines\n\nNow all the shit uses them i hope","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/501a120cca348b88447f1d90b25fbf888fdababa"},{"sha":"37a7fa24146b27dcc10ea6acdad19a7aa67f3fb1","author":{"email":"cf55a9c90d41f12e3e2216800693d3a930e4551a@gmail.com","name":"Razharas"},"message":"Fixes that one runtime with tourettes\n\nAnimation proc is magic, dont ask dont tell","distinct":true,"url":"https://api.github.com/repos/AsteroidStation/-tg-station/commits/37a7fa24146b27dcc10ea6acdad19a7aa67f3fb1"}]},"public":true,"created_at":"2015-01-01T01:02:49Z","org":{"id":9313156,"login":"AsteroidStation","gravatar_id":"","url":"https://api.github.com/orgs/AsteroidStation","avatar_url":"https://avatars.githubusercontent.com/u/9313156?"}}
{"id":"2489397109","type":"WatchEvent","actor":{"id":438131,"login":"linuxlizard","gravatar_id":"","url":"https://api.github.com/users/linuxlizard","avatar_url":"https://avatars.githubusercontent.com/u/438131?"},"repo":{"id":952838,"name":"adafruit/Adafruit_SSD1306","url":"https://api.github.com/repos/adafruit/Adafruit_SSD1306"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:02:52Z","org":{"id":181069,"login":"adafruit","gravatar_id":"","url":"https://api.github.com/orgs/adafruit","avatar_url":"https://avatars.githubusercontent.com/u/181069?"}}
{"id":"2489397111","type":"WatchEvent","actor":{"id":8055446,"login":"mchenla","gravatar_id":"","url":"https://api.github.com/users/mchenla","avatar_url":"https://avatars.githubusercontent.com/u/8055446?"},"repo":{"id":3816248,"name":"basecamp/bcx-api","url":"https://api.github.com/repos/basecamp/bcx-api"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:02:52Z","org":{"id":13131,"login":"basecamp","gravatar_id":"","url":"https://api.github.com/orgs/basecamp","avatar_url":"https://avatars.githubusercontent.com/u/13131?"}}
{"id":"2489397117","type":"PushEvent","actor":{"id":1059214,"login":"wlaurance","gravatar_id":"","url":"https://api.github.com/users/wlaurance","avatar_url":"https://avatars.githubusercontent.com/u/1059214?"},"repo":{"id":28050478,"name":"empirical-org/Quill-Grammar","url":"https://api.github.com/repos/empirical-org/Quill-Grammar"},"payload":{"push_id":536752803,"size":1,"distinct_size":0,"ref":"refs/heads/develop","head":"9835f267914e973c8ca53b28b85b94bdf3086ba2","before":"166d757dfcef4f5a7f9642883745a949444a131d","commits":[{"sha":"9835f267914e973c8ca53b28b85b94bdf3086ba2","author":{"email":"c55061f2e98089f7f71676646e4a1dbbd0f0ebe8@gmail.com","name":"Peter Gault"},"message":"Update README.md","distinct":false,"url":"https://api.github.com/repos/empirical-org/Quill-Grammar/commits/9835f267914e973c8ca53b28b85b94bdf3086ba2"}]},"public":true,"created_at":"2015-01-01T01:02:52Z","org":{"id":4258432,"login":"empirical-org","gravatar_id":"","url":"https://api.github.com/orgs/empirical-org","avatar_url":"https://avatars.githubusercontent.com/u/4258432?"}}
{"id":"2489397118","type":"PushEvent","actor":{"id":2851221,"login":"alkass","gravatar_id":"","url":"https://api.github.com/users/alkass","avatar_url":"https://avatars.githubusercontent.com/u/2851221?"},"repo":{"id":28678233,"name":"alkass/seQre","url":"https://api.github.com/repos/alkass/seQre"},"payload":{"push_id":536752805,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"3e46496fed34162743f34c34d45cca60df88ba6f","before":"d566054d43b3ecce423e2e8e585b3881467437d7","commits":[{"sha":"3e46496fed34162743f34c34d45cca60df88ba6f","author":{"email":"adc72828a6d71e3d0c694f02fcfcce48ee8a532b@users.noreply.github.com","name":"Fadi Hanna Al-Kass"},"message":"Delete README.md","distinct":true,"url":"https://api.github.com/repos/alkass/seQre/commits/3e46496fed34162743f34c34d45cca60df88ba6f"}]},"public":true,"created_at":"2015-01-01T01:02:52Z"}
{"id":"2489397119","type":"PushEvent","actor":{"id":3656079,"login":"marklrh","gravatar_id":"","url":"https://api.github.com/users/marklrh","avatar_url":"https://avatars.githubusercontent.com/u/3656079?"},"repo":{"id":27470715,"name":"marklrh/ocaml-cohttp-test","url":"https://api.github.com/repos/marklrh/ocaml-cohttp-test"},"payload":{"push_id":536752804,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"7525c74ee31f49f576408a7d50d1cf8b9d3d1441","before":"aa8ec0de017c8003758776739facc819e33ac7c9","commits":[{"sha":"7525c74ee31f49f576408a7d50d1cf8b9d3d1441","author":{"email":"e0e04a2320844b42511db0376599e166ab5bda54@gmail.com","name":"Runhang Li"},"message":"lint README","distinct":true,"url":"https://api.github.com/repos/marklrh/ocaml-cohttp-test/commits/7525c74ee31f49f576408a7d50d1cf8b9d3d1441"}]},"public":true,"created_at":"2015-01-01T01:02:52Z"}
{"id":"2489397120","type":"PushEvent","actor":{"id":2453862,"login":"schloo","gravatar_id":"","url":"https://api.github.com/users/schloo","avatar_url":"https://avatars.githubusercontent.com/u/2453862?"},"repo":{"id":28160579,"name":"azilnik/phetch","url":"https://api.github.com/repos/azilnik/phetch"},"payload":{"push_id":536752806,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"47f6ee4ea9a5e9d67f20809dd3876760eaf13680","before":"ab393a029b968e4d41ade0a85c86f879e171c805","commits":[{"sha":"47f6ee4ea9a5e9d67f20809dd3876760eaf13680","author":{"email":"03cd939e5e01f81bd3cbeb1977c82e3d0109cf43@Michelles-Air.home","name":"schloo"},"message":"copy and misc tweaks","distinct":true,"url":"https://api.github.com/repos/azilnik/phetch/commits/47f6ee4ea9a5e9d67f20809dd3876760eaf13680"}]},"public":true,"created_at":"2015-01-01T01:02:52Z"}
{"id":"2489397128","type":"CreateEvent","actor":{"id":1341245,"login":"asfgit","gravatar_id":"","url":"https://api.github.com/users/asfgit","avatar_url":"https://avatars.githubusercontent.com/u/1341245?"},"repo":{"id":26798421,"name":"apache/infrastructure-puppet","url":"https://api.github.com/repos/apache/infrastructure-puppet"},"payload":{"ref":"puppet-test-work","ref_type":"branch","master_branch":"master","description":"Mirror of Apache Infrastructure Puppet","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:02:53Z","org":{"id":47359,"login":"apache","gravatar_id":"","url":"https://api.github.com/orgs/apache","avatar_url":"https://avatars.githubusercontent.com/u/47359?"}}
{"id":"2489397137","type":"PushEvent","actor":{"id":965430,"login":"waltzofpearls","gravatar_id":"","url":"https://api.github.com/users/waltzofpearls","avatar_url":"https://avatars.githubusercontent.com/u/965430?"},"repo":{"id":28505561,"name":"waltzofpearls/dotfiles","url":"https://api.github.com/repos/waltzofpearls/dotfiles"},"payload":{"push_id":536752816,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d5a1f77ab903cdcf1d2ae292c7f0f259c6e32211","before":"7e0e2a2759ddafd07d02d2167359a84c7cf15194","commits":[{"sha":"d5a1f77ab903cdcf1d2ae292c7f0f259c6e32211","author":{"email":"c514db49330801e4e831feeacd2b70f6f55a5048@gmail.com","name":"Rollie Ma"},"message":"Some minor tweaks to dotfiles","distinct":true,"url":"https://api.github.com/repos/waltzofpearls/dotfiles/commits/d5a1f77ab903cdcf1d2ae292c7f0f259c6e32211"}]},"public":true,"created_at":"2015-01-01T01:02:53Z"}
{"id":"2489397138","type":"PushEvent","actor":{"id":171043,"login":"jeffnv","gravatar_id":"","url":"https://api.github.com/users/jeffnv","avatar_url":"https://avatars.githubusercontent.com/u/171043?"},"repo":{"id":28159277,"name":"jeffnv/elite-golf","url":"https://api.github.com/repos/jeffnv/elite-golf"},"payload":{"push_id":536752817,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"12162bb9f224c179a9ea7d8abbac7dadec15ee2a","before":"a88fa3bfffc1d1f4ce9b668412981ff071d9920e","commits":[{"sha":"12162bb9f224c179a9ea7d8abbac7dadec15ee2a","author":{"email":"a4a950aede9822deccc73582f88e82e913eb89d5@gmail.com","name":"Jeff Fiddler"},"message":"more useful alert when clicking idle creator map","distinct":true,"url":"https://api.github.com/repos/jeffnv/elite-golf/commits/12162bb9f224c179a9ea7d8abbac7dadec15ee2a"}]},"public":true,"created_at":"2015-01-01T01:02:53Z"}
{"id":"2489397150","type":"PushEvent","actor":{"id":904370,"login":"helhum","gravatar_id":"","url":"https://api.github.com/users/helhum","avatar_url":"https://avatars.githubusercontent.com/u/904370?"},"repo":{"id":20956969,"name":"TYPO3-Surf-CMS/Distribution","url":"https://api.github.com/repos/TYPO3-Surf-CMS/Distribution"},"payload":{"push_id":536752822,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e585c369f862ad016cdc8ac608adce8e1d2a348c","before":"f566d43f3b6ada009c3f571fac56f51b35110a46","commits":[{"sha":"e585c369f862ad016cdc8ac608adce8e1d2a348c","author":{"email":"6bf857ca7de026fbed4ae790a809a0ea640901f4@helmuthummel.de","name":"Helmut Hummel"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/TYPO3-Surf-CMS/Distribution/commits/e585c369f862ad016cdc8ac608adce8e1d2a348c"}]},"public":true,"created_at":"2015-01-01T01:02:57Z","org":{"id":7921669,"login":"TYPO3-Surf-CMS","gravatar_id":"","url":"https://api.github.com/orgs/TYPO3-Surf-CMS","avatar_url":"https://avatars.githubusercontent.com/u/7921669?"}}
{"id":"2489397154","type":"PushEvent","actor":{"id":5623501,"login":"xbony2","gravatar_id":"","url":"https://api.github.com/users/xbony2","avatar_url":"https://avatars.githubusercontent.com/u/5623501?"},"repo":{"id":28162672,"name":"xbony2/Experimental-Self-Aware-Electronic-Based-Space-Analyzing-Droid","url":"https://api.github.com/repos/xbony2/Experimental-Self-Aware-Electronic-Based-Space-Analyzing-Droid"},"payload":{"push_id":536752826,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"f151107a11fa3dbf47a1fe26ec221e49daeca203","before":"ebbaebe4084a57cc1553d710f12013d0dba10bd7","commits":[{"sha":"7fa4f074eeabe4fa22ef9042e260f81dbceda991","author":{"email":"8371f52126eb90da97b7600da3d2d08e783fe9cf@gmail.com","name":"xbony2"},"message":"nother channel","distinct":true,"url":"https://api.github.com/repos/xbony2/Experimental-Self-Aware-Electronic-Based-Space-Analyzing-Droid/commits/7fa4f074eeabe4fa22ef9042e260f81dbceda991"},{"sha":"f151107a11fa3dbf47a1fe26ec221e49daeca203","author":{"email":"8371f52126eb90da97b7600da3d2d08e783fe9cf@gmail.com","name":"xbony2"},"message":"Merge branch 'master' of https://github.com/xbony2/Experimental-Self-Aware-Electronic-Based-Space-Analyzing-Droid.git","distinct":true,"url":"https://api.github.com/repos/xbony2/Experimental-Self-Aware-Electronic-Based-Space-Analyzing-Droid/commits/f151107a11fa3dbf47a1fe26ec221e49daeca203"}]},"public":true,"created_at":"2015-01-01T01:02:57Z"}
{"id":"2489397164","type":"PushEvent","actor":{"id":1017605,"login":"wangshan","gravatar_id":"","url":"https://api.github.com/users/wangshan","avatar_url":"https://avatars.githubusercontent.com/u/1017605?"},"repo":{"id":28666633,"name":"wangshan/wangshan.github.io","url":"https://api.github.com/repos/wangshan/wangshan.github.io"},"payload":{"push_id":536752830,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"5a94fdd12e5d88be38cca22321e943d374d3e4d5","before":"92d20ac01b4767280cccaf71ee20f173529877a0","commits":[{"sha":"5a94fdd12e5d88be38cca22321e943d374d3e4d5","author":{"email":"e3e97680eb29c788f35181af31eb442b3251e18f@gmail.com","name":"Shan"},"message":"Update 2012-03-03-mac-development-environment-setup.md","distinct":true,"url":"https://api.github.com/repos/wangshan/wangshan.github.io/commits/5a94fdd12e5d88be38cca22321e943d374d3e4d5"}]},"public":true,"created_at":"2015-01-01T01:02:58Z"}
{"id":"2489397169","type":"WatchEvent","actor":{"id":1902323,"login":"zoontek","gravatar_id":"","url":"https://api.github.com/users/zoontek","avatar_url":"https://avatars.githubusercontent.com/u/1902323?"},"repo":{"id":11393110,"name":"codegangsta/cli","url":"https://api.github.com/repos/codegangsta/cli"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:02:59Z"}
{"id":"2489397179","type":"PushEvent","actor":{"id":2453862,"login":"schloo","gravatar_id":"","url":"https://api.github.com/users/schloo","avatar_url":"https://avatars.githubusercontent.com/u/2453862?"},"repo":{"id":28160579,"name":"azilnik/phetch","url":"https://api.github.com/repos/azilnik/phetch"},"payload":{"push_id":536752838,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"1b32d9c513558f8cc57ed88edff23b0d45610363","before":"47f6ee4ea9a5e9d67f20809dd3876760eaf13680","commits":[{"sha":"1b32d9c513558f8cc57ed88edff23b0d45610363","author":{"email":"03cd939e5e01f81bd3cbeb1977c82e3d0109cf43@Michelles-Air.home","name":"schloo"},"message":"revised images","distinct":true,"url":"https://api.github.com/repos/azilnik/phetch/commits/1b32d9c513558f8cc57ed88edff23b0d45610363"}]},"public":true,"created_at":"2015-01-01T01:03:01Z"}
{"id":"2489397180","type":"PullRequestEvent","actor":{"id":6737270,"login":"JorgeX","gravatar_id":"","url":"https://api.github.com/users/JorgeX","avatar_url":"https://avatars.githubusercontent.com/u/6737270?"},"repo":{"id":25890220,"name":"JorgeX/dojo_rules","url":"https://api.github.com/repos/JorgeX/dojo_rules"},"payload":{"action":"opened","number":1,"pull_request":{"url":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/1","id":26739426,"html_url":"https://github.com/JorgeX/dojo_rules/pull/1","diff_url":"https://github.com/JorgeX/dojo_rules/pull/1.diff","patch_url":"https://github.com/JorgeX/dojo_rules/pull/1.patch","issue_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues/1","number":1,"state":"open","locked":false,"title":"Deadly skills","user":{"login":"JorgeX","id":6737270,"avatar_url":"https://avatars.githubusercontent.com/u/6737270?v=3","gravatar_id":"","url":"https://api.github.com/users/JorgeX","html_url":"https://github.com/JorgeX","followers_url":"https://api.github.com/users/JorgeX/followers","following_url":"https://api.github.com/users/JorgeX/following{/other_user}","gists_url":"https://api.github.com/users/JorgeX/gists{/gist_id}","starred_url":"https://api.github.com/users/JorgeX/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JorgeX/subscriptions","organizations_url":"https://api.github.com/users/JorgeX/orgs","repos_url":"https://api.github.com/users/JorgeX/repos","events_url":"https://api.github.com/users/JorgeX/events{/privacy}","received_events_url":"https://api.github.com/users/JorgeX/received_events","type":"User","site_admin":false},"body":"ok","created_at":"2015-01-01T01:03:01Z","updated_at":"2015-01-01T01:03:01Z","closed_at":null,"merged_at":null,"merge_commit_sha":null,"assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/1/commits","review_comments_url":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/1/comments","review_comment_url":"https://api.gi
thub.com/repos/JorgeX/dojo_rules/pulls/comments/{number}","comments_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues/1/comments","statuses_url":"https://api.github.com/repos/JorgeX/dojo_rules/statuses/923b0ffbc6a7f2fc6ff55b6d415fe70f824ea5e0","head":{"label":"JorgeX:deadly_skills","ref":"deadly_skills","sha":"923b0ffbc6a7f2fc6ff55b6d415fe70f824ea5e0","user":{"login":"JorgeX","id":6737270,"avatar_url":"https://avatars.githubusercontent.com/u/6737270?v=3","gravatar_id":"","url":"https://api.github.com/users/JorgeX","html_url":"https://github.com/JorgeX","followers_url":"https://api.github.com/users/JorgeX/followers","following_url":"https://api.github.com/users/JorgeX/following{/other_user}","gists_url":"https://api.github.com/users/JorgeX/gists{/gist_id}","starred_url":"https://api.github.com/users/JorgeX/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JorgeX/subscriptions","organizations_url":"https://api.github.com/users/JorgeX/orgs","repos_url":"https://api.github.com/users/JorgeX/repos","events_url":"https://api.github.com/users/JorgeX/events{/privacy}","received_events_url":"https://api.github.com/users/JorgeX/received_events","type":"User","site_admin":false},"repo":{"id":25890220,"name":"dojo_rules","full_name":"JorgeX/dojo_rules","owner":{"login":"JorgeX","id":6737270,"avatar_url":"https://avatars.githubusercontent.com/u/6737270?v=3","gravatar_id":"","url":"https://api.github.com/users/JorgeX","html_url":"https://github.com/JorgeX","followers_url":"https://api.github.com/users/JorgeX/followers","following_url":"https://api.github.com/users/JorgeX/following{/other_user}","gists_url":"https://api.github.com/users/JorgeX/gists{/gist_id}","starred_url":"https://api.github.com/users/JorgeX/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JorgeX/subscriptions","organizations_url":"https://api.github.com/users/JorgeX/orgs","repos_url":"https://api.github.com/users/JorgeX/repos","events_url":"https://api.g
ithub.com/users/JorgeX/events{/privacy}","received_events_url":"https://api.github.com/users/JorgeX/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/JorgeX/dojo_rules","description":"","fork":true,"url":"https://api.github.com/repos/JorgeX/dojo_rules","forks_url":"https://api.github.com/repos/JorgeX/dojo_rules/forks","keys_url":"https://api.github.com/repos/JorgeX/dojo_rules/keys{/key_id}","collaborators_url":"https://api.github.com/repos/JorgeX/dojo_rules/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/JorgeX/dojo_rules/teams","hooks_url":"https://api.github.com/repos/JorgeX/dojo_rules/hooks","issue_events_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues/events{/number}","events_url":"https://api.github.com/repos/JorgeX/dojo_rules/events","assignees_url":"https://api.github.com/repos/JorgeX/dojo_rules/assignees{/user}","branches_url":"https://api.github.com/repos/JorgeX/dojo_rules/branches{/branch}","tags_url":"https://api.github.com/repos/JorgeX/dojo_rules/tags","blobs_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/refs{/sha}","trees_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/trees{/sha}","statuses_url":"https://api.github.com/repos/JorgeX/dojo_rules/statuses/{sha}","languages_url":"https://api.github.com/repos/JorgeX/dojo_rules/languages","stargazers_url":"https://api.github.com/repos/JorgeX/dojo_rules/stargazers","contributors_url":"https://api.github.com/repos/JorgeX/dojo_rules/contributors","subscribers_url":"https://api.github.com/repos/JorgeX/dojo_rules/subscribers","subscription_url":"https://api.github.com/repos/JorgeX/dojo_rules/subscription","commits_url":"https://api.github.com/repos/JorgeX/dojo_rules/commits{/sha}","git_commits_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/commit
s{/sha}","comments_url":"https://api.github.com/repos/JorgeX/dojo_rules/comments{/number}","issue_comment_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues/comments/{number}","contents_url":"https://api.github.com/repos/JorgeX/dojo_rules/contents/{+path}","compare_url":"https://api.github.com/repos/JorgeX/dojo_rules/compare/{base}...{head}","merges_url":"https://api.github.com/repos/JorgeX/dojo_rules/merges","archive_url":"https://api.github.com/repos/JorgeX/dojo_rules/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/JorgeX/dojo_rules/downloads","issues_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues{/number}","pulls_url":"https://api.github.com/repos/JorgeX/dojo_rules/pulls{/number}","milestones_url":"https://api.github.com/repos/JorgeX/dojo_rules/milestones{/number}","notifications_url":"https://api.github.com/repos/JorgeX/dojo_rules/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/JorgeX/dojo_rules/labels{/name}","releases_url":"https://api.github.com/repos/JorgeX/dojo_rules/releases{/id}","created_at":"2014-10-28T21:09:20Z","updated_at":"2014-10-28T21:13:40Z","pushed_at":"2015-01-01T01:00:43Z","git_url":"git://github.com/JorgeX/dojo_rules.git","ssh_url":"git@github.com:JorgeX/dojo_rules.git","clone_url":"https://github.com/JorgeX/dojo_rules.git","svn_url":"https://github.com/JorgeX/dojo_rules","homepage":null,"size":104,"stargazers_count":0,"watchers_count":0,"language":"Ruby","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":0,"mirror_url":null,"open_issues_count":1,"forks":0,"open_issues":1,"watchers":0,"default_branch":"master"}},"base":{"label":"JorgeX:master","ref":"master","sha":"d1b0081019d3c0e43266beaa87fee523fc684649","user":{"login":"JorgeX","id":6737270,"avatar_url":"https://avatars.githubusercontent.com/u/6737270?v=3","gravatar_id":"","url":"https://api.github.com/users/JorgeX","html_url":"https://github.com/JorgeX","followers_url":"http
s://api.github.com/users/JorgeX/followers","following_url":"https://api.github.com/users/JorgeX/following{/other_user}","gists_url":"https://api.github.com/users/JorgeX/gists{/gist_id}","starred_url":"https://api.github.com/users/JorgeX/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JorgeX/subscriptions","organizations_url":"https://api.github.com/users/JorgeX/orgs","repos_url":"https://api.github.com/users/JorgeX/repos","events_url":"https://api.github.com/users/JorgeX/events{/privacy}","received_events_url":"https://api.github.com/users/JorgeX/received_events","type":"User","site_admin":false},"repo":{"id":25890220,"name":"dojo_rules","full_name":"JorgeX/dojo_rules","owner":{"login":"JorgeX","id":6737270,"avatar_url":"https://avatars.githubusercontent.com/u/6737270?v=3","gravatar_id":"","url":"https://api.github.com/users/JorgeX","html_url":"https://github.com/JorgeX","followers_url":"https://api.github.com/users/JorgeX/followers","following_url":"https://api.github.com/users/JorgeX/following{/other_user}","gists_url":"https://api.github.com/users/JorgeX/gists{/gist_id}","starred_url":"https://api.github.com/users/JorgeX/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JorgeX/subscriptions","organizations_url":"https://api.github.com/users/JorgeX/orgs","repos_url":"https://api.github.com/users/JorgeX/repos","events_url":"https://api.github.com/users/JorgeX/events{/privacy}","received_events_url":"https://api.github.com/users/JorgeX/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/JorgeX/dojo_rules","description":"","fork":true,"url":"https://api.github.com/repos/JorgeX/dojo_rules","forks_url":"https://api.github.com/repos/JorgeX/dojo_rules/forks","keys_url":"https://api.github.com/repos/JorgeX/dojo_rules/keys{/key_id}","collaborators_url":"https://api.github.com/repos/JorgeX/dojo_rules/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/JorgeX/d
ojo_rules/teams","hooks_url":"https://api.github.com/repos/JorgeX/dojo_rules/hooks","issue_events_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues/events{/number}","events_url":"https://api.github.com/repos/JorgeX/dojo_rules/events","assignees_url":"https://api.github.com/repos/JorgeX/dojo_rules/assignees{/user}","branches_url":"https://api.github.com/repos/JorgeX/dojo_rules/branches{/branch}","tags_url":"https://api.github.com/repos/JorgeX/dojo_rules/tags","blobs_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/refs{/sha}","trees_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/trees{/sha}","statuses_url":"https://api.github.com/repos/JorgeX/dojo_rules/statuses/{sha}","languages_url":"https://api.github.com/repos/JorgeX/dojo_rules/languages","stargazers_url":"https://api.github.com/repos/JorgeX/dojo_rules/stargazers","contributors_url":"https://api.github.com/repos/JorgeX/dojo_rules/contributors","subscribers_url":"https://api.github.com/repos/JorgeX/dojo_rules/subscribers","subscription_url":"https://api.github.com/repos/JorgeX/dojo_rules/subscription","commits_url":"https://api.github.com/repos/JorgeX/dojo_rules/commits{/sha}","git_commits_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/commits{/sha}","comments_url":"https://api.github.com/repos/JorgeX/dojo_rules/comments{/number}","issue_comment_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues/comments/{number}","contents_url":"https://api.github.com/repos/JorgeX/dojo_rules/contents/{+path}","compare_url":"https://api.github.com/repos/JorgeX/dojo_rules/compare/{base}...{head}","merges_url":"https://api.github.com/repos/JorgeX/dojo_rules/merges","archive_url":"https://api.github.com/repos/JorgeX/dojo_rules/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/JorgeX/dojo_rules/downloads","issues
_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues{/number}","pulls_url":"https://api.github.com/repos/JorgeX/dojo_rules/pulls{/number}","milestones_url":"https://api.github.com/repos/JorgeX/dojo_rules/milestones{/number}","notifications_url":"https://api.github.com/repos/JorgeX/dojo_rules/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/JorgeX/dojo_rules/labels{/name}","releases_url":"https://api.github.com/repos/JorgeX/dojo_rules/releases{/id}","created_at":"2014-10-28T21:09:20Z","updated_at":"2014-10-28T21:13:40Z","pushed_at":"2015-01-01T01:00:43Z","git_url":"git://github.com/JorgeX/dojo_rules.git","ssh_url":"git@github.com:JorgeX/dojo_rules.git","clone_url":"https://github.com/JorgeX/dojo_rules.git","svn_url":"https://github.com/JorgeX/dojo_rules","homepage":null,"size":104,"stargazers_count":0,"watchers_count":0,"language":"Ruby","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":0,"mirror_url":null,"open_issues_count":1,"forks":0,"open_issues":1,"watchers":0,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/1"},"html":{"href":"https://github.com/JorgeX/dojo_rules/pull/1"},"issue":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/issues/1"},"comments":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/issues/1/comments"},"review_comments":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/1/comments"},"review_comment":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/1/commits"},"statuses":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/statuses/923b0ffbc6a7f2fc6ff55b6d415fe70f824ea5e0"}},"merged":false,"mergeable":null,"mergeable_state":"unknown","merged_by":null,"comments":0,"review_comments":0,"commits":4,"additions":6,"deletions":8,"changed_files":2}},"public":true,"created_at":"2015-01-01T
01:03:01Z"}
{"id":"2489397186","type":"IssueCommentEvent","actor":{"id":19792,"login":"wiredfool","gravatar_id":"","url":"https://api.github.com/users/wiredfool","avatar_url":"https://avatars.githubusercontent.com/u/19792?"},"repo":{"id":5171600,"name":"python-pillow/Pillow","url":"https://api.github.com/repos/python-pillow/Pillow"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/python-pillow/Pillow/issues/949","labels_url":"https://api.github.com/repos/python-pillow/Pillow/issues/949/labels{/name}","comments_url":"https://api.github.com/repos/python-pillow/Pillow/issues/949/comments","events_url":"https://api.github.com/repos/python-pillow/Pillow/issues/949/events","html_url":"https://github.com/python-pillow/Pillow/issues/949","id":45165342,"number":949,"title":"Release 2.7.0 on January 1, 2015","user":{"login":"aclark4life","id":72164,"avatar_url":"https://avatars.githubusercontent.com/u/72164?v=3","gravatar_id":"","url":"https://api.github.com/users/aclark4life","html_url":"https://github.com/aclark4life","followers_url":"https://api.github.com/users/aclark4life/followers","following_url":"https://api.github.com/users/aclark4life/following{/other_user}","gists_url":"https://api.github.com/users/aclark4life/gists{/gist_id}","starred_url":"https://api.github.com/users/aclark4life/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/aclark4life/subscriptions","organizations_url":"https://api.github.com/users/aclark4life/orgs","repos_url":"https://api.github.com/users/aclark4life/repos","events_url":"https://api.github.com/users/aclark4life/events{/privacy}","received_events_url":"https://api.github.com/users/aclark4life/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/python-pillow/Pillow/labels/Release","name":"Release","color":"bfdadc"}],"state":"open","locked":false,"assignee":null,"milestone":{"url":"https://api.github.com/repos/python-pillow/Pillow/milestones/8","labels_url":
"https://api.github.com/repos/python-pillow/Pillow/milestones/8/labels","id":840816,"number":8,"title":"2.7.0","description":"","creator":{"login":"hugovk","id":1324225,"avatar_url":"https://avatars.githubusercontent.com/u/1324225?v=3","gravatar_id":"","url":"https://api.github.com/users/hugovk","html_url":"https://github.com/hugovk","followers_url":"https://api.github.com/users/hugovk/followers","following_url":"https://api.github.com/users/hugovk/following{/other_user}","gists_url":"https://api.github.com/users/hugovk/gists{/gist_id}","starred_url":"https://api.github.com/users/hugovk/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/hugovk/subscriptions","organizations_url":"https://api.github.com/users/hugovk/orgs","repos_url":"https://api.github.com/users/hugovk/repos","events_url":"https://api.github.com/users/hugovk/events{/privacy}","received_events_url":"https://api.github.com/users/hugovk/received_events","type":"User","site_admin":false},"open_issues":7,"closed_issues":0,"state":"open","created_at":"2014-10-26T09:53:06Z","updated_at":"2014-10-26T09:55:42Z","due_on":"2015-01-01T08:00:00Z","closed_at":null},"comments":11,"created_at":"2014-10-07T20:49:47Z","updated_at":"2015-01-01T01:03:02Z","closed_at":null,"body":"OK I'm dropping off again, please use @aclark4life if you need anything or email aclark@aclark.net. 
Thank you :beers:"},"comment":{"url":"https://api.github.com/repos/python-pillow/Pillow/issues/comments/68477275","html_url":"https://github.com/python-pillow/Pillow/issues/949#issuecomment-68477275","issue_url":"https://api.github.com/repos/python-pillow/Pillow/issues/949","id":68477275,"user":{"login":"wiredfool","id":19792,"avatar_url":"https://avatars.githubusercontent.com/u/19792?v=3","gravatar_id":"","url":"https://api.github.com/users/wiredfool","html_url":"https://github.com/wiredfool","followers_url":"https://api.github.com/users/wiredfool/followers","following_url":"https://api.github.com/users/wiredfool/following{/other_user}","gists_url":"https://api.github.com/users/wiredfool/gists{/gist_id}","starred_url":"https://api.github.com/users/wiredfool/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/wiredfool/subscriptions","organizations_url":"https://api.github.com/users/wiredfool/orgs","repos_url":"https://api.github.com/users/wiredfool/repos","events_url":"https://api.github.com/users/wiredfool/events{/privacy}","received_events_url":"https://api.github.com/users/wiredfool/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:03:02Z","updated_at":"2015-01-01T01:03:02Z","body":"The scipy change appears to be because of a change in the way that image resizing works. The new version looks more reasonable to me, which fits with the conclusions that we've had from the changes in the resizing code this iteration. "}},"public":true,"created_at":"2015-01-01T01:03:02Z","org":{"id":2036701,"login":"python-pillow","gravatar_id":"","url":"https://api.github.com/orgs/python-pillow","avatar_url":"https://avatars.githubusercontent.com/u/2036701?"}}
{"id":"2489397187","type":"IssueCommentEvent","actor":{"id":100206,"login":"quicksketch","gravatar_id":"","url":"https://api.github.com/users/quicksketch","avatar_url":"https://avatars.githubusercontent.com/u/100206?"},"repo":{"id":12582950,"name":"backdrop/backdrop-issues","url":"https://api.github.com/repos/backdrop/backdrop-issues"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/backdrop/backdrop-issues/issues/521","labels_url":"https://api.github.com/repos/backdrop/backdrop-issues/issues/521/labels{/name}","comments_url":"https://api.github.com/repos/backdrop/backdrop-issues/issues/521/comments","events_url":"https://api.github.com/repos/backdrop/backdrop-issues/issues/521/events","html_url":"https://github.com/backdrop/backdrop-issues/issues/521","id":53210114,"number":521,"title":"[UX] The structure of the Structure -> Views menu makes no sense.","user":{"login":"klonos","id":2423362,"avatar_url":"https://avatars.githubusercontent.com/u/2423362?v=3","gravatar_id":"","url":"https://api.github.com/users/klonos","html_url":"https://github.com/klonos","followers_url":"https://api.github.com/users/klonos/followers","following_url":"https://api.github.com/users/klonos/following{/other_user}","gists_url":"https://api.github.com/users/klonos/gists{/gist_id}","starred_url":"https://api.github.com/users/klonos/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/klonos/subscriptions","organizations_url":"https://api.github.com/users/klonos/orgs","repos_url":"https://api.github.com/users/klonos/repos","events_url":"https://api.github.com/users/klonos/events{/privacy}","received_events_url":"https://api.github.com/users/klonos/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2015-01-01T00:57:24Z","updated_at":"2015-01-01T01:03:02Z","closed_at":null,"body":"![structure-views_menu_makes_no_sense](https://cloud.githubusercon
tent.com/assets/2423362/5591356/f4ac78aa-91aa-11e4-8142-aa0104e86099.png)\r\n\r\n1. The views submenu entries in the menu are listed in alphabetical order while in the views list page they are not.\r\n2. They are not grouped together nor listed alphabetically with the rest of the menu entries:\r\n  - The \"Add new view\", \"Import\", \"List\" and \"Settings\" entries are listed alphabetically, but not when views are added (once enabled)\r\n  - The views are listed alphabetically, but the \"Settings\" entry is included/sorted along and the alphabetization starts after the \"Add new view\", \"Import\", \"List\" trio.\r\n\r\nWTF!?!\r\n\r\nDid we mean to list the views within the \"List\" entry but failed somehow? If not, I think it would make sense to move them there.\r\n\r\nIf we do not move them under \"List\", then lets move all non-view-name entries in that menu (currently \"Add new view\", \"Import\", \"List\" and \"Settings\") at the top and list the views entries alphabetically right after them.\r\n\r\nI think that if the views entries are to be listed alphabetically in the menu, then so should they be in the index page (```/admin/structure/views```). If we choose to not list them alphabetically in the views index page, then at least keep the same order in the menu. 
If we do decide to list them alphabetically everywhere (my vote BTW), then the enabled views in the views index page should \"bubble\" up and the disabled kept down, but still in alphabetical order."},"comment":{"url":"https://api.github.com/repos/backdrop/backdrop-issues/issues/comments/68477274","html_url":"https://github.com/backdrop/backdrop-issues/issues/521#issuecomment-68477274","issue_url":"https://api.github.com/repos/backdrop/backdrop-issues/issues/521","id":68477274,"user":{"login":"quicksketch","id":100206,"avatar_url":"https://avatars.githubusercontent.com/u/100206?v=3","gravatar_id":"","url":"https://api.github.com/users/quicksketch","html_url":"https://github.com/quicksketch","followers_url":"https://api.github.com/users/quicksketch/followers","following_url":"https://api.github.com/users/quicksketch/following{/other_user}","gists_url":"https://api.github.com/users/quicksketch/gists{/gist_id}","starred_url":"https://api.github.com/users/quicksketch/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/quicksketch/subscriptions","organizations_url":"https://api.github.com/users/quicksketch/orgs","repos_url":"https://api.github.com/users/quicksketch/repos","events_url":"https://api.github.com/users/quicksketch/events{/privacy}","received_events_url":"https://api.github.com/users/quicksketch/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:03:02Z","updated_at":"2015-01-01T01:03:02Z","body":"> Did we mean to list the views within the \"List\" entry but failed somehow? If not, I think it would make sense to move them there.\r\n\r\nThis is a straight-port from D7's admin_menu. I don't think we've reconsidered anything about the way that views are listed in the menu.\r\n\r\nMy preference would be to simply remove the individual Views from the admin bar entirely. 
We don't include blocks, layouts, text formats, image styles, or any other user-created configurations within a sub-system directly within the admin bar, why are Views special? You can easily end up with dozens of views even on a moderately complex site, making use of the admin menu to navigate them hopeless anyway."}},"public":true,"created_at":"2015-01-01T01:03:02Z","org":{"id":5283039,"login":"backdrop","gravatar_id":"","url":"https://api.github.com/orgs/backdrop","avatar_url":"https://avatars.githubusercontent.com/u/5283039?"}}
{"id":"2489397193","type":"CreateEvent","actor":{"id":568036,"login":"Tyilo","gravatar_id":"","url":"https://api.github.com/users/Tyilo","avatar_url":"https://avatars.githubusercontent.com/u/568036?"},"repo":{"id":28676548,"name":"Tyilo/pyth","url":"https://api.github.com/repos/Tyilo/pyth"},"payload":{"ref":"patch-2","ref_type":"branch","master_branch":"master","description":"Pyth, an extremely concise language. Try it here:","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:03:03Z"}
{"id":"2489397194","type":"PushEvent","actor":{"id":616495,"login":"harveyt","gravatar_id":"","url":"https://api.github.com/users/harveyt","avatar_url":"https://avatars.githubusercontent.com/u/616495?"},"repo":{"id":28677911,"name":"harveyt/harveyt.github.io","url":"https://api.github.com/repos/harveyt/harveyt.github.io"},"payload":{"push_id":536752843,"size":2,"distinct_size":2,"ref":"refs/heads/source","head":"9f57ade1c98efb400f57d710a69c272464596ba4","before":"44fbf89a779b08acc862d4177398f8cb7b1eed3d","commits":[{"sha":"6a98c29ce4e4d65ba4958c06a382a935f931a20a","author":{"email":"5b18f340f96afc1bfd4fbf498467b8b0cb41ea73@me.com","name":"Harvey Thompson"},"message":"Added _deploy.yml for github publishing.","distinct":true,"url":"https://api.github.com/repos/harveyt/harveyt.github.io/commits/6a98c29ce4e4d65ba4958c06a382a935f931a20a"},{"sha":"9f57ade1c98efb400f57d710a69c272464596ba4","author":{"email":"5b18f340f96afc1bfd4fbf498467b8b0cb41ea73@me.com","name":"Harvey Thompson"},"message":"Final tweaks before first publish.","distinct":true,"url":"https://api.github.com/repos/harveyt/harveyt.github.io/commits/9f57ade1c98efb400f57d710a69c272464596ba4"}]},"public":true,"created_at":"2015-01-01T01:03:03Z"}
{"id":"2489397210","type":"WatchEvent","actor":{"id":9970148,"login":"bchoomnuan","gravatar_id":"","url":"https://api.github.com/users/bchoomnuan","avatar_url":"https://avatars.githubusercontent.com/u/9970148?"},"repo":{"id":27032923,"name":"dockerboard/dockerboard","url":"https://api.github.com/repos/dockerboard/dockerboard"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:03:05Z","org":{"id":9627875,"login":"dockerboard","gravatar_id":"","url":"https://api.github.com/orgs/dockerboard","avatar_url":"https://avatars.githubusercontent.com/u/9627875?"}}
{"id":"2489397216","type":"PushEvent","actor":{"id":9515067,"login":"freundTech","gravatar_id":"","url":"https://api.github.com/users/freundTech","avatar_url":"https://avatars.githubusercontent.com/u/9515067?"},"repo":{"id":27674403,"name":"freundTech/lightDMX","url":"https://api.github.com/repos/freundTech/lightDMX"},"payload":{"push_id":536752852,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"5a3fdac84c88e3bc2e2b24afa750b5ca36e74bc4","before":"1949bbb851b79b526154c7cec6a0e7e00f1420a6","commits":[{"sha":"5a3fdac84c88e3bc2e2b24afa750b5ca36e74bc4","author":{"email":"d6643dd9a6fe6114980ecaf6d787b2a0da7fc377@gmail.com","name":"Adrian"},"message":"Updated TODO","distinct":true,"url":"https://api.github.com/repos/freundTech/lightDMX/commits/5a3fdac84c88e3bc2e2b24afa750b5ca36e74bc4"}]},"public":true,"created_at":"2015-01-01T01:03:07Z"}
{"id":"2489397221","type":"PushEvent","actor":{"id":3635680,"login":"BatikhSouri","gravatar_id":"","url":"https://api.github.com/users/BatikhSouri","avatar_url":"https://avatars.githubusercontent.com/u/3635680?"},"repo":{"id":28186746,"name":"BatikhSouri/git-lesson","url":"https://api.github.com/repos/BatikhSouri/git-lesson"},"payload":{"push_id":536752856,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"0f00c9c76eb55c71f81be40fd7479c7923bf8187","before":"b6b546ecf0c97fffcb8c4d0cd8bd1554d256abca","commits":[{"sha":"0f00c9c76eb55c71f81be40fd7479c7923bf8187","author":{"email":"965e9967770cc67c48586cfa730edd14b783f677@gmail.com","name":"Syrian Watermelon"},"message":"Improving the lesson parsing, among other little tweaks","distinct":true,"url":"https://api.github.com/repos/BatikhSouri/git-lesson/commits/0f00c9c76eb55c71f81be40fd7479c7923bf8187"}]},"public":true,"created_at":"2015-01-01T01:03:07Z"}
{"id":"2489397225","type":"PushEvent","actor":{"id":1745861,"login":"topaztee","gravatar_id":"","url":"https://api.github.com/users/topaztee","avatar_url":"https://avatars.githubusercontent.com/u/1745861?"},"repo":{"id":28677407,"name":"topaztee/topaztee.github.io","url":"https://api.github.com/repos/topaztee/topaztee.github.io"},"payload":{"push_id":536752857,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"70a7d7ee278b87fbcbe0c785d3ec3c1dcb12a8d4","before":"a66e99dc9be241e6a513acfcc79ac27757a4a5bb","commits":[{"sha":"70a7d7ee278b87fbcbe0c785d3ec3c1dcb12a8d4","author":{"email":"f74c82d708bb42a372674042ebc8a1411fbc9344@192-168-1-2.tpgi.com.au","name":"topaztur@gmail.com"},"message":"Blog update at 2015-01-01 01:03:00","distinct":true,"url":"https://api.github.com/repos/topaztee/topaztee.github.io/commits/70a7d7ee278b87fbcbe0c785d3ec3c1dcb12a8d4"}]},"public":true,"created_at":"2015-01-01T01:03:07Z"}
{"id":"2489397239","type":"WatchEvent","actor":{"id":923144,"login":"pythonesque","gravatar_id":"","url":"https://api.github.com/users/pythonesque","avatar_url":"https://avatars.githubusercontent.com/u/923144?"},"repo":{"id":1698955,"name":"csmith-project/csmith","url":"https://api.github.com/repos/csmith-project/csmith"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:03:09Z","org":{"id":757200,"login":"csmith-project","gravatar_id":"","url":"https://api.github.com/orgs/csmith-project","avatar_url":"https://avatars.githubusercontent.com/u/757200?"}}
{"id":"2489397243","type":"IssuesEvent","actor":{"id":2222834,"login":"madeofwin","gravatar_id":"","url":"https://api.github.com/users/madeofwin","avatar_url":"https://avatars.githubusercontent.com/u/2222834?"},"repo":{"id":12279254,"name":"cudamat/cudamat","url":"https://api.github.com/repos/cudamat/cudamat"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/cudamat/cudamat/issues/40","labels_url":"https://api.github.com/repos/cudamat/cudamat/issues/40/labels{/name}","comments_url":"https://api.github.com/repos/cudamat/cudamat/issues/40/comments","events_url":"https://api.github.com/repos/cudamat/cudamat/issues/40/events","html_url":"https://github.com/cudamat/cudamat/issues/40","id":53210222,"number":40,"title":"nvcc fatal   : Path to libdevice library not specified","user":{"login":"madeofwin","id":2222834,"avatar_url":"https://avatars.githubusercontent.com/u/2222834?v=3","gravatar_id":"","url":"https://api.github.com/users/madeofwin","html_url":"https://github.com/madeofwin","followers_url":"https://api.github.com/users/madeofwin/followers","following_url":"https://api.github.com/users/madeofwin/following{/other_user}","gists_url":"https://api.github.com/users/madeofwin/gists{/gist_id}","starred_url":"https://api.github.com/users/madeofwin/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/madeofwin/subscriptions","organizations_url":"https://api.github.com/users/madeofwin/orgs","repos_url":"https://api.github.com/users/madeofwin/repos","events_url":"https://api.github.com/users/madeofwin/events{/privacy}","received_events_url":"https://api.github.com/users/madeofwin/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:03:09Z","updated_at":"2015-01-01T01:03:09Z","closed_at":null,"body":"Hi, I'm running a fresh ubuntu 14.04 installation with Cuda 6.5 and a GT650M. 
I downloaded the deb files from the official nvidia cuda site, added it via dpkg and executed 'sudo apt-get install cuda'. This installed Cuda 6.5 and nvidia-340 drivers. However, I'm running into troubles when I try to install cudamat by 'sudo python install setup.py', see the output:\r\n\r\nrunning install\r\nrunning bdist_egg\r\nrunning egg_info\r\nwriting cudamat.egg-info/PKG-INFO\r\nwriting top-level names to cudamat.egg-info/top_level.txt\r\nwriting dependency_links to cudamat.egg-info/dependency_links.txt\r\nreading manifest file 'cudamat.egg-info/SOURCES.txt'\r\nwriting manifest file 'cudamat.egg-info/SOURCES.txt'\r\ninstalling library code to build/bdist.linux-x86_64/egg\r\nrunning install_lib\r\nrunning build_py\r\nrunning build_ext\r\nbuilding 'cudamat.libcudamat' extension\r\nnvcc -I/usr/include/python2.7 -c cudamat/cudamat.cu -o build/temp.linux-x86_64-2.7/cudamat/cudamat.o -O --ptxas-options=-v --compiler-options '-fPIC'\r\nnvcc fatal   : Path to libdevice library not specified\r\nerror: command 'nvcc' failed with exit status 1\r\n\r\nI'm googling and trying different things for hours now and can't find a solutions. cuda examples are running without problems. Can you help me out?\r\n"}},"public":true,"created_at":"2015-01-01T01:03:09Z","org":{"id":5281810,"login":"cudamat","gravatar_id":"","url":"https://api.github.com/orgs/cudamat","avatar_url":"https://avatars.githubusercontent.com/u/5281810?"}}
{"id":"2489397244","type":"CreateEvent","actor":{"id":838098,"login":"burgerbecky","gravatar_id":"","url":"https://api.github.com/users/burgerbecky","avatar_url":"https://avatars.githubusercontent.com/u/838098?"},"repo":{"id":28677547,"name":"burgerbecky/glslvisualstudio","url":"https://api.github.com/repos/burgerbecky/glslvisualstudio"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"Visual Studio Plug in to add in GLSL source as directly linked source code","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:03:09Z"}
{"id":"2489397246","type":"PushEvent","actor":{"id":1398544,"login":"joelpurra","gravatar_id":"","url":"https://api.github.com/users/joelpurra","avatar_url":"https://avatars.githubusercontent.com/u/1398544?"},"repo":{"id":28595466,"name":"joelpurra/jqnpm","url":"https://api.github.com/repos/joelpurra/jqnpm"},"payload":{"push_id":536752863,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"402ca05191199df582b663242f0e000d6fb33292","before":"fbb2a9631bf887443ad696637417d1564f07f56b","commits":[{"sha":"591fa3c627d7a3eeee457ed5daf7a997a5469338","author":{"email":"4774889311d71ea3a81d88c867cde99c6ccb427e@joelpurra.com","name":"Joel Purra"},"message":"Only clean folders affected by tests, not generated bundles - and re-add an ignored file","distinct":true,"url":"https://api.github.com/repos/joelpurra/jqnpm/commits/591fa3c627d7a3eeee457ed5daf7a997a5469338"},{"sha":"402ca05191199df582b663242f0e000d6fb33292","author":{"email":"4774889311d71ea3a81d88c867cde99c6ccb427e@joelpurra.com","name":"Joel Purra"},"message":"Encourage cleaning up files, regenerating bundles","distinct":true,"url":"https://api.github.com/repos/joelpurra/jqnpm/commits/402ca05191199df582b663242f0e000d6fb33292"}]},"public":true,"created_at":"2015-01-01T01:03:10Z"}
{"id":"2489397249","type":"IssuesEvent","actor":{"id":4712580,"login":"ericdahl","gravatar_id":"","url":"https://api.github.com/users/ericdahl","avatar_url":"https://avatars.githubusercontent.com/u/4712580?"},"repo":{"id":9396682,"name":"spring-guides/gs-rest-service","url":"https://api.github.com/repos/spring-guides/gs-rest-service"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/spring-guides/gs-rest-service/issues/28","labels_url":"https://api.github.com/repos/spring-guides/gs-rest-service/issues/28/labels{/name}","comments_url":"https://api.github.com/repos/spring-guides/gs-rest-service/issues/28/comments","events_url":"https://api.github.com/repos/spring-guides/gs-rest-service/issues/28/events","html_url":"https://github.com/spring-guides/gs-rest-service/issues/28","id":53210223,"number":28,"title":"pom.xml has unnecessary <start-class>","user":{"login":"ericdahl","id":4712580,"avatar_url":"https://avatars.githubusercontent.com/u/4712580?v=3","gravatar_id":"","url":"https://api.github.com/users/ericdahl","html_url":"https://github.com/ericdahl","followers_url":"https://api.github.com/users/ericdahl/followers","following_url":"https://api.github.com/users/ericdahl/following{/other_user}","gists_url":"https://api.github.com/users/ericdahl/gists{/gist_id}","starred_url":"https://api.github.com/users/ericdahl/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ericdahl/subscriptions","organizations_url":"https://api.github.com/users/ericdahl/orgs","repos_url":"https://api.github.com/users/ericdahl/repos","events_url":"https://api.github.com/users/ericdahl/events{/privacy}","received_events_url":"https://api.github.com/users/ericdahl/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:03:10Z","updated_at":"2015-01-01T01:03:10Z","closed_at":null,"body":"I was confused to see that the ```pom.xml``` 
includes:\r\n\r\n```xml\r\n<properties>\r\n    <start-class>hello.Application</start-class>\r\n</properties>\r\n```\r\n\r\nsince the [main documentation](http://docs.spring.io/spring-boot/docs/current-SNAPSHOT/reference/htmlsingle/#getting-started-first-application-pom) doesn't include references to it. It's unnecessary and adds unnecessary complexity for a getting started guide.\r\n\r\nI was about to submit a pull request to remove it, but then I saw that all of the spring-guides include it. Possibly there's some reason for keeping it?\r\n"}},"public":true,"created_at":"2015-01-01T01:03:10Z","org":{"id":4161866,"login":"spring-guides","gravatar_id":"","url":"https://api.github.com/orgs/spring-guides","avatar_url":"https://avatars.githubusercontent.com/u/4161866?"}}
{"id":"2489397250","type":"PullRequestReviewCommentEvent","actor":{"id":7882662,"login":"codeschool-kiddo","gravatar_id":"","url":"https://api.github.com/users/codeschool-kiddo","avatar_url":"https://avatars.githubusercontent.com/u/7882662?"},"repo":{"id":25890220,"name":"JorgeX/dojo_rules","url":"https://api.github.com/repos/JorgeX/dojo_rules"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/comments/22397268","id":22397268,"diff_hunk":"@@ -1,3 +1,3 @@\n-Hello, Deadly vipers\n-regards, Jorge!\n-Favourite path: Javascript\n+* GitG\n+* Java\n+* polle\n\\ No newline at end of file","path":"introduction.md","position":7,"original_position":7,"commit_id":"923b0ffbc6a7f2fc6ff55b6d415fe70f824ea5e0","original_commit_id":"923b0ffbc6a7f2fc6ff55b6d415fe70f824ea5e0","user":{"login":"codeschool-kiddo","id":7882662,"avatar_url":"https://avatars.githubusercontent.com/u/7882662?v=3","gravatar_id":"","url":"https://api.github.com/users/codeschool-kiddo","html_url":"https://github.com/codeschool-kiddo","followers_url":"https://api.github.com/users/codeschool-kiddo/followers","following_url":"https://api.github.com/users/codeschool-kiddo/following{/other_user}","gists_url":"https://api.github.com/users/codeschool-kiddo/gists{/gist_id}","starred_url":"https://api.github.com/users/codeschool-kiddo/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/codeschool-kiddo/subscriptions","organizations_url":"https://api.github.com/users/codeschool-kiddo/orgs","repos_url":"https://api.github.com/users/codeschool-kiddo/repos","events_url":"https://api.github.com/users/codeschool-kiddo/events{/privacy}","received_events_url":"https://api.github.com/users/codeschool-kiddo/received_events","type":"User","site_admin":false},"body":"Since you're becoming a GitHub master, could you also add \"Killing history using git rebase\" as one of your deadly 
skills?","created_at":"2015-01-01T01:03:10Z","updated_at":"2015-01-01T01:03:10Z","html_url":"https://github.com/JorgeX/dojo_rules/pull/1#discussion_r22397268","pull_request_url":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/1","_links":{"self":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/comments/22397268"},"html":{"href":"https://github.com/JorgeX/dojo_rules/pull/1#discussion_r22397268"},"pull_request":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/1"}}},"pull_request":{"url":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/1","id":26739426,"html_url":"https://github.com/JorgeX/dojo_rules/pull/1","diff_url":"https://github.com/JorgeX/dojo_rules/pull/1.diff","patch_url":"https://github.com/JorgeX/dojo_rules/pull/1.patch","issue_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues/1","number":1,"state":"open","locked":false,"title":"Deadly skills","user":{"login":"JorgeX","id":6737270,"avatar_url":"https://avatars.githubusercontent.com/u/6737270?v=3","gravatar_id":"","url":"https://api.github.com/users/JorgeX","html_url":"https://github.com/JorgeX","followers_url":"https://api.github.com/users/JorgeX/followers","following_url":"https://api.github.com/users/JorgeX/following{/other_user}","gists_url":"https://api.github.com/users/JorgeX/gists{/gist_id}","starred_url":"https://api.github.com/users/JorgeX/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JorgeX/subscriptions","organizations_url":"https://api.github.com/users/JorgeX/orgs","repos_url":"https://api.github.com/users/JorgeX/repos","events_url":"https://api.github.com/users/JorgeX/events{/privacy}","received_events_url":"https://api.github.com/users/JorgeX/received_events","type":"User","site_admin":false},"body":"ok","created_at":"2015-01-01T01:03:01Z","updated_at":"2015-01-01T01:03:10Z","closed_at":null,"merged_at":null,"merge_commit_sha":"fe9e81e8157ba236bc48b8ee411b4e12fc8666e4","assignee":null,"milestone":null,"commits_url":"https
://api.github.com/repos/JorgeX/dojo_rules/pulls/1/commits","review_comments_url":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/1/comments","review_comment_url":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/comments/{number}","comments_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues/1/comments","statuses_url":"https://api.github.com/repos/JorgeX/dojo_rules/statuses/923b0ffbc6a7f2fc6ff55b6d415fe70f824ea5e0","head":{"label":"JorgeX:deadly_skills","ref":"deadly_skills","sha":"923b0ffbc6a7f2fc6ff55b6d415fe70f824ea5e0","user":{"login":"JorgeX","id":6737270,"avatar_url":"https://avatars.githubusercontent.com/u/6737270?v=3","gravatar_id":"","url":"https://api.github.com/users/JorgeX","html_url":"https://github.com/JorgeX","followers_url":"https://api.github.com/users/JorgeX/followers","following_url":"https://api.github.com/users/JorgeX/following{/other_user}","gists_url":"https://api.github.com/users/JorgeX/gists{/gist_id}","starred_url":"https://api.github.com/users/JorgeX/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JorgeX/subscriptions","organizations_url":"https://api.github.com/users/JorgeX/orgs","repos_url":"https://api.github.com/users/JorgeX/repos","events_url":"https://api.github.com/users/JorgeX/events{/privacy}","received_events_url":"https://api.github.com/users/JorgeX/received_events","type":"User","site_admin":false},"repo":{"id":25890220,"name":"dojo_rules","full_name":"JorgeX/dojo_rules","owner":{"login":"JorgeX","id":6737270,"avatar_url":"https://avatars.githubusercontent.com/u/6737270?v=3","gravatar_id":"","url":"https://api.github.com/users/JorgeX","html_url":"https://github.com/JorgeX","followers_url":"https://api.github.com/users/JorgeX/followers","following_url":"https://api.github.com/users/JorgeX/following{/other_user}","gists_url":"https://api.github.com/users/JorgeX/gists{/gist_id}","starred_url":"https://api.github.com/users/JorgeX/starred{/owner}{/repo}","subscriptions_url":"https://api.gi
thub.com/users/JorgeX/subscriptions","organizations_url":"https://api.github.com/users/JorgeX/orgs","repos_url":"https://api.github.com/users/JorgeX/repos","events_url":"https://api.github.com/users/JorgeX/events{/privacy}","received_events_url":"https://api.github.com/users/JorgeX/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/JorgeX/dojo_rules","description":"","fork":true,"url":"https://api.github.com/repos/JorgeX/dojo_rules","forks_url":"https://api.github.com/repos/JorgeX/dojo_rules/forks","keys_url":"https://api.github.com/repos/JorgeX/dojo_rules/keys{/key_id}","collaborators_url":"https://api.github.com/repos/JorgeX/dojo_rules/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/JorgeX/dojo_rules/teams","hooks_url":"https://api.github.com/repos/JorgeX/dojo_rules/hooks","issue_events_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues/events{/number}","events_url":"https://api.github.com/repos/JorgeX/dojo_rules/events","assignees_url":"https://api.github.com/repos/JorgeX/dojo_rules/assignees{/user}","branches_url":"https://api.github.com/repos/JorgeX/dojo_rules/branches{/branch}","tags_url":"https://api.github.com/repos/JorgeX/dojo_rules/tags","blobs_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/refs{/sha}","trees_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/trees{/sha}","statuses_url":"https://api.github.com/repos/JorgeX/dojo_rules/statuses/{sha}","languages_url":"https://api.github.com/repos/JorgeX/dojo_rules/languages","stargazers_url":"https://api.github.com/repos/JorgeX/dojo_rules/stargazers","contributors_url":"https://api.github.com/repos/JorgeX/dojo_rules/contributors","subscribers_url":"https://api.github.com/repos/JorgeX/dojo_rules/subscribers","subscription_url":"https://api.github.com/repos/Jo
rgeX/dojo_rules/subscription","commits_url":"https://api.github.com/repos/JorgeX/dojo_rules/commits{/sha}","git_commits_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/commits{/sha}","comments_url":"https://api.github.com/repos/JorgeX/dojo_rules/comments{/number}","issue_comment_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues/comments/{number}","contents_url":"https://api.github.com/repos/JorgeX/dojo_rules/contents/{+path}","compare_url":"https://api.github.com/repos/JorgeX/dojo_rules/compare/{base}...{head}","merges_url":"https://api.github.com/repos/JorgeX/dojo_rules/merges","archive_url":"https://api.github.com/repos/JorgeX/dojo_rules/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/JorgeX/dojo_rules/downloads","issues_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues{/number}","pulls_url":"https://api.github.com/repos/JorgeX/dojo_rules/pulls{/number}","milestones_url":"https://api.github.com/repos/JorgeX/dojo_rules/milestones{/number}","notifications_url":"https://api.github.com/repos/JorgeX/dojo_rules/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/JorgeX/dojo_rules/labels{/name}","releases_url":"https://api.github.com/repos/JorgeX/dojo_rules/releases{/id}","created_at":"2014-10-28T21:09:20Z","updated_at":"2014-10-28T21:13:40Z","pushed_at":"2015-01-01T01:00:43Z","git_url":"git://github.com/JorgeX/dojo_rules.git","ssh_url":"git@github.com:JorgeX/dojo_rules.git","clone_url":"https://github.com/JorgeX/dojo_rules.git","svn_url":"https://github.com/JorgeX/dojo_rules","homepage":null,"size":104,"stargazers_count":0,"watchers_count":0,"language":"Ruby","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":0,"mirror_url":null,"open_issues_count":1,"forks":0,"open_issues":1,"watchers":0,"default_branch":"master"}},"base":{"label":"JorgeX:master","ref":"master","sha":"d1b0081019d3c0e43266beaa87fee523fc684649","user":{"login":"JorgeX","id":6737270,"avat
ar_url":"https://avatars.githubusercontent.com/u/6737270?v=3","gravatar_id":"","url":"https://api.github.com/users/JorgeX","html_url":"https://github.com/JorgeX","followers_url":"https://api.github.com/users/JorgeX/followers","following_url":"https://api.github.com/users/JorgeX/following{/other_user}","gists_url":"https://api.github.com/users/JorgeX/gists{/gist_id}","starred_url":"https://api.github.com/users/JorgeX/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JorgeX/subscriptions","organizations_url":"https://api.github.com/users/JorgeX/orgs","repos_url":"https://api.github.com/users/JorgeX/repos","events_url":"https://api.github.com/users/JorgeX/events{/privacy}","received_events_url":"https://api.github.com/users/JorgeX/received_events","type":"User","site_admin":false},"repo":{"id":25890220,"name":"dojo_rules","full_name":"JorgeX/dojo_rules","owner":{"login":"JorgeX","id":6737270,"avatar_url":"https://avatars.githubusercontent.com/u/6737270?v=3","gravatar_id":"","url":"https://api.github.com/users/JorgeX","html_url":"https://github.com/JorgeX","followers_url":"https://api.github.com/users/JorgeX/followers","following_url":"https://api.github.com/users/JorgeX/following{/other_user}","gists_url":"https://api.github.com/users/JorgeX/gists{/gist_id}","starred_url":"https://api.github.com/users/JorgeX/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JorgeX/subscriptions","organizations_url":"https://api.github.com/users/JorgeX/orgs","repos_url":"https://api.github.com/users/JorgeX/repos","events_url":"https://api.github.com/users/JorgeX/events{/privacy}","received_events_url":"https://api.github.com/users/JorgeX/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/JorgeX/dojo_rules","description":"","fork":true,"url":"https://api.github.com/repos/JorgeX/dojo_rules","forks_url":"https://api.github.com/repos/JorgeX/dojo_rules/forks","keys_url":"https://api.github.com/repo
s/JorgeX/dojo_rules/keys{/key_id}","collaborators_url":"https://api.github.com/repos/JorgeX/dojo_rules/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/JorgeX/dojo_rules/teams","hooks_url":"https://api.github.com/repos/JorgeX/dojo_rules/hooks","issue_events_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues/events{/number}","events_url":"https://api.github.com/repos/JorgeX/dojo_rules/events","assignees_url":"https://api.github.com/repos/JorgeX/dojo_rules/assignees{/user}","branches_url":"https://api.github.com/repos/JorgeX/dojo_rules/branches{/branch}","tags_url":"https://api.github.com/repos/JorgeX/dojo_rules/tags","blobs_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/refs{/sha}","trees_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/trees{/sha}","statuses_url":"https://api.github.com/repos/JorgeX/dojo_rules/statuses/{sha}","languages_url":"https://api.github.com/repos/JorgeX/dojo_rules/languages","stargazers_url":"https://api.github.com/repos/JorgeX/dojo_rules/stargazers","contributors_url":"https://api.github.com/repos/JorgeX/dojo_rules/contributors","subscribers_url":"https://api.github.com/repos/JorgeX/dojo_rules/subscribers","subscription_url":"https://api.github.com/repos/JorgeX/dojo_rules/subscription","commits_url":"https://api.github.com/repos/JorgeX/dojo_rules/commits{/sha}","git_commits_url":"https://api.github.com/repos/JorgeX/dojo_rules/git/commits{/sha}","comments_url":"https://api.github.com/repos/JorgeX/dojo_rules/comments{/number}","issue_comment_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues/comments/{number}","contents_url":"https://api.github.com/repos/JorgeX/dojo_rules/contents/{+path}","compare_url":"https://api.github.com/repos/JorgeX/dojo_rules/compare/{base}...{head}","merges_url":"https://api.github.com/repos/JorgeX/dojo
_rules/merges","archive_url":"https://api.github.com/repos/JorgeX/dojo_rules/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/JorgeX/dojo_rules/downloads","issues_url":"https://api.github.com/repos/JorgeX/dojo_rules/issues{/number}","pulls_url":"https://api.github.com/repos/JorgeX/dojo_rules/pulls{/number}","milestones_url":"https://api.github.com/repos/JorgeX/dojo_rules/milestones{/number}","notifications_url":"https://api.github.com/repos/JorgeX/dojo_rules/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/JorgeX/dojo_rules/labels{/name}","releases_url":"https://api.github.com/repos/JorgeX/dojo_rules/releases{/id}","created_at":"2014-10-28T21:09:20Z","updated_at":"2014-10-28T21:13:40Z","pushed_at":"2015-01-01T01:00:43Z","git_url":"git://github.com/JorgeX/dojo_rules.git","ssh_url":"git@github.com:JorgeX/dojo_rules.git","clone_url":"https://github.com/JorgeX/dojo_rules.git","svn_url":"https://github.com/JorgeX/dojo_rules","homepage":null,"size":104,"stargazers_count":0,"watchers_count":0,"language":"Ruby","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":0,"mirror_url":null,"open_issues_count":1,"forks":0,"open_issues":1,"watchers":0,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/1"},"html":{"href":"https://github.com/JorgeX/dojo_rules/pull/1"},"issue":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/issues/1"},"comments":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/issues/1/comments"},"review_comments":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/1/comments"},"review_comment":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/pulls/1/commits"},"statuses":{"href":"https://api.github.com/repos/JorgeX/dojo_rules/statuses/923b0ffbc6a7f2fc6ff55b6d415fe70f824ea5e0"}}}},"public":true,"created_a
t":"2015-01-01T01:03:10Z"}
{"id":"2489397251","type":"PushEvent","actor":{"id":13564,"login":"ezyang","gravatar_id":"","url":"https://api.github.com/users/ezyang","avatar_url":"https://avatars.githubusercontent.com/u/13564?"},"repo":{"id":28672247,"name":"ezyang/stenowiki","url":"https://api.github.com/repos/ezyang/stenowiki"},"payload":{"push_id":536752865,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"36ab97683d88f48611b24a8afd888d18fa660fea","before":"82d4215f37b7f39a5b818fc53b8120650648da8b","commits":[{"sha":"36ab97683d88f48611b24a8afd888d18fa660fea","author":{"email":"dbd597f5635f432486c5d365e9bb585b3eaa1853@cs.stanford.edu","name":"Edward Z. Yang"},"message":"Plz to not truncate\n\nSigned-off-by: Edward Z. Yang <ezyang@cs.stanford.edu>","distinct":true,"url":"https://api.github.com/repos/ezyang/stenowiki/commits/36ab97683d88f48611b24a8afd888d18fa660fea"}]},"public":true,"created_at":"2015-01-01T01:03:10Z"}
{"id":"2489397252","type":"PushEvent","actor":{"id":9101573,"login":"megantmcginley","gravatar_id":"","url":"https://api.github.com/users/megantmcginley","avatar_url":"https://avatars.githubusercontent.com/u/9101573?"},"repo":{"id":25549968,"name":"megantmcginley/megantmcginley.github.io","url":"https://api.github.com/repos/megantmcginley/megantmcginley.github.io"},"payload":{"push_id":536752866,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1ac2c938f5436c6ff9576e262b80ccbced4586a8","before":"e613a42ea94329f38b4f9994b48ccd4f845a5225","commits":[{"sha":"1ac2c938f5436c6ff9576e262b80ccbced4586a8","author":{"email":"92f56e51255edbb80c74150d0115560b34c2bc35@users.noreply.github.com","name":"megantmcginley"},"message":"Update about.html","distinct":true,"url":"https://api.github.com/repos/megantmcginley/megantmcginley.github.io/commits/1ac2c938f5436c6ff9576e262b80ccbced4586a8"}]},"public":true,"created_at":"2015-01-01T01:03:11Z"}
{"id":"2489397253","type":"PushEvent","actor":{"id":6539368,"login":"acecodes","gravatar_id":"","url":"https://api.github.com/users/acecodes","avatar_url":"https://avatars.githubusercontent.com/u/6539368?"},"repo":{"id":28677898,"name":"acecodes/ace_website_jekyll","url":"https://api.github.com/repos/acecodes/ace_website_jekyll"},"payload":{"push_id":536752867,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"3ae19325c6d52115bd67dd5e3c30d7cf39919dd4","before":"771ef2fd1fb62b6fbb993ea283997c1ec6669062","commits":[{"sha":"3ae19325c6d52115bd67dd5e3c30d7cf39919dd4","author":{"email":"c74c402f1e088afb65e1933981f21221d4142751@gmail.com","name":"Ace"},"message":"Added web dev section and cleaned up contact form","distinct":true,"url":"https://api.github.com/repos/acecodes/ace_website_jekyll/commits/3ae19325c6d52115bd67dd5e3c30d7cf39919dd4"}]},"public":true,"created_at":"2015-01-01T01:03:11Z"}
{"id":"2489397255","type":"WatchEvent","actor":{"id":5352,"login":"juno","gravatar_id":"","url":"https://api.github.com/users/juno","avatar_url":"https://avatars.githubusercontent.com/u/5352?"},"repo":{"id":28648528,"name":"josh/cafe-js","url":"https://api.github.com/repos/josh/cafe-js"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:03:12Z"}
{"id":"2489397260","type":"PushEvent","actor":{"id":6232704,"login":"nashpitre","gravatar_id":"","url":"https://api.github.com/users/nashpitre","avatar_url":"https://avatars.githubusercontent.com/u/6232704?"},"repo":{"id":28620312,"name":"nashpitre/nashpitre.github.io","url":"https://api.github.com/repos/nashpitre/nashpitre.github.io"},"payload":{"push_id":536752869,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"5a1d53fae41d4355c5710a87efbe6cfd6c96a539","before":"51b30814df5685fd473d136c26735a17cf577361","commits":[{"sha":"5a1d53fae41d4355c5710a87efbe6cfd6c96a539","author":{"email":"be30e9ada7478b999c213bbb3535884788d4bb46@me.com","name":"nashpitre"},"message":"revert","distinct":true,"url":"https://api.github.com/repos/nashpitre/nashpitre.github.io/commits/5a1d53fae41d4355c5710a87efbe6cfd6c96a539"}]},"public":true,"created_at":"2015-01-01T01:03:12Z"}
{"id":"2489397261","type":"PushEvent","actor":{"id":1386607,"login":"nbransby","gravatar_id":"","url":"https://api.github.com/users/nbransby","avatar_url":"https://avatars.githubusercontent.com/u/1386607?"},"repo":{"id":25346686,"name":"hambroperks/joda-convert","url":"https://api.github.com/repos/hambroperks/joda-convert"},"payload":{"push_id":536752870,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"80741e6ce6fa90f13d52b94fa7ebaa8347589d01","before":"73695867751ce7e02a24ca5d8eb8ce23025f9c57","commits":[{"sha":"6df78b2d5f529fdd8c731af40bc528c9faa357b7","author":{"email":"75ef9faee755c70589550b513ad881e5a603182c@laundrapp.com","name":"Nicholas Bransby-Williams"},"message":"add gradle wrapper","distinct":true,"url":"https://api.github.com/repos/hambroperks/joda-convert/commits/6df78b2d5f529fdd8c731af40bc528c9faa357b7"},{"sha":"80741e6ce6fa90f13d52b94fa7ebaa8347589d01","author":{"email":"75ef9faee755c70589550b513ad881e5a603182c@laundrapp.com","name":"Nicholas Bransby-Williams"},"message":"translate with 0.9.5","distinct":true,"url":"https://api.github.com/repos/hambroperks/joda-convert/commits/80741e6ce6fa90f13d52b94fa7ebaa8347589d01"}]},"public":true,"created_at":"2015-01-01T01:03:12Z","org":{"id":9292560,"login":"hambroperks","gravatar_id":"","url":"https://api.github.com/orgs/hambroperks","avatar_url":"https://avatars.githubusercontent.com/u/9292560?"}}
{"id":"2489397267","type":"PushEvent","actor":{"id":8132102,"login":"the-cdnjs-curator","gravatar_id":"","url":"https://api.github.com/users/the-cdnjs-curator","avatar_url":"https://avatars.githubusercontent.com/u/8132102?"},"repo":{"id":18663590,"name":"cdnjs/new-website","url":"https://api.github.com/repos/cdnjs/new-website"},"payload":{"push_id":536752875,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"5ba7b04046ce0a6421ebdb04d954baa39128b42d","before":"d8e84baf664dde8025c7c00f177fc681c60a405d","commits":[{"sha":"5ba7b04046ce0a6421ebdb04d954baa39128b42d","author":{"email":"a81c8330dae20b275f250c899f16a97692457035@gmail.com","name":"the-cdnjs-curator"},"message":"added ner files","distinct":true,"url":"https://api.github.com/repos/cdnjs/new-website/commits/5ba7b04046ce0a6421ebdb04d954baa39128b42d"}]},"public":true,"created_at":"2015-01-01T01:03:12Z","org":{"id":637362,"login":"cdnjs","gravatar_id":"","url":"https://api.github.com/orgs/cdnjs","avatar_url":"https://avatars.githubusercontent.com/u/637362?"}}
{"id":"2489397278","type":"CreateEvent","actor":{"id":616495,"login":"harveyt","gravatar_id":"","url":"https://api.github.com/users/harveyt","avatar_url":"https://avatars.githubusercontent.com/u/616495?"},"repo":{"id":28677911,"name":"harveyt/harveyt.github.io","url":"https://api.github.com/repos/harveyt/harveyt.github.io"},"payload":{"ref":"master","ref_type":"branch","master_branch":"source","description":"Personal webpage for Harvey Thompson","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:03:13Z"}
{"id":"2489397279","type":"GollumEvent","actor":{"id":7797609,"login":"ivanwfr","gravatar_id":"","url":"https://api.github.com/users/ivanwfr","avatar_url":"https://avatars.githubusercontent.com/u/7797609?"},"repo":{"id":808316,"name":"cswetenham/tabspace2.1","url":"https://api.github.com/repos/cswetenham/tabspace2.1"},"payload":{"pages":[{"page_name":"Home","title":"Home","summary":null,"action":"edited","sha":"685d71e9099c3e471f9a9a4917a16a52e89582f7","html_url":"https://github.com/cswetenham/tabspace2.1/wiki/Home"}]},"public":true,"created_at":"2015-01-01T01:03:13Z"}
{"id":"2489397280","type":"IssueCommentEvent","actor":{"id":778068,"login":"snarfed","gravatar_id":"","url":"https://api.github.com/users/snarfed","avatar_url":"https://avatars.githubusercontent.com/u/778068?"},"repo":{"id":2968000,"name":"snarfed/bridgy","url":"https://api.github.com/repos/snarfed/bridgy"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/snarfed/bridgy/issues/315","labels_url":"https://api.github.com/repos/snarfed/bridgy/issues/315/labels{/name}","comments_url":"https://api.github.com/repos/snarfed/bridgy/issues/315/comments","events_url":"https://api.github.com/repos/snarfed/bridgy/issues/315/events","html_url":"https://github.com/snarfed/bridgy/issues/315","id":51612550,"number":315,"title":"char encoding bug while discovering webmention endpoint for teriiehina.net","user":{"login":"snarfed","id":778068,"avatar_url":"https://avatars.githubusercontent.com/u/778068?v=3","gravatar_id":"","url":"https://api.github.com/users/snarfed","html_url":"https://github.com/snarfed","followers_url":"https://api.github.com/users/snarfed/followers","following_url":"https://api.github.com/users/snarfed/following{/other_user}","gists_url":"https://api.github.com/users/snarfed/gists{/gist_id}","starred_url":"https://api.github.com/users/snarfed/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/snarfed/subscriptions","organizations_url":"https://api.github.com/users/snarfed/orgs","repos_url":"https://api.github.com/users/snarfed/repos","events_url":"https://api.github.com/users/snarfed/events{/privacy}","received_events_url":"https://api.github.com/users/snarfed/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/snarfed/bridgy/labels/listen","name":"listen","color":"207de5"},{"url":"https://api.github.com/repos/snarfed/bridgy/labels/now","name":"now","color":"009800"}],"state":"closed","locked":false,"assignee":{"login":"kylewm","id":950127,"avatar_url":"https://avatars.g
ithubusercontent.com/u/950127?v=3","gravatar_id":"","url":"https://api.github.com/users/kylewm","html_url":"https://github.com/kylewm","followers_url":"https://api.github.com/users/kylewm/followers","following_url":"https://api.github.com/users/kylewm/following{/other_user}","gists_url":"https://api.github.com/users/kylewm/gists{/gist_id}","starred_url":"https://api.github.com/users/kylewm/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/kylewm/subscriptions","organizations_url":"https://api.github.com/users/kylewm/orgs","repos_url":"https://api.github.com/users/kylewm/repos","events_url":"https://api.github.com/users/kylewm/events{/privacy}","received_events_url":"https://api.github.com/users/kylewm/received_events","type":"User","site_admin":false},"milestone":null,"comments":20,"created_at":"2014-12-10T21:20:17Z","updated_at":"2015-01-01T01:03:13Z","closed_at":"2015-01-01T00:49:46Z","body":"[log](https://www.brid.gy/log?start_time=1418245934&key=aglzfmJyaWQtZ3lyNQsSCFJlc3BvbnNlIid0YWc6dHdpdHRlci5jb20sMjAxMzo1NDI3MjY5MzQ4ODc1NDI3ODQM):\r\n\r\n```py\r\nStarting Response comment tag:twitter.com,2013:542726934887542784 https://twitter.com/teriiehina/status/542726934887542784\r\nWebmention from https://brid-gy.appspot.com/comment/twitter/elfpavlik/541974355010650112/542726934887542784 to http://www.teriiehina.net/\r\nSending...\r\nStarting new HTTP connection (1): www.teriiehina.net\r\n\"GET / HTTP/1.1\" 200 None\r\nTraceback (most recent call last):\r\n File \"/base/data/home/apps/s~brid-gy/3.380705500338596153/tasks.py\", line 494, in do_send_webmentions\r\n  if not mention.send(timeout=999):\r\n File \"/base/data/home/apps/s~brid-gy/3.380705500338596153/webmention-tools/webmentiontools/send.py\", line 24, in send\r\n  self._discoverEndpoint()\r\n File \"/base/data/home/apps/s~brid-gy/3.380705500338596153/webmention-tools/webmentiontools/send.py\", line 60, in _discoverEndpoint\r\n  soup = BeautifulSoup(self.html)\r\n File 
\"/base/data/home/apps/s~brid-gy/3.380705500338596153/activitystreams/beautifulsoup/bs4/__init__.py\", line 167, in __init__\r\n  if os.path.exists(markup):\r\n File \"/base/data/home/runtimes/python27/python27_dist/lib/python2.7/genericpath.py\", line 18, in exists\r\n  os.stat(path)\r\nUnicodeEncodeError: 'ascii' codec can't encode characters in position 0-2: ordinal not in range(128)```"},"comment":{"url":"https://api.github.com/repos/snarfed/bridgy/issues/comments/68477279","html_url":"https://github.com/snarfed/bridgy/issues/315#issuecomment-68477279","issue_url":"https://api.github.com/repos/snarfed/bridgy/issues/315","id":68477279,"user":{"login":"snarfed","id":778068,"avatar_url":"https://avatars.githubusercontent.com/u/778068?v=3","gravatar_id":"","url":"https://api.github.com/users/snarfed","html_url":"https://github.com/snarfed","followers_url":"https://api.github.com/users/snarfed/followers","following_url":"https://api.github.com/users/snarfed/following{/other_user}","gists_url":"https://api.github.com/users/snarfed/gists{/gist_id}","starred_url":"https://api.github.com/users/snarfed/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/snarfed/subscriptions","organizations_url":"https://api.github.com/users/snarfed/orgs","repos_url":"https://api.github.com/users/snarfed/repos","events_url":"https://api.github.com/users/snarfed/events{/privacy}","received_events_url":"https://api.github.com/users/snarfed/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:03:13Z","updated_at":"2015-01-01T01:03:13Z","body":"awesome! nice work, especially for including the test. serious brownie points for that. thank you!\n\nwant to push this? I won't touch prod the rest of the day, so all clear if you want."}},"public":true,"created_at":"2015-01-01T01:03:13Z"}
{"id":"2489397283","type":"WatchEvent","actor":{"id":3889660,"login":"coder-chenzhi","gravatar_id":"","url":"https://api.github.com/users/coder-chenzhi","avatar_url":"https://avatars.githubusercontent.com/u/3889660?"},"repo":{"id":15045751,"name":"docker/fig","url":"https://api.github.com/repos/docker/fig"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:03:13Z","org":{"id":5429470,"login":"docker","gravatar_id":"","url":"https://api.github.com/orgs/docker","avatar_url":"https://avatars.githubusercontent.com/u/5429470?"}}
{"id":"2489397287","type":"PullRequestReviewCommentEvent","actor":{"id":663212,"login":"tdas","gravatar_id":"","url":"https://api.github.com/users/tdas","avatar_url":"https://avatars.githubusercontent.com/u/663212?"},"repo":{"id":17165658,"name":"apache/spark","url":"https://api.github.com/repos/apache/spark"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/apache/spark/pulls/comments/22397269","id":22397269,"diff_hunk":"@@ -17,31 +17,65 @@\n \n package org.apache.spark.streaming.mqtt\n \n-import org.scalatest.FunSuite\n-\n+import org.scalatest.{BeforeAndAfter, FunSuite}\n+import org.scalatest.concurrent.Eventually\n+import scala.concurrent.duration._\n import org.apache.spark.streaming.{Seconds, StreamingContext}\n import org.apache.spark.storage.StorageLevel\n import org.apache.spark.streaming.dstream.ReceiverInputDStream\n+import org.eclipse.paho.client.mqttv3._\n+import org.eclipse.paho.client.mqttv3.persist.MqttDefaultFilePersistence\n \n-class MQTTStreamSuite extends FunSuite {\n-\n-  val batchDuration = Seconds(1)\n+class MQTTStreamSuite extends FunSuite with Eventually with BeforeAndAfter {\n \n+  private val batchDuration = Seconds(1)\n   private val master: String = \"local[2]\"\n-\n   private val framework: String = this.getClass.getSimpleName\n+  private val brokerUrl = 
\"tcp://localhost:1883\"","path":"external/mqtt/src/test/scala/org/apache/spark/streaming/mqtt/MQTTStreamSuite.scala","position":24,"original_position":24,"commit_id":"fc8eb286db6aa8e78a567537996011f554eed969","original_commit_id":"fc8eb286db6aa8e78a567537996011f554eed969","user":{"login":"tdas","id":663212,"avatar_url":"https://avatars.githubusercontent.com/u/663212?v=3","gravatar_id":"","url":"https://api.github.com/users/tdas","html_url":"https://github.com/tdas","followers_url":"https://api.github.com/users/tdas/followers","following_url":"https://api.github.com/users/tdas/following{/other_user}","gists_url":"https://api.github.com/users/tdas/gists{/gist_id}","starred_url":"https://api.github.com/users/tdas/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/tdas/subscriptions","organizations_url":"https://api.github.com/users/tdas/orgs","repos_url":"https://api.github.com/users/tdas/repos","events_url":"https://api.github.com/users/tdas/events{/privacy}","received_events_url":"https://api.github.com/users/tdas/received_events","type":"User","site_admin":false},"body":"Who is running the broker? Also this port is hardcoded. There is a small, non-trivial chance that this port may not be free (in Jenkins, where multiple series of test maybe running in parallel) causing the server to not bind thus failing test. 
Can you find a free port (see [FlumeStreamSuite](https://github.com/apache/spark/blob/master/external/flume/src/test/scala/org/apache/spark/streaming/flume/FlumeStreamSuite.scala#L78)) and use that instead?","created_at":"2015-01-01T01:03:14Z","updated_at":"2015-01-01T01:03:14Z","html_url":"https://github.com/apache/spark/pull/3844#discussion_r22397269","pull_request_url":"https://api.github.com/repos/apache/spark/pulls/3844","_links":{"self":{"href":"https://api.github.com/repos/apache/spark/pulls/comments/22397269"},"html":{"href":"https://github.com/apache/spark/pull/3844#discussion_r22397269"},"pull_request":{"href":"https://api.github.com/repos/apache/spark/pulls/3844"}}},"pull_request":{"url":"https://api.github.com/repos/apache/spark/pulls/3844","id":26684823,"html_url":"https://github.com/apache/spark/pull/3844","diff_url":"https://github.com/apache/spark/pull/3844.diff","patch_url":"https://github.com/apache/spark/pull/3844.patch","issue_url":"https://api.github.com/repos/apache/spark/issues/3844","number":3844,"state":"open","locked":false,"title":"[SPARK-4631] unit test for MQTT","user":{"login":"Bilna","id":7123586,"avatar_url":"https://avatars.githubusercontent.com/u/7123586?v=3","gravatar_id":"","url":"https://api.github.com/users/Bilna","html_url":"https://github.com/Bilna","followers_url":"https://api.github.com/users/Bilna/followers","following_url":"https://api.github.com/users/Bilna/following{/other_user}","gists_url":"https://api.github.com/users/Bilna/gists{/gist_id}","starred_url":"https://api.github.com/users/Bilna/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Bilna/subscriptions","organizations_url":"https://api.github.com/users/Bilna/orgs","repos_url":"https://api.github.com/users/Bilna/repos","events_url":"https://api.github.com/users/Bilna/events{/privacy}","received_events_url":"https://api.github.com/users/Bilna/received_events","type":"User","site_admin":false},"body":"Please review the unit test for 
MQTT","created_at":"2014-12-30T13:12:33Z","updated_at":"2015-01-01T01:03:14Z","closed_at":null,"merged_at":null,"merge_commit_sha":"78f53f74b7089734c2cc3a2f701e6044194cda1d","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/apache/spark/pulls/3844/commits","review_comments_url":"https://api.github.com/repos/apache/spark/pulls/3844/comments","review_comment_url":"https://api.github.com/repos/apache/spark/pulls/comments/{number}","comments_url":"https://api.github.com/repos/apache/spark/issues/3844/comments","statuses_url":"https://api.github.com/repos/apache/spark/statuses/fc8eb286db6aa8e78a567537996011f554eed969","head":{"label":"Bilna:master","ref":"master","sha":"fc8eb286db6aa8e78a567537996011f554eed969","user":{"login":"Bilna","id":7123586,"avatar_url":"https://avatars.githubusercontent.com/u/7123586?v=3","gravatar_id":"","url":"https://api.github.com/users/Bilna","html_url":"https://github.com/Bilna","followers_url":"https://api.github.com/users/Bilna/followers","following_url":"https://api.github.com/users/Bilna/following{/other_user}","gists_url":"https://api.github.com/users/Bilna/gists{/gist_id}","starred_url":"https://api.github.com/users/Bilna/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Bilna/subscriptions","organizations_url":"https://api.github.com/users/Bilna/orgs","repos_url":"https://api.github.com/users/Bilna/repos","events_url":"https://api.github.com/users/Bilna/events{/privacy}","received_events_url":"https://api.github.com/users/Bilna/received_events","type":"User","site_admin":false},"repo":{"id":28630516,"name":"spark","full_name":"Bilna/spark","owner":{"login":"Bilna","id":7123586,"avatar_url":"https://avatars.githubusercontent.com/u/7123586?v=3","gravatar_id":"","url":"https://api.github.com/users/Bilna","html_url":"https://github.com/Bilna","followers_url":"https://api.github.com/users/Bilna/followers","following_url":"https://api.github.com/users/Bilna/following{/other_user}","gists_u
rl":"https://api.github.com/users/Bilna/gists{/gist_id}","starred_url":"https://api.github.com/users/Bilna/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Bilna/subscriptions","organizations_url":"https://api.github.com/users/Bilna/orgs","repos_url":"https://api.github.com/users/Bilna/repos","events_url":"https://api.github.com/users/Bilna/events{/privacy}","received_events_url":"https://api.github.com/users/Bilna/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/Bilna/spark","description":"Mirror of Apache Spark","fork":true,"url":"https://api.github.com/repos/Bilna/spark","forks_url":"https://api.github.com/repos/Bilna/spark/forks","keys_url":"https://api.github.com/repos/Bilna/spark/keys{/key_id}","collaborators_url":"https://api.github.com/repos/Bilna/spark/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/Bilna/spark/teams","hooks_url":"https://api.github.com/repos/Bilna/spark/hooks","issue_events_url":"https://api.github.com/repos/Bilna/spark/issues/events{/number}","events_url":"https://api.github.com/repos/Bilna/spark/events","assignees_url":"https://api.github.com/repos/Bilna/spark/assignees{/user}","branches_url":"https://api.github.com/repos/Bilna/spark/branches{/branch}","tags_url":"https://api.github.com/repos/Bilna/spark/tags","blobs_url":"https://api.github.com/repos/Bilna/spark/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/Bilna/spark/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/Bilna/spark/git/refs{/sha}","trees_url":"https://api.github.com/repos/Bilna/spark/git/trees{/sha}","statuses_url":"https://api.github.com/repos/Bilna/spark/statuses/{sha}","languages_url":"https://api.github.com/repos/Bilna/spark/languages","stargazers_url":"https://api.github.com/repos/Bilna/spark/stargazers","contributors_url":"https://api.github.com/repos/Bilna/spark/contributors","subscribers_url":"https://api.github.com/repos/Bilna/spark/subscri
bers","subscription_url":"https://api.github.com/repos/Bilna/spark/subscription","commits_url":"https://api.github.com/repos/Bilna/spark/commits{/sha}","git_commits_url":"https://api.github.com/repos/Bilna/spark/git/commits{/sha}","comments_url":"https://api.github.com/repos/Bilna/spark/comments{/number}","issue_comment_url":"https://api.github.com/repos/Bilna/spark/issues/comments/{number}","contents_url":"https://api.github.com/repos/Bilna/spark/contents/{+path}","compare_url":"https://api.github.com/repos/Bilna/spark/compare/{base}...{head}","merges_url":"https://api.github.com/repos/Bilna/spark/merges","archive_url":"https://api.github.com/repos/Bilna/spark/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/Bilna/spark/downloads","issues_url":"https://api.github.com/repos/Bilna/spark/issues{/number}","pulls_url":"https://api.github.com/repos/Bilna/spark/pulls{/number}","milestones_url":"https://api.github.com/repos/Bilna/spark/milestones{/number}","notifications_url":"https://api.github.com/repos/Bilna/spark/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/Bilna/spark/labels{/name}","releases_url":"https://api.github.com/repos/Bilna/spark/releases{/id}","created_at":"2014-12-30T12:47:01Z","updated_at":"2014-12-31T09:52:36Z","pushed_at":"2014-12-31T09:52:35Z","git_url":"git://github.com/Bilna/spark.git","ssh_url":"git@github.com:Bilna/spark.git","clone_url":"https://github.com/Bilna/spark.git","svn_url":"https://github.com/Bilna/spark","homepage":null,"size":87823,"stargazers_count":1,"watchers_count":1,"language":"Scala","has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":1,"default_branch":"master"}},"base":{"label":"apache:master","ref":"master","sha":"352ed6bbe3c3b67e52e298e7c535ae414d96beca","user":{"login":"apache","id":47359,"avatar_url":"https://avatars.githubusercontent.com/u/47359?v=3",
"gravatar_id":"","url":"https://api.github.com/users/apache","html_url":"https://github.com/apache","followers_url":"https://api.github.com/users/apache/followers","following_url":"https://api.github.com/users/apache/following{/other_user}","gists_url":"https://api.github.com/users/apache/gists{/gist_id}","starred_url":"https://api.github.com/users/apache/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/apache/subscriptions","organizations_url":"https://api.github.com/users/apache/orgs","repos_url":"https://api.github.com/users/apache/repos","events_url":"https://api.github.com/users/apache/events{/privacy}","received_events_url":"https://api.github.com/users/apache/received_events","type":"Organization","site_admin":false},"repo":{"id":17165658,"name":"spark","full_name":"apache/spark","owner":{"login":"apache","id":47359,"avatar_url":"https://avatars.githubusercontent.com/u/47359?v=3","gravatar_id":"","url":"https://api.github.com/users/apache","html_url":"https://github.com/apache","followers_url":"https://api.github.com/users/apache/followers","following_url":"https://api.github.com/users/apache/following{/other_user}","gists_url":"https://api.github.com/users/apache/gists{/gist_id}","starred_url":"https://api.github.com/users/apache/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/apache/subscriptions","organizations_url":"https://api.github.com/users/apache/orgs","repos_url":"https://api.github.com/users/apache/repos","events_url":"https://api.github.com/users/apache/events{/privacy}","received_events_url":"https://api.github.com/users/apache/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/apache/spark","description":"Mirror of Apache 
Spark","fork":false,"url":"https://api.github.com/repos/apache/spark","forks_url":"https://api.github.com/repos/apache/spark/forks","keys_url":"https://api.github.com/repos/apache/spark/keys{/key_id}","collaborators_url":"https://api.github.com/repos/apache/spark/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/apache/spark/teams","hooks_url":"https://api.github.com/repos/apache/spark/hooks","issue_events_url":"https://api.github.com/repos/apache/spark/issues/events{/number}","events_url":"https://api.github.com/repos/apache/spark/events","assignees_url":"https://api.github.com/repos/apache/spark/assignees{/user}","branches_url":"https://api.github.com/repos/apache/spark/branches{/branch}","tags_url":"https://api.github.com/repos/apache/spark/tags","blobs_url":"https://api.github.com/repos/apache/spark/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/apache/spark/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/apache/spark/git/refs{/sha}","trees_url":"https://api.github.com/repos/apache/spark/git/trees{/sha}","statuses_url":"https://api.github.com/repos/apache/spark/statuses/{sha}","languages_url":"https://api.github.com/repos/apache/spark/languages","stargazers_url":"https://api.github.com/repos/apache/spark/stargazers","contributors_url":"https://api.github.com/repos/apache/spark/contributors","subscribers_url":"https://api.github.com/repos/apache/spark/subscribers","subscription_url":"https://api.github.com/repos/apache/spark/subscription","commits_url":"https://api.github.com/repos/apache/spark/commits{/sha}","git_commits_url":"https://api.github.com/repos/apache/spark/git/commits{/sha}","comments_url":"https://api.github.com/repos/apache/spark/comments{/number}","issue_comment_url":"https://api.github.com/repos/apache/spark/issues/comments/{number}","contents_url":"https://api.github.com/repos/apache/spark/contents/{+path}","compare_url":"https://api.github.com/repos/apache/spark/compare/{base}...{head}","merges_
url":"https://api.github.com/repos/apache/spark/merges","archive_url":"https://api.github.com/repos/apache/spark/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/apache/spark/downloads","issues_url":"https://api.github.com/repos/apache/spark/issues{/number}","pulls_url":"https://api.github.com/repos/apache/spark/pulls{/number}","milestones_url":"https://api.github.com/repos/apache/spark/milestones{/number}","notifications_url":"https://api.github.com/repos/apache/spark/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/apache/spark/labels{/name}","releases_url":"https://api.github.com/repos/apache/spark/releases{/id}","created_at":"2014-02-25T08:00:08Z","updated_at":"2015-01-01T00:59:33Z","pushed_at":"2015-01-01T00:59:33Z","git_url":"git://github.com/apache/spark.git","ssh_url":"git@github.com:apache/spark.git","clone_url":"https://github.com/apache/spark.git","svn_url":"https://github.com/apache/spark","homepage":null,"size":1083068,"stargazers_count":2458,"watchers_count":2458,"language":"Scala","has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":2179,"mirror_url":"git://git.apache.org/spark.git","open_issues_count":268,"forks":2179,"open_issues":268,"watchers":2458,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/apache/spark/pulls/3844"},"html":{"href":"https://github.com/apache/spark/pull/3844"},"issue":{"href":"https://api.github.com/repos/apache/spark/issues/3844"},"comments":{"href":"https://api.github.com/repos/apache/spark/issues/3844/comments"},"review_comments":{"href":"https://api.github.com/repos/apache/spark/pulls/3844/comments"},"review_comment":{"href":"https://api.github.com/repos/apache/spark/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/apache/spark/pulls/3844/commits"},"statuses":{"href":"https://api.github.com/repos/apache/spark/statuses/fc8eb286db6aa8e78a567537996011f554eed969"}}}},"public":tr
ue,"created_at":"2015-01-01T01:03:14Z","org":{"id":47359,"login":"apache","gravatar_id":"","url":"https://api.github.com/orgs/apache","avatar_url":"https://avatars.githubusercontent.com/u/47359?"}}
{"id":"2489397290","type":"PullRequestEvent","actor":{"id":4276679,"login":"robot-dreams","gravatar_id":"","url":"https://api.github.com/users/robot-dreams","avatar_url":"https://avatars.githubusercontent.com/u/4276679?"},"repo":{"id":25705676,"name":"machine-intelligence/research-forum","url":"https://api.github.com/repos/machine-intelligence/research-forum"},"payload":{"action":"closed","number":62,"pull_request":{"url":"https://api.github.com/repos/machine-intelligence/research-forum/pulls/62","id":26712730,"html_url":"https://github.com/machine-intelligence/research-forum/pull/62","diff_url":"https://github.com/machine-intelligence/research-forum/pull/62.diff","patch_url":"https://github.com/machine-intelligence/research-forum/pull/62.patch","issue_url":"https://api.github.com/repos/machine-intelligence/research-forum/issues/62","number":62,"state":"closed","locked":false,"title":"Feature/look and feel","user":{"login":"robot-dreams","id":4276679,"avatar_url":"https://avatars.githubusercontent.com/u/4276679?v=3","gravatar_id":"","url":"https://api.github.com/users/robot-dreams","html_url":"https://github.com/robot-dreams","followers_url":"https://api.github.com/users/robot-dreams/followers","following_url":"https://api.github.com/users/robot-dreams/following{/other_user}","gists_url":"https://api.github.com/users/robot-dreams/gists{/gist_id}","starred_url":"https://api.github.com/users/robot-dreams/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/robot-dreams/subscriptions","organizations_url":"https://api.github.com/users/robot-dreams/orgs","repos_url":"https://api.github.com/users/robot-dreams/repos","events_url":"https://api.github.com/users/robot-dreams/events{/privacy}","received_events_url":"https://api.github.com/users/robot-dreams/received_events","type":"User","site_admin":false},"body":"","created_at":"2014-12-31T02:03:18Z","updated_at":"2015-01-01T01:03:14Z","closed_at":"2015-01-01T01:03:14Z","merged_at":"2015-01-01T01:03:14Z"
,"merge_commit_sha":"6a6cdb34b95036fe523e7c90643ed5d3e278e2b8","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/machine-intelligence/research-forum/pulls/62/commits","review_comments_url":"https://api.github.com/repos/machine-intelligence/research-forum/pulls/62/comments","review_comment_url":"https://api.github.com/repos/machine-intelligence/research-forum/pulls/comments/{number}","comments_url":"https://api.github.com/repos/machine-intelligence/research-forum/issues/62/comments","statuses_url":"https://api.github.com/repos/machine-intelligence/research-forum/statuses/f50826580c1451f8724025ba97df13b45d3a827c","head":{"label":"machine-intelligence:feature/look-and-feel","ref":"feature/look-and-feel","sha":"f50826580c1451f8724025ba97df13b45d3a827c","user":{"login":"machine-intelligence","id":7153909,"avatar_url":"https://avatars.githubusercontent.com/u/7153909?v=3","gravatar_id":"","url":"https://api.github.com/users/machine-intelligence","html_url":"https://github.com/machine-intelligence","followers_url":"https://api.github.com/users/machine-intelligence/followers","following_url":"https://api.github.com/users/machine-intelligence/following{/other_user}","gists_url":"https://api.github.com/users/machine-intelligence/gists{/gist_id}","starred_url":"https://api.github.com/users/machine-intelligence/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/machine-intelligence/subscriptions","organizations_url":"https://api.github.com/users/machine-intelligence/orgs","repos_url":"https://api.github.com/users/machine-intelligence/repos","events_url":"https://api.github.com/users/machine-intelligence/events{/privacy}","received_events_url":"https://api.github.com/users/machine-intelligence/received_events","type":"Organization","site_admin":false},"repo":{"id":25705676,"name":"research-forum","full_name":"machine-intelligence/research-forum","owner":{"login":"machine-intelligence","id":7153909,"avatar_url":"https://avatars.git
hubusercontent.com/u/7153909?v=3","gravatar_id":"","url":"https://api.github.com/users/machine-intelligence","html_url":"https://github.com/machine-intelligence","followers_url":"https://api.github.com/users/machine-intelligence/followers","following_url":"https://api.github.com/users/machine-intelligence/following{/other_user}","gists_url":"https://api.github.com/users/machine-intelligence/gists{/gist_id}","starred_url":"https://api.github.com/users/machine-intelligence/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/machine-intelligence/subscriptions","organizations_url":"https://api.github.com/users/machine-intelligence/orgs","repos_url":"https://api.github.com/users/machine-intelligence/repos","events_url":"https://api.github.com/users/machine-intelligence/events{/privacy}","received_events_url":"https://api.github.com/users/machine-intelligence/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/machine-intelligence/research-forum","description":"","fork":false,"url":"https://api.github.com/repos/machine-intelligence/research-forum","forks_url":"https://api.github.com/repos/machine-intelligence/research-forum/forks","keys_url":"https://api.github.com/repos/machine-intelligence/research-forum/keys{/key_id}","collaborators_url":"https://api.github.com/repos/machine-intelligence/research-forum/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/machine-intelligence/research-forum/teams","hooks_url":"https://api.github.com/repos/machine-intelligence/research-forum/hooks","issue_events_url":"https://api.github.com/repos/machine-intelligence/research-forum/issues/events{/number}","events_url":"https://api.github.com/repos/machine-intelligence/research-forum/events","assignees_url":"https://api.github.com/repos/machine-intelligence/research-forum/assignees{/user}","branches_url":"https://api.github.com/repos/machine-intelligence/research-forum/branches{/branch}","tags_u
rl":"https://api.github.com/repos/machine-intelligence/research-forum/tags","blobs_url":"https://api.github.com/repos/machine-intelligence/research-forum/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/machine-intelligence/research-forum/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/machine-intelligence/research-forum/git/refs{/sha}","trees_url":"https://api.github.com/repos/machine-intelligence/research-forum/git/trees{/sha}","statuses_url":"https://api.github.com/repos/machine-intelligence/research-forum/statuses/{sha}","languages_url":"https://api.github.com/repos/machine-intelligence/research-forum/languages","stargazers_url":"https://api.github.com/repos/machine-intelligence/research-forum/stargazers","contributors_url":"https://api.github.com/repos/machine-intelligence/research-forum/contributors","subscribers_url":"https://api.github.com/repos/machine-intelligence/research-forum/subscribers","subscription_url":"https://api.github.com/repos/machine-intelligence/research-forum/subscription","commits_url":"https://api.github.com/repos/machine-intelligence/research-forum/commits{/sha}","git_commits_url":"https://api.github.com/repos/machine-intelligence/research-forum/git/commits{/sha}","comments_url":"https://api.github.com/repos/machine-intelligence/research-forum/comments{/number}","issue_comment_url":"https://api.github.com/repos/machine-intelligence/research-forum/issues/comments/{number}","contents_url":"https://api.github.com/repos/machine-intelligence/research-forum/contents/{+path}","compare_url":"https://api.github.com/repos/machine-intelligence/research-forum/compare/{base}...{head}","merges_url":"https://api.github.com/repos/machine-intelligence/research-forum/merges","archive_url":"https://api.github.com/repos/machine-intelligence/research-forum/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/machine-intelligence/research-forum/downloads","issues_url":"https://api.github.com/repos/machine-intelligenc
e/research-forum/issues{/number}","pulls_url":"https://api.github.com/repos/machine-intelligence/research-forum/pulls{/number}","milestones_url":"https://api.github.com/repos/machine-intelligence/research-forum/milestones{/number}","notifications_url":"https://api.github.com/repos/machine-intelligence/research-forum/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/machine-intelligence/research-forum/labels{/name}","releases_url":"https://api.github.com/repos/machine-intelligence/research-forum/releases{/id}","created_at":"2014-10-24T20:02:46Z","updated_at":"2014-12-16T14:48:44Z","pushed_at":"2015-01-01T01:03:14Z","git_url":"git://github.com/machine-intelligence/research-forum.git","ssh_url":"git@github.com:machine-intelligence/research-forum.git","clone_url":"https://github.com/machine-intelligence/research-forum.git","svn_url":"https://github.com/machine-intelligence/research-forum","homepage":null,"size":952,"stargazers_count":0,"watchers_count":0,"language":"Arc","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":1,"forks":0,"open_issues":1,"watchers":0,"default_branch":"master"}},"base":{"label":"machine-intelligence:master","ref":"master","sha":"72d4a081a5635cc218e2940e9d0f136eb4dd53e4","user":{"login":"machine-intelligence","id":7153909,"avatar_url":"https://avatars.githubusercontent.com/u/7153909?v=3","gravatar_id":"","url":"https://api.github.com/users/machine-intelligence","html_url":"https://github.com/machine-intelligence","followers_url":"https://api.github.com/users/machine-intelligence/followers","following_url":"https://api.github.com/users/machine-intelligence/following{/other_user}","gists_url":"https://api.github.com/users/machine-intelligence/gists{/gist_id}","starred_url":"https://api.github.com/users/machine-intelligence/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/machine-intelligence/subscriptions","organi
zations_url":"https://api.github.com/users/machine-intelligence/orgs","repos_url":"https://api.github.com/users/machine-intelligence/repos","events_url":"https://api.github.com/users/machine-intelligence/events{/privacy}","received_events_url":"https://api.github.com/users/machine-intelligence/received_events","type":"Organization","site_admin":false},"repo":{"id":25705676,"name":"research-forum","full_name":"machine-intelligence/research-forum","owner":{"login":"machine-intelligence","id":7153909,"avatar_url":"https://avatars.githubusercontent.com/u/7153909?v=3","gravatar_id":"","url":"https://api.github.com/users/machine-intelligence","html_url":"https://github.com/machine-intelligence","followers_url":"https://api.github.com/users/machine-intelligence/followers","following_url":"https://api.github.com/users/machine-intelligence/following{/other_user}","gists_url":"https://api.github.com/users/machine-intelligence/gists{/gist_id}","starred_url":"https://api.github.com/users/machine-intelligence/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/machine-intelligence/subscriptions","organizations_url":"https://api.github.com/users/machine-intelligence/orgs","repos_url":"https://api.github.com/users/machine-intelligence/repos","events_url":"https://api.github.com/users/machine-intelligence/events{/privacy}","received_events_url":"https://api.github.com/users/machine-intelligence/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/machine-intelligence/research-forum","description":"","fork":false,"url":"https://api.github.com/repos/machine-intelligence/research-forum","forks_url":"https://api.github.com/repos/machine-intelligence/research-forum/forks","keys_url":"https://api.github.com/repos/machine-intelligence/research-forum/keys{/key_id}","collaborators_url":"https://api.github.com/repos/machine-intelligence/research-forum/collaborators{/collaborator}","teams_url":"https://api.github.com/r
epos/machine-intelligence/research-forum/teams","hooks_url":"https://api.github.com/repos/machine-intelligence/research-forum/hooks","issue_events_url":"https://api.github.com/repos/machine-intelligence/research-forum/issues/events{/number}","events_url":"https://api.github.com/repos/machine-intelligence/research-forum/events","assignees_url":"https://api.github.com/repos/machine-intelligence/research-forum/assignees{/user}","branches_url":"https://api.github.com/repos/machine-intelligence/research-forum/branches{/branch}","tags_url":"https://api.github.com/repos/machine-intelligence/research-forum/tags","blobs_url":"https://api.github.com/repos/machine-intelligence/research-forum/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/machine-intelligence/research-forum/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/machine-intelligence/research-forum/git/refs{/sha}","trees_url":"https://api.github.com/repos/machine-intelligence/research-forum/git/trees{/sha}","statuses_url":"https://api.github.com/repos/machine-intelligence/research-forum/statuses/{sha}","languages_url":"https://api.github.com/repos/machine-intelligence/research-forum/languages","stargazers_url":"https://api.github.com/repos/machine-intelligence/research-forum/stargazers","contributors_url":"https://api.github.com/repos/machine-intelligence/research-forum/contributors","subscribers_url":"https://api.github.com/repos/machine-intelligence/research-forum/subscribers","subscription_url":"https://api.github.com/repos/machine-intelligence/research-forum/subscription","commits_url":"https://api.github.com/repos/machine-intelligence/research-forum/commits{/sha}","git_commits_url":"https://api.github.com/repos/machine-intelligence/research-forum/git/commits{/sha}","comments_url":"https://api.github.com/repos/machine-intelligence/research-forum/comments{/number}","issue_comment_url":"https://api.github.com/repos/machine-intelligence/research-forum/issues/comments/{number}","contents_url"
:"https://api.github.com/repos/machine-intelligence/research-forum/contents/{+path}","compare_url":"https://api.github.com/repos/machine-intelligence/research-forum/compare/{base}...{head}","merges_url":"https://api.github.com/repos/machine-intelligence/research-forum/merges","archive_url":"https://api.github.com/repos/machine-intelligence/research-forum/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/machine-intelligence/research-forum/downloads","issues_url":"https://api.github.com/repos/machine-intelligence/research-forum/issues{/number}","pulls_url":"https://api.github.com/repos/machine-intelligence/research-forum/pulls{/number}","milestones_url":"https://api.github.com/repos/machine-intelligence/research-forum/milestones{/number}","notifications_url":"https://api.github.com/repos/machine-intelligence/research-forum/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/machine-intelligence/research-forum/labels{/name}","releases_url":"https://api.github.com/repos/machine-intelligence/research-forum/releases{/id}","created_at":"2014-10-24T20:02:46Z","updated_at":"2014-12-16T14:48:44Z","pushed_at":"2015-01-01T01:03:14Z","git_url":"git://github.com/machine-intelligence/research-forum.git","ssh_url":"git@github.com:machine-intelligence/research-forum.git","clone_url":"https://github.com/machine-intelligence/research-forum.git","svn_url":"https://github.com/machine-intelligence/research-forum","homepage":null,"size":952,"stargazers_count":0,"watchers_count":0,"language":"Arc","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":1,"forks":0,"open_issues":1,"watchers":0,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/machine-intelligence/research-forum/pulls/62"},"html":{"href":"https://github.com/machine-intelligence/research-forum/pull/62"},"issue":{"href":"https://api.github.com/repos/machine-intelligence/re
search-forum/issues/62"},"comments":{"href":"https://api.github.com/repos/machine-intelligence/research-forum/issues/62/comments"},"review_comments":{"href":"https://api.github.com/repos/machine-intelligence/research-forum/pulls/62/comments"},"review_comment":{"href":"https://api.github.com/repos/machine-intelligence/research-forum/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/machine-intelligence/research-forum/pulls/62/commits"},"statuses":{"href":"https://api.github.com/repos/machine-intelligence/research-forum/statuses/f50826580c1451f8724025ba97df13b45d3a827c"}},"merged":true,"mergeable":null,"mergeable_state":"unknown","merged_by":{"login":"robot-dreams","id":4276679,"avatar_url":"https://avatars.githubusercontent.com/u/4276679?v=3","gravatar_id":"","url":"https://api.github.com/users/robot-dreams","html_url":"https://github.com/robot-dreams","followers_url":"https://api.github.com/users/robot-dreams/followers","following_url":"https://api.github.com/users/robot-dreams/following{/other_user}","gists_url":"https://api.github.com/users/robot-dreams/gists{/gist_id}","starred_url":"https://api.github.com/users/robot-dreams/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/robot-dreams/subscriptions","organizations_url":"https://api.github.com/users/robot-dreams/orgs","repos_url":"https://api.github.com/users/robot-dreams/repos","events_url":"https://api.github.com/users/robot-dreams/events{/privacy}","received_events_url":"https://api.github.com/users/robot-dreams/received_events","type":"User","site_admin":false},"comments":0,"review_comments":0,"commits":2,"additions":82,"deletions":26,"changed_files":4}},"public":true,"created_at":"2015-01-01T01:03:14Z","org":{"id":7153909,"login":"machine-intelligence","gravatar_id":"","url":"https://api.github.com/orgs/machine-intelligence","avatar_url":"https://avatars.githubusercontent.com/u/7153909?"}}
{"id":"2489397291","type":"PushEvent","actor":{"id":7905778,"login":"pankajmalhotra","gravatar_id":"","url":"https://api.github.com/users/pankajmalhotra","avatar_url":"https://avatars.githubusercontent.com/u/7905778?"},"repo":{"id":22740858,"name":"ulini/ops","url":"https://api.github.com/repos/ulini/ops"},"payload":{"push_id":536752882,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1431274619c45efb20987f0a62260e85dccb48ef","before":"7d2237bdbf424692f909cae67c2a5e8c13335a38","commits":[{"sha":"1431274619c45efb20987f0a62260e85dccb48ef","author":{"email":"114151935e80b69b2f2bbc308c3a6960936b4e1a@ul.com","name":"pankajmalhotra"},"message":"Added Ruby & Make","distinct":true,"url":"https://api.github.com/repos/ulini/ops/commits/1431274619c45efb20987f0a62260e85dccb48ef"}]},"public":true,"created_at":"2015-01-01T01:03:15Z","org":{"id":6116922,"login":"ulini","gravatar_id":"","url":"https://api.github.com/orgs/ulini","avatar_url":"https://avatars.githubusercontent.com/u/6116922?"}}
{"id":"2489397293","type":"PushEvent","actor":{"id":4276679,"login":"robot-dreams","gravatar_id":"","url":"https://api.github.com/users/robot-dreams","avatar_url":"https://avatars.githubusercontent.com/u/4276679?"},"repo":{"id":25705676,"name":"machine-intelligence/research-forum","url":"https://api.github.com/repos/machine-intelligence/research-forum"},"payload":{"push_id":536752883,"size":3,"distinct_size":1,"ref":"refs/heads/master","head":"e81e3986d5db27d1c631ae46f003f4a06c61a816","before":"72d4a081a5635cc218e2940e9d0f136eb4dd53e4","commits":[{"sha":"0829853c4b6ac56bbf7beee570b7b279fc02ae0e","author":{"email":"f44b7b9bbcd65117b7d5272f0703ff2e82101e98@gmail.com","name":"Malo Bourgon"},"message":"Improved look and feel (thanks Brent!)","distinct":false,"url":"https://api.github.com/repos/machine-intelligence/research-forum/commits/0829853c4b6ac56bbf7beee570b7b279fc02ae0e"},{"sha":"f50826580c1451f8724025ba97df13b45d3a827c","author":{"email":"f63b26569c1369b3dd67f2a7834b6651712fe1d3@gmail.com","name":"Elliott Jin"},"message":"Content-length -> Content-Length, remove trailing whitespace","distinct":false,"url":"https://api.github.com/repos/machine-intelligence/research-forum/commits/f50826580c1451f8724025ba97df13b45d3a827c"},{"sha":"e81e3986d5db27d1c631ae46f003f4a06c61a816","author":{"email":"f63b26569c1369b3dd67f2a7834b6651712fe1d3@gmail.com","name":"robot-dreams"},"message":"Merge pull request #62 from machine-intelligence/feature/look-and-feel\n\nFeature/look and feel","distinct":true,"url":"https://api.github.com/repos/machine-intelligence/research-forum/commits/e81e3986d5db27d1c631ae46f003f4a06c61a816"}]},"public":true,"created_at":"2015-01-01T01:03:15Z","org":{"id":7153909,"login":"machine-intelligence","gravatar_id":"","url":"https://api.github.com/orgs/machine-intelligence","avatar_url":"https://avatars.githubusercontent.com/u/7153909?"}}
{"id":"2489397296","type":"IssueCommentEvent","actor":{"id":3203500,"login":"aaroncrawford","gravatar_id":"","url":"https://api.github.com/users/aaroncrawford","avatar_url":"https://avatars.githubusercontent.com/u/3203500?"},"repo":{"id":8170346,"name":"artberri/sidr","url":"https://api.github.com/repos/artberri/sidr"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/artberri/sidr/issues/4","labels_url":"https://api.github.com/repos/artberri/sidr/issues/4/labels{/name}","comments_url":"https://api.github.com/repos/artberri/sidr/issues/4/comments","events_url":"https://api.github.com/repos/artberri/sidr/issues/4/events","html_url":"https://github.com/artberri/sidr/issues/4","id":12322955,"number":4,"title":"Choppy animation","user":{"login":"jdifelice","id":3942185,"avatar_url":"https://avatars.githubusercontent.com/u/3942185?v=3","gravatar_id":"","url":"https://api.github.com/users/jdifelice","html_url":"https://github.com/jdifelice","followers_url":"https://api.github.com/users/jdifelice/followers","following_url":"https://api.github.com/users/jdifelice/following{/other_user}","gists_url":"https://api.github.com/users/jdifelice/gists{/gist_id}","starred_url":"https://api.github.com/users/jdifelice/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jdifelice/subscriptions","organizations_url":"https://api.github.com/users/jdifelice/orgs","repos_url":"https://api.github.com/users/jdifelice/repos","events_url":"https://api.github.com/users/jdifelice/events{/privacy}","received_events_url":"https://api.github.com/users/jdifelice/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/artberri/sidr/labels/enhancement","name":"enhancement","color":"84b6eb"}],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":11,"created_at":"2013-03-22T15:08:36Z","updated_at":"2015-01-01T01:03:15Z","closed_at":null,"body":"Nice work on the plugin.  
I have noticed, however, that the sliding animation is choppy.  Is there a way to make it more smooth?  Is there an option I've missed?\r\n\r\nI am running the plugin within a PhoneGap build on an iPhone 5 running iOS 6.1.2, but it's choppy even when viewed in desktop Chrome v20.0.1132.47.\r\n\r\nThanks."},"comment":{"url":"https://api.github.com/repos/artberri/sidr/issues/comments/68477281","html_url":"https://github.com/artberri/sidr/issues/4#issuecomment-68477281","issue_url":"https://api.github.com/repos/artberri/sidr/issues/4","id":68477281,"user":{"login":"aaroncrawford","id":3203500,"avatar_url":"https://avatars.githubusercontent.com/u/3203500?v=3","gravatar_id":"","url":"https://api.github.com/users/aaroncrawford","html_url":"https://github.com/aaroncrawford","followers_url":"https://api.github.com/users/aaroncrawford/followers","following_url":"https://api.github.com/users/aaroncrawford/following{/other_user}","gists_url":"https://api.github.com/users/aaroncrawford/gists{/gist_id}","starred_url":"https://api.github.com/users/aaroncrawford/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/aaroncrawford/subscriptions","organizations_url":"https://api.github.com/users/aaroncrawford/orgs","repos_url":"https://api.github.com/users/aaroncrawford/repos","events_url":"https://api.github.com/users/aaroncrawford/events{/privacy}","received_events_url":"https://api.github.com/users/aaroncrawford/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:03:15Z","updated_at":"2015-01-01T01:03:15Z","body":"This should be addressed - relying on jquery for animation doesn't invoke the GPU."}},"public":true,"created_at":"2015-01-01T01:03:15Z"}
{"id":"2489397305","type":"CreateEvent","actor":{"id":1308363,"login":"paymonp","gravatar_id":"","url":"https://api.github.com/users/paymonp","avatar_url":"https://avatars.githubusercontent.com/u/1308363?"},"repo":{"id":28678242,"name":"paymonp/forecast_wrapper","url":"https://api.github.com/repos/paymonp/forecast_wrapper"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"A wrapper to simplify Forecast API data, and add some extra functionality (Ex. determining current night/day status for a location).","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:03:18Z"}
{"id":"2489397309","type":"CreateEvent","actor":{"id":693815,"login":"apburnes","gravatar_id":"","url":"https://api.github.com/users/apburnes","avatar_url":"https://avatars.githubusercontent.com/u/693815?"},"repo":{"id":28678243,"name":"apburnes/sf_3D_elevation","url":"https://api.github.com/repos/apburnes/sf_3D_elevation"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"STL file of SF based on 5ft contour points.","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:03:18Z"}
{"id":"2489397311","type":"IssueCommentEvent","actor":{"id":8508800,"login":"cmp-202","gravatar_id":"","url":"https://api.github.com/users/cmp-202","avatar_url":"https://avatars.githubusercontent.com/u/8508800?"},"repo":{"id":23310272,"name":"cmp-202/ssh2shell","url":"https://api.github.com/repos/cmp-202/ssh2shell"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/cmp-202/ssh2shell/issues/10","labels_url":"https://api.github.com/repos/cmp-202/ssh2shell/issues/10/labels{/name}","comments_url":"https://api.github.com/repos/cmp-202/ssh2shell/issues/10/comments","events_url":"https://api.github.com/repos/cmp-202/ssh2shell/issues/10/events","html_url":"https://github.com/cmp-202/ssh2shell/issues/10","id":53071635,"number":10,"title":"Timeout error (part 2)","user":{"login":"macirex","id":1192393,"avatar_url":"https://avatars.githubusercontent.com/u/1192393?v=3","gravatar_id":"","url":"https://api.github.com/users/macirex","html_url":"https://github.com/macirex","followers_url":"https://api.github.com/users/macirex/followers","following_url":"https://api.github.com/users/macirex/following{/other_user}","gists_url":"https://api.github.com/users/macirex/gists{/gist_id}","starred_url":"https://api.github.com/users/macirex/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/macirex/subscriptions","organizations_url":"https://api.github.com/users/macirex/orgs","repos_url":"https://api.github.com/users/macirex/repos","events_url":"https://api.github.com/users/macirex/events{/privacy}","received_events_url":"https://api.github.com/users/macirex/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":7,"created_at":"2014-12-29T21:04:44Z","updated_at":"2015-01-01T01:03:18Z","closed_at":null,"body":"Hello cmp,\r\n\r\nI´m sorry to bother you again but I´ve encountered the another time out issue.\r\n\r\nLet me provide some context first:\r\n\r\nA group of 
servers I administer have some restricted policies:\r\n\r\n- Root and application domain users are inaccessible via ssh.\r\n- None of the application users have password.\r\n- There´s only one user available for ssh connection, it is used for everything and it has limited permissions, for references this will be called \"simpleuser\". \r\n- Only way to administer a server is to connect via ssh to the \"simpleuser\" and then do a su to root. \r\n\r\nBasically the flow goes like this: \r\nLogin -> su - root -> su - domainapp ->  [Here I do what I need to do]   \r\n\r\nThe list of commands I´m trying is:\r\n  commands:           [\r\n    \"su - root\", \r\n    \"echo hello\" \r\n    \"su - webapp\",\r\n    \"ls -lthr\",\r\n  ]\r\n\r\nI managed to log into root using the event on commandProcessing and writing the password directly into the stream:\r\n\r\n<code>\r\nSSH.on ('commandProcessing', function onCommandProcessing( command, response, sshObj, stream ) {   \r\n            if (command.match(/root/)&& response.indexOf(\"Password:\") != -1) {\r\n\t           if (!admin)\r\n\t\t   {\r\n\t\t\tstream.write('password\\n');\r\n\t\t\tadmin = true;\r\n\t\t    }\r\n              });\r\n</code>\r\n\r\nAfter that, I try to do another su, this time to the domain I need to check but it fails with: \r\nTimeout error: 10.164.12.159: Command timed out after 5 seconds\r\n\r\nHere´s the output my app generates:\r\n\r\nConnected\r\nRunning commands Now\r\n10.164.12.159 verbose:Your password will expire in 8 days.\r\n[user01@machine043]>\r\n10.164.12.159 verbose:su - root\r\nPassword:\r\n[root@machine043]>\r\n10.164.12.159 verbose:echo hello\r\nhello\r\n[root@machine043]>\r\nTimeout error: 10.164.12.159: Command timed out after 5 seconds\r\nCompleted\r\n\r\nAny commands I execute before trying the second su, it works perfectly but after the second su I only get Timeout error.\r\n\r\nThis is the full session responses:\r\nConnected to 10.164.12.159\r\nsu - 
root\r\nPassword:\r\n[root@machine043]> echo hello\r\nhello\r\n[root@machine043]> su - webapp\r\nmachine043@webapp:~>\r\n\r\nAny insights you could share with me?\r\nCould this be happening because the name of the prompt is different from the first two?  Where simpleuser and root has username@machinename and webapp has machinename@username?\r\n\r\nBtw, merry christmas! and have a happy new year!"},"comment":{"url":"https://api.github.com/repos/cmp-202/ssh2shell/issues/comments/68477282","html_url":"https://github.com/cmp-202/ssh2shell/issues/10#issuecomment-68477282","issue_url":"https://api.github.com/repos/cmp-202/ssh2shell/issues/10","id":68477282,"user":{"login":"cmp-202","id":8508800,"avatar_url":"https://avatars.githubusercontent.com/u/8508800?v=3","gravatar_id":"","url":"https://api.github.com/users/cmp-202","html_url":"https://github.com/cmp-202","followers_url":"https://api.github.com/users/cmp-202/followers","following_url":"https://api.github.com/users/cmp-202/following{/other_user}","gists_url":"https://api.github.com/users/cmp-202/gists{/gist_id}","starred_url":"https://api.github.com/users/cmp-202/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/cmp-202/subscriptions","organizations_url":"https://api.github.com/users/cmp-202/orgs","repos_url":"https://api.github.com/users/cmp-202/repos","events_url":"https://api.github.com/users/cmp-202/events{/privacy}","received_events_url":"https://api.github.com/users/cmp-202/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:03:18Z","updated_at":"2015-01-01T01:03:18Z","body":"you can increase the timeout value to allow for the scripts to run `host.idleTimeOut = 10000`"}},"public":true,"created_at":"2015-01-01T01:03:18Z"}
{"id":"2489397317","type":"CreateEvent","actor":{"id":1398544,"login":"joelpurra","gravatar_id":"","url":"https://api.github.com/users/joelpurra","avatar_url":"https://avatars.githubusercontent.com/u/1398544?"},"repo":{"id":28595466,"name":"joelpurra/jqnpm","url":"https://api.github.com/repos/joelpurra/jqnpm"},"payload":{"ref":"v0.3.3","ref_type":"tag","master_branch":"master","description":"A package manager built for jq as an example implementation.","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:03:19Z"}
{"id":"2489397322","type":"CreateEvent","actor":{"id":10263666,"login":"katiekroik","gravatar_id":"","url":"https://api.github.com/users/katiekroik","avatar_url":"https://avatars.githubusercontent.com/u/10263666?"},"repo":{"id":28677679,"name":"jl4282/swirlwebsite","url":"https://api.github.com/repos/jl4282/swirlwebsite"},"payload":{"ref":"develop","ref_type":"branch","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:03:20Z"}
{"id":"2489397327","type":"PushEvent","actor":{"id":2961036,"login":"codemercenary","gravatar_id":"","url":"https://api.github.com/users/codemercenary","avatar_url":"https://avatars.githubusercontent.com/u/2961036?"},"repo":{"id":22234733,"name":"leapmotion/autowiring","url":"https://api.github.com/repos/leapmotion/autowiring"},"payload":{"push_id":536752898,"size":2,"distinct_size":1,"ref":"refs/heads/fix-autoboost","head":"3f0c9d9becf969aab74c7b4fe222854a6eebe58b","before":"36b2b53a58e4725efd0cf1a9823175cd492ad044","commits":[{"sha":"72c45ac5ebe38bb3581a26ebd6600b3769e6022c","author":{"email":"2766fce9ce519d0471f8fc0cf2c841e5384821e2@gmail.com","name":"Ted Nitz"},"message":"Merge pull request #313 from leapmotion/fix-cmakewarn\n\nEliminate unnecessary quoted variable expansions","distinct":false,"url":"https://api.github.com/repos/leapmotion/autowiring/commits/72c45ac5ebe38bb3581a26ebd6600b3769e6022c"},{"sha":"3f0c9d9becf969aab74c7b4fe222854a6eebe58b","author":{"email":"f4b726eb4428c94ec1239af9e3b06d73d64a2f9c@gmail.com","name":"Jason Lokerson"},"message":"Rename boost to autoboost\n\nHuge modification, requiring adjustements to namespaces, macros, file names, and header guards.  This change introduces a private version of Boost 1.57.0 that can be linked externally on platforms which do not have full STL11 support without colliding in any way with those platforms' independent use of boost.","distinct":true,"url":"https://api.github.com/repos/leapmotion/autowiring/commits/3f0c9d9becf969aab74c7b4fe222854a6eebe58b"}]},"public":true,"created_at":"2015-01-01T01:03:21Z","org":{"id":2242710,"login":"leapmotion","gravatar_id":"","url":"https://api.github.com/orgs/leapmotion","avatar_url":"https://avatars.githubusercontent.com/u/2242710?"}}
{"id":"2489397328","type":"IssuesEvent","actor":{"id":762599,"login":"natedavis","gravatar_id":"","url":"https://api.github.com/users/natedavis","avatar_url":"https://avatars.githubusercontent.com/u/762599?"},"repo":{"id":8348465,"name":"BF2Statistics/ControlCenter","url":"https://api.github.com/repos/BF2Statistics/ControlCenter"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/BF2Statistics/ControlCenter/issues/2","labels_url":"https://api.github.com/repos/BF2Statistics/ControlCenter/issues/2/labels{/name}","comments_url":"https://api.github.com/repos/BF2Statistics/ControlCenter/issues/2/comments","events_url":"https://api.github.com/repos/BF2Statistics/ControlCenter/issues/2/events","html_url":"https://github.com/BF2Statistics/ControlCenter/issues/2","id":53210225,"number":2,"title":"Launch Server invalid Path name","user":{"login":"natedavis","id":762599,"avatar_url":"https://avatars.githubusercontent.com/u/762599?v=3","gravatar_id":"","url":"https://api.github.com/users/natedavis","html_url":"https://github.com/natedavis","followers_url":"https://api.github.com/users/natedavis/followers","following_url":"https://api.github.com/users/natedavis/following{/other_user}","gists_url":"https://api.github.com/users/natedavis/gists{/gist_id}","starred_url":"https://api.github.com/users/natedavis/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/natedavis/subscriptions","organizations_url":"https://api.github.com/users/natedavis/orgs","repos_url":"https://api.github.com/users/natedavis/repos","events_url":"https://api.github.com/users/natedavis/events{/privacy}","received_events_url":"https://api.github.com/users/natedavis/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:03:21Z","updated_at":"2015-01-01T01:03:21Z","closed_at":null,"body":"System: Server 2008 R2\r\n\r\nBF2 is installed:\r\nC:\\Program Files 
(x86)\\EA Games\\Battlefield 2 Server\\\r\nBF2Statistics is install:\r\nC:\\Program Files (x86)\\BF2Statistics\\BF2Statistics Control Center\\\r\n\r\nWhen I try and Launch the game with \"Use Global Settings File\" The Server will not launch with my settings.\r\n\r\nFrom the command line, I tested the following...\r\n\r\nPath Generated in MainForm.cs on line 457 - Which is not working:\r\nbf2_w32ded.exe +modPath mods/bf2 +config C:\\\\Program Files (x86)\\\\BF2Statistics\\\\BF2Statistics Control Center\\\\Python\\\\GlobalServerSettings.con\r\n\r\nIf I use the following to Launch the server manually it works great:\r\nbf2_w32ded.exe +modPath mods/bf2 +config \"C:\\Program Files (x86)\\BF2Statistics\\BF2Statistics Control Center\\Python\\GlobalServerSettings.con\"\r\n\r\nQuotes at the end and beginning with no escaping \\s.\r\n\r\n\r\n"}},"public":true,"created_at":"2015-01-01T01:03:22Z","org":{"id":2574835,"login":"BF2Statistics","gravatar_id":"","url":"https://api.github.com/orgs/BF2Statistics","avatar_url":"https://avatars.githubusercontent.com/u/2574835?"}}
{"id":"2489397337","type":"PullRequestEvent","actor":{"id":447569,"login":"tom-henderson","gravatar_id":"","url":"https://api.github.com/users/tom-henderson","avatar_url":"https://avatars.githubusercontent.com/u/447569?"},"repo":{"id":11580119,"name":"joerick/django-timecode","url":"https://api.github.com/repos/joerick/django-timecode"},"payload":{"action":"opened","number":1,"pull_request":{"url":"https://api.github.com/repos/joerick/django-timecode/pulls/1","id":26739431,"html_url":"https://github.com/joerick/django-timecode/pull/1","diff_url":"https://github.com/joerick/django-timecode/pull/1.diff","patch_url":"https://github.com/joerick/django-timecode/pull/1.patch","issue_url":"https://api.github.com/repos/joerick/django-timecode/issues/1","number":1,"state":"open","locked":false,"title":"Django jquery","user":{"login":"tom-henderson","id":447569,"avatar_url":"https://avatars.githubusercontent.com/u/447569?v=3","gravatar_id":"","url":"https://api.github.com/users/tom-henderson","html_url":"https://github.com/tom-henderson","followers_url":"https://api.github.com/users/tom-henderson/followers","following_url":"https://api.github.com/users/tom-henderson/following{/other_user}","gists_url":"https://api.github.com/users/tom-henderson/gists{/gist_id}","starred_url":"https://api.github.com/users/tom-henderson/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/tom-henderson/subscriptions","organizations_url":"https://api.github.com/users/tom-henderson/orgs","repos_url":"https://api.github.com/users/tom-henderson/repos","events_url":"https://api.github.com/users/tom-henderson/events{/privacy}","received_events_url":"https://api.github.com/users/tom-henderson/received_events","type":"User","site_admin":false},"body":"Use jQuery from the Django namespace so timecode fields work in the django 
admin.","created_at":"2015-01-01T01:03:22Z","updated_at":"2015-01-01T01:03:23Z","closed_at":null,"merged_at":null,"merge_commit_sha":null,"assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/joerick/django-timecode/pulls/1/commits","review_comments_url":"https://api.github.com/repos/joerick/django-timecode/pulls/1/comments","review_comment_url":"https://api.github.com/repos/joerick/django-timecode/pulls/comments/{number}","comments_url":"https://api.github.com/repos/joerick/django-timecode/issues/1/comments","statuses_url":"https://api.github.com/repos/joerick/django-timecode/statuses/567af7c7dd6130eb9cea3c3f9065c0bc1d801df1","head":{"label":"tom-henderson:django-jquery","ref":"django-jquery","sha":"567af7c7dd6130eb9cea3c3f9065c0bc1d801df1","user":{"login":"tom-henderson","id":447569,"avatar_url":"https://avatars.githubusercontent.com/u/447569?v=3","gravatar_id":"","url":"https://api.github.com/users/tom-henderson","html_url":"https://github.com/tom-henderson","followers_url":"https://api.github.com/users/tom-henderson/followers","following_url":"https://api.github.com/users/tom-henderson/following{/other_user}","gists_url":"https://api.github.com/users/tom-henderson/gists{/gist_id}","starred_url":"https://api.github.com/users/tom-henderson/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/tom-henderson/subscriptions","organizations_url":"https://api.github.com/users/tom-henderson/orgs","repos_url":"https://api.github.com/users/tom-henderson/repos","events_url":"https://api.github.com/users/tom-henderson/events{/privacy}","received_events_url":"https://api.github.com/users/tom-henderson/received_events","type":"User","site_admin":false},"repo":{"id":28677632,"name":"django-timecode","full_name":"tom-henderson/django-timecode","owner":{"login":"tom-henderson","id":447569,"avatar_url":"https://avatars.githubusercontent.com/u/447569?v=3","gravatar_id":"","url":"https://api.github.com/users/tom-henderson","html_url":"https
://github.com/tom-henderson","followers_url":"https://api.github.com/users/tom-henderson/followers","following_url":"https://api.github.com/users/tom-henderson/following{/other_user}","gists_url":"https://api.github.com/users/tom-henderson/gists{/gist_id}","starred_url":"https://api.github.com/users/tom-henderson/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/tom-henderson/subscriptions","organizations_url":"https://api.github.com/users/tom-henderson/orgs","repos_url":"https://api.github.com/users/tom-henderson/repos","events_url":"https://api.github.com/users/tom-henderson/events{/privacy}","received_events_url":"https://api.github.com/users/tom-henderson/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/tom-henderson/django-timecode","description":"A python class for a timecode and accompanying django field","fork":true,"url":"https://api.github.com/repos/tom-henderson/django-timecode","forks_url":"https://api.github.com/repos/tom-henderson/django-timecode/forks","keys_url":"https://api.github.com/repos/tom-henderson/django-timecode/keys{/key_id}","collaborators_url":"https://api.github.com/repos/tom-henderson/django-timecode/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/tom-henderson/django-timecode/teams","hooks_url":"https://api.github.com/repos/tom-henderson/django-timecode/hooks","issue_events_url":"https://api.github.com/repos/tom-henderson/django-timecode/issues/events{/number}","events_url":"https://api.github.com/repos/tom-henderson/django-timecode/events","assignees_url":"https://api.github.com/repos/tom-henderson/django-timecode/assignees{/user}","branches_url":"https://api.github.com/repos/tom-henderson/django-timecode/branches{/branch}","tags_url":"https://api.github.com/repos/tom-henderson/django-timecode/tags","blobs_url":"https://api.github.com/repos/tom-henderson/django-timecode/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/tom-hend
erson/django-timecode/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/tom-henderson/django-timecode/git/refs{/sha}","trees_url":"https://api.github.com/repos/tom-henderson/django-timecode/git/trees{/sha}","statuses_url":"https://api.github.com/repos/tom-henderson/django-timecode/statuses/{sha}","languages_url":"https://api.github.com/repos/tom-henderson/django-timecode/languages","stargazers_url":"https://api.github.com/repos/tom-henderson/django-timecode/stargazers","contributors_url":"https://api.github.com/repos/tom-henderson/django-timecode/contributors","subscribers_url":"https://api.github.com/repos/tom-henderson/django-timecode/subscribers","subscription_url":"https://api.github.com/repos/tom-henderson/django-timecode/subscription","commits_url":"https://api.github.com/repos/tom-henderson/django-timecode/commits{/sha}","git_commits_url":"https://api.github.com/repos/tom-henderson/django-timecode/git/commits{/sha}","comments_url":"https://api.github.com/repos/tom-henderson/django-timecode/comments{/number}","issue_comment_url":"https://api.github.com/repos/tom-henderson/django-timecode/issues/comments/{number}","contents_url":"https://api.github.com/repos/tom-henderson/django-timecode/contents/{+path}","compare_url":"https://api.github.com/repos/tom-henderson/django-timecode/compare/{base}...{head}","merges_url":"https://api.github.com/repos/tom-henderson/django-timecode/merges","archive_url":"https://api.github.com/repos/tom-henderson/django-timecode/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/tom-henderson/django-timecode/downloads","issues_url":"https://api.github.com/repos/tom-henderson/django-timecode/issues{/number}","pulls_url":"https://api.github.com/repos/tom-henderson/django-timecode/pulls{/number}","milestones_url":"https://api.github.com/repos/tom-henderson/django-timecode/milestones{/number}","notifications_url":"https://api.github.com/repos/tom-henderson/django-timecode/notifications{?since,all,participating
}","labels_url":"https://api.github.com/repos/tom-henderson/django-timecode/labels{/name}","releases_url":"https://api.github.com/repos/tom-henderson/django-timecode/releases{/id}","created_at":"2015-01-01T00:07:05Z","updated_at":"2015-01-01T00:07:06Z","pushed_at":"2015-01-01T00:54:15Z","git_url":"git://github.com/tom-henderson/django-timecode.git","ssh_url":"git@github.com:tom-henderson/django-timecode.git","clone_url":"https://github.com/tom-henderson/django-timecode.git","svn_url":"https://github.com/tom-henderson/django-timecode","homepage":"","size":156,"stargazers_count":0,"watchers_count":0,"language":"Python","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"joerick:master","ref":"master","sha":"737f138d8c3cbdb72e08419cf2d10dd1eb4e72d6","user":{"login":"joerick","id":1244307,"avatar_url":"https://avatars.githubusercontent.com/u/1244307?v=3","gravatar_id":"","url":"https://api.github.com/users/joerick","html_url":"https://github.com/joerick","followers_url":"https://api.github.com/users/joerick/followers","following_url":"https://api.github.com/users/joerick/following{/other_user}","gists_url":"https://api.github.com/users/joerick/gists{/gist_id}","starred_url":"https://api.github.com/users/joerick/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/joerick/subscriptions","organizations_url":"https://api.github.com/users/joerick/orgs","repos_url":"https://api.github.com/users/joerick/repos","events_url":"https://api.github.com/users/joerick/events{/privacy}","received_events_url":"https://api.github.com/users/joerick/received_events","type":"User","site_admin":false},"repo":{"id":11580119,"name":"django-timecode","full_name":"joerick/django-timecode","owner":{"login":"joerick","id":1244307,"avatar_url":"https://avatars.githubusercontent.com/u/1244307?v=3","gravatar_id":"","url
":"https://api.github.com/users/joerick","html_url":"https://github.com/joerick","followers_url":"https://api.github.com/users/joerick/followers","following_url":"https://api.github.com/users/joerick/following{/other_user}","gists_url":"https://api.github.com/users/joerick/gists{/gist_id}","starred_url":"https://api.github.com/users/joerick/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/joerick/subscriptions","organizations_url":"https://api.github.com/users/joerick/orgs","repos_url":"https://api.github.com/users/joerick/repos","events_url":"https://api.github.com/users/joerick/events{/privacy}","received_events_url":"https://api.github.com/users/joerick/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/joerick/django-timecode","description":"A python class for a timecode and accompanying django field","fork":false,"url":"https://api.github.com/repos/joerick/django-timecode","forks_url":"https://api.github.com/repos/joerick/django-timecode/forks","keys_url":"https://api.github.com/repos/joerick/django-timecode/keys{/key_id}","collaborators_url":"https://api.github.com/repos/joerick/django-timecode/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/joerick/django-timecode/teams","hooks_url":"https://api.github.com/repos/joerick/django-timecode/hooks","issue_events_url":"https://api.github.com/repos/joerick/django-timecode/issues/events{/number}","events_url":"https://api.github.com/repos/joerick/django-timecode/events","assignees_url":"https://api.github.com/repos/joerick/django-timecode/assignees{/user}","branches_url":"https://api.github.com/repos/joerick/django-timecode/branches{/branch}","tags_url":"https://api.github.com/repos/joerick/django-timecode/tags","blobs_url":"https://api.github.com/repos/joerick/django-timecode/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/joerick/django-timecode/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/jo
erick/django-timecode/git/refs{/sha}","trees_url":"https://api.github.com/repos/joerick/django-timecode/git/trees{/sha}","statuses_url":"https://api.github.com/repos/joerick/django-timecode/statuses/{sha}","languages_url":"https://api.github.com/repos/joerick/django-timecode/languages","stargazers_url":"https://api.github.com/repos/joerick/django-timecode/stargazers","contributors_url":"https://api.github.com/repos/joerick/django-timecode/contributors","subscribers_url":"https://api.github.com/repos/joerick/django-timecode/subscribers","subscription_url":"https://api.github.com/repos/joerick/django-timecode/subscription","commits_url":"https://api.github.com/repos/joerick/django-timecode/commits{/sha}","git_commits_url":"https://api.github.com/repos/joerick/django-timecode/git/commits{/sha}","comments_url":"https://api.github.com/repos/joerick/django-timecode/comments{/number}","issue_comment_url":"https://api.github.com/repos/joerick/django-timecode/issues/comments/{number}","contents_url":"https://api.github.com/repos/joerick/django-timecode/contents/{+path}","compare_url":"https://api.github.com/repos/joerick/django-timecode/compare/{base}...{head}","merges_url":"https://api.github.com/repos/joerick/django-timecode/merges","archive_url":"https://api.github.com/repos/joerick/django-timecode/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/joerick/django-timecode/downloads","issues_url":"https://api.github.com/repos/joerick/django-timecode/issues{/number}","pulls_url":"https://api.github.com/repos/joerick/django-timecode/pulls{/number}","milestones_url":"https://api.github.com/repos/joerick/django-timecode/milestones{/number}","notifications_url":"https://api.github.com/repos/joerick/django-timecode/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/joerick/django-timecode/labels{/name}","releases_url":"https://api.github.com/repos/joerick/django-timecode/releases{/id}","created_at":"2013-07-22T11:50:44Z","updat
ed_at":"2014-09-15T16:05:53Z","pushed_at":"2014-01-13T16:01:08Z","git_url":"git://github.com/joerick/django-timecode.git","ssh_url":"git@github.com:joerick/django-timecode.git","clone_url":"https://github.com/joerick/django-timecode.git","svn_url":"https://github.com/joerick/django-timecode","homepage":"","size":156,"stargazers_count":2,"watchers_count":2,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":1,"mirror_url":null,"open_issues_count":1,"forks":1,"open_issues":1,"watchers":2,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/joerick/django-timecode/pulls/1"},"html":{"href":"https://github.com/joerick/django-timecode/pull/1"},"issue":{"href":"https://api.github.com/repos/joerick/django-timecode/issues/1"},"comments":{"href":"https://api.github.com/repos/joerick/django-timecode/issues/1/comments"},"review_comments":{"href":"https://api.github.com/repos/joerick/django-timecode/pulls/1/comments"},"review_comment":{"href":"https://api.github.com/repos/joerick/django-timecode/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/joerick/django-timecode/pulls/1/commits"},"statuses":{"href":"https://api.github.com/repos/joerick/django-timecode/statuses/567af7c7dd6130eb9cea3c3f9065c0bc1d801df1"}},"merged":false,"mergeable":null,"mergeable_state":"unknown","merged_by":null,"comments":0,"review_comments":0,"commits":3,"additions":25,"deletions":23,"changed_files":2}},"public":true,"created_at":"2015-01-01T01:03:23Z"}
{"id":"2489397338","type":"PushEvent","actor":{"id":6563665,"login":"mikeberger","gravatar_id":"","url":"https://api.github.com/users/mikeberger","avatar_url":"https://avatars.githubusercontent.com/u/6563665?"},"repo":{"id":16442206,"name":"mikeberger/borg_calendar","url":"https://api.github.com/repos/mikeberger/borg_calendar"},"payload":{"push_id":536752904,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"5a79ba420970577f91cc0677f413cbecc8be3e4d","before":"14da87ea2655e8a729a0ec537720221cfc32852f","commits":[{"sha":"5a79ba420970577f91cc0677f413cbecc8be3e4d","author":{"email":"a17fed27eaa842282862ff7c1b9c8395a26ac320@mbcsoft.com","name":"Mike Berger"},"message":"update category pulldown in appointment editors when the categories change. Also fix memory leak.","distinct":true,"url":"https://api.github.com/repos/mikeberger/borg_calendar/commits/5a79ba420970577f91cc0677f413cbecc8be3e4d"}]},"public":true,"created_at":"2015-01-01T01:03:23Z"}
{"id":"2489397348","type":"PushEvent","actor":{"id":6325631,"login":"pirej","gravatar_id":"","url":"https://api.github.com/users/pirej","avatar_url":"https://avatars.githubusercontent.com/u/6325631?"},"repo":{"id":27978759,"name":"lollipoop/android_device_sony_montblanc-common","url":"https://api.github.com/repos/lollipoop/android_device_sony_montblanc-common"},"payload":{"push_id":536752906,"size":1,"distinct_size":1,"ref":"refs/heads/m4","head":"4dea1e80ea185145d16f8a27b53c49004a82486a","before":"81c8b8e24cebad126b22e7eee0e5ad490d0da7ee","commits":[{"sha":"4dea1e80ea185145d16f8a27b53c49004a82486a","author":{"email":"1286c54ccb8bc261f2349e0273c6fbd8e8811d8d@yahoo.com","name":"pirej"},"message":"Update BoardConfigCommon.mk","distinct":true,"url":"https://api.github.com/repos/lollipoop/android_device_sony_montblanc-common/commits/4dea1e80ea185145d16f8a27b53c49004a82486a"}]},"public":true,"created_at":"2015-01-01T01:03:25Z","org":{"id":10051895,"login":"lollipoop","gravatar_id":"","url":"https://api.github.com/orgs/lollipoop","avatar_url":"https://avatars.githubusercontent.com/u/10051895?"}}
{"id":"2489397352","type":"PushEvent","actor":{"id":674513,"login":"jonesde","gravatar_id":"","url":"https://api.github.com/users/jonesde","avatar_url":"https://avatars.githubusercontent.com/u/674513?"},"repo":{"id":23584277,"name":"sssonline/mantle","url":"https://api.github.com/repos/sssonline/mantle"},"payload":{"push_id":536752908,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e09da87aef6c7dc586dea4fbc905b700a5a45766","before":"d51d27b9328f9625588ab93bd9be509a8fa775bd","commits":[{"sha":"e09da87aef6c7dc586dea4fbc905b700a5a45766","author":{"email":"2c659b141cba72e98a27345389f1cac5e8612a49@dejc.com","name":"David E Jones"},"message":"Changed AssetRegistration to have a sub-sequence key instead of using fromDate, may have multiple records with the same fromDate so it isn't a good key","distinct":true,"url":"https://api.github.com/repos/sssonline/mantle/commits/e09da87aef6c7dc586dea4fbc905b700a5a45766"}]},"public":true,"created_at":"2015-01-01T01:03:26Z"}
{"id":"2489397355","type":"PushEvent","actor":{"id":803768,"login":"backbone","gravatar_id":"","url":"https://api.github.com/users/backbone","avatar_url":"https://avatars.githubusercontent.com/u/803768?"},"repo":{"id":24404721,"name":"backbone/portage-tree","url":"https://api.github.com/repos/backbone/portage-tree"},"payload":{"push_id":536752911,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b1677769b2847c0a94f6f8015bffeed5d1a24204","before":"dccafb540891dd450a885612cabf712d3129dbdf","commits":[{"sha":"b1677769b2847c0a94f6f8015bffeed5d1a24204","author":{"email":"4da38e79dbf743adc207e22b3829ee998325e896@backbone.ws","name":"Kolan Sh"},"message":"Sync with portage [Thu Jan  1 04:03:20 MSK 2015].","distinct":true,"url":"https://api.github.com/repos/backbone/portage-tree/commits/b1677769b2847c0a94f6f8015bffeed5d1a24204"}]},"public":true,"created_at":"2015-01-01T01:03:26Z"}
{"id":"2489397357","type":"PushEvent","actor":{"id":10176820,"login":"chalavadivishnu","gravatar_id":"","url":"https://api.github.com/users/chalavadivishnu","avatar_url":"https://avatars.githubusercontent.com/u/10176820?"},"repo":{"id":28678150,"name":"chalavadivishnu/Face-Detection","url":"https://api.github.com/repos/chalavadivishnu/Face-Detection"},"payload":{"push_id":536752912,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"96f7f02d9551bb3c922c9c6303b9d144e2c31398","before":"74e68efacee23b35716fa9b2b46d0926e552250b","commits":[{"sha":"96f7f02d9551bb3c922c9c6303b9d144e2c31398","author":{"email":"ce8044f02eb2a26b631671f5297317036d398e79@gmail.com","name":"Chalavadi Vishnu"},"message":"load images","distinct":true,"url":"https://api.github.com/repos/chalavadivishnu/Face-Detection/commits/96f7f02d9551bb3c922c9c6303b9d144e2c31398"}]},"public":true,"created_at":"2015-01-01T01:03:26Z"}
{"id":"2489397358","type":"PushEvent","actor":{"id":904370,"login":"helhum","gravatar_id":"","url":"https://api.github.com/users/helhum","avatar_url":"https://avatars.githubusercontent.com/u/904370?"},"repo":{"id":21070637,"name":"TYPO3-Surf-CMS/TYPO3SurfCms.SurfTools","url":"https://api.github.com/repos/TYPO3-Surf-CMS/TYPO3SurfCms.SurfTools"},"payload":{"push_id":536752913,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e9f19e894cc8cb5777c9343c6bdb2fbf5e3f2945","before":"03ce16ec5d355a60057fb57f8d27d7116422f722","commits":[{"sha":"e9f19e894cc8cb5777c9343c6bdb2fbf5e3f2945","author":{"email":"6bf857ca7de026fbed4ae790a809a0ea640901f4@helmuthummel.de","name":"Helmut Hummel"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/TYPO3-Surf-CMS/TYPO3SurfCms.SurfTools/commits/e9f19e894cc8cb5777c9343c6bdb2fbf5e3f2945"}]},"public":true,"created_at":"2015-01-01T01:03:27Z","org":{"id":7921669,"login":"TYPO3-Surf-CMS","gravatar_id":"","url":"https://api.github.com/orgs/TYPO3-Surf-CMS","avatar_url":"https://avatars.githubusercontent.com/u/7921669?"}}
{"id":"2489397369","type":"PushEvent","actor":{"id":512573,"login":"SamWhited","gravatar_id":"","url":"https://api.github.com/users/SamWhited","avatar_url":"https://avatars.githubusercontent.com/u/512573?"},"repo":{"id":27289261,"name":"campaul/ph.sh","url":"https://api.github.com/repos/campaul/ph.sh"},"payload":{"push_id":536752919,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"688e49dcbc4acfb6b4b1871debaaa712f1f7410e","before":"51db74f429e57b90e1cc9ca18551ca5e74b7db49","commits":[{"sha":"688e49dcbc4acfb6b4b1871debaaa712f1f7410e","author":{"email":"f16bed56189e249fe4ca8ed10a1ecae60e8ceac0@samwhited.com","name":"Sam Whited"},"message":"Fix in-place import","distinct":true,"url":"https://api.github.com/repos/campaul/ph.sh/commits/688e49dcbc4acfb6b4b1871debaaa712f1f7410e"}]},"public":true,"created_at":"2015-01-01T01:03:28Z"}
{"id":"2489397370","type":"CreateEvent","actor":{"id":1059214,"login":"wlaurance","gravatar_id":"","url":"https://api.github.com/users/wlaurance","avatar_url":"https://avatars.githubusercontent.com/u/1059214?"},"repo":{"id":28050478,"name":"empirical-org/Quill-Grammar","url":"https://api.github.com/repos/empirical-org/Quill-Grammar"},"payload":{"ref":"feature/teacher-form","ref_type":"branch","master_branch":"master","description":"Quill Grammar App","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:03:28Z","org":{"id":4258432,"login":"empirical-org","gravatar_id":"","url":"https://api.github.com/orgs/empirical-org","avatar_url":"https://avatars.githubusercontent.com/u/4258432?"}}
{"id":"2489397372","type":"CreateEvent","actor":{"id":840120,"login":"joaoalf","gravatar_id":"","url":"https://api.github.com/users/joaoalf","avatar_url":"https://avatars.githubusercontent.com/u/840120?"},"repo":{"id":21998771,"name":"savoirfairelinux/partner-contact","url":"https://api.github.com/repos/savoirfairelinux/partner-contact"},"payload":{"ref":"7.0_fix_function_partner_import_issue","ref_type":"branch","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:03:28Z","org":{"id":2735545,"login":"savoirfairelinux","gravatar_id":"","url":"https://api.github.com/orgs/savoirfairelinux","avatar_url":"https://avatars.githubusercontent.com/u/2735545?"}}
{"id":"2489397375","type":"PushEvent","actor":{"id":8396076,"login":"chris-kobrzak","gravatar_id":"","url":"https://api.github.com/users/chris-kobrzak","avatar_url":"https://avatars.githubusercontent.com/u/8396076?"},"repo":{"id":28611088,"name":"chris-kobrzak/natalia.dns4e.net","url":"https://api.github.com/repos/chris-kobrzak/natalia.dns4e.net"},"payload":{"push_id":536752923,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"dbc61a3aeb6b13937d9b1345ca46f9965a2eb950","before":"1e3a5af2be263253fdc3343d7bc23cf456058531","commits":[{"sha":"dbc61a3aeb6b13937d9b1345ca46f9965a2eb950","author":{"email":"33a9c8b3090a200dac7ed5d8b6d398372695ff06@gmail.com","name":"Chris Kobrzak"},"message":"Initial version of Natalie's image gallery","distinct":true,"url":"https://api.github.com/repos/chris-kobrzak/natalia.dns4e.net/commits/dbc61a3aeb6b13937d9b1345ca46f9965a2eb950"}]},"public":true,"created_at":"2015-01-01T01:03:29Z"}
{"id":"2489397376","type":"GollumEvent","actor":{"id":720678,"login":"kongr45gpen","gravatar_id":"","url":"https://api.github.com/users/kongr45gpen","avatar_url":"https://avatars.githubusercontent.com/u/720678?"},"repo":{"id":11615971,"name":"allejo/bzion","url":"https://api.github.com/repos/allejo/bzion"},"payload":{"pages":[{"page_name":"Installation","title":"Installation","summary":null,"action":"edited","sha":"a2a782b24c716c5e675ec38ccda1c620edeafbf1","html_url":"https://github.com/allejo/bzion/wiki/Installation"}]},"public":true,"created_at":"2015-01-01T01:03:29Z"}
{"id":"2489397377","type":"IssuesEvent","actor":{"id":1313396,"login":"castvoid","gravatar_id":"","url":"https://api.github.com/users/castvoid","avatar_url":"https://avatars.githubusercontent.com/u/1313396?"},"repo":{"id":28132069,"name":"adbsjb/Website","url":"https://api.github.com/repos/adbsjb/Website"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/adbsjb/Website/issues/1","labels_url":"https://api.github.com/repos/adbsjb/Website/issues/1/labels{/name}","comments_url":"https://api.github.com/repos/adbsjb/Website/issues/1/comments","events_url":"https://api.github.com/repos/adbsjb/Website/issues/1/events","html_url":"https://github.com/adbsjb/Website/issues/1","id":53210229,"number":1,"title":"Lack of pictures of Gleb","user":{"login":"castvoid","id":1313396,"avatar_url":"https://avatars.githubusercontent.com/u/1313396?v=3","gravatar_id":"","url":"https://api.github.com/users/castvoid","html_url":"https://github.com/castvoid","followers_url":"https://api.github.com/users/castvoid/followers","following_url":"https://api.github.com/users/castvoid/following{/other_user}","gists_url":"https://api.github.com/users/castvoid/gists{/gist_id}","starred_url":"https://api.github.com/users/castvoid/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/castvoid/subscriptions","organizations_url":"https://api.github.com/users/castvoid/orgs","repos_url":"https://api.github.com/users/castvoid/repos","events_url":"https://api.github.com/users/castvoid/events{/privacy}","received_events_url":"https://api.github.com/users/castvoid/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:03:29Z","updated_at":"2015-01-01T01:03:29Z","closed_at":null,"body":"See title"}},"public":true,"created_at":"2015-01-01T01:03:29Z"}
{"id":"2489397384","type":"PushEvent","actor":{"id":280212,"login":"KenanSulayman","gravatar_id":"","url":"https://api.github.com/users/KenanSulayman","avatar_url":"https://avatars.githubusercontent.com/u/280212?"},"repo":{"id":21481110,"name":"KenanSulayman/heartbeat","url":"https://api.github.com/repos/KenanSulayman/heartbeat"},"payload":{"push_id":536752925,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"c085f224e47c8147e6085f897cb91a07834211b1","before":"d3f1564c71b9e115435146f52c4c7c5771f819c7","commits":[{"sha":"c085f224e47c8147e6085f897cb91a07834211b1","author":{"email":"9176253dfc0bc82671a5e984646605f93319147a@sly.mn","name":"Kenan Sulayman"},"message":"1420074208651\n\nMuLnvTUe41hdRnmxxHnfDhkDkxsJfepcQfRosAA0g3I=","distinct":true,"url":"https://api.github.com/repos/KenanSulayman/heartbeat/commits/c085f224e47c8147e6085f897cb91a07834211b1"}]},"public":true,"created_at":"2015-01-01T01:03:30Z"}
{"id":"2489397385","type":"PushEvent","actor":{"id":8908463,"login":"ivankp","gravatar_id":"","url":"https://api.github.com/users/ivankp","avatar_url":"https://avatars.githubusercontent.com/u/8908463?"},"repo":{"id":26780993,"name":"ivankp/bh_analysis","url":"https://api.github.com/repos/ivankp/bh_analysis"},"payload":{"push_id":536752926,"size":1,"distinct_size":1,"ref":"refs/heads/testing","head":"54b3cd7571257f9c38f4cfb5ad5fbb379419d827","before":"1cd6e64b009254caf84067f3a836e3b1d5f98218","commits":[{"sha":"54b3cd7571257f9c38f4cfb5ad5fbb379419d827","author":{"email":"9c1affc1d2e05e5eafd0291f399cde138f8c80d5@gmail.com","name":"ivankp"},"message":"reweigh scales","distinct":true,"url":"https://api.github.com/repos/ivankp/bh_analysis/commits/54b3cd7571257f9c38f4cfb5ad5fbb379419d827"}]},"public":true,"created_at":"2015-01-01T01:03:30Z"}
{"id":"2489397389","type":"PushEvent","actor":{"id":5049892,"login":"Brawl345","gravatar_id":"","url":"https://api.github.com/users/Brawl345","avatar_url":"https://avatars.githubusercontent.com/u/5049892?"},"repo":{"id":19072701,"name":"Brawl345/dotfiles","url":"https://api.github.com/repos/Brawl345/dotfiles"},"payload":{"push_id":536752927,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"4c41a4d670beb420424b3e0c3d589614bf7307a7","before":"a867a28418d4ca895f96fe9902914a1cd6ac56b9","commits":[{"sha":"4c41a4d670beb420424b3e0c3d589614bf7307a7","author":{"email":"3a3e021605a88f7e51d5787c2ebbb30bfb66608d@outlook.com","name":"Andreas Bielawski"},"message":"changes","distinct":true,"url":"https://api.github.com/repos/Brawl345/dotfiles/commits/4c41a4d670beb420424b3e0c3d589614bf7307a7"}]},"public":true,"created_at":"2015-01-01T01:03:31Z"}
{"id":"2489397392","type":"PushEvent","actor":{"id":512573,"login":"SamWhited","gravatar_id":"","url":"https://api.github.com/users/SamWhited","avatar_url":"https://avatars.githubusercontent.com/u/512573?"},"repo":{"id":28072019,"name":"SamWhited/ph.sh","url":"https://api.github.com/repos/SamWhited/ph.sh"},"payload":{"push_id":536752928,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"688e49dcbc4acfb6b4b1871debaaa712f1f7410e","before":"51db74f429e57b90e1cc9ca18551ca5e74b7db49","commits":[{"sha":"688e49dcbc4acfb6b4b1871debaaa712f1f7410e","author":{"email":"f16bed56189e249fe4ca8ed10a1ecae60e8ceac0@samwhited.com","name":"Sam Whited"},"message":"Fix in-place import","distinct":true,"url":"https://api.github.com/repos/SamWhited/ph.sh/commits/688e49dcbc4acfb6b4b1871debaaa712f1f7410e"}]},"public":true,"created_at":"2015-01-01T01:03:31Z"}
{"id":"2489397405","type":"PushEvent","actor":{"id":6132327,"login":"nboneh","gravatar_id":"","url":"https://api.github.com/users/nboneh","avatar_url":"https://avatars.githubusercontent.com/u/6132327?"},"repo":{"id":25111641,"name":"nboneh/RingSynth","url":"https://api.github.com/repos/nboneh/RingSynth"},"payload":{"push_id":536752932,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"880ddf590a2e7d0fbe3a536cd726ac4bf3979d6f","before":"e8ac58f4157f0a86f6ca8f45fb79692b0160cc6f","commits":[{"sha":"880ddf590a2e7d0fbe3a536cd726ac4bf3979d6f","author":{"email":"158d4d4d94da2b7d5e7618d078746dcf02ab54d3@gmail.com","name":"Nir Boneh"},"message":"Normal tunin around A4","distinct":true,"url":"https://api.github.com/repos/nboneh/RingSynth/commits/880ddf590a2e7d0fbe3a536cd726ac4bf3979d6f"}]},"public":true,"created_at":"2015-01-01T01:03:33Z"}
{"id":"2489397406","type":"PushEvent","actor":{"id":4228183,"login":"batchpause","gravatar_id":"","url":"https://api.github.com/users/batchpause","avatar_url":"https://avatars.githubusercontent.com/u/4228183?"},"repo":{"id":9607679,"name":"batchpause/PAUSE-git","url":"https://api.github.com/repos/batchpause/PAUSE-git"},"payload":{"push_id":536752933,"size":12,"distinct_size":12,"ref":"refs/heads/master","head":"03e53dd011cc8cc2c7054959bf5be8af53086102","before":"6f0e51444646919a9f112644a693a93cc4896d18","commits":[{"sha":"69f1e847fb31e24851a4e1f85e1a7c2f6a357a36","author":{"email":"dc76e9f0c0006e8f919e0c515c66dbba3982f785@pause2.develooper.com","name":"root"},"message":"indexer run at 1420049821, pid 12413","distinct":true,"url":"https://api.github.com/repos/batchpause/PAUSE-git/commits/69f1e847fb31e24851a4e1f85e1a7c2f6a357a36"},{"sha":"300581b6d8e97a15e79c78fcdc0553074d21e2b8","author":{"email":"dc76e9f0c0006e8f919e0c515c66dbba3982f785@pause2.develooper.com","name":"root"},"message":"indexer run at 1420053421, pid 29312","distinct":true,"url":"https://api.github.com/repos/batchpause/PAUSE-git/commits/300581b6d8e97a15e79c78fcdc0553074d21e2b8"},{"sha":"f914295d5506187cb5d5db6a5f7d049e6c3cc508","author":{"email":"dc76e9f0c0006e8f919e0c515c66dbba3982f785@pause2.develooper.com","name":"root"},"message":"indexer run at 1420054141, pid 32521","distinct":true,"url":"https://api.github.com/repos/batchpause/PAUSE-git/commits/f914295d5506187cb5d5db6a5f7d049e6c3cc508"},{"sha":"6edc4a6f42a7b97a735e12feb7de76d44c3eceb0","author":{"email":"dc76e9f0c0006e8f919e0c515c66dbba3982f785@pause2.develooper.com","name":"root"},"message":"indexer run at 1420055521, pid 6611","distinct":true,"url":"https://api.github.com/repos/batchpause/PAUSE-git/commits/6edc4a6f42a7b97a735e12feb7de76d44c3eceb0"},{"sha":"3d82f7f78b9120ae7212d87b03ef758b03521713","author":{"email":"dc76e9f0c0006e8f919e0c515c66dbba3982f785@pause2.develooper.com","name":"root"},"message":"indexer run at 1420057741, pid 
16831","distinct":true,"url":"https://api.github.com/repos/batchpause/PAUSE-git/commits/3d82f7f78b9120ae7212d87b03ef758b03521713"},{"sha":"1966ca6fb94b2f5a2f3496393844fed222c9539e","author":{"email":"dc76e9f0c0006e8f919e0c515c66dbba3982f785@pause2.develooper.com","name":"root"},"message":"indexer run at 1420059121, pid 23302","distinct":true,"url":"https://api.github.com/repos/batchpause/PAUSE-git/commits/1966ca6fb94b2f5a2f3496393844fed222c9539e"},{"sha":"ddb77db4360f2a0d022f6db25f11a1f200e941b5","author":{"email":"dc76e9f0c0006e8f919e0c515c66dbba3982f785@pause2.develooper.com","name":"root"},"message":"indexer run at 1420060621, pid 30382","distinct":true,"url":"https://api.github.com/repos/batchpause/PAUSE-git/commits/ddb77db4360f2a0d022f6db25f11a1f200e941b5"},{"sha":"9c063587abbc1d241ed2d95baf137018ede84b3a","author":{"email":"dc76e9f0c0006e8f919e0c515c66dbba3982f785@pause2.develooper.com","name":"root"},"message":"indexer run at 1420065661, pid 21556","distinct":true,"url":"https://api.github.com/repos/batchpause/PAUSE-git/commits/9c063587abbc1d241ed2d95baf137018ede84b3a"},{"sha":"e4ce769b39fbf9a0d3c9ad3452759744ee123375","author":{"email":"dc76e9f0c0006e8f919e0c515c66dbba3982f785@pause2.develooper.com","name":"root"},"message":"indexer run at 1420066321, pid 24279","distinct":true,"url":"https://api.github.com/repos/batchpause/PAUSE-git/commits/e4ce769b39fbf9a0d3c9ad3452759744ee123375"},{"sha":"5f7fca1f705bbbec76e25b603aff759186946c3d","author":{"email":"dc76e9f0c0006e8f919e0c515c66dbba3982f785@pause2.develooper.com","name":"root"},"message":"indexer run at 1420067821, pid 31331","distinct":true,"url":"https://api.github.com/repos/batchpause/PAUSE-git/commits/5f7fca1f705bbbec76e25b603aff759186946c3d"},{"sha":"d19321137942b348af0d16c79207c601c19fdeda","author":{"email":"dc76e9f0c0006e8f919e0c515c66dbba3982f785@pause2.develooper.com","name":"root"},"message":"indexer run at 1420071421, pid 
15880","distinct":true,"url":"https://api.github.com/repos/batchpause/PAUSE-git/commits/d19321137942b348af0d16c79207c601c19fdeda"},{"sha":"03e53dd011cc8cc2c7054959bf5be8af53086102","author":{"email":"dc76e9f0c0006e8f919e0c515c66dbba3982f785@pause2.develooper.com","name":"root"},"message":"indexer run at 1420072141, pid 19132","distinct":true,"url":"https://api.github.com/repos/batchpause/PAUSE-git/commits/03e53dd011cc8cc2c7054959bf5be8af53086102"}]},"public":true,"created_at":"2015-01-01T01:03:33Z"}
{"id":"2489397411","type":"PushEvent","actor":{"id":6911419,"login":"himynameisdom","gravatar_id":"","url":"https://api.github.com/users/himynameisdom","avatar_url":"https://avatars.githubusercontent.com/u/6911419?"},"repo":{"id":28657371,"name":"himynameisdom/latte","url":"https://api.github.com/repos/himynameisdom/latte"},"payload":{"push_id":536752935,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"c938cdd2820f9df06645b463b9b239e94f160504","before":"1a6d4186c93cdd68fe4af3ef75ac245c9ba9ee2e","commits":[{"sha":"c938cdd2820f9df06645b463b9b239e94f160504","author":{"email":"8d86c1bc9ce7bebe830a6a6d940e2e017bda9d78@me.com","name":"Dominic Michalec"},"message":"added bootstrap javascript and nav collapse","distinct":true,"url":"https://api.github.com/repos/himynameisdom/latte/commits/c938cdd2820f9df06645b463b9b239e94f160504"}]},"public":true,"created_at":"2015-01-01T01:03:33Z"}
{"id":"2489397412","type":"PushEvent","actor":{"id":5544031,"login":"at1as","gravatar_id":"","url":"https://api.github.com/users/at1as","avatar_url":"https://avatars.githubusercontent.com/u/5544031?"},"repo":{"id":23708117,"name":"at1as/IMDB-Scrape","url":"https://api.github.com/repos/at1as/IMDB-Scrape"},"payload":{"push_id":536752937,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"6e651be941874f6469b13a0e96f4ae7ce7b5e1c4","before":"e47021c22914dab6dd09ed5d700dbf07b31c3462","commits":[{"sha":"6e651be941874f6469b13a0e96f4ae7ce7b5e1c4","author":{"email":"68c46a606457643eab92053c1c05574abb26f861@willems.ca","name":"Jason"},"message":"Search by title string, no link","distinct":true,"url":"https://api.github.com/repos/at1as/IMDB-Scrape/commits/6e651be941874f6469b13a0e96f4ae7ce7b5e1c4"}]},"public":true,"created_at":"2015-01-01T01:03:33Z"}
{"id":"2489397414","type":"WatchEvent","actor":{"id":1865407,"login":"slacktracer","gravatar_id":"","url":"https://api.github.com/users/slacktracer","avatar_url":"https://avatars.githubusercontent.com/u/1865407?"},"repo":{"id":26742634,"name":"auchenberg/chrome-devtools-app","url":"https://api.github.com/repos/auchenberg/chrome-devtools-app"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:03:34Z"}
{"id":"2489397422","type":"PushEvent","actor":{"id":4760248,"login":"hxkclan","gravatar_id":"","url":"https://api.github.com/users/hxkclan","avatar_url":"https://avatars.githubusercontent.com/u/4760248?"},"repo":{"id":28668307,"name":"hxkclan/jade-for-wordpress","url":"https://api.github.com/repos/hxkclan/jade-for-wordpress"},"payload":{"push_id":536752941,"size":9,"distinct_size":9,"ref":"refs/heads/develop","head":"3a45dfdf3aa479fb0f27f66033f22331f04eec58","before":"145fefffb0df917bab1db9838d9e5089c1c24ca6","commits":[{"sha":"30c9c73c6ad9e1425fc140269e186bd8a0340d50","author":{"email":"3212f40cb710c917428034396bc51225b7378866@gmail.com","name":"Michael Boumann"},"message":"add body class from wp","distinct":true,"url":"https://api.github.com/repos/hxkclan/jade-for-wordpress/commits/30c9c73c6ad9e1425fc140269e186bd8a0340d50"},{"sha":"451a600ef7231036ce55eaf1b966031fcf2dabd7","author":{"email":"3212f40cb710c917428034396bc51225b7378866@gmail.com","name":"Michael Boumann"},"message":"fix alignment stuff","distinct":true,"url":"https://api.github.com/repos/hxkclan/jade-for-wordpress/commits/451a600ef7231036ce55eaf1b966031fcf2dabd7"},{"sha":"e8fd1b20152923d0175867c7ec3d2981df4f122b","author":{"email":"3212f40cb710c917428034396bc51225b7378866@gmail.com","name":"Michael Boumann"},"message":"add sidebar + container inside class","distinct":true,"url":"https://api.github.com/repos/hxkclan/jade-for-wordpress/commits/e8fd1b20152923d0175867c7ec3d2981df4f122b"},{"sha":"9deb4be8fca26bab9e71ae32bf83b07e6ad63169","author":{"email":"3212f40cb710c917428034396bc51225b7378866@gmail.com","name":"Michael Boumann"},"message":"added sidebar","distinct":true,"url":"https://api.github.com/repos/hxkclan/jade-for-wordpress/commits/9deb4be8fca26bab9e71ae32bf83b07e6ad63169"},{"sha":"638a2eadaafdba2f2dbd9fbde2a082b5219d98e8","author":{"email":"3212f40cb710c917428034396bc51225b7378866@gmail.com","name":"Michael Boumann"},"message":"added 
sidebar","distinct":true,"url":"https://api.github.com/repos/hxkclan/jade-for-wordpress/commits/638a2eadaafdba2f2dbd9fbde2a082b5219d98e8"},{"sha":"25d67ef22a56b2d7e22ed6ad885ad57416e76914","author":{"email":"3212f40cb710c917428034396bc51225b7378866@gmail.com","name":"Michael Boumann"},"message":"added sidebar to index","distinct":true,"url":"https://api.github.com/repos/hxkclan/jade-for-wordpress/commits/25d67ef22a56b2d7e22ed6ad885ad57416e76914"},{"sha":"0879c07121649e04b0b946c109d8c50cce4f5230","author":{"email":"3212f40cb710c917428034396bc51225b7378866@gmail.com","name":"Michael Boumann"},"message":"seperate edit post and bottom of post","distinct":true,"url":"https://api.github.com/repos/hxkclan/jade-for-wordpress/commits/0879c07121649e04b0b946c109d8c50cce4f5230"},{"sha":"000847605ea5bcda1640d6956a3e79c9924b5b78","author":{"email":"3212f40cb710c917428034396bc51225b7378866@gmail.com","name":"Michael Boumann"},"message":"corrected mistake with sidebar + backtotop","distinct":true,"url":"https://api.github.com/repos/hxkclan/jade-for-wordpress/commits/000847605ea5bcda1640d6956a3e79c9924b5b78"},{"sha":"3a45dfdf3aa479fb0f27f66033f22331f04eec58","author":{"email":"3212f40cb710c917428034396bc51225b7378866@gmail.com","name":"Michael Boumann"},"message":"fix in pages setup","distinct":true,"url":"https://api.github.com/repos/hxkclan/jade-for-wordpress/commits/3a45dfdf3aa479fb0f27f66033f22331f04eec58"}]},"public":true,"created_at":"2015-01-01T01:03:36Z"}
{"id":"2489397425","type":"IssuesEvent","actor":{"id":416564,"login":"johnryan","gravatar_id":"","url":"https://api.github.com/users/johnryan","avatar_url":"https://avatars.githubusercontent.com/u/416564?"},"repo":{"id":9185941,"name":"segmentio/analytics-android","url":"https://api.github.com/repos/segmentio/analytics-android"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/segmentio/analytics-android/issues/153","labels_url":"https://api.github.com/repos/segmentio/analytics-android/issues/153/labels{/name}","comments_url":"https://api.github.com/repos/segmentio/analytics-android/issues/153/comments","events_url":"https://api.github.com/repos/segmentio/analytics-android/issues/153/events","html_url":"https://github.com/segmentio/analytics-android/issues/153","id":53210234,"number":153,"title":"Use different api keys for debug/release","user":{"login":"johnryan","id":416564,"avatar_url":"https://avatars.githubusercontent.com/u/416564?v=3","gravatar_id":"","url":"https://api.github.com/users/johnryan","html_url":"https://github.com/johnryan","followers_url":"https://api.github.com/users/johnryan/followers","following_url":"https://api.github.com/users/johnryan/following{/other_user}","gists_url":"https://api.github.com/users/johnryan/gists{/gist_id}","starred_url":"https://api.github.com/users/johnryan/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/johnryan/subscriptions","organizations_url":"https://api.github.com/users/johnryan/orgs","repos_url":"https://api.github.com/users/johnryan/repos","events_url":"https://api.github.com/users/johnryan/events{/privacy}","received_events_url":"https://api.github.com/users/johnryan/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:03:36Z","updated_at":"2015-01-01T01:03:36Z","closed_at":null,"body":"Is there any way to set a different api key for debug vs 
release? This seems impossible since the key is set from the analytics.xml file."}},"public":true,"created_at":"2015-01-01T01:03:36Z","org":{"id":819518,"login":"segmentio","gravatar_id":"","url":"https://api.github.com/orgs/segmentio","avatar_url":"https://avatars.githubusercontent.com/u/819518?"}}
{"id":"2489397426","type":"IssueCommentEvent","actor":{"id":4275617,"login":"i2amroy","gravatar_id":"","url":"https://api.github.com/users/i2amroy","avatar_url":"https://avatars.githubusercontent.com/u/4275617?"},"repo":{"id":5973855,"name":"CleverRaven/Cataclysm-DDA","url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/issues/10655","labels_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/issues/10655/labels{/name}","comments_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/issues/10655/comments","events_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/issues/10655/events","html_url":"https://github.com/CleverRaven/Cataclysm-DDA/issues/10655","id":52968085,"number":10655,"title":"[WIP] Medical Updates","user":{"login":"DavidKeaton","id":1715605,"avatar_url":"https://avatars.githubusercontent.com/u/1715605?v=3","gravatar_id":"","url":"https://api.github.com/users/DavidKeaton","html_url":"https://github.com/DavidKeaton","followers_url":"https://api.github.com/users/DavidKeaton/followers","following_url":"https://api.github.com/users/DavidKeaton/following{/other_user}","gists_url":"https://api.github.com/users/DavidKeaton/gists{/gist_id}","starred_url":"https://api.github.com/users/DavidKeaton/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/DavidKeaton/subscriptions","organizations_url":"https://api.github.com/users/DavidKeaton/orgs","repos_url":"https://api.github.com/users/DavidKeaton/repos","events_url":"https://api.github.com/users/DavidKeaton/events{/privacy}","received_events_url":"https://api.github.com/users/DavidKeaton/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":14,"created_at":"2014-12-27T23:00:10Z","updated_at":"2015-01-01T01:03:36Z","closed_at":null,"body":"### Intro\r\nOkay, so I closed the 
PR and reopened this as an issue. Some comments on @narc0tiq 's thread about scrapes and bruises sort of gave me some ideas where I want this to go.\r\n(beep boop calling @KA101 because `u r mad dope son`)\r\n\r\nAny and ALL comments welcome!\r\n\r\n### Briefing\r\nMy first notion is to abstract the notion of underlying anatomical 'systems' into a class that can be derived from. In said class, any arbitrary number of arbitrary `groups` of `anatomical_parts` can be together. So if you have 2 legs, 2 hands, 2 arms, a sweet eye patch, a hangover, and no dignity; most of these can theoretically be listed in this class. I have setup the very basics of it, along with a notion of design (a modicum I assure you, not an overzealous person or anything). I plan on migrating to JSON loadable files so these 'parts' and 'groups' can be super *dope* and expanded upon easily. Each `anatomical_part` falls into one or more `anatomical_group`s . These groups I hope to be expandable with the help of either/both Lua or JSON, or black magic I ain't judgin'. \r\n\r\nSo parts fall into groups, groups can provide flags to what these parts do. 
For an example of the slice of my code thus far...\r\n\r\n```\r\nenum anatomical_function {\r\n    // motor functions\r\n    AF_AMBULATION = 0,                          /* orthostasis, ambulating, etc */\r\n    // five senses\r\n    AF_OCULAR,                                  /* sight */\r\n    AF_OLFACTORY,                               /* smell */\r\n    AF_AUDITORY,                                /* hearing */\r\n    AF_GUSTATORY,                               /* taste */\r\n    AF_TACTILE,                                 /* touch */\r\n    // circulatory\r\n    AF_RESPIRATORY,                             /* breathing */\r\n    AF_NEUROVASCULAR,                           /* nervous [+ vascular] system */\r\n    AF_CARDIOVASCULAR,                          /* heart & vascular system */\r\n    // chassis, engine, and driver\r\n    AF_SKELETAL,                                /* bones */\r\n    AF_MUSCULAR,                                /* as it says */\r\n    AF_NEUROLOGICAL,                            /* brain/nervous system */\r\n    // non-humanoid functions\r\n    AF_ANTENNAE,                                /* sensory perception via antennae */\r\n    num_af\r\n};\r\n```\r\n\r\nSo with these `functions` lumped together with both `parts` and `groups`, you could have specific effects or diseases target these systems. \r\n\r\nOR MAYBE I AM OVERTHINKING THE `functions` PART A BIT, I DUNNO, BRAINSTORMING AND STUFF.\r\n\r\nSo what this roundabouts would look like further implemented, is things you have to watch for. Do you want to go into v-tach? *Nah dawg, you don't. So stop sniffing coke son.*\r\n\r\nBeen overdoing the stimulants for a fair amount, and have taken some cardiac damage? *You gun die son.*\r\n\r\nOh man, you have gone and broke that finger. 
*Guess you can't blap blap now.*\r\n\r\nHappen to have cut your fingertip too much with a knife, guess you goin'ta have some scar tissue son, *guess you are.*\r\n\r\nOkay so maybe it won't get _that_ crazy, but I would like a decently dynamic medical system, so it is more than just \"chug vitamins, don't do drugs, use first aid kit, done.\" Broken bones should be a reality before arm health reaches zero, more limbs and appendages should be a thing _anyway_ (hell maybe we could spin that off for mutated `anatomy`)! *GASP SON*\r\n\r\n# EAST COAST\r\n\r\n### TODO\r\n- [ ] Implement `anatomy` for creatures/critters/players/space-monsters/etc.\r\n- [ ] JSONify the `anatomy` aspects a bit, so as to make adding new `parts` and whatnot is legit as hell.\r\n- [ ] Implement new UI to better fit how *baller* this update will be.\r\n- [x] Realize that I am mad baller and fly as hell. Damn you sexy. \r\n- [ ] ~~Play way too much Cataclysm~~ Implement vital signs (BP, MAP, O2%)\r\n\r\n<bountysource-plugin>\r\n\r\n---\r\nWant to back this issue? 
**[Place a bounty on it!](https://www.bountysource.com/issues/7315679-wip-medical-updates?utm_campaign=plugin&utm_content=tracker%2F146201&utm_medium=issues&utm_source=github)** We accept bounties via [Bountysource](https://www.bountysource.com/?utm_campaign=plugin&utm_content=tracker%2F146201&utm_medium=issues&utm_source=github).\r\n</bountysource-plugin>"},"comment":{"url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/issues/comments/68477285","html_url":"https://github.com/CleverRaven/Cataclysm-DDA/issues/10655#issuecomment-68477285","issue_url":"https://api.github.com/repos/CleverRaven/Cataclysm-DDA/issues/10655","id":68477285,"user":{"login":"i2amroy","id":4275617,"avatar_url":"https://avatars.githubusercontent.com/u/4275617?v=3","gravatar_id":"","url":"https://api.github.com/users/i2amroy","html_url":"https://github.com/i2amroy","followers_url":"https://api.github.com/users/i2amroy/followers","following_url":"https://api.github.com/users/i2amroy/following{/other_user}","gists_url":"https://api.github.com/users/i2amroy/gists{/gist_id}","starred_url":"https://api.github.com/users/i2amroy/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/i2amroy/subscriptions","organizations_url":"https://api.github.com/users/i2amroy/orgs","repos_url":"https://api.github.com/users/i2amroy/repos","events_url":"https://api.github.com/users/i2amroy/events{/privacy}","received_events_url":"https://api.github.com/users/i2amroy/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:03:36Z","updated_at":"2015-01-01T01:03:36Z","body":"I think a lot of the feasibility of this design comes down to the nitty-gritty exact implementation level. If it can be implemented in a way that is easy for the players to see, easy for the modders to handle in json, and easy for future developers to understand then I don't see a problem with implementing something like this. 
It just happens that it's a lot of work and a all three of those facts depend on your exact implementation."}},"public":true,"created_at":"2015-01-01T01:03:36Z","org":{"id":4367009,"login":"CleverRaven","gravatar_id":"","url":"https://api.github.com/orgs/CleverRaven","avatar_url":"https://avatars.githubusercontent.com/u/4367009?"}}
{"id":"2489397429","type":"PullRequestEvent","actor":{"id":2961036,"login":"codemercenary","gravatar_id":"","url":"https://api.github.com/users/codemercenary","avatar_url":"https://avatars.githubusercontent.com/u/2961036?"},"repo":{"id":22234733,"name":"leapmotion/autowiring","url":"https://api.github.com/repos/leapmotion/autowiring"},"payload":{"action":"opened","number":314,"pull_request":{"url":"https://api.github.com/repos/leapmotion/autowiring/pulls/314","id":26739436,"html_url":"https://github.com/leapmotion/autowiring/pull/314","diff_url":"https://github.com/leapmotion/autowiring/pull/314.diff","patch_url":"https://github.com/leapmotion/autowiring/pull/314.patch","issue_url":"https://api.github.com/repos/leapmotion/autowiring/issues/314","number":314,"state":"open","locked":false,"title":"Rename boost to autoboost","user":{"login":"codemercenary","id":2961036,"avatar_url":"https://avatars.githubusercontent.com/u/2961036?v=3","gravatar_id":"","url":"https://api.github.com/users/codemercenary","html_url":"https://github.com/codemercenary","followers_url":"https://api.github.com/users/codemercenary/followers","following_url":"https://api.github.com/users/codemercenary/following{/other_user}","gists_url":"https://api.github.com/users/codemercenary/gists{/gist_id}","starred_url":"https://api.github.com/users/codemercenary/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/codemercenary/subscriptions","organizations_url":"https://api.github.com/users/codemercenary/orgs","repos_url":"https://api.github.com/users/codemercenary/repos","events_url":"https://api.github.com/users/codemercenary/events{/privacy}","received_events_url":"https://api.github.com/users/codemercenary/received_events","type":"User","site_admin":false},"body":"Huge modification, requiring adjustements to namespaces, macros, file names, and header guards.  
This change introduces a private version of Boost 1.57.0 that can be linked externally on platforms which do not have full STL11 support without colliding in any way with those platforms' independent use of boost.","created_at":"2015-01-01T01:03:37Z","updated_at":"2015-01-01T01:03:37Z","closed_at":null,"merged_at":null,"merge_commit_sha":null,"assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/leapmotion/autowiring/pulls/314/commits","review_comments_url":"https://api.github.com/repos/leapmotion/autowiring/pulls/314/comments","review_comment_url":"https://api.github.com/repos/leapmotion/autowiring/pulls/comments/{number}","comments_url":"https://api.github.com/repos/leapmotion/autowiring/issues/314/comments","statuses_url":"https://api.github.com/repos/leapmotion/autowiring/statuses/3f0c9d9becf969aab74c7b4fe222854a6eebe58b","head":{"label":"leapmotion:fix-autoboost","ref":"fix-autoboost","sha":"3f0c9d9becf969aab74c7b4fe222854a6eebe58b","user":{"login":"leapmotion","id":2242710,"avatar_url":"https://avatars.githubusercontent.com/u/2242710?v=3","gravatar_id":"","url":"https://api.github.com/users/leapmotion","html_url":"https://github.com/leapmotion","followers_url":"https://api.github.com/users/leapmotion/followers","following_url":"https://api.github.com/users/leapmotion/following{/other_user}","gists_url":"https://api.github.com/users/leapmotion/gists{/gist_id}","starred_url":"https://api.github.com/users/leapmotion/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/leapmotion/subscriptions","organizations_url":"https://api.github.com/users/leapmotion/orgs","repos_url":"https://api.github.com/users/leapmotion/repos","events_url":"https://api.github.com/users/leapmotion/events{/privacy}","received_events_url":"https://api.github.com/users/leapmotion/received_events","type":"Organization","site_admin":false},"repo":{"id":22234733,"name":"autowiring","full_name":"leapmotion/autowiring","owner":{"login":"leapmotion","id":
2242710,"avatar_url":"https://avatars.githubusercontent.com/u/2242710?v=3","gravatar_id":"","url":"https://api.github.com/users/leapmotion","html_url":"https://github.com/leapmotion","followers_url":"https://api.github.com/users/leapmotion/followers","following_url":"https://api.github.com/users/leapmotion/following{/other_user}","gists_url":"https://api.github.com/users/leapmotion/gists{/gist_id}","starred_url":"https://api.github.com/users/leapmotion/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/leapmotion/subscriptions","organizations_url":"https://api.github.com/users/leapmotion/orgs","repos_url":"https://api.github.com/users/leapmotion/repos","events_url":"https://api.github.com/users/leapmotion/events{/privacy}","received_events_url":"https://api.github.com/users/leapmotion/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/leapmotion/autowiring","description":"A C++ Inversion of Control Framework","fork":false,"url":"https://api.github.com/repos/leapmotion/autowiring","forks_url":"https://api.github.com/repos/leapmotion/autowiring/forks","keys_url":"https://api.github.com/repos/leapmotion/autowiring/keys{/key_id}","collaborators_url":"https://api.github.com/repos/leapmotion/autowiring/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/leapmotion/autowiring/teams","hooks_url":"https://api.github.com/repos/leapmotion/autowiring/hooks","issue_events_url":"https://api.github.com/repos/leapmotion/autowiring/issues/events{/number}","events_url":"https://api.github.com/repos/leapmotion/autowiring/events","assignees_url":"https://api.github.com/repos/leapmotion/autowiring/assignees{/user}","branches_url":"https://api.github.com/repos/leapmotion/autowiring/branches{/branch}","tags_url":"https://api.github.com/repos/leapmotion/autowiring/tags","blobs_url":"https://api.github.com/repos/leapmotion/autowiring/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos
/leapmotion/autowiring/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/leapmotion/autowiring/git/refs{/sha}","trees_url":"https://api.github.com/repos/leapmotion/autowiring/git/trees{/sha}","statuses_url":"https://api.github.com/repos/leapmotion/autowiring/statuses/{sha}","languages_url":"https://api.github.com/repos/leapmotion/autowiring/languages","stargazers_url":"https://api.github.com/repos/leapmotion/autowiring/stargazers","contributors_url":"https://api.github.com/repos/leapmotion/autowiring/contributors","subscribers_url":"https://api.github.com/repos/leapmotion/autowiring/subscribers","subscription_url":"https://api.github.com/repos/leapmotion/autowiring/subscription","commits_url":"https://api.github.com/repos/leapmotion/autowiring/commits{/sha}","git_commits_url":"https://api.github.com/repos/leapmotion/autowiring/git/commits{/sha}","comments_url":"https://api.github.com/repos/leapmotion/autowiring/comments{/number}","issue_comment_url":"https://api.github.com/repos/leapmotion/autowiring/issues/comments/{number}","contents_url":"https://api.github.com/repos/leapmotion/autowiring/contents/{+path}","compare_url":"https://api.github.com/repos/leapmotion/autowiring/compare/{base}...{head}","merges_url":"https://api.github.com/repos/leapmotion/autowiring/merges","archive_url":"https://api.github.com/repos/leapmotion/autowiring/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/leapmotion/autowiring/downloads","issues_url":"https://api.github.com/repos/leapmotion/autowiring/issues{/number}","pulls_url":"https://api.github.com/repos/leapmotion/autowiring/pulls{/number}","milestones_url":"https://api.github.com/repos/leapmotion/autowiring/milestones{/number}","notifications_url":"https://api.github.com/repos/leapmotion/autowiring/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/leapmotion/autowiring/labels{/name}","releases_url":"https://api.github.com/repos/leapmotion/autowiring/releases{/id}","c
reated_at":"2014-07-24T22:39:49Z","updated_at":"2014-12-30T23:40:39Z","pushed_at":"2015-01-01T01:03:20Z","git_url":"git://github.com/leapmotion/autowiring.git","ssh_url":"git@github.com:leapmotion/autowiring.git","clone_url":"https://github.com/leapmotion/autowiring.git","svn_url":"https://github.com/leapmotion/autowiring","homepage":"http://autowiring.io/","size":27882,"stargazers_count":68,"watchers_count":68,"language":"C++","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":7,"mirror_url":null,"open_issues_count":2,"forks":7,"open_issues":2,"watchers":68,"default_branch":"develop"}},"base":{"label":"leapmotion:develop","ref":"develop","sha":"72c45ac5ebe38bb3581a26ebd6600b3769e6022c","user":{"login":"leapmotion","id":2242710,"avatar_url":"https://avatars.githubusercontent.com/u/2242710?v=3","gravatar_id":"","url":"https://api.github.com/users/leapmotion","html_url":"https://github.com/leapmotion","followers_url":"https://api.github.com/users/leapmotion/followers","following_url":"https://api.github.com/users/leapmotion/following{/other_user}","gists_url":"https://api.github.com/users/leapmotion/gists{/gist_id}","starred_url":"https://api.github.com/users/leapmotion/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/leapmotion/subscriptions","organizations_url":"https://api.github.com/users/leapmotion/orgs","repos_url":"https://api.github.com/users/leapmotion/repos","events_url":"https://api.github.com/users/leapmotion/events{/privacy}","received_events_url":"https://api.github.com/users/leapmotion/received_events","type":"Organization","site_admin":false},"repo":{"id":22234733,"name":"autowiring","full_name":"leapmotion/autowiring","owner":{"login":"leapmotion","id":2242710,"avatar_url":"https://avatars.githubusercontent.com/u/2242710?v=3","gravatar_id":"","url":"https://api.github.com/users/leapmotion","html_url":"https://github.com/leapmotion","followers_url":"https://api.github.com/users/leapmotion/foll
owers","following_url":"https://api.github.com/users/leapmotion/following{/other_user}","gists_url":"https://api.github.com/users/leapmotion/gists{/gist_id}","starred_url":"https://api.github.com/users/leapmotion/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/leapmotion/subscriptions","organizations_url":"https://api.github.com/users/leapmotion/orgs","repos_url":"https://api.github.com/users/leapmotion/repos","events_url":"https://api.github.com/users/leapmotion/events{/privacy}","received_events_url":"https://api.github.com/users/leapmotion/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/leapmotion/autowiring","description":"A C++ Inversion of Control Framework","fork":false,"url":"https://api.github.com/repos/leapmotion/autowiring","forks_url":"https://api.github.com/repos/leapmotion/autowiring/forks","keys_url":"https://api.github.com/repos/leapmotion/autowiring/keys{/key_id}","collaborators_url":"https://api.github.com/repos/leapmotion/autowiring/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/leapmotion/autowiring/teams","hooks_url":"https://api.github.com/repos/leapmotion/autowiring/hooks","issue_events_url":"https://api.github.com/repos/leapmotion/autowiring/issues/events{/number}","events_url":"https://api.github.com/repos/leapmotion/autowiring/events","assignees_url":"https://api.github.com/repos/leapmotion/autowiring/assignees{/user}","branches_url":"https://api.github.com/repos/leapmotion/autowiring/branches{/branch}","tags_url":"https://api.github.com/repos/leapmotion/autowiring/tags","blobs_url":"https://api.github.com/repos/leapmotion/autowiring/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/leapmotion/autowiring/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/leapmotion/autowiring/git/refs{/sha}","trees_url":"https://api.github.com/repos/leapmotion/autowiring/git/trees{/sha}","statuses_url":"https://api.github.com/re
pos/leapmotion/autowiring/statuses/{sha}","languages_url":"https://api.github.com/repos/leapmotion/autowiring/languages","stargazers_url":"https://api.github.com/repos/leapmotion/autowiring/stargazers","contributors_url":"https://api.github.com/repos/leapmotion/autowiring/contributors","subscribers_url":"https://api.github.com/repos/leapmotion/autowiring/subscribers","subscription_url":"https://api.github.com/repos/leapmotion/autowiring/subscription","commits_url":"https://api.github.com/repos/leapmotion/autowiring/commits{/sha}","git_commits_url":"https://api.github.com/repos/leapmotion/autowiring/git/commits{/sha}","comments_url":"https://api.github.com/repos/leapmotion/autowiring/comments{/number}","issue_comment_url":"https://api.github.com/repos/leapmotion/autowiring/issues/comments/{number}","contents_url":"https://api.github.com/repos/leapmotion/autowiring/contents/{+path}","compare_url":"https://api.github.com/repos/leapmotion/autowiring/compare/{base}...{head}","merges_url":"https://api.github.com/repos/leapmotion/autowiring/merges","archive_url":"https://api.github.com/repos/leapmotion/autowiring/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/leapmotion/autowiring/downloads","issues_url":"https://api.github.com/repos/leapmotion/autowiring/issues{/number}","pulls_url":"https://api.github.com/repos/leapmotion/autowiring/pulls{/number}","milestones_url":"https://api.github.com/repos/leapmotion/autowiring/milestones{/number}","notifications_url":"https://api.github.com/repos/leapmotion/autowiring/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/leapmotion/autowiring/labels{/name}","releases_url":"https://api.github.com/repos/leapmotion/autowiring/releases{/id}","created_at":"2014-07-24T22:39:49Z","updated_at":"2014-12-30T23:40:39Z","pushed_at":"2015-01-01T01:03:20Z","git_url":"git://github.com/leapmotion/autowiring.git","ssh_url":"git@github.com:leapmotion/autowiring.git","clone_url":"https://github.com
/leapmotion/autowiring.git","svn_url":"https://github.com/leapmotion/autowiring","homepage":"http://autowiring.io/","size":27882,"stargazers_count":68,"watchers_count":68,"language":"C++","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":7,"mirror_url":null,"open_issues_count":2,"forks":7,"open_issues":2,"watchers":68,"default_branch":"develop"}},"_links":{"self":{"href":"https://api.github.com/repos/leapmotion/autowiring/pulls/314"},"html":{"href":"https://github.com/leapmotion/autowiring/pull/314"},"issue":{"href":"https://api.github.com/repos/leapmotion/autowiring/issues/314"},"comments":{"href":"https://api.github.com/repos/leapmotion/autowiring/issues/314/comments"},"review_comments":{"href":"https://api.github.com/repos/leapmotion/autowiring/pulls/314/comments"},"review_comment":{"href":"https://api.github.com/repos/leapmotion/autowiring/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/leapmotion/autowiring/pulls/314/commits"},"statuses":{"href":"https://api.github.com/repos/leapmotion/autowiring/statuses/3f0c9d9becf969aab74c7b4fe222854a6eebe58b"}},"merged":false,"mergeable":null,"mergeable_state":"unknown","merged_by":null,"comments":0,"review_comments":0,"commits":1,"additions":29030,"deletions":145,"changed_files":6453}},"public":true,"created_at":"2015-01-01T01:03:37Z","org":{"id":2242710,"login":"leapmotion","gravatar_id":"","url":"https://api.github.com/orgs/leapmotion","avatar_url":"https://avatars.githubusercontent.com/u/2242710?"}}
{"id":"2489397434","type":"PushEvent","actor":{"id":979046,"login":"pippijn","gravatar_id":"","url":"https://api.github.com/users/pippijn","avatar_url":"https://avatars.githubusercontent.com/u/979046?"},"repo":{"id":27788257,"name":"pippijn/tox4j","url":"https://api.github.com/repos/pippijn/tox4j"},"payload":{"push_id":536752943,"size":3,"distinct_size":3,"ref":"refs/heads/master","head":"e6e54153e3d800e5f6c7972f9dfa78a17efe76d5","before":"48e0b41044a58a4f896d07ad29e65e1ac63e6010","commits":[{"sha":"8d429c6a4ef8d5596c660fb307a58d9904486149","author":{"email":"7113361f3b566fbf12c30d00f1a3671d2dbf9616@gmail.com","name":"Pippijn van Steenhoven"},"message":"Generate more cmake code => less redundancy.","distinct":true,"url":"https://api.github.com/repos/pippijn/tox4j/commits/8d429c6a4ef8d5596c660fb307a58d9904486149"},{"sha":"388e614c9032e14462f9e1fe77fab86310c2c1e6","author":{"email":"7113361f3b566fbf12c30d00f1a3671d2dbf9616@gmail.com","name":"Pippijn van Steenhoven"},"message":"Added tool to update tox4j version to current toxcore version.","distinct":true,"url":"https://api.github.com/repos/pippijn/tox4j/commits/388e614c9032e14462f9e1fe77fab86310c2c1e6"},{"sha":"e6e54153e3d800e5f6c7972f9dfa78a17efe76d5","author":{"email":"7113361f3b566fbf12c30d00f1a3671d2dbf9616@gmail.com","name":"Pippijn van Steenhoven"},"message":"Give RepeatedLanDiscoveryTest a correct main() signature.","distinct":true,"url":"https://api.github.com/repos/pippijn/tox4j/commits/e6e54153e3d800e5f6c7972f9dfa78a17efe76d5"}]},"public":true,"created_at":"2015-01-01T01:03:37Z"}
{"id":"2489397436","type":"PushEvent","actor":{"id":10225575,"login":"ExclusiveOrange","gravatar_id":"","url":"https://api.github.com/users/ExclusiveOrange","avatar_url":"https://avatars.githubusercontent.com/u/10225575?"},"repo":{"id":28677579,"name":"ExclusiveOrange/synthesizer","url":"https://api.github.com/repos/ExclusiveOrange/synthesizer"},"payload":{"push_id":536752944,"size":0,"distinct_size":0,"ref":"refs/heads/master","head":"0e64036d5ac0d9c24b4cbe39bb778570db49caba","before":"0e64036d5ac0d9c24b4cbe39bb778570db49caba","commits":[]},"public":true,"created_at":"2015-01-01T01:03:37Z"}
{"id":"2489397439","type":"PullRequestEvent","actor":{"id":8562199,"login":"sguan-actuate","gravatar_id":"","url":"https://api.github.com/users/sguan-actuate","avatar_url":"https://avatars.githubusercontent.com/u/8562199?"},"repo":{"id":19821157,"name":"eclipse/birt","url":"https://api.github.com/repos/eclipse/birt"},"payload":{"action":"opened","number":70,"pull_request":{"url":"https://api.github.com/repos/eclipse/birt/pulls/70","id":26739437,"html_url":"https://github.com/eclipse/birt/pull/70","diff_url":"https://github.com/eclipse/birt/pull/70.diff","patch_url":"https://github.com/eclipse/birt/pull/70.patch","issue_url":"https://api.github.com/repos/eclipse/birt/issues/70","number":70,"state":"open","locked":false,"title":"Internal refactor apis and document code","user":{"login":"sguan-actuate","id":8562199,"avatar_url":"https://avatars.githubusercontent.com/u/8562199?v=3","gravatar_id":"","url":"https://api.github.com/users/sguan-actuate","html_url":"https://github.com/sguan-actuate","followers_url":"https://api.github.com/users/sguan-actuate/followers","following_url":"https://api.github.com/users/sguan-actuate/following{/other_user}","gists_url":"https://api.github.com/users/sguan-actuate/gists{/gist_id}","starred_url":"https://api.github.com/users/sguan-actuate/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/sguan-actuate/subscriptions","organizations_url":"https://api.github.com/users/sguan-actuate/orgs","repos_url":"https://api.github.com/users/sguan-actuate/repos","events_url":"https://api.github.com/users/sguan-actuate/events{/privacy}","received_events_url":"https://api.github.com/users/sguan-actuate/received_events","type":"User","site_admin":false},"body":"Internal refactor apis to avoid IQueryDefinition.setAutoBinding \r\nand comment on code\r\n\r\nSigned-off-by: sguan 
<sguan@actuate.com>","created_at":"2015-01-01T01:03:38Z","updated_at":"2015-01-01T01:03:38Z","closed_at":null,"merged_at":null,"merge_commit_sha":null,"assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/eclipse/birt/pulls/70/commits","review_comments_url":"https://api.github.com/repos/eclipse/birt/pulls/70/comments","review_comment_url":"https://api.github.com/repos/eclipse/birt/pulls/comments/{number}","comments_url":"https://api.github.com/repos/eclipse/birt/issues/70/comments","statuses_url":"https://api.github.com/repos/eclipse/birt/statuses/7efab4d3fe077789a3e65be0fcd80a6078557360","head":{"label":"sguan-actuate:master","ref":"master","sha":"7efab4d3fe077789a3e65be0fcd80a6078557360","user":{"login":"sguan-actuate","id":8562199,"avatar_url":"https://avatars.githubusercontent.com/u/8562199?v=3","gravatar_id":"","url":"https://api.github.com/users/sguan-actuate","html_url":"https://github.com/sguan-actuate","followers_url":"https://api.github.com/users/sguan-actuate/followers","following_url":"https://api.github.com/users/sguan-actuate/following{/other_user}","gists_url":"https://api.github.com/users/sguan-actuate/gists{/gist_id}","starred_url":"https://api.github.com/users/sguan-actuate/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/sguan-actuate/subscriptions","organizations_url":"https://api.github.com/users/sguan-actuate/orgs","repos_url":"https://api.github.com/users/sguan-actuate/repos","events_url":"https://api.github.com/users/sguan-actuate/events{/privacy}","received_events_url":"https://api.github.com/users/sguan-actuate/received_events","type":"User","site_admin":false},"repo":{"id":28415488,"name":"birt","full_name":"sguan-actuate/birt","owner":{"login":"sguan-actuate","id":8562199,"avatar_url":"https://avatars.githubusercontent.com/u/8562199?v=3","gravatar_id":"","url":"https://api.github.com/users/sguan-actuate","html_url":"https://github.com/sguan-actuate","followers_url":"https://api.github.com/us
ers/sguan-actuate/followers","following_url":"https://api.github.com/users/sguan-actuate/following{/other_user}","gists_url":"https://api.github.com/users/sguan-actuate/gists{/gist_id}","starred_url":"https://api.github.com/users/sguan-actuate/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/sguan-actuate/subscriptions","organizations_url":"https://api.github.com/users/sguan-actuate/orgs","repos_url":"https://api.github.com/users/sguan-actuate/repos","events_url":"https://api.github.com/users/sguan-actuate/events{/privacy}","received_events_url":"https://api.github.com/users/sguan-actuate/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/sguan-actuate/birt","description":"The open source Eclipse BIRT reporting and data visualization project. ","fork":true,"url":"https://api.github.com/repos/sguan-actuate/birt","forks_url":"https://api.github.com/repos/sguan-actuate/birt/forks","keys_url":"https://api.github.com/repos/sguan-actuate/birt/keys{/key_id}","collaborators_url":"https://api.github.com/repos/sguan-actuate/birt/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/sguan-actuate/birt/teams","hooks_url":"https://api.github.com/repos/sguan-actuate/birt/hooks","issue_events_url":"https://api.github.com/repos/sguan-actuate/birt/issues/events{/number}","events_url":"https://api.github.com/repos/sguan-actuate/birt/events","assignees_url":"https://api.github.com/repos/sguan-actuate/birt/assignees{/user}","branches_url":"https://api.github.com/repos/sguan-actuate/birt/branches{/branch}","tags_url":"https://api.github.com/repos/sguan-actuate/birt/tags","blobs_url":"https://api.github.com/repos/sguan-actuate/birt/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/sguan-actuate/birt/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/sguan-actuate/birt/git/refs{/sha}","trees_url":"https://api.github.com/repos/sguan-actuate/birt/git/trees{/sha}","statuses_url":"h
ttps://api.github.com/repos/sguan-actuate/birt/statuses/{sha}","languages_url":"https://api.github.com/repos/sguan-actuate/birt/languages","stargazers_url":"https://api.github.com/repos/sguan-actuate/birt/stargazers","contributors_url":"https://api.github.com/repos/sguan-actuate/birt/contributors","subscribers_url":"https://api.github.com/repos/sguan-actuate/birt/subscribers","subscription_url":"https://api.github.com/repos/sguan-actuate/birt/subscription","commits_url":"https://api.github.com/repos/sguan-actuate/birt/commits{/sha}","git_commits_url":"https://api.github.com/repos/sguan-actuate/birt/git/commits{/sha}","comments_url":"https://api.github.com/repos/sguan-actuate/birt/comments{/number}","issue_comment_url":"https://api.github.com/repos/sguan-actuate/birt/issues/comments/{number}","contents_url":"https://api.github.com/repos/sguan-actuate/birt/contents/{+path}","compare_url":"https://api.github.com/repos/sguan-actuate/birt/compare/{base}...{head}","merges_url":"https://api.github.com/repos/sguan-actuate/birt/merges","archive_url":"https://api.github.com/repos/sguan-actuate/birt/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/sguan-actuate/birt/downloads","issues_url":"https://api.github.com/repos/sguan-actuate/birt/issues{/number}","pulls_url":"https://api.github.com/repos/sguan-actuate/birt/pulls{/number}","milestones_url":"https://api.github.com/repos/sguan-actuate/birt/milestones{/number}","notifications_url":"https://api.github.com/repos/sguan-actuate/birt/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/sguan-actuate/birt/labels{/name}","releases_url":"https://api.github.com/repos/sguan-actuate/birt/releases{/id}","created_at":"2014-12-23T19:25:25Z","updated_at":"2015-01-01T00:23:05Z","pushed_at":"2015-01-01T00:23:05Z","git_url":"git://github.com/sguan-actuate/birt.git","ssh_url":"git@github.com:sguan-actuate/birt.git","clone_url":"https://github.com/sguan-actuate/birt.git","svn_url":"https://g
ithub.com/sguan-actuate/birt","homepage":"http://www.eclipse.org/birt","size":171178,"stargazers_count":0,"watchers_count":0,"language":"Java","has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"eclipse:master","ref":"master","sha":"9e12f3e628b2b0657a557bbeda71fa13337cdfe2","user":{"login":"eclipse","id":56974,"avatar_url":"https://avatars.githubusercontent.com/u/56974?v=3","gravatar_id":"","url":"https://api.github.com/users/eclipse","html_url":"https://github.com/eclipse","followers_url":"https://api.github.com/users/eclipse/followers","following_url":"https://api.github.com/users/eclipse/following{/other_user}","gists_url":"https://api.github.com/users/eclipse/gists{/gist_id}","starred_url":"https://api.github.com/users/eclipse/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/eclipse/subscriptions","organizations_url":"https://api.github.com/users/eclipse/orgs","repos_url":"https://api.github.com/users/eclipse/repos","events_url":"https://api.github.com/users/eclipse/events{/privacy}","received_events_url":"https://api.github.com/users/eclipse/received_events","type":"Organization","site_admin":false},"repo":{"id":19821157,"name":"birt","full_name":"eclipse/birt","owner":{"login":"eclipse","id":56974,"avatar_url":"https://avatars.githubusercontent.com/u/56974?v=3","gravatar_id":"","url":"https://api.github.com/users/eclipse","html_url":"https://github.com/eclipse","followers_url":"https://api.github.com/users/eclipse/followers","following_url":"https://api.github.com/users/eclipse/following{/other_user}","gists_url":"https://api.github.com/users/eclipse/gists{/gist_id}","starred_url":"https://api.github.com/users/eclipse/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/eclipse/subscriptions","organizations_url":"https://api.github.com/users/eclipse/orgs"
,"repos_url":"https://api.github.com/users/eclipse/repos","events_url":"https://api.github.com/users/eclipse/events{/privacy}","received_events_url":"https://api.github.com/users/eclipse/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/eclipse/birt","description":"The open source Eclipse BIRT reporting and data visualization project. ","fork":false,"url":"https://api.github.com/repos/eclipse/birt","forks_url":"https://api.github.com/repos/eclipse/birt/forks","keys_url":"https://api.github.com/repos/eclipse/birt/keys{/key_id}","collaborators_url":"https://api.github.com/repos/eclipse/birt/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/eclipse/birt/teams","hooks_url":"https://api.github.com/repos/eclipse/birt/hooks","issue_events_url":"https://api.github.com/repos/eclipse/birt/issues/events{/number}","events_url":"https://api.github.com/repos/eclipse/birt/events","assignees_url":"https://api.github.com/repos/eclipse/birt/assignees{/user}","branches_url":"https://api.github.com/repos/eclipse/birt/branches{/branch}","tags_url":"https://api.github.com/repos/eclipse/birt/tags","blobs_url":"https://api.github.com/repos/eclipse/birt/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/eclipse/birt/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/eclipse/birt/git/refs{/sha}","trees_url":"https://api.github.com/repos/eclipse/birt/git/trees{/sha}","statuses_url":"https://api.github.com/repos/eclipse/birt/statuses/{sha}","languages_url":"https://api.github.com/repos/eclipse/birt/languages","stargazers_url":"https://api.github.com/repos/eclipse/birt/stargazers","contributors_url":"https://api.github.com/repos/eclipse/birt/contributors","subscribers_url":"https://api.github.com/repos/eclipse/birt/subscribers","subscription_url":"https://api.github.com/repos/eclipse/birt/subscription","commits_url":"https://api.github.com/repos/eclipse/birt/commits{/sha}","git_commits_url":"https
://api.github.com/repos/eclipse/birt/git/commits{/sha}","comments_url":"https://api.github.com/repos/eclipse/birt/comments{/number}","issue_comment_url":"https://api.github.com/repos/eclipse/birt/issues/comments/{number}","contents_url":"https://api.github.com/repos/eclipse/birt/contents/{+path}","compare_url":"https://api.github.com/repos/eclipse/birt/compare/{base}...{head}","merges_url":"https://api.github.com/repos/eclipse/birt/merges","archive_url":"https://api.github.com/repos/eclipse/birt/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/eclipse/birt/downloads","issues_url":"https://api.github.com/repos/eclipse/birt/issues{/number}","pulls_url":"https://api.github.com/repos/eclipse/birt/pulls{/number}","milestones_url":"https://api.github.com/repos/eclipse/birt/milestones{/number}","notifications_url":"https://api.github.com/repos/eclipse/birt/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/eclipse/birt/labels{/name}","releases_url":"https://api.github.com/repos/eclipse/birt/releases{/id}","created_at":"2014-05-15T13:55:31Z","updated_at":"2015-01-01T00:31:05Z","pushed_at":"2015-01-01T00:31:05Z","git_url":"git://github.com/eclipse/birt.git","ssh_url":"git@github.com:eclipse/birt.git","clone_url":"https://github.com/eclipse/birt.git","svn_url":"https://github.com/eclipse/birt","homepage":"http://www.eclipse.org/birt","size":939311,"stargazers_count":8,"watchers_count":8,"language":"Java","has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":20,"mirror_url":null,"open_issues_count":1,"forks":20,"open_issues":1,"watchers":8,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/eclipse/birt/pulls/70"},"html":{"href":"https://github.com/eclipse/birt/pull/70"},"issue":{"href":"https://api.github.com/repos/eclipse/birt/issues/70"},"comments":{"href":"https://api.github.com/repos/eclipse/birt/issues/70/comments"},"review_comments":{"href":"https://ap
i.github.com/repos/eclipse/birt/pulls/70/comments"},"review_comment":{"href":"https://api.github.com/repos/eclipse/birt/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/eclipse/birt/pulls/70/commits"},"statuses":{"href":"https://api.github.com/repos/eclipse/birt/statuses/7efab4d3fe077789a3e65be0fcd80a6078557360"}},"merged":false,"mergeable":null,"mergeable_state":"unknown","merged_by":null,"comments":0,"review_comments":0,"commits":2,"additions":59,"deletions":14,"changed_files":4}},"public":true,"created_at":"2015-01-01T01:03:38Z","org":{"id":56974,"login":"eclipse","gravatar_id":"","url":"https://api.github.com/orgs/eclipse","avatar_url":"https://avatars.githubusercontent.com/u/56974?"}}
{"id":"2489397442","type":"CreateEvent","actor":{"id":1398544,"login":"joelpurra","gravatar_id":"","url":"https://api.github.com/users/joelpurra","avatar_url":"https://avatars.githubusercontent.com/u/1398544?"},"repo":{"id":28595466,"name":"joelpurra/jqnpm","url":"https://api.github.com/repos/joelpurra/jqnpm"},"payload":{"ref":"import_659","ref_type":"branch","master_branch":"master","description":"A package manager built for jq as an example implementation.","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:03:38Z"}
{"id":"2489397443","type":"PushEvent","actor":{"id":10350323,"login":"nik7273","gravatar_id":"","url":"https://api.github.com/users/nik7273","avatar_url":"https://avatars.githubusercontent.com/u/10350323?"},"repo":{"id":28635375,"name":"nik7273/wikipedia-access-thru-API","url":"https://api.github.com/repos/nik7273/wikipedia-access-thru-API"},"payload":{"push_id":536752948,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"6adff88c4820e3e820c949eebb7ed57521cb5e26","before":"ce036d56a80edcb460c0c2c71d4c410f2709ded8","commits":[{"sha":"6adff88c4820e3e820c949eebb7ed57521cb5e26","author":{"email":"40527771d623df543fb2bc588362a230688f2063@gmail.com","name":"nik7273"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/nik7273/wikipedia-access-thru-API/commits/6adff88c4820e3e820c949eebb7ed57521cb5e26"}]},"public":true,"created_at":"2015-01-01T01:03:38Z"}
{"id":"2489397445","type":"IssueCommentEvent","actor":{"id":1693373,"login":"puhley","gravatar_id":"","url":"https://api.github.com/users/puhley","avatar_url":"https://avatars.githubusercontent.com/u/1693373?"},"repo":{"id":18814466,"name":"crits/crits","url":"https://api.github.com/repos/crits/crits"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/crits/crits/issues/333","labels_url":"https://api.github.com/repos/crits/crits/issues/333/labels{/name}","comments_url":"https://api.github.com/repos/crits/crits/issues/333/comments","events_url":"https://api.github.com/repos/crits/crits/issues/333/events","html_url":"https://github.com/crits/crits/pull/333","id":50806180,"number":333,"title":"API delete support for domains and IPs","user":{"login":"puhley","id":1693373,"avatar_url":"https://avatars.githubusercontent.com/u/1693373?v=3","gravatar_id":"","url":"https://api.github.com/users/puhley","html_url":"https://github.com/puhley","followers_url":"https://api.github.com/users/puhley/followers","following_url":"https://api.github.com/users/puhley/following{/other_user}","gists_url":"https://api.github.com/users/puhley/gists{/gist_id}","starred_url":"https://api.github.com/users/puhley/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/puhley/subscriptions","organizations_url":"https://api.github.com/users/puhley/orgs","repos_url":"https://api.github.com/users/puhley/repos","events_url":"https://api.github.com/users/puhley/events{/privacy}","received_events_url":"https://api.github.com/users/puhley/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":8,"created_at":"2014-12-03T09:10:11Z","updated_at":"2015-01-01T01:03:38Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/crits/crits/pulls/333","html_url":"https://github.com/crits/crits/pull/333","diff_url":"https://github.com/crits/crits/pull/333.diff","patch_url":"htt
ps://github.com/crits/crits/pull/333.patch"},"body":"This is a rough draft of code that will enable delete support for the IP and domain APIs. Since an IP or domain can be associated with multiple sources and campaigns, this approach allows you to delete an individual reference or to delete the entire record. If you provide a campaign and source along with the record ID, then this will just delete the references to that campaign and source. If you only provide the record ID, then it will delete the entire record.\r\n\r\nThe code for delete support in the domain API is a little complicated. The django-tastypie-mongoengine won't accept a DELETE request with parameters passed in the body of the request. Therefore, the DELETE request must pass the parameters in the URL. However, in order to pass the request to the generate_domain_jtable, the request must be converted into a POST format. Since I didn't know the jtable code well enough to reformat it, I got around the issue by creating a fake POST object and passing that instead. This isn't the most elegant solution but it allowed me to contain the changes to the API code.\r\n\r\nBeing able to delete an IP or API reference would be useful for people who want to use CRITs to track only the current list of threats. For instance, IPs are sometimes removed from IOC lists because the compromised host has been fixed. These changes would allow you to remove the IP from the current list of threats via the API. This code still requires the user to have admin privileges in order to perform the deletion.\r\n\r\nPlease take a look at the code and let me know your thoughts. 
"},"comment":{"url":"https://api.github.com/repos/crits/crits/issues/comments/68477286","html_url":"https://github.com/crits/crits/pull/333#issuecomment-68477286","issue_url":"https://api.github.com/repos/crits/crits/issues/333","id":68477286,"user":{"login":"puhley","id":1693373,"avatar_url":"https://avatars.githubusercontent.com/u/1693373?v=3","gravatar_id":"","url":"https://api.github.com/users/puhley","html_url":"https://github.com/puhley","followers_url":"https://api.github.com/users/puhley/followers","following_url":"https://api.github.com/users/puhley/following{/other_user}","gists_url":"https://api.github.com/users/puhley/gists{/gist_id}","starred_url":"https://api.github.com/users/puhley/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/puhley/subscriptions","organizations_url":"https://api.github.com/users/puhley/orgs","repos_url":"https://api.github.com/users/puhley/repos","events_url":"https://api.github.com/users/puhley/events{/privacy}","received_events_url":"https://api.github.com/users/puhley/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:03:38Z","updated_at":"2015-01-01T01:03:38Z","body":"* I changed the logic from “removing the campaign from the domain” to “removing a domain from the campaign”. This eliminates the redundant campaign removal logic for each TLO. The new code will allow you to remove any type of object from a campaign.\r\n* I added the ability to delete a campaign. I saw that functionality requested in one of the threads.\r\n* All of the TLOs used jtable_ajax_delete. 
Therefore, I split jtable_ajax_delete into 2 functions so that both the UI (via jtable_ajax_delete -> delete_id) and the API (via a direct call to delete_id) could reference the same deletion code for ObjectIds.\r\n* I added validate_objectid to the mongo_tools library to centralize validation code for ObjectIds."}},"public":true,"created_at":"2015-01-01T01:03:39Z","org":{"id":5392624,"login":"crits","gravatar_id":"","url":"https://api.github.com/orgs/crits","avatar_url":"https://avatars.githubusercontent.com/u/5392624?"}}
{"id":"2489397449","type":"PushEvent","actor":{"id":6267945,"login":"lakotadlustig","gravatar_id":"","url":"https://api.github.com/users/lakotadlustig","avatar_url":"https://avatars.githubusercontent.com/u/6267945?"},"repo":{"id":28615365,"name":"korlabs/tippr","url":"https://api.github.com/repos/korlabs/tippr"},"payload":{"push_id":536752950,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"cf31abd3724db74c818220b0d13c26ebcecfc128","before":"010ba4d2a839b14d435b0d2c2ea75a861cab3e5d","commits":[{"sha":"cf31abd3724db74c818220b0d13c26ebcecfc128","author":{"email":"3280e741e838010abad30f9c64878ae2d3f3e766@podbe.at","name":"Lakota Lustig"},"message":"Added ability to have tips refunded.\n\nRequires wallet URL to be saved to a text file sadly, but it was the only way.","distinct":true,"url":"https://api.github.com/repos/korlabs/tippr/commits/cf31abd3724db74c818220b0d13c26ebcecfc128"}]},"public":true,"created_at":"2015-01-01T01:03:39Z","org":{"id":7786022,"login":"korlabs","gravatar_id":"","url":"https://api.github.com/orgs/korlabs","avatar_url":"https://avatars.githubusercontent.com/u/7786022?"}}
{"id":"2489397454","type":"PushEvent","actor":{"id":3933623,"login":"tonyblank","gravatar_id":"","url":"https://api.github.com/users/tonyblank","avatar_url":"https://avatars.githubusercontent.com/u/3933623?"},"repo":{"id":28676606,"name":"tonyblank/Beerman","url":"https://api.github.com/repos/tonyblank/Beerman"},"payload":{"push_id":536752951,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"3971df1986b9944235005eac430da3525adcd81b","before":"bac32fd982495634fa319f0ba38161a47ee9be01","commits":[{"sha":"3971df1986b9944235005eac430da3525adcd81b","author":{"email":"b1c1d8736f20db3fb6c1c66bb1455ed43909f0d8@tonyblank.com","name":"Tony Blank"},"message":"created ROUGH readme with install instruction summary","distinct":true,"url":"https://api.github.com/repos/tonyblank/Beerman/commits/3971df1986b9944235005eac430da3525adcd81b"}]},"public":true,"created_at":"2015-01-01T01:03:41Z"}
{"id":"2489397455","type":"PushEvent","actor":{"id":1359331,"login":"yepher","gravatar_id":"","url":"https://api.github.com/users/yepher","avatar_url":"https://avatars.githubusercontent.com/u/1359331?"},"repo":{"id":28612273,"name":"yepher/littlebits","url":"https://api.github.com/repos/yepher/littlebits"},"payload":{"push_id":536752952,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"ad8f676eb03c36491ba1459349574c8f3b308602","before":"f6c00396a9221646c39f7fc97fe2d8b24a6baed7","commits":[{"sha":"ad8f676eb03c36491ba1459349574c8f3b308602","author":{"email":"711c73f64afdce07b7e38039a96d2224209e9a6c@mfluent.com","name":"Chris Wilson"},"message":"Adds some documentation","distinct":true,"url":"https://api.github.com/repos/yepher/littlebits/commits/ad8f676eb03c36491ba1459349574c8f3b308602"}]},"public":true,"created_at":"2015-01-01T01:03:41Z"}
{"id":"2489397456","type":"PushEvent","actor":{"id":3794984,"login":"abustamam","gravatar_id":"","url":"https://api.github.com/users/abustamam","avatar_url":"https://avatars.githubusercontent.com/u/3794984?"},"repo":{"id":25110710,"name":"abustamam/Udacity-Portfolio","url":"https://api.github.com/repos/abustamam/Udacity-Portfolio"},"payload":{"push_id":536752953,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"5776bf9082fbc389cc986d9159e7367cc2fcdf20","before":"b39e5ac9096f3ddcc10a485bd9df8dbedcfda5ef","commits":[{"sha":"e323ac3bd7451b41388d083ec83e1dc3a4d94022","author":{"email":"1f8e819f7c9fbaadfc4b5b78cc4be161892e8692@gmail.com","name":"Rasheed Bustamam"},"message":"Change project 1 img","distinct":true,"url":"https://api.github.com/repos/abustamam/Udacity-Portfolio/commits/e323ac3bd7451b41388d083ec83e1dc3a4d94022"},{"sha":"5776bf9082fbc389cc986d9159e7367cc2fcdf20","author":{"email":"1f8e819f7c9fbaadfc4b5b78cc4be161892e8692@gmail.com","name":"Rasheed Bustamam"},"message":"Merge branch 'master' of github.com:abustamam/Udacity-Portfolio\n\nPull readme","distinct":true,"url":"https://api.github.com/repos/abustamam/Udacity-Portfolio/commits/5776bf9082fbc389cc986d9159e7367cc2fcdf20"}]},"public":true,"created_at":"2015-01-01T01:03:41Z"}
{"id":"2489397457","type":"IssueCommentEvent","actor":{"id":923144,"login":"pythonesque","gravatar_id":"","url":"https://api.github.com/users/pythonesque","avatar_url":"https://avatars.githubusercontent.com/u/923144?"},"repo":{"id":724712,"name":"rust-lang/rust","url":"https://api.github.com/repos/rust-lang/rust"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/rust-lang/rust/issues/20355","labels_url":"https://api.github.com/repos/rust-lang/rust/issues/20355/labels{/name}","comments_url":"https://api.github.com/repos/rust-lang/rust/issues/20355/comments","events_url":"https://api.github.com/repos/rust-lang/rust/issues/20355/events","html_url":"https://github.com/rust-lang/rust/issues/20355","id":53157956,"number":20355,"title":"Segfault in `Hasher<SipState>::hash`","user":{"login":"fitzgen","id":74571,"avatar_url":"https://avatars.githubusercontent.com/u/74571?v=3","gravatar_id":"","url":"https://api.github.com/users/fitzgen","html_url":"https://github.com/fitzgen","followers_url":"https://api.github.com/users/fitzgen/followers","following_url":"https://api.github.com/users/fitzgen/following{/other_user}","gists_url":"https://api.github.com/users/fitzgen/gists{/gist_id}","starred_url":"https://api.github.com/users/fitzgen/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/fitzgen/subscriptions","organizations_url":"https://api.github.com/users/fitzgen/orgs","repos_url":"https://api.github.com/users/fitzgen/repos","events_url":"https://api.github.com/users/fitzgen/events{/privacy}","received_events_url":"https://api.github.com/users/fitzgen/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/rust-lang/rust/labels/I-crash","name":"I-crash","color":"e10c02"}],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":6,"created_at":"2014-12-31T00:04:46Z","updated_at":"2015-01-01T01:03:40Z","closed_at":null,"body":"Test case is branch `sip-hasher-segault` of 
this repo: https://github.com/fitzgen/oxischeme/tree/sip-hasher-segfault\r\n\r\n    $ rustc --version --verbose\r\n    rustc --version --verbose\r\n    rustc 0.13.0-nightly (5ba610265 2014-12-25 18:01:36 +0000)\r\n    binary: rustc\r\n    commit-hash: 5ba6102657a892457063d2d6a7cbb9632ce282c6\r\n    commit-date: 2014-12-25 18:01:36 +0000\r\n    host: x86_64-apple-darwin\r\n    release: 0.13.0-nightly\r\n    $ rustc -g --test src/main.rs -o target/test\r\n    $ lldb ./target/test\r\n    lldb ./target/test\r\n    (lldb) target create \"./target/test\"\r\n    Current executable set to './target/test' (x86_64).\r\n    (lldb) run\r\n    Process 8270 launched: './target/test' (x86_64)\r\n\r\n    running 20 tests\r\n    Process 8270 stopped\r\n    * thread #2: tid = 0x25693, 0x0000000100008bed test`hash::sip::SipHasher.Hasher$LT$SipState$GT$::hash::h16497116303610205953 + 61, stop reason = EXC_BAD_ACCESS (code=1, address=0x3ffd9)\r\n        frame #0: 0x0000000100008bed test`hash::sip::SipHasher.Hasher$LT$SipState$GT$::hash::h16497116303610205953 + 61\r\n    test`hash::sip::SipHasher.Hasher$LT$SipState$GT$::hash::h16497116303610205953 + 61:\r\n    -> 0x100008bed:  movq   (%rsi), %rsi\r\n       0x100008bf0:  movq   -0x8(%rbp), %rdi\r\n       0x100008bf4:  movq   0x8(%rdi), %rdx\r\n       0x100008bf8:  movq   %rax, %rdi\r\n    (lldb) bt\r\n    * thread #2: tid = 0x25693, 0x0000000100008bed test`hash::sip::SipHasher.Hasher$LT$SipState$GT$::hash::h16497116303610205953 + 61, stop reason = EXC_BAD_ACCESS (code=1, address=0x3ffd9)\r\n      * frame #0: 0x0000000100008bed test`hash::sip::SipHasher.Hasher$LT$SipState$GT$::hash::h16497116303610205953 + 61\r\n        frame #1: 0x0000000105401810\r\n        frame #2: 0x0000000100008ba2 test`hash::RandomSipHasher.Hasher$LT$sip..SipState$GT$::hash::h10512232733763305808 + 66\r\n        frame #3: 0x0000000100008b0e test`collections::hash::table::make_hash::h9604696550138645665 + 62\r\n        frame #4: 0x0000000100008abe 
test`collections::hash::map::HashMap$LT$K$C$$u{20}V$C$$u{20}H$GT$::make_hash::h15786379260790357760 + 62\r\n        frame #5: 0x0000000100008963 test`collections::hash::map::HashMap$LT$K$C$$u{20}V$C$$u{20}H$GT$::insert::h6805880362953821147 + 131\r\n        frame #6: 0x0000000100006aea test`main::environment::Environment::define(self=0x000000000003ffc1, sym=String at 0x0000000105401a50, val=0x0000000105401c38) + 218 at environment.rs:92\r\n        frame #7: 0x0000000100018486 test`main::eval::evaluate_definition(heap=0x00000001054034e8, env=0x0000000105402d10, form=0x0000000105402ce0) + 2406 at eval.rs:195\r\n        frame #8: 0x0000000100013f1b test`main::eval::evaluate(heap=0x00000001054034e8, env=0x0000000105402d90, form=0x0000000105402f30) + 1355 at eval.rs:79\r\n        frame #9: 0x0000000100013909 test`main::eval::evaluate_in_global_env(heap=0x00000001054034e8, form=0x0000000105402f30) + 105 at eval.rs:38\r\n        frame #10: 0x000000010001cd7b test`main::eval::evaluate_file(heap=0x00000001054034e8, file_path=(data_ptr = \"./tests/test_eval_closures.scmsrc/heap.rsArenaPtr(, )Rooted(\", length = 30)) + 1035 at <std macros>:286\r\n        frame #11: 0x000000010002c071 test`main::eval::test_eval_closures + 129 at eval.rs:403\r\n        frame #12: 0x0000000100087154 test`thunk::F.Invoke$LT$A$C$$u{20}R$GT$::invoke::h5218640484166224076 + 52\r\n        frame #13: 0x0000000100091e32 test`thunk::F.Invoke$LT$A$C$$u{20}R$GT$::invoke::h13672304839710771993 + 162\r\n        frame #14: 0x0000000100088912 test`thunk::F.Invoke$LT$A$C$$u{20}R$GT$::invoke::h15490786364890695979 + 1138\r\n        frame #15: 0x0000000100088db0 test`rt::unwind::try::try_fn::h10439459448986358359 + 160\r\n        frame #16: 0x000000010010a4f9 test`rust_try_inner + 9\r\n        frame #17: 0x000000010010a4e6 test`rust_try + 6\r\n        frame #18: 0x00000001000894ab test`thunk::F.Invoke$LT$A$C$$u{20}R$GT$::invoke::h13206639752781900349 + 1179\r\n        frame #19: 0x0000000100106eb4 
test`sys::thread::thread_start::h2cb22211a4c7d938vFw + 164\r\n        frame #20: 0x00007fff875d3899 libsystem_pthread.dylib`_pthread_body + 138\r\n        frame #21: 0x00007fff875d372a libsystem_pthread.dylib`_pthread_start + 137\r\n        frame #22: 0x00007fff875d7fc9 libsystem_pthread.dylib`thread_start + 13\r\n"},"comment":{"url":"https://api.github.com/repos/rust-lang/rust/issues/comments/68477288","html_url":"https://github.com/rust-lang/rust/issues/20355#issuecomment-68477288","issue_url":"https://api.github.com/repos/rust-lang/rust/issues/20355","id":68477288,"user":{"login":"pythonesque","id":923144,"avatar_url":"https://avatars.githubusercontent.com/u/923144?v=3","gravatar_id":"","url":"https://api.github.com/users/pythonesque","html_url":"https://github.com/pythonesque","followers_url":"https://api.github.com/users/pythonesque/followers","following_url":"https://api.github.com/users/pythonesque/following{/other_user}","gists_url":"https://api.github.com/users/pythonesque/gists{/gist_id}","starred_url":"https://api.github.com/users/pythonesque/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/pythonesque/subscriptions","organizations_url":"https://api.github.com/users/pythonesque/orgs","repos_url":"https://api.github.com/users/pythonesque/repos","events_url":"https://api.github.com/users/pythonesque/events{/privacy}","received_events_url":"https://api.github.com/users/pythonesque/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:03:40Z","updated_at":"2015-01-01T01:03:40Z","body":"I probably would.  But if you can find a reproducible test case that doesn't use any unsafe code, you can always reopen it :)"}},"public":true,"created_at":"2015-01-01T01:03:41Z","org":{"id":5430905,"login":"rust-lang","gravatar_id":"","url":"https://api.github.com/orgs/rust-lang","avatar_url":"https://avatars.githubusercontent.com/u/5430905?"}}
{"id":"2489397466","type":"PushEvent","actor":{"id":1727112,"login":"nucleardreamer","gravatar_id":"","url":"https://api.github.com/users/nucleardreamer","avatar_url":"https://avatars.githubusercontent.com/u/1727112?"},"repo":{"id":28675721,"name":"nucleardreamer/tdc","url":"https://api.github.com/repos/nucleardreamer/tdc"},"payload":{"push_id":536752957,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"5763af4a3216ce785215e64ec213ce78130c2b0f","before":"07a6ae5cdb39596d5aed1b3794229968810bce1f","commits":[{"sha":"5763af4a3216ce785215e64ec213ce78130c2b0f","author":{"email":"61996574b2cb2f66e0c7dcf5a13359213bfaba5a@gmail.com","name":"nucleardreamer"},"message":"updating mask image","distinct":true,"url":"https://api.github.com/repos/nucleardreamer/tdc/commits/5763af4a3216ce785215e64ec213ce78130c2b0f"}]},"public":true,"created_at":"2015-01-01T01:03:42Z"}
{"id":"2489397467","type":"PushEvent","actor":{"id":3596952,"login":"priseborough","gravatar_id":"","url":"https://api.github.com/users/priseborough","avatar_url":"https://avatars.githubusercontent.com/u/3596952?"},"repo":{"id":8208289,"name":"priseborough/ardupilot","url":"https://api.github.com/repos/priseborough/ardupilot"},"payload":{"push_id":536752958,"size":4,"distinct_size":4,"ref":"refs/heads/ekfUpdates","head":"5a91d89607bd9552e9767239f90802aae6e95675","before":"fce220571dcbd8a4621c9743d90aa48f5a487940","commits":[{"sha":"b1be8e09be78483f31ec47ee6bec00606e72184d","author":{"email":"95a043cc2b9ec25c579a602c10711cec6c80724d@live.com.au","name":"priseborough"},"message":"# This is a combination of 2 commits.\n# The first commit's message is:\n\nAP_NavEKF: Enumerate Position and Velocity Aiding\n\n# This is the 2nd commit message:\n\nAP_NavEKF: Fix bug in declaration of enumerated aiding mode variable","distinct":true,"url":"https://api.github.com/repos/priseborough/ardupilot/commits/b1be8e09be78483f31ec47ee6bec00606e72184d"},{"sha":"9ce6b6502df2a96be13b0698193271cec028039a","author":{"email":"95a043cc2b9ec25c579a602c10711cec6c80724d@live.com.au","name":"priseborough"},"message":"AP_NavEKF: Make reversion to no GPS mode unambiguous","distinct":true,"url":"https://api.github.com/repos/priseborough/ardupilot/commits/9ce6b6502df2a96be13b0698193271cec028039a"},{"sha":"200c088c50d34ecb4d7f9ed1c35fa7d4d173582b","author":{"email":"95a043cc2b9ec25c579a602c10711cec6c80724d@live.com.au","name":"priseborough"},"message":"AP_NavEKF: Consolidate constant velocity mode decision logic\n\nThe decision to switch to constant velocity mode during optical flow operation and te decision to switch back were previously being made in two different places in code. 
Both decisions are now made in the one place which makes the code easier to follow and maintain.","distinct":true,"url":"https://api.github.com/repos/priseborough/ardupilot/commits/200c088c50d34ecb4d7f9ed1c35fa7d4d173582b"},{"sha":"5a91d89607bd9552e9767239f90802aae6e95675","author":{"email":"95a043cc2b9ec25c579a602c10711cec6c80724d@live.com.au","name":"priseborough"},"message":"AP_NavEKF: Consistent initialisation of tuning parameters and variables\n\nNon user adjustable parameters are now declared as 'const' with values assigned in the header.\nThe _ prefix has been removed from non user adjustable tuning parameters.\nVariables that were being initialised in the constructor are now initialised in the function call along with the other filter variables. We use a function call rather than a constructor to initialise variables because it enables the filter to be re-started in flight if necessary.\n\nSigned-off-by: priseborough <p_riseborough@live.com.au>\n\nConflicts:\n\tlibraries/AP_NavEKF/AP_NavEKF.h","distinct":true,"url":"https://api.github.com/repos/priseborough/ardupilot/commits/5a91d89607bd9552e9767239f90802aae6e95675"}]},"public":true,"created_at":"2015-01-01T01:03:42Z"}
{"id":"2489397469","type":"PushEvent","actor":{"id":10324417,"login":"kerned-code","gravatar_id":"","url":"https://api.github.com/users/kerned-code","avatar_url":"https://avatars.githubusercontent.com/u/10324417?"},"repo":{"id":28541287,"name":"kerned-code/dpl-403","url":"https://api.github.com/repos/kerned-code/dpl-403"},"payload":{"push_id":536752959,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"6fbb8ed9aaa4357dd3a48f5a383d9223710102c9","before":"fee005c1ed537333e00cffd8de45b1104543ca6b","commits":[{"sha":"6fbb8ed9aaa4357dd3a48f5a383d9223710102c9","author":{"email":"44d17961b0395a23aed103901a26e8bd0af6ae21@users.noreply.github.com","name":"kerned-code"},"message":"Expand README\n\nWith details about function calls and built-in functions.","distinct":true,"url":"https://api.github.com/repos/kerned-code/dpl-403/commits/6fbb8ed9aaa4357dd3a48f5a383d9223710102c9"}]},"public":true,"created_at":"2015-01-01T01:03:43Z"}
{"id":"2489397471","type":"IssueCommentEvent","actor":{"id":9170481,"login":"scott46743","gravatar_id":"","url":"https://api.github.com/users/scott46743","avatar_url":"https://avatars.githubusercontent.com/u/9170481?"},"repo":{"id":25050352,"name":"MCGamerNetwork/Issues","url":"https://api.github.com/repos/MCGamerNetwork/Issues"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/MCGamerNetwork/Issues/issues/474","labels_url":"https://api.github.com/repos/MCGamerNetwork/Issues/issues/474/labels{/name}","comments_url":"https://api.github.com/repos/MCGamerNetwork/Issues/issues/474/comments","events_url":"https://api.github.com/repos/MCGamerNetwork/Issues/issues/474/events","html_url":"https://github.com/MCGamerNetwork/Issues/issues/474","id":51627486,"number":474,"title":"Recent Reports Section on Xime","user":{"login":"scott46743","id":9170481,"avatar_url":"https://avatars.githubusercontent.com/u/9170481?v=3","gravatar_id":"","url":"https://api.github.com/users/scott46743","html_url":"https://github.com/scott46743","followers_url":"https://api.github.com/users/scott46743/followers","following_url":"https://api.github.com/users/scott46743/following{/other_user}","gists_url":"https://api.github.com/users/scott46743/gists{/gist_id}","starred_url":"https://api.github.com/users/scott46743/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/scott46743/subscriptions","organizations_url":"https://api.github.com/users/scott46743/orgs","repos_url":"https://api.github.com/users/scott46743/repos","events_url":"https://api.github.com/users/scott46743/events{/privacy}","received_events_url":"https://api.github.com/users/scott46743/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":9,"created_at":"2014-12-10T23:49:39Z","updated_at":"2015-01-01T01:03:43Z","closed_at":null,"body":"Environment\r\nXime panel.\r\n\r\nThe issue\r\nThe recent report section 
has stopped working, and doesn't show any reports as of 12/06/14 at 8:38 EST. In addition, the latest reports included XAC reports, which I don't believe are supposed to show up. \r\n\r\nSteps to reproduce\r\nCheck recent reports section: http://manage.mcgamer.net/punishment/reports/\r\n\r\nMiscellaneous information\r\n\r\n"},"comment":{"url":"https://api.github.com/repos/MCGamerNetwork/Issues/issues/comments/68477289","html_url":"https://github.com/MCGamerNetwork/Issues/issues/474#issuecomment-68477289","issue_url":"https://api.github.com/repos/MCGamerNetwork/Issues/issues/474","id":68477289,"user":{"login":"scott46743","id":9170481,"avatar_url":"https://avatars.githubusercontent.com/u/9170481?v=3","gravatar_id":"","url":"https://api.github.com/users/scott46743","html_url":"https://github.com/scott46743","followers_url":"https://api.github.com/users/scott46743/followers","following_url":"https://api.github.com/users/scott46743/following{/other_user}","gists_url":"https://api.github.com/users/scott46743/gists{/gist_id}","starred_url":"https://api.github.com/users/scott46743/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/scott46743/subscriptions","organizations_url":"https://api.github.com/users/scott46743/orgs","repos_url":"https://api.github.com/users/scott46743/repos","events_url":"https://api.github.com/users/scott46743/events{/privacy}","received_events_url":"https://api.github.com/users/scott46743/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:03:43Z","updated_at":"2015-01-01T01:03:43Z","body":"@sheldor-da-great @subv3rsion It appears to have been fixed by @kpwn243 and it hasn't been frozen for days. I think it's alright to close this :+1: "}},"public":true,"created_at":"2015-01-01T01:03:43Z","org":{"id":6956717,"login":"MCGamerNetwork","gravatar_id":"","url":"https://api.github.com/orgs/MCGamerNetwork","avatar_url":"https://avatars.githubusercontent.com/u/6956717?"}}
{"id":"2489397472","type":"PushEvent","actor":{"id":3656079,"login":"marklrh","gravatar_id":"","url":"https://api.github.com/users/marklrh","avatar_url":"https://avatars.githubusercontent.com/u/3656079?"},"repo":{"id":27470715,"name":"marklrh/ocaml-cohttp-test","url":"https://api.github.com/repos/marklrh/ocaml-cohttp-test"},"payload":{"push_id":536752962,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1a309ab4cddecc0469c8a9c51733570a9624ea54","before":"7525c74ee31f49f576408a7d50d1cf8b9d3d1441","commits":[{"sha":"1a309ab4cddecc0469c8a9c51733570a9624ea54","author":{"email":"e0e04a2320844b42511db0376599e166ab5bda54@gmail.com","name":"Runhang Li"},"message":"lint README","distinct":true,"url":"https://api.github.com/repos/marklrh/ocaml-cohttp-test/commits/1a309ab4cddecc0469c8a9c51733570a9624ea54"}]},"public":true,"created_at":"2015-01-01T01:03:43Z"}
{"id":"2489397475","type":"IssueCommentEvent","actor":{"id":19967,"login":"nicholasf","gravatar_id":"","url":"https://api.github.com/users/nicholasf","avatar_url":"https://avatars.githubusercontent.com/u/19967?"},"repo":{"id":25658193,"name":"rockpoollabs/env","url":"https://api.github.com/repos/rockpoollabs/env"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/rockpoollabs/env/issues/6","labels_url":"https://api.github.com/repos/rockpoollabs/env/issues/6/labels{/name}","comments_url":"https://api.github.com/repos/rockpoollabs/env/issues/6/comments","events_url":"https://api.github.com/repos/rockpoollabs/env/issues/6/events","html_url":"https://github.com/rockpoollabs/env/pull/6","id":53202302,"number":6,"title":"Cleaned up shell code.","user":{"login":"wayneeseguin","id":18,"avatar_url":"https://avatars.githubusercontent.com/u/18?v=3","gravatar_id":"","url":"https://api.github.com/users/wayneeseguin","html_url":"https://github.com/wayneeseguin","followers_url":"https://api.github.com/users/wayneeseguin/followers","following_url":"https://api.github.com/users/wayneeseguin/following{/other_user}","gists_url":"https://api.github.com/users/wayneeseguin/gists{/gist_id}","starred_url":"https://api.github.com/users/wayneeseguin/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/wayneeseguin/subscriptions","organizations_url":"https://api.github.com/users/wayneeseguin/orgs","repos_url":"https://api.github.com/users/wayneeseguin/repos","events_url":"https://api.github.com/users/wayneeseguin/events{/privacy}","received_events_url":"https://api.github.com/users/wayneeseguin/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2014-12-31T20:35:45Z","updated_at":"2015-01-01T01:03:43Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/rockpoollabs/env/pulls/6","html_url":"https://github.com/rockpoollabs/env/pull/
6","diff_url":"https://github.com/rockpoollabs/env/pull/6.diff","patch_url":"https://github.com/rockpoollabs/env/pull/6.patch"},"body":"I came across your repository and was browsing it, when I got to this file I couldn't resist sending a few suggestions your way:\r\n \r\n* $PWD is automatically available when using BASH, so there is no need for PWD=`pwd`\r\n* If you were to use a subshell be sure to use $() instead of ``.\r\n* it DRY's things up a bit to have a single export line for the variables if you are exporting multiple variables\r\n* Technically exporting PATH is redundant since it is exported by default, but being explicit doesn't hurt.\r\n* Quoting the variable assignments ensures that you are never caught by spaces and perhaps other special characters in your path name which would break the script otherwise.\r\n* Best to reserve all uppercase variable names for exported variables only, script local variables use lower case variable names with naming conventions similar to go 
style."},"comment":{"url":"https://api.github.com/repos/rockpoollabs/env/issues/comments/68477290","html_url":"https://github.com/rockpoollabs/env/pull/6#issuecomment-68477290","issue_url":"https://api.github.com/repos/rockpoollabs/env/issues/6","id":68477290,"user":{"login":"nicholasf","id":19967,"avatar_url":"https://avatars.githubusercontent.com/u/19967?v=3","gravatar_id":"","url":"https://api.github.com/users/nicholasf","html_url":"https://github.com/nicholasf","followers_url":"https://api.github.com/users/nicholasf/followers","following_url":"https://api.github.com/users/nicholasf/following{/other_user}","gists_url":"https://api.github.com/users/nicholasf/gists{/gist_id}","starred_url":"https://api.github.com/users/nicholasf/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/nicholasf/subscriptions","organizations_url":"https://api.github.com/users/nicholasf/orgs","repos_url":"https://api.github.com/users/nicholasf/repos","events_url":"https://api.github.com/users/nicholasf/events{/privacy}","received_events_url":"https://api.github.com/users/nicholasf/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:03:43Z","updated_at":"2015-01-01T01:03:43Z","body":"Thanks Wayne.\r\n\r\nInteresting comments. We'll look at this on Monday (the 5th), when we're back from holidays.\r\n\r\nHappy 2015.\r\n"}},"public":true,"created_at":"2015-01-01T01:03:43Z","org":{"id":4385125,"login":"rockpoollabs","gravatar_id":"","url":"https://api.github.com/orgs/rockpoollabs","avatar_url":"https://avatars.githubusercontent.com/u/4385125?"}}
{"id":"2489397479","type":"IssuesEvent","actor":{"id":5497952,"login":"g19-mr","gravatar_id":"","url":"https://api.github.com/users/g19-mr","avatar_url":"https://avatars.githubusercontent.com/u/5497952?"},"repo":{"id":25435487,"name":"g19-mr/azh","url":"https://api.github.com/repos/g19-mr/azh"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/g19-mr/azh/issues/82","labels_url":"https://api.github.com/repos/g19-mr/azh/issues/82/labels{/name}","comments_url":"https://api.github.com/repos/g19-mr/azh/issues/82/comments","events_url":"https://api.github.com/repos/g19-mr/azh/issues/82/events","html_url":"https://github.com/g19-mr/azh/issues/82","id":53210240,"number":82,"title":"Add background color to done buttons in all Webviews","user":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/g19-mr/azh/labels/improvement","name":"improvement","color":"84b6eb"}],"state":"open","locked":false,"assignee":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https://a
pi.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"milestone":{"url":"https://api.github.com/repos/g19-mr/azh/milestones/2","labels_url":"https://api.github.com/repos/g19-mr/azh/milestones/2/labels","id":873798,"number":2,"title":"Android 1.0.1","description":null,"creator":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"open_issues":6,"closed_issues":10,"state":"open","created_at":"2014-11-20T05:20:02Z","updated_at":"2015-01-01T01:03:44Z","due_on":null,"closed_at":null},"comments":0,"created_at":"2015-01-01T01:03:44Z","updated_at":"2015-01-01T01:03:44Z","closed_at":null,"body":"- 2 on Donate screen\r\n- 1 on About 
screen"}},"public":true,"created_at":"2015-01-01T01:03:44Z"}
{"id":"2489397484","type":"PushEvent","actor":{"id":3032425,"login":"qq978304139","gravatar_id":"","url":"https://api.github.com/users/qq978304139","avatar_url":"https://avatars.githubusercontent.com/u/3032425?"},"repo":{"id":22276837,"name":"qq978304139/pj_git","url":"https://api.github.com/repos/qq978304139/pj_git"},"payload":{"push_id":536752965,"size":2,"distinct_size":2,"ref":"refs/heads/master_dev","head":"17bd49147c1bffd3f69b9d45a7de1b0492eb0f6e","before":"287a09b687ea3c1328474454d6ea534bc4e03960","commits":[{"sha":"28a720004dad4f9c0d71198b85aa326dcce210c8","author":{"email":"b29612f187963685a9f710ed6e44f9006a30c278@gmail.com","name":"hepeng"},"message":"add dump_stack for linux","distinct":true,"url":"https://api.github.com/repos/qq978304139/pj_git/commits/28a720004dad4f9c0d71198b85aa326dcce210c8"},{"sha":"17bd49147c1bffd3f69b9d45a7de1b0492eb0f6e","author":{"email":"b29612f187963685a9f710ed6e44f9006a30c278@gmail.com","name":"hepeng"},"message":"play wav to remote caller","distinct":true,"url":"https://api.github.com/repos/qq978304139/pj_git/commits/17bd49147c1bffd3f69b9d45a7de1b0492eb0f6e"}]},"public":true,"created_at":"2015-01-01T01:03:45Z"}
{"id":"2489397488","type":"IssuesEvent","actor":{"id":732655,"login":"KindOne-","gravatar_id":"","url":"https://api.github.com/users/KindOne-","avatar_url":"https://avatars.githubusercontent.com/u/732655?"},"repo":{"id":20344030,"name":"irssi/irssi","url":"https://api.github.com/repos/irssi/irssi"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/irssi/irssi/issues/194","labels_url":"https://api.github.com/repos/irssi/irssi/issues/194/labels{/name}","comments_url":"https://api.github.com/repos/irssi/irssi/issues/194/comments","events_url":"https://api.github.com/repos/irssi/irssi/issues/194/events","html_url":"https://github.com/irssi/irssi/issues/194","id":53210242,"number":194,"title":"Initial CTCP Action of an query goes into the status window. ","user":{"login":"KindOne-","id":732655,"avatar_url":"https://avatars.githubusercontent.com/u/732655?v=3","gravatar_id":"","url":"https://api.github.com/users/KindOne-","html_url":"https://github.com/KindOne-","followers_url":"https://api.github.com/users/KindOne-/followers","following_url":"https://api.github.com/users/KindOne-/following{/other_user}","gists_url":"https://api.github.com/users/KindOne-/gists{/gist_id}","starred_url":"https://api.github.com/users/KindOne-/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/KindOne-/subscriptions","organizations_url":"https://api.github.com/users/KindOne-/orgs","repos_url":"https://api.github.com/users/KindOne-/repos","events_url":"https://api.github.com/users/KindOne-/events{/privacy}","received_events_url":"https://api.github.com/users/KindOne-/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:03:45Z","updated_at":"2015-01-01T01:03:45Z","closed_at":null,"body":"```Irssi 0.8.18-head (20141216) - http://irssi.org/``` Inside cygwin  (can also replicate in Ubuntu 14.10)\r\n\r\nNot quite sure how to describe this, 
if someone sends me an ```/me ....``` and I do not have a query window with them,  that ```/me ....``` will get placed into the status window and irssi will also open a blank query window with that person.\r\n\r\n![irssi](https://cloud.githubusercontent.com/assets/732655/5591401/a7ba5096-9126-11e4-980e-7517e78fcd3c.PNG)"}},"public":true,"created_at":"2015-01-01T01:03:46Z","org":{"id":7750489,"login":"irssi","gravatar_id":"","url":"https://api.github.com/orgs/irssi","avatar_url":"https://avatars.githubusercontent.com/u/7750489?"}}
{"id":"2489397493","type":"CreateEvent","actor":{"id":2829718,"login":"phister","gravatar_id":"","url":"https://api.github.com/users/phister","avatar_url":"https://avatars.githubusercontent.com/u/2829718?"},"repo":{"id":28678235,"name":"phister/Cfb","url":"https://api.github.com/repos/phister/Cfb"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"College football playoffs","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:03:47Z"}
{"id":"2489397494","type":"PushEvent","actor":{"id":8933459,"login":"lmontopo","gravatar_id":"","url":"https://api.github.com/users/lmontopo","avatar_url":"https://avatars.githubusercontent.com/u/8933459?"},"repo":{"id":24911711,"name":"lmontopo/lmontopo.github.io","url":"https://api.github.com/repos/lmontopo/lmontopo.github.io"},"payload":{"push_id":536752973,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"06846c61830010de57ca6db802797133ceee8b7c","before":"3511319efef8d59a76434c6884cbc57ab11b9aa5","commits":[{"sha":"06846c61830010de57ca6db802797133ceee8b7c","author":{"email":"6beaeb38ccda0977b766148789e916197124dfed@gmail.com","name":"Leta Montopoli"},"message":"Generate Pelican site","distinct":true,"url":"https://api.github.com/repos/lmontopo/lmontopo.github.io/commits/06846c61830010de57ca6db802797133ceee8b7c"}]},"public":true,"created_at":"2015-01-01T01:03:47Z"}
{"id":"2489397496","type":"CreateEvent","actor":{"id":1754250,"login":"shinji-kono","gravatar_id":"","url":"https://api.github.com/users/shinji-kono","avatar_url":"https://avatars.githubusercontent.com/u/1754250?"},"repo":{"id":28678246,"name":"shinji-kono/nmh-nkf","url":"https://api.github.com/repos/shinji-kono/nmh-nkf"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"a branch of nmh for Japanese user. UTF8 only. scan, pick and mhl handle Japanese","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:03:47Z"}
{"id":"2489397497","type":"IssueCommentEvent","actor":{"id":64050,"login":"gjtorikian","gravatar_id":"","url":"https://api.github.com/users/gjtorikian","avatar_url":"https://avatars.githubusercontent.com/u/64050?"},"repo":{"id":10376685,"name":"gjtorikian/markdowntutorial.com","url":"https://api.github.com/repos/gjtorikian/markdowntutorial.com"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/gjtorikian/markdowntutorial.com/issues/37","labels_url":"https://api.github.com/repos/gjtorikian/markdowntutorial.com/issues/37/labels{/name}","comments_url":"https://api.github.com/repos/gjtorikian/markdowntutorial.com/issues/37/comments","events_url":"https://api.github.com/repos/gjtorikian/markdowntutorial.com/issues/37/events","html_url":"https://github.com/gjtorikian/markdowntutorial.com/issues/37","id":53166139,"number":37,"title":"Second exercise in Lesson 6","user":{"login":"cliffvick","id":72509,"avatar_url":"https://avatars.githubusercontent.com/u/72509?v=3","gravatar_id":"","url":"https://api.github.com/users/cliffvick","html_url":"https://github.com/cliffvick","followers_url":"https://api.github.com/users/cliffvick/followers","following_url":"https://api.github.com/users/cliffvick/following{/other_user}","gists_url":"https://api.github.com/users/cliffvick/gists{/gist_id}","starred_url":"https://api.github.com/users/cliffvick/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/cliffvick/subscriptions","organizations_url":"https://api.github.com/users/cliffvick/orgs","repos_url":"https://api.github.com/users/cliffvick/repos","events_url":"https://api.github.com/users/cliffvick/events{/privacy}","received_events_url":"https://api.github.com/users/cliffvick/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2014-12-31T04:07:58Z","updated_at":"2015-01-01T01:03:47Z","closed_at":null,"body":"The criteria for continuing on 
to the next exercise in the lesson is incorrect in the js/lesson_plans.coffee file (line 69).  The provided text omits the periods, but the lesson plan expects a period after each item."},"comment":{"url":"https://api.github.com/repos/gjtorikian/markdowntutorial.com/issues/comments/68477292","html_url":"https://github.com/gjtorikian/markdowntutorial.com/issues/37#issuecomment-68477292","issue_url":"https://api.github.com/repos/gjtorikian/markdowntutorial.com/issues/37","id":68477292,"user":{"login":"gjtorikian","id":64050,"avatar_url":"https://avatars.githubusercontent.com/u/64050?v=3","gravatar_id":"","url":"https://api.github.com/users/gjtorikian","html_url":"https://github.com/gjtorikian","followers_url":"https://api.github.com/users/gjtorikian/followers","following_url":"https://api.github.com/users/gjtorikian/following{/other_user}","gists_url":"https://api.github.com/users/gjtorikian/gists{/gist_id}","starred_url":"https://api.github.com/users/gjtorikian/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/gjtorikian/subscriptions","organizations_url":"https://api.github.com/users/gjtorikian/orgs","repos_url":"https://api.github.com/users/gjtorikian/repos","events_url":"https://api.github.com/users/gjtorikian/events{/privacy}","received_events_url":"https://api.github.com/users/gjtorikian/received_events","type":"User","site_admin":true},"created_at":"2015-01-01T01:03:47Z","updated_at":"2015-01-01T01:03:47Z","body":"Thanks for the report. The provided text *should* omit the periods, since it's initially a sequence with commas:\r\n\r\n![screen shot 2014-12-31 at 5 02 45 pm](https://cloud.githubusercontent.com/assets/64050/5591410/ddcaf0d6-910e-11e4-8f69-e496814afb5d.png)\r\n\r\nAs it's a list of proper sentences, you create the ordered list, and then provide periods:\r\n\r\n![screen shot 2014-12-31 at 5 02 31 pm](https://cloud.githubusercontent.com/assets/64050/5591411/e874c764-910e-11e4-9206-31ca6b39bda9.png)\r\n\r\nHope that helps. 
Please feel free to reopen if I've missed something. Happy new year!"}},"public":true,"created_at":"2015-01-01T01:03:47Z"}
{"id":"2489397500","type":"PushEvent","actor":{"id":409860,"login":"flussence","gravatar_id":"","url":"https://api.github.com/users/flussence","avatar_url":"https://avatars.githubusercontent.com/u/409860?"},"repo":{"id":24519248,"name":"flussence/ebuilds","url":"https://api.github.com/repos/flussence/ebuilds"},"payload":{"push_id":536752975,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"7b3ee839d933b0fbe405cf022d9e1003e867be6b","before":"e1531f885892d899210024f54374a4f1880749dc","commits":[{"sha":"7b3ee839d933b0fbe405cf022d9e1003e867be6b","author":{"email":"ddb018d72dce150cce5ca65306dfca4b86fbc0bf@gmail.com","name":"Anthony Parsons"},"message":"Recategorise sys-libs -> dev-libs/libtsm\n\nHopefully I did this right and nobody'll notice.","distinct":true,"url":"https://api.github.com/repos/flussence/ebuilds/commits/7b3ee839d933b0fbe405cf022d9e1003e867be6b"}]},"public":true,"created_at":"2015-01-01T01:03:48Z"}
{"id":"2489397501","type":"PushEvent","actor":{"id":1356088,"login":"Zaryafaraj","gravatar_id":"","url":"https://api.github.com/users/Zaryafaraj","avatar_url":"https://avatars.githubusercontent.com/u/1356088?"},"repo":{"id":26995510,"name":"Fathalian/Guild","url":"https://api.github.com/repos/Fathalian/Guild"},"payload":{"push_id":536752976,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"eb4c4ba011689300a2f0ed76890368347f3ccc29","before":"29abf0e942463dd27cf0666ddf54abda099859b2","commits":[{"sha":"eb4c4ba011689300a2f0ed76890368347f3ccc29","author":{"email":"de8898f6c55e335aa0a2b937fae65fb756ee038f@gmail.com","name":"Zaryafaraj"},"message":"modal style change","distinct":true,"url":"https://api.github.com/repos/Fathalian/Guild/commits/eb4c4ba011689300a2f0ed76890368347f3ccc29"}]},"public":true,"created_at":"2015-01-01T01:03:48Z"}
{"id":"2489397507","type":"PushEvent","actor":{"id":1785816,"login":"natashavlahakis","gravatar_id":"","url":"https://api.github.com/users/natashavlahakis","avatar_url":"https://avatars.githubusercontent.com/u/1785816?"},"repo":{"id":27246389,"name":"natashavlahakis/figtree","url":"https://api.github.com/repos/natashavlahakis/figtree"},"payload":{"push_id":536752979,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"03e086487f01d5fff1574e9906ad4a4e06082211","before":"55edd29c904072c7dfaf84e396fe6bfb812f941e","commits":[{"sha":"03e086487f01d5fff1574e9906ad4a4e06082211","author":{"email":"84a888d1cdc9202fb22178d441aabd7da0eefd07@gmail.com","name":"Natasha Vlahakis"},"message":"edited layout","distinct":true,"url":"https://api.github.com/repos/natashavlahakis/figtree/commits/03e086487f01d5fff1574e9906ad4a4e06082211"}]},"public":true,"created_at":"2015-01-01T01:03:49Z"}
{"id":"2489397510","type":"PushEvent","actor":{"id":436691,"login":"lfarrell","gravatar_id":"","url":"https://api.github.com/users/lfarrell","avatar_url":"https://avatars.githubusercontent.com/u/436691?"},"repo":{"id":27356689,"name":"lfarrell/DPLA-Metadata-Explorer","url":"https://api.github.com/repos/lfarrell/DPLA-Metadata-Explorer"},"payload":{"push_id":536752980,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"acf158b3040f94659f754c8ad186fc36f55cf0dd","before":"f9ae98f6d8e374619499e96a23aea453a4f1f0be","commits":[{"sha":"db329fb82c4c829f037c23d34c2a719ff5748c9d","author":{"email":"b11d4f2999ccc74f2c93bc88775bb7be7fad72d9@gmail.com","name":"Larry Farrell"},"message":"Zoom works in space between nodes now.","distinct":true,"url":"https://api.github.com/repos/lfarrell/DPLA-Metadata-Explorer/commits/db329fb82c4c829f037c23d34c2a719ff5748c9d"},{"sha":"acf158b3040f94659f754c8ad186fc36f55cf0dd","author":{"email":"b11d4f2999ccc74f2c93bc88775bb7be7fad72d9@gmail.com","name":"Larry Farrell"},"message":"Add link out searching.","distinct":true,"url":"https://api.github.com/repos/lfarrell/DPLA-Metadata-Explorer/commits/acf158b3040f94659f754c8ad186fc36f55cf0dd"}]},"public":true,"created_at":"2015-01-01T01:03:50Z"}
{"id":"2489397511","type":"PushEvent","actor":{"id":8289520,"login":"BenAndy","gravatar_id":"","url":"https://api.github.com/users/BenAndy","avatar_url":"https://avatars.githubusercontent.com/u/8289520?"},"repo":{"id":22988319,"name":"BenAndy/BenAndy.github.io","url":"https://api.github.com/repos/BenAndy/BenAndy.github.io"},"payload":{"push_id":536752981,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"7a84f9d0a292787455f9b63ccd8a79ecc79960e3","before":"cb2e14fdddd091905629a90787593292f4757e02","commits":[{"sha":"7a84f9d0a292787455f9b63ccd8a79ecc79960e3","author":{"email":"b4047af9f9c6db4af7a5f2314edc0d82e0e1385c@gmail.com","name":"Ben Andy"},"message":"AutoPlug ALPHA test 0.2.55","distinct":true,"url":"https://api.github.com/repos/BenAndy/BenAndy.github.io/commits/7a84f9d0a292787455f9b63ccd8a79ecc79960e3"}]},"public":true,"created_at":"2015-01-01T01:03:50Z"}
{"id":"2489397512","type":"PushEvent","actor":{"id":171043,"login":"jeffnv","gravatar_id":"","url":"https://api.github.com/users/jeffnv","avatar_url":"https://avatars.githubusercontent.com/u/171043?"},"repo":{"id":28159277,"name":"jeffnv/elite-golf","url":"https://api.github.com/repos/jeffnv/elite-golf"},"payload":{"push_id":536752982,"size":2,"distinct_size":0,"ref":"refs/heads/gh-pages","head":"12162bb9f224c179a9ea7d8abbac7dadec15ee2a","before":"a5fe0bfb72e4489e4a22c90733db8392e1728ea0","commits":[{"sha":"a88fa3bfffc1d1f4ce9b668412981ff071d9920e","author":{"email":"a4a950aede9822deccc73582f88e82e913eb89d5@gmail.com","name":"Jeff Fiddler"},"message":"course creator has undo now","distinct":false,"url":"https://api.github.com/repos/jeffnv/elite-golf/commits/a88fa3bfffc1d1f4ce9b668412981ff071d9920e"},{"sha":"12162bb9f224c179a9ea7d8abbac7dadec15ee2a","author":{"email":"a4a950aede9822deccc73582f88e82e913eb89d5@gmail.com","name":"Jeff Fiddler"},"message":"more useful alert when clicking idle creator map","distinct":false,"url":"https://api.github.com/repos/jeffnv/elite-golf/commits/12162bb9f224c179a9ea7d8abbac7dadec15ee2a"}]},"public":true,"created_at":"2015-01-01T01:03:50Z"}
{"id":"2489397513","type":"PushEvent","actor":{"id":7387879,"login":"dsm-git","gravatar_id":"","url":"https://api.github.com/users/dsm-git","avatar_url":"https://avatars.githubusercontent.com/u/7387879?"},"repo":{"id":28354666,"name":"Door43/d43-ar-x-dcv","url":"https://api.github.com/repos/Door43/d43-ar-x-dcv"},"payload":{"push_id":536752983,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"2bfd58ab618f202c44a4010ce9d2eb6b66da57a5","before":"6158b50e1a2b200c5efba979f08248b153ced502","commits":[{"sha":"2bfd58ab618f202c44a4010ce9d2eb6b66da57a5","author":{"email":"62eb0db178518a8376b23676c2639eb2732c0be8@us.door43.org","name":"Apache"},"message":"Page Edit [40]:  [EricWatt]","distinct":true,"url":"https://api.github.com/repos/Door43/d43-ar-x-dcv/commits/2bfd58ab618f202c44a4010ce9d2eb6b66da57a5"}]},"public":true,"created_at":"2015-01-01T01:03:50Z","org":{"id":4982125,"login":"Door43","gravatar_id":"","url":"https://api.github.com/orgs/Door43","avatar_url":"https://avatars.githubusercontent.com/u/4982125?"}}
{"id":"2489397515","type":"PullRequestReviewCommentEvent","actor":{"id":3103764,"login":"carymrobbins","gravatar_id":"","url":"https://api.github.com/users/carymrobbins","avatar_url":"https://avatars.githubusercontent.com/u/3103764?"},"repo":{"id":15573192,"name":"carymrobbins/intellij-haskforce","url":"https://api.github.com/repos/carymrobbins/intellij-haskforce"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/comments/22397275","id":22397275,"diff_hunk":"@@ -0,0 +1,56 @@\n+package com.haskforce.highlighting.annotation;\n+\n+import com.google.common.collect.Lists;\n+import com.haskforce.highlighting.annotation.external.GhcMod;\n+import com.haskforce.highlighting.annotation.external.GhcModi;\n+import com.haskforce.highlighting.annotation.external.HaskellExternalAnnotator;\n+import com.haskforce.highlighting.annotation.external.TypeInfoUtil;\n+import com.haskforce.settings.ToolKey;\n+import com.haskforce.utils.ExecUtil;\n+import com.intellij.lang.documentation.AbstractDocumentationProvider;\n+import com.intellij.openapi.editor.Document;\n+import com.intellij.openapi.editor.Editor;\n+import com.intellij.openapi.editor.LogicalPosition;\n+import com.intellij.openapi.editor.VisualPosition;\n+import com.intellij.openapi.fileEditor.FileDocumentManager;\n+import com.intellij.openapi.fileEditor.FileEditorManager;\n+import com.intellij.openapi.module.Module;\n+import com.intellij.openapi.module.ModuleUtilCore;\n+import com.intellij.openapi.project.Project;\n+import com.intellij.openapi.vfs.VirtualFile;\n+import com.intellij.psi.PsiElement;\n+import com.intellij.psi.PsiFile;\n+import com.intellij.psi.PsiManager;\n+import org.jetbrains.annotations.Nullable;\n+\n+import java.awt.*;\n+import java.util.List;\n+import java.util.concurrent.ExecutionException;\n+\n+public class HaskellDocumentationProvider extends AbstractDocumentationProvider 
{","path":"src/com/haskforce/highlighting/annotation/HaskellDocumentationProvider.java","position":30,"original_position":30,"commit_id":"73ec576f11ba5aa0906e1ca03bc9390ca94b40e2","original_commit_id":"73ec576f11ba5aa0906e1ca03bc9390ca94b40e2","user":{"login":"carymrobbins","id":3103764,"avatar_url":"https://avatars.githubusercontent.com/u/3103764?v=3","gravatar_id":"","url":"https://api.github.com/users/carymrobbins","html_url":"https://github.com/carymrobbins","followers_url":"https://api.github.com/users/carymrobbins/followers","following_url":"https://api.github.com/users/carymrobbins/following{/other_user}","gists_url":"https://api.github.com/users/carymrobbins/gists{/gist_id}","starred_url":"https://api.github.com/users/carymrobbins/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/carymrobbins/subscriptions","organizations_url":"https://api.github.com/users/carymrobbins/orgs","repos_url":"https://api.github.com/users/carymrobbins/repos","events_url":"https://api.github.com/users/carymrobbins/events{/privacy}","received_events_url":"https://api.github.com/users/carymrobbins/received_events","type":"User","site_admin":false},"body":"This doesn't seem to work for me...not sure if I'm doing something 
wrong.","created_at":"2015-01-01T01:03:50Z","updated_at":"2015-01-01T01:03:50Z","html_url":"https://github.com/carymrobbins/intellij-haskforce/pull/105#discussion_r22397275","pull_request_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105","_links":{"self":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/comments/22397275"},"html":{"href":"https://github.com/carymrobbins/intellij-haskforce/pull/105#discussion_r22397275"},"pull_request":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105"}}},"pull_request":{"url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105","id":26615813,"html_url":"https://github.com/carymrobbins/intellij-haskforce/pull/105","diff_url":"https://github.com/carymrobbins/intellij-haskforce/pull/105.diff","patch_url":"https://github.com/carymrobbins/intellij-haskforce/pull/105.patch","issue_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/105","number":105,"state":"open","locked":false,"title":"Issue90 type 
information","user":{"login":"KasperJanssens","id":5415995,"avatar_url":"https://avatars.githubusercontent.com/u/5415995?v=3","gravatar_id":"","url":"https://api.github.com/users/KasperJanssens","html_url":"https://github.com/KasperJanssens","followers_url":"https://api.github.com/users/KasperJanssens/followers","following_url":"https://api.github.com/users/KasperJanssens/following{/other_user}","gists_url":"https://api.github.com/users/KasperJanssens/gists{/gist_id}","starred_url":"https://api.github.com/users/KasperJanssens/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/KasperJanssens/subscriptions","organizations_url":"https://api.github.com/users/KasperJanssens/orgs","repos_url":"https://api.github.com/users/KasperJanssens/repos","events_url":"https://api.github.com/users/KasperJanssens/events{/privacy}","received_events_url":"https://api.github.com/users/KasperJanssens/received_events","type":"User","site_admin":false},"body":"Cary,\r\n\r\nFirst try of the type information. It seems quite stable, been using it for a few days (provided the configuration is correct, I suppose, didn't test what happens when ghc-modi is not correctly configured).\r\n\r\nI bound the type info call to the DocumentationProvider as well as to an action (alt - equals, like scala). I prefer the action, I think the documentation provider doesn't work so well. There are tests of the parsing of the output of ghc-modi, but not really of the documentationprovider, basically because of the abundance of static calls and the fact that I think they can only be mocked while testing, and statics can only be mocked through Powermock if I recall correctly, which would mean an extra test dependency and so on and so forth, so I left that to be your call.\r\n\r\nAlso, there is a weird behaviour that getting the editor creates a stack trace of around 5 kilometers long, something that seems like a threading issue, but the function seems to work. 
I don't really know why the stack trace happens, all the more because it only happens when calling the type information through the documentation provider (same code path is used when the action is called, but no stack trace). Maybe you know more what could go wrong, it looks like something intellij-related.\r\n\r\nSo, consider this a \"request for comment\" more than a pull request ;-)\r\n\r\nKasper","created_at":"2014-12-27T16:19:07Z","updated_at":"2015-01-01T01:03:50Z","closed_at":null,"merged_at":null,"merge_commit_sha":"b32a5f3ef0bc14eebea4baa946ec2e66008086dd","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105/commits","review_comments_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105/comments","review_comment_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/comments/{number}","comments_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/105/comments","statuses_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/statuses/73ec576f11ba5aa0906e1ca03bc9390ca94b40e2","head":{"label":"KasperJanssens:issue90TypeInformation","ref":"issue90TypeInformation","sha":"73ec576f11ba5aa0906e1ca03bc9390ca94b40e2","user":{"login":"KasperJanssens","id":5415995,"avatar_url":"https://avatars.githubusercontent.com/u/5415995?v=3","gravatar_id":"","url":"https://api.github.com/users/KasperJanssens","html_url":"https://github.com/KasperJanssens","followers_url":"https://api.github.com/users/KasperJanssens/followers","following_url":"https://api.github.com/users/KasperJanssens/following{/other_user}","gists_url":"https://api.github.com/users/KasperJanssens/gists{/gist_id}","starred_url":"https://api.github.com/users/KasperJanssens/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/KasperJanssens/subscriptions","organizations_url":"https://api.github.com/users/KasperJanssens/orgs","repos_url":"https://api.github
.com/users/KasperJanssens/repos","events_url":"https://api.github.com/users/KasperJanssens/events{/privacy}","received_events_url":"https://api.github.com/users/KasperJanssens/received_events","type":"User","site_admin":false},"repo":{"id":28540684,"name":"intellij-haskforce","full_name":"KasperJanssens/intellij-haskforce","owner":{"login":"KasperJanssens","id":5415995,"avatar_url":"https://avatars.githubusercontent.com/u/5415995?v=3","gravatar_id":"","url":"https://api.github.com/users/KasperJanssens","html_url":"https://github.com/KasperJanssens","followers_url":"https://api.github.com/users/KasperJanssens/followers","following_url":"https://api.github.com/users/KasperJanssens/following{/other_user}","gists_url":"https://api.github.com/users/KasperJanssens/gists{/gist_id}","starred_url":"https://api.github.com/users/KasperJanssens/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/KasperJanssens/subscriptions","organizations_url":"https://api.github.com/users/KasperJanssens/orgs","repos_url":"https://api.github.com/users/KasperJanssens/repos","events_url":"https://api.github.com/users/KasperJanssens/events{/privacy}","received_events_url":"https://api.github.com/users/KasperJanssens/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/KasperJanssens/intellij-haskforce","description":"Haskell plugin for IntelliJ IDEA Community 
Edition","fork":true,"url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce","forks_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/forks","keys_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/keys{/key_id}","collaborators_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/teams","hooks_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/hooks","issue_events_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/issues/events{/number}","events_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/events","assignees_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/assignees{/user}","branches_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/branches{/branch}","tags_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/tags","blobs_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/git/refs{/sha}","trees_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/git/trees{/sha}","statuses_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/statuses/{sha}","languages_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/languages","stargazers_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/stargazers","contributors_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/contributors","subscribers_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/subscribers","subscription_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/subscription","commits_url":"https://api.github.com/repo
s/KasperJanssens/intellij-haskforce/commits{/sha}","git_commits_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/git/commits{/sha}","comments_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/comments{/number}","issue_comment_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/issues/comments/{number}","contents_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/contents/{+path}","compare_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/compare/{base}...{head}","merges_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/merges","archive_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/downloads","issues_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/issues{/number}","pulls_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/pulls{/number}","milestones_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/milestones{/number}","notifications_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/labels{/name}","releases_url":"https://api.github.com/repos/KasperJanssens/intellij-haskforce/releases{/id}","created_at":"2014-12-27T16:11:01Z","updated_at":"2014-12-27T16:11:03Z","pushed_at":"2014-12-31T15:44:48Z","git_url":"git://github.com/KasperJanssens/intellij-haskforce.git","ssh_url":"git@github.com:KasperJanssens/intellij-haskforce.git","clone_url":"https://github.com/KasperJanssens/intellij-haskforce.git","svn_url":"https://github.com/KasperJanssens/intellij-haskforce","homepage":"http://carymrobbins.github.io/intellij-haskforce/","size":7553,"stargazers_count":0,"watchers_count":0,"language":"Java","has_issues":false,"has_downloads":true,"has_wiki":true
,"has_pages":true,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"carymrobbins:master","ref":"master","sha":"19442eb58293650dc699e30ccf2d5482e1c688d8","user":{"login":"carymrobbins","id":3103764,"avatar_url":"https://avatars.githubusercontent.com/u/3103764?v=3","gravatar_id":"","url":"https://api.github.com/users/carymrobbins","html_url":"https://github.com/carymrobbins","followers_url":"https://api.github.com/users/carymrobbins/followers","following_url":"https://api.github.com/users/carymrobbins/following{/other_user}","gists_url":"https://api.github.com/users/carymrobbins/gists{/gist_id}","starred_url":"https://api.github.com/users/carymrobbins/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/carymrobbins/subscriptions","organizations_url":"https://api.github.com/users/carymrobbins/orgs","repos_url":"https://api.github.com/users/carymrobbins/repos","events_url":"https://api.github.com/users/carymrobbins/events{/privacy}","received_events_url":"https://api.github.com/users/carymrobbins/received_events","type":"User","site_admin":false},"repo":{"id":15573192,"name":"intellij-haskforce","full_name":"carymrobbins/intellij-haskforce","owner":{"login":"carymrobbins","id":3103764,"avatar_url":"https://avatars.githubusercontent.com/u/3103764?v=3","gravatar_id":"","url":"https://api.github.com/users/carymrobbins","html_url":"https://github.com/carymrobbins","followers_url":"https://api.github.com/users/carymrobbins/followers","following_url":"https://api.github.com/users/carymrobbins/following{/other_user}","gists_url":"https://api.github.com/users/carymrobbins/gists{/gist_id}","starred_url":"https://api.github.com/users/carymrobbins/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/carymrobbins/subscriptions","organizations_url":"https://api.github.com/users/carymrobbins/orgs","repos_url":"https://api.github.com/users/carymrobbins/r
epos","events_url":"https://api.github.com/users/carymrobbins/events{/privacy}","received_events_url":"https://api.github.com/users/carymrobbins/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/carymrobbins/intellij-haskforce","description":"Haskell plugin for IntelliJ IDEA Community Edition","fork":false,"url":"https://api.github.com/repos/carymrobbins/intellij-haskforce","forks_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/forks","keys_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/keys{/key_id}","collaborators_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/teams","hooks_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/hooks","issue_events_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/events{/number}","events_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/events","assignees_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/assignees{/user}","branches_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/branches{/branch}","tags_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/tags","blobs_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/git/refs{/sha}","trees_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/git/trees{/sha}","statuses_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/statuses/{sha}","languages_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/languages","stargazers_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/stargazers","contributors_url":"https://api.
github.com/repos/carymrobbins/intellij-haskforce/contributors","subscribers_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/subscribers","subscription_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/subscription","commits_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/commits{/sha}","git_commits_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/git/commits{/sha}","comments_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/comments{/number}","issue_comment_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/comments/{number}","contents_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/contents/{+path}","compare_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/compare/{base}...{head}","merges_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/merges","archive_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/downloads","issues_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues{/number}","pulls_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls{/number}","milestones_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/milestones{/number}","notifications_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/labels{/name}","releases_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/releases{/id}","created_at":"2014-01-02T01:28:54Z","updated_at":"2014-12-30T16:15:50Z","pushed_at":"2014-12-27T04:28:50Z","git_url":"git://github.com/carymrobbins/intellij-haskforce.git","ssh_url":"git@github.com:carymrobbins/intellij-haskforce.git","clone_url":"https://github.com/carymrobbins/intellij-haskforce.g
it","svn_url":"https://github.com/carymrobbins/intellij-haskforce","homepage":"http://carymrobbins.github.io/intellij-haskforce/","size":11390,"stargazers_count":159,"watchers_count":159,"language":"Java","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":9,"mirror_url":null,"open_issues_count":30,"forks":9,"open_issues":30,"watchers":159,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105"},"html":{"href":"https://github.com/carymrobbins/intellij-haskforce/pull/105"},"issue":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/105"},"comments":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/105/comments"},"review_comments":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105/comments"},"review_comment":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105/commits"},"statuses":{"href":"https://api.github.com/repos/carymrobbins/intellij-haskforce/statuses/73ec576f11ba5aa0906e1ca03bc9390ca94b40e2"}}}},"public":true,"created_at":"2015-01-01T01:03:50Z"}
{"id":"2489397517","type":"IssuesEvent","actor":{"id":1742369,"login":"gbathree","gravatar_id":"","url":"https://api.github.com/users/gbathree","avatar_url":"https://avatars.githubusercontent.com/u/1742369?"},"repo":{"id":20705156,"name":"Photosynq/PhotosynQ-ChromeApp","url":"https://api.github.com/repos/Photosynq/PhotosynQ-ChromeApp"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/Photosynq/PhotosynQ-ChromeApp/issues/15","labels_url":"https://api.github.com/repos/Photosynq/PhotosynQ-ChromeApp/issues/15/labels{/name}","comments_url":"https://api.github.com/repos/Photosynq/PhotosynQ-ChromeApp/issues/15/comments","events_url":"https://api.github.com/repos/Photosynq/PhotosynQ-ChromeApp/issues/15/events","html_url":"https://github.com/Photosynq/PhotosynQ-ChromeApp/issues/15","id":53210243,"number":15,"title":"add 'light_intensity_raw\" - this measures the raw value from the light intensity sensor","user":{"login":"gbathree","id":1742369,"avatar_url":"https://avatars.githubusercontent.com/u/1742369?v=3","gravatar_id":"","url":"https://api.github.com/users/gbathree","html_url":"https://github.com/gbathree","followers_url":"https://api.github.com/users/gbathree/followers","following_url":"https://api.github.com/users/gbathree/following{/other_user}","gists_url":"https://api.github.com/users/gbathree/gists{/gist_id}","starred_url":"https://api.github.com/users/gbathree/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/gbathree/subscriptions","organizations_url":"https://api.github.com/users/gbathree/orgs","repos_url":"https://api.github.com/users/gbathree/repos","events_url":"https://api.github.com/users/gbathree/events{/privacy}","received_events_url":"https://api.github.com/users/gbathree/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/Photosynq/PhotosynQ-ChromeApp/labels/enhancement","name":"enhancement","color":"84b6eb"}],"state":"open","locked":false,"assignee":null,"mi
lestone":null,"comments":0,"created_at":"2015-01-01T01:03:50Z","updated_at":"2015-01-01T01:03:50Z","closed_at":null,"body":"Works exactly like \"light_intensity\".  Also, please change 'light intensity [lumen]' to 'light intensity [micro-einsteins]' (this also applies to data explorer)"}},"public":true,"created_at":"2015-01-01T01:03:52Z","org":{"id":5068236,"login":"Photosynq","gravatar_id":"","url":"https://api.github.com/orgs/Photosynq","avatar_url":"https://avatars.githubusercontent.com/u/5068236?"}}
{"id":"2489397524","type":"PushEvent","actor":{"id":906529,"login":"dpwolfe","gravatar_id":"","url":"https://api.github.com/users/dpwolfe","avatar_url":"https://avatars.githubusercontent.com/u/906529?"},"repo":{"id":26579311,"name":"dpwolfe/otucha","url":"https://api.github.com/repos/dpwolfe/otucha"},"payload":{"push_id":536752985,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"6f79c0b71c6d4a7e3a7d538ed3b96a889c2a33e0","before":"a9a695f1f7a3395f7394ae668feab71f35a5f622","commits":[{"sha":"6f79c0b71c6d4a7e3a7d538ed3b96a889c2a33e0","author":{"email":"b7dfe270ecb2603aba704ea15b776485da19da15@gmail.com","name":"David Wolfe"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/dpwolfe/otucha/commits/6f79c0b71c6d4a7e3a7d538ed3b96a889c2a33e0"}]},"public":true,"created_at":"2015-01-01T01:03:52Z"}
{"id":"2489397525","type":"DeleteEvent","actor":{"id":1398544,"login":"joelpurra","gravatar_id":"","url":"https://api.github.com/users/joelpurra","avatar_url":"https://avatars.githubusercontent.com/u/1398544?"},"repo":{"id":28595466,"name":"joelpurra/jqnpm","url":"https://api.github.com/repos/joelpurra/jqnpm"},"payload":{"ref":"import_659","ref_type":"branch","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:03:52Z"}
{"id":"2489397528","type":"PushEvent","actor":{"id":3187965,"login":"kuanslove","gravatar_id":"","url":"https://api.github.com/users/kuanslove","avatar_url":"https://avatars.githubusercontent.com/u/3187965?"},"repo":{"id":27238819,"name":"kuanslove/kuanslove.github.io","url":"https://api.github.com/repos/kuanslove/kuanslove.github.io"},"payload":{"push_id":536752988,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"e754d70538d1113870734d3cb9a54ceaf708297b","before":"2a58eea671292f434c57c8d4126da39793759d58","commits":[{"sha":"f2395a46dd91bf7d50caf080f4dd19b24445b8e0","author":{"email":"5cf2a1a0b5edf64f8c031f9fcd867f256dcbfa6e@hotmail.com","name":"kuanslove"},"message":"add right menu icon and adjust move effect","distinct":true,"url":"https://api.github.com/repos/kuanslove/kuanslove.github.io/commits/f2395a46dd91bf7d50caf080f4dd19b24445b8e0"},{"sha":"e754d70538d1113870734d3cb9a54ceaf708297b","author":{"email":"5cf2a1a0b5edf64f8c031f9fcd867f256dcbfa6e@hotmail.com","name":"kuanslove"},"message":"merge from remote","distinct":true,"url":"https://api.github.com/repos/kuanslove/kuanslove.github.io/commits/e754d70538d1113870734d3cb9a54ceaf708297b"}]},"public":true,"created_at":"2015-01-01T01:03:53Z"}
{"id":"2489397530","type":"PushEvent","actor":{"id":3196313,"login":"dpastoor","gravatar_id":"","url":"https://api.github.com/users/dpastoor","avatar_url":"https://avatars.githubusercontent.com/u/3196313?"},"repo":{"id":16302099,"name":"dpastoor/PKPDmisc","url":"https://api.github.com/repos/dpastoor/PKPDmisc"},"payload":{"push_id":536752990,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"fd066526d30949d63be752722534a2354edcc5d9","before":"81e56dd1160f5bbe8628cb61de33f4636e4588f0","commits":[{"sha":"fd066526d30949d63be752722534a2354edcc5d9","author":{"email":"5480d79f0d3b1ca7acc7421688b095f8d1e51564@gmail.com","name":"Devin Pastoor"},"message":"add pauc documentation","distinct":true,"url":"https://api.github.com/repos/dpastoor/PKPDmisc/commits/fd066526d30949d63be752722534a2354edcc5d9"}]},"public":true,"created_at":"2015-01-01T01:03:53Z"}
{"id":"2489397533","type":"PullRequestEvent","actor":{"id":19792,"login":"wiredfool","gravatar_id":"","url":"https://api.github.com/users/wiredfool","avatar_url":"https://avatars.githubusercontent.com/u/19792?"},"repo":{"id":5171600,"name":"python-pillow/Pillow","url":"https://api.github.com/repos/python-pillow/Pillow"},"payload":{"action":"opened","number":1061,"pull_request":{"url":"https://api.github.com/repos/python-pillow/Pillow/pulls/1061","id":26739441,"html_url":"https://github.com/python-pillow/Pillow/pull/1061","diff_url":"https://github.com/python-pillow/Pillow/pull/1061.diff","patch_url":"https://github.com/python-pillow/Pillow/pull/1061.patch","issue_url":"https://api.github.com/repos/python-pillow/Pillow/issues/1061","number":1061,"state":"open","locked":false,"title":"Release notes","user":{"login":"wiredfool","id":19792,"avatar_url":"https://avatars.githubusercontent.com/u/19792?v=3","gravatar_id":"","url":"https://api.github.com/users/wiredfool","html_url":"https://github.com/wiredfool","followers_url":"https://api.github.com/users/wiredfool/followers","following_url":"https://api.github.com/users/wiredfool/following{/other_user}","gists_url":"https://api.github.com/users/wiredfool/gists{/gist_id}","starred_url":"https://api.github.com/users/wiredfool/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/wiredfool/subscriptions","organizations_url":"https://api.github.com/users/wiredfool/orgs","repos_url":"https://api.github.com/users/wiredfool/repos","events_url":"https://api.github.com/users/wiredfool/events{/privacy}","received_events_url":"https://api.github.com/users/wiredfool/received_events","type":"User","site_admin":false},"body":"Changes/additions for docs and release notes. 
","created_at":"2015-01-01T01:03:54Z","updated_at":"2015-01-01T01:03:54Z","closed_at":null,"merged_at":null,"merge_commit_sha":null,"assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/python-pillow/Pillow/pulls/1061/commits","review_comments_url":"https://api.github.com/repos/python-pillow/Pillow/pulls/1061/comments","review_comment_url":"https://api.github.com/repos/python-pillow/Pillow/pulls/comments/{number}","comments_url":"https://api.github.com/repos/python-pillow/Pillow/issues/1061/comments","statuses_url":"https://api.github.com/repos/python-pillow/Pillow/statuses/80c7dcbce47437e5fb3fdb05c1fbbdbae0b31e88","head":{"label":"wiredfool:release-notes","ref":"release-notes","sha":"80c7dcbce47437e5fb3fdb05c1fbbdbae0b31e88","user":{"login":"wiredfool","id":19792,"avatar_url":"https://avatars.githubusercontent.com/u/19792?v=3","gravatar_id":"","url":"https://api.github.com/users/wiredfool","html_url":"https://github.com/wiredfool","followers_url":"https://api.github.com/users/wiredfool/followers","following_url":"https://api.github.com/users/wiredfool/following{/other_user}","gists_url":"https://api.github.com/users/wiredfool/gists{/gist_id}","starred_url":"https://api.github.com/users/wiredfool/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/wiredfool/subscriptions","organizations_url":"https://api.github.com/users/wiredfool/orgs","repos_url":"https://api.github.com/users/wiredfool/repos","events_url":"https://api.github.com/users/wiredfool/events{/privacy}","received_events_url":"https://api.github.com/users/wiredfool/received_events","type":"User","site_admin":false},"repo":{"id":8664379,"name":"Pillow","full_name":"wiredfool/Pillow","owner":{"login":"wiredfool","id":19792,"avatar_url":"https://avatars.githubusercontent.com/u/19792?v=3","gravatar_id":"","url":"https://api.github.com/users/wiredfool","html_url":"https://github.com/wiredfool","followers_url":"https://api.github.com/users/wiredfool/followers","follow
ing_url":"https://api.github.com/users/wiredfool/following{/other_user}","gists_url":"https://api.github.com/users/wiredfool/gists{/gist_id}","starred_url":"https://api.github.com/users/wiredfool/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/wiredfool/subscriptions","organizations_url":"https://api.github.com/users/wiredfool/orgs","repos_url":"https://api.github.com/users/wiredfool/repos","events_url":"https://api.github.com/users/wiredfool/events{/privacy}","received_events_url":"https://api.github.com/users/wiredfool/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/wiredfool/Pillow","description":"Pillow is the \"friendly\" PIL fork","fork":true,"url":"https://api.github.com/repos/wiredfool/Pillow","forks_url":"https://api.github.com/repos/wiredfool/Pillow/forks","keys_url":"https://api.github.com/repos/wiredfool/Pillow/keys{/key_id}","collaborators_url":"https://api.github.com/repos/wiredfool/Pillow/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/wiredfool/Pillow/teams","hooks_url":"https://api.github.com/repos/wiredfool/Pillow/hooks","issue_events_url":"https://api.github.com/repos/wiredfool/Pillow/issues/events{/number}","events_url":"https://api.github.com/repos/wiredfool/Pillow/events","assignees_url":"https://api.github.com/repos/wiredfool/Pillow/assignees{/user}","branches_url":"https://api.github.com/repos/wiredfool/Pillow/branches{/branch}","tags_url":"https://api.github.com/repos/wiredfool/Pillow/tags","blobs_url":"https://api.github.com/repos/wiredfool/Pillow/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/wiredfool/Pillow/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/wiredfool/Pillow/git/refs{/sha}","trees_url":"https://api.github.com/repos/wiredfool/Pillow/git/trees{/sha}","statuses_url":"https://api.github.com/repos/wiredfool/Pillow/statuses/{sha}","languages_url":"https://api.github.com/repos/wiredfool/Pillow/languages","
stargazers_url":"https://api.github.com/repos/wiredfool/Pillow/stargazers","contributors_url":"https://api.github.com/repos/wiredfool/Pillow/contributors","subscribers_url":"https://api.github.com/repos/wiredfool/Pillow/subscribers","subscription_url":"https://api.github.com/repos/wiredfool/Pillow/subscription","commits_url":"https://api.github.com/repos/wiredfool/Pillow/commits{/sha}","git_commits_url":"https://api.github.com/repos/wiredfool/Pillow/git/commits{/sha}","comments_url":"https://api.github.com/repos/wiredfool/Pillow/comments{/number}","issue_comment_url":"https://api.github.com/repos/wiredfool/Pillow/issues/comments/{number}","contents_url":"https://api.github.com/repos/wiredfool/Pillow/contents/{+path}","compare_url":"https://api.github.com/repos/wiredfool/Pillow/compare/{base}...{head}","merges_url":"https://api.github.com/repos/wiredfool/Pillow/merges","archive_url":"https://api.github.com/repos/wiredfool/Pillow/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/wiredfool/Pillow/downloads","issues_url":"https://api.github.com/repos/wiredfool/Pillow/issues{/number}","pulls_url":"https://api.github.com/repos/wiredfool/Pillow/pulls{/number}","milestones_url":"https://api.github.com/repos/wiredfool/Pillow/milestones{/number}","notifications_url":"https://api.github.com/repos/wiredfool/Pillow/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/wiredfool/Pillow/labels{/name}","releases_url":"https://api.github.com/repos/wiredfool/Pillow/releases{/id}","created_at":"2013-03-09T03:12:08Z","updated_at":"2014-12-31T23:15:11Z","pushed_at":"2015-01-01T00:37:45Z","git_url":"git://github.com/wiredfool/Pillow.git","ssh_url":"git@github.com:wiredfool/Pillow.git","clone_url":"https://github.com/wiredfool/Pillow.git","svn_url":"https://github.com/wiredfool/Pillow","homepage":"http://python-imaging.github.com","size":14870,"stargazers_count":1,"watchers_count":1,"language":"Python","has_issues":false,"has_downloads":tr
ue,"has_wiki":false,"has_pages":true,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":1,"default_branch":"master"}},"base":{"label":"python-pillow:master","ref":"master","sha":"4889ae776ccbf27a7f955204067812f2aceefba3","user":{"login":"python-pillow","id":2036701,"avatar_url":"https://avatars.githubusercontent.com/u/2036701?v=3","gravatar_id":"","url":"https://api.github.com/users/python-pillow","html_url":"https://github.com/python-pillow","followers_url":"https://api.github.com/users/python-pillow/followers","following_url":"https://api.github.com/users/python-pillow/following{/other_user}","gists_url":"https://api.github.com/users/python-pillow/gists{/gist_id}","starred_url":"https://api.github.com/users/python-pillow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/python-pillow/subscriptions","organizations_url":"https://api.github.com/users/python-pillow/orgs","repos_url":"https://api.github.com/users/python-pillow/repos","events_url":"https://api.github.com/users/python-pillow/events{/privacy}","received_events_url":"https://api.github.com/users/python-pillow/received_events","type":"Organization","site_admin":false},"repo":{"id":5171600,"name":"Pillow","full_name":"python-pillow/Pillow","owner":{"login":"python-pillow","id":2036701,"avatar_url":"https://avatars.githubusercontent.com/u/2036701?v=3","gravatar_id":"","url":"https://api.github.com/users/python-pillow","html_url":"https://github.com/python-pillow","followers_url":"https://api.github.com/users/python-pillow/followers","following_url":"https://api.github.com/users/python-pillow/following{/other_user}","gists_url":"https://api.github.com/users/python-pillow/gists{/gist_id}","starred_url":"https://api.github.com/users/python-pillow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/python-pillow/subscriptions","organizations_url":"https://api.github.com/users/python-pillow/orgs","repos_url":"https://api.github
.com/users/python-pillow/repos","events_url":"https://api.github.com/users/python-pillow/events{/privacy}","received_events_url":"https://api.github.com/users/python-pillow/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/python-pillow/Pillow","description":"The friendly PIL fork","fork":false,"url":"https://api.github.com/repos/python-pillow/Pillow","forks_url":"https://api.github.com/repos/python-pillow/Pillow/forks","keys_url":"https://api.github.com/repos/python-pillow/Pillow/keys{/key_id}","collaborators_url":"https://api.github.com/repos/python-pillow/Pillow/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/python-pillow/Pillow/teams","hooks_url":"https://api.github.com/repos/python-pillow/Pillow/hooks","issue_events_url":"https://api.github.com/repos/python-pillow/Pillow/issues/events{/number}","events_url":"https://api.github.com/repos/python-pillow/Pillow/events","assignees_url":"https://api.github.com/repos/python-pillow/Pillow/assignees{/user}","branches_url":"https://api.github.com/repos/python-pillow/Pillow/branches{/branch}","tags_url":"https://api.github.com/repos/python-pillow/Pillow/tags","blobs_url":"https://api.github.com/repos/python-pillow/Pillow/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/python-pillow/Pillow/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/python-pillow/Pillow/git/refs{/sha}","trees_url":"https://api.github.com/repos/python-pillow/Pillow/git/trees{/sha}","statuses_url":"https://api.github.com/repos/python-pillow/Pillow/statuses/{sha}","languages_url":"https://api.github.com/repos/python-pillow/Pillow/languages","stargazers_url":"https://api.github.com/repos/python-pillow/Pillow/stargazers","contributors_url":"https://api.github.com/repos/python-pillow/Pillow/contributors","subscribers_url":"https://api.github.com/repos/python-pillow/Pillow/subscribers","subscription_url":"https://api.github.com/repos/python-pillow/Pillo
w/subscription","commits_url":"https://api.github.com/repos/python-pillow/Pillow/commits{/sha}","git_commits_url":"https://api.github.com/repos/python-pillow/Pillow/git/commits{/sha}","comments_url":"https://api.github.com/repos/python-pillow/Pillow/comments{/number}","issue_comment_url":"https://api.github.com/repos/python-pillow/Pillow/issues/comments/{number}","contents_url":"https://api.github.com/repos/python-pillow/Pillow/contents/{+path}","compare_url":"https://api.github.com/repos/python-pillow/Pillow/compare/{base}...{head}","merges_url":"https://api.github.com/repos/python-pillow/Pillow/merges","archive_url":"https://api.github.com/repos/python-pillow/Pillow/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/python-pillow/Pillow/downloads","issues_url":"https://api.github.com/repos/python-pillow/Pillow/issues{/number}","pulls_url":"https://api.github.com/repos/python-pillow/Pillow/pulls{/number}","milestones_url":"https://api.github.com/repos/python-pillow/Pillow/milestones{/number}","notifications_url":"https://api.github.com/repos/python-pillow/Pillow/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/python-pillow/Pillow/labels{/name}","releases_url":"https://api.github.com/repos/python-pillow/Pillow/releases{/id}","created_at":"2012-07-24T21:38:39Z","updated_at":"2014-12-31T22:44:33Z","pushed_at":"2014-12-31T22:44:33Z","git_url":"git://github.com/python-pillow/Pillow.git","ssh_url":"git@github.com:python-pillow/Pillow.git","clone_url":"https://github.com/python-pillow/Pillow.git","svn_url":"https://github.com/python-pillow/Pillow","homepage":"http://python-pillow.github.io/","size":20365,"stargazers_count":1391,"watchers_count":1391,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":319,"mirror_url":null,"open_issues_count":64,"forks":319,"open_issues":64,"watchers":1391,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/
repos/python-pillow/Pillow/pulls/1061"},"html":{"href":"https://github.com/python-pillow/Pillow/pull/1061"},"issue":{"href":"https://api.github.com/repos/python-pillow/Pillow/issues/1061"},"comments":{"href":"https://api.github.com/repos/python-pillow/Pillow/issues/1061/comments"},"review_comments":{"href":"https://api.github.com/repos/python-pillow/Pillow/pulls/1061/comments"},"review_comment":{"href":"https://api.github.com/repos/python-pillow/Pillow/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/python-pillow/Pillow/pulls/1061/commits"},"statuses":{"href":"https://api.github.com/repos/python-pillow/Pillow/statuses/80c7dcbce47437e5fb3fdb05c1fbbdbae0b31e88"}},"merged":false,"mergeable":null,"mergeable_state":"unknown","merged_by":null,"comments":0,"review_comments":0,"commits":2,"additions":32,"deletions":2,"changed_files":2}},"public":true,"created_at":"2015-01-01T01:03:55Z","org":{"id":2036701,"login":"python-pillow","gravatar_id":"","url":"https://api.github.com/orgs/python-pillow","avatar_url":"https://avatars.githubusercontent.com/u/2036701?"}}
{"id":"2489397536","type":"PushEvent","actor":{"id":4153853,"login":"jlumijarvi","gravatar_id":"","url":"https://api.github.com/users/jlumijarvi","avatar_url":"https://avatars.githubusercontent.com/u/4153853?"},"repo":{"id":28678176,"name":"jlumijarvi/csv2xml","url":"https://api.github.com/repos/jlumijarvi/csv2xml"},"payload":{"push_id":536752992,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"44f7054077780dd70b8ad070b9b04640a65282ec","before":"b3500640ddd547415a82cbc026d91be7f76ff14f","commits":[{"sha":"b35627f00738be747dc53479874ce39c15437c68","author":{"email":"40e6fc59d2535c98bfd5d19357e20df6e95cef64@gmail.com","name":"jlumijarvi"},"message":"Added comments","distinct":true,"url":"https://api.github.com/repos/jlumijarvi/csv2xml/commits/b35627f00738be747dc53479874ce39c15437c68"},{"sha":"44f7054077780dd70b8ad070b9b04640a65282ec","author":{"email":"40e6fc59d2535c98bfd5d19357e20df6e95cef64@gmail.com","name":"jlumijarvi"},"message":"Merge branch 'master' of https://github.com/jlumijarvi/csv2xml.git","distinct":true,"url":"https://api.github.com/repos/jlumijarvi/csv2xml/commits/44f7054077780dd70b8ad070b9b04640a65282ec"}]},"public":true,"created_at":"2015-01-01T01:03:55Z"}
{"id":"2489397537","type":"PushEvent","actor":{"id":4332428,"login":"mengqhai","gravatar_id":"","url":"https://api.github.com/users/mengqhai","avatar_url":"https://avatars.githubusercontent.com/u/4332428?"},"repo":{"id":16940729,"name":"mengqhai/appbasement","url":"https://api.github.com/repos/mengqhai/appbasement"},"payload":{"push_id":536752993,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"74fd11ab7ae2271f59aa5515885a015ce60e7e58","before":"7690349b1b0ab8689df9049dced11b17a573f225","commits":[{"sha":"74fd11ab7ae2271f59aa5515885a015ce60e7e58","author":{"email":"06b3b513462d14ed6ea9d26d510982ff74cb83ea@gmail.com","name":"Qinghai Meng"},"message":"re-implemented the revision with JPA in a separated table","distinct":true,"url":"https://api.github.com/repos/mengqhai/appbasement/commits/74fd11ab7ae2271f59aa5515885a015ce60e7e58"}]},"public":true,"created_at":"2015-01-01T01:03:55Z"}
{"id":"2489397540","type":"IssuesEvent","actor":{"id":64050,"login":"gjtorikian","gravatar_id":"","url":"https://api.github.com/users/gjtorikian","avatar_url":"https://avatars.githubusercontent.com/u/64050?"},"repo":{"id":10376685,"name":"gjtorikian/markdowntutorial.com","url":"https://api.github.com/repos/gjtorikian/markdowntutorial.com"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/gjtorikian/markdowntutorial.com/issues/37","labels_url":"https://api.github.com/repos/gjtorikian/markdowntutorial.com/issues/37/labels{/name}","comments_url":"https://api.github.com/repos/gjtorikian/markdowntutorial.com/issues/37/comments","events_url":"https://api.github.com/repos/gjtorikian/markdowntutorial.com/issues/37/events","html_url":"https://github.com/gjtorikian/markdowntutorial.com/issues/37","id":53166139,"number":37,"title":"Second exercise in Lesson 6","user":{"login":"cliffvick","id":72509,"avatar_url":"https://avatars.githubusercontent.com/u/72509?v=3","gravatar_id":"","url":"https://api.github.com/users/cliffvick","html_url":"https://github.com/cliffvick","followers_url":"https://api.github.com/users/cliffvick/followers","following_url":"https://api.github.com/users/cliffvick/following{/other_user}","gists_url":"https://api.github.com/users/cliffvick/gists{/gist_id}","starred_url":"https://api.github.com/users/cliffvick/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/cliffvick/subscriptions","organizations_url":"https://api.github.com/users/cliffvick/orgs","repos_url":"https://api.github.com/users/cliffvick/repos","events_url":"https://api.github.com/users/cliffvick/events{/privacy}","received_events_url":"https://api.github.com/users/cliffvick/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2014-12-31T04:07:58Z","updated_at":"2015-01-01T01:03:56Z","closed_at":"2015-01-01T01:03:56Z","body":"The criteria for 
continuing on to the next exercise in the lesson is incorrect in the js/lesson_plans.coffee file (line 69).  The provided text omits the periods, but the lesson plan expects a period after each item."}},"public":true,"created_at":"2015-01-01T01:03:57Z"}
{"id":"2489397542","type":"IssuesEvent","actor":{"id":4296161,"login":"jefftune","gravatar_id":"","url":"https://api.github.com/users/jefftune","avatar_url":"https://avatars.githubusercontent.com/u/4296161?"},"repo":{"id":25269705,"name":"MobileAppTracking/tune-reporting-python","url":"https://api.github.com/repos/MobileAppTracking/tune-reporting-python"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/MobileAppTracking/tune-reporting-python/issues/71","labels_url":"https://api.github.com/repos/MobileAppTracking/tune-reporting-python/issues/71/labels{/name}","comments_url":"https://api.github.com/repos/MobileAppTracking/tune-reporting-python/issues/71/comments","events_url":"https://api.github.com/repos/MobileAppTracking/tune-reporting-python/issues/71/events","html_url":"https://github.com/MobileAppTracking/tune-reporting-python/issues/71","id":53210246,"number":71,"title":"Python -- Set Configuration","user":{"login":"jefftune","id":4296161,"avatar_url":"https://avatars.githubusercontent.com/u/4296161?v=3","gravatar_id":"","url":"https://api.github.com/users/jefftune","html_url":"https://github.com/jefftune","followers_url":"https://api.github.com/users/jefftune/followers","following_url":"https://api.github.com/users/jefftune/following{/other_user}","gists_url":"https://api.github.com/users/jefftune/gists{/gist_id}","starred_url":"https://api.github.com/users/jefftune/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jefftune/subscriptions","organizations_url":"https://api.github.com/users/jefftune/orgs","repos_url":"https://api.github.com/users/jefftune/repos","events_url":"https://api.github.com/users/jefftune/events{/privacy}","received_events_url":"https://api.github.com/users/jefftune/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/MobileAppTracking/tune-reporting-python/labels/Development","name":"Development","color":"0052cc"}],"state":"open","locked":false,
"assignee":{"login":"jefftune","id":4296161,"avatar_url":"https://avatars.githubusercontent.com/u/4296161?v=3","gravatar_id":"","url":"https://api.github.com/users/jefftune","html_url":"https://github.com/jefftune","followers_url":"https://api.github.com/users/jefftune/followers","following_url":"https://api.github.com/users/jefftune/following{/other_user}","gists_url":"https://api.github.com/users/jefftune/gists{/gist_id}","starred_url":"https://api.github.com/users/jefftune/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jefftune/subscriptions","organizations_url":"https://api.github.com/users/jefftune/orgs","repos_url":"https://api.github.com/users/jefftune/repos","events_url":"https://api.github.com/users/jefftune/events{/privacy}","received_events_url":"https://api.github.com/users/jefftune/received_events","type":"User","site_admin":false},"milestone":{"url":"https://api.github.com/repos/MobileAppTracking/tune-reporting-python/milestones/5","labels_url":"https://api.github.com/repos/MobileAppTracking/tune-reporting-python/milestones/5/labels","id":899375,"number":5,"title":"2014-12-30","description":"","creator":{"login":"jefftune","id":4296161,"avatar_url":"https://avatars.githubusercontent.com/u/4296161?v=3","gravatar_id":"","url":"https://api.github.com/users/jefftune","html_url":"https://github.com/jefftune","followers_url":"https://api.github.com/users/jefftune/followers","following_url":"https://api.github.com/users/jefftune/following{/other_user}","gists_url":"https://api.github.com/users/jefftune/gists{/gist_id}","starred_url":"https://api.github.com/users/jefftune/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jefftune/subscriptions","organizations_url":"https://api.github.com/users/jefftune/orgs","repos_url":"https://api.github.com/users/jefftune/repos","events_url":"https://api.github.com/users/jefftune/events{/privacy}","received_events_url":"https://api.github.com/users/jefftune/received_events"
,"type":"User","site_admin":false},"open_issues":2,"closed_issues":7,"state":"open","created_at":"2014-12-10T19:53:05Z","updated_at":"2015-01-01T01:03:56Z","due_on":"2014-12-30T08:00:00Z","closed_at":null},"comments":0,"created_at":"2015-01-01T01:03:56Z","updated_at":"2015-01-01T01:03:56Z","closed_at":null,"body":""}},"public":true,"created_at":"2015-01-01T01:03:57Z","org":{"id":1920066,"login":"MobileAppTracking","gravatar_id":"","url":"https://api.github.com/orgs/MobileAppTracking","avatar_url":"https://avatars.githubusercontent.com/u/1920066?"}}
{"id":"2489397543","type":"IssueCommentEvent","actor":{"id":13026,"login":"titanous","gravatar_id":"","url":"https://api.github.com/users/titanous","avatar_url":"https://avatars.githubusercontent.com/u/13026?"},"repo":{"id":11290232,"name":"flynn/flynn","url":"https://api.github.com/repos/flynn/flynn"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/flynn/flynn/issues/547","labels_url":"https://api.github.com/repos/flynn/flynn/issues/547/labels{/name}","comments_url":"https://api.github.com/repos/flynn/flynn/issues/547/comments","events_url":"https://api.github.com/repos/flynn/flynn/issues/547/events","html_url":"https://github.com/flynn/flynn/pull/547","id":50875297,"number":547,"title":"Add queue package","user":{"login":"lmars","id":488515,"avatar_url":"https://avatars.githubusercontent.com/u/488515?v=3","gravatar_id":"","url":"https://api.github.com/users/lmars","html_url":"https://github.com/lmars","followers_url":"https://api.github.com/users/lmars/followers","following_url":"https://api.github.com/users/lmars/following{/other_user}","gists_url":"https://api.github.com/users/lmars/gists{/gist_id}","starred_url":"https://api.github.com/users/lmars/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/lmars/subscriptions","organizations_url":"https://api.github.com/users/lmars/orgs","repos_url":"https://api.github.com/users/lmars/repos","events_url":"https://api.github.com/users/lmars/events{/privacy}","received_events_url":"https://api.github.com/users/lmars/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":12,"created_at":"2014-12-03T18:42:18Z","updated_at":"2015-01-01T01:03:55Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/flynn/flynn/pulls/547","html_url":"https://github.com/flynn/flynn/pull/547","diff_url":"https://github.com/flynn/flynn/pull/547.diff","patch_url":"https://github.com/flynn/flynn/pull/5
47.patch"},"body":"This is based on the [Ruby QueueClassic library](https://github.com/QueueClassic/queue_classic).\r\n\r\nOpening now for early feedback.\r\n\r\nPrerequisite for #536 "},"comment":{"url":"https://api.github.com/repos/flynn/flynn/issues/comments/68477294","html_url":"https://github.com/flynn/flynn/pull/547#issuecomment-68477294","issue_url":"https://api.github.com/repos/flynn/flynn/issues/547","id":68477294,"user":{"login":"titanous","id":13026,"avatar_url":"https://avatars.githubusercontent.com/u/13026?v=3","gravatar_id":"","url":"https://api.github.com/users/titanous","html_url":"https://github.com/titanous","followers_url":"https://api.github.com/users/titanous/followers","following_url":"https://api.github.com/users/titanous/following{/other_user}","gists_url":"https://api.github.com/users/titanous/gists{/gist_id}","starred_url":"https://api.github.com/users/titanous/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/titanous/subscriptions","organizations_url":"https://api.github.com/users/titanous/orgs","repos_url":"https://api.github.com/users/titanous/repos","events_url":"https://api.github.com/users/titanous/events{/privacy}","received_events_url":"https://api.github.com/users/titanous/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:03:55Z","updated_at":"2015-01-01T01:03:55Z","body":"It's worth looking at https://github.com/bgentry/que-go which claims to use faster queries and appears to solve the locking issues by using a different pg driver which makes more guarantees about connection usage."}},"public":true,"created_at":"2015-01-01T01:03:57Z","org":{"id":4973613,"login":"flynn","gravatar_id":"","url":"https://api.github.com/orgs/flynn","avatar_url":"https://avatars.githubusercontent.com/u/4973613?"}}
{"id":"2489397544","type":"WatchEvent","actor":{"id":1015032,"login":"miketahani","gravatar_id":"","url":"https://api.github.com/users/miketahani","avatar_url":"https://avatars.githubusercontent.com/u/1015032?"},"repo":{"id":20197962,"name":"kenjiSpecial/100day-canvas-bootcamp-training","url":"https://api.github.com/repos/kenjiSpecial/100day-canvas-bootcamp-training"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:03:57Z"}
{"id":"2489397548","type":"ForkEvent","actor":{"id":3395224,"login":"sunnyy02","gravatar_id":"","url":"https://api.github.com/users/sunnyy02","avatar_url":"https://avatars.githubusercontent.com/u/3395224?"},"repo":{"id":18972654,"name":"jquintus/spikes","url":"https://api.github.com/repos/jquintus/spikes"},"payload":{"forkee":{"id":28678247,"name":"spikes","full_name":"sunnyy02/spikes","owner":{"login":"sunnyy02","id":3395224,"avatar_url":"https://avatars.githubusercontent.com/u/3395224?v=3","gravatar_id":"","url":"https://api.github.com/users/sunnyy02","html_url":"https://github.com/sunnyy02","followers_url":"https://api.github.com/users/sunnyy02/followers","following_url":"https://api.github.com/users/sunnyy02/following{/other_user}","gists_url":"https://api.github.com/users/sunnyy02/gists{/gist_id}","starred_url":"https://api.github.com/users/sunnyy02/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/sunnyy02/subscriptions","organizations_url":"https://api.github.com/users/sunnyy02/orgs","repos_url":"https://api.github.com/users/sunnyy02/repos","events_url":"https://api.github.com/users/sunnyy02/events{/privacy}","received_events_url":"https://api.github.com/users/sunnyy02/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/sunnyy02/spikes","description":"Test and simple sample code.  Nothing fancy, lots of dead ends.  
No dragons.","fork":true,"url":"https://api.github.com/repos/sunnyy02/spikes","forks_url":"https://api.github.com/repos/sunnyy02/spikes/forks","keys_url":"https://api.github.com/repos/sunnyy02/spikes/keys{/key_id}","collaborators_url":"https://api.github.com/repos/sunnyy02/spikes/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/sunnyy02/spikes/teams","hooks_url":"https://api.github.com/repos/sunnyy02/spikes/hooks","issue_events_url":"https://api.github.com/repos/sunnyy02/spikes/issues/events{/number}","events_url":"https://api.github.com/repos/sunnyy02/spikes/events","assignees_url":"https://api.github.com/repos/sunnyy02/spikes/assignees{/user}","branches_url":"https://api.github.com/repos/sunnyy02/spikes/branches{/branch}","tags_url":"https://api.github.com/repos/sunnyy02/spikes/tags","blobs_url":"https://api.github.com/repos/sunnyy02/spikes/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/sunnyy02/spikes/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/sunnyy02/spikes/git/refs{/sha}","trees_url":"https://api.github.com/repos/sunnyy02/spikes/git/trees{/sha}","statuses_url":"https://api.github.com/repos/sunnyy02/spikes/statuses/{sha}","languages_url":"https://api.github.com/repos/sunnyy02/spikes/languages","stargazers_url":"https://api.github.com/repos/sunnyy02/spikes/stargazers","contributors_url":"https://api.github.com/repos/sunnyy02/spikes/contributors","subscribers_url":"https://api.github.com/repos/sunnyy02/spikes/subscribers","subscription_url":"https://api.github.com/repos/sunnyy02/spikes/subscription","commits_url":"https://api.github.com/repos/sunnyy02/spikes/commits{/sha}","git_commits_url":"https://api.github.com/repos/sunnyy02/spikes/git/commits{/sha}","comments_url":"https://api.github.com/repos/sunnyy02/spikes/comments{/number}","issue_comment_url":"https://api.github.com/repos/sunnyy02/spikes/issues/comments/{number}","contents_url":"https://api.github.com/repos/sunnyy02/spikes/contents/{+path}","compar
e_url":"https://api.github.com/repos/sunnyy02/spikes/compare/{base}...{head}","merges_url":"https://api.github.com/repos/sunnyy02/spikes/merges","archive_url":"https://api.github.com/repos/sunnyy02/spikes/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/sunnyy02/spikes/downloads","issues_url":"https://api.github.com/repos/sunnyy02/spikes/issues{/number}","pulls_url":"https://api.github.com/repos/sunnyy02/spikes/pulls{/number}","milestones_url":"https://api.github.com/repos/sunnyy02/spikes/milestones{/number}","notifications_url":"https://api.github.com/repos/sunnyy02/spikes/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/sunnyy02/spikes/labels{/name}","releases_url":"https://api.github.com/repos/sunnyy02/spikes/releases{/id}","created_at":"2015-01-01T01:03:57Z","updated_at":"2014-12-27T20:43:44Z","pushed_at":"2014-12-04T21:54:59Z","git_url":"git://github.com/sunnyy02/spikes.git","ssh_url":"git@github.com:sunnyy02/spikes.git","clone_url":"https://github.com/sunnyy02/spikes.git","svn_url":"https://github.com/sunnyy02/spikes","homepage":null,"size":24175,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:03:57Z"}
{"id":"2489397553","type":"PushEvent","actor":{"id":8508709,"login":"raabbajam","gravatar_id":"","url":"https://api.github.com/users/raabbajam","avatar_url":"https://avatars.githubusercontent.com/u/8508709?"},"repo":{"id":26143713,"name":"raabbajam/priceCacheCalendar","url":"https://api.github.com/repos/raabbajam/priceCacheCalendar"},"payload":{"push_id":536752996,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"7153d3eb326cc465ab28f1c1fe366343773cce1e","before":"d53d4a81198a108a2eb66fd506dc3e7f159a6a23","commits":[{"sha":"7153d3eb326cc465ab28f1c1fe366343773cce1e","author":{"email":"a6d869d99a512698feb7bc061802b95b71e0b394@gmail.com","name":"Muhammad Abdul Jabbaar"},"message":"sr@looper change parallel","distinct":true,"url":"https://api.github.com/repos/raabbajam/priceCacheCalendar/commits/7153d3eb326cc465ab28f1c1fe366343773cce1e"}]},"public":true,"created_at":"2015-01-01T01:03:57Z"}
{"id":"2489397555","type":"PushEvent","actor":{"id":7671394,"login":"seinosuke","gravatar_id":"","url":"https://api.github.com/users/seinosuke","avatar_url":"https://avatars.githubusercontent.com/u/7671394?"},"repo":{"id":27248287,"name":"seinosuke/moritan_bot","url":"https://api.github.com/repos/seinosuke/moritan_bot"},"payload":{"push_id":536752998,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"cd2a54765a2ef7c40e377466bb873a22787c93e1","before":"eff699194d79382606198a11cc257715fac32073","commits":[{"sha":"cd2a54765a2ef7c40e377466bb873a22787c93e1","author":{"email":"bf9e3b55334d2166aced4606c08396ce6b193d78@gmail.com","name":"seinosuke"},"message":"Don't repeat yourself入門","distinct":true,"url":"https://api.github.com/repos/seinosuke/moritan_bot/commits/cd2a54765a2ef7c40e377466bb873a22787c93e1"}]},"public":true,"created_at":"2015-01-01T01:03:57Z"}
{"id":"2489397556","type":"PushEvent","actor":{"id":2829600,"login":"GrahamCampbell","gravatar_id":"","url":"https://api.github.com/users/GrahamCampbell","avatar_url":"https://avatars.githubusercontent.com/u/2829600?"},"repo":{"id":26726717,"name":"StyleCI/Fixer","url":"https://api.github.com/repos/StyleCI/Fixer"},"payload":{"push_id":536752999,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f0214192687388ffe5167091fa3fa4fe4db0139c","before":"c99705b02b76d09d6fbc1734421ef4ef8207d943","commits":[{"sha":"f0214192687388ffe5167091fa3fa4fe4db0139c","author":{"email":"5ca27e75aea3e5e83a04c6cfa5f1b63d358cd03d@mineuk.com","name":"Graham Campbell"},"message":"Updated license noticies","distinct":true,"url":"https://api.github.com/repos/StyleCI/Fixer/commits/f0214192687388ffe5167091fa3fa4fe4db0139c"}]},"public":true,"created_at":"2015-01-01T01:03:57Z","org":{"id":10179029,"login":"StyleCI","gravatar_id":"","url":"https://api.github.com/orgs/StyleCI","avatar_url":"https://avatars.githubusercontent.com/u/10179029?"}}
{"id":"2489397561","type":"PushEvent","actor":{"id":238354,"login":"variousred","gravatar_id":"","url":"https://api.github.com/users/variousred","avatar_url":"https://avatars.githubusercontent.com/u/238354?"},"repo":{"id":6274404,"name":"G5/g5-content-management-system","url":"https://api.github.com/repos/G5/g5-content-management-system"},"payload":{"push_id":536753002,"size":1,"distinct_size":1,"ref":"refs/heads/fix-deep-clone","head":"81baf7738ce7da9084ecd6f657cd3c0e60f888a2","before":"e77a319f12682833e503da292a55f3a5f32cde28","commits":[{"sha":"81baf7738ce7da9084ecd6f657cd3c0e60f888a2","author":{"email":"16ea8d52c08316685a257e07ddecf7165a502f6d@gmail.com","name":"Michael Mitchell"},"message":"refactors specs,\n@ckeckert this one failing test remaining might atually be uncovering a real bug. It seems we are creating an extra widget in the clone process.","distinct":true,"url":"https://api.github.com/repos/G5/g5-content-management-system/commits/81baf7738ce7da9084ecd6f657cd3c0e60f888a2"}]},"public":true,"created_at":"2015-01-01T01:03:57Z","org":{"id":2396851,"login":"G5","gravatar_id":"","url":"https://api.github.com/orgs/G5","avatar_url":"https://avatars.githubusercontent.com/u/2396851?"}}
{"id":"2489397563","type":"PushEvent","actor":{"id":501642,"login":"plouc","gravatar_id":"","url":"https://api.github.com/users/plouc","avatar_url":"https://avatars.githubusercontent.com/u/501642?"},"repo":{"id":28498113,"name":"plouc/mozaik","url":"https://api.github.com/repos/plouc/mozaik"},"payload":{"push_id":536753003,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"eaa14dd02a30069e42cd770d5ddf478e6cd17086","before":"0b27989723feb4b183d5f87813fef146b670b1d1","commits":[{"sha":"eaa14dd02a30069e42cd770d5ddf478e6cd17086","author":{"email":"7c5a0c567b5584a13fde407456875318a5bec977@gmail.com","name":"Raphaël Benitte"},"message":"Update README","distinct":true,"url":"https://api.github.com/repos/plouc/mozaik/commits/eaa14dd02a30069e42cd770d5ddf478e6cd17086"}]},"public":true,"created_at":"2015-01-01T01:03:57Z"}
{"id":"2489397581","type":"PushEvent","actor":{"id":899410,"login":"mikeferguson","gravatar_id":"","url":"https://api.github.com/users/mikeferguson","avatar_url":"https://avatars.githubusercontent.com/u/899410?"},"repo":{"id":26391646,"name":"mikeferguson/robot_calibration","url":"https://api.github.com/repos/mikeferguson/robot_calibration"},"payload":{"push_id":536753009,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e60f2c778394e62a9fa7c2401d2c8820d057e6dc","before":"2c5350c469f355dee1e421e448ac1a1277776be4","commits":[{"sha":"e60f2c778394e62a9fa7c2401d2c8820d057e6dc","author":{"email":"0b5e4dd894fb6bcaed9be1bfeed1c6d2ad1491ba@gmail.com","name":"Michael Ferguson"},"message":"load parameters from ros","distinct":true,"url":"https://api.github.com/repos/mikeferguson/robot_calibration/commits/e60f2c778394e62a9fa7c2401d2c8820d057e6dc"}]},"public":true,"created_at":"2015-01-01T01:03:59Z"}
{"id":"2489397599","type":"IssuesEvent","actor":{"id":839216,"login":"rohni","gravatar_id":"","url":"https://api.github.com/users/rohni","avatar_url":"https://avatars.githubusercontent.com/u/839216?"},"repo":{"id":10087975,"name":"tailrecursion/hoplon","url":"https://api.github.com/repos/tailrecursion/hoplon"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/tailrecursion/hoplon/issues/50","labels_url":"https://api.github.com/repos/tailrecursion/hoplon/issues/50/labels{/name}","comments_url":"https://api.github.com/repos/tailrecursion/hoplon/issues/50/comments","events_url":"https://api.github.com/repos/tailrecursion/hoplon/issues/50/events","html_url":"https://github.com/tailrecursion/hoplon/issues/50","id":53210250,"number":50,"title":"Following hoplon Getting Started, fails on Step 2","user":{"login":"rohni","id":839216,"avatar_url":"https://avatars.githubusercontent.com/u/839216?v=3","gravatar_id":"","url":"https://api.github.com/users/rohni","html_url":"https://github.com/rohni","followers_url":"https://api.github.com/users/rohni/followers","following_url":"https://api.github.com/users/rohni/following{/other_user}","gists_url":"https://api.github.com/users/rohni/gists{/gist_id}","starred_url":"https://api.github.com/users/rohni/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/rohni/subscriptions","organizations_url":"https://api.github.com/users/rohni/orgs","repos_url":"https://api.github.com/users/rohni/repos","events_url":"https://api.github.com/users/rohni/events{/privacy}","received_events_url":"https://api.github.com/users/rohni/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:04:01Z","updated_at":"2015-01-01T01:04:01Z","closed_at":null,"body":"Hi there,\r\nI was really excited to try out hoplon, but ran into this snag:\r\n\r\n     Task 2: Compile the project.\r\n\r\n     $ boot 
development\r\n\r\nHowever, this fails with:\r\n\r\n    java.lang.RuntimeException: No reader function for tag tailrecursion.boot.core/version\r\n\r\nI tried upgrading boot:\r\n\r\n    Retrieving boot-2.0.0-rc4.jar from http://clojars.org/repo/\r\n    #https://github.com/boot-clj/boot\r\n    #Thu Jan 01 01:58:12 CET 2015\r\n    BOOT_CLOJURE_VERSION=1.6.0\r\n    BOOT_VERSION=2.0.0-rc4\r\n\r\nBut just received the same error.\r\n\r\nI am stuck, and in need of sleep. :)  If anyone can figure out what is going wrong here I would love to move onto exploring hoplon.\r\n\r\nThanks,\r\n\r\nRohni"}},"public":true,"created_at":"2015-01-01T01:04:01Z","org":{"id":3443819,"login":"tailrecursion","gravatar_id":"","url":"https://api.github.com/orgs/tailrecursion","avatar_url":"https://avatars.githubusercontent.com/u/3443819?"}}
{"id":"2489397603","type":"ForkEvent","actor":{"id":8671867,"login":"Meehoweq","gravatar_id":"","url":"https://api.github.com/users/Meehoweq","avatar_url":"https://avatars.githubusercontent.com/u/8671867?"},"repo":{"id":24366589,"name":"Dzikoysk/FunnyGuilds","url":"https://api.github.com/repos/Dzikoysk/FunnyGuilds"},"payload":{"forkee":{"id":28678250,"name":"FunnyGuilds","full_name":"Meehoweq/FunnyGuilds","owner":{"login":"Meehoweq","id":8671867,"avatar_url":"https://avatars.githubusercontent.com/u/8671867?v=3","gravatar_id":"","url":"https://api.github.com/users/Meehoweq","html_url":"https://github.com/Meehoweq","followers_url":"https://api.github.com/users/Meehoweq/followers","following_url":"https://api.github.com/users/Meehoweq/following{/other_user}","gists_url":"https://api.github.com/users/Meehoweq/gists{/gist_id}","starred_url":"https://api.github.com/users/Meehoweq/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Meehoweq/subscriptions","organizations_url":"https://api.github.com/users/Meehoweq/orgs","repos_url":"https://api.github.com/users/Meehoweq/repos","events_url":"https://api.github.com/users/Meehoweq/events{/privacy}","received_events_url":"https://api.github.com/users/Meehoweq/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/Meehoweq/FunnyGuilds","description":"","fork":true,"url":"https://api.github.com/repos/Meehoweq/FunnyGuilds","forks_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/forks","keys_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/keys{/key_id}","collaborators_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/teams","hooks_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/hooks","issue_events_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/issues/events{/number}","events_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/events",
"assignees_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/assignees{/user}","branches_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/branches{/branch}","tags_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/tags","blobs_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/git/refs{/sha}","trees_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/git/trees{/sha}","statuses_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/statuses/{sha}","languages_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/languages","stargazers_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/stargazers","contributors_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/contributors","subscribers_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/subscribers","subscription_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/subscription","commits_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/commits{/sha}","git_commits_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/git/commits{/sha}","comments_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/comments{/number}","issue_comment_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/issues/comments/{number}","contents_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/contents/{+path}","compare_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/compare/{base}...{head}","merges_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/merges","archive_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/downloads","issues_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/issues{/number}","pulls_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/pulls{/number}","milestones_url":"https:/
/api.github.com/repos/Meehoweq/FunnyGuilds/milestones{/number}","notifications_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/labels{/name}","releases_url":"https://api.github.com/repos/Meehoweq/FunnyGuilds/releases{/id}","created_at":"2015-01-01T01:04:01Z","updated_at":"2014-12-31T21:12:33Z","pushed_at":"2014-12-31T21:21:42Z","git_url":"git://github.com/Meehoweq/FunnyGuilds.git","ssh_url":"git@github.com:Meehoweq/FunnyGuilds.git","clone_url":"https://github.com/Meehoweq/FunnyGuilds.git","svn_url":"https://github.com/Meehoweq/FunnyGuilds","homepage":"","size":959,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:04:01Z"}
{"id":"2489397607","type":"CreateEvent","actor":{"id":5831804,"login":"YueLinHo","gravatar_id":"","url":"https://api.github.com/users/YueLinHo","avatar_url":"https://avatars.githubusercontent.com/u/5831804?"},"repo":{"id":21376277,"name":"YueLinHo/TortoiseGit","url":"https://api.github.com/repos/YueLinHo/TortoiseGit"},"payload":{"ref":"ylh/happy_new_year_2015","ref_type":"branch","master_branch":"master","description":"Windows Explorer Extension to Operate Git; Mirror of GoogleCode repository","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:04:02Z"}
{"id":"2489397612","type":"GollumEvent","actor":{"id":7797609,"login":"ivanwfr","gravatar_id":"","url":"https://api.github.com/users/ivanwfr","avatar_url":"https://avatars.githubusercontent.com/u/7797609?"},"repo":{"id":808316,"name":"cswetenham/tabspace2.1","url":"https://api.github.com/repos/cswetenham/tabspace2.1"},"payload":{"pages":[{"page_name":"Home","title":"Home","summary":null,"action":"edited","sha":"be2f83e475fa43ab7785aa503ab92d4c098015c0","html_url":"https://github.com/cswetenham/tabspace2.1/wiki/Home"}]},"public":true,"created_at":"2015-01-01T01:04:02Z"}
{"id":"2489397613","type":"PushEvent","actor":{"id":3599988,"login":"wesdizzle","gravatar_id":"","url":"https://api.github.com/users/wesdizzle","avatar_url":"https://avatars.githubusercontent.com/u/3599988?"},"repo":{"id":28250120,"name":"wesdizzle/gagglelog","url":"https://api.github.com/repos/wesdizzle/gagglelog"},"payload":{"push_id":536753016,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"fc86231b5063c1b8f2ed07b8d1ae887580869fcf","before":"699893742e393b99eb2250f17b2aad8979d7b454","commits":[{"sha":"fc86231b5063c1b8f2ed07b8d1ae887580869fcf","author":{"email":"baaa01a5d45f86e3d8f7008866cf0d37bea55570@gmail.com","name":"Wesley Miller"},"message":"changed Index from bit to int in DistributionMethods for cases with more than two distribution methods tha need to be sorted (Genesis Cartridge, 32X Cartridge, CD)","distinct":true,"url":"https://api.github.com/repos/wesdizzle/gagglelog/commits/fc86231b5063c1b8f2ed07b8d1ae887580869fcf"}]},"public":true,"created_at":"2015-01-01T01:04:02Z"}
{"id":"2489397617","type":"CreateEvent","actor":{"id":200511,"login":"alexanderdean","gravatar_id":"","url":"https://api.github.com/users/alexanderdean","avatar_url":"https://avatars.githubusercontent.com/u/200511?"},"repo":{"id":28678252,"name":"alexanderdean/lambda-example-project","url":"https://api.github.com/repos/alexanderdean/lambda-example-project"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"An example AWS Lambda application for processing a Kinesis stream of Snowplow enriched events ","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:04:02Z"}
{"id":"2489397620","type":"PushEvent","actor":{"id":433707,"login":"ile","gravatar_id":"","url":"https://api.github.com/users/ile","avatar_url":"https://avatars.githubusercontent.com/u/433707?"},"repo":{"id":26847132,"name":"kantele/k-templates","url":"https://api.github.com/repos/kantele/k-templates"},"payload":{"push_id":536753019,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"0c74567d174b0901cf19bde2f2ddc65e1d4ff6e1","before":"53ba5e0e3194a42192f5aa9f9cd3fd2d79281ce4","commits":[{"sha":"0c74567d174b0901cf19bde2f2ddc65e1d4ff6e1","author":{"email":"4f3407de78bccc8cc160ee4d278d5efe7162e6b5@nateps.com","name":"Nate Smith"},"message":"0.2.0\n\nConflicts:\n\tpackage.json","distinct":true,"url":"https://api.github.com/repos/kantele/k-templates/commits/0c74567d174b0901cf19bde2f2ddc65e1d4ff6e1"}]},"public":true,"created_at":"2015-01-01T01:04:03Z","org":{"id":5687585,"login":"kantele","gravatar_id":"","url":"https://api.github.com/orgs/kantele","avatar_url":"https://avatars.githubusercontent.com/u/5687585?"}}
{"id":"2489397621","type":"PushEvent","actor":{"id":1362216,"login":"gmenih341","gravatar_id":"","url":"https://api.github.com/users/gmenih341","avatar_url":"https://avatars.githubusercontent.com/u/1362216?"},"repo":{"id":28205917,"name":"gmenih341/gm_webpage","url":"https://api.github.com/repos/gmenih341/gm_webpage"},"payload":{"push_id":536753020,"size":6,"distinct_size":0,"ref":"refs/heads/master","head":"44b4ebfe84e066b96aa9a1e99351030e539f5020","before":"a9289eb4413ceb90e8c4ef9d1ba3510dc1a5cc79","commits":[{"sha":"b79ef407608a48bbf713e6cac3e0da901439ef47","author":{"email":"0b197f5d14de9a1e08df323456fabeaf2b9315d7@gmail.com","name":"gmenih341"},"message":"adding files to branch","distinct":false,"url":"https://api.github.com/repos/gmenih341/gm_webpage/commits/b79ef407608a48bbf713e6cac3e0da901439ef47"},{"sha":"7bb277f4b421943b47dd57547bb8f15aaaa8dc4e","author":{"email":"0b197f5d14de9a1e08df323456fabeaf2b9315d7@gmail.com","name":"gmenih341"},"message":"Removed all files","distinct":false,"url":"https://api.github.com/repos/gmenih341/gm_webpage/commits/7bb277f4b421943b47dd57547bb8f15aaaa8dc4e"},{"sha":"0927195f20d7f7ee7726d6eaeaeb2a7c138c4e75","author":{"email":"0b197f5d14de9a1e08df323456fabeaf2b9315d7@gmail.com","name":"gmenih341"},"message":"Ported to ExpressJS","distinct":false,"url":"https://api.github.com/repos/gmenih341/gm_webpage/commits/0927195f20d7f7ee7726d6eaeaeb2a7c138c4e75"},{"sha":"26efa9dbb30fc9f7ab5a7324a5b55b0f4d015c66","author":{"email":"0b197f5d14de9a1e08df323456fabeaf2b9315d7@gmail.com","name":"Gregor Menih"},"message":"Create README.md","distinct":false,"url":"https://api.github.com/repos/gmenih341/gm_webpage/commits/26efa9dbb30fc9f7ab5a7324a5b55b0f4d015c66"},{"sha":"934f504d8abd4adceb718a6767e9d56c5f7fa856","author":{"email":"0b197f5d14de9a1e08df323456fabeaf2b9315d7@gmail.com","name":"gmenih341"},"message":"Added mongo & monk 
dependencies","distinct":false,"url":"https://api.github.com/repos/gmenih341/gm_webpage/commits/934f504d8abd4adceb718a6767e9d56c5f7fa856"},{"sha":"44b4ebfe84e066b96aa9a1e99351030e539f5020","author":{"email":"0b197f5d14de9a1e08df323456fabeaf2b9315d7@gmail.com","name":"gmenih341"},"message":"updated readme","distinct":false,"url":"https://api.github.com/repos/gmenih341/gm_webpage/commits/44b4ebfe84e066b96aa9a1e99351030e539f5020"}]},"public":true,"created_at":"2015-01-01T01:04:03Z"}
{"id":"2489397623","type":"PushEvent","actor":{"id":6413475,"login":"vlj","gravatar_id":"","url":"https://api.github.com/users/vlj","avatar_url":"https://avatars.githubusercontent.com/u/6413475?"},"repo":{"id":15920273,"name":"supertuxkart/stk-code","url":"https://api.github.com/repos/supertuxkart/stk-code"},"payload":{"push_id":536753018,"size":1,"distinct_size":1,"ref":"refs/heads/lspsm","head":"08fed2cfe31a7280384ae8ef494af462af62267d","before":"26ffdd0e55e79ad7d97b5bcb86085b538cd1a032","commits":[{"sha":"08fed2cfe31a7280384ae8ef494af462af62267d","author":{"email":"adf7f962d8c1003f9d5aad5ecae5c2ca1bbdee24@ovi.com","name":"Vincent Lejeune"},"message":"Use lspsm with pcf","distinct":true,"url":"https://api.github.com/repos/supertuxkart/stk-code/commits/08fed2cfe31a7280384ae8ef494af462af62267d"}]},"public":true,"created_at":"2015-01-01T01:04:03Z","org":{"id":6138677,"login":"supertuxkart","gravatar_id":"","url":"https://api.github.com/orgs/supertuxkart","avatar_url":"https://avatars.githubusercontent.com/u/6138677?"}}
{"id":"2489397622","type":"IssuesEvent","actor":{"id":8426440,"login":"nickspring","gravatar_id":"","url":"https://api.github.com/users/nickspring","avatar_url":"https://avatars.githubusercontent.com/u/8426440?"},"repo":{"id":6890589,"name":"etsy/etsyapi","url":"https://api.github.com/repos/etsy/etsyapi"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/etsy/etsyapi/issues/108","labels_url":"https://api.github.com/repos/etsy/etsyapi/issues/108/labels{/name}","comments_url":"https://api.github.com/repos/etsy/etsyapi/issues/108/comments","events_url":"https://api.github.com/repos/etsy/etsyapi/issues/108/events","html_url":"https://github.com/etsy/etsyapi/issues/108","id":53210252,"number":108,"title":"Length of description field with non-English symbols 2","user":{"login":"nickspring","id":8426440,"avatar_url":"https://avatars.githubusercontent.com/u/8426440?v=3","gravatar_id":"","url":"https://api.github.com/users/nickspring","html_url":"https://github.com/nickspring","followers_url":"https://api.github.com/users/nickspring/followers","following_url":"https://api.github.com/users/nickspring/following{/other_user}","gists_url":"https://api.github.com/users/nickspring/gists{/gist_id}","starred_url":"https://api.github.com/users/nickspring/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/nickspring/subscriptions","organizations_url":"https://api.github.com/users/nickspring/orgs","repos_url":"https://api.github.com/users/nickspring/repos","events_url":"https://api.github.com/users/nickspring/events{/privacy}","received_events_url":"https://api.github.com/users/nickspring/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:04:03Z","updated_at":"2015-01-01T01:04:03Z","closed_at":null,"body":"I’m trying to update FR translation of one listing. Description has length 245 symbols (251 in bytes!!!) 
but Etsy API responds with error \"Value for description must be 255 characters or less.”\r\nIt seems that API calculates length of non-English strings incorrectly. See PHP example below.\r\n\r\nThere is no such problem if I use English string (without diacritics etc).\r\n\r\n```php\r\n<?php\r\n\r\ndefine('OAUTH_CONSUMER_KEY', '');\r\ndefine('OAUTH_CONSUMER_SECRET', '');\r\n$access_token = '';\r\n$access_token_secret = '';\r\n\r\n$oauth = new OAuth(OAUTH_CONSUMER_KEY, OAUTH_CONSUMER_SECRET,\r\n                   OAUTH_SIG_METHOD_HMACSHA1, OAUTH_AUTH_TYPE_URI);\r\n$oauth->setToken($access_token, $access_token_secret);\r\n\r\ntry {\r\n    \r\n    # try to change FR translation of one listing \r\n       \r\n    $params = array(\r\n    'description'=>\"Couleur: Argent, Violet (d'un côté - de l'argent, d'autres un pourpre clair) \r\nTaille (mm): 5mm x 7mm \r\nForme: Preciosa PIP Perles / Pétale de Fleur / Fleur \r\nVendus en paquets de 60pcs. \r\n\r\n▶ Merci de vous abonner à notre NEWSLETTER: http://eepurl.c\",\r\n    'tags'=>'SKU-17634,4mm de semilla de pe,7 0 checa semilla de,cordón,checa semilla de per',\r\n    'language'=>'fr',\r\n    'listing_id'=>216087470,\r\n    'title'=>'60pcs Argent Violet PIP Perles de Verre tchèque PIP Preciosa PIP Perles tchèque Fleur Plate Pétale de Fleur de Perles 5mm x 7mm',\r\n    );\r\n\r\n    echo \"THE LENGTH OF DESCRIPTION STRING IS \", mb_strlen($params['description'], 'utf-8'), \" BUT WE HAVE SUCH ERROR:\\n\\n\";\r\n    $data = $oauth->fetch(\"https://openapi.etsy.com/v2/listings/216087470/translations/fr\", $params, OAUTH_HTTP_METHOD_POST);\r\n    \r\n    \r\n} catch (OAuthException $e) {\r\n    error_log($e->getMessage());\r\n    error_log(print_r($oauth->getLastResponse(), true));\r\n    exit;\r\n}\r\n\r\n?>\r\n```"}},"public":true,"created_at":"2015-01-01T01:04:03Z","org":{"id":193389,"login":"etsy","gravatar_id":"","url":"https://api.github.com/orgs/etsy","avatar_url":"https://avatars.githubusercontent.com/u/193389?"}}
{"id":"2489397624","type":"PushEvent","actor":{"id":1362216,"login":"gmenih341","gravatar_id":"","url":"https://api.github.com/users/gmenih341","avatar_url":"https://avatars.githubusercontent.com/u/1362216?"},"repo":{"id":28205917,"name":"gmenih341/gm_webpage","url":"https://api.github.com/repos/gmenih341/gm_webpage"},"payload":{"push_id":536753021,"size":2,"distinct_size":0,"ref":"refs/heads/nodeJs","head":"44b4ebfe84e066b96aa9a1e99351030e539f5020","before":"26efa9dbb30fc9f7ab5a7324a5b55b0f4d015c66","commits":[{"sha":"934f504d8abd4adceb718a6767e9d56c5f7fa856","author":{"email":"0b197f5d14de9a1e08df323456fabeaf2b9315d7@gmail.com","name":"gmenih341"},"message":"Added mongo & monk dependencies","distinct":false,"url":"https://api.github.com/repos/gmenih341/gm_webpage/commits/934f504d8abd4adceb718a6767e9d56c5f7fa856"},{"sha":"44b4ebfe84e066b96aa9a1e99351030e539f5020","author":{"email":"0b197f5d14de9a1e08df323456fabeaf2b9315d7@gmail.com","name":"gmenih341"},"message":"updated readme","distinct":false,"url":"https://api.github.com/repos/gmenih341/gm_webpage/commits/44b4ebfe84e066b96aa9a1e99351030e539f5020"}]},"public":true,"created_at":"2015-01-01T01:04:03Z"}
{"id":"2489397626","type":"PushEvent","actor":{"id":155953,"login":"saitodisse","gravatar_id":"","url":"https://api.github.com/users/saitodisse","avatar_url":"https://avatars.githubusercontent.com/u/155953?"},"repo":{"id":28519068,"name":"saitodisse/code_rewrite","url":"https://api.github.com/repos/saitodisse/code_rewrite"},"payload":{"push_id":536753023,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d3df589bd52bfaefb7df4c7ab055f37e0d3b5023","before":"0a48d64aee06d7d3075bc62e9e5c980a6ebe6b68","commits":[{"sha":"d3df589bd52bfaefb7df4c7ab055f37e0d3b5023","author":{"email":"2ba0b9c8a539cf0353ba4c5654aacbc724b4002e@gmail.com","name":"Julio Makdisse Saito"},"message":"partial","distinct":true,"url":"https://api.github.com/repos/saitodisse/code_rewrite/commits/d3df589bd52bfaefb7df4c7ab055f37e0d3b5023"}]},"public":true,"created_at":"2015-01-01T01:04:04Z"}
{"id":"2489397632","type":"IssuesEvent","actor":{"id":5509466,"login":"Arisae","gravatar_id":"","url":"https://api.github.com/users/Arisae","avatar_url":"https://avatars.githubusercontent.com/u/5509466?"},"repo":{"id":28179339,"name":"YGGDRASIL-STUDIO/Discouraged-Workers","url":"https://api.github.com/repos/YGGDRASIL-STUDIO/Discouraged-Workers"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/YGGDRASIL-STUDIO/Discouraged-Workers/issues/153","labels_url":"https://api.github.com/repos/YGGDRASIL-STUDIO/Discouraged-Workers/issues/153/labels{/name}","comments_url":"https://api.github.com/repos/YGGDRASIL-STUDIO/Discouraged-Workers/issues/153/comments","events_url":"https://api.github.com/repos/YGGDRASIL-STUDIO/Discouraged-Workers/issues/153/events","html_url":"https://github.com/YGGDRASIL-STUDIO/Discouraged-Workers/issues/153","id":53210253,"number":153,"title":"Add Bridge of the Life License in README.html","user":{"login":"Arisae","id":5509466,"avatar_url":"https://avatars.githubusercontent.com/u/5509466?v=3","gravatar_id":"","url":"https://api.github.com/users/Arisae","html_url":"https://github.com/Arisae","followers_url":"https://api.github.com/users/Arisae/followers","following_url":"https://api.github.com/users/Arisae/following{/other_user}","gists_url":"https://api.github.com/users/Arisae/gists{/gist_id}","starred_url":"https://api.github.com/users/Arisae/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Arisae/subscriptions","organizations_url":"https://api.github.com/users/Arisae/orgs","repos_url":"https://api.github.com/users/Arisae/repos","events_url":"https://api.github.com/users/Arisae/events{/privacy}","received_events_url":"https://api.github.com/users/Arisae/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/YGGDRASIL-STUDIO/Discouraged-Workers/labels/enhancement","name":"enhancement","color":"84b6eb"}],"state":"open","locked":false,"assignee":{"login":"Arisae"
,"id":5509466,"avatar_url":"https://avatars.githubusercontent.com/u/5509466?v=3","gravatar_id":"","url":"https://api.github.com/users/Arisae","html_url":"https://github.com/Arisae","followers_url":"https://api.github.com/users/Arisae/followers","following_url":"https://api.github.com/users/Arisae/following{/other_user}","gists_url":"https://api.github.com/users/Arisae/gists{/gist_id}","starred_url":"https://api.github.com/users/Arisae/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Arisae/subscriptions","organizations_url":"https://api.github.com/users/Arisae/orgs","repos_url":"https://api.github.com/users/Arisae/repos","events_url":"https://api.github.com/users/Arisae/events{/privacy}","received_events_url":"https://api.github.com/users/Arisae/received_events","type":"User","site_admin":false},"milestone":{"url":"https://api.github.com/repos/YGGDRASIL-STUDIO/Discouraged-Workers/milestones/12","labels_url":"https://api.github.com/repos/YGGDRASIL-STUDIO/Discouraged-Workers/milestones/12/labels","id":914871,"number":12,"title":"ETC","description":"License, Manual, 
ETC","creator":{"login":"Arisae","id":5509466,"avatar_url":"https://avatars.githubusercontent.com/u/5509466?v=3","gravatar_id":"","url":"https://api.github.com/users/Arisae","html_url":"https://github.com/Arisae","followers_url":"https://api.github.com/users/Arisae/followers","following_url":"https://api.github.com/users/Arisae/following{/other_user}","gists_url":"https://api.github.com/users/Arisae/gists{/gist_id}","starred_url":"https://api.github.com/users/Arisae/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Arisae/subscriptions","organizations_url":"https://api.github.com/users/Arisae/orgs","repos_url":"https://api.github.com/users/Arisae/repos","events_url":"https://api.github.com/users/Arisae/events{/privacy}","received_events_url":"https://api.github.com/users/Arisae/received_events","type":"User","site_admin":false},"open_issues":4,"closed_issues":0,"state":"open","created_at":"2014-12-26T04:10:21Z","updated_at":"2015-01-01T01:04:05Z","due_on":"2015-12-30T15:00:00Z","closed_at":null},"comments":0,"created_at":"2015-01-01T01:04:05Z","updated_at":"2015-01-01T01:04:05Z","closed_at":null,"body":""}},"public":true,"created_at":"2015-01-01T01:04:05Z","org":{"id":10226289,"login":"YGGDRASIL-STUDIO","gravatar_id":"","url":"https://api.github.com/orgs/YGGDRASIL-STUDIO","avatar_url":"https://avatars.githubusercontent.com/u/10226289?"}}
{"id":"2489397638","type":"PushEvent","actor":{"id":1373703,"login":"team3cord","gravatar_id":"","url":"https://api.github.com/users/team3cord","avatar_url":"https://avatars.githubusercontent.com/u/1373703?"},"repo":{"id":20268125,"name":"team3cord/mc-dotfiles","url":"https://api.github.com/repos/team3cord/mc-dotfiles"},"payload":{"push_id":536753025,"size":6,"distinct_size":1,"ref":"refs/heads/OSX","head":"731064c30578713735d183022092299605dcf83a","before":"460e8c219d89fcf24c4f961765a63c7a8e4185f1","commits":[{"sha":"7ebd9b4cc70e2b3a2f044d7ff4ef63c2b27d7451","author":{"email":"67bcad84ab1facdcd6a44cf7083c26cfa2e421e4@gmail.com","name":"MattCordeiro"},"message":"Updating for linux","distinct":false,"url":"https://api.github.com/repos/team3cord/mc-dotfiles/commits/7ebd9b4cc70e2b3a2f044d7ff4ef63c2b27d7451"},{"sha":"beb1f3edadc32c3d451800028eafcaf8f753e124","author":{"email":"67bcad84ab1facdcd6a44cf7083c26cfa2e421e4@gmail.com","name":"MattCordeiro"},"message":"Readme","distinct":false,"url":"https://api.github.com/repos/team3cord/mc-dotfiles/commits/beb1f3edadc32c3d451800028eafcaf8f753e124"},{"sha":"4d83ec65b7161a9c5a1bab69642d2ba15e748201","author":{"email":"67bcad84ab1facdcd6a44cf7083c26cfa2e421e4@gmail.com","name":"MattCordeiro"},"message":"Updated TODO's","distinct":false,"url":"https://api.github.com/repos/team3cord/mc-dotfiles/commits/4d83ec65b7161a9c5a1bab69642d2ba15e748201"},{"sha":"57e4c5c28b8fed6b308b24f86432d3676fd8d96e","author":{"email":"67bcad84ab1facdcd6a44cf7083c26cfa2e421e4@gmail.com","name":"MattCordeiro"},"message":"Bannished DS","distinct":false,"url":"https://api.github.com/repos/team3cord/mc-dotfiles/commits/57e4c5c28b8fed6b308b24f86432d3676fd8d96e"},{"sha":"c274de69b1397e2b2b3a92b5cbba22b87211ffa0","author":{"email":"67bcad84ab1facdcd6a44cf7083c26cfa2e421e4@gmail.com","name":"MattCordeiro"},"message":"Updated vim 
configuration","distinct":false,"url":"https://api.github.com/repos/team3cord/mc-dotfiles/commits/c274de69b1397e2b2b3a92b5cbba22b87211ffa0"},{"sha":"731064c30578713735d183022092299605dcf83a","author":{"email":"67bcad84ab1facdcd6a44cf7083c26cfa2e421e4@gmail.com","name":"MattCordeiro"},"message":"Uncommented OSX specific aliases","distinct":true,"url":"https://api.github.com/repos/team3cord/mc-dotfiles/commits/731064c30578713735d183022092299605dcf83a"}]},"public":true,"created_at":"2015-01-01T01:04:05Z"}
{"id":"2489397640","type":"IssueCommentEvent","actor":{"id":135605,"login":"joneslee85","gravatar_id":"","url":"https://api.github.com/users/joneslee85","avatar_url":"https://avatars.githubusercontent.com/u/135605?"},"repo":{"id":16760719,"name":"lotus/model","url":"https://api.github.com/repos/lotus/model"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/lotus/model/issues/137","labels_url":"https://api.github.com/repos/lotus/model/issues/137/labels{/name}","comments_url":"https://api.github.com/repos/lotus/model/issues/137/comments","events_url":"https://api.github.com/repos/lotus/model/issues/137/events","html_url":"https://github.com/lotus/model/pull/137","id":53171581,"number":137,"title":"Refactor attributes DSL","user":{"login":"joneslee85","id":135605,"avatar_url":"https://avatars.githubusercontent.com/u/135605?v=3","gravatar_id":"","url":"https://api.github.com/users/joneslee85","html_url":"https://github.com/joneslee85","followers_url":"https://api.github.com/users/joneslee85/followers","following_url":"https://api.github.com/users/joneslee85/following{/other_user}","gists_url":"https://api.github.com/users/joneslee85/gists{/gist_id}","starred_url":"https://api.github.com/users/joneslee85/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/joneslee85/subscriptions","organizations_url":"https://api.github.com/users/joneslee85/orgs","repos_url":"https://api.github.com/users/joneslee85/repos","events_url":"https://api.github.com/users/joneslee85/events{/privacy}","received_events_url":"https://api.github.com/users/joneslee85/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":3,"created_at":"2014-12-31T07:27:28Z","updated_at":"2015-01-01T01:04:05Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/lotus/model/pulls/137","html_url":"https://github.com/lotus/model/pull/137","diff_url":"https://github.com/lotus/
model/pull/137.diff","patch_url":"https://github.com/lotus/model/pull/137.patch"},"body":"* [x] Consolidate constructor\r\n* [x] Does not gracefully handle unknown attributes"},"comment":{"url":"https://api.github.com/repos/lotus/model/issues/comments/68477296","html_url":"https://github.com/lotus/model/pull/137#issuecomment-68477296","issue_url":"https://api.github.com/repos/lotus/model/issues/137","id":68477296,"user":{"login":"joneslee85","id":135605,"avatar_url":"https://avatars.githubusercontent.com/u/135605?v=3","gravatar_id":"","url":"https://api.github.com/users/joneslee85","html_url":"https://github.com/joneslee85","followers_url":"https://api.github.com/users/joneslee85/followers","following_url":"https://api.github.com/users/joneslee85/following{/other_user}","gists_url":"https://api.github.com/users/joneslee85/gists{/gist_id}","starred_url":"https://api.github.com/users/joneslee85/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/joneslee85/subscriptions","organizations_url":"https://api.github.com/users/joneslee85/orgs","repos_url":"https://api.github.com/users/joneslee85/repos","events_url":"https://api.github.com/users/joneslee85/events{/privacy}","received_events_url":"https://api.github.com/users/joneslee85/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:04:05Z","updated_at":"2015-01-01T01:04:05Z","body":"@AlfonsoUceda not yet, I have yet heard back from @jodosha, need more discussion"}},"public":true,"created_at":"2015-01-01T01:04:05Z","org":{"id":3210273,"login":"lotus","gravatar_id":"","url":"https://api.github.com/orgs/lotus","avatar_url":"https://avatars.githubusercontent.com/u/3210273?"}}
{"id":"2489397641","type":"PullRequestReviewCommentEvent","actor":{"id":663212,"login":"tdas","gravatar_id":"","url":"https://api.github.com/users/tdas","avatar_url":"https://avatars.githubusercontent.com/u/663212?"},"repo":{"id":17165658,"name":"apache/spark","url":"https://api.github.com/repos/apache/spark"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/apache/spark/pulls/comments/22397277","id":22397277,"diff_hunk":"@@ -17,31 +17,65 @@\n \n package org.apache.spark.streaming.mqtt\n \n-import org.scalatest.FunSuite\n-\n+import org.scalatest.{BeforeAndAfter, FunSuite}\n+import org.scalatest.concurrent.Eventually\n+import scala.concurrent.duration._\n import org.apache.spark.streaming.{Seconds, StreamingContext}\n import org.apache.spark.storage.StorageLevel\n import org.apache.spark.streaming.dstream.ReceiverInputDStream\n+import org.eclipse.paho.client.mqttv3._\n+import org.eclipse.paho.client.mqttv3.persist.MqttDefaultFilePersistence\n \n-class MQTTStreamSuite extends FunSuite {\n-\n-  val batchDuration = Seconds(1)\n+class MQTTStreamSuite extends FunSuite with Eventually with BeforeAndAfter {\n \n+  private val batchDuration = Seconds(1)\n   private val master: String = \"local[2]\"\n-\n   private val framework: String = this.getClass.getSimpleName\n+  private val brokerUrl = \"tcp://localhost:1883\"\n+  private val topic = \"def\"\n+  private var ssc: StreamingContext = _\n \n-  test(\"mqtt input stream\") {\n-    val ssc = new StreamingContext(master, framework, batchDuration)\n-    val brokerUrl = \"abc\"\n-    val topic = \"def\"\n+  before {\n+    ssc = new StreamingContext(master, framework, batchDuration)\n+  }\n+  after {\n+    if (ssc != null) {\n+      ssc.stop()\n+      ssc = null\n+    }\n+  }\n \n-    // tests the API, does not actually test data receiving\n-    val test1: ReceiverInputDStream[String] = MQTTUtils.createStream(ssc, brokerUrl, topic)\n-    val test2: ReceiverInputDStream[String] =\n+  test(\"mqtt input 
stream\") {\n+    val sendMessage = \"MQTT demo for spark streaming\"\n+    publishData(sendMessage)\n+    val receiveStream: ReceiverInputDStream[String] =\n       MQTTUtils.createStream(ssc, brokerUrl, topic, StorageLevel.MEMORY_AND_DISK_SER_2)\n-\n-    // TODO: Actually test receiving data\n+    var receiveMessage: String = \"\"\n+    receiveStream.foreachRDD { rdd =>\n+      receiveMessage = rdd.first\n+      receiveMessage\n+    }\n+    ssc.start()\n+    eventually(timeout(10000 milliseconds), interval(100 milliseconds)) {\n+      assert(sendMessage.equals(receiveMessage))\n+    }\n     ssc.stop()\n   }\n+\n+  def publishData(sendMessage: String): Unit = {\n+    try {\n+      val persistence: MqttClientPersistence = new MqttDefaultFilePersistence(\"/tmp\")\n+      val client: MqttClient = new MqttClient(brokerUrl, MqttClient.generateClientId(), persistence)\n+      client.connect()\n+      val msgTopic: MqttTopic = client.getTopic(topic)\n+      val message: MqttMessage = new MqttMessage(String.valueOf(sendMessage).getBytes(\"utf-8\"))\n+      message.setQos(1)\n+      message.setRetained(true)\n+      msgTopic.publish(message)\n+      println(\"Published data \\ntopic: \" + msgTopic.getName() + \"\\nMessage: \" + message)\n+      client.disconnect()\n+    } catch {\n+      case e: MqttException => println(\"Exception Caught: \" + e)\n+    
}","path":"external/mqtt/src/test/scala/org/apache/spark/streaming/mqtt/MQTTStreamSuite.scala","position":78,"original_position":78,"commit_id":"fc8eb286db6aa8e78a567537996011f554eed969","original_commit_id":"fc8eb286db6aa8e78a567537996011f554eed969","user":{"login":"tdas","id":663212,"avatar_url":"https://avatars.githubusercontent.com/u/663212?v=3","gravatar_id":"","url":"https://api.github.com/users/tdas","html_url":"https://github.com/tdas","followers_url":"https://api.github.com/users/tdas/followers","following_url":"https://api.github.com/users/tdas/following{/other_user}","gists_url":"https://api.github.com/users/tdas/gists{/gist_id}","starred_url":"https://api.github.com/users/tdas/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/tdas/subscriptions","organizations_url":"https://api.github.com/users/tdas/orgs","repos_url":"https://api.github.com/users/tdas/repos","events_url":"https://api.github.com/users/tdas/events{/privacy}","received_events_url":"https://api.github.com/users/tdas/received_events","type":"User","site_admin":false},"body":"Shouldnt there be a `finally` to close any running servers (client, 
etc.)?","created_at":"2015-01-01T01:04:05Z","updated_at":"2015-01-01T01:04:05Z","html_url":"https://github.com/apache/spark/pull/3844#discussion_r22397277","pull_request_url":"https://api.github.com/repos/apache/spark/pulls/3844","_links":{"self":{"href":"https://api.github.com/repos/apache/spark/pulls/comments/22397277"},"html":{"href":"https://github.com/apache/spark/pull/3844#discussion_r22397277"},"pull_request":{"href":"https://api.github.com/repos/apache/spark/pulls/3844"}}},"pull_request":{"url":"https://api.github.com/repos/apache/spark/pulls/3844","id":26684823,"html_url":"https://github.com/apache/spark/pull/3844","diff_url":"https://github.com/apache/spark/pull/3844.diff","patch_url":"https://github.com/apache/spark/pull/3844.patch","issue_url":"https://api.github.com/repos/apache/spark/issues/3844","number":3844,"state":"open","locked":false,"title":"[SPARK-4631] unit test for MQTT","user":{"login":"Bilna","id":7123586,"avatar_url":"https://avatars.githubusercontent.com/u/7123586?v=3","gravatar_id":"","url":"https://api.github.com/users/Bilna","html_url":"https://github.com/Bilna","followers_url":"https://api.github.com/users/Bilna/followers","following_url":"https://api.github.com/users/Bilna/following{/other_user}","gists_url":"https://api.github.com/users/Bilna/gists{/gist_id}","starred_url":"https://api.github.com/users/Bilna/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Bilna/subscriptions","organizations_url":"https://api.github.com/users/Bilna/orgs","repos_url":"https://api.github.com/users/Bilna/repos","events_url":"https://api.github.com/users/Bilna/events{/privacy}","received_events_url":"https://api.github.com/users/Bilna/received_events","type":"User","site_admin":false},"body":"Please review the unit test for 
MQTT","created_at":"2014-12-30T13:12:33Z","updated_at":"2015-01-01T01:04:05Z","closed_at":null,"merged_at":null,"merge_commit_sha":"78f53f74b7089734c2cc3a2f701e6044194cda1d","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/apache/spark/pulls/3844/commits","review_comments_url":"https://api.github.com/repos/apache/spark/pulls/3844/comments","review_comment_url":"https://api.github.com/repos/apache/spark/pulls/comments/{number}","comments_url":"https://api.github.com/repos/apache/spark/issues/3844/comments","statuses_url":"https://api.github.com/repos/apache/spark/statuses/fc8eb286db6aa8e78a567537996011f554eed969","head":{"label":"Bilna:master","ref":"master","sha":"fc8eb286db6aa8e78a567537996011f554eed969","user":{"login":"Bilna","id":7123586,"avatar_url":"https://avatars.githubusercontent.com/u/7123586?v=3","gravatar_id":"","url":"https://api.github.com/users/Bilna","html_url":"https://github.com/Bilna","followers_url":"https://api.github.com/users/Bilna/followers","following_url":"https://api.github.com/users/Bilna/following{/other_user}","gists_url":"https://api.github.com/users/Bilna/gists{/gist_id}","starred_url":"https://api.github.com/users/Bilna/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Bilna/subscriptions","organizations_url":"https://api.github.com/users/Bilna/orgs","repos_url":"https://api.github.com/users/Bilna/repos","events_url":"https://api.github.com/users/Bilna/events{/privacy}","received_events_url":"https://api.github.com/users/Bilna/received_events","type":"User","site_admin":false},"repo":{"id":28630516,"name":"spark","full_name":"Bilna/spark","owner":{"login":"Bilna","id":7123586,"avatar_url":"https://avatars.githubusercontent.com/u/7123586?v=3","gravatar_id":"","url":"https://api.github.com/users/Bilna","html_url":"https://github.com/Bilna","followers_url":"https://api.github.com/users/Bilna/followers","following_url":"https://api.github.com/users/Bilna/following{/other_user}","gists_u
rl":"https://api.github.com/users/Bilna/gists{/gist_id}","starred_url":"https://api.github.com/users/Bilna/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Bilna/subscriptions","organizations_url":"https://api.github.com/users/Bilna/orgs","repos_url":"https://api.github.com/users/Bilna/repos","events_url":"https://api.github.com/users/Bilna/events{/privacy}","received_events_url":"https://api.github.com/users/Bilna/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/Bilna/spark","description":"Mirror of Apache Spark","fork":true,"url":"https://api.github.com/repos/Bilna/spark","forks_url":"https://api.github.com/repos/Bilna/spark/forks","keys_url":"https://api.github.com/repos/Bilna/spark/keys{/key_id}","collaborators_url":"https://api.github.com/repos/Bilna/spark/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/Bilna/spark/teams","hooks_url":"https://api.github.com/repos/Bilna/spark/hooks","issue_events_url":"https://api.github.com/repos/Bilna/spark/issues/events{/number}","events_url":"https://api.github.com/repos/Bilna/spark/events","assignees_url":"https://api.github.com/repos/Bilna/spark/assignees{/user}","branches_url":"https://api.github.com/repos/Bilna/spark/branches{/branch}","tags_url":"https://api.github.com/repos/Bilna/spark/tags","blobs_url":"https://api.github.com/repos/Bilna/spark/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/Bilna/spark/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/Bilna/spark/git/refs{/sha}","trees_url":"https://api.github.com/repos/Bilna/spark/git/trees{/sha}","statuses_url":"https://api.github.com/repos/Bilna/spark/statuses/{sha}","languages_url":"https://api.github.com/repos/Bilna/spark/languages","stargazers_url":"https://api.github.com/repos/Bilna/spark/stargazers","contributors_url":"https://api.github.com/repos/Bilna/spark/contributors","subscribers_url":"https://api.github.com/repos/Bilna/spark/subscri
bers","subscription_url":"https://api.github.com/repos/Bilna/spark/subscription","commits_url":"https://api.github.com/repos/Bilna/spark/commits{/sha}","git_commits_url":"https://api.github.com/repos/Bilna/spark/git/commits{/sha}","comments_url":"https://api.github.com/repos/Bilna/spark/comments{/number}","issue_comment_url":"https://api.github.com/repos/Bilna/spark/issues/comments/{number}","contents_url":"https://api.github.com/repos/Bilna/spark/contents/{+path}","compare_url":"https://api.github.com/repos/Bilna/spark/compare/{base}...{head}","merges_url":"https://api.github.com/repos/Bilna/spark/merges","archive_url":"https://api.github.com/repos/Bilna/spark/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/Bilna/spark/downloads","issues_url":"https://api.github.com/repos/Bilna/spark/issues{/number}","pulls_url":"https://api.github.com/repos/Bilna/spark/pulls{/number}","milestones_url":"https://api.github.com/repos/Bilna/spark/milestones{/number}","notifications_url":"https://api.github.com/repos/Bilna/spark/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/Bilna/spark/labels{/name}","releases_url":"https://api.github.com/repos/Bilna/spark/releases{/id}","created_at":"2014-12-30T12:47:01Z","updated_at":"2014-12-31T09:52:36Z","pushed_at":"2014-12-31T09:52:35Z","git_url":"git://github.com/Bilna/spark.git","ssh_url":"git@github.com:Bilna/spark.git","clone_url":"https://github.com/Bilna/spark.git","svn_url":"https://github.com/Bilna/spark","homepage":null,"size":87823,"stargazers_count":1,"watchers_count":1,"language":"Scala","has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":1,"default_branch":"master"}},"base":{"label":"apache:master","ref":"master","sha":"352ed6bbe3c3b67e52e298e7c535ae414d96beca","user":{"login":"apache","id":47359,"avatar_url":"https://avatars.githubusercontent.com/u/47359?v=3",
"gravatar_id":"","url":"https://api.github.com/users/apache","html_url":"https://github.com/apache","followers_url":"https://api.github.com/users/apache/followers","following_url":"https://api.github.com/users/apache/following{/other_user}","gists_url":"https://api.github.com/users/apache/gists{/gist_id}","starred_url":"https://api.github.com/users/apache/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/apache/subscriptions","organizations_url":"https://api.github.com/users/apache/orgs","repos_url":"https://api.github.com/users/apache/repos","events_url":"https://api.github.com/users/apache/events{/privacy}","received_events_url":"https://api.github.com/users/apache/received_events","type":"Organization","site_admin":false},"repo":{"id":17165658,"name":"spark","full_name":"apache/spark","owner":{"login":"apache","id":47359,"avatar_url":"https://avatars.githubusercontent.com/u/47359?v=3","gravatar_id":"","url":"https://api.github.com/users/apache","html_url":"https://github.com/apache","followers_url":"https://api.github.com/users/apache/followers","following_url":"https://api.github.com/users/apache/following{/other_user}","gists_url":"https://api.github.com/users/apache/gists{/gist_id}","starred_url":"https://api.github.com/users/apache/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/apache/subscriptions","organizations_url":"https://api.github.com/users/apache/orgs","repos_url":"https://api.github.com/users/apache/repos","events_url":"https://api.github.com/users/apache/events{/privacy}","received_events_url":"https://api.github.com/users/apache/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/apache/spark","description":"Mirror of Apache 
Spark","fork":false,"url":"https://api.github.com/repos/apache/spark","forks_url":"https://api.github.com/repos/apache/spark/forks","keys_url":"https://api.github.com/repos/apache/spark/keys{/key_id}","collaborators_url":"https://api.github.com/repos/apache/spark/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/apache/spark/teams","hooks_url":"https://api.github.com/repos/apache/spark/hooks","issue_events_url":"https://api.github.com/repos/apache/spark/issues/events{/number}","events_url":"https://api.github.com/repos/apache/spark/events","assignees_url":"https://api.github.com/repos/apache/spark/assignees{/user}","branches_url":"https://api.github.com/repos/apache/spark/branches{/branch}","tags_url":"https://api.github.com/repos/apache/spark/tags","blobs_url":"https://api.github.com/repos/apache/spark/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/apache/spark/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/apache/spark/git/refs{/sha}","trees_url":"https://api.github.com/repos/apache/spark/git/trees{/sha}","statuses_url":"https://api.github.com/repos/apache/spark/statuses/{sha}","languages_url":"https://api.github.com/repos/apache/spark/languages","stargazers_url":"https://api.github.com/repos/apache/spark/stargazers","contributors_url":"https://api.github.com/repos/apache/spark/contributors","subscribers_url":"https://api.github.com/repos/apache/spark/subscribers","subscription_url":"https://api.github.com/repos/apache/spark/subscription","commits_url":"https://api.github.com/repos/apache/spark/commits{/sha}","git_commits_url":"https://api.github.com/repos/apache/spark/git/commits{/sha}","comments_url":"https://api.github.com/repos/apache/spark/comments{/number}","issue_comment_url":"https://api.github.com/repos/apache/spark/issues/comments/{number}","contents_url":"https://api.github.com/repos/apache/spark/contents/{+path}","compare_url":"https://api.github.com/repos/apache/spark/compare/{base}...{head}","merges_
url":"https://api.github.com/repos/apache/spark/merges","archive_url":"https://api.github.com/repos/apache/spark/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/apache/spark/downloads","issues_url":"https://api.github.com/repos/apache/spark/issues{/number}","pulls_url":"https://api.github.com/repos/apache/spark/pulls{/number}","milestones_url":"https://api.github.com/repos/apache/spark/milestones{/number}","notifications_url":"https://api.github.com/repos/apache/spark/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/apache/spark/labels{/name}","releases_url":"https://api.github.com/repos/apache/spark/releases{/id}","created_at":"2014-02-25T08:00:08Z","updated_at":"2015-01-01T00:59:33Z","pushed_at":"2015-01-01T00:59:33Z","git_url":"git://github.com/apache/spark.git","ssh_url":"git@github.com:apache/spark.git","clone_url":"https://github.com/apache/spark.git","svn_url":"https://github.com/apache/spark","homepage":null,"size":1083068,"stargazers_count":2458,"watchers_count":2458,"language":"Scala","has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":2179,"mirror_url":"git://git.apache.org/spark.git","open_issues_count":268,"forks":2179,"open_issues":268,"watchers":2458,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/apache/spark/pulls/3844"},"html":{"href":"https://github.com/apache/spark/pull/3844"},"issue":{"href":"https://api.github.com/repos/apache/spark/issues/3844"},"comments":{"href":"https://api.github.com/repos/apache/spark/issues/3844/comments"},"review_comments":{"href":"https://api.github.com/repos/apache/spark/pulls/3844/comments"},"review_comment":{"href":"https://api.github.com/repos/apache/spark/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/apache/spark/pulls/3844/commits"},"statuses":{"href":"https://api.github.com/repos/apache/spark/statuses/fc8eb286db6aa8e78a567537996011f554eed969"}}}},"public":tr
ue,"created_at":"2015-01-01T01:04:05Z","org":{"id":47359,"login":"apache","gravatar_id":"","url":"https://api.github.com/orgs/apache","avatar_url":"https://avatars.githubusercontent.com/u/47359?"}}
{"id":"2489397645","type":"CreateEvent","actor":{"id":1398544,"login":"joelpurra","gravatar_id":"","url":"https://api.github.com/users/joelpurra","avatar_url":"https://avatars.githubusercontent.com/u/1398544?"},"repo":{"id":28595466,"name":"joelpurra/jqnpm","url":"https://api.github.com/repos/joelpurra/jqnpm"},"payload":{"ref":"import_659","ref_type":"branch","master_branch":"master","description":"A package manager built for jq as an example implementation.","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:04:06Z"}
{"id":"2489397653","type":"PullRequestEvent","actor":{"id":9831378,"login":"Amit-P-Amin","gravatar_id":"","url":"https://api.github.com/users/Amit-P-Amin","avatar_url":"https://avatars.githubusercontent.com/u/9831378?"},"repo":{"id":12024210,"name":"appacademy/active_record_lite","url":"https://api.github.com/repos/appacademy/active_record_lite"},"payload":{"action":"opened","number":17,"pull_request":{"url":"https://api.github.com/repos/appacademy/active_record_lite/pulls/17","id":26739446,"html_url":"https://github.com/appacademy/active_record_lite/pull/17","diff_url":"https://github.com/appacademy/active_record_lite/pull/17.diff","patch_url":"https://github.com/appacademy/active_record_lite/pull/17.patch","issue_url":"https://api.github.com/repos/appacademy/active_record_lite/issues/17","number":17,"state":"open","locked":false,"title":"Update 03_associatable_spec.rb","user":{"login":"Amit-P-Amin","id":9831378,"avatar_url":"https://avatars.githubusercontent.com/u/9831378?v=3","gravatar_id":"","url":"https://api.github.com/users/Amit-P-Amin","html_url":"https://github.com/Amit-P-Amin","followers_url":"https://api.github.com/users/Amit-P-Amin/followers","following_url":"https://api.github.com/users/Amit-P-Amin/following{/other_user}","gists_url":"https://api.github.com/users/Amit-P-Amin/gists{/gist_id}","starred_url":"https://api.github.com/users/Amit-P-Amin/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Amit-P-Amin/subscriptions","organizations_url":"https://api.github.com/users/Amit-P-Amin/orgs","repos_url":"https://api.github.com/users/Amit-P-Amin/repos","events_url":"https://api.github.com/users/Amit-P-Amin/events{/privacy}","received_events_url":"https://api.github.com/users/Amit-P-Amin/received_events","type":"User","site_admin":false},"body":"Was confused for a while because \"AssocOptions #model_class returns class of associated object\" was failing. 
This is because that spec tests 2 methods, but the description just mentions 1 (only model class, instead of model class and table name). I split the test into two, one for the model class and one for the table name.","created_at":"2015-01-01T01:04:07Z","updated_at":"2015-01-01T01:04:07Z","closed_at":null,"merged_at":null,"merge_commit_sha":null,"assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/appacademy/active_record_lite/pulls/17/commits","review_comments_url":"https://api.github.com/repos/appacademy/active_record_lite/pulls/17/comments","review_comment_url":"https://api.github.com/repos/appacademy/active_record_lite/pulls/comments/{number}","comments_url":"https://api.github.com/repos/appacademy/active_record_lite/issues/17/comments","statuses_url":"https://api.github.com/repos/appacademy/active_record_lite/statuses/b5ac327b20f2041652e3228ce4612880aae97beb","head":{"label":"Amit-P-Amin:patch-1","ref":"patch-1","sha":"b5ac327b20f2041652e3228ce4612880aae97beb","user":{"login":"Amit-P-Amin","id":9831378,"avatar_url":"https://avatars.githubusercontent.com/u/9831378?v=3","gravatar_id":"","url":"https://api.github.com/users/Amit-P-Amin","html_url":"https://github.com/Amit-P-Amin","followers_url":"https://api.github.com/users/Amit-P-Amin/followers","following_url":"https://api.github.com/users/Amit-P-Amin/following{/other_user}","gists_url":"https://api.github.com/users/Amit-P-Amin/gists{/gist_id}","starred_url":"https://api.github.com/users/Amit-P-Amin/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Amit-P-Amin/subscriptions","organizations_url":"https://api.github.com/users/Amit-P-Amin/orgs","repos_url":"https://api.github.com/users/Amit-P-Amin/repos","events_url":"https://api.github.com/users/Amit-P-Amin/events{/privacy}","received_events_url":"https://api.github.com/users/Amit-P-Amin/received_events","type":"User","site_admin":false},"repo":{"id":28678217,"name":"active_record_lite","full_name":"Amit-P-Amin/activ
e_record_lite","owner":{"login":"Amit-P-Amin","id":9831378,"avatar_url":"https://avatars.githubusercontent.com/u/9831378?v=3","gravatar_id":"","url":"https://api.github.com/users/Amit-P-Amin","html_url":"https://github.com/Amit-P-Amin","followers_url":"https://api.github.com/users/Amit-P-Amin/followers","following_url":"https://api.github.com/users/Amit-P-Amin/following{/other_user}","gists_url":"https://api.github.com/users/Amit-P-Amin/gists{/gist_id}","starred_url":"https://api.github.com/users/Amit-P-Amin/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Amit-P-Amin/subscriptions","organizations_url":"https://api.github.com/users/Amit-P-Amin/orgs","repos_url":"https://api.github.com/users/Amit-P-Amin/repos","events_url":"https://api.github.com/users/Amit-P-Amin/events{/privacy}","received_events_url":"https://api.github.com/users/Amit-P-Amin/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/Amit-P-Amin/active_record_lite","description":"","fork":true,"url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite","forks_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/forks","keys_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/keys{/key_id}","collaborators_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/teams","hooks_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/hooks","issue_events_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/issues/events{/number}","events_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/events","assignees_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/assignees{/user}","branches_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/branches{/branch}","tags_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/tags",
"blobs_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/git/refs{/sha}","trees_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/git/trees{/sha}","statuses_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/statuses/{sha}","languages_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/languages","stargazers_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/stargazers","contributors_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/contributors","subscribers_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/subscribers","subscription_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/subscription","commits_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/commits{/sha}","git_commits_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/git/commits{/sha}","comments_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/comments{/number}","issue_comment_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/issues/comments/{number}","contents_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/contents/{+path}","compare_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/compare/{base}...{head}","merges_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/merges","archive_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/downloads","issues_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/issues{/number}","pulls_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/pulls{/number}","milestones_url":"https://api.github.com/repos/Amit-P
-Amin/active_record_lite/milestones{/number}","notifications_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/labels{/name}","releases_url":"https://api.github.com/repos/Amit-P-Amin/active_record_lite/releases{/id}","created_at":"2015-01-01T01:00:39Z","updated_at":"2015-01-01T01:00:39Z","pushed_at":"2015-01-01T01:02:23Z","git_url":"git://github.com/Amit-P-Amin/active_record_lite.git","ssh_url":"git@github.com:Amit-P-Amin/active_record_lite.git","clone_url":"https://github.com/Amit-P-Amin/active_record_lite.git","svn_url":"https://github.com/Amit-P-Amin/active_record_lite","homepage":null,"size":632,"stargazers_count":0,"watchers_count":0,"language":"Ruby","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"appacademy:master","ref":"master","sha":"ca4e169591deec6c4b30b611e8ed5bdf89b3386a","user":{"login":"appacademy","id":2138704,"avatar_url":"https://avatars.githubusercontent.com/u/2138704?v=3","gravatar_id":"","url":"https://api.github.com/users/appacademy","html_url":"https://github.com/appacademy","followers_url":"https://api.github.com/users/appacademy/followers","following_url":"https://api.github.com/users/appacademy/following{/other_user}","gists_url":"https://api.github.com/users/appacademy/gists{/gist_id}","starred_url":"https://api.github.com/users/appacademy/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/appacademy/subscriptions","organizations_url":"https://api.github.com/users/appacademy/orgs","repos_url":"https://api.github.com/users/appacademy/repos","events_url":"https://api.github.com/users/appacademy/events{/privacy}","received_events_url":"https://api.github.com/users/appacademy/received_events","type":"Organization","site_admin":fa
lse},"repo":{"id":12024210,"name":"active_record_lite","full_name":"appacademy/active_record_lite","owner":{"login":"appacademy","id":2138704,"avatar_url":"https://avatars.githubusercontent.com/u/2138704?v=3","gravatar_id":"","url":"https://api.github.com/users/appacademy","html_url":"https://github.com/appacademy","followers_url":"https://api.github.com/users/appacademy/followers","following_url":"https://api.github.com/users/appacademy/following{/other_user}","gists_url":"https://api.github.com/users/appacademy/gists{/gist_id}","starred_url":"https://api.github.com/users/appacademy/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/appacademy/subscriptions","organizations_url":"https://api.github.com/users/appacademy/orgs","repos_url":"https://api.github.com/users/appacademy/repos","events_url":"https://api.github.com/users/appacademy/events{/privacy}","received_events_url":"https://api.github.com/users/appacademy/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/appacademy/active_record_lite","description":"","fork":false,"url":"https://api.github.com/repos/appacademy/active_record_lite","forks_url":"https://api.github.com/repos/appacademy/active_record_lite/forks","keys_url":"https://api.github.com/repos/appacademy/active_record_lite/keys{/key_id}","collaborators_url":"https://api.github.com/repos/appacademy/active_record_lite/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/appacademy/active_record_lite/teams","hooks_url":"https://api.github.com/repos/appacademy/active_record_lite/hooks","issue_events_url":"https://api.github.com/repos/appacademy/active_record_lite/issues/events{/number}","events_url":"https://api.github.com/repos/appacademy/active_record_lite/events","assignees_url":"https://api.github.com/repos/appacademy/active_record_lite/assignees{/user}","branches_url":"https://api.github.com/repos/appacademy/active_record_lite/branches{/branch}","tags_ur
l":"https://api.github.com/repos/appacademy/active_record_lite/tags","blobs_url":"https://api.github.com/repos/appacademy/active_record_lite/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/appacademy/active_record_lite/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/appacademy/active_record_lite/git/refs{/sha}","trees_url":"https://api.github.com/repos/appacademy/active_record_lite/git/trees{/sha}","statuses_url":"https://api.github.com/repos/appacademy/active_record_lite/statuses/{sha}","languages_url":"https://api.github.com/repos/appacademy/active_record_lite/languages","stargazers_url":"https://api.github.com/repos/appacademy/active_record_lite/stargazers","contributors_url":"https://api.github.com/repos/appacademy/active_record_lite/contributors","subscribers_url":"https://api.github.com/repos/appacademy/active_record_lite/subscribers","subscription_url":"https://api.github.com/repos/appacademy/active_record_lite/subscription","commits_url":"https://api.github.com/repos/appacademy/active_record_lite/commits{/sha}","git_commits_url":"https://api.github.com/repos/appacademy/active_record_lite/git/commits{/sha}","comments_url":"https://api.github.com/repos/appacademy/active_record_lite/comments{/number}","issue_comment_url":"https://api.github.com/repos/appacademy/active_record_lite/issues/comments/{number}","contents_url":"https://api.github.com/repos/appacademy/active_record_lite/contents/{+path}","compare_url":"https://api.github.com/repos/appacademy/active_record_lite/compare/{base}...{head}","merges_url":"https://api.github.com/repos/appacademy/active_record_lite/merges","archive_url":"https://api.github.com/repos/appacademy/active_record_lite/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/appacademy/active_record_lite/downloads","issues_url":"https://api.github.com/repos/appacademy/active_record_lite/issues{/number}","pulls_url":"https://api.github.com/repos/appacademy/active_record_lite/pulls{/number}","mile
stones_url":"https://api.github.com/repos/appacademy/active_record_lite/milestones{/number}","notifications_url":"https://api.github.com/repos/appacademy/active_record_lite/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/appacademy/active_record_lite/labels{/name}","releases_url":"https://api.github.com/repos/appacademy/active_record_lite/releases{/id}","created_at":"2013-08-10T17:32:19Z","updated_at":"2014-10-23T23:33:55Z","pushed_at":"2014-10-26T23:37:38Z","git_url":"git://github.com/appacademy/active_record_lite.git","ssh_url":"git@github.com:appacademy/active_record_lite.git","clone_url":"https://github.com/appacademy/active_record_lite.git","svn_url":"https://github.com/appacademy/active_record_lite","homepage":null,"size":632,"stargazers_count":0,"watchers_count":0,"language":"Ruby","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":13,"mirror_url":null,"open_issues_count":2,"forks":13,"open_issues":2,"watchers":0,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/appacademy/active_record_lite/pulls/17"},"html":{"href":"https://github.com/appacademy/active_record_lite/pull/17"},"issue":{"href":"https://api.github.com/repos/appacademy/active_record_lite/issues/17"},"comments":{"href":"https://api.github.com/repos/appacademy/active_record_lite/issues/17/comments"},"review_comments":{"href":"https://api.github.com/repos/appacademy/active_record_lite/pulls/17/comments"},"review_comment":{"href":"https://api.github.com/repos/appacademy/active_record_lite/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/appacademy/active_record_lite/pulls/17/commits"},"statuses":{"href":"https://api.github.com/repos/appacademy/active_record_lite/statuses/b5ac327b20f2041652e3228ce4612880aae97beb"}},"merged":false,"mergeable":null,"mergeable_state":"unknown","merged_by":null,"comments":0,"review_comments":0,"commits":1,"additions":7,"deletions":1,"changed_fi
les":1}},"public":true,"created_at":"2015-01-01T01:04:07Z","org":{"id":2138704,"login":"appacademy","gravatar_id":"","url":"https://api.github.com/orgs/appacademy","avatar_url":"https://avatars.githubusercontent.com/u/2138704?"}}
{"id":"2489397654","type":"PushEvent","actor":{"id":8800150,"login":"troyeagle","gravatar_id":"","url":"https://api.github.com/users/troyeagle","avatar_url":"https://avatars.githubusercontent.com/u/8800150?"},"repo":{"id":24052643,"name":"zzt93/Hw-Client","url":"https://api.github.com/repos/zzt93/Hw-Client"},"payload":{"push_id":536753031,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"c8b1d6ea7905faf630d57ebb283d880ca6e655e7","before":"897452d98a4d094571441ac5a4f55a22884a7764","commits":[{"sha":"c8b1d6ea7905faf630d57ebb283d880ca6e655e7","author":{"email":"cae9f45d02c4e43ad3a912954969d5845cb0e620@qq.com","name":"troyeagle"},"message":"刷新","distinct":true,"url":"https://api.github.com/repos/zzt93/Hw-Client/commits/c8b1d6ea7905faf630d57ebb283d880ca6e655e7"}]},"public":true,"created_at":"2015-01-01T01:04:07Z"}
{"id":"2489397656","type":"IssueCommentEvent","actor":{"id":1932804,"login":"coldmind","gravatar_id":"","url":"https://api.github.com/users/coldmind","avatar_url":"https://avatars.githubusercontent.com/u/1932804?"},"repo":{"id":4164482,"name":"django/django","url":"https://api.github.com/repos/django/django"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/django/django/issues/3821","labels_url":"https://api.github.com/repos/django/django/issues/3821/labels{/name}","comments_url":"https://api.github.com/repos/django/django/issues/3821/comments","events_url":"https://api.github.com/repos/django/django/issues/3821/events","html_url":"https://github.com/django/django/pull/3821","id":53200969,"number":3821,"title":"[WIP] Fixed #24064 - Prevented database access in compile time in spatialite models","user":{"login":"coldmind","id":1932804,"avatar_url":"https://avatars.githubusercontent.com/u/1932804?v=3","gravatar_id":"","url":"https://api.github.com/users/coldmind","html_url":"https://github.com/coldmind","followers_url":"https://api.github.com/users/coldmind/followers","following_url":"https://api.github.com/users/coldmind/following{/other_user}","gists_url":"https://api.github.com/users/coldmind/gists{/gist_id}","starred_url":"https://api.github.com/users/coldmind/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/coldmind/subscriptions","organizations_url":"https://api.github.com/users/coldmind/orgs","repos_url":"https://api.github.com/users/coldmind/repos","events_url":"https://api.github.com/users/coldmind/events{/privacy}","received_events_url":"https://api.github.com/users/coldmind/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":5,"created_at":"2014-12-31T20:02:17Z","updated_at":"2015-01-01T01:04:07Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/django/django/pulls/3821","html_url":"https://github.com/d
jango/django/pull/3821","diff_url":"https://github.com/django/django/pull/3821.diff","patch_url":"https://github.com/django/django/pull/3821.patch"},"body":"Here is the patch that can fix problem.\r\nIdeas about improvements are welcome."},"comment":{"url":"https://api.github.com/repos/django/django/issues/comments/68477298","html_url":"https://github.com/django/django/pull/3821#issuecomment-68477298","issue_url":"https://api.github.com/repos/django/django/issues/3821","id":68477298,"user":{"login":"coldmind","id":1932804,"avatar_url":"https://avatars.githubusercontent.com/u/1932804?v=3","gravatar_id":"","url":"https://api.github.com/users/coldmind","html_url":"https://github.com/coldmind","followers_url":"https://api.github.com/users/coldmind/followers","following_url":"https://api.github.com/users/coldmind/following{/other_user}","gists_url":"https://api.github.com/users/coldmind/gists{/gist_id}","starred_url":"https://api.github.com/users/coldmind/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/coldmind/subscriptions","organizations_url":"https://api.github.com/users/coldmind/orgs","repos_url":"https://api.github.com/users/coldmind/repos","events_url":"https://api.github.com/users/coldmind/events{/privacy}","received_events_url":"https://api.github.com/users/coldmind/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:04:07Z","updated_at":"2015-01-01T01:04:07Z","body":"buildbot, test this please"}},"public":true,"created_at":"2015-01-01T01:04:07Z","org":{"id":27804,"login":"django","gravatar_id":"","url":"https://api.github.com/orgs/django","avatar_url":"https://avatars.githubusercontent.com/u/27804?"}}
{"id":"2489397661","type":"PushEvent","actor":{"id":9201970,"login":"qdm","gravatar_id":"","url":"https://api.github.com/users/qdm","avatar_url":"https://avatars.githubusercontent.com/u/9201970?"},"repo":{"id":25173910,"name":"qdm/qdm.github.io","url":"https://api.github.com/repos/qdm/qdm.github.io"},"payload":{"push_id":536753035,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"dbcd229108e512d575dcd1e4595183ce055f8e2f","before":"94683ca14e320a286452e2f2e873ff5d603f1a98","commits":[{"sha":"dbcd229108e512d575dcd1e4595183ce055f8e2f","author":{"email":"de163e90d3aeef9f404d1de71c48e234a211e3c3@gmail.com","name":"KT"},"message":"Update","distinct":true,"url":"https://api.github.com/repos/qdm/qdm.github.io/commits/dbcd229108e512d575dcd1e4595183ce055f8e2f"}]},"public":true,"created_at":"2015-01-01T01:04:08Z"}
{"id":"2489397666","type":"IssueCommentEvent","actor":{"id":405446,"login":"quickfur","gravatar_id":"","url":"https://api.github.com/users/quickfur","avatar_url":"https://avatars.githubusercontent.com/u/405446?"},"repo":{"id":1257080,"name":"D-Programming-Language/dlang.org","url":"https://api.github.com/repos/D-Programming-Language/dlang.org"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/D-Programming-Language/dlang.org/issues/734","labels_url":"https://api.github.com/repos/D-Programming-Language/dlang.org/issues/734/labels{/name}","comments_url":"https://api.github.com/repos/D-Programming-Language/dlang.org/issues/734/comments","events_url":"https://api.github.com/repos/D-Programming-Language/dlang.org/issues/734/events","html_url":"https://github.com/D-Programming-Language/dlang.org/pull/734","id":53083284,"number":734,"title":"Much nicer jump-to anchors","user":{"login":"andralex","id":566679,"avatar_url":"https://avatars.githubusercontent.com/u/566679?v=3","gravatar_id":"","url":"https://api.github.com/users/andralex","html_url":"https://github.com/andralex","followers_url":"https://api.github.com/users/andralex/followers","following_url":"https://api.github.com/users/andralex/following{/other_user}","gists_url":"https://api.github.com/users/andralex/gists{/gist_id}","starred_url":"https://api.github.com/users/andralex/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/andralex/subscriptions","organizations_url":"https://api.github.com/users/andralex/orgs","repos_url":"https://api.github.com/users/andralex/repos","events_url":"https://api.github.com/users/andralex/events{/privacy}","received_events_url":"https://api.github.com/users/andralex/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":5,"created_at":"2014-12-30T00:18:24Z","updated_at":"2015-01-01T01:04:08Z","closed_at":"2014-12-30T01:03:48Z","pull_request":{"url":"h
ttps://api.github.com/repos/D-Programming-Language/dlang.org/pulls/734","html_url":"https://github.com/D-Programming-Language/dlang.org/pull/734","diff_url":"https://github.com/D-Programming-Language/dlang.org/pull/734.diff","patch_url":"https://github.com/D-Programming-Language/dlang.org/pull/734.patch"},"body":"Example: http://erdani.com/d/phobos-prerelease/std_range_package.html"},"comment":{"url":"https://api.github.com/repos/D-Programming-Language/dlang.org/issues/comments/68477299","html_url":"https://github.com/D-Programming-Language/dlang.org/pull/734#issuecomment-68477299","issue_url":"https://api.github.com/repos/D-Programming-Language/dlang.org/issues/734","id":68477299,"user":{"login":"quickfur","id":405446,"avatar_url":"https://avatars.githubusercontent.com/u/405446?v=3","gravatar_id":"","url":"https://api.github.com/users/quickfur","html_url":"https://github.com/quickfur","followers_url":"https://api.github.com/users/quickfur/followers","following_url":"https://api.github.com/users/quickfur/following{/other_user}","gists_url":"https://api.github.com/users/quickfur/gists{/gist_id}","starred_url":"https://api.github.com/users/quickfur/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/quickfur/subscriptions","organizations_url":"https://api.github.com/users/quickfur/orgs","repos_url":"https://api.github.com/users/quickfur/repos","events_url":"https://api.github.com/users/quickfur/events{/privacy}","received_events_url":"https://api.github.com/users/quickfur/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:04:08Z","updated_at":"2015-01-01T01:04:08Z","body":"This PR has broken Phobos docs builds. If you clone a clean copy of dlang.org and phobos and build dlang.org then `cd phobos; make -f posix.mak html`, it will produce documentation pages with no content in `phobos-prerelease`. 
I'd revert this PR, but the github reverter seems to have trouble with this, as it appears to be conflicting with subsequent changes in the repo."}},"public":true,"created_at":"2015-01-01T01:04:08Z","org":{"id":565913,"login":"D-Programming-Language","gravatar_id":"","url":"https://api.github.com/orgs/D-Programming-Language","avatar_url":"https://avatars.githubusercontent.com/u/565913?"}}
{"id":"2489397678","type":"PushEvent","actor":{"id":1017605,"login":"wangshan","gravatar_id":"","url":"https://api.github.com/users/wangshan","avatar_url":"https://avatars.githubusercontent.com/u/1017605?"},"repo":{"id":28666633,"name":"wangshan/wangshan.github.io","url":"https://api.github.com/repos/wangshan/wangshan.github.io"},"payload":{"push_id":536753040,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"0efdedb4a49bebd1456119ad89cad76ada7e2c91","before":"5a94fdd12e5d88be38cca22321e943d374d3e4d5","commits":[{"sha":"0efdedb4a49bebd1456119ad89cad76ada7e2c91","author":{"email":"e3e97680eb29c788f35181af31eb442b3251e18f@gmail.com","name":"Shan"},"message":"Update 2012-03-03-mac-development-environment-setup.md","distinct":true,"url":"https://api.github.com/repos/wangshan/wangshan.github.io/commits/0efdedb4a49bebd1456119ad89cad76ada7e2c91"}]},"public":true,"created_at":"2015-01-01T01:04:10Z"}
{"id":"2489397679","type":"PushEvent","actor":{"id":5202416,"login":"Hardmath123","gravatar_id":"","url":"https://api.github.com/users/Hardmath123","avatar_url":"https://avatars.githubusercontent.com/u/5202416?"},"repo":{"id":16244731,"name":"Hardmath123/hardmath123.github.io","url":"https://api.github.com/repos/Hardmath123/hardmath123.github.io"},"payload":{"push_id":536753041,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"f030c9bc614ac41d120f96aa33a1a9d386851f6e","before":"a3a57f52045048dda77f285c9da30fcbfafda094","commits":[{"sha":"0ffe5ea18ffb4330fd8fd85058dd563fe978d4e6","author":{"email":"430380b60638190ff73296b54585d989728b087a@gmail.com","name":"Hardmath123"},"message":"header in helvetica","distinct":true,"url":"https://api.github.com/repos/Hardmath123/hardmath123.github.io/commits/0ffe5ea18ffb4330fd8fd85058dd563fe978d4e6"},{"sha":"f030c9bc614ac41d120f96aa33a1a9d386851f6e","author":{"email":"430380b60638190ff73296b54585d989728b087a@gmail.com","name":"Hardmath123"},"message":"ok justification was a mistake. i can't justify that decision...","distinct":true,"url":"https://api.github.com/repos/Hardmath123/hardmath123.github.io/commits/f030c9bc614ac41d120f96aa33a1a9d386851f6e"}]},"public":true,"created_at":"2015-01-01T01:04:10Z"}
{"id":"2489397681","type":"PushEvent","actor":{"id":11417,"login":"malept","gravatar_id":"","url":"https://api.github.com/users/malept","avatar_url":"https://avatars.githubusercontent.com/u/11417?"},"repo":{"id":22760055,"name":"malept/octoaudit","url":"https://api.github.com/repos/malept/octoaudit"},"payload":{"push_id":536753042,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"50e1f3dcd88d928c991b8a5a1b85d797e27aa54b","before":"d306ec83113e82e1d11244084dc47333360aefda","commits":[{"sha":"50e1f3dcd88d928c991b8a5a1b85d797e27aa54b","author":{"email":"1133a844dd6eb8a9702546324bc949f27bda666a@lazymalevolence.com","name":"Mark Lee"},"message":"Travis: account for cache directory creation","distinct":true,"url":"https://api.github.com/repos/malept/octoaudit/commits/50e1f3dcd88d928c991b8a5a1b85d797e27aa54b"}]},"public":true,"created_at":"2015-01-01T01:04:10Z"}
{"id":"2489397683","type":"IssuesEvent","actor":{"id":716644,"login":"amandaharlin","gravatar_id":"","url":"https://api.github.com/users/amandaharlin","avatar_url":"https://avatars.githubusercontent.com/u/716644?"},"repo":{"id":24870992,"name":"codeforokc/codeforokc","url":"https://api.github.com/repos/codeforokc/codeforokc"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/codeforokc/codeforokc/issues/5","labels_url":"https://api.github.com/repos/codeforokc/codeforokc/issues/5/labels{/name}","comments_url":"https://api.github.com/repos/codeforokc/codeforokc/issues/5/comments","events_url":"https://api.github.com/repos/codeforokc/codeforokc/issues/5/events","html_url":"https://github.com/codeforokc/codeforokc/issues/5","id":53210256,"number":5,"title":"Other pages to add?","user":{"login":"amandaharlin","id":716644,"avatar_url":"https://avatars.githubusercontent.com/u/716644?v=3","gravatar_id":"","url":"https://api.github.com/users/amandaharlin","html_url":"https://github.com/amandaharlin","followers_url":"https://api.github.com/users/amandaharlin/followers","following_url":"https://api.github.com/users/amandaharlin/following{/other_user}","gists_url":"https://api.github.com/users/amandaharlin/gists{/gist_id}","starred_url":"https://api.github.com/users/amandaharlin/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/amandaharlin/subscriptions","organizations_url":"https://api.github.com/users/amandaharlin/orgs","repos_url":"https://api.github.com/users/amandaharlin/repos","events_url":"https://api.github.com/users/amandaharlin/events{/privacy}","received_events_url":"https://api.github.com/users/amandaharlin/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:04:10Z","updated_at":"2015-01-01T01:04:10Z","closed_at":null,"body":"In the config.yml i saw other not-yet-implemented menu items, like:\r\n\r\n  
#Meetings: /meetings\r\n  #Forum: https://github.com/codeforokc/discussions/issues\r\n  #Chat: https://gitter.im/codeforokc/discussions\r\n  #Join Us: /join-us\r\n  #Archives: /archives\r\n\r\ndo you want to add these in still?"}},"public":true,"created_at":"2015-01-01T01:04:11Z","org":{"id":8738523,"login":"codeforokc","gravatar_id":"","url":"https://api.github.com/orgs/codeforokc","avatar_url":"https://avatars.githubusercontent.com/u/8738523?"}}
{"id":"2489397686","type":"PushEvent","actor":{"id":5384580,"login":"oridb","gravatar_id":"","url":"https://api.github.com/users/oridb","avatar_url":"https://avatars.githubusercontent.com/u/5384580?"},"repo":{"id":16144976,"name":"oridb/mc","url":"https://api.github.com/repos/oridb/mc"},"payload":{"push_id":536753043,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"fc13f8699b5f3702525fcf5a2692b1800763aa53","before":"d45042b7a8b06f0bc1a82a4aa32687aef08cf2b2","commits":[{"sha":"fc13f8699b5f3702525fcf5a2692b1800763aa53","author":{"email":"6c720b6ece72a4972cc39d6436cb370514e267ec@eigenstate.org","name":"Ori Bernstein"},"message":"Fix up libstd on plan9.","distinct":true,"url":"https://api.github.com/repos/oridb/mc/commits/fc13f8699b5f3702525fcf5a2692b1800763aa53"}]},"public":true,"created_at":"2015-01-01T01:04:11Z"}
{"id":"2489397693","type":"PushEvent","actor":{"id":1026154,"login":"Fizzadar","gravatar_id":"","url":"https://api.github.com/users/Fizzadar","avatar_url":"https://avatars.githubusercontent.com/u/1026154?"},"repo":{"id":28368289,"name":"Fizzadar/multiselect","url":"https://api.github.com/repos/Fizzadar/multiselect"},"payload":{"push_id":536753046,"size":2,"distinct_size":2,"ref":"refs/heads/develop","head":"aa30e8c6c8be5ab3095b78a53f9a48607217caea","before":"596c8a453d7a734053f9688663abf5061b7dca33","commits":[{"sha":"fb51964b06e1a83ea9f2233014ea43cb4ff42636","author":{"email":"75ef9faee755c70589550b513ad881e5a603182c@oxygem.com","name":"Nick Barrett"},"message":"Correct bug in initalizing option lists","distinct":true,"url":"https://api.github.com/repos/Fizzadar/multiselect/commits/fb51964b06e1a83ea9f2233014ea43cb4ff42636"},{"sha":"aa30e8c6c8be5ab3095b78a53f9a48607217caea","author":{"email":"75ef9faee755c70589550b513ad881e5a603182c@oxygem.com","name":"Nick Barrett"},"message":"+build","distinct":true,"url":"https://api.github.com/repos/Fizzadar/multiselect/commits/aa30e8c6c8be5ab3095b78a53f9a48607217caea"}]},"public":true,"created_at":"2015-01-01T01:04:12Z"}
{"id":"2489397694","type":"PushEvent","actor":{"id":2263283,"login":"iraikov","gravatar_id":"","url":"https://api.github.com/users/iraikov","avatar_url":"https://avatars.githubusercontent.com/u/2263283?"},"repo":{"id":22903078,"name":"iraikov/Sims.jl","url":"https://api.github.com/repos/iraikov/Sims.jl"},"payload":{"push_id":536753047,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"418f7577926273d814040ede54f0873ae5b9d17e","before":"bffecb12bb56348f7065ad7670144bd787799879","commits":[{"sha":"418f7577926273d814040ede54f0873ae5b9d17e","author":{"email":"af431cb13887b0da5947004f417999c37e85ed49@gmail.com","name":"Ivan Raikov"},"message":"copy parameters on structural changes to ensure any modifications are preserved","distinct":true,"url":"https://api.github.com/repos/iraikov/Sims.jl/commits/418f7577926273d814040ede54f0873ae5b9d17e"}]},"public":true,"created_at":"2015-01-01T01:04:12Z"}
{"id":"2489397701","type":"PushEvent","actor":{"id":378599,"login":"deborah-ufw","gravatar_id":"","url":"https://api.github.com/users/deborah-ufw","avatar_url":"https://avatars.githubusercontent.com/u/378599?"},"repo":{"id":23501674,"name":"deborah-ufw/deborah-ufw.github.io","url":"https://api.github.com/repos/deborah-ufw/deborah-ufw.github.io"},"payload":{"push_id":536753051,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"ad602b16440a0546ffde289477a3699a8b7a1800","before":"636739a0b83baf6ccd6b38a78f49502363a19778","commits":[{"sha":"ad602b16440a0546ffde289477a3699a8b7a1800","author":{"email":"b0969288fc07bf7a2f076f214eeab18bf2a0cd1c@hotmail.com","name":"deborah"},"message":"ticket tweak question for complete mode","distinct":true,"url":"https://api.github.com/repos/deborah-ufw/deborah-ufw.github.io/commits/ad602b16440a0546ffde289477a3699a8b7a1800"}]},"public":true,"created_at":"2015-01-01T01:04:13Z"}
{"id":"2489397702","type":"WatchEvent","actor":{"id":220358,"login":"ankane","gravatar_id":"","url":"https://api.github.com/users/ankane","avatar_url":"https://avatars.githubusercontent.com/u/220358?"},"repo":{"id":1359757,"name":"SchemaPlus/schema_plus","url":"https://api.github.com/repos/SchemaPlus/schema_plus"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:04:14Z","org":{"id":614848,"login":"SchemaPlus","gravatar_id":"","url":"https://api.github.com/orgs/SchemaPlus","avatar_url":"https://avatars.githubusercontent.com/u/614848?"}}
{"id":"2489397706","type":"PushEvent","actor":{"id":1558033,"login":"wpears","gravatar_id":"","url":"https://api.github.com/users/wpears","avatar_url":"https://avatars.githubusercontent.com/u/1558033?"},"repo":{"id":23894134,"name":"wpears/twopane","url":"https://api.github.com/repos/wpears/twopane"},"payload":{"push_id":536753053,"size":1,"distinct_size":1,"ref":"refs/heads/dev","head":"d8c403b3bceb31ce36ff1c0b5e7fcf18bc7914fc","before":"d81881adaff8ddb3e0da1d02315ab74efa175102","commits":[{"sha":"d8c403b3bceb31ce36ff1c0b5e7fcf18bc7914fc","author":{"email":"ce362ed51a9d769761b4ab97740ccf6e6615e394@gmail.com","name":"Wyatt Pearsall"},"message":"Cleaned up twopane.js","distinct":true,"url":"https://api.github.com/repos/wpears/twopane/commits/d8c403b3bceb31ce36ff1c0b5e7fcf18bc7914fc"}]},"public":true,"created_at":"2015-01-01T01:04:14Z"}
{"id":"2489397709","type":"PushEvent","actor":{"id":280212,"login":"KenanSulayman","gravatar_id":"","url":"https://api.github.com/users/KenanSulayman","avatar_url":"https://avatars.githubusercontent.com/u/280212?"},"repo":{"id":21481110,"name":"KenanSulayman/heartbeat","url":"https://api.github.com/repos/KenanSulayman/heartbeat"},"payload":{"push_id":536753054,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f673aef9bc6b115cda55214d362fde50d301ea25","before":"c085f224e47c8147e6085f897cb91a07834211b1","commits":[{"sha":"f673aef9bc6b115cda55214d362fde50d301ea25","author":{"email":"9176253dfc0bc82671a5e984646605f93319147a@sly.mn","name":"Kenan Sulayman"},"message":"1420074253830\n\n36ErTuCI1v1YILLcBrCP+M1Dl7YcJfq0JhOl6oV84vA=","distinct":true,"url":"https://api.github.com/repos/KenanSulayman/heartbeat/commits/f673aef9bc6b115cda55214d362fde50d301ea25"}]},"public":true,"created_at":"2015-01-01T01:04:15Z"}
{"id":"2489397720","type":"PushEvent","actor":{"id":6298185,"login":"salrodgom","gravatar_id":"","url":"https://api.github.com/users/salrodgom","avatar_url":"https://avatars.githubusercontent.com/u/6298185?"},"repo":{"id":28646555,"name":"salrodgom/MC-MD_hybrid_cycles","url":"https://api.github.com/repos/salrodgom/MC-MD_hybrid_cycles"},"payload":{"push_id":536753057,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d2e6b275229477c0b9f94bcb22452f56402643a8","before":"a762ae78e5c09457dcced64e3a6f6138906759f3","commits":[{"sha":"d2e6b275229477c0b9f94bcb22452f56402643a8","author":{"email":"98ac177e5ce7190d101150b0bffa6dca0bd0984b@hipocampo.upo.es","name":"Salvador Rodríguez Gómez"},"message":"modified:   mc_md_script_opti.sct","distinct":true,"url":"https://api.github.com/repos/salrodgom/MC-MD_hybrid_cycles/commits/d2e6b275229477c0b9f94bcb22452f56402643a8"}]},"public":true,"created_at":"2015-01-01T01:04:17Z"}
{"id":"2489397721","type":"PushEvent","actor":{"id":10144074,"login":"carodew","gravatar_id":"","url":"https://api.github.com/users/carodew","avatar_url":"https://avatars.githubusercontent.com/u/10144074?"},"repo":{"id":27844858,"name":"carodew/carodew.github.io","url":"https://api.github.com/repos/carodew/carodew.github.io"},"payload":{"push_id":536753058,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"62bd3e248d57b48720930200d73b4273993a2e66","before":"19643dcb3388a0ae99570e176fc592e0fd666c81","commits":[{"sha":"62bd3e248d57b48720930200d73b4273993a2e66","author":{"email":"6e3c6f0214740e9061d9ca5c79eb6e0ff9cc1741@unknown542696dd77af.gateway.pace.com","name":"Carolyn"},"message":"update ux projects to new format","distinct":true,"url":"https://api.github.com/repos/carodew/carodew.github.io/commits/62bd3e248d57b48720930200d73b4273993a2e66"}]},"public":true,"created_at":"2015-01-01T01:04:17Z"}
{"id":"2489397722","type":"IssueCommentEvent","actor":{"id":279669,"login":"sachin-handiekar","gravatar_id":"","url":"https://api.github.com/users/sachin-handiekar","avatar_url":"https://avatars.githubusercontent.com/u/279669?"},"repo":{"id":1987667,"name":"sachin-handiekar/jInstagram","url":"https://api.github.com/repos/sachin-handiekar/jInstagram"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/sachin-handiekar/jInstagram/issues/78","labels_url":"https://api.github.com/repos/sachin-handiekar/jInstagram/issues/78/labels{/name}","comments_url":"https://api.github.com/repos/sachin-handiekar/jInstagram/issues/78/comments","events_url":"https://api.github.com/repos/sachin-handiekar/jInstagram/issues/78/events","html_url":"https://github.com/sachin-handiekar/jInstagram/issues/78","id":53177876,"number":78,"title":"Configure Travis-CI build to deploy snapshot to Maven Repositories","user":{"login":"sachin-handiekar","id":279669,"avatar_url":"https://avatars.githubusercontent.com/u/279669?v=3","gravatar_id":"","url":"https://api.github.com/users/sachin-handiekar","html_url":"https://github.com/sachin-handiekar","followers_url":"https://api.github.com/users/sachin-handiekar/followers","following_url":"https://api.github.com/users/sachin-handiekar/following{/other_user}","gists_url":"https://api.github.com/users/sachin-handiekar/gists{/gist_id}","starred_url":"https://api.github.com/users/sachin-handiekar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/sachin-handiekar/subscriptions","organizations_url":"https://api.github.com/users/sachin-handiekar/orgs","repos_url":"https://api.github.com/users/sachin-handiekar/repos","events_url":"https://api.github.com/users/sachin-handiekar/events{/privacy}","received_events_url":"https://api.github.com/users/sachin-handiekar/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/sachin-handiekar/jInstagram/labels/infrastructure","name":"in
frastructure","color":"fbca04"}],"state":"closed","locked":false,"assignee":{"login":"sachin-handiekar","id":279669,"avatar_url":"https://avatars.githubusercontent.com/u/279669?v=3","gravatar_id":"","url":"https://api.github.com/users/sachin-handiekar","html_url":"https://github.com/sachin-handiekar","followers_url":"https://api.github.com/users/sachin-handiekar/followers","following_url":"https://api.github.com/users/sachin-handiekar/following{/other_user}","gists_url":"https://api.github.com/users/sachin-handiekar/gists{/gist_id}","starred_url":"https://api.github.com/users/sachin-handiekar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/sachin-handiekar/subscriptions","organizations_url":"https://api.github.com/users/sachin-handiekar/orgs","repos_url":"https://api.github.com/users/sachin-handiekar/repos","events_url":"https://api.github.com/users/sachin-handiekar/events{/privacy}","received_events_url":"https://api.github.com/users/sachin-handiekar/received_events","type":"User","site_admin":false},"milestone":null,"comments":1,"created_at":"2014-12-31T10:37:34Z","updated_at":"2015-01-01T01:04:17Z","closed_at":"2015-01-01T01:04:17Z","body":"Configure Travis-CI build to deploy snapshot to Maven 
Repositories\r\n\r\nhttp://notbarjo.blogspot.co.uk/2014/09/travis-ci-maven-deploy.html"},"comment":{"url":"https://api.github.com/repos/sachin-handiekar/jInstagram/issues/comments/68477301","html_url":"https://github.com/sachin-handiekar/jInstagram/issues/78#issuecomment-68477301","issue_url":"https://api.github.com/repos/sachin-handiekar/jInstagram/issues/78","id":68477301,"user":{"login":"sachin-handiekar","id":279669,"avatar_url":"https://avatars.githubusercontent.com/u/279669?v=3","gravatar_id":"","url":"https://api.github.com/users/sachin-handiekar","html_url":"https://github.com/sachin-handiekar","followers_url":"https://api.github.com/users/sachin-handiekar/followers","following_url":"https://api.github.com/users/sachin-handiekar/following{/other_user}","gists_url":"https://api.github.com/users/sachin-handiekar/gists{/gist_id}","starred_url":"https://api.github.com/users/sachin-handiekar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/sachin-handiekar/subscriptions","organizations_url":"https://api.github.com/users/sachin-handiekar/orgs","repos_url":"https://api.github.com/users/sachin-handiekar/repos","events_url":"https://api.github.com/users/sachin-handiekar/events{/privacy}","received_events_url":"https://api.github.com/users/sachin-handiekar/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:04:17Z","updated_at":"2015-01-01T01:04:17Z","body":"Updated pom.xml and .travis.yml to upload snapshot to snapshot repository. \r\n\r\nhttps://oss.sonatype.org/content/repositories/snapshots/com/sachinhandiekar/jInstagram/"}},"public":true,"created_at":"2015-01-01T01:04:18Z"}
{"id":"2489397723","type":"IssuesEvent","actor":{"id":279669,"login":"sachin-handiekar","gravatar_id":"","url":"https://api.github.com/users/sachin-handiekar","avatar_url":"https://avatars.githubusercontent.com/u/279669?"},"repo":{"id":1987667,"name":"sachin-handiekar/jInstagram","url":"https://api.github.com/repos/sachin-handiekar/jInstagram"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/sachin-handiekar/jInstagram/issues/78","labels_url":"https://api.github.com/repos/sachin-handiekar/jInstagram/issues/78/labels{/name}","comments_url":"https://api.github.com/repos/sachin-handiekar/jInstagram/issues/78/comments","events_url":"https://api.github.com/repos/sachin-handiekar/jInstagram/issues/78/events","html_url":"https://github.com/sachin-handiekar/jInstagram/issues/78","id":53177876,"number":78,"title":"Configure Travis-CI build to deploy snapshot to Maven Repositories","user":{"login":"sachin-handiekar","id":279669,"avatar_url":"https://avatars.githubusercontent.com/u/279669?v=3","gravatar_id":"","url":"https://api.github.com/users/sachin-handiekar","html_url":"https://github.com/sachin-handiekar","followers_url":"https://api.github.com/users/sachin-handiekar/followers","following_url":"https://api.github.com/users/sachin-handiekar/following{/other_user}","gists_url":"https://api.github.com/users/sachin-handiekar/gists{/gist_id}","starred_url":"https://api.github.com/users/sachin-handiekar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/sachin-handiekar/subscriptions","organizations_url":"https://api.github.com/users/sachin-handiekar/orgs","repos_url":"https://api.github.com/users/sachin-handiekar/repos","events_url":"https://api.github.com/users/sachin-handiekar/events{/privacy}","received_events_url":"https://api.github.com/users/sachin-handiekar/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/sachin-handiekar/jInstagram/labels/infrastructure","name":"infrastru
cture","color":"fbca04"}],"state":"closed","locked":false,"assignee":{"login":"sachin-handiekar","id":279669,"avatar_url":"https://avatars.githubusercontent.com/u/279669?v=3","gravatar_id":"","url":"https://api.github.com/users/sachin-handiekar","html_url":"https://github.com/sachin-handiekar","followers_url":"https://api.github.com/users/sachin-handiekar/followers","following_url":"https://api.github.com/users/sachin-handiekar/following{/other_user}","gists_url":"https://api.github.com/users/sachin-handiekar/gists{/gist_id}","starred_url":"https://api.github.com/users/sachin-handiekar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/sachin-handiekar/subscriptions","organizations_url":"https://api.github.com/users/sachin-handiekar/orgs","repos_url":"https://api.github.com/users/sachin-handiekar/repos","events_url":"https://api.github.com/users/sachin-handiekar/events{/privacy}","received_events_url":"https://api.github.com/users/sachin-handiekar/received_events","type":"User","site_admin":false},"milestone":null,"comments":1,"created_at":"2014-12-31T10:37:34Z","updated_at":"2015-01-01T01:04:17Z","closed_at":"2015-01-01T01:04:17Z","body":"Configure Travis-CI build to deploy snapshot to Maven Repositories\r\n\r\nhttp://notbarjo.blogspot.co.uk/2014/09/travis-ci-maven-deploy.html"}},"public":true,"created_at":"2015-01-01T01:04:18Z"}
{"id":"2489397727","type":"CreateEvent","actor":{"id":9505729,"login":"alishadot","gravatar_id":"","url":"https://api.github.com/users/alishadot","avatar_url":"https://avatars.githubusercontent.com/u/9505729?"},"repo":{"id":28678253,"name":"alishadot/keepcloud","url":"https://api.github.com/repos/alishadot/keepcloud"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:04:18Z"}
{"id":"2489397731","type":"PullRequestReviewCommentEvent","actor":{"id":523287,"login":"j2sol","gravatar_id":"","url":"https://api.github.com/users/j2sol","avatar_url":"https://avatars.githubusercontent.com/u/523287?"},"repo":{"id":11848896,"name":"blueboxgroup/ursula","url":"https://api.github.com/repos/blueboxgroup/ursula"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397281","id":22397281,"diff_hunk":"@@ -1,121 +1,92 @@\n ---\n-- name: install apache\n-  apt: pkg={{ item }}\n-  with_items:\n-    - apache2\n-    - libapache2-mod-wsgi\n-\n - name: lesscpy must be in apache PATH\n   pip: name=lesscpy version=0.9j\n \n - name: get horizon source repo\n-  git: repo={{ openstack.git_mirror }}/horizon.git\n-       dest=/opt/stack/horizon\n-       version={{ horizon.rev }}\n-       update={{ openstack.git_update }}\n+  git: |\n+    repo={{ openstack.git_mirror}}/horizon.git\n+    dest=/opt/stack/horizon\n+    version={{ horizon.rev }}\n+    update={{ openstack.git_update }}\n   notify:\n     - setup horizon venv\n     - compress horizon assets\n \n-- template: src=opt/stack/horizon/hide-external-networks.patch dest=/opt/stack/horizon/hide-external-networks.patch mode=0644\n-- shell: patch -p1 < hide-external-networks.patch chdir=/opt/stack/horizon\n-  notify:\n-    - setup horizon venv\n-\n - name: add python-memcached to horizon requirements\n-  lineinfile: dest=/opt/stack/horizon/requirements.txt\n-              regexp=^python-memcached\n-              line=python-memcached\n+  lineinfile: dest=/opt/stack/horizon/requirements.txt regexp=^python-memcached line=python-memcached\n   notify:\n     - setup horizon venv\n \n-- name: disable apache status\n-  command: a2dismod status\n-  notify:\n-    - restart apache\n-\n-- name: apache ports config\n-  template: src=etc/apache2/ports.conf\n-            dest=/etc/apache2/ports.conf\n-  notify:\n-    - restart apache\n-\n-- name: disable default apache 
site\n-  command: a2dissite 000-default\n+- name: make sure apache knows about horizon ports\n+  lineinfile: dest=/etc/apache2/ports.conf line=\"Listen 8080\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config (12.04)\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard\n+- name: create dashboard virtualhost on precise\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard\n   when: ansible_distribution_version == \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard.conf\n+- name: create dashboard virtualhost on other\n+  template: |","path":"roles/horizon/tasks/main.yml","position":73,"original_position":73,"commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","original_commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"j2sol","id":523287,"avatar_url":"https://avatars.githubusercontent.com/u/523287?v=3","gravatar_id":"","url":"https://api.github.com/users/j2sol","html_url":"https://github.com/j2sol","followers_url":"https://api.github.com/users/j2sol/followers","following_url":"https://api.github.com/users/j2sol/following{/other_user}","gists_url":"https://api.github.com/users/j2sol/gists{/gist_id}","starred_url":"https://api.github.com/users/j2sol/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/j2sol/subscriptions","organizations_url":"https://api.github.com/users/j2sol/orgs","repos_url":"https://api.github.com/users/j2sol/repos","events_url":"https://api.github.com/users/j2sol/events{/privacy}","received_events_url":"https://api.github.com/users/j2sol/received_events","type":"User","site_admin":false},"body":"why 
the continuation?","created_at":"2015-01-01T01:04:18Z","updated_at":"2015-01-01T01:04:18Z","html_url":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397281","pull_request_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397281"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397281"},"pull_request":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"}}},"pull_request":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","id":26738851,"html_url":"https://github.com/blueboxgroup/ursula/pull/705","diff_url":"https://github.com/blueboxgroup/ursula/pull/705.diff","patch_url":"https://github.com/blueboxgroup/ursula/pull/705.patch","issue_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705","number":705,"state":"open","locked":false,"title":"WIP:  apache for loadbalancing","user":{"login":"paulczar","id":2488346,"avatar_url":"https://avatars.githubusercontent.com/u/2488346?v=3","gravatar_id":"","url":"https://api.github.com/users/paulczar","html_url":"https://github.com/paulczar","followers_url":"https://api.github.com/users/paulczar/followers","following_url":"https://api.github.com/users/paulczar/following{/other_user}","gists_url":"https://api.github.com/users/paulczar/gists{/gist_id}","starred_url":"https://api.github.com/users/paulczar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/paulczar/subscriptions","organizations_url":"https://api.github.com/users/paulczar/orgs","repos_url":"https://api.github.com/users/paulczar/repos","events_url":"https://api.github.com/users/paulczar/events{/privacy}","received_events_url":"https://api.github.com/users/paulczar/received_events","type":"User","site_admin":false},"body":"This is a quick POC / WIP to demo using apache instead of haproxy for loadbalancing our APIs.\r\n\r\nI think this gives us more 
flexibiltiy as we can enable in the APIs role itself ( in this case in keystone ) rather than a big monolithic haproxy.conf.      We also already have apache running for horizon, so it could reduce number of services.    apache also has better logging options that haproxy which can only log to syslog. ","created_at":"2015-01-01T00:04:13Z","updated_at":"2015-01-01T01:04:18Z","closed_at":null,"merged_at":null,"merge_commit_sha":"9b91693f11e166c9ee53836f19697868d412bf76","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits","review_comments_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments","review_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f","head":{"label":"blueboxgroup:use_apache_for_lb","ref":"use_apache_for_lb","sha":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type
":"Organization","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating 
OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/commen
ts/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"base":{"label":"blueboxgroup:master","ref":"master","sha":"34b83c65ff0de2f8b006d8ce4f76919fe0167bbf","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/fo
llowing{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating 
OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/commen
ts/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705"},"issue":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705"},"comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments"},"review_comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments"},"review_comment":{"href":"https://
api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits"},"statuses":{"href":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f"}}}},"public":true,"created_at":"2015-01-01T01:04:18Z","org":{"id":458705,"login":"blueboxgroup","gravatar_id":"","url":"https://api.github.com/orgs/blueboxgroup","avatar_url":"https://avatars.githubusercontent.com/u/458705?"}}
{"id":"2489397732","type":"PushEvent","actor":{"id":5728403,"login":"patrick-hudson","gravatar_id":"","url":"https://api.github.com/users/patrick-hudson","avatar_url":"https://avatars.githubusercontent.com/u/5728403?"},"repo":{"id":25392255,"name":"patrick-hudson/EggDrop","url":"https://api.github.com/repos/patrick-hudson/EggDrop"},"payload":{"push_id":536753062,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"84116936c4f6805f56a1e643eb9898ebdc854334","before":"cb11cf77a4d9d7625c14e50c27fe61d387d2c95e","commits":[{"sha":"84116936c4f6805f56a1e643eb9898ebdc854334","author":{"email":"cbb7353e6d953ef360baf960c122346276c6e320@hudson.bz","name":"Patrick Hudson"},"message":"Scripted auto-commit on change (2014-12-31 20:04:17) by gitwatch.sh","distinct":true,"url":"https://api.github.com/repos/patrick-hudson/EggDrop/commits/84116936c4f6805f56a1e643eb9898ebdc854334"}]},"public":true,"created_at":"2015-01-01T01:04:19Z"}
{"id":"2489397735","type":"PushEvent","actor":{"id":419567,"login":"kethinov","gravatar_id":"","url":"https://api.github.com/users/kethinov","avatar_url":"https://avatars.githubusercontent.com/u/419567?"},"repo":{"id":24020924,"name":"kethinov/node-webkit-app-template","url":"https://api.github.com/repos/kethinov/node-webkit-app-template"},"payload":{"push_id":536753063,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"5048243e66f207ee8e325e1b2b3bfa24505d8ebf","before":"b4dbedc97bcd361f835762d676533f1879d99151","commits":[{"sha":"5048243e66f207ee8e325e1b2b3bfa24505d8ebf","author":{"email":"63dafb7843374487f4b5809d77124751ec24f51b@gmail.com","name":"Eric Newport"},"message":"issue link","distinct":true,"url":"https://api.github.com/repos/kethinov/node-webkit-app-template/commits/5048243e66f207ee8e325e1b2b3bfa24505d8ebf"}]},"public":true,"created_at":"2015-01-01T01:04:19Z"}
{"id":"2489397736","type":"PushEvent","actor":{"id":7126826,"login":"laufi","gravatar_id":"","url":"https://api.github.com/users/laufi","avatar_url":"https://avatars.githubusercontent.com/u/7126826?"},"repo":{"id":28243875,"name":"laufi/heisserdraht-nova","url":"https://api.github.com/repos/laufi/heisserdraht-nova"},"payload":{"push_id":536753064,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"818fe73d0bde07012797b8e347a1c9c83af244be","before":"230f624d56385ab4d3cb8c6a67d5956b16d1f66e","commits":[{"sha":"d77e08b7213a6529dc6484b5997120970f3315a5","author":{"email":"b45c0673cfcf01be8a6ebb140d24652d100db872@outlook.com","name":"laufi"},"message":"BUGFIX: Auch Konstruktor mit zwei Eingabefeldern müsste float sein!","distinct":true,"url":"https://api.github.com/repos/laufi/heisserdraht-nova/commits/d77e08b7213a6529dc6484b5997120970f3315a5"},{"sha":"818fe73d0bde07012797b8e347a1c9c83af244be","author":{"email":"b45c0673cfcf01be8a6ebb140d24652d100db872@outlook.com","name":"laufi"},"message":"Möglichkeit sich mit Namen einzutragen eingefügt","distinct":true,"url":"https://api.github.com/repos/laufi/heisserdraht-nova/commits/818fe73d0bde07012797b8e347a1c9c83af244be"}]},"public":true,"created_at":"2015-01-01T01:04:19Z"}
{"id":"2489397739","type":"PushEvent","actor":{"id":10176820,"login":"chalavadivishnu","gravatar_id":"","url":"https://api.github.com/users/chalavadivishnu","avatar_url":"https://avatars.githubusercontent.com/u/10176820?"},"repo":{"id":28678150,"name":"chalavadivishnu/Face-Detection","url":"https://api.github.com/repos/chalavadivishnu/Face-Detection"},"payload":{"push_id":536753066,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b5f47548e309ef787dfcd2c424330ff2a645956b","before":"96f7f02d9551bb3c922c9c6303b9d144e2c31398","commits":[{"sha":"b5f47548e309ef787dfcd2c424330ff2a645956b","author":{"email":"ce8044f02eb2a26b631671f5297317036d398e79@gmail.com","name":"Chalavadi Vishnu"},"message":"training images function","distinct":true,"url":"https://api.github.com/repos/chalavadivishnu/Face-Detection/commits/b5f47548e309ef787dfcd2c424330ff2a645956b"}]},"public":true,"created_at":"2015-01-01T01:04:20Z"}
{"id":"2489397743","type":"PushEvent","actor":{"id":7992035,"login":"amycodes","gravatar_id":"","url":"https://api.github.com/users/amycodes","avatar_url":"https://avatars.githubusercontent.com/u/7992035?"},"repo":{"id":28671701,"name":"amycodes/stackexchange-findanswers","url":"https://api.github.com/repos/amycodes/stackexchange-findanswers"},"payload":{"push_id":536753069,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d925c0b925a4eefd5b2402dfc42f4ba9e1f1d3cc","before":"0e67154d9b55e9f5adb516ea0ba99bf635c1585e","commits":[{"sha":"d925c0b925a4eefd5b2402dfc42f4ba9e1f1d3cc","author":{"email":"da0cee525ea095cebd642feb98c0fe5678fb7db3@get.it","name":"Amy Negrette"},"message":"Changed [] to array() to work in prod","distinct":true,"url":"https://api.github.com/repos/amycodes/stackexchange-findanswers/commits/d925c0b925a4eefd5b2402dfc42f4ba9e1f1d3cc"}]},"public":true,"created_at":"2015-01-01T01:04:20Z"}
{"id":"2489397744","type":"PushEvent","actor":{"id":10313856,"login":"uhumph","gravatar_id":"","url":"https://api.github.com/users/uhumph","avatar_url":"https://avatars.githubusercontent.com/u/10313856?"},"repo":{"id":28540040,"name":"uhumph/docker-mailstack","url":"https://api.github.com/repos/uhumph/docker-mailstack"},"payload":{"push_id":536753070,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"8ff001a4315046f5578f9ad30493d6a5ccafe099","before":"da210967679d5ef4169fcb6102003bfd4df0384e","commits":[{"sha":"8ff001a4315046f5578f9ad30493d6a5ccafe099","author":{"email":"911c8ba17707a1b9f8955686b6e596e09ecc489d@slo-computer.com","name":"uhumph"},"message":"Update setup.sh","distinct":true,"url":"https://api.github.com/repos/uhumph/docker-mailstack/commits/8ff001a4315046f5578f9ad30493d6a5ccafe099"}]},"public":true,"created_at":"2015-01-01T01:04:20Z"}
{"id":"2489397750","type":"PushEvent","actor":{"id":83665,"login":"petrfaitl","gravatar_id":"","url":"https://api.github.com/users/petrfaitl","avatar_url":"https://avatars.githubusercontent.com/u/83665?"},"repo":{"id":28532783,"name":"petrfaitl/Activity_Exporter","url":"https://api.github.com/repos/petrfaitl/Activity_Exporter"},"payload":{"push_id":536753073,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"2416d43f35ec05a75b07399cc79967bdf57dbcca","before":"27048cac241b72ed223a0809f4bcb440c2d56f0e","commits":[{"sha":"2416d43f35ec05a75b07399cc79967bdf57dbcca","author":{"email":"23f6690d1a592ecb333159d73d3c2545c06271d5@gmail.com","name":"Petr Faitl"},"message":"Fixes to Garmin data format to suppport hr and cadence.\nFixes to UI to support alternative file output\nFixes to null value output at the start activity","distinct":true,"url":"https://api.github.com/repos/petrfaitl/Activity_Exporter/commits/2416d43f35ec05a75b07399cc79967bdf57dbcca"}]},"public":true,"created_at":"2015-01-01T01:04:20Z"}
{"id":"2489397751","type":"PushEvent","actor":{"id":3694248,"login":"tevenfeng","gravatar_id":"","url":"https://api.github.com/users/tevenfeng","avatar_url":"https://avatars.githubusercontent.com/u/3694248?"},"repo":{"id":28070401,"name":"tevenfeng/ppt2pdf.net","url":"https://api.github.com/repos/tevenfeng/ppt2pdf.net"},"payload":{"push_id":536753074,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"87f1e4d775f88ca111b178d499f2ab83b9e5f7cd","before":"ac8fb58d01ba8f8e0b8d7047761ddc62b42bd1ff","commits":[{"sha":"87f1e4d775f88ca111b178d499f2ab83b9e5f7cd","author":{"email":"6a1cb8b3a19ff60a6f85a39cf0fac4ed28b3ccc7@outlook.com","name":"Teven Feng"},"message":"add LGPL license","distinct":true,"url":"https://api.github.com/repos/tevenfeng/ppt2pdf.net/commits/87f1e4d775f88ca111b178d499f2ab83b9e5f7cd"}]},"public":true,"created_at":"2015-01-01T01:04:20Z"}
{"id":"2489397755","type":"CreateEvent","actor":{"id":1308363,"login":"paymonp","gravatar_id":"","url":"https://api.github.com/users/paymonp","avatar_url":"https://avatars.githubusercontent.com/u/1308363?"},"repo":{"id":28678242,"name":"paymonp/forecast_wrapper","url":"https://api.github.com/repos/paymonp/forecast_wrapper"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"A wrapper to simplify Forecast API data, and add some extra functionality (Ex. determining current night/day status for a location).","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:04:21Z"}
{"id":"2489397757","type":"GollumEvent","actor":{"id":7797609,"login":"ivanwfr","gravatar_id":"","url":"https://api.github.com/users/ivanwfr","avatar_url":"https://avatars.githubusercontent.com/u/7797609?"},"repo":{"id":808316,"name":"cswetenham/tabspace2.1","url":"https://api.github.com/repos/cswetenham/tabspace2.1"},"payload":{"pages":[{"page_name":"Mapping Layout","title":"Mapping Layout","summary":null,"action":"edited","sha":"5c14947b1fd1e254da5541ed0a7981bcc265cfe8","html_url":"https://github.com/cswetenham/tabspace2.1/wiki/Mapping-Layout"}]},"public":true,"created_at":"2015-01-01T01:04:21Z"}
{"id":"2489397758","type":"PushEvent","actor":{"id":3720783,"login":"designerwebhosting","gravatar_id":"","url":"https://api.github.com/users/designerwebhosting","avatar_url":"https://avatars.githubusercontent.com/u/3720783?"},"repo":{"id":20527117,"name":"designerwebhosting/christopherbyrne.github.io","url":"https://api.github.com/repos/designerwebhosting/christopherbyrne.github.io"},"payload":{"push_id":536753077,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"19f1368a9acc50e9b1cc2b936c165c9704040889","before":"b8aa926ae3fee18580b31846a3b3dfcea5ad032f","commits":[{"sha":"19f1368a9acc50e9b1cc2b936c165c9704040889","author":{"email":"4bb0acc6ff8c0b6c31e50417877e6e3b3f1c65f0@googlemail.com","name":"Peter Noblee"},"message":"update 'date'","distinct":true,"url":"https://api.github.com/repos/designerwebhosting/christopherbyrne.github.io/commits/19f1368a9acc50e9b1cc2b936c165c9704040889"}]},"public":true,"created_at":"2015-01-01T01:04:22Z"}
{"id":"2489397763","type":"CreateEvent","actor":{"id":2784341,"login":"RyanMurphy86","gravatar_id":"","url":"https://api.github.com/users/RyanMurphy86","avatar_url":"https://avatars.githubusercontent.com/u/2784341?"},"repo":{"id":28678257,"name":"RyanMurphy86/2skewed","url":"https://api.github.com/repos/RyanMurphy86/2skewed"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:04:22Z"}
{"id":"2489397764","type":"ForkEvent","actor":{"id":4997404,"login":"chenxinyong","gravatar_id":"","url":"https://api.github.com/users/chenxinyong","avatar_url":"https://avatars.githubusercontent.com/u/4997404?"},"repo":{"id":22034912,"name":"POPWorldMedia/POPForums","url":"https://api.github.com/repos/POPWorldMedia/POPForums"},"payload":{"forkee":{"id":28678258,"name":"POPForums","full_name":"chenxinyong/POPForums","owner":{"login":"chenxinyong","id":4997404,"avatar_url":"https://avatars.githubusercontent.com/u/4997404?v=3","gravatar_id":"","url":"https://api.github.com/users/chenxinyong","html_url":"https://github.com/chenxinyong","followers_url":"https://api.github.com/users/chenxinyong/followers","following_url":"https://api.github.com/users/chenxinyong/following{/other_user}","gists_url":"https://api.github.com/users/chenxinyong/gists{/gist_id}","starred_url":"https://api.github.com/users/chenxinyong/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/chenxinyong/subscriptions","organizations_url":"https://api.github.com/users/chenxinyong/orgs","repos_url":"https://api.github.com/users/chenxinyong/repos","events_url":"https://api.github.com/users/chenxinyong/events{/privacy}","received_events_url":"https://api.github.com/users/chenxinyong/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/chenxinyong/POPForums","description":"A forum application running on ASP.NET MVC, available in six 
languages.","fork":true,"url":"https://api.github.com/repos/chenxinyong/POPForums","forks_url":"https://api.github.com/repos/chenxinyong/POPForums/forks","keys_url":"https://api.github.com/repos/chenxinyong/POPForums/keys{/key_id}","collaborators_url":"https://api.github.com/repos/chenxinyong/POPForums/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/chenxinyong/POPForums/teams","hooks_url":"https://api.github.com/repos/chenxinyong/POPForums/hooks","issue_events_url":"https://api.github.com/repos/chenxinyong/POPForums/issues/events{/number}","events_url":"https://api.github.com/repos/chenxinyong/POPForums/events","assignees_url":"https://api.github.com/repos/chenxinyong/POPForums/assignees{/user}","branches_url":"https://api.github.com/repos/chenxinyong/POPForums/branches{/branch}","tags_url":"https://api.github.com/repos/chenxinyong/POPForums/tags","blobs_url":"https://api.github.com/repos/chenxinyong/POPForums/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/chenxinyong/POPForums/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/chenxinyong/POPForums/git/refs{/sha}","trees_url":"https://api.github.com/repos/chenxinyong/POPForums/git/trees{/sha}","statuses_url":"https://api.github.com/repos/chenxinyong/POPForums/statuses/{sha}","languages_url":"https://api.github.com/repos/chenxinyong/POPForums/languages","stargazers_url":"https://api.github.com/repos/chenxinyong/POPForums/stargazers","contributors_url":"https://api.github.com/repos/chenxinyong/POPForums/contributors","subscribers_url":"https://api.github.com/repos/chenxinyong/POPForums/subscribers","subscription_url":"https://api.github.com/repos/chenxinyong/POPForums/subscription","commits_url":"https://api.github.com/repos/chenxinyong/POPForums/commits{/sha}","git_commits_url":"https://api.github.com/repos/chenxinyong/POPForums/git/commits{/sha}","comments_url":"https://api.github.com/repos/chenxinyong/POPForums/comments{/number}","issue_comment_url":"https://api.gi
thub.com/repos/chenxinyong/POPForums/issues/comments/{number}","contents_url":"https://api.github.com/repos/chenxinyong/POPForums/contents/{+path}","compare_url":"https://api.github.com/repos/chenxinyong/POPForums/compare/{base}...{head}","merges_url":"https://api.github.com/repos/chenxinyong/POPForums/merges","archive_url":"https://api.github.com/repos/chenxinyong/POPForums/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/chenxinyong/POPForums/downloads","issues_url":"https://api.github.com/repos/chenxinyong/POPForums/issues{/number}","pulls_url":"https://api.github.com/repos/chenxinyong/POPForums/pulls{/number}","milestones_url":"https://api.github.com/repos/chenxinyong/POPForums/milestones{/number}","notifications_url":"https://api.github.com/repos/chenxinyong/POPForums/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/chenxinyong/POPForums/labels{/name}","releases_url":"https://api.github.com/repos/chenxinyong/POPForums/releases{/id}","created_at":"2015-01-01T01:04:22Z","updated_at":"2014-12-20T03:14:29Z","pushed_at":"2014-12-10T03:33:27Z","git_url":"git://github.com/chenxinyong/POPForums.git","ssh_url":"git@github.com:chenxinyong/POPForums.git","clone_url":"https://github.com/chenxinyong/POPForums.git","svn_url":"https://github.com/chenxinyong/POPForums","homepage":"http://popforums.com/","size":24896,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:04:22Z","org":{"id":8217691,"login":"POPWorldMedia","gravatar_id":"","url":"https://api.github.com/orgs/POPWorldMedia","avatar_url":"https://avatars.githubusercontent.com/u/8217691?"}}
{"id":"2489397766","type":"IssueCommentEvent","actor":{"id":8508800,"login":"cmp-202","gravatar_id":"","url":"https://api.github.com/users/cmp-202","avatar_url":"https://avatars.githubusercontent.com/u/8508800?"},"repo":{"id":23310272,"name":"cmp-202/ssh2shell","url":"https://api.github.com/repos/cmp-202/ssh2shell"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/cmp-202/ssh2shell/issues/10","labels_url":"https://api.github.com/repos/cmp-202/ssh2shell/issues/10/labels{/name}","comments_url":"https://api.github.com/repos/cmp-202/ssh2shell/issues/10/comments","events_url":"https://api.github.com/repos/cmp-202/ssh2shell/issues/10/events","html_url":"https://github.com/cmp-202/ssh2shell/issues/10","id":53071635,"number":10,"title":"Timeout error (part 2)","user":{"login":"macirex","id":1192393,"avatar_url":"https://avatars.githubusercontent.com/u/1192393?v=3","gravatar_id":"","url":"https://api.github.com/users/macirex","html_url":"https://github.com/macirex","followers_url":"https://api.github.com/users/macirex/followers","following_url":"https://api.github.com/users/macirex/following{/other_user}","gists_url":"https://api.github.com/users/macirex/gists{/gist_id}","starred_url":"https://api.github.com/users/macirex/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/macirex/subscriptions","organizations_url":"https://api.github.com/users/macirex/orgs","repos_url":"https://api.github.com/users/macirex/repos","events_url":"https://api.github.com/users/macirex/events{/privacy}","received_events_url":"https://api.github.com/users/macirex/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":8,"created_at":"2014-12-29T21:04:44Z","updated_at":"2015-01-01T01:04:23Z","closed_at":null,"body":"Hello cmp,\r\n\r\nI´m sorry to bother you again but I´ve encountered the another time out issue.\r\n\r\nLet me provide some context first:\r\n\r\nA group of 
servers I administer have some restricted policies:\r\n\r\n- Root and application domain users are inaccessible via ssh.\r\n- None of the application users have password.\r\n- There´s only one user available for ssh connection, it is used for everything and it has limited permissions, for references this will be called \"simpleuser\". \r\n- Only way to administer a server is to connect via ssh to the \"simpleuser\" and then do a su to root. \r\n\r\nBasically the flow goes like this: \r\nLogin -> su - root -> su - domainapp ->  [Here I do what I need to do]   \r\n\r\nThe list of commands I´m trying is:\r\n  commands:           [\r\n    \"su - root\", \r\n    \"echo hello\" \r\n    \"su - webapp\",\r\n    \"ls -lthr\",\r\n  ]\r\n\r\nI managed to log into root using the event on commandProcessing and writing the password directly into the stream:\r\n\r\n<code>\r\nSSH.on ('commandProcessing', function onCommandProcessing( command, response, sshObj, stream ) {   \r\n            if (command.match(/root/)&& response.indexOf(\"Password:\") != -1) {\r\n\t           if (!admin)\r\n\t\t   {\r\n\t\t\tstream.write('password\\n');\r\n\t\t\tadmin = true;\r\n\t\t    }\r\n              });\r\n</code>\r\n\r\nAfter that, I try to do another su, this time to the domain I need to check but it fails with: \r\nTimeout error: 10.164.12.159: Command timed out after 5 seconds\r\n\r\nHere´s the output my app generates:\r\n\r\nConnected\r\nRunning commands Now\r\n10.164.12.159 verbose:Your password will expire in 8 days.\r\n[user01@machine043]>\r\n10.164.12.159 verbose:su - root\r\nPassword:\r\n[root@machine043]>\r\n10.164.12.159 verbose:echo hello\r\nhello\r\n[root@machine043]>\r\nTimeout error: 10.164.12.159: Command timed out after 5 seconds\r\nCompleted\r\n\r\nAny commands I execute before trying the second su, it works perfectly but after the second su I only get Timeout error.\r\n\r\nThis is the full session responses:\r\nConnected to 10.164.12.159\r\nsu - 
root\r\nPassword:\r\n[root@machine043]> echo hello\r\nhello\r\n[root@machine043]> su - webapp\r\nmachine043@webapp:~>\r\n\r\nAny insights you could share with me?\r\nCould this be happening because the name of the prompt is different from the first two?  Where simpleuser and root has username@machinename and webapp has machinename@username?\r\n\r\nBtw, merry christmas! and have a happy new year!"},"comment":{"url":"https://api.github.com/repos/cmp-202/ssh2shell/issues/comments/68477303","html_url":"https://github.com/cmp-202/ssh2shell/issues/10#issuecomment-68477303","issue_url":"https://api.github.com/repos/cmp-202/ssh2shell/issues/10","id":68477303,"user":{"login":"cmp-202","id":8508800,"avatar_url":"https://avatars.githubusercontent.com/u/8508800?v=3","gravatar_id":"","url":"https://api.github.com/users/cmp-202","html_url":"https://github.com/cmp-202","followers_url":"https://api.github.com/users/cmp-202/followers","following_url":"https://api.github.com/users/cmp-202/following{/other_user}","gists_url":"https://api.github.com/users/cmp-202/gists{/gist_id}","starred_url":"https://api.github.com/users/cmp-202/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/cmp-202/subscriptions","organizations_url":"https://api.github.com/users/cmp-202/orgs","repos_url":"https://api.github.com/users/cmp-202/repos","events_url":"https://api.github.com/users/cmp-202/events{/privacy}","received_events_url":"https://api.github.com/users/cmp-202/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:04:23Z","updated_at":"2015-01-01T01:04:23Z","body":"could you show me the debug output."}},"public":true,"created_at":"2015-01-01T01:04:23Z"}
{"id":"2489397767","type":"GollumEvent","actor":{"id":720678,"login":"kongr45gpen","gravatar_id":"","url":"https://api.github.com/users/kongr45gpen","avatar_url":"https://avatars.githubusercontent.com/u/720678?"},"repo":{"id":11615971,"name":"allejo/bzion","url":"https://api.github.com/repos/allejo/bzion"},"payload":{"pages":[{"page_name":"Installation","title":"Installation","summary":null,"action":"edited","sha":"2abf7f83955235fa9a1bf76f57b9fdad0be16772","html_url":"https://github.com/allejo/bzion/wiki/Installation"}]},"public":true,"created_at":"2015-01-01T01:04:23Z"}
{"id":"2489397775","type":"PushEvent","actor":{"id":4362193,"login":"derickc","gravatar_id":"","url":"https://api.github.com/users/derickc","avatar_url":"https://avatars.githubusercontent.com/u/4362193?"},"repo":{"id":27286576,"name":"ADML1/adml1.github.io","url":"https://api.github.com/repos/ADML1/adml1.github.io"},"payload":{"push_id":536753081,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b3ebd99a730a450c2adc2feb0654647710abf78e","before":"378bfcffc91f8fa212d96dd2eba5abc21e3fc4c0","commits":[{"sha":"b3ebd99a730a450c2adc2feb0654647710abf78e","author":{"email":"45a58c873e280dbee110e79514ff8a5e02d3e2be@gmail.com","name":"Derick"},"message":"Update draft and change padding to make more mobile friendly.","distinct":true,"url":"https://api.github.com/repos/ADML1/adml1.github.io/commits/b3ebd99a730a450c2adc2feb0654647710abf78e"}]},"public":true,"created_at":"2015-01-01T01:04:25Z","org":{"id":9938744,"login":"ADML1","gravatar_id":"","url":"https://api.github.com/orgs/ADML1","avatar_url":"https://avatars.githubusercontent.com/u/9938744?"}}
{"id":"2489397776","type":"PushEvent","actor":{"id":5567815,"login":"alexlovesprogramming","gravatar_id":"","url":"https://api.github.com/users/alexlovesprogramming","avatar_url":"https://avatars.githubusercontent.com/u/5567815?"},"repo":{"id":28524892,"name":"alexlovesprogramming/longstreetliving","url":"https://api.github.com/repos/alexlovesprogramming/longstreetliving"},"payload":{"push_id":536753082,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"edebc67bf340a3c896cc6204a94332e03f67b52f","before":"81b81aba6f76f0b9816556e3267bba820f867c5f","commits":[{"sha":"cd4288723ab21d37c17079153f566ab827a0bc5d","author":{"email":"bf67c384ca4ec67ca70eb215259e583bfbc24f58@gmail.com","name":"Alex Johnson"},"message":"signature","distinct":true,"url":"https://api.github.com/repos/alexlovesprogramming/longstreetliving/commits/cd4288723ab21d37c17079153f566ab827a0bc5d"},{"sha":"edebc67bf340a3c896cc6204a94332e03f67b52f","author":{"email":"bf67c384ca4ec67ca70eb215259e583bfbc24f58@gmail.com","name":"Alex Johnson"},"message":"Merge branch 'master' of https://server.longstreetliving.com/Bonobo.Git.Server/longstreetliving","distinct":true,"url":"https://api.github.com/repos/alexlovesprogramming/longstreetliving/commits/edebc67bf340a3c896cc6204a94332e03f67b52f"}]},"public":true,"created_at":"2015-01-01T01:04:25Z"}
{"id":"2489397779","type":"IssueCommentEvent","actor":{"id":1203825,"login":"huonw","gravatar_id":"","url":"https://api.github.com/users/huonw","avatar_url":"https://avatars.githubusercontent.com/u/1203825?"},"repo":{"id":724712,"name":"rust-lang/rust","url":"https://api.github.com/repos/rust-lang/rust"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/rust-lang/rust/issues/20379","labels_url":"https://api.github.com/repos/rust-lang/rust/issues/20379/labels{/name}","comments_url":"https://api.github.com/repos/rust-lang/rust/issues/20379/comments","events_url":"https://api.github.com/repos/rust-lang/rust/issues/20379/events","html_url":"https://github.com/rust-lang/rust/issues/20379","id":53207500,"number":20379,"title":"recursion dependent on global offset table","user":{"login":"ragingSloth","id":3530278,"avatar_url":"https://avatars.githubusercontent.com/u/3530278?v=3","gravatar_id":"","url":"https://api.github.com/users/ragingSloth","html_url":"https://github.com/ragingSloth","followers_url":"https://api.github.com/users/ragingSloth/followers","following_url":"https://api.github.com/users/ragingSloth/following{/other_user}","gists_url":"https://api.github.com/users/ragingSloth/gists{/gist_id}","starred_url":"https://api.github.com/users/ragingSloth/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ragingSloth/subscriptions","organizations_url":"https://api.github.com/users/ragingSloth/orgs","repos_url":"https://api.github.com/users/ragingSloth/repos","events_url":"https://api.github.com/users/ragingSloth/events{/privacy}","received_events_url":"https://api.github.com/users/ragingSloth/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2014-12-31T23:03:06Z","updated_at":"2015-01-01T01:04:25Z","closed_at":null,"body":"While trying to use rust freestanding I found that any attempt to use recursion resulted in an 
error while linking. \r\n\r\n    main.o: In function `put':\r\n    main.0.rs:(.text.put+0xc): undefined reference to `_GLOBAL_OFFSET_TABLE_'\r\n    main.o: In function `r_write':\r\n    main.0.rs:(.text.r_write+0xf): undefined reference to `_GLOBAL_OFFSET_TABLE_'\r\n\r\nI'm not sure if this is an issue, but I can't find any way to use recursion without a global offset table. I'm compiling with `#[no_std]` and `-O --target i686-unknown-linux-gnu --crate-type lib --emit obj`, and I recieve errors when trying to link separately. "},"comment":{"url":"https://api.github.com/repos/rust-lang/rust/issues/comments/68477305","html_url":"https://github.com/rust-lang/rust/issues/20379#issuecomment-68477305","issue_url":"https://api.github.com/repos/rust-lang/rust/issues/20379","id":68477305,"user":{"login":"huonw","id":1203825,"avatar_url":"https://avatars.githubusercontent.com/u/1203825?v=3","gravatar_id":"","url":"https://api.github.com/users/huonw","html_url":"https://github.com/huonw","followers_url":"https://api.github.com/users/huonw/followers","following_url":"https://api.github.com/users/huonw/following{/other_user}","gists_url":"https://api.github.com/users/huonw/gists{/gist_id}","starred_url":"https://api.github.com/users/huonw/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/huonw/subscriptions","organizations_url":"https://api.github.com/users/huonw/orgs","repos_url":"https://api.github.com/users/huonw/repos","events_url":"https://api.github.com/users/huonw/events{/privacy}","received_events_url":"https://api.github.com/users/huonw/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:04:25Z","updated_at":"2015-01-01T01:04:25Z","body":"Do you happen to have a code example that demonstrates this?"}},"public":true,"created_at":"2015-01-01T01:04:26Z","org":{"id":5430905,"login":"rust-lang","gravatar_id":"","url":"https://api.github.com/orgs/rust-lang","avatar_url":"https://avatars.githubusercontent.com/u/5430905?"}}
{"id":"2489397781","type":"PullRequestEvent","actor":{"id":706947,"login":"d3athrow","gravatar_id":"","url":"https://api.github.com/users/d3athrow","avatar_url":"https://avatars.githubusercontent.com/u/706947?"},"repo":{"id":10441188,"name":"d3athrow/vgstation13","url":"https://api.github.com/repos/d3athrow/vgstation13"},"payload":{"action":"closed","number":2417,"pull_request":{"url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2417","id":26723211,"html_url":"https://github.com/d3athrow/vgstation13/pull/2417","diff_url":"https://github.com/d3athrow/vgstation13/pull/2417.diff","patch_url":"https://github.com/d3athrow/vgstation13/pull/2417.patch","issue_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/2417","number":2417,"state":"closed","locked":false,"title":"A few defficiency fixes","user":{"login":"Duny-","id":5224390,"avatar_url":"https://avatars.githubusercontent.com/u/5224390?v=3","gravatar_id":"","url":"https://api.github.com/users/Duny-","html_url":"https://github.com/Duny-","followers_url":"https://api.github.com/users/Duny-/followers","following_url":"https://api.github.com/users/Duny-/following{/other_user}","gists_url":"https://api.github.com/users/Duny-/gists{/gist_id}","starred_url":"https://api.github.com/users/Duny-/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Duny-/subscriptions","organizations_url":"https://api.github.com/users/Duny-/orgs","repos_url":"https://api.github.com/users/Duny-/repos","events_url":"https://api.github.com/users/Duny-/events{/privacy}","received_events_url":"https://api.github.com/users/Duny-/received_events","type":"User","site_admin":false},"body":"- Added all missing holodeck settings.\r\n- Fixed missing pipe in supermatter room.\r\n- Tweaked toxins launcher to hopefully work correctly in higher ZAS 
settings.","created_at":"2014-12-31T12:38:43Z","updated_at":"2015-01-01T01:04:26Z","closed_at":"2015-01-01T01:04:26Z","merged_at":"2015-01-01T01:04:26Z","merge_commit_sha":"0aba215d4d761c270f9e576576832eea9cb48658","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2417/commits","review_comments_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2417/comments","review_comment_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/comments/{number}","comments_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/2417/comments","statuses_url":"https://api.github.com/repos/d3athrow/vgstation13/statuses/34f7fa7b80f675ce4e56f4bc148338104b8155ee","head":{"label":"Duny-:Bleeding-Edge","ref":"Bleeding-Edge","sha":"34f7fa7b80f675ce4e56f4bc148338104b8155ee","user":{"login":"Duny-","id":5224390,"avatar_url":"https://avatars.githubusercontent.com/u/5224390?v=3","gravatar_id":"","url":"https://api.github.com/users/Duny-","html_url":"https://github.com/Duny-","followers_url":"https://api.github.com/users/Duny-/followers","following_url":"https://api.github.com/users/Duny-/following{/other_user}","gists_url":"https://api.github.com/users/Duny-/gists{/gist_id}","starred_url":"https://api.github.com/users/Duny-/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Duny-/subscriptions","organizations_url":"https://api.github.com/users/Duny-/orgs","repos_url":"https://api.github.com/users/Duny-/repos","events_url":"https://api.github.com/users/Duny-/events{/privacy}","received_events_url":"https://api.github.com/users/Duny-/received_events","type":"User","site_admin":false},"repo":{"id":20945462,"name":"vgstation13","full_name":"Duny-/vgstation13","owner":{"login":"Duny-","id":5224390,"avatar_url":"https://avatars.githubusercontent.com/u/5224390?v=3","gravatar_id":"","url":"https://api.github.com/users/Duny-","html_url":"https://github.com/Duny-","followers_url":"https://api.github.com/
users/Duny-/followers","following_url":"https://api.github.com/users/Duny-/following{/other_user}","gists_url":"https://api.github.com/users/Duny-/gists{/gist_id}","starred_url":"https://api.github.com/users/Duny-/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Duny-/subscriptions","organizations_url":"https://api.github.com/users/Duny-/orgs","repos_url":"https://api.github.com/users/Duny-/repos","events_url":"https://api.github.com/users/Duny-/events{/privacy}","received_events_url":"https://api.github.com/users/Duny-/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/Duny-/vgstation13","description":"This is the vgstation's fork of baystation12's code.","fork":true,"url":"https://api.github.com/repos/Duny-/vgstation13","forks_url":"https://api.github.com/repos/Duny-/vgstation13/forks","keys_url":"https://api.github.com/repos/Duny-/vgstation13/keys{/key_id}","collaborators_url":"https://api.github.com/repos/Duny-/vgstation13/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/Duny-/vgstation13/teams","hooks_url":"https://api.github.com/repos/Duny-/vgstation13/hooks","issue_events_url":"https://api.github.com/repos/Duny-/vgstation13/issues/events{/number}","events_url":"https://api.github.com/repos/Duny-/vgstation13/events","assignees_url":"https://api.github.com/repos/Duny-/vgstation13/assignees{/user}","branches_url":"https://api.github.com/repos/Duny-/vgstation13/branches{/branch}","tags_url":"https://api.github.com/repos/Duny-/vgstation13/tags","blobs_url":"https://api.github.com/repos/Duny-/vgstation13/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/Duny-/vgstation13/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/Duny-/vgstation13/git/refs{/sha}","trees_url":"https://api.github.com/repos/Duny-/vgstation13/git/trees{/sha}","statuses_url":"https://api.github.com/repos/Duny-/vgstation13/statuses/{sha}","languages_url":"https://api.github.com/rep
os/Duny-/vgstation13/languages","stargazers_url":"https://api.github.com/repos/Duny-/vgstation13/stargazers","contributors_url":"https://api.github.com/repos/Duny-/vgstation13/contributors","subscribers_url":"https://api.github.com/repos/Duny-/vgstation13/subscribers","subscription_url":"https://api.github.com/repos/Duny-/vgstation13/subscription","commits_url":"https://api.github.com/repos/Duny-/vgstation13/commits{/sha}","git_commits_url":"https://api.github.com/repos/Duny-/vgstation13/git/commits{/sha}","comments_url":"https://api.github.com/repos/Duny-/vgstation13/comments{/number}","issue_comment_url":"https://api.github.com/repos/Duny-/vgstation13/issues/comments/{number}","contents_url":"https://api.github.com/repos/Duny-/vgstation13/contents/{+path}","compare_url":"https://api.github.com/repos/Duny-/vgstation13/compare/{base}...{head}","merges_url":"https://api.github.com/repos/Duny-/vgstation13/merges","archive_url":"https://api.github.com/repos/Duny-/vgstation13/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/Duny-/vgstation13/downloads","issues_url":"https://api.github.com/repos/Duny-/vgstation13/issues{/number}","pulls_url":"https://api.github.com/repos/Duny-/vgstation13/pulls{/number}","milestones_url":"https://api.github.com/repos/Duny-/vgstation13/milestones{/number}","notifications_url":"https://api.github.com/repos/Duny-/vgstation13/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/Duny-/vgstation13/labels{/name}","releases_url":"https://api.github.com/repos/Duny-/vgstation13/releases{/id}","created_at":"2014-06-18T01:41:53Z","updated_at":"2014-12-31T16:30:54Z","pushed_at":"2014-12-31T16:30:54Z","git_url":"git://github.com/Duny-/vgstation13.git","ssh_url":"git@github.com:Duny-/vgstation13.git","clone_url":"https://github.com/Duny-/vgstation13.git","svn_url":"https://github.com/Duny-/vgstation13","homepage":"","size":712478,"stargazers_count":0,"watchers_count":0,"language":"DM","has_issues":tru
e,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":18,"forks":0,"open_issues":18,"watchers":0,"default_branch":"Bleeding-Edge"}},"base":{"label":"d3athrow:Bleeding-Edge","ref":"Bleeding-Edge","sha":"5e8624143efbf348ed553421b76293ef84acac57","user":{"login":"d3athrow","id":706947,"avatar_url":"https://avatars.githubusercontent.com/u/706947?v=3","gravatar_id":"","url":"https://api.github.com/users/d3athrow","html_url":"https://github.com/d3athrow","followers_url":"https://api.github.com/users/d3athrow/followers","following_url":"https://api.github.com/users/d3athrow/following{/other_user}","gists_url":"https://api.github.com/users/d3athrow/gists{/gist_id}","starred_url":"https://api.github.com/users/d3athrow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/d3athrow/subscriptions","organizations_url":"https://api.github.com/users/d3athrow/orgs","repos_url":"https://api.github.com/users/d3athrow/repos","events_url":"https://api.github.com/users/d3athrow/events{/privacy}","received_events_url":"https://api.github.com/users/d3athrow/received_events","type":"User","site_admin":false},"repo":{"id":10441188,"name":"vgstation13","full_name":"d3athrow/vgstation13","owner":{"login":"d3athrow","id":706947,"avatar_url":"https://avatars.githubusercontent.com/u/706947?v=3","gravatar_id":"","url":"https://api.github.com/users/d3athrow","html_url":"https://github.com/d3athrow","followers_url":"https://api.github.com/users/d3athrow/followers","following_url":"https://api.github.com/users/d3athrow/following{/other_user}","gists_url":"https://api.github.com/users/d3athrow/gists{/gist_id}","starred_url":"https://api.github.com/users/d3athrow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/d3athrow/subscriptions","organizations_url":"https://api.github.com/users/d3athrow/orgs","repos_url":"https://api.github.com/users/d3athrow/repos","events_url":"https://api.github.com/users/d3
athrow/events{/privacy}","received_events_url":"https://api.github.com/users/d3athrow/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/d3athrow/vgstation13","description":"This is the vgstation's fork of baystation12's code.","fork":true,"url":"https://api.github.com/repos/d3athrow/vgstation13","forks_url":"https://api.github.com/repos/d3athrow/vgstation13/forks","keys_url":"https://api.github.com/repos/d3athrow/vgstation13/keys{/key_id}","collaborators_url":"https://api.github.com/repos/d3athrow/vgstation13/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/d3athrow/vgstation13/teams","hooks_url":"https://api.github.com/repos/d3athrow/vgstation13/hooks","issue_events_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/events{/number}","events_url":"https://api.github.com/repos/d3athrow/vgstation13/events","assignees_url":"https://api.github.com/repos/d3athrow/vgstation13/assignees{/user}","branches_url":"https://api.github.com/repos/d3athrow/vgstation13/branches{/branch}","tags_url":"https://api.github.com/repos/d3athrow/vgstation13/tags","blobs_url":"https://api.github.com/repos/d3athrow/vgstation13/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/d3athrow/vgstation13/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/d3athrow/vgstation13/git/refs{/sha}","trees_url":"https://api.github.com/repos/d3athrow/vgstation13/git/trees{/sha}","statuses_url":"https://api.github.com/repos/d3athrow/vgstation13/statuses/{sha}","languages_url":"https://api.github.com/repos/d3athrow/vgstation13/languages","stargazers_url":"https://api.github.com/repos/d3athrow/vgstation13/stargazers","contributors_url":"https://api.github.com/repos/d3athrow/vgstation13/contributors","subscribers_url":"https://api.github.com/repos/d3athrow/vgstation13/subscribers","subscription_url":"https://api.github.com/repos/d3athrow/vgstation13/subscription","commits_url":"https://api.github.com/repos/d3ath
row/vgstation13/commits{/sha}","git_commits_url":"https://api.github.com/repos/d3athrow/vgstation13/git/commits{/sha}","comments_url":"https://api.github.com/repos/d3athrow/vgstation13/comments{/number}","issue_comment_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/comments/{number}","contents_url":"https://api.github.com/repos/d3athrow/vgstation13/contents/{+path}","compare_url":"https://api.github.com/repos/d3athrow/vgstation13/compare/{base}...{head}","merges_url":"https://api.github.com/repos/d3athrow/vgstation13/merges","archive_url":"https://api.github.com/repos/d3athrow/vgstation13/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/d3athrow/vgstation13/downloads","issues_url":"https://api.github.com/repos/d3athrow/vgstation13/issues{/number}","pulls_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls{/number}","milestones_url":"https://api.github.com/repos/d3athrow/vgstation13/milestones{/number}","notifications_url":"https://api.github.com/repos/d3athrow/vgstation13/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/d3athrow/vgstation13/labels{/name}","releases_url":"https://api.github.com/repos/d3athrow/vgstation13/releases{/id}","created_at":"2013-06-02T19:39:54Z","updated_at":"2014-12-31T20:06:46Z","pushed_at":"2015-01-01T01:04:26Z","git_url":"git://github.com/d3athrow/vgstation13.git","ssh_url":"git@github.com:d3athrow/vgstation13.git","clone_url":"https://github.com/d3athrow/vgstation13.git","svn_url":"https://github.com/d3athrow/vgstation13","homepage":"","size":937605,"stargazers_count":45,"watchers_count":45,"language":"DM","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":135,"mirror_url":null,"open_issues_count":259,"forks":135,"open_issues":259,"watchers":45,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2417"},"html":{"href":"https://github.com/d3athrow/vgstation13/pull/2
417"},"issue":{"href":"https://api.github.com/repos/d3athrow/vgstation13/issues/2417"},"comments":{"href":"https://api.github.com/repos/d3athrow/vgstation13/issues/2417/comments"},"review_comments":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2417/comments"},"review_comment":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2417/commits"},"statuses":{"href":"https://api.github.com/repos/d3athrow/vgstation13/statuses/34f7fa7b80f675ce4e56f4bc148338104b8155ee"}},"merged":true,"mergeable":null,"mergeable_state":"unknown","merged_by":{"login":"d3athrow","id":706947,"avatar_url":"https://avatars.githubusercontent.com/u/706947?v=3","gravatar_id":"","url":"https://api.github.com/users/d3athrow","html_url":"https://github.com/d3athrow","followers_url":"https://api.github.com/users/d3athrow/followers","following_url":"https://api.github.com/users/d3athrow/following{/other_user}","gists_url":"https://api.github.com/users/d3athrow/gists{/gist_id}","starred_url":"https://api.github.com/users/d3athrow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/d3athrow/subscriptions","organizations_url":"https://api.github.com/users/d3athrow/orgs","repos_url":"https://api.github.com/users/d3athrow/repos","events_url":"https://api.github.com/users/d3athrow/events{/privacy}","received_events_url":"https://api.github.com/users/d3athrow/received_events","type":"User","site_admin":false},"comments":0,"review_comments":0,"commits":3,"additions":115,"deletions":42,"changed_files":2}},"public":true,"created_at":"2015-01-01T01:04:26Z"}
{"id":"2489397782","type":"PushEvent","actor":{"id":568018,"login":"jon-jacky","gravatar_id":"","url":"https://api.github.com/users/jon-jacky","avatar_url":"https://avatars.githubusercontent.com/u/568018?"},"repo":{"id":3722889,"name":"jon-jacky/home","url":"https://api.github.com/repos/jon-jacky/home"},"payload":{"push_id":536753085,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"ca7c98c62a6cf4709b98f5d5bb453c1b2dd120bc","before":"11b7788a7c84834415f6f53b531b9c20ddf887b8","commits":[{"sha":"ca7c98c62a6cf4709b98f5d5bb453c1b2dd120bc","author":{"email":"44f878afe53efc66b76772bd845eb65944ed8232@u.washington.edu","name":"Jon Jacky"},"message":"Turing's manual for Mark II in computer architecture","distinct":true,"url":"https://api.github.com/repos/jon-jacky/home/commits/ca7c98c62a6cf4709b98f5d5bb453c1b2dd120bc"}]},"public":true,"created_at":"2015-01-01T01:04:26Z"}
{"id":"2489397787","type":"PushEvent","actor":{"id":1588951,"login":"TAGC","gravatar_id":"","url":"https://api.github.com/users/TAGC","avatar_url":"https://avatars.githubusercontent.com/u/1588951?"},"repo":{"id":28516105,"name":"TAGC/Semver","url":"https://api.github.com/repos/TAGC/Semver"},"payload":{"push_id":536753087,"size":1,"distinct_size":1,"ref":"refs/heads/develop","head":"c14bd6aeef1be553879694e2c3ba8535749f5380","before":"cbeb387cb6c3ba0f1d6b42ad32cf700f296424ba","commits":[{"sha":"c14bd6aeef1be553879694e2c3ba8535749f5380","author":{"email":"ff51050dd5988c994d7cae2035c2292721cc7625@gmail.com","name":"David"},"message":"Update README.md\n\nUpdate README to reflect changes brought about in v0.3.0","distinct":true,"url":"https://api.github.com/repos/TAGC/Semver/commits/c14bd6aeef1be553879694e2c3ba8535749f5380"}]},"public":true,"created_at":"2015-01-01T01:04:27Z"}
{"id":"2489397788","type":"PushEvent","actor":{"id":5681361,"login":"snoguchi","gravatar_id":"","url":"https://api.github.com/users/snoguchi","avatar_url":"https://avatars.githubusercontent.com/u/5681361?"},"repo":{"id":19981496,"name":"snoguchi/dotfiles","url":"https://api.github.com/repos/snoguchi/dotfiles"},"payload":{"push_id":536753088,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"3d73778740a21a43e90a97d76d0b316fd0d051a1","before":"34d21e71013bd74f2050e32eac38d65d8d19d2ab","commits":[{"sha":"3d73778740a21a43e90a97d76d0b316fd0d051a1","author":{"email":"6ae999552a0d2dca14d62e2bc8b764d377b1dd6c","name":"U-X220\\noguchi"},"message":"change key bindings","distinct":true,"url":"https://api.github.com/repos/snoguchi/dotfiles/commits/3d73778740a21a43e90a97d76d0b316fd0d051a1"}]},"public":true,"created_at":"2015-01-01T01:04:27Z"}
{"id":"2489397789","type":"PushEvent","actor":{"id":1684950,"login":"naijaping","gravatar_id":"","url":"https://api.github.com/users/naijaping","avatar_url":"https://avatars.githubusercontent.com/u/1684950?"},"repo":{"id":28650038,"name":"naijaping/awonlist","url":"https://api.github.com/repos/naijaping/awonlist"},"payload":{"push_id":536753089,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f454a5a195625a9128fddb04b192fcc457e82091","before":"e80946e9abd94a00ce15b06ad502211a518e2ffd","commits":[{"sha":"f454a5a195625a9128fddb04b192fcc457e82091","author":{"email":"8a1440b218d23a283d388025f7c9dc3555009ec5@gmail.com","name":"naijaping"},"message":"Update uk","distinct":true,"url":"https://api.github.com/repos/naijaping/awonlist/commits/f454a5a195625a9128fddb04b192fcc457e82091"}]},"public":true,"created_at":"2015-01-01T01:04:27Z"}
{"id":"2489397791","type":"IssueCommentEvent","actor":{"id":594255,"login":"Xaekai","gravatar_id":"","url":"https://api.github.com/users/Xaekai","avatar_url":"https://avatars.githubusercontent.com/u/594255?"},"repo":{"id":8231654,"name":"calzoneman/sync","url":"https://api.github.com/repos/calzoneman/sync"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/calzoneman/sync/issues/423","labels_url":"https://api.github.com/repos/calzoneman/sync/issues/423/labels{/name}","comments_url":"https://api.github.com/repos/calzoneman/sync/issues/423/comments","events_url":"https://api.github.com/repos/calzoneman/sync/issues/423/events","html_url":"https://github.com/calzoneman/sync/issues/423","id":53191677,"number":423,"title":"tab completion","user":{"login":"estillesemae","id":10359338,"avatar_url":"https://avatars.githubusercontent.com/u/10359338?v=3","gravatar_id":"","url":"https://api.github.com/users/estillesemae","html_url":"https://github.com/estillesemae","followers_url":"https://api.github.com/users/estillesemae/followers","following_url":"https://api.github.com/users/estillesemae/following{/other_user}","gists_url":"https://api.github.com/users/estillesemae/gists{/gist_id}","starred_url":"https://api.github.com/users/estillesemae/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/estillesemae/subscriptions","organizations_url":"https://api.github.com/users/estillesemae/orgs","repos_url":"https://api.github.com/users/estillesemae/repos","events_url":"https://api.github.com/users/estillesemae/events{/privacy}","received_events_url":"https://api.github.com/users/estillesemae/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":3,"created_at":"2014-12-31T16:38:03Z","updated_at":"2015-01-01T01:04:28Z","closed_at":"2014-12-31T16:55:56Z","body":"There is an issue with tab completion in the mlp anniversary room. 
Xaekai is sleeping, I thought I would inform you.\r\n\r\nMost of the time, when tab completion is used, an \"image.channel-emote\" appears. It is a blank box with nothing in it. Cannot click or anything. \r\nhttp://i.imgur.com/zZuj6hf.png\r\nhttp://i.imgur.com/Y1D8P4e.png\r\n\r\nI noticed it is only in the anni room though. I don't know if you can help, but that would be great!!\r\n\r\nEstillesemae"},"comment":{"url":"https://api.github.com/repos/calzoneman/sync/issues/comments/68477307","html_url":"https://github.com/calzoneman/sync/issues/423#issuecomment-68477307","issue_url":"https://api.github.com/repos/calzoneman/sync/issues/423","id":68477307,"user":{"login":"Xaekai","id":594255,"avatar_url":"https://avatars.githubusercontent.com/u/594255?v=3","gravatar_id":"","url":"https://api.github.com/users/Xaekai","html_url":"https://github.com/Xaekai","followers_url":"https://api.github.com/users/Xaekai/followers","following_url":"https://api.github.com/users/Xaekai/following{/other_user}","gists_url":"https://api.github.com/users/Xaekai/gists{/gist_id}","starred_url":"https://api.github.com/users/Xaekai/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Xaekai/subscriptions","organizations_url":"https://api.github.com/users/Xaekai/orgs","repos_url":"https://api.github.com/users/Xaekai/repos","events_url":"https://api.github.com/users/Xaekai/events{/privacy}","received_events_url":"https://api.github.com/users/Xaekai/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:04:28Z","updated_at":"2015-01-01T01:04:28Z","body":"@estillesemae My room features aren't calzoneman's problem or domain. Nice to see you using the dev console to figure shit out though."}},"public":true,"created_at":"2015-01-01T01:04:28Z"}
{"id":"2489397792","type":"IssueCommentEvent","actor":{"id":238354,"login":"variousred","gravatar_id":"","url":"https://api.github.com/users/variousred","avatar_url":"https://avatars.githubusercontent.com/u/238354?"},"repo":{"id":6274404,"name":"G5/g5-content-management-system","url":"https://api.github.com/repos/G5/g5-content-management-system"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/G5/g5-content-management-system/issues/551","labels_url":"https://api.github.com/repos/G5/g5-content-management-system/issues/551/labels{/name}","comments_url":"https://api.github.com/repos/G5/g5-content-management-system/issues/551/comments","events_url":"https://api.github.com/repos/G5/g5-content-management-system/issues/551/events","html_url":"https://github.com/G5/g5-content-management-system/pull/551","id":53061666,"number":551,"title":"WIP: Fix Deep Clone","user":{"login":"ceckert","id":779559,"avatar_url":"https://avatars.githubusercontent.com/u/779559?v=3","gravatar_id":"","url":"https://api.github.com/users/ceckert","html_url":"https://github.com/ceckert","followers_url":"https://api.github.com/users/ceckert/followers","following_url":"https://api.github.com/users/ceckert/following{/other_user}","gists_url":"https://api.github.com/users/ceckert/gists{/gist_id}","starred_url":"https://api.github.com/users/ceckert/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ceckert/subscriptions","organizations_url":"https://api.github.com/users/ceckert/orgs","repos_url":"https://api.github.com/users/ceckert/repos","events_url":"https://api.github.com/users/ceckert/events{/privacy}","received_events_url":"https://api.github.com/users/ceckert/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2014-12-29T18:51:49Z","updated_at":"2015-01-01T01:04:28Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/G5/g5-content-
management-system/pulls/551","html_url":"https://github.com/G5/g5-content-management-system/pull/551","diff_url":"https://github.com/G5/g5-content-management-system/pull/551.diff","patch_url":"https://github.com/G5/g5-content-management-system/pull/551.patch"},"body":"Deep clone was only cloning one level deep. This adds recursive cloning. "},"comment":{"url":"https://api.github.com/repos/G5/g5-content-management-system/issues/comments/68477308","html_url":"https://github.com/G5/g5-content-management-system/pull/551#issuecomment-68477308","issue_url":"https://api.github.com/repos/G5/g5-content-management-system/issues/551","id":68477308,"user":{"login":"variousred","id":238354,"avatar_url":"https://avatars.githubusercontent.com/u/238354?v=3","gravatar_id":"","url":"https://api.github.com/users/variousred","html_url":"https://github.com/variousred","followers_url":"https://api.github.com/users/variousred/followers","following_url":"https://api.github.com/users/variousred/following{/other_user}","gists_url":"https://api.github.com/users/variousred/gists{/gist_id}","starred_url":"https://api.github.com/users/variousred/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/variousred/subscriptions","organizations_url":"https://api.github.com/users/variousred/orgs","repos_url":"https://api.github.com/users/variousred/repos","events_url":"https://api.github.com/users/variousred/events{/privacy}","received_events_url":"https://api.github.com/users/variousred/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:04:28Z","updated_at":"2015-01-01T01:04:28Z","body":"@ceckert this one failing test remaining might atually be uncovering a real bug. It seems we are creating an extra widget in the clone process."}},"public":true,"created_at":"2015-01-01T01:04:28Z","org":{"id":2396851,"login":"G5","gravatar_id":"","url":"https://api.github.com/orgs/G5","avatar_url":"https://avatars.githubusercontent.com/u/2396851?"}}
{"id":"2489397796","type":"PushEvent","actor":{"id":3056753,"login":"Yukariko","gravatar_id":"","url":"https://api.github.com/users/Yukariko","avatar_url":"https://avatars.githubusercontent.com/u/3056753?"},"repo":{"id":21538859,"name":"Yukariko/acm","url":"https://api.github.com/repos/Yukariko/acm"},"payload":{"push_id":536753092,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"cfa04165890a46738082b2f56b58b525ba1579d5","before":"bb9f0c6c8871960d6a68bd3d5ae8817b2ec112f9","commits":[{"sha":"cfa04165890a46738082b2f56b58b525ba1579d5","author":{"email":"5644dc45614202cf4a35cbeeaf0c6d61d1144e06@naver.com","name":"Yukariko"},"message":"Accept","distinct":true,"url":"https://api.github.com/repos/Yukariko/acm/commits/cfa04165890a46738082b2f56b58b525ba1579d5"}]},"public":true,"created_at":"2015-01-01T01:04:28Z"}
{"id":"2489397797","type":"PushEvent","actor":{"id":8454656,"login":"klob","gravatar_id":"","url":"https://api.github.com/users/klob","avatar_url":"https://avatars.githubusercontent.com/u/8454656?"},"repo":{"id":27668613,"name":"diandy/diandy1.2.0","url":"https://api.github.com/repos/diandy/diandy1.2.0"},"payload":{"push_id":536753093,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d4cbddba067260c9b55d5b1b164f0fdb65a11bf1","before":"a2bc2dfcd2cdfca23b7e371302a6d56cf8f68115","commits":[{"sha":"d4cbddba067260c9b55d5b1b164f0fdb65a11bf1","author":{"email":"eae7ed76150cb5d2ded6223b270823aba8a08eb9@qq.com","name":"klob"},"message":" all changelist","distinct":true,"url":"https://api.github.com/repos/diandy/diandy1.2.0/commits/d4cbddba067260c9b55d5b1b164f0fdb65a11bf1"}]},"public":true,"created_at":"2015-01-01T01:04:28Z","org":{"id":10010251,"login":"diandy","gravatar_id":"","url":"https://api.github.com/orgs/diandy","avatar_url":"https://avatars.githubusercontent.com/u/10010251?"}}
{"id":"2489397799","type":"PushEvent","actor":{"id":433707,"login":"ile","gravatar_id":"","url":"https://api.github.com/users/ile","avatar_url":"https://avatars.githubusercontent.com/u/433707?"},"repo":{"id":26847132,"name":"kantele/k-templates","url":"https://api.github.com/repos/kantele/k-templates"},"payload":{"push_id":536753095,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"a2211fba71212268a1c0f0b3dc4ddb1412bf72b6","before":"0c74567d174b0901cf19bde2f2ddc65e1d4ff6e1","commits":[{"sha":"a2211fba71212268a1c0f0b3dc4ddb1412bf72b6","author":{"email":"4f3407de78bccc8cc160ee4d278d5efe7162e6b5@nateps.com","name":"Nate Smith"},"message":"$markComponent => $component","distinct":true,"url":"https://api.github.com/repos/kantele/k-templates/commits/a2211fba71212268a1c0f0b3dc4ddb1412bf72b6"}]},"public":true,"created_at":"2015-01-01T01:04:29Z","org":{"id":5687585,"login":"kantele","gravatar_id":"","url":"https://api.github.com/orgs/kantele","avatar_url":"https://avatars.githubusercontent.com/u/5687585?"}}
{"id":"2489397802","type":"PushEvent","actor":{"id":8819701,"login":"r-ggraham","gravatar_id":"","url":"https://api.github.com/users/r-ggraham","avatar_url":"https://avatars.githubusercontent.com/u/8819701?"},"repo":{"id":28678173,"name":"r-ggraham/Crumpet_Bot","url":"https://api.github.com/repos/r-ggraham/Crumpet_Bot"},"payload":{"push_id":536753097,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"ee45c3d188e25fa5ee1d0d5a8a9f3646854ccbc7","before":"51951542e9d518f59ff62753725e5186d4111822","commits":[{"sha":"ee45c3d188e25fa5ee1d0d5a8a9f3646854ccbc7","author":{"email":"f2f9dd43aa4244d32208a2ccfa0c7c9e9c48f7e7@uni.worc.ac.uk","name":"Rob G"},"message":"formatting","distinct":true,"url":"https://api.github.com/repos/r-ggraham/Crumpet_Bot/commits/ee45c3d188e25fa5ee1d0d5a8a9f3646854ccbc7"}]},"public":true,"created_at":"2015-01-01T01:04:29Z"}
{"id":"2489397805","type":"IssueCommentEvent","actor":{"id":5497952,"login":"g19-mr","gravatar_id":"","url":"https://api.github.com/users/g19-mr","avatar_url":"https://avatars.githubusercontent.com/u/5497952?"},"repo":{"id":25435487,"name":"g19-mr/azh","url":"https://api.github.com/repos/g19-mr/azh"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/g19-mr/azh/issues/82","labels_url":"https://api.github.com/repos/g19-mr/azh/issues/82/labels{/name}","comments_url":"https://api.github.com/repos/g19-mr/azh/issues/82/comments","events_url":"https://api.github.com/repos/g19-mr/azh/issues/82/events","html_url":"https://github.com/g19-mr/azh/issues/82","id":53210240,"number":82,"title":"Add background color to done buttons in all Webviews","user":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/g19-mr/azh/labels/improvement","name":"improvement","color":"84b6eb"}],"state":"closed","locked":false,"assignee":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"
https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"milestone":{"url":"https://api.github.com/repos/g19-mr/azh/milestones/2","labels_url":"https://api.github.com/repos/g19-mr/azh/milestones/2/labels","id":873798,"number":2,"title":"Android 1.0.1","description":null,"creator":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"open_issues":5,"closed_issues":11,"state":"open","created_at":"2014-11-20T05:20:02Z","updated_at":"2015-01-01T01:04:29Z","due_on":null,"closed_at":null},"comments":1,"created_at":"2015-01-01T01:03:44Z","updated_at":"2015-01-01T01:04:29Z","closed_at":"2015-01-01T01:04:29Z","body":"- 2 on 
Donate screen\r\n- 1 on About screen"},"comment":{"url":"https://api.github.com/repos/g19-mr/azh/issues/comments/68477309","html_url":"https://github.com/g19-mr/azh/issues/82#issuecomment-68477309","issue_url":"https://api.github.com/repos/g19-mr/azh/issues/82","id":68477309,"user":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:04:29Z","updated_at":"2015-01-01T01:04:29Z","body":"Made Done buttons the same color as buttons on about screen"}},"public":true,"created_at":"2015-01-01T01:04:30Z"}
{"id":"2489397806","type":"IssuesEvent","actor":{"id":5497952,"login":"g19-mr","gravatar_id":"","url":"https://api.github.com/users/g19-mr","avatar_url":"https://avatars.githubusercontent.com/u/5497952?"},"repo":{"id":25435487,"name":"g19-mr/azh","url":"https://api.github.com/repos/g19-mr/azh"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/g19-mr/azh/issues/82","labels_url":"https://api.github.com/repos/g19-mr/azh/issues/82/labels{/name}","comments_url":"https://api.github.com/repos/g19-mr/azh/issues/82/comments","events_url":"https://api.github.com/repos/g19-mr/azh/issues/82/events","html_url":"https://github.com/g19-mr/azh/issues/82","id":53210240,"number":82,"title":"Add background color to done buttons in all Webviews","user":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/g19-mr/azh/labels/improvement","name":"improvement","color":"84b6eb"}],"state":"closed","locked":false,"assignee":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https:/
/api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"milestone":{"url":"https://api.github.com/repos/g19-mr/azh/milestones/2","labels_url":"https://api.github.com/repos/g19-mr/azh/milestones/2/labels","id":873798,"number":2,"title":"Android 1.0.1","description":null,"creator":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"open_issues":5,"closed_issues":11,"state":"open","created_at":"2014-11-20T05:20:02Z","updated_at":"2015-01-01T01:04:29Z","due_on":null,"closed_at":null},"comments":1,"created_at":"2015-01-01T01:03:44Z","updated_at":"2015-01-01T01:04:29Z","closed_at":"2015-01-01T01:04:29Z","body":"- 2 on Donate 
screen\r\n- 1 on About screen"}},"public":true,"created_at":"2015-01-01T01:04:30Z"}
{"id":"2489397807","type":"IssueCommentEvent","actor":{"id":1682199,"login":"JayBeavers","gravatar_id":"","url":"https://api.github.com/users/JayBeavers","avatar_url":"https://avatars.githubusercontent.com/u/1682199?"},"repo":{"id":21885551,"name":"erikringsmuth/app-router","url":"https://api.github.com/repos/erikringsmuth/app-router"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/erikringsmuth/app-router/issues/63","labels_url":"https://api.github.com/repos/erikringsmuth/app-router/issues/63/labels{/name}","comments_url":"https://api.github.com/repos/erikringsmuth/app-router/issues/63/comments","events_url":"https://api.github.com/repos/erikringsmuth/app-router/issues/63/events","html_url":"https://github.com/erikringsmuth/app-router/issues/63","id":53209410,"number":63,"title":"Advice on passing a fullbleed Polymer flexbox layout through the router","user":{"login":"JayBeavers","id":1682199,"avatar_url":"https://avatars.githubusercontent.com/u/1682199?v=3","gravatar_id":"","url":"https://api.github.com/users/JayBeavers","html_url":"https://github.com/JayBeavers","followers_url":"https://api.github.com/users/JayBeavers/followers","following_url":"https://api.github.com/users/JayBeavers/following{/other_user}","gists_url":"https://api.github.com/users/JayBeavers/gists{/gist_id}","starred_url":"https://api.github.com/users/JayBeavers/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JayBeavers/subscriptions","organizations_url":"https://api.github.com/users/JayBeavers/orgs","repos_url":"https://api.github.com/users/JayBeavers/repos","events_url":"https://api.github.com/users/JayBeavers/events{/privacy}","received_events_url":"https://api.github.com/users/JayBeavers/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2015-01-01T00:19:01Z","updated_at":"2015-01-01T01:04:30Z","closed_at":"2015-01-01T01:04:30Z","body"
:"I'm writing a full-screen app (fullbleed) and relying on the flexbox/layout features of Polymer for my layout design.\r\n\r\nWhen I moved to the app-router approach, I lost my screen measurements and have been working through the implications since.  At this point, I'm liberally applying 'layout/flex' to my app and I seem to be getting somewhere, but I'm still losing my flexbox support when I cross the app-route/import boundary.\r\n\r\nBefore I go trundling down the path of debugging/modifying app-router itself, is this something others have played with in the past?  Is there an established pattern I should be following?  Unfortunately I'm simultanouesly new to Polymer, flexbox/layouts, and app-router at the same time so I'm not really certain what is 'supposed' to work and what needs custom coding.\r\n\r\nRight now my pseduo-code is looking like:\r\n\r\n    <html>\r\n      <body fullbleed layout vertical unresolved>\r\n        <app-router flex layout vertical>\r\n          <app-route flex layout vertical> <!-- flex here isn't working as its dividing the screen real-estate amoung all my routes, I really mean 'flex but only on the active route' -->\r\n            <imported-page-template flex layout vertical> <!-- flex isn't working at all here, does not seem to cross the import boundary -->\r\n              ...\r\n\r\nAny thoughts for the lost and 
weary?"},"comment":{"url":"https://api.github.com/repos/erikringsmuth/app-router/issues/comments/68477310","html_url":"https://github.com/erikringsmuth/app-router/issues/63#issuecomment-68477310","issue_url":"https://api.github.com/repos/erikringsmuth/app-router/issues/63","id":68477310,"user":{"login":"JayBeavers","id":1682199,"avatar_url":"https://avatars.githubusercontent.com/u/1682199?v=3","gravatar_id":"","url":"https://api.github.com/users/JayBeavers","html_url":"https://github.com/JayBeavers","followers_url":"https://api.github.com/users/JayBeavers/followers","following_url":"https://api.github.com/users/JayBeavers/following{/other_user}","gists_url":"https://api.github.com/users/JayBeavers/gists{/gist_id}","starred_url":"https://api.github.com/users/JayBeavers/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JayBeavers/subscriptions","organizations_url":"https://api.github.com/users/JayBeavers/orgs","repos_url":"https://api.github.com/users/JayBeavers/repos","events_url":"https://api.github.com/users/JayBeavers/events{/privacy}","received_events_url":"https://api.github.com/users/JayBeavers/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:04:29Z","updated_at":"2015-01-01T01:04:29Z","body":"OK, thanks for the advice.  I was able to narrow down the attributes to get the system 'working as expected', at least after moderate testing to:\r\n\r\n```\r\n    <html>\r\n      <body fullbleed layout vertical unresolved>\r\n        <app-router>\r\n          <app-route import='...'>\r\n            <polymer-element>\r\n              <template>\r\n                <div layout vertical center>\r\n                  ...\r\n```\r\n\r\nThis seemed to pick up the information it needed, my missing step was that I needed a containing div inside the template of my polymer-element/page."}},"public":true,"created_at":"2015-01-01T01:04:30Z"}
{"id":"2489397808","type":"IssuesEvent","actor":{"id":1682199,"login":"JayBeavers","gravatar_id":"","url":"https://api.github.com/users/JayBeavers","avatar_url":"https://avatars.githubusercontent.com/u/1682199?"},"repo":{"id":21885551,"name":"erikringsmuth/app-router","url":"https://api.github.com/repos/erikringsmuth/app-router"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/erikringsmuth/app-router/issues/63","labels_url":"https://api.github.com/repos/erikringsmuth/app-router/issues/63/labels{/name}","comments_url":"https://api.github.com/repos/erikringsmuth/app-router/issues/63/comments","events_url":"https://api.github.com/repos/erikringsmuth/app-router/issues/63/events","html_url":"https://github.com/erikringsmuth/app-router/issues/63","id":53209410,"number":63,"title":"Advice on passing a fullbleed Polymer flexbox layout through the router","user":{"login":"JayBeavers","id":1682199,"avatar_url":"https://avatars.githubusercontent.com/u/1682199?v=3","gravatar_id":"","url":"https://api.github.com/users/JayBeavers","html_url":"https://github.com/JayBeavers","followers_url":"https://api.github.com/users/JayBeavers/followers","following_url":"https://api.github.com/users/JayBeavers/following{/other_user}","gists_url":"https://api.github.com/users/JayBeavers/gists{/gist_id}","starred_url":"https://api.github.com/users/JayBeavers/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JayBeavers/subscriptions","organizations_url":"https://api.github.com/users/JayBeavers/orgs","repos_url":"https://api.github.com/users/JayBeavers/repos","events_url":"https://api.github.com/users/JayBeavers/events{/privacy}","received_events_url":"https://api.github.com/users/JayBeavers/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2015-01-01T00:19:01Z","updated_at":"2015-01-01T01:04:30Z","closed_at":"2015-01-01T01:04:30Z","body":"I'm 
writing a full-screen app (fullbleed) and relying on the flexbox/layout features of Polymer for my layout design.\r\n\r\nWhen I moved to the app-router approach, I lost my screen measurements and have been working through the implications since.  At this point, I'm liberally applying 'layout/flex' to my app and I seem to be getting somewhere, but I'm still losing my flexbox support when I cross the app-route/import boundary.\r\n\r\nBefore I go trundling down the path of debugging/modifying app-router itself, is this something others have played with in the past?  Is there an established pattern I should be following?  Unfortunately I'm simultanouesly new to Polymer, flexbox/layouts, and app-router at the same time so I'm not really certain what is 'supposed' to work and what needs custom coding.\r\n\r\nRight now my pseduo-code is looking like:\r\n\r\n    <html>\r\n      <body fullbleed layout vertical unresolved>\r\n        <app-router flex layout vertical>\r\n          <app-route flex layout vertical> <!-- flex here isn't working as its dividing the screen real-estate amoung all my routes, I really mean 'flex but only on the active route' -->\r\n            <imported-page-template flex layout vertical> <!-- flex isn't working at all here, does not seem to cross the import boundary -->\r\n              ...\r\n\r\nAny thoughts for the lost and weary?"}},"public":true,"created_at":"2015-01-01T01:04:30Z"}
{"id":"2489397809","type":"PushEvent","actor":{"id":706947,"login":"d3athrow","gravatar_id":"","url":"https://api.github.com/users/d3athrow","avatar_url":"https://avatars.githubusercontent.com/u/706947?"},"repo":{"id":10441188,"name":"d3athrow/vgstation13","url":"https://api.github.com/repos/d3athrow/vgstation13"},"payload":{"push_id":536753099,"size":4,"distinct_size":4,"ref":"refs/heads/Bleeding-Edge","head":"54c4e0ffb341dc6ebdf8ce724b13e357234b9af0","before":"d274ed664f000dd393d16d6ebd5234332985ac8d","commits":[{"sha":"19881ecd196d4282777ba1ce93929aae3d4ca71c","author":{"email":"4b46b39232cc3015db82c31a969ae73f4e58ae9a@gmail.com","name":"Duny-"},"message":"A few defficiency fixes\n\n- Added all missing holodeck settings\n- Added missing pipe in the supermatter room\n- Tweaked toxins launcher, hopefully it doesn't refuse to launch bombs\nin higher ZAS settings anymore","distinct":true,"url":"https://api.github.com/repos/d3athrow/vgstation13/commits/19881ecd196d4282777ba1ce93929aae3d4ca71c"},{"sha":"ebd9ca32a9b118aa3f81188d375a5d9447f32514","author":{"email":"4b46b39232cc3015db82c31a969ae73f4e58ae9a@gmail.com","name":"Duny-"},"message":"Changelog","distinct":true,"url":"https://api.github.com/repos/d3athrow/vgstation13/commits/ebd9ca32a9b118aa3f81188d375a5d9447f32514"},{"sha":"34f7fa7b80f675ce4e56f4bc148338104b8155ee","author":{"email":"4b46b39232cc3015db82c31a969ae73f4e58ae9a@gmail.com","name":"Duny-"},"message":"Tiny lil fix","distinct":true,"url":"https://api.github.com/repos/d3athrow/vgstation13/commits/34f7fa7b80f675ce4e56f4bc148338104b8155ee"},{"sha":"54c4e0ffb341dc6ebdf8ce724b13e357234b9af0","author":{"email":"bf439111772c53efe08334e0c2bcb283a1d320cb@yahoo.com","name":"d3athrow"},"message":"Merge pull request #2417 from Duny-/Bleeding-Edge\n\nA few defficiency fixes","distinct":true,"url":"https://api.github.com/repos/d3athrow/vgstation13/commits/54c4e0ffb341dc6ebdf8ce724b13e357234b9af0"}]},"public":true,"created_at":"2015-01-01T01:04:30Z"}
{"id":"2489397821","type":"PushEvent","actor":{"id":6355392,"login":"githanwang1","gravatar_id":"","url":"https://api.github.com/users/githanwang1","avatar_url":"https://avatars.githubusercontent.com/u/6355392?"},"repo":{"id":28543231,"name":"githanwang1/django-blog","url":"https://api.github.com/repos/githanwang1/django-blog"},"payload":{"push_id":536753105,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"130cfc38c0c001e58f84398948b72b138ccce717","before":"84d296175511f1df9097fb18be3ec500e8acc701","commits":[{"sha":"130cfc38c0c001e58f84398948b72b138ccce717","author":{"email":"053e32d42d025177f9df81fc22020283a55f18ff@berkeley.edu","name":"Han Wang"},"message":"new blog lel","distinct":true,"url":"https://api.github.com/repos/githanwang1/django-blog/commits/130cfc38c0c001e58f84398948b72b138ccce717"}]},"public":true,"created_at":"2015-01-01T01:04:32Z"}
{"id":"2489397824","type":"PushEvent","actor":{"id":1779595,"login":"dcbaker","gravatar_id":"","url":"https://api.github.com/users/dcbaker","avatar_url":"https://avatars.githubusercontent.com/u/1779595?"},"repo":{"id":8488437,"name":"dcbaker/piglit","url":"https://api.github.com/repos/dcbaker/piglit"},"payload":{"push_id":536753107,"size":0,"distinct_size":0,"ref":"refs/heads/wip/command-list-only-v5","head":"cf5cf7224385c3c3d086762b5bc1d8f7df031ae7","before":"e81f4b28bf6ad78c7fb05257e77e42fe237a09ed","commits":[]},"public":true,"created_at":"2015-01-01T01:04:32Z"}
{"id":"2489397826","type":"PushEvent","actor":{"id":170479,"login":"tdhooper","gravatar_id":"","url":"https://api.github.com/users/tdhooper","avatar_url":"https://avatars.githubusercontent.com/u/170479?"},"repo":{"id":19411601,"name":"tdhooper/starstoloves","url":"https://api.github.com/repos/tdhooper/starstoloves"},"payload":{"push_id":536753109,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"b75fca64d82ce8d4c496bb3ab353bc7bed89a46c","before":"249d09e95e69c92cf5b1fd133d659271495d59a3","commits":[{"sha":"cd1431978800b65553ad260162efa5d346f49d57","author":{"email":"c136eba45d3ee7ac4dbbfc7f9f9d33c11a99a23f@Macintosh.local","name":"Thomas Hooper"},"message":"Show time loved","distinct":true,"url":"https://api.github.com/repos/tdhooper/starstoloves/commits/cd1431978800b65553ad260162efa5d346f49d57"},{"sha":"b75fca64d82ce8d4c496bb3ab353bc7bed89a46c","author":{"email":"c136eba45d3ee7ac4dbbfc7f9f9d33c11a99a23f@Macintosh.local","name":"Thomas Hooper"},"message":"Get fresh loved tracks after loving","distinct":true,"url":"https://api.github.com/repos/tdhooper/starstoloves/commits/b75fca64d82ce8d4c496bb3ab353bc7bed89a46c"}]},"public":true,"created_at":"2015-01-01T01:04:33Z"}
{"id":"2489397827","type":"GollumEvent","actor":{"id":46323,"login":"paulcon","gravatar_id":"","url":"https://api.github.com/users/paulcon","avatar_url":"https://avatars.githubusercontent.com/u/46323?"},"repo":{"id":28157780,"name":"paulcon/active_subspaces","url":"https://api.github.com/repos/paulcon/active_subspaces"},"payload":{"pages":[{"page_name":"_Footer","title":"_Footer","summary":null,"action":"edited","sha":"bab75a681aedf8288c9da56929fca226c67102f3","html_url":"https://github.com/paulcon/active_subspaces/wiki/_Footer"}]},"public":true,"created_at":"2015-01-01T01:04:33Z"}
{"id":"2489397831","type":"PushEvent","actor":{"id":904370,"login":"helhum","gravatar_id":"","url":"https://api.github.com/users/helhum","avatar_url":"https://avatars.githubusercontent.com/u/904370?"},"repo":{"id":26716312,"name":"TYPO3-Surf-CMS/Surf.CMS","url":"https://api.github.com/repos/TYPO3-Surf-CMS/Surf.CMS"},"payload":{"push_id":536753110,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"0ab6946565a1611c3bf27a34d8686bad2b88a5d7","before":"6c5278184c56a725e3cefd459de3cc77c78e0908","commits":[{"sha":"0ab6946565a1611c3bf27a34d8686bad2b88a5d7","author":{"email":"6bf857ca7de026fbed4ae790a809a0ea640901f4@helmuthummel.de","name":"Helmut Hummel"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/TYPO3-Surf-CMS/Surf.CMS/commits/0ab6946565a1611c3bf27a34d8686bad2b88a5d7"}]},"public":true,"created_at":"2015-01-01T01:04:33Z","org":{"id":7921669,"login":"TYPO3-Surf-CMS","gravatar_id":"","url":"https://api.github.com/orgs/TYPO3-Surf-CMS","avatar_url":"https://avatars.githubusercontent.com/u/7921669?"}}
{"id":"2489397835","type":"PushEvent","actor":{"id":18191,"login":"jc00ke","gravatar_id":"","url":"https://api.github.com/users/jc00ke","avatar_url":"https://avatars.githubusercontent.com/u/18191?"},"repo":{"id":28678223,"name":"jc00ke/chruby-fish","url":"https://api.github.com/repos/jc00ke/chruby-fish"},"payload":{"push_id":536753112,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"859d6a993456f190598eda5b2a188d96af984cf2","before":"e8f28035e7570cbf90568e7dd087810ae7958c8d","commits":[{"sha":"859d6a993456f190598eda5b2a188d96af984cf2","author":{"email":"a5c95b3d7cb4d0ae05a15c79c79ab458dc2c8f9e@jc00ke.com","name":"Jesse Cooke"},"message":"Document known PATH warning","distinct":true,"url":"https://api.github.com/repos/jc00ke/chruby-fish/commits/859d6a993456f190598eda5b2a188d96af984cf2"}]},"public":true,"created_at":"2015-01-01T01:04:34Z"}
{"id":"2489397840","type":"CreateEvent","actor":{"id":7637494,"login":"Kf4btg","gravatar_id":"","url":"https://api.github.com/users/Kf4btg","avatar_url":"https://avatars.githubusercontent.com/u/7637494?"},"repo":{"id":28275582,"name":"Kf4btg/TIH_tAPImod","url":"https://api.github.com/repos/Kf4btg/TIH_tAPImod"},"payload":{"ref":"1.1.2","ref_type":"tag","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:04:35Z"}
{"id":"2489397842","type":"IssuesEvent","actor":{"id":74571,"login":"fitzgen","gravatar_id":"","url":"https://api.github.com/users/fitzgen","avatar_url":"https://avatars.githubusercontent.com/u/74571?"},"repo":{"id":724712,"name":"rust-lang/rust","url":"https://api.github.com/repos/rust-lang/rust"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/rust-lang/rust/issues/20355","labels_url":"https://api.github.com/repos/rust-lang/rust/issues/20355/labels{/name}","comments_url":"https://api.github.com/repos/rust-lang/rust/issues/20355/comments","events_url":"https://api.github.com/repos/rust-lang/rust/issues/20355/events","html_url":"https://github.com/rust-lang/rust/issues/20355","id":53157956,"number":20355,"title":"Segfault in `Hasher<SipState>::hash`","user":{"login":"fitzgen","id":74571,"avatar_url":"https://avatars.githubusercontent.com/u/74571?v=3","gravatar_id":"","url":"https://api.github.com/users/fitzgen","html_url":"https://github.com/fitzgen","followers_url":"https://api.github.com/users/fitzgen/followers","following_url":"https://api.github.com/users/fitzgen/following{/other_user}","gists_url":"https://api.github.com/users/fitzgen/gists{/gist_id}","starred_url":"https://api.github.com/users/fitzgen/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/fitzgen/subscriptions","organizations_url":"https://api.github.com/users/fitzgen/orgs","repos_url":"https://api.github.com/users/fitzgen/repos","events_url":"https://api.github.com/users/fitzgen/events{/privacy}","received_events_url":"https://api.github.com/users/fitzgen/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/rust-lang/rust/labels/I-crash","name":"I-crash","color":"e10c02"}],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":6,"created_at":"2014-12-31T00:04:46Z","updated_at":"2015-01-01T01:04:35Z","closed_at":"2015-01-01T01:04:35Z","body":"Test case is branch `sip-hasher-segault` 
of this repo: https://github.com/fitzgen/oxischeme/tree/sip-hasher-segfault\r\n\r\n    $ rustc --version --verbose\r\n    rustc --version --verbose\r\n    rustc 0.13.0-nightly (5ba610265 2014-12-25 18:01:36 +0000)\r\n    binary: rustc\r\n    commit-hash: 5ba6102657a892457063d2d6a7cbb9632ce282c6\r\n    commit-date: 2014-12-25 18:01:36 +0000\r\n    host: x86_64-apple-darwin\r\n    release: 0.13.0-nightly\r\n    $ rustc -g --test src/main.rs -o target/test\r\n    $ lldb ./target/test\r\n    lldb ./target/test\r\n    (lldb) target create \"./target/test\"\r\n    Current executable set to './target/test' (x86_64).\r\n    (lldb) run\r\n    Process 8270 launched: './target/test' (x86_64)\r\n\r\n    running 20 tests\r\n    Process 8270 stopped\r\n    * thread #2: tid = 0x25693, 0x0000000100008bed test`hash::sip::SipHasher.Hasher$LT$SipState$GT$::hash::h16497116303610205953 + 61, stop reason = EXC_BAD_ACCESS (code=1, address=0x3ffd9)\r\n        frame #0: 0x0000000100008bed test`hash::sip::SipHasher.Hasher$LT$SipState$GT$::hash::h16497116303610205953 + 61\r\n    test`hash::sip::SipHasher.Hasher$LT$SipState$GT$::hash::h16497116303610205953 + 61:\r\n    -> 0x100008bed:  movq   (%rsi), %rsi\r\n       0x100008bf0:  movq   -0x8(%rbp), %rdi\r\n       0x100008bf4:  movq   0x8(%rdi), %rdx\r\n       0x100008bf8:  movq   %rax, %rdi\r\n    (lldb) bt\r\n    * thread #2: tid = 0x25693, 0x0000000100008bed test`hash::sip::SipHasher.Hasher$LT$SipState$GT$::hash::h16497116303610205953 + 61, stop reason = EXC_BAD_ACCESS (code=1, address=0x3ffd9)\r\n      * frame #0: 0x0000000100008bed test`hash::sip::SipHasher.Hasher$LT$SipState$GT$::hash::h16497116303610205953 + 61\r\n        frame #1: 0x0000000105401810\r\n        frame #2: 0x0000000100008ba2 test`hash::RandomSipHasher.Hasher$LT$sip..SipState$GT$::hash::h10512232733763305808 + 66\r\n        frame #3: 0x0000000100008b0e test`collections::hash::table::make_hash::h9604696550138645665 + 62\r\n        frame #4: 0x0000000100008abe 
test`collections::hash::map::HashMap$LT$K$C$$u{20}V$C$$u{20}H$GT$::make_hash::h15786379260790357760 + 62\r\n        frame #5: 0x0000000100008963 test`collections::hash::map::HashMap$LT$K$C$$u{20}V$C$$u{20}H$GT$::insert::h6805880362953821147 + 131\r\n        frame #6: 0x0000000100006aea test`main::environment::Environment::define(self=0x000000000003ffc1, sym=String at 0x0000000105401a50, val=0x0000000105401c38) + 218 at environment.rs:92\r\n        frame #7: 0x0000000100018486 test`main::eval::evaluate_definition(heap=0x00000001054034e8, env=0x0000000105402d10, form=0x0000000105402ce0) + 2406 at eval.rs:195\r\n        frame #8: 0x0000000100013f1b test`main::eval::evaluate(heap=0x00000001054034e8, env=0x0000000105402d90, form=0x0000000105402f30) + 1355 at eval.rs:79\r\n        frame #9: 0x0000000100013909 test`main::eval::evaluate_in_global_env(heap=0x00000001054034e8, form=0x0000000105402f30) + 105 at eval.rs:38\r\n        frame #10: 0x000000010001cd7b test`main::eval::evaluate_file(heap=0x00000001054034e8, file_path=(data_ptr = \"./tests/test_eval_closures.scmsrc/heap.rsArenaPtr(, )Rooted(\", length = 30)) + 1035 at <std macros>:286\r\n        frame #11: 0x000000010002c071 test`main::eval::test_eval_closures + 129 at eval.rs:403\r\n        frame #12: 0x0000000100087154 test`thunk::F.Invoke$LT$A$C$$u{20}R$GT$::invoke::h5218640484166224076 + 52\r\n        frame #13: 0x0000000100091e32 test`thunk::F.Invoke$LT$A$C$$u{20}R$GT$::invoke::h13672304839710771993 + 162\r\n        frame #14: 0x0000000100088912 test`thunk::F.Invoke$LT$A$C$$u{20}R$GT$::invoke::h15490786364890695979 + 1138\r\n        frame #15: 0x0000000100088db0 test`rt::unwind::try::try_fn::h10439459448986358359 + 160\r\n        frame #16: 0x000000010010a4f9 test`rust_try_inner + 9\r\n        frame #17: 0x000000010010a4e6 test`rust_try + 6\r\n        frame #18: 0x00000001000894ab test`thunk::F.Invoke$LT$A$C$$u{20}R$GT$::invoke::h13206639752781900349 + 1179\r\n        frame #19: 0x0000000100106eb4 
test`sys::thread::thread_start::h2cb22211a4c7d938vFw + 164\r\n        frame #20: 0x00007fff875d3899 libsystem_pthread.dylib`_pthread_body + 138\r\n        frame #21: 0x00007fff875d372a libsystem_pthread.dylib`_pthread_start + 137\r\n        frame #22: 0x00007fff875d7fc9 libsystem_pthread.dylib`thread_start + 13\r\n"}},"public":true,"created_at":"2015-01-01T01:04:35Z","org":{"id":5430905,"login":"rust-lang","gravatar_id":"","url":"https://api.github.com/orgs/rust-lang","avatar_url":"https://avatars.githubusercontent.com/u/5430905?"}}
{"id":"2489397845","type":"PushEvent","actor":{"id":2284601,"login":"citrix-openstack-build","gravatar_id":"","url":"https://api.github.com/users/citrix-openstack-build","avatar_url":"https://avatars.githubusercontent.com/u/2284601?"},"repo":{"id":13325270,"name":"citrix-openstack-build/keystone","url":"https://api.github.com/repos/citrix-openstack-build/keystone"},"payload":{"push_id":536753115,"size":4,"distinct_size":4,"ref":"refs/heads/ctx-nova-network-smoke-latest","head":"503da84ac51a3f5f4d173fe5d1b19c98ed12ed7d","before":"eb3556e9b9c4413030b230c6a6fd04a934328773","commits":[{"sha":"637845df1ef857dfd5f23658ac77312f0212c7c7","author":{"email":"38c8728ee30e7562e7872660a2fab1bda7c7a859@us.ibm.com","name":"Brant Knudson"},"message":"Enhance FakeLdap to require base entry for subtree search\n\nThe FakeLdap implementation didn't raise ldap.NO_SUCH_OBJECT when the\nbase entry didn't exist. A real LDAP server would raise if the base\nentry didn't exist.\n\nChange-Id: If26d4cff5882ad13c9e00b8a894920f244238c49\nCloses-Bug: #1368772","distinct":true,"url":"https://api.github.com/repos/citrix-openstack-build/keystone/commits/637845df1ef857dfd5f23658ac77312f0212c7c7"},{"sha":"e06a463e961403d665608252a71efff4b7a415ab","author":{"email":"1150688ef4531a9968266ddcbdddd37ed9b81ac8@huawei.com","name":"wanghong"},"message":"improve the EP-FILTER catalog length check in test_v3.py\n\nUse matcher.HasLength to do EP-FILTER catalog length check in\ntest_v3.py. There are two reason to do this:\n1. Currrently, we check more than but not equal, this may cover bug\n2. 
When test fails, it just give an useless message:\n   AssertionError: False is not true\n\nChange-Id: I20d521690e79957031bdf4bf5b240f8a4790553c","distinct":true,"url":"https://api.github.com/repos/citrix-openstack-build/keystone/commits/e06a463e961403d665608252a71efff4b7a415ab"},{"sha":"ded5608f38c6629752228a411b620e8c6614410d","author":{"email":"d95b56ce41a2e1ac4cecdd398defd7414407cc08@review.openstack.org","name":"Jenkins"},"message":"Merge \"Enhance FakeLdap to require base entry for subtree search\"","distinct":true,"url":"https://api.github.com/repos/citrix-openstack-build/keystone/commits/ded5608f38c6629752228a411b620e8c6614410d"},{"sha":"503da84ac51a3f5f4d173fe5d1b19c98ed12ed7d","author":{"email":"d95b56ce41a2e1ac4cecdd398defd7414407cc08@review.openstack.org","name":"Jenkins"},"message":"Merge \"improve the EP-FILTER catalog length check in test_v3.py\"","distinct":true,"url":"https://api.github.com/repos/citrix-openstack-build/keystone/commits/503da84ac51a3f5f4d173fe5d1b19c98ed12ed7d"}]},"public":true,"created_at":"2015-01-01T01:04:36Z"}
{"id":"2489397847","type":"PushEvent","actor":{"id":4356609,"login":"dcrousso","gravatar_id":"","url":"https://api.github.com/users/dcrousso","avatar_url":"https://avatars.githubusercontent.com/u/4356609?"},"repo":{"id":25148806,"name":"dcrousso/ProjectEuler","url":"https://api.github.com/repos/dcrousso/ProjectEuler"},"payload":{"push_id":536753116,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e8da582cd7c82a56b23ac566b7bb8b8edf5ce415","before":"b2b6712812e289ed0a75eb185113dd69a9e43dd9","commits":[{"sha":"e8da582cd7c82a56b23ac566b7bb8b8edf5ce415","author":{"email":"9ebcc5dc367a76bd13fea77254fcbce737f76b12@gmail.com","name":"Devin Rousso"},"message":"Completed 123","distinct":true,"url":"https://api.github.com/repos/dcrousso/ProjectEuler/commits/e8da582cd7c82a56b23ac566b7bb8b8edf5ce415"}]},"public":true,"created_at":"2015-01-01T01:04:36Z"}
{"id":"2489397852","type":"PullRequestReviewCommentEvent","actor":{"id":523287,"login":"j2sol","gravatar_id":"","url":"https://api.github.com/users/j2sol","avatar_url":"https://avatars.githubusercontent.com/u/523287?"},"repo":{"id":11848896,"name":"blueboxgroup/ursula","url":"https://api.github.com/repos/blueboxgroup/ursula"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397285","id":22397285,"diff_hunk":"@@ -1,121 +1,92 @@\n ---\n-- name: install apache\n-  apt: pkg={{ item }}\n-  with_items:\n-    - apache2\n-    - libapache2-mod-wsgi\n-\n - name: lesscpy must be in apache PATH\n   pip: name=lesscpy version=0.9j\n \n - name: get horizon source repo\n-  git: repo={{ openstack.git_mirror }}/horizon.git\n-       dest=/opt/stack/horizon\n-       version={{ horizon.rev }}\n-       update={{ openstack.git_update }}\n+  git: |\n+    repo={{ openstack.git_mirror}}/horizon.git\n+    dest=/opt/stack/horizon\n+    version={{ horizon.rev }}\n+    update={{ openstack.git_update }}\n   notify:\n     - setup horizon venv\n     - compress horizon assets\n \n-- template: src=opt/stack/horizon/hide-external-networks.patch dest=/opt/stack/horizon/hide-external-networks.patch mode=0644\n-- shell: patch -p1 < hide-external-networks.patch chdir=/opt/stack/horizon\n-  notify:\n-    - setup horizon venv\n-\n - name: add python-memcached to horizon requirements\n-  lineinfile: dest=/opt/stack/horizon/requirements.txt\n-              regexp=^python-memcached\n-              line=python-memcached\n+  lineinfile: dest=/opt/stack/horizon/requirements.txt regexp=^python-memcached line=python-memcached\n   notify:\n     - setup horizon venv\n \n-- name: disable apache status\n-  command: a2dismod status\n-  notify:\n-    - restart apache\n-\n-- name: apache ports config\n-  template: src=etc/apache2/ports.conf\n-            dest=/etc/apache2/ports.conf\n-  notify:\n-    - restart apache\n-\n-- name: disable default apache 
site\n-  command: a2dissite 000-default\n+- name: make sure apache knows about horizon ports\n+  lineinfile: dest=/etc/apache2/ports.conf line=\"Listen 8080\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config (12.04)\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard\n+- name: create dashboard virtualhost on precise\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard\n   when: ansible_distribution_version == \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard.conf\n+- name: create dashboard virtualhost on other\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard.conf\n   when: ansible_distribution_version != \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n - name: enable horizon apache site\n-  command: a2ensite openstack_dashboard\n+  apache2_site: state=enabled name=openstack_dashboard\n   notify:\n-    - restart apache\n-\n-- name: static asset directories\n-  file: dest={{ item }}\n-        state=directory\n-        owner=www-data\n-        group=www-data\n-        mode=0755\n+    - reload apache\n+\n+- name: create static asset dirs\n+  file: 
|","path":"roles/horizon/tasks/main.yml","position":96,"original_position":96,"commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","original_commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"j2sol","id":523287,"avatar_url":"https://avatars.githubusercontent.com/u/523287?v=3","gravatar_id":"","url":"https://api.github.com/users/j2sol","html_url":"https://github.com/j2sol","followers_url":"https://api.github.com/users/j2sol/followers","following_url":"https://api.github.com/users/j2sol/following{/other_user}","gists_url":"https://api.github.com/users/j2sol/gists{/gist_id}","starred_url":"https://api.github.com/users/j2sol/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/j2sol/subscriptions","organizations_url":"https://api.github.com/users/j2sol/orgs","repos_url":"https://api.github.com/users/j2sol/repos","events_url":"https://api.github.com/users/j2sol/events{/privacy}","received_events_url":"https://api.github.com/users/j2sol/received_events","type":"User","site_admin":false},"body":"why so 
continuation?","created_at":"2015-01-01T01:04:37Z","updated_at":"2015-01-01T01:04:37Z","html_url":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397285","pull_request_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397285"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397285"},"pull_request":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"}}},"pull_request":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","id":26738851,"html_url":"https://github.com/blueboxgroup/ursula/pull/705","diff_url":"https://github.com/blueboxgroup/ursula/pull/705.diff","patch_url":"https://github.com/blueboxgroup/ursula/pull/705.patch","issue_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705","number":705,"state":"open","locked":false,"title":"WIP:  apache for loadbalancing","user":{"login":"paulczar","id":2488346,"avatar_url":"https://avatars.githubusercontent.com/u/2488346?v=3","gravatar_id":"","url":"https://api.github.com/users/paulczar","html_url":"https://github.com/paulczar","followers_url":"https://api.github.com/users/paulczar/followers","following_url":"https://api.github.com/users/paulczar/following{/other_user}","gists_url":"https://api.github.com/users/paulczar/gists{/gist_id}","starred_url":"https://api.github.com/users/paulczar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/paulczar/subscriptions","organizations_url":"https://api.github.com/users/paulczar/orgs","repos_url":"https://api.github.com/users/paulczar/repos","events_url":"https://api.github.com/users/paulczar/events{/privacy}","received_events_url":"https://api.github.com/users/paulczar/received_events","type":"User","site_admin":false},"body":"This is a quick POC / WIP to demo using apache instead of haproxy for loadbalancing our APIs.\r\n\r\nI think this gives us more 
flexibiltiy as we can enable in the APIs role itself ( in this case in keystone ) rather than a big monolithic haproxy.conf.      We also already have apache running for horizon, so it could reduce number of services.    apache also has better logging options that haproxy which can only log to syslog. ","created_at":"2015-01-01T00:04:13Z","updated_at":"2015-01-01T01:04:37Z","closed_at":null,"merged_at":null,"merge_commit_sha":"9b91693f11e166c9ee53836f19697868d412bf76","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits","review_comments_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments","review_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f","head":{"label":"blueboxgroup:use_apache_for_lb","ref":"use_apache_for_lb","sha":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type
":"Organization","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating 
OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/commen
ts/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"base":{"label":"blueboxgroup:master","ref":"master","sha":"34b83c65ff0de2f8b006d8ce4f76919fe0167bbf","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/fo
llowing{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating 
OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/commen
ts/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705"},"issue":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705"},"comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments"},"review_comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments"},"review_comment":{"href":"https://
api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits"},"statuses":{"href":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f"}}}},"public":true,"created_at":"2015-01-01T01:04:37Z","org":{"id":458705,"login":"blueboxgroup","gravatar_id":"","url":"https://api.github.com/orgs/blueboxgroup","avatar_url":"https://avatars.githubusercontent.com/u/458705?"}}
{"id":"2489397854","type":"PushEvent","actor":{"id":163915,"login":"fponticelli","gravatar_id":"","url":"https://api.github.com/users/fponticelli","avatar_url":"https://avatars.githubusercontent.com/u/163915?"},"repo":{"id":28647473,"name":"fponticelli/thx.benchmark","url":"https://api.github.com/repos/fponticelli/thx.benchmark"},"payload":{"push_id":536753119,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f6a2f0275338378ee5e3c4674e5cef6a9029f6b1","before":"203d2bfd757e0619e7b8e7732a16ea15bed09c2e","commits":[{"sha":"f6a2f0275338378ee5e3c4674e5cef6a9029f6b1","author":{"email":"05a4419b3ba135c9a2552a2fac2f13cfe3d22f12@gmail.com","name":"Franco Ponticelli"},"message":"changed decimals in mills","distinct":true,"url":"https://api.github.com/repos/fponticelli/thx.benchmark/commits/f6a2f0275338378ee5e3c4674e5cef6a9029f6b1"}]},"public":true,"created_at":"2015-01-01T01:04:37Z"}
{"id":"2489397855","type":"PushEvent","actor":{"id":69068,"login":"someara","gravatar_id":"","url":"https://api.github.com/users/someara","avatar_url":"https://avatars.githubusercontent.com/u/69068?"},"repo":{"id":28658028,"name":"someara/slacker-packer","url":"https://api.github.com/repos/someara/slacker-packer"},"payload":{"push_id":536753120,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"a167b8d1405621a26333fda5325d389eeccc05ff","before":"6c580a76c4800bd2707e53fef9c722c78ad0d742","commits":[{"sha":"09f12c2d299252470229258e6f4a98f439bd025e","author":{"email":"a08f4e77dc67cec36ca0d3194df5d081f3357efd@gmail.com","name":"hypomonk"},"message":"fixed shutdown and trimmed bootup time","distinct":true,"url":"https://api.github.com/repos/someara/slacker-packer/commits/09f12c2d299252470229258e6f4a98f439bd025e"},{"sha":"a167b8d1405621a26333fda5325d389eeccc05ff","author":{"email":"d7e19930cc1f42c2d0781f4d9e6f1fe5891bf9cf@chef.io","name":"Sean OMeara"},"message":"adding .gitignore and --no-check-certificates","distinct":true,"url":"https://api.github.com/repos/someara/slacker-packer/commits/a167b8d1405621a26333fda5325d389eeccc05ff"}]},"public":true,"created_at":"2015-01-01T01:04:37Z"}
{"id":"2489397856","type":"PushEvent","actor":{"id":166301,"login":"bcomnes","gravatar_id":"","url":"https://api.github.com/users/bcomnes","avatar_url":"https://avatars.githubusercontent.com/u/166301?"},"repo":{"id":6861308,"name":"bcomnes/bcomnes.github.io","url":"https://api.github.com/repos/bcomnes/bcomnes.github.io"},"payload":{"push_id":536753122,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"821968b470015bf7a6d5f86aeea8d739dd1aadbe","before":"6443459c46498095409d23205ceadb9e7b575182","commits":[{"sha":"821968b470015bf7a6d5f86aeea8d739dd1aadbe","author":{"email":"6df4fba95631fe4f4c4337307cda4e0fc4c27d16@gmail.com","name":"Bret"},"message":"gitpub posted a new post","distinct":true,"url":"https://api.github.com/repos/bcomnes/bcomnes.github.io/commits/821968b470015bf7a6d5f86aeea8d739dd1aadbe"}]},"public":true,"created_at":"2015-01-01T01:04:37Z"}
{"id":"2489397861","type":"PushEvent","actor":{"id":3720783,"login":"designerwebhosting","gravatar_id":"","url":"https://api.github.com/users/designerwebhosting","avatar_url":"https://avatars.githubusercontent.com/u/3720783?"},"repo":{"id":20527117,"name":"designerwebhosting/christopherbyrne.github.io","url":"https://api.github.com/repos/designerwebhosting/christopherbyrne.github.io"},"payload":{"push_id":536753125,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"52997f806edc1645856950072f9919dea680b5a7","before":"19f1368a9acc50e9b1cc2b936c165c9704040889","commits":[{"sha":"52997f806edc1645856950072f9919dea680b5a7","author":{"email":"4bb0acc6ff8c0b6c31e50417877e6e3b3f1c65f0@googlemail.com","name":"Peter Noblee"},"message":"update 'date'","distinct":true,"url":"https://api.github.com/repos/designerwebhosting/christopherbyrne.github.io/commits/52997f806edc1645856950072f9919dea680b5a7"}]},"public":true,"created_at":"2015-01-01T01:04:38Z"}
{"id":"2489397862","type":"PullRequestEvent","actor":{"id":568036,"login":"Tyilo","gravatar_id":"","url":"https://api.github.com/users/Tyilo","avatar_url":"https://avatars.githubusercontent.com/u/568036?"},"repo":{"id":21377779,"name":"isaacg1/pyth","url":"https://api.github.com/repos/isaacg1/pyth"},"payload":{"action":"opened","number":11,"pull_request":{"url":"https://api.github.com/repos/isaacg1/pyth/pulls/11","id":26739449,"html_url":"https://github.com/isaacg1/pyth/pull/11","diff_url":"https://github.com/isaacg1/pyth/pull/11.diff","patch_url":"https://github.com/isaacg1/pyth/pull/11.patch","issue_url":"https://api.github.com/repos/isaacg1/pyth/issues/11","number":11,"state":"open","locked":false,"title":"Move server functionality into different functions","user":{"login":"Tyilo","id":568036,"avatar_url":"https://avatars.githubusercontent.com/u/568036?v=3","gravatar_id":"","url":"https://api.github.com/users/Tyilo","html_url":"https://github.com/Tyilo","followers_url":"https://api.github.com/users/Tyilo/followers","following_url":"https://api.github.com/users/Tyilo/following{/other_user}","gists_url":"https://api.github.com/users/Tyilo/gists{/gist_id}","starred_url":"https://api.github.com/users/Tyilo/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Tyilo/subscriptions","organizations_url":"https://api.github.com/users/Tyilo/orgs","repos_url":"https://api.github.com/users/Tyilo/repos","events_url":"https://api.github.com/users/Tyilo/events{/privacy}","received_events_url":"https://api.github.com/users/Tyilo/received_events","type":"User","site_admin":false},"body":"As suggested by @Maltysen in #10 
","created_at":"2015-01-01T01:04:38Z","updated_at":"2015-01-01T01:04:38Z","closed_at":null,"merged_at":null,"merge_commit_sha":null,"assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/isaacg1/pyth/pulls/11/commits","review_comments_url":"https://api.github.com/repos/isaacg1/pyth/pulls/11/comments","review_comment_url":"https://api.github.com/repos/isaacg1/pyth/pulls/comments/{number}","comments_url":"https://api.github.com/repos/isaacg1/pyth/issues/11/comments","statuses_url":"https://api.github.com/repos/isaacg1/pyth/statuses/8e2dd59a2966cb41ec28faf879d33fa5b6d2ad75","head":{"label":"Tyilo:patch-2","ref":"patch-2","sha":"8e2dd59a2966cb41ec28faf879d33fa5b6d2ad75","user":{"login":"Tyilo","id":568036,"avatar_url":"https://avatars.githubusercontent.com/u/568036?v=3","gravatar_id":"","url":"https://api.github.com/users/Tyilo","html_url":"https://github.com/Tyilo","followers_url":"https://api.github.com/users/Tyilo/followers","following_url":"https://api.github.com/users/Tyilo/following{/other_user}","gists_url":"https://api.github.com/users/Tyilo/gists{/gist_id}","starred_url":"https://api.github.com/users/Tyilo/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Tyilo/subscriptions","organizations_url":"https://api.github.com/users/Tyilo/orgs","repos_url":"https://api.github.com/users/Tyilo/repos","events_url":"https://api.github.com/users/Tyilo/events{/privacy}","received_events_url":"https://api.github.com/users/Tyilo/received_events","type":"User","site_admin":false},"repo":{"id":28676548,"name":"pyth","full_name":"Tyilo/pyth","owner":{"login":"Tyilo","id":568036,"avatar_url":"https://avatars.githubusercontent.com/u/568036?v=3","gravatar_id":"","url":"https://api.github.com/users/Tyilo","html_url":"https://github.com/Tyilo","followers_url":"https://api.github.com/users/Tyilo/followers","following_url":"https://api.github.com/users/Tyilo/following{/other_user}","gists_url":"https://api.github.com/users/Tyilo/gists{/gist_
id}","starred_url":"https://api.github.com/users/Tyilo/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Tyilo/subscriptions","organizations_url":"https://api.github.com/users/Tyilo/orgs","repos_url":"https://api.github.com/users/Tyilo/repos","events_url":"https://api.github.com/users/Tyilo/events{/privacy}","received_events_url":"https://api.github.com/users/Tyilo/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/Tyilo/pyth","description":"Pyth, an extremely concise language. Try it here:","fork":true,"url":"https://api.github.com/repos/Tyilo/pyth","forks_url":"https://api.github.com/repos/Tyilo/pyth/forks","keys_url":"https://api.github.com/repos/Tyilo/pyth/keys{/key_id}","collaborators_url":"https://api.github.com/repos/Tyilo/pyth/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/Tyilo/pyth/teams","hooks_url":"https://api.github.com/repos/Tyilo/pyth/hooks","issue_events_url":"https://api.github.com/repos/Tyilo/pyth/issues/events{/number}","events_url":"https://api.github.com/repos/Tyilo/pyth/events","assignees_url":"https://api.github.com/repos/Tyilo/pyth/assignees{/user}","branches_url":"https://api.github.com/repos/Tyilo/pyth/branches{/branch}","tags_url":"https://api.github.com/repos/Tyilo/pyth/tags","blobs_url":"https://api.github.com/repos/Tyilo/pyth/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/Tyilo/pyth/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/Tyilo/pyth/git/refs{/sha}","trees_url":"https://api.github.com/repos/Tyilo/pyth/git/trees{/sha}","statuses_url":"https://api.github.com/repos/Tyilo/pyth/statuses/{sha}","languages_url":"https://api.github.com/repos/Tyilo/pyth/languages","stargazers_url":"https://api.github.com/repos/Tyilo/pyth/stargazers","contributors_url":"https://api.github.com/repos/Tyilo/pyth/contributors","subscribers_url":"https://api.github.com/repos/Tyilo/pyth/subscribers","subscription_url":"https://api.github.c
om/repos/Tyilo/pyth/subscription","commits_url":"https://api.github.com/repos/Tyilo/pyth/commits{/sha}","git_commits_url":"https://api.github.com/repos/Tyilo/pyth/git/commits{/sha}","comments_url":"https://api.github.com/repos/Tyilo/pyth/comments{/number}","issue_comment_url":"https://api.github.com/repos/Tyilo/pyth/issues/comments/{number}","contents_url":"https://api.github.com/repos/Tyilo/pyth/contents/{+path}","compare_url":"https://api.github.com/repos/Tyilo/pyth/compare/{base}...{head}","merges_url":"https://api.github.com/repos/Tyilo/pyth/merges","archive_url":"https://api.github.com/repos/Tyilo/pyth/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/Tyilo/pyth/downloads","issues_url":"https://api.github.com/repos/Tyilo/pyth/issues{/number}","pulls_url":"https://api.github.com/repos/Tyilo/pyth/pulls{/number}","milestones_url":"https://api.github.com/repos/Tyilo/pyth/milestones{/number}","notifications_url":"https://api.github.com/repos/Tyilo/pyth/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/Tyilo/pyth/labels{/name}","releases_url":"https://api.github.com/repos/Tyilo/pyth/releases{/id}","created_at":"2014-12-31T22:38:59Z","updated_at":"2014-12-31T22:39:00Z","pushed_at":"2015-01-01T01:03:03Z","git_url":"git://github.com/Tyilo/pyth.git","ssh_url":"git@github.com:Tyilo/pyth.git","clone_url":"https://github.com/Tyilo/pyth.git","svn_url":"https://github.com/Tyilo/pyth","homepage":"http://isaacg.scripts.mit.edu/pyth/index.py","size":540,"stargazers_count":0,"watchers_count":0,"language":"Python","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"isaacg1:master","ref":"master","sha":"8dcc542711ab74a5454b34ac2d10fda566e4d465","user":{"login":"isaacg1","id":8034059,"avatar_url":"https://avatars.githubusercontent.com/u/8034059?v=3","gravatar_id":"","url
":"https://api.github.com/users/isaacg1","html_url":"https://github.com/isaacg1","followers_url":"https://api.github.com/users/isaacg1/followers","following_url":"https://api.github.com/users/isaacg1/following{/other_user}","gists_url":"https://api.github.com/users/isaacg1/gists{/gist_id}","starred_url":"https://api.github.com/users/isaacg1/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/isaacg1/subscriptions","organizations_url":"https://api.github.com/users/isaacg1/orgs","repos_url":"https://api.github.com/users/isaacg1/repos","events_url":"https://api.github.com/users/isaacg1/events{/privacy}","received_events_url":"https://api.github.com/users/isaacg1/received_events","type":"User","site_admin":false},"repo":{"id":21377779,"name":"pyth","full_name":"isaacg1/pyth","owner":{"login":"isaacg1","id":8034059,"avatar_url":"https://avatars.githubusercontent.com/u/8034059?v=3","gravatar_id":"","url":"https://api.github.com/users/isaacg1","html_url":"https://github.com/isaacg1","followers_url":"https://api.github.com/users/isaacg1/followers","following_url":"https://api.github.com/users/isaacg1/following{/other_user}","gists_url":"https://api.github.com/users/isaacg1/gists{/gist_id}","starred_url":"https://api.github.com/users/isaacg1/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/isaacg1/subscriptions","organizations_url":"https://api.github.com/users/isaacg1/orgs","repos_url":"https://api.github.com/users/isaacg1/repos","events_url":"https://api.github.com/users/isaacg1/events{/privacy}","received_events_url":"https://api.github.com/users/isaacg1/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/isaacg1/pyth","description":"Pyth, an extremely concise language. 
Try it here:","fork":false,"url":"https://api.github.com/repos/isaacg1/pyth","forks_url":"https://api.github.com/repos/isaacg1/pyth/forks","keys_url":"https://api.github.com/repos/isaacg1/pyth/keys{/key_id}","collaborators_url":"https://api.github.com/repos/isaacg1/pyth/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/isaacg1/pyth/teams","hooks_url":"https://api.github.com/repos/isaacg1/pyth/hooks","issue_events_url":"https://api.github.com/repos/isaacg1/pyth/issues/events{/number}","events_url":"https://api.github.com/repos/isaacg1/pyth/events","assignees_url":"https://api.github.com/repos/isaacg1/pyth/assignees{/user}","branches_url":"https://api.github.com/repos/isaacg1/pyth/branches{/branch}","tags_url":"https://api.github.com/repos/isaacg1/pyth/tags","blobs_url":"https://api.github.com/repos/isaacg1/pyth/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/isaacg1/pyth/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/isaacg1/pyth/git/refs{/sha}","trees_url":"https://api.github.com/repos/isaacg1/pyth/git/trees{/sha}","statuses_url":"https://api.github.com/repos/isaacg1/pyth/statuses/{sha}","languages_url":"https://api.github.com/repos/isaacg1/pyth/languages","stargazers_url":"https://api.github.com/repos/isaacg1/pyth/stargazers","contributors_url":"https://api.github.com/repos/isaacg1/pyth/contributors","subscribers_url":"https://api.github.com/repos/isaacg1/pyth/subscribers","subscription_url":"https://api.github.com/repos/isaacg1/pyth/subscription","commits_url":"https://api.github.com/repos/isaacg1/pyth/commits{/sha}","git_commits_url":"https://api.github.com/repos/isaacg1/pyth/git/commits{/sha}","comments_url":"https://api.github.com/repos/isaacg1/pyth/comments{/number}","issue_comment_url":"https://api.github.com/repos/isaacg1/pyth/issues/comments/{number}","contents_url":"https://api.github.com/repos/isaacg1/pyth/contents/{+path}","compare_url":"https://api.github.com/repos/isaacg1/pyth/compare/{base}...{head}","
merges_url":"https://api.github.com/repos/isaacg1/pyth/merges","archive_url":"https://api.github.com/repos/isaacg1/pyth/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/isaacg1/pyth/downloads","issues_url":"https://api.github.com/repos/isaacg1/pyth/issues{/number}","pulls_url":"https://api.github.com/repos/isaacg1/pyth/pulls{/number}","milestones_url":"https://api.github.com/repos/isaacg1/pyth/milestones{/number}","notifications_url":"https://api.github.com/repos/isaacg1/pyth/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/isaacg1/pyth/labels{/name}","releases_url":"https://api.github.com/repos/isaacg1/pyth/releases{/id}","created_at":"2014-07-01T06:44:21Z","updated_at":"2015-01-01T00:39:57Z","pushed_at":"2015-01-01T00:39:56Z","git_url":"git://github.com/isaacg1/pyth.git","ssh_url":"git@github.com:isaacg1/pyth.git","clone_url":"https://github.com/isaacg1/pyth.git","svn_url":"https://github.com/isaacg1/pyth","homepage":"https://pyth.herokuapp.com/","size":540,"stargazers_count":22,"watchers_count":22,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":2,"mirror_url":null,"open_issues_count":1,"forks":2,"open_issues":1,"watchers":22,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/isaacg1/pyth/pulls/11"},"html":{"href":"https://github.com/isaacg1/pyth/pull/11"},"issue":{"href":"https://api.github.com/repos/isaacg1/pyth/issues/11"},"comments":{"href":"https://api.github.com/repos/isaacg1/pyth/issues/11/comments"},"review_comments":{"href":"https://api.github.com/repos/isaacg1/pyth/pulls/11/comments"},"review_comment":{"href":"https://api.github.com/repos/isaacg1/pyth/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/isaacg1/pyth/pulls/11/commits"},"statuses":{"href":"https://api.github.com/repos/isaacg1/pyth/statuses/8e2dd59a2966cb41ec28faf879d33fa5b6d2ad75"}},"merged":false,"mergeable":null,"mergeable
_state":"unknown","merged_by":null,"comments":0,"review_comments":0,"commits":1,"additions":36,"deletions":36,"changed_files":3}},"public":true,"created_at":"2015-01-01T01:04:38Z"}
{"id":"2489397867","type":"CreateEvent","actor":{"id":3267533,"login":"brentpicasso","gravatar_id":"","url":"https://api.github.com/users/brentpicasso","avatar_url":"https://avatars.githubusercontent.com/u/3267533?"},"repo":{"id":28678261,"name":"autosportlabs/TempX","url":"https://api.github.com/repos/autosportlabs/TempX"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"TempX is a temperature sensor breakout board for the TMP36 active temperature sensor","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:04:39Z","org":{"id":1274125,"login":"autosportlabs","gravatar_id":"","url":"https://api.github.com/orgs/autosportlabs","avatar_url":"https://avatars.githubusercontent.com/u/1274125?"}}
{"id":"2489397873","type":"ForkEvent","actor":{"id":1671640,"login":"alex6lc","gravatar_id":"","url":"https://api.github.com/users/alex6lc","avatar_url":"https://avatars.githubusercontent.com/u/1671640?"},"repo":{"id":27458466,"name":"gpbl/material-ui-sass","url":"https://api.github.com/repos/gpbl/material-ui-sass"},"payload":{"forkee":{"id":28678262,"name":"material-ui-sass","full_name":"alex6lc/material-ui-sass","owner":{"login":"alex6lc","id":1671640,"avatar_url":"https://avatars.githubusercontent.com/u/1671640?v=3","gravatar_id":"","url":"https://api.github.com/users/alex6lc","html_url":"https://github.com/alex6lc","followers_url":"https://api.github.com/users/alex6lc/followers","following_url":"https://api.github.com/users/alex6lc/following{/other_user}","gists_url":"https://api.github.com/users/alex6lc/gists{/gist_id}","starred_url":"https://api.github.com/users/alex6lc/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/alex6lc/subscriptions","organizations_url":"https://api.github.com/users/alex6lc/orgs","repos_url":"https://api.github.com/users/alex6lc/repos","events_url":"https://api.github.com/users/alex6lc/events{/privacy}","received_events_url":"https://api.github.com/users/alex6lc/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/alex6lc/material-ui-sass","description":"The Sass counterpart of the material-ui framework for 
React","fork":true,"url":"https://api.github.com/repos/alex6lc/material-ui-sass","forks_url":"https://api.github.com/repos/alex6lc/material-ui-sass/forks","keys_url":"https://api.github.com/repos/alex6lc/material-ui-sass/keys{/key_id}","collaborators_url":"https://api.github.com/repos/alex6lc/material-ui-sass/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/alex6lc/material-ui-sass/teams","hooks_url":"https://api.github.com/repos/alex6lc/material-ui-sass/hooks","issue_events_url":"https://api.github.com/repos/alex6lc/material-ui-sass/issues/events{/number}","events_url":"https://api.github.com/repos/alex6lc/material-ui-sass/events","assignees_url":"https://api.github.com/repos/alex6lc/material-ui-sass/assignees{/user}","branches_url":"https://api.github.com/repos/alex6lc/material-ui-sass/branches{/branch}","tags_url":"https://api.github.com/repos/alex6lc/material-ui-sass/tags","blobs_url":"https://api.github.com/repos/alex6lc/material-ui-sass/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/alex6lc/material-ui-sass/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/alex6lc/material-ui-sass/git/refs{/sha}","trees_url":"https://api.github.com/repos/alex6lc/material-ui-sass/git/trees{/sha}","statuses_url":"https://api.github.com/repos/alex6lc/material-ui-sass/statuses/{sha}","languages_url":"https://api.github.com/repos/alex6lc/material-ui-sass/languages","stargazers_url":"https://api.github.com/repos/alex6lc/material-ui-sass/stargazers","contributors_url":"https://api.github.com/repos/alex6lc/material-ui-sass/contributors","subscribers_url":"https://api.github.com/repos/alex6lc/material-ui-sass/subscribers","subscription_url":"https://api.github.com/repos/alex6lc/material-ui-sass/subscription","commits_url":"https://api.github.com/repos/alex6lc/material-ui-sass/commits{/sha}","git_commits_url":"https://api.github.com/repos/alex6lc/material-ui-sass/git/commits{/sha}","comments_url":"https://api.github.com/repos/alex6lc/mate
rial-ui-sass/comments{/number}","issue_comment_url":"https://api.github.com/repos/alex6lc/material-ui-sass/issues/comments/{number}","contents_url":"https://api.github.com/repos/alex6lc/material-ui-sass/contents/{+path}","compare_url":"https://api.github.com/repos/alex6lc/material-ui-sass/compare/{base}...{head}","merges_url":"https://api.github.com/repos/alex6lc/material-ui-sass/merges","archive_url":"https://api.github.com/repos/alex6lc/material-ui-sass/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/alex6lc/material-ui-sass/downloads","issues_url":"https://api.github.com/repos/alex6lc/material-ui-sass/issues{/number}","pulls_url":"https://api.github.com/repos/alex6lc/material-ui-sass/pulls{/number}","milestones_url":"https://api.github.com/repos/alex6lc/material-ui-sass/milestones{/number}","notifications_url":"https://api.github.com/repos/alex6lc/material-ui-sass/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/alex6lc/material-ui-sass/labels{/name}","releases_url":"https://api.github.com/repos/alex6lc/material-ui-sass/releases{/id}","created_at":"2015-01-01T01:04:40Z","updated_at":"2014-12-30T20:38:38Z","pushed_at":"2014-12-27T16:36:27Z","git_url":"git://github.com/alex6lc/material-ui-sass.git","ssh_url":"git@github.com:alex6lc/material-ui-sass.git","clone_url":"https://github.com/alex6lc/material-ui-sass.git","svn_url":"https://github.com/alex6lc/material-ui-sass","homepage":"","size":2075,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:04:40Z"}
{"id":"2489397875","type":"PushEvent","actor":{"id":1422772,"login":"lighttroupe","gravatar_id":"","url":"https://api.github.com/users/lighttroupe","avatar_url":"https://avatars.githubusercontent.com/u/1422772?"},"repo":{"id":19626154,"name":"lighttroupe/luz-next","url":"https://api.github.com/repos/lighttroupe/luz-next"},"payload":{"push_id":536753128,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"3c99b61327454468c31f6c0db4045e73dc1bca01","before":"f1651f527ad2fa7edd1a3fbcd6a3ae16e38dec66","commits":[{"sha":"3c99b61327454468c31f6c0db4045e73dc1bca01","author":{"email":"57a33a5496950fec8433e4dd83347673459dcdfc@openanswers.org","name":"Ian McIntosh"},"message":"- add placeholder message bar background","distinct":true,"url":"https://api.github.com/repos/lighttroupe/luz-next/commits/3c99b61327454468c31f6c0db4045e73dc1bca01"}]},"public":true,"created_at":"2015-01-01T01:04:40Z"}
{"id":"2489397876","type":"PullRequestEvent","actor":{"id":1813305,"login":"Bart39","gravatar_id":"","url":"https://api.github.com/users/Bart39","avatar_url":"https://avatars.githubusercontent.com/u/1813305?"},"repo":{"id":9683876,"name":"nZEDb/nZEDb","url":"https://api.github.com/repos/nZEDb/nZEDb"},"payload":{"action":"closed","number":1573,"pull_request":{"url":"https://api.github.com/repos/nZEDb/nZEDb/pulls/1573","id":26736047,"html_url":"https://github.com/nZEDb/nZEDb/pull/1573","diff_url":"https://github.com/nZEDb/nZEDb/pull/1573.diff","patch_url":"https://github.com/nZEDb/nZEDb/pull/1573.patch","issue_url":"https://api.github.com/repos/nZEDb/nZEDb/issues/1573","number":1573,"state":"closed","locked":false,"title":"Changed trakt.tv imdb search to new format","user":{"login":"DariusIII","id":3399658,"avatar_url":"https://avatars.githubusercontent.com/u/3399658?v=3","gravatar_id":"","url":"https://api.github.com/users/DariusIII","html_url":"https://github.com/DariusIII","followers_url":"https://api.github.com/users/DariusIII/followers","following_url":"https://api.github.com/users/DariusIII/following{/other_user}","gists_url":"https://api.github.com/users/DariusIII/gists{/gist_id}","starred_url":"https://api.github.com/users/DariusIII/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/DariusIII/subscriptions","organizations_url":"https://api.github.com/users/DariusIII/orgs","repos_url":"https://api.github.com/users/DariusIII/repos","events_url":"https://api.github.com/users/DariusIII/events{/privacy}","received_events_url":"https://api.github.com/users/DariusIII/received_events","type":"User","site_admin":false},"body":"","created_at":"2014-12-31T21:28:06Z","updated_at":"2015-01-01T01:04:40Z","closed_at":"2015-01-01T01:04:40Z","merged_at":"2015-01-01T01:04:40Z","merge_commit_sha":"5cb2802b75980591233ac3f40676585c9a14af25","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/nZEDb/nZEDb/pulls/1573/commits","review_co
mments_url":"https://api.github.com/repos/nZEDb/nZEDb/pulls/1573/comments","review_comment_url":"https://api.github.com/repos/nZEDb/nZEDb/pulls/comments/{number}","comments_url":"https://api.github.com/repos/nZEDb/nZEDb/issues/1573/comments","statuses_url":"https://api.github.com/repos/nZEDb/nZEDb/statuses/b309b85c959a9fae595119a4aa6b02a129d368f9","head":{"label":"DariusIII:dev","ref":"dev","sha":"b309b85c959a9fae595119a4aa6b02a129d368f9","user":{"login":"DariusIII","id":3399658,"avatar_url":"https://avatars.githubusercontent.com/u/3399658?v=3","gravatar_id":"","url":"https://api.github.com/users/DariusIII","html_url":"https://github.com/DariusIII","followers_url":"https://api.github.com/users/DariusIII/followers","following_url":"https://api.github.com/users/DariusIII/following{/other_user}","gists_url":"https://api.github.com/users/DariusIII/gists{/gist_id}","starred_url":"https://api.github.com/users/DariusIII/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/DariusIII/subscriptions","organizations_url":"https://api.github.com/users/DariusIII/orgs","repos_url":"https://api.github.com/users/DariusIII/repos","events_url":"https://api.github.com/users/DariusIII/events{/privacy}","received_events_url":"https://api.github.com/users/DariusIII/received_events","type":"User","site_admin":false},"repo":{"id":21434059,"name":"nZEDb","full_name":"DariusIII/nZEDb","owner":{"login":"DariusIII","id":3399658,"avatar_url":"https://avatars.githubusercontent.com/u/3399658?v=3","gravatar_id":"","url":"https://api.github.com/users/DariusIII","html_url":"https://github.com/DariusIII","followers_url":"https://api.github.com/users/DariusIII/followers","following_url":"https://api.github.com/users/DariusIII/following{/other_user}","gists_url":"https://api.github.com/users/DariusIII/gists{/gist_id}","starred_url":"https://api.github.com/users/DariusIII/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/DariusIII/subscriptions","organizations
_url":"https://api.github.com/users/DariusIII/orgs","repos_url":"https://api.github.com/users/DariusIII/repos","events_url":"https://api.github.com/users/DariusIII/events{/privacy}","received_events_url":"https://api.github.com/users/DariusIII/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/DariusIII/nZEDb","description":"nZEDb - a fork of nnplus(2011) | NNTP / Usenet / Newsgroup indexer.","fork":true,"url":"https://api.github.com/repos/DariusIII/nZEDb","forks_url":"https://api.github.com/repos/DariusIII/nZEDb/forks","keys_url":"https://api.github.com/repos/DariusIII/nZEDb/keys{/key_id}","collaborators_url":"https://api.github.com/repos/DariusIII/nZEDb/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/DariusIII/nZEDb/teams","hooks_url":"https://api.github.com/repos/DariusIII/nZEDb/hooks","issue_events_url":"https://api.github.com/repos/DariusIII/nZEDb/issues/events{/number}","events_url":"https://api.github.com/repos/DariusIII/nZEDb/events","assignees_url":"https://api.github.com/repos/DariusIII/nZEDb/assignees{/user}","branches_url":"https://api.github.com/repos/DariusIII/nZEDb/branches{/branch}","tags_url":"https://api.github.com/repos/DariusIII/nZEDb/tags","blobs_url":"https://api.github.com/repos/DariusIII/nZEDb/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/DariusIII/nZEDb/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/DariusIII/nZEDb/git/refs{/sha}","trees_url":"https://api.github.com/repos/DariusIII/nZEDb/git/trees{/sha}","statuses_url":"https://api.github.com/repos/DariusIII/nZEDb/statuses/{sha}","languages_url":"https://api.github.com/repos/DariusIII/nZEDb/languages","stargazers_url":"https://api.github.com/repos/DariusIII/nZEDb/stargazers","contributors_url":"https://api.github.com/repos/DariusIII/nZEDb/contributors","subscribers_url":"https://api.github.com/repos/DariusIII/nZEDb/subscribers","subscription_url":"https://api.github.com/repos/DariusIII/nZEDb/
subscription","commits_url":"https://api.github.com/repos/DariusIII/nZEDb/commits{/sha}","git_commits_url":"https://api.github.com/repos/DariusIII/nZEDb/git/commits{/sha}","comments_url":"https://api.github.com/repos/DariusIII/nZEDb/comments{/number}","issue_comment_url":"https://api.github.com/repos/DariusIII/nZEDb/issues/comments/{number}","contents_url":"https://api.github.com/repos/DariusIII/nZEDb/contents/{+path}","compare_url":"https://api.github.com/repos/DariusIII/nZEDb/compare/{base}...{head}","merges_url":"https://api.github.com/repos/DariusIII/nZEDb/merges","archive_url":"https://api.github.com/repos/DariusIII/nZEDb/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/DariusIII/nZEDb/downloads","issues_url":"https://api.github.com/repos/DariusIII/nZEDb/issues{/number}","pulls_url":"https://api.github.com/repos/DariusIII/nZEDb/pulls{/number}","milestones_url":"https://api.github.com/repos/DariusIII/nZEDb/milestones{/number}","notifications_url":"https://api.github.com/repos/DariusIII/nZEDb/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/DariusIII/nZEDb/labels{/name}","releases_url":"https://api.github.com/repos/DariusIII/nZEDb/releases{/id}","created_at":"2014-07-02T17:46:47Z","updated_at":"2014-12-30T10:21:52Z","pushed_at":"2014-12-31T21:26:54Z","git_url":"git://github.com/DariusIII/nZEDb.git","ssh_url":"git@github.com:DariusIII/nZEDb.git","clone_url":"https://github.com/DariusIII/nZEDb.git","svn_url":"https://github.com/DariusIII/nZEDb","homepage":"http://forums.nzedb.com","size":53328,"stargazers_count":0,"watchers_count":0,"language":"PHP","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"nZEDb:dev","ref":"dev","sha":"1ec7a576cfae11fdcdbe929cf9053e73dda2c43d","user":{"login":"nZEDb","id":4260270,"avatar_url":"https://avatars.githubusercont
ent.com/u/4260270?v=3","gravatar_id":"","url":"https://api.github.com/users/nZEDb","html_url":"https://github.com/nZEDb","followers_url":"https://api.github.com/users/nZEDb/followers","following_url":"https://api.github.com/users/nZEDb/following{/other_user}","gists_url":"https://api.github.com/users/nZEDb/gists{/gist_id}","starred_url":"https://api.github.com/users/nZEDb/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/nZEDb/subscriptions","organizations_url":"https://api.github.com/users/nZEDb/orgs","repos_url":"https://api.github.com/users/nZEDb/repos","events_url":"https://api.github.com/users/nZEDb/events{/privacy}","received_events_url":"https://api.github.com/users/nZEDb/received_events","type":"Organization","site_admin":false},"repo":{"id":9683876,"name":"nZEDb","full_name":"nZEDb/nZEDb","owner":{"login":"nZEDb","id":4260270,"avatar_url":"https://avatars.githubusercontent.com/u/4260270?v=3","gravatar_id":"","url":"https://api.github.com/users/nZEDb","html_url":"https://github.com/nZEDb","followers_url":"https://api.github.com/users/nZEDb/followers","following_url":"https://api.github.com/users/nZEDb/following{/other_user}","gists_url":"https://api.github.com/users/nZEDb/gists{/gist_id}","starred_url":"https://api.github.com/users/nZEDb/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/nZEDb/subscriptions","organizations_url":"https://api.github.com/users/nZEDb/orgs","repos_url":"https://api.github.com/users/nZEDb/repos","events_url":"https://api.github.com/users/nZEDb/events{/privacy}","received_events_url":"https://api.github.com/users/nZEDb/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/nZEDb/nZEDb","description":"nZEDb - a fork of nnplus(2011) | NNTP / Usenet / Newsgroup 
indexer.","fork":false,"url":"https://api.github.com/repos/nZEDb/nZEDb","forks_url":"https://api.github.com/repos/nZEDb/nZEDb/forks","keys_url":"https://api.github.com/repos/nZEDb/nZEDb/keys{/key_id}","collaborators_url":"https://api.github.com/repos/nZEDb/nZEDb/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/nZEDb/nZEDb/teams","hooks_url":"https://api.github.com/repos/nZEDb/nZEDb/hooks","issue_events_url":"https://api.github.com/repos/nZEDb/nZEDb/issues/events{/number}","events_url":"https://api.github.com/repos/nZEDb/nZEDb/events","assignees_url":"https://api.github.com/repos/nZEDb/nZEDb/assignees{/user}","branches_url":"https://api.github.com/repos/nZEDb/nZEDb/branches{/branch}","tags_url":"https://api.github.com/repos/nZEDb/nZEDb/tags","blobs_url":"https://api.github.com/repos/nZEDb/nZEDb/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/nZEDb/nZEDb/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/nZEDb/nZEDb/git/refs{/sha}","trees_url":"https://api.github.com/repos/nZEDb/nZEDb/git/trees{/sha}","statuses_url":"https://api.github.com/repos/nZEDb/nZEDb/statuses/{sha}","languages_url":"https://api.github.com/repos/nZEDb/nZEDb/languages","stargazers_url":"https://api.github.com/repos/nZEDb/nZEDb/stargazers","contributors_url":"https://api.github.com/repos/nZEDb/nZEDb/contributors","subscribers_url":"https://api.github.com/repos/nZEDb/nZEDb/subscribers","subscription_url":"https://api.github.com/repos/nZEDb/nZEDb/subscription","commits_url":"https://api.github.com/repos/nZEDb/nZEDb/commits{/sha}","git_commits_url":"https://api.github.com/repos/nZEDb/nZEDb/git/commits{/sha}","comments_url":"https://api.github.com/repos/nZEDb/nZEDb/comments{/number}","issue_comment_url":"https://api.github.com/repos/nZEDb/nZEDb/issues/comments/{number}","contents_url":"https://api.github.com/repos/nZEDb/nZEDb/contents/{+path}","compare_url":"https://api.github.com/repos/nZEDb/nZEDb/compare/{base}...{head}","merges_url":"https://api.github
.com/repos/nZEDb/nZEDb/merges","archive_url":"https://api.github.com/repos/nZEDb/nZEDb/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/nZEDb/nZEDb/downloads","issues_url":"https://api.github.com/repos/nZEDb/nZEDb/issues{/number}","pulls_url":"https://api.github.com/repos/nZEDb/nZEDb/pulls{/number}","milestones_url":"https://api.github.com/repos/nZEDb/nZEDb/milestones{/number}","notifications_url":"https://api.github.com/repos/nZEDb/nZEDb/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/nZEDb/nZEDb/labels{/name}","releases_url":"https://api.github.com/repos/nZEDb/nZEDb/releases{/id}","created_at":"2013-04-25T23:45:28Z","updated_at":"2014-12-31T06:19:27Z","pushed_at":"2015-01-01T01:04:40Z","git_url":"git://github.com/nZEDb/nZEDb.git","ssh_url":"git@github.com:nZEDb/nZEDb.git","clone_url":"https://github.com/nZEDb/nZEDb.git","svn_url":"https://github.com/nZEDb/nZEDb","homepage":"http://forums.nzedb.com","size":77901,"stargazers_count":189,"watchers_count":189,"language":"PHP","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":102,"mirror_url":null,"open_issues_count":30,"forks":102,"open_issues":30,"watchers":189,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/nZEDb/nZEDb/pulls/1573"},"html":{"href":"https://github.com/nZEDb/nZEDb/pull/1573"},"issue":{"href":"https://api.github.com/repos/nZEDb/nZEDb/issues/1573"},"comments":{"href":"https://api.github.com/repos/nZEDb/nZEDb/issues/1573/comments"},"review_comments":{"href":"https://api.github.com/repos/nZEDb/nZEDb/pulls/1573/comments"},"review_comment":{"href":"https://api.github.com/repos/nZEDb/nZEDb/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/nZEDb/nZEDb/pulls/1573/commits"},"statuses":{"href":"https://api.github.com/repos/nZEDb/nZEDb/statuses/b309b85c959a9fae595119a4aa6b02a129d368f9"}},"merged":true,"mergeable":null,"mergeable_state":"unknown","merged_by":{"login
":"Bart39","id":1813305,"avatar_url":"https://avatars.githubusercontent.com/u/1813305?v=3","gravatar_id":"","url":"https://api.github.com/users/Bart39","html_url":"https://github.com/Bart39","followers_url":"https://api.github.com/users/Bart39/followers","following_url":"https://api.github.com/users/Bart39/following{/other_user}","gists_url":"https://api.github.com/users/Bart39/gists{/gist_id}","starred_url":"https://api.github.com/users/Bart39/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Bart39/subscriptions","organizations_url":"https://api.github.com/users/Bart39/orgs","repos_url":"https://api.github.com/users/Bart39/repos","events_url":"https://api.github.com/users/Bart39/events{/privacy}","received_events_url":"https://api.github.com/users/Bart39/received_events","type":"User","site_admin":false},"comments":0,"review_comments":0,"commits":40,"additions":7,"deletions":7,"changed_files":7}},"public":true,"created_at":"2015-01-01T01:04:40Z","org":{"id":4260270,"login":"nZEDb","gravatar_id":"","url":"https://api.github.com/orgs/nZEDb","avatar_url":"https://avatars.githubusercontent.com/u/4260270?"}}
{"id":"2489397878","type":"PushEvent","actor":{"id":42681,"login":"walnotes","gravatar_id":"","url":"https://api.github.com/users/walnotes","avatar_url":"https://avatars.githubusercontent.com/u/42681?"},"repo":{"id":22087319,"name":"walnotes/ngo360","url":"https://api.github.com/repos/walnotes/ngo360"},"payload":{"push_id":536753130,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"0e762d5e66602e8fc7f5d3639f65f3e0bad26134","before":"0a7af8c18ab72bf805d9c94d4483512765220a95","commits":[{"sha":"0e762d5e66602e8fc7f5d3639f65f3e0bad26134","author":{"email":"5d8024bfa9e39eb0b6834fe5420b9e92861b675c@yahoo.com","name":"Walter"},"message":"Added audio and video to controller, model and views","distinct":true,"url":"https://api.github.com/repos/walnotes/ngo360/commits/0e762d5e66602e8fc7f5d3639f65f3e0bad26134"}]},"public":true,"created_at":"2015-01-01T01:04:41Z"}
{"id":"2489397883","type":"PushEvent","actor":{"id":1813305,"login":"Bart39","gravatar_id":"","url":"https://api.github.com/users/Bart39","avatar_url":"https://avatars.githubusercontent.com/u/1813305?"},"repo":{"id":9683876,"name":"nZEDb/nZEDb","url":"https://api.github.com/repos/nZEDb/nZEDb"},"payload":{"push_id":536753131,"size":42,"distinct_size":42,"ref":"refs/heads/dev","head":"cfda73aed869f40b3e19a4345dda9c4d65f27937","before":"1ec7a576cfae11fdcdbe929cf9053e73dda2c43d","commits":[{"sha":"7d042c6422274c6ffb3e3869e107c053fd55553c","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #176 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/7d042c6422274c6ffb3e3869e107c053fd55553c"},{"sha":"fc1f764e87b4cd471e946aa782cb1c8f5e141fc4","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #177 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/fc1f764e87b4cd471e946aa782cb1c8f5e141fc4"},{"sha":"47d118f8112bcc0152430080dabfefcaf7913b80","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #179 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/47d118f8112bcc0152430080dabfefcaf7913b80"},{"sha":"54abdf31cd2795f28c3ae7eb583c8bff89299110","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #180 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/54abdf31cd2795f28c3ae7eb583c8bff89299110"},{"sha":"b1a90beb996cc6151d4d33636e75d4858b32ddde","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #181 from 
nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/b1a90beb996cc6151d4d33636e75d4858b32ddde"},{"sha":"080ff5e1da53af3f3bf1cdbf04326d5bf90479b4","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #182 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/080ff5e1da53af3f3bf1cdbf04326d5bf90479b4"},{"sha":"034f6b6b0d1731ccf5c36c1f382c2bed5c7b48d4","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #183 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/034f6b6b0d1731ccf5c36c1f382c2bed5c7b48d4"},{"sha":"c50d536090b7fdcf766ac1efead18ec9cdc4370a","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #185 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/c50d536090b7fdcf766ac1efead18ec9cdc4370a"},{"sha":"c255c8dd11150ecdfaedf44a9880b268ee4661cc","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #186 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/c255c8dd11150ecdfaedf44a9880b268ee4661cc"},{"sha":"c19f38122706de1739b40a84b1b946a40213b47c","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #187 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/c19f38122706de1739b40a84b1b946a40213b47c"},{"sha":"a472784834e7720c420c3d0e0b3f491b3b99c1f4","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #189 from 
nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/a472784834e7720c420c3d0e0b3f491b3b99c1f4"},{"sha":"e5b0feebd61f02bf79b987ab95d79362862484fe","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #190 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/e5b0feebd61f02bf79b987ab95d79362862484fe"},{"sha":"8798c62d19bd328232c4f574272344149781d015","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #192 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/8798c62d19bd328232c4f574272344149781d015"},{"sha":"52089bc28eab88d4769ef823c46e913274b0ef21","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #193 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/52089bc28eab88d4769ef823c46e913274b0ef21"},{"sha":"e594fe80e431f51e82349a7d15f5ae661597d770","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #194 from nZEDb/dev\n\nFix: Issue #1477 - MySQL Full-Text Search broken after implementation of...","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/e594fe80e431f51e82349a7d15f5ae661597d770"},{"sha":"6a0e8832337f45491503157c46ee33f5a6032306","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #195 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/6a0e8832337f45491503157c46ee33f5a6032306"},{"sha":"a064bb19dd13b1dab7a3f34bc7f3c870f514b387","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #196 from 
nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/a064bb19dd13b1dab7a3f34bc7f3c870f514b387"},{"sha":"559306637c70572e4c80c4b44495805f99b05f5b","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #198 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/559306637c70572e4c80c4b44495805f99b05f5b"},{"sha":"3ea408ad2181277a229cc5653078124b9be544d9","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #199 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/3ea408ad2181277a229cc5653078124b9be544d9"},{"sha":"82c22a2f1b9f14e21835036a947a7e20ed983702","author":{"email":"d905a83fce9ca7a3ba493d139e06a7bc091e7008@gmail.com","name":"DariusIII"},"message":"Merge pull request #200 from nZEDb/dev\n\nDev","distinct":true,"url":"https://api.github.com/repos/nZEDb/nZEDb/commits/82c22a2f1b9f14e21835036a947a7e20ed983702"}]},"public":true,"created_at":"2015-01-01T01:04:42Z","org":{"id":4260270,"login":"nZEDb","gravatar_id":"","url":"https://api.github.com/orgs/nZEDb","avatar_url":"https://avatars.githubusercontent.com/u/4260270?"}}
{"id":"2489397885","type":"IssueCommentEvent","actor":{"id":6964047,"login":"TTMTT","gravatar_id":"","url":"https://api.github.com/users/TTMTT","avatar_url":"https://avatars.githubusercontent.com/u/6964047?"},"repo":{"id":26192763,"name":"HarisDevs/iCl0udinSupport","url":"https://api.github.com/repos/HarisDevs/iCl0udinSupport"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/HarisDevs/iCl0udinSupport/issues/6","labels_url":"https://api.github.com/repos/HarisDevs/iCl0udinSupport/issues/6/labels{/name}","comments_url":"https://api.github.com/repos/HarisDevs/iCl0udinSupport/issues/6/comments","events_url":"https://api.github.com/repos/HarisDevs/iCl0udinSupport/issues/6/events","html_url":"https://github.com/HarisDevs/iCl0udinSupport/issues/6","id":48839033,"number":6,"title":"Discuss9 ","user":{"login":"HarisDevs","id":8019549,"avatar_url":"https://avatars.githubusercontent.com/u/8019549?v=3","gravatar_id":"","url":"https://api.github.com/users/HarisDevs","html_url":"https://github.com/HarisDevs","followers_url":"https://api.github.com/users/HarisDevs/followers","following_url":"https://api.github.com/users/HarisDevs/following{/other_user}","gists_url":"https://api.github.com/users/HarisDevs/gists{/gist_id}","starred_url":"https://api.github.com/users/HarisDevs/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/HarisDevs/subscriptions","organizations_url":"https://api.github.com/users/HarisDevs/orgs","repos_url":"https://api.github.com/users/HarisDevs/repos","events_url":"https://api.github.com/users/HarisDevs/events{/privacy}","received_events_url":"https://api.github.com/users/HarisDevs/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":424,"created_at":"2014-11-14T21:00:03Z","updated_at":"2015-01-01T01:04:42Z","closed_at":null,"body":"<pre>Originally written by Magd, @TTMTT. 
</pre>\r\nHi..\r\nI just open this discuss9 becose the old topic is full and slow for browser .. \r\n\r\n------------------------------------------------------------------------------------------------------------------------------\r\n\r\n\r\nWow, ipod touch 5G (8.1) - iCL0udin v1.0 bypass activation (icloud)\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/tZmEdlDGNu4\r\n--------------------------------------\r\n\r\n------------------------------------------------------------------------------------------------------------------------------\r\n\r\niCL0udin v1.0 bypass activation (icloud) - ipad mini 2G (7.1.1)\r\n------------------------------------------------------------------------------\r\nhttp://youtu.be/tevYyBN2QCQ\r\n------------------------------------\r\n\r\n------------------------------------------------------------------------------------------------------------------------------\r\n\r\nVideo for bypass icloud (iCL0udin v1.0) for iphone 4 CDMA ..\r\n------------------------------------------------------------------------------\r\nhttp://youtu.be/i85-D6N2YLk\r\n------------------------------------\r\n\r\n-------------------------------------------------------------------------------------------------------\r\n\r\nNew video for iCL0udin v1.0 bypass icloud (3 iphones 7.1.2):\r\n-----------------------------------------------------------------------------\r\nhttp://youtu.be/p51TNlCr7ug\r\n-----------------------------------------\r\n\r\niCL0udin v1.0 -> %97\r\n----------------------------\r\nRemaining: %3 testing with some people..\r\n-------------------------------------\r\n\r\nLast Method:\r\n---------------------\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any ios)\r\nmethod 3 : via (change some string by hex on ELF file << some times i got error)\r\nmethod 4 : via (use apple ssl cert or real ssl in server and 
change some string in iphone)\r\n\r\niCL0udin v1.0 have this method:\r\n-----------------------------------------\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any ios)"},"comment":{"url":"https://api.github.com/repos/HarisDevs/iCl0udinSupport/issues/comments/68477314","html_url":"https://github.com/HarisDevs/iCl0udinSupport/issues/6#issuecomment-68477314","issue_url":"https://api.github.com/repos/HarisDevs/iCl0udinSupport/issues/6","id":68477314,"user":{"login":"TTMTT","id":6964047,"avatar_url":"https://avatars.githubusercontent.com/u/6964047?v=3","gravatar_id":"","url":"https://api.github.com/users/TTMTT","html_url":"https://github.com/TTMTT","followers_url":"https://api.github.com/users/TTMTT/followers","following_url":"https://api.github.com/users/TTMTT/following{/other_user}","gists_url":"https://api.github.com/users/TTMTT/gists{/gist_id}","starred_url":"https://api.github.com/users/TTMTT/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/TTMTT/subscriptions","organizations_url":"https://api.github.com/users/TTMTT/orgs","repos_url":"https://api.github.com/users/TTMTT/repos","events_url":"https://api.github.com/users/TTMTT/events{/privacy}","received_events_url":"https://api.github.com/users/TTMTT/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:04:42Z","updated_at":"2015-01-01T01:04:42Z","body":"@HarisDevs \r\nexcuse me i open a new discuss for (iCL0udin v1.0):\r\n--------------------------------------------------------\r\nhttps://github.com/TTMTT/iCL0udin/issues/1\r\n--------------------------------------------------------"}},"public":true,"created_at":"2015-01-01T01:04:42Z"}
{"id":"2489397887","type":"WatchEvent","actor":{"id":103510,"login":"chengjunjian","gravatar_id":"","url":"https://api.github.com/users/chengjunjian","avatar_url":"https://avatars.githubusercontent.com/u/103510?"},"repo":{"id":22340661,"name":"kaimu/ionic-vs2013-intellisense","url":"https://api.github.com/repos/kaimu/ionic-vs2013-intellisense"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:04:43Z"}
{"id":"2489397892","type":"PullRequestEvent","actor":{"id":18191,"login":"jc00ke","gravatar_id":"","url":"https://api.github.com/users/jc00ke","avatar_url":"https://avatars.githubusercontent.com/u/18191?"},"repo":{"id":10488201,"name":"JeanMertz/chruby-fish","url":"https://api.github.com/repos/JeanMertz/chruby-fish"},"payload":{"action":"opened","number":15,"pull_request":{"url":"https://api.github.com/repos/JeanMertz/chruby-fish/pulls/15","id":26739450,"html_url":"https://github.com/JeanMertz/chruby-fish/pull/15","diff_url":"https://github.com/JeanMertz/chruby-fish/pull/15.diff","patch_url":"https://github.com/JeanMertz/chruby-fish/pull/15.patch","issue_url":"https://api.github.com/repos/JeanMertz/chruby-fish/issues/15","number":15,"state":"open","locked":false,"title":"Document known PATH warning","user":{"login":"jc00ke","id":18191,"avatar_url":"https://avatars.githubusercontent.com/u/18191?v=3","gravatar_id":"","url":"https://api.github.com/users/jc00ke","html_url":"https://github.com/jc00ke","followers_url":"https://api.github.com/users/jc00ke/followers","following_url":"https://api.github.com/users/jc00ke/following{/other_user}","gists_url":"https://api.github.com/users/jc00ke/gists{/gist_id}","starred_url":"https://api.github.com/users/jc00ke/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jc00ke/subscriptions","organizations_url":"https://api.github.com/users/jc00ke/orgs","repos_url":"https://api.github.com/users/jc00ke/repos","events_url":"https://api.github.com/users/jc00ke/events{/privacy}","received_events_url":"https://api.github.com/users/jc00ke/received_events","type":"User","site_admin":false},"body":"","created_at":"2015-01-01T01:04:45Z","updated_at":"2015-01-01T01:04:45Z","closed_at":null,"merged_at":null,"merge_commit_sha":null,"assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/JeanMertz/chruby-fish/pulls/15/commits","review_comments_url":"https://api.github.com/repos/JeanMertz/chruby-fish/pulls/
15/comments","review_comment_url":"https://api.github.com/repos/JeanMertz/chruby-fish/pulls/comments/{number}","comments_url":"https://api.github.com/repos/JeanMertz/chruby-fish/issues/15/comments","statuses_url":"https://api.github.com/repos/JeanMertz/chruby-fish/statuses/859d6a993456f190598eda5b2a188d96af984cf2","head":{"label":"jc00ke:master","ref":"master","sha":"859d6a993456f190598eda5b2a188d96af984cf2","user":{"login":"jc00ke","id":18191,"avatar_url":"https://avatars.githubusercontent.com/u/18191?v=3","gravatar_id":"","url":"https://api.github.com/users/jc00ke","html_url":"https://github.com/jc00ke","followers_url":"https://api.github.com/users/jc00ke/followers","following_url":"https://api.github.com/users/jc00ke/following{/other_user}","gists_url":"https://api.github.com/users/jc00ke/gists{/gist_id}","starred_url":"https://api.github.com/users/jc00ke/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jc00ke/subscriptions","organizations_url":"https://api.github.com/users/jc00ke/orgs","repos_url":"https://api.github.com/users/jc00ke/repos","events_url":"https://api.github.com/users/jc00ke/events{/privacy}","received_events_url":"https://api.github.com/users/jc00ke/received_events","type":"User","site_admin":false},"repo":{"id":28678223,"name":"chruby-fish","full_name":"jc00ke/chruby-fish","owner":{"login":"jc00ke","id":18191,"avatar_url":"https://avatars.githubusercontent.com/u/18191?v=3","gravatar_id":"","url":"https://api.github.com/users/jc00ke","html_url":"https://github.com/jc00ke","followers_url":"https://api.github.com/users/jc00ke/followers","following_url":"https://api.github.com/users/jc00ke/following{/other_user}","gists_url":"https://api.github.com/users/jc00ke/gists{/gist_id}","starred_url":"https://api.github.com/users/jc00ke/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jc00ke/subscriptions","organizations_url":"https://api.github.com/users/jc00ke/orgs","repos_url":"https://api.github.com/users
/jc00ke/repos","events_url":"https://api.github.com/users/jc00ke/events{/privacy}","received_events_url":"https://api.github.com/users/jc00ke/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/jc00ke/chruby-fish","description":"Thin wrapper around chruby to make it work with the Fish shell","fork":true,"url":"https://api.github.com/repos/jc00ke/chruby-fish","forks_url":"https://api.github.com/repos/jc00ke/chruby-fish/forks","keys_url":"https://api.github.com/repos/jc00ke/chruby-fish/keys{/key_id}","collaborators_url":"https://api.github.com/repos/jc00ke/chruby-fish/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/jc00ke/chruby-fish/teams","hooks_url":"https://api.github.com/repos/jc00ke/chruby-fish/hooks","issue_events_url":"https://api.github.com/repos/jc00ke/chruby-fish/issues/events{/number}","events_url":"https://api.github.com/repos/jc00ke/chruby-fish/events","assignees_url":"https://api.github.com/repos/jc00ke/chruby-fish/assignees{/user}","branches_url":"https://api.github.com/repos/jc00ke/chruby-fish/branches{/branch}","tags_url":"https://api.github.com/repos/jc00ke/chruby-fish/tags","blobs_url":"https://api.github.com/repos/jc00ke/chruby-fish/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/jc00ke/chruby-fish/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/jc00ke/chruby-fish/git/refs{/sha}","trees_url":"https://api.github.com/repos/jc00ke/chruby-fish/git/trees{/sha}","statuses_url":"https://api.github.com/repos/jc00ke/chruby-fish/statuses/{sha}","languages_url":"https://api.github.com/repos/jc00ke/chruby-fish/languages","stargazers_url":"https://api.github.com/repos/jc00ke/chruby-fish/stargazers","contributors_url":"https://api.github.com/repos/jc00ke/chruby-fish/contributors","subscribers_url":"https://api.github.com/repos/jc00ke/chruby-fish/subscribers","subscription_url":"https://api.github.com/repos/jc00ke/chruby-fish/subscription","commits_url":"https://api.
github.com/repos/jc00ke/chruby-fish/commits{/sha}","git_commits_url":"https://api.github.com/repos/jc00ke/chruby-fish/git/commits{/sha}","comments_url":"https://api.github.com/repos/jc00ke/chruby-fish/comments{/number}","issue_comment_url":"https://api.github.com/repos/jc00ke/chruby-fish/issues/comments/{number}","contents_url":"https://api.github.com/repos/jc00ke/chruby-fish/contents/{+path}","compare_url":"https://api.github.com/repos/jc00ke/chruby-fish/compare/{base}...{head}","merges_url":"https://api.github.com/repos/jc00ke/chruby-fish/merges","archive_url":"https://api.github.com/repos/jc00ke/chruby-fish/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/jc00ke/chruby-fish/downloads","issues_url":"https://api.github.com/repos/jc00ke/chruby-fish/issues{/number}","pulls_url":"https://api.github.com/repos/jc00ke/chruby-fish/pulls{/number}","milestones_url":"https://api.github.com/repos/jc00ke/chruby-fish/milestones{/number}","notifications_url":"https://api.github.com/repos/jc00ke/chruby-fish/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/jc00ke/chruby-fish/labels{/name}","releases_url":"https://api.github.com/repos/jc00ke/chruby-fish/releases{/id}","created_at":"2015-01-01T01:00:59Z","updated_at":"2015-01-01T01:04:34Z","pushed_at":"2015-01-01T01:04:34Z","git_url":"git://github.com/jc00ke/chruby-fish.git","ssh_url":"git@github.com:jc00ke/chruby-fish.git","clone_url":"https://github.com/jc00ke/chruby-fish.git","svn_url":"https://github.com/jc00ke/chruby-fish","homepage":"","size":1047,"stargazers_count":0,"watchers_count":0,"language":"Shell","has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"JeanMertz:master","ref":"master","sha":"e8f28035e7570cbf90568e7dd087810ae7958c8d","user":{"login":"JeanMertz","id":383250,"avatar_url":"https://avatars.github
usercontent.com/u/383250?v=3","gravatar_id":"","url":"https://api.github.com/users/JeanMertz","html_url":"https://github.com/JeanMertz","followers_url":"https://api.github.com/users/JeanMertz/followers","following_url":"https://api.github.com/users/JeanMertz/following{/other_user}","gists_url":"https://api.github.com/users/JeanMertz/gists{/gist_id}","starred_url":"https://api.github.com/users/JeanMertz/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JeanMertz/subscriptions","organizations_url":"https://api.github.com/users/JeanMertz/orgs","repos_url":"https://api.github.com/users/JeanMertz/repos","events_url":"https://api.github.com/users/JeanMertz/events{/privacy}","received_events_url":"https://api.github.com/users/JeanMertz/received_events","type":"User","site_admin":false},"repo":{"id":10488201,"name":"chruby-fish","full_name":"JeanMertz/chruby-fish","owner":{"login":"JeanMertz","id":383250,"avatar_url":"https://avatars.githubusercontent.com/u/383250?v=3","gravatar_id":"","url":"https://api.github.com/users/JeanMertz","html_url":"https://github.com/JeanMertz","followers_url":"https://api.github.com/users/JeanMertz/followers","following_url":"https://api.github.com/users/JeanMertz/following{/other_user}","gists_url":"https://api.github.com/users/JeanMertz/gists{/gist_id}","starred_url":"https://api.github.com/users/JeanMertz/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JeanMertz/subscriptions","organizations_url":"https://api.github.com/users/JeanMertz/orgs","repos_url":"https://api.github.com/users/JeanMertz/repos","events_url":"https://api.github.com/users/JeanMertz/events{/privacy}","received_events_url":"https://api.github.com/users/JeanMertz/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/JeanMertz/chruby-fish","description":"Thin wrapper around chruby to make it work with the Fish 
shell","fork":false,"url":"https://api.github.com/repos/JeanMertz/chruby-fish","forks_url":"https://api.github.com/repos/JeanMertz/chruby-fish/forks","keys_url":"https://api.github.com/repos/JeanMertz/chruby-fish/keys{/key_id}","collaborators_url":"https://api.github.com/repos/JeanMertz/chruby-fish/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/JeanMertz/chruby-fish/teams","hooks_url":"https://api.github.com/repos/JeanMertz/chruby-fish/hooks","issue_events_url":"https://api.github.com/repos/JeanMertz/chruby-fish/issues/events{/number}","events_url":"https://api.github.com/repos/JeanMertz/chruby-fish/events","assignees_url":"https://api.github.com/repos/JeanMertz/chruby-fish/assignees{/user}","branches_url":"https://api.github.com/repos/JeanMertz/chruby-fish/branches{/branch}","tags_url":"https://api.github.com/repos/JeanMertz/chruby-fish/tags","blobs_url":"https://api.github.com/repos/JeanMertz/chruby-fish/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/JeanMertz/chruby-fish/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/JeanMertz/chruby-fish/git/refs{/sha}","trees_url":"https://api.github.com/repos/JeanMertz/chruby-fish/git/trees{/sha}","statuses_url":"https://api.github.com/repos/JeanMertz/chruby-fish/statuses/{sha}","languages_url":"https://api.github.com/repos/JeanMertz/chruby-fish/languages","stargazers_url":"https://api.github.com/repos/JeanMertz/chruby-fish/stargazers","contributors_url":"https://api.github.com/repos/JeanMertz/chruby-fish/contributors","subscribers_url":"https://api.github.com/repos/JeanMertz/chruby-fish/subscribers","subscription_url":"https://api.github.com/repos/JeanMertz/chruby-fish/subscription","commits_url":"https://api.github.com/repos/JeanMertz/chruby-fish/commits{/sha}","git_commits_url":"https://api.github.com/repos/JeanMertz/chruby-fish/git/commits{/sha}","comments_url":"https://api.github.com/repos/JeanMertz/chruby-fish/comments{/number}","issue_comment_url":"https://api.github
.com/repos/JeanMertz/chruby-fish/issues/comments/{number}","contents_url":"https://api.github.com/repos/JeanMertz/chruby-fish/contents/{+path}","compare_url":"https://api.github.com/repos/JeanMertz/chruby-fish/compare/{base}...{head}","merges_url":"https://api.github.com/repos/JeanMertz/chruby-fish/merges","archive_url":"https://api.github.com/repos/JeanMertz/chruby-fish/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/JeanMertz/chruby-fish/downloads","issues_url":"https://api.github.com/repos/JeanMertz/chruby-fish/issues{/number}","pulls_url":"https://api.github.com/repos/JeanMertz/chruby-fish/pulls{/number}","milestones_url":"https://api.github.com/repos/JeanMertz/chruby-fish/milestones{/number}","notifications_url":"https://api.github.com/repos/JeanMertz/chruby-fish/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/JeanMertz/chruby-fish/labels{/name}","releases_url":"https://api.github.com/repos/JeanMertz/chruby-fish/releases{/id}","created_at":"2013-06-04T20:33:07Z","updated_at":"2014-12-14T22:38:55Z","pushed_at":"2014-12-14T22:38:55Z","git_url":"git://github.com/JeanMertz/chruby-fish.git","ssh_url":"git@github.com:JeanMertz/chruby-fish.git","clone_url":"https://github.com/JeanMertz/chruby-fish.git","svn_url":"https://github.com/JeanMertz/chruby-fish","homepage":"","size":1047,"stargazers_count":23,"watchers_count":23,"language":"Shell","has_issues":true,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":6,"mirror_url":null,"open_issues_count":4,"forks":6,"open_issues":4,"watchers":23,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/JeanMertz/chruby-fish/pulls/15"},"html":{"href":"https://github.com/JeanMertz/chruby-fish/pull/15"},"issue":{"href":"https://api.github.com/repos/JeanMertz/chruby-fish/issues/15"},"comments":{"href":"https://api.github.com/repos/JeanMertz/chruby-fish/issues/15/comments"},"review_comments":{"href":"https://api.github.com/repos/J
eanMertz/chruby-fish/pulls/15/comments"},"review_comment":{"href":"https://api.github.com/repos/JeanMertz/chruby-fish/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/JeanMertz/chruby-fish/pulls/15/commits"},"statuses":{"href":"https://api.github.com/repos/JeanMertz/chruby-fish/statuses/859d6a993456f190598eda5b2a188d96af984cf2"}},"merged":false,"mergeable":null,"mergeable_state":"unknown","merged_by":null,"comments":0,"review_comments":0,"commits":1,"additions":14,"deletions":0,"changed_files":1}},"public":true,"created_at":"2015-01-01T01:04:45Z"}
{"id":"2489397894","type":"PushEvent","actor":{"id":1059214,"login":"wlaurance","gravatar_id":"","url":"https://api.github.com/users/wlaurance","avatar_url":"https://avatars.githubusercontent.com/u/1059214?"},"repo":{"id":28050478,"name":"empirical-org/Quill-Grammar","url":"https://api.github.com/repos/empirical-org/Quill-Grammar"},"payload":{"push_id":536753132,"size":2,"distinct_size":1,"ref":"refs/heads/feature/crud-firebase","head":"47e38def07f43835e7e91dcde60e8db5edaac315","before":"88ee40bc42c418eb0298e525f5cd6137657ff377","commits":[{"sha":"9835f267914e973c8ca53b28b85b94bdf3086ba2","author":{"email":"c55061f2e98089f7f71676646e4a1dbbd0f0ebe8@gmail.com","name":"Peter Gault"},"message":"Update README.md","distinct":false,"url":"https://api.github.com/repos/empirical-org/Quill-Grammar/commits/9835f267914e973c8ca53b28b85b94bdf3086ba2"},{"sha":"47e38def07f43835e7e91dcde60e8db5edaac315","author":{"email":"bc033e145f35c466dd9a9e87a3be67317de99120@gmail.com","name":"wlaurance"},"message":"Merge branch 'feature/crud-firebase' of github.com:Empirical-Org/Quill-Grammar into feature/crud-firebase","distinct":true,"url":"https://api.github.com/repos/empirical-org/Quill-Grammar/commits/47e38def07f43835e7e91dcde60e8db5edaac315"}]},"public":true,"created_at":"2015-01-01T01:04:45Z","org":{"id":4258432,"login":"empirical-org","gravatar_id":"","url":"https://api.github.com/orgs/empirical-org","avatar_url":"https://avatars.githubusercontent.com/u/4258432?"}}
{"id":"2489397896","type":"IssueCommentEvent","actor":{"id":3489773,"login":"captainkirkby","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","avatar_url":"https://avatars.githubusercontent.com/u/3489773?"},"repo":{"id":15461243,"name":"captainkirkby/Gears","url":"https://api.github.com/repos/captainkirkby/Gears"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/captainkirkby/Gears/issues/30","labels_url":"https://api.github.com/repos/captainkirkby/Gears/issues/30/labels{/name}","comments_url":"https://api.github.com/repos/captainkirkby/Gears/issues/30/comments","events_url":"https://api.github.com/repos/captainkirkby/Gears/issues/30/events","html_url":"https://github.com/captainkirkby/Gears/issues/30","id":53210138,"number":30,"title":"Replaying Binary Data","user":{"login":"captainkirkby","id":3489773,"avatar_url":"https://avatars.githubusercontent.com/u/3489773?v=3","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","html_url":"https://github.com/captainkirkby","followers_url":"https://api.github.com/users/captainkirkby/followers","following_url":"https://api.github.com/users/captainkirkby/following{/other_user}","gists_url":"https://api.github.com/users/captainkirkby/gists{/gist_id}","starred_url":"https://api.github.com/users/captainkirkby/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/captainkirkby/subscriptions","organizations_url":"https://api.github.com/users/captainkirkby/orgs","repos_url":"https://api.github.com/users/captainkirkby/repos","events_url":"https://api.github.com/users/captainkirkby/events{/privacy}","received_events_url":"https://api.github.com/users/captainkirkby/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/captainkirkby/Gears/labels/documentation","name":"documentation","color":"eb6420"}],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2015-01-01T00:58:37Z","up
dated_at":"2015-01-01T01:04:46Z","closed_at":null,"body":"The binary file generated as a result of [this](https://github.com/captainkirkby/Gears/commit/24b67ea3dc1bcbc604053689187b41b1ccdac9cd) commit can be replayed and analyzed for anything unexpected that is causing the program to fail."},"comment":{"url":"https://api.github.com/repos/captainkirkby/Gears/issues/comments/68477315","html_url":"https://github.com/captainkirkby/Gears/issues/30#issuecomment-68477315","issue_url":"https://api.github.com/repos/captainkirkby/Gears/issues/30","id":68477315,"user":{"login":"captainkirkby","id":3489773,"avatar_url":"https://avatars.githubusercontent.com/u/3489773?v=3","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","html_url":"https://github.com/captainkirkby","followers_url":"https://api.github.com/users/captainkirkby/followers","following_url":"https://api.github.com/users/captainkirkby/following{/other_user}","gists_url":"https://api.github.com/users/captainkirkby/gists{/gist_id}","starred_url":"https://api.github.com/users/captainkirkby/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/captainkirkby/subscriptions","organizations_url":"https://api.github.com/users/captainkirkby/orgs","repos_url":"https://api.github.com/users/captainkirkby/repos","events_url":"https://api.github.com/users/captainkirkby/events{/privacy}","received_events_url":"https://api.github.com/users/captainkirkby/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:04:45Z","updated_at":"2015-01-01T01:04:45Z","body":"*Output*\r\n\r\nInvalid Data Packet Header!\r\nGood Header: fe fe fe 1 15 de 8 0 0 0 0 0 0 0 0 0 0 0 0 0 b1 2e 9c a 0 0 13 8a 1 0 3b c0 6e 72 0 0 20 6 7 0 0 0 0 40 0 0 3c 37 9f a 0 0 0 0 0 0 0 0 3 8 c f 15 1b 21 27 2f 39 41 4c 56 61 6f 7b 88 96 a5 b5 c5 d5 e7 f9 a 1c 2f 42 57 69 7d 91 a4 bb ce e2 f6 a 1e 31 44 57 6a 7c 8e 9f b0 c2 d2 e2 f1 0 10 1c 2a 36 42 4e 59 63 6d 76 7e 87 8d 94 9a 9e a1 a3 a3 a4 a7 a7 a7 a6 a7 a8 
a9 a7 a6 a7 a9 a8 a7 a7 a8 a9 a8 a6 a7 a8 a9 a7 a6 a7 a8 a8 a7 a6 a7 a9 a8 a6 a6 a8 a8 a7 a6 a6 a8 a8 a7 a6 a7 a7 a7 a6 a6 a7 a8 a7 a6 a6 a7 a7 a7 a7 a7 a8 a8 a6 a6 a7 a8 a7 a6 a6 a7 a8 a7 a6 a7 a8 a7 a7 a6 a7 a9 a7 a6 a6 a7 a9 a7 a6 a6 a7 a8 a7 a6 a6 a8 a8 a7 a6 a7 a8 a7 a6 a6 a7 a9 a7 a6 a6 a8 a8 a7 a6 a7 a8 a7 a6 a6 a7 a8 a8 a6 a6 a8 a9 a7 a6 a7 a9 a8 a7 a6 a8 a9 a8 a7 a7 a8 a9 a8 a7 a7 a9 a9 a7 a6 a8 a9 a9 a7 a6 a7 a7 a6 a4 a2 a2 a0 9b 94 8d 84 7a 70 65 59 4b 3e 30 22 12 3 f1 df ce bb a8 95 82 6f 5b 46 31 1e 9 f5 e0 cb b8 a3 8e 7c 69 56 44 32 20 10 fe ee de cf c1 b2 a4 97 8b 7f 72 68 5e 56 4c 44 3c 33 2d 25 1e 1a 15 10 c 8 5 3 1 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 3 4 a f 15 19 1f 26 2e 39 41 4a 54 61 6d 79 87 95 a5 b3 c4 d4 e6 f9 9 1d 2f 42 57 69 7e 92 a7 bb d0 e3 f7 d 20 34 47 5a 6e 7f 91 a3 b4 c6 d6 e6 f5 4 12 21 2d 39 46 51 5d 65 6f 7a 81 89 90 96 9c 9f a1 a2 a4 a6 a7 a7 a6 a6 a8 a9 a8 a7 a7 a8 a9 a8 a6 a7 a9 a9 a7 a6 a8 a9 a8 a7 a6 a7 a9 a8 a6 a7 a8 a7 a7 a6 a7 a8 a8 a6 a6 a8 a8 a7 a6 a6 a7 a8 a7 a6 a6 a8 a8 a7 a6 a6 a8 0 a9 a7 a6 a7 a8 a7 a7 a6 a7 a8 a7 a6 a6 a7 a8 a7 a6 a6 a8 a8 a7 a6 a7 a8 a7 a6 a6 a7 a8 a8 a6 a6 a8 a8 a7 a6 a6 a8 a7 a7 a6 a6 a8 a7 a7 a6 a7 a8 a8 a6 a6 a8 a8 a7 a6 a6 a7 a7 a7 a6 a6 a8 0 a8 a7 a6 a7 a8 a9 a7 a6 a7 a9 a8 a7 a7 a8 a9 a8 a6 a7 a8 a9 a8 a6 a7 a9 a9 a7 a7 a8 a9 a7 a6 a6 a6 a6 a3 a1 9f 9c 96 90 87 7e 73 68 5c 50 43 35 25 16 7 f6 e5 d3 c1 b0 9c 88 75 61 4e 3a 25 11 fe e8 d4 bf ab 98 84 70 5e 4c 3a 28 16 6 f7 e5 d5 c6 b7 ab 9d 90 84 77 6d 62 58 4f 47 3f 37 2f 27 23 1c 16 10 e b 4 4 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 
0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 1 4 d b e 14 18 1f 25 2d 35 3f 49 53 5e 6a 76 85 91 a0 af bf d0 e1 f2 3 16 29 3c 4e 62 77 8a 9d b1 c6 db ee 2 16 2a 3d 50 62 74 88 99 aa bb cc dc ec fb 9 18 25 33 3f 4a 56 60 6b 73 7c 85 8d 93 99 9c a0 a3 a4 a4 a5 a7 a7 a7 a7 a8 a9 a9 a8 a7 a8 a9 a8 a8 a7 a8 a9 a8 a7 a8 a9 a8 a7 a7 a8 a9 a8 a6 a6 a8 a9 a8 a6 a7 a8 a9 a7 a6 a7 a9 a8 a6 a6 a8 a9 a8 a6 a7 a8 a8 a7 a6 a7 a9 a8 a7 a6 a8 a8 a8 a6 a6 a8 a8 a7 a6 a7 a9 a8 a6 a6 a8 a9 a7 a6 a7 a8 a8 a7 a6 a7 a9 a8 a6 a7 a7 a9 a8 a6 a7 a8 a8 a7 a7 a7 a8 a8 a6 a6 a7 a9 a8 a6 a6 a8 a9 a7 a6 a7 a9 a8 a6 a6 a7 a9 a7 a6 a6 a8 a8 a7 a6 a7 a8 a7 a7 a6 a7 a9 a8 a6 a6 a8 a9 a7 a6 a7 a9 a8 a7 a6 a7 a9 a7 a6 a7 a7 a8 a7 a6 a7 a9 a8 a7 a6 a7 a8 a8 a6 a6 a8 a9 a7 a6 a7 a8 a7 a7 a6 a7 a9 a7 a6 a6 a8 a8 a7 a6 a7 a8 a8 a7 a6 a7 a9 a8 a6 a6 a8 a8 a8 a6 a7 a8 a8 a7 a6 a7 a9 a8 a6 a6 a8 a9 a7 a6 a7 a8 a8 a7 a6 a7 a9 a8 a6 a6 a8 a8 a7 a6 a6 a8 a8 a7 a6 a7 a8 a8 a6 a6 a7 a9 a7 a6 a7 a8 a9 a7 a6 a7 a8 a8 a6 a6 a8 a8 a7 a6 a6 a8 a8 a7 a6 a7 a9 a8 a6 a6 a8 a9 a8 a6 a6 a8 a8 a7 a6 a7 a8 a8 a7 a6 a7 a9 a7 a6 a7 a8 a7 a7 a6 a7 a8 a8 a7 a6 a7 a8 a7 a6 a6 a7 a9 a7 a6 a6 a8 a8 a7 a6 a7 a8 a8 a7 a6 a7 a8 a8 a6 a6 a8 a9 a8 a6 a7 a8 a8 a7 a6 a7 a8 a8 a6 a6 a8 a9 a7 a6 a6 a8 a9 a7 a6 a7 a9 a8 a7 a6 a7 a8 a7 a6 a6 a8 a8 a7 a6 a7 a7 a8 a7 a6 a7 a8 a8 a6 a6 a8 a8 a7 a6 a7 a8 a8 a7 a6 a8 a9 a8 a6 a6 a7 a9 a8 a6 a7 a9 a9 a7 a6 a7 a8 a8 a7 a6 a8 a9 a7 a6 a7 a8 a8 a7 a6 a7 a8 a8 a7 a6 a7 a7 a8 a6 a6 a7 a8 a7 a6 a6 a7 a8 a7 a6 a6 a7 a8 a7 a6 a7 a8 a8 a7 a6 a7 a8 a7 a6 a6 a7 a8 a8 a6 a6 
a8 a9 a7 a6 a7 a8 a8 a7 a6 a8 a9 a8 a6 a6 a8 a9 a7 a6 a7 a8 a8 a7 a6 a7 a8 a7 a6 a6 a7 a8 a7 a6 a6 a8 a8 a7 a6 a7 a8 a8 a6 a6 a8 a9 a7 a6 a7 a8 a8 a7 a6 a7 a8 a7 a6 a6 a7 a8 a8 a6 a6 a8 a8 a7 a6 a7 a8 a8 a7 a6 a7 a8 a7 a6 a6 a7 a8 a7 a6 a7 a7 a7 a6 a6 a7 a7 a7 a6 a6 a7 a8 a7 a6 a6 a7 a7 a7 a6 a7 a8 a8 a6 a6 a7 a7 a7 a6 a7 a8 a7 a7 a6 a7 a8 a7 a6 a6 a7 a9 a7 a6 a6 a8 a7 a7 a6 a7 a7 a8 a6 a6 a7 a9 a7 a6 a6 a7 a8 a7 a6 a7 a8 a8 a7 a6 a7 a7 a7 a6 a6 a7 a8 a7 a6 a7 a8 a7 a7 a6 a7 a8 a7 a7 a6 a7 a9 a7 a6 a6 a8 a8 a7 a6 a7 a8 a8 a7 a6 a7 a9 a8 a6 a6 a8 a7 a7 a6 a7 a7 a8 a7 a6 a7 a9 a8 a7 a6 a8 a9 a9 a7 a8 a9 a9 a8 a8 a8 a9 a9 a8 a8 a9 aa a8 a8 a8 a9 a9 a8 a8 a8 aa a9 a8 a7 a8 a7 a6 a4 a4 a2 a0 9b 94 8e 84 7a 6f 64 57 4a 3c 2d 20 10 ff ef dd cc b9 a6 94 81 6c 59 45 30 1d 8 f3 e0 cb b7 a3 8f 7c 6a 57 44 33 21 11 ff ef e0 d0 c3 b4 a6 99 8d 80 75 6a 60 57 4d 45 3d 36 2f 28 20 1b 17 11 c 8 c 3 1 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 **fe fe fe 1 16 de 8 0 0 0 0 0 0 0 0 0 0**\r\n\r\n\r\n\r\nBad Header: 0 0 0 36 2f 9c a 0 0 19 8a 1 0 36 c0 9f 72 0 0 84 0 7 0 0 0 0 40 0 0 3c af 76 4b a8 a6 a8 a9 a8 a6 a7 a8 a9 a8 a6 a7 a9 a8 a6 a7 a8 a9 a8 a6 a7 a9 a9 a7 a6 a8 a9 a8 a7 a7 a8 a9 a8 a6 a7 a9 a8 a7 a6 a8 a9 a7 a6 a7 a8 a8 a7 a6 a8 a9 a8 a7 a7 a8 a9 a8 a6 a7 a9 a8 a7 a7 a8 a9 a8 a6 a7 a9 a9 a7 a8 a8 a9 a8 a7 a7 a8 a9 a7 a6 a7 a9 a8 a7 a7 a8 a9 a8 a6 a7 a8 a8 a7 a6 a8 a9 a8 a7 a7 a9 a9 a7 a6 a7 a9 a8 a6 a7 a8 a9 a8 a6 a7 a9 a8 a7 a6 a8 a9 a8 a6 a7 a8 a9 a8 a6 a7 a9 a8 a7 a6 a8 a6 a7 a8 a9 a8 a6 a7 a9 a9 a7 a6 a7 a8 a8 a6 a6 a8 a9 a7 a6 a7 a9 a9 a7 a6 a8 a9 a8 a6 a7 a8 a9 a7 a6 a8 a9 a8 a6 a7 a8 a9 a7 a6 a7 a9 a9 a8 a6 a7 a9 a8 a6 a6 a8 a9 a8 a7 a7 a9 a9 a7 a6 a8 a9 a8 a7 a7 a8 a9 a8 a7 a8 a9 a8 a7 a7 a8 a9 a8 a6 a7 a9 a9 a7 a6 a7 a9 a8 a6 a7 a9 a9 a7 
a7 a8 a9 a8 a6 a7 a8 a9 a8 a6 a7 a9 a8 a7 a6 a8 a9 a8 a6 a7 a8 a9 a7 a6 a8 a9 a8 a7 a6 a8 a9 a8 a6 a8 a9 a9 a8 a7 a8 a9 a8 a6 a7 a8 a8 a7 a6 a7 a9 a8 a7 a6 a7 a9 a8 a7 a7 a8 a9 a8 a6 a8 a9 a8 a6 a6 a8 a9 a8 a6 a7 a9 a9 a7 a6 a8 a9 a8 a7 a6 a8 a9 a8 a6 a7 a9 a8 a7 a7 a8 a9 a8 a6 a7 a8 a9 a8 a7 a7 a8 a8 a7 a6 a8 a9 a8 a6 a7 a8 a9 a7 a6 a7 a9 a8 a7 a7 a8 a9 a8 a7 a7 a9 a9 a8 a6 a8 a9 a8 a7 a6 a8 a9 a8 a6 a7 a9 a8 a7 a6 a8 a9 a8 a8 a7 a9 a9 a8 a6 a8 a9 a9 a8 a8 a8 a9 a8 a8 a8 a9 a9 a8 a8 a8 a9 a9 a8 a7 a8 a8 a6 a5 a6 a5 a3 a1 9e 9c 97 90 88 82 78 6f 63 59 4e 42 35 28 1b d ff ef df ce bd ab 99 88 76 63 51 3d 2c 17 3 ef db c7 b2 9e 8a 77 63 50 3c 29 18 5 f2 e1 d0 bf b0 a0 92 85 76 69 5e 52 49 3e 35 2c 25 1f 18 11 e b 5 5 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 2 4 a e 11 16 1c 22 2a 30 38 40 47 51 5a 64 6f 7b 87 92 9e ad bb ca d9 e9 f9 9 1b 2c 3e 51 62 75 88 9c b1 c4 d8 ec 2 16 29 3d 51 65 78 8c 9f b1 c5 d6 e8 f9 8 19 28 37 44 52 5e 6b 75 80 8b 92 98 9d 9f a2 a5 a6 a5 a6 a7 a9 a8 a6 a8 a9 a9 a8 a8 a8 a9 a9 a8 a7 a9 a9 a8 a8 a8 a9 a9 a7 a7 a8 a9 a8 a8 a7 a9 a9 a7 a6 a8 a9 a8 a7 a7 a9 a9 a8 a6 a7 a9 a8 a7 a7 a8 a9 a8 a7 a7 a9 a8 a7 a7 a8 a9 a8 a7 a7 a8 a9 a8 a6 a7 a9 a8 a7 a7 a8 a9 a8 a8 a7 a8 a9 a7 a6 a8 a9 a9 a8 a7 a8 a9 a8 a7 a7 a8 a8 a8 a6 a7 a9 a8 a7 a6 a8 a9 a8 a6 a7 a8 a9 a7 a6 a8 a9 a8 
a7 a7 a8 a9 a8 a6 a7 a8 a9 a8 a7 a8 a9 a8 a7 a7 a8 a9 a8 a7 a8 a9 a9 a8 a8 a8 a9 a8 a7 a7 a9 a9 a8 a7 a7 a7 a7 a5 a4 a4 a2 9f 9b 98 92 8a 81 79 70 67 5b 50 45 38 2b 1e 10 2 f3 e3 d2 c3 b0 9f 8c 7a 68 55 42 2e 1b 7 f4 df ca b7 a1 8d 78 65 51 3e 2a 18 7 f3 e1 d0 c0 b1 a0 92 84 77 6a 5e 52 47 3f 35 2c 25 1e 19 12 d a a 3 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 4 e b f 12 16 1d 23 29 30 37 41 49 51 5a 64 70 7a 86 92 9f ae bb c9 d9 e8 f8 9 18 2b 3e 4f 62 74 87 9c af c3 d7 ec 0 15 29 3d 53 66 7a 8d a0 b3 c5 d7 e8 fa a 1a 29 38 47 53 60 69 75 80 8a 92 98 9d a2 a3 a5 a4 a6 a7 a7 a7 a6 a8 a9 a9 a8 a7 a8 a9 a8 a7 a8 a9 a9 a8 a7 a8 a9 a9 a8 a8 a8 a9 a9 a7 a7 a8 a9 a8 a7 a7 a8 a9 a8 a6 a7 a9 a9 a7 a7 a8 a9 a8 a6 a6 a8 a9 a7 a6 a7 a9 a9 a7 a7 a8 a9 a8 a7 a6 a8 a9 a8 a7 a8 a9 a9 a8 a6 a8 a9 a8 a7 a7 a8 a9 a8 a6 a7 a9 a9 a7 a6 a7 a9 a8 a7 a7 a8 a9 a8 a7 a7 a8 a9 a7 a6 a8 a9 a8 a7 a7 a8 a9 a8 a6 a7 a9 a9 a7 a7 a8 a9 a9 a7 a7 a8 a9 a8 a6 a7 a9 a9 a7 a7 a7 a9 a8 a7 a7 a8 a9 a8 a7 a8 a9 a9 a8 a6 a8 a9 a8 a7 a6 a7 a7 a6 a4 a4 a4 a2 9e 9a 97 91 88 80 78 6e 65 5a 4f 44 38 2b 1d f 0 f2 e2 d1 c2 b0 9f 8d 7c 6a 57 43 30 1c 9 f5 e1 cd b9 a4 90 7c 68 55 42 2e 1c a f8 e7 d5 c4 b5 a5 96 88 7b 6d 61 56 4b 42 39 2f 27 20 1b 15 f b a 3 2 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 3 3 a e 13 19 1c 22 2a 30 39 3f 48 51 5b 64 6e 7a 85 92 9e ac ba c9 d8 e8 f6 7 19 2a 3b 4d 60 73 86 99 ad c2 d6 ea fe 12 26 3b 4e 62 76 8a 9d b0 c2 d6 e6 f7 6 17 27 36 43 51 5e 6a 76 7f 89 92 99 9e a0 a2 a5 a7 a7 a7 a8 a9 a9 a8 
a8 a8 aa a9 a8 a8 a9 aa a9 a8 a8 aa a9 a8 a8 a8 aa a9 a8 a8 a9 a9 a8 a7 a7 a9 a9 a7 a7 a8 a9 a8 a8 a7 a8 a9 a7 a6 a8 a9 a8 a7 a7 a8 a9 a8 a6 a7 a9 a9 a7 a6 a8 a9 a8 a7 a7 a9 a9 a7 a6 a8 a9 a8 a7 a7 a8 a9 a8 a6 a7 a9 a8 a7 a6 a8 a9 a8 a7 a7 a9 a8 a7 a6 a7 a9 a8 a7 a6 a8 a9 a8 a7 a7 a8 a8 a7 a6 a8 a9 a8 a7 a7 a8 a9 a7 a6 a7 a9 a8 a7 a7 a8 a9 a8 a7 a7 a9 a8 a7 a6 a7 a9 a8 a7 a7 a9 a9 a8 a7 a7 a9 a8 a6 a6 a8 a9 a8 a7 a7 a9 a9 a7 a6 a8 a9 a8 a7 a7 a8 a9 a8 a7 a7 a9 a8 a7 a7 a8 a9 a8 a7 a7 a9 a9 a8 a6 a8 a9 a8 a7 a7 a8 a9 a7 a6 a7 a9 a8 a7 a6 a8 a9 a8 a6 a7 a8 a9 a7 a6 a7 a9 a8 a7 a6 a8 a8 a7 a6 a7 a9 a9 a8 a6 a7 a9 a8 a7 a7 a9 a9 a8 a6 a7 a9 a8 a6 a6 a8 a9 a8 a7 a7 a9 a9 a7 a6 a8 a9 a8 a7 a7 a8 a9 a8 a7 a8 a9 a8 a6 a6 a8 a9 a7 a6 a8 a9 a9 a8 a6 a8 a9 a7 a6 a8 a9 a9 fe fe fe 1 17 de 8 0 0 0 0 0 0 0 0 0 0 \r\n"}},"public":true,"created_at":"2015-01-01T01:04:46Z"}
{"id":"2489397899","type":"PushEvent","actor":{"id":4418470,"login":"VapidLinus","gravatar_id":"","url":"https://api.github.com/users/VapidLinus","avatar_url":"https://avatars.githubusercontent.com/u/4418470?"},"repo":{"id":28103737,"name":"VapidLinus/ludum","url":"https://api.github.com/repos/VapidLinus/ludum"},"payload":{"push_id":536753136,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"71d9e25ca28ee11bd0f7b2e0e4aa3284d327634d","before":"7651a033556ffb15be11022a1705eab9ee38b748","commits":[{"sha":"71d9e25ca28ee11bd0f7b2e0e4aa3284d327634d","author":{"email":"2186255cea3741ffd28e8c68c5a7c2030a5f82da@gmail.com","name":"Linus Närkling-Larsson"},"message":"Restructure","distinct":true,"url":"https://api.github.com/repos/VapidLinus/ludum/commits/71d9e25ca28ee11bd0f7b2e0e4aa3284d327634d"}]},"public":true,"created_at":"2015-01-01T01:04:47Z"}
{"id":"2489397900","type":"DeleteEvent","actor":{"id":2066666,"login":"amadornes","gravatar_id":"","url":"https://api.github.com/users/amadornes","avatar_url":"https://avatars.githubusercontent.com/u/2066666?"},"repo":{"id":21494560,"name":"Qmunity/BluePower","url":"https://api.github.com/repos/Qmunity/BluePower"},"payload":{"ref":"NewMultipart","ref_type":"branch","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:04:47Z","org":{"id":8006321,"login":"Qmunity","gravatar_id":"","url":"https://api.github.com/orgs/Qmunity","avatar_url":"https://avatars.githubusercontent.com/u/8006321?"}}
{"id":"2489397903","type":"PushEvent","actor":{"id":8350185,"login":"Johannes-Larsson","gravatar_id":"","url":"https://api.github.com/users/Johannes-Larsson","avatar_url":"https://avatars.githubusercontent.com/u/8350185?"},"repo":{"id":28634222,"name":"Johannes-Larsson/towerDefence","url":"https://api.github.com/repos/Johannes-Larsson/towerDefence"},"payload":{"push_id":536753137,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"25b4d5160036fa439a4b44cdb10579f1807610fa","before":"348fbe1d9736ea23729e344a37e1f68b669709cc","commits":[{"sha":"9874efb97644ec0e3dcf44deffcb81407b4d9a69","author":{"email":"521728287efe6ca64f05202f1df9a036cc8f0398@gmail.com","name":"Johannes-Larsson"},"message":"fixed ugly testing of tower upgrade texture system","distinct":true,"url":"https://api.github.com/repos/Johannes-Larsson/towerDefence/commits/9874efb97644ec0e3dcf44deffcb81407b4d9a69"},{"sha":"25b4d5160036fa439a4b44cdb10579f1807610fa","author":{"email":"521728287efe6ca64f05202f1df9a036cc8f0398@gmail.com","name":"Johannes-Larsson"},"message":"made clicking anywhere exit upgradingMenu","distinct":true,"url":"https://api.github.com/repos/Johannes-Larsson/towerDefence/commits/25b4d5160036fa439a4b44cdb10579f1807610fa"}]},"public":true,"created_at":"2015-01-01T01:04:47Z"}
{"id":"2489397911","type":"PushEvent","actor":{"id":906529,"login":"dpwolfe","gravatar_id":"","url":"https://api.github.com/users/dpwolfe","avatar_url":"https://avatars.githubusercontent.com/u/906529?"},"repo":{"id":26579311,"name":"dpwolfe/otucha","url":"https://api.github.com/repos/dpwolfe/otucha"},"payload":{"push_id":536753141,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"89bbbe832e8916afacae2fe98885ae5af5391a7a","before":"6f79c0b71c6d4a7e3a7d538ed3b96a889c2a33e0","commits":[{"sha":"89bbbe832e8916afacae2fe98885ae5af5391a7a","author":{"email":"b7dfe270ecb2603aba704ea15b776485da19da15@gmail.com","name":"David Wolfe"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/dpwolfe/otucha/commits/89bbbe832e8916afacae2fe98885ae5af5391a7a"}]},"public":true,"created_at":"2015-01-01T01:04:48Z"}
{"id":"2489397912","type":"ForkEvent","actor":{"id":416575,"login":"frewsxcv","gravatar_id":"","url":"https://api.github.com/users/frewsxcv","avatar_url":"https://avatars.githubusercontent.com/u/416575?"},"repo":{"id":3545112,"name":"arthur-e/Wicket","url":"https://api.github.com/repos/arthur-e/Wicket"},"payload":{"forkee":{"id":28678263,"name":"Wicket","full_name":"frewsxcv/Wicket","owner":{"login":"frewsxcv","id":416575,"avatar_url":"https://avatars.githubusercontent.com/u/416575?v=3","gravatar_id":"","url":"https://api.github.com/users/frewsxcv","html_url":"https://github.com/frewsxcv","followers_url":"https://api.github.com/users/frewsxcv/followers","following_url":"https://api.github.com/users/frewsxcv/following{/other_user}","gists_url":"https://api.github.com/users/frewsxcv/gists{/gist_id}","starred_url":"https://api.github.com/users/frewsxcv/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/frewsxcv/subscriptions","organizations_url":"https://api.github.com/users/frewsxcv/orgs","repos_url":"https://api.github.com/users/frewsxcv/repos","events_url":"https://api.github.com/users/frewsxcv/events{/privacy}","received_events_url":"https://api.github.com/users/frewsxcv/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/frewsxcv/Wicket","description":"A modest library for moving between Well-Known Text (WKT) and various framework 
geometries","fork":true,"url":"https://api.github.com/repos/frewsxcv/Wicket","forks_url":"https://api.github.com/repos/frewsxcv/Wicket/forks","keys_url":"https://api.github.com/repos/frewsxcv/Wicket/keys{/key_id}","collaborators_url":"https://api.github.com/repos/frewsxcv/Wicket/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/frewsxcv/Wicket/teams","hooks_url":"https://api.github.com/repos/frewsxcv/Wicket/hooks","issue_events_url":"https://api.github.com/repos/frewsxcv/Wicket/issues/events{/number}","events_url":"https://api.github.com/repos/frewsxcv/Wicket/events","assignees_url":"https://api.github.com/repos/frewsxcv/Wicket/assignees{/user}","branches_url":"https://api.github.com/repos/frewsxcv/Wicket/branches{/branch}","tags_url":"https://api.github.com/repos/frewsxcv/Wicket/tags","blobs_url":"https://api.github.com/repos/frewsxcv/Wicket/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/frewsxcv/Wicket/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/frewsxcv/Wicket/git/refs{/sha}","trees_url":"https://api.github.com/repos/frewsxcv/Wicket/git/trees{/sha}","statuses_url":"https://api.github.com/repos/frewsxcv/Wicket/statuses/{sha}","languages_url":"https://api.github.com/repos/frewsxcv/Wicket/languages","stargazers_url":"https://api.github.com/repos/frewsxcv/Wicket/stargazers","contributors_url":"https://api.github.com/repos/frewsxcv/Wicket/contributors","subscribers_url":"https://api.github.com/repos/frewsxcv/Wicket/subscribers","subscription_url":"https://api.github.com/repos/frewsxcv/Wicket/subscription","commits_url":"https://api.github.com/repos/frewsxcv/Wicket/commits{/sha}","git_commits_url":"https://api.github.com/repos/frewsxcv/Wicket/git/commits{/sha}","comments_url":"https://api.github.com/repos/frewsxcv/Wicket/comments{/number}","issue_comment_url":"https://api.github.com/repos/frewsxcv/Wicket/issues/comments/{number}","contents_url":"https://api.github.com/repos/frewsxcv/Wicket/contents/{+path}","compare
_url":"https://api.github.com/repos/frewsxcv/Wicket/compare/{base}...{head}","merges_url":"https://api.github.com/repos/frewsxcv/Wicket/merges","archive_url":"https://api.github.com/repos/frewsxcv/Wicket/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/frewsxcv/Wicket/downloads","issues_url":"https://api.github.com/repos/frewsxcv/Wicket/issues{/number}","pulls_url":"https://api.github.com/repos/frewsxcv/Wicket/pulls{/number}","milestones_url":"https://api.github.com/repos/frewsxcv/Wicket/milestones{/number}","notifications_url":"https://api.github.com/repos/frewsxcv/Wicket/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/frewsxcv/Wicket/labels{/name}","releases_url":"https://api.github.com/repos/frewsxcv/Wicket/releases{/id}","created_at":"2015-01-01T01:04:48Z","updated_at":"2014-12-18T11:08:34Z","pushed_at":"2014-11-12T13:58:08Z","git_url":"git://github.com/frewsxcv/Wicket.git","ssh_url":"git@github.com:frewsxcv/Wicket.git","clone_url":"https://github.com/frewsxcv/Wicket.git","svn_url":"https://github.com/frewsxcv/Wicket","homepage":"http://arthur-e.github.com/Wicket","size":1032,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:04:48Z"}
{"id":"2489397913","type":"WatchEvent","actor":{"id":3913258,"login":"blumu","gravatar_id":"","url":"https://api.github.com/users/blumu","avatar_url":"https://avatars.githubusercontent.com/u/3913258?"},"repo":{"id":2087064,"name":"SignalR/SignalR","url":"https://api.github.com/repos/SignalR/SignalR"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:04:49Z","org":{"id":931666,"login":"SignalR","gravatar_id":"","url":"https://api.github.com/orgs/SignalR","avatar_url":"https://avatars.githubusercontent.com/u/931666?"}}
{"id":"2489397915","type":"PushEvent","actor":{"id":6982503,"login":"josephsands","gravatar_id":"","url":"https://api.github.com/users/josephsands","avatar_url":"https://avatars.githubusercontent.com/u/6982503?"},"repo":{"id":28678205,"name":"josephsands/josephsands.github.io","url":"https://api.github.com/repos/josephsands/josephsands.github.io"},"payload":{"push_id":536753142,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"230208da74a1d0f76aca87882a3ed3954c9aa3ac","before":"1db4c2b9fabe365629330df61852a56f8d3abf2d","commits":[{"sha":"230208da74a1d0f76aca87882a3ed3954c9aa3ac","author":{"email":"793a20fb71e8611e634b8b771001d6777640050d@Anitas-MBP.home","name":"Joseph Sands"},"message":"Site updated at 2015-01-01 01:04:46 UTC","distinct":true,"url":"https://api.github.com/repos/josephsands/josephsands.github.io/commits/230208da74a1d0f76aca87882a3ed3954c9aa3ac"}]},"public":true,"created_at":"2015-01-01T01:04:49Z"}
{"id":"2489397916","type":"PushEvent","actor":{"id":259982,"login":"kigster","gravatar_id":"","url":"https://api.github.com/users/kigster","avatar_url":"https://avatars.githubusercontent.com/u/259982?"},"repo":{"id":20339421,"name":"wanelo-chef/postmodern","url":"https://api.github.com/repos/wanelo-chef/postmodern"},"payload":{"push_id":536753143,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e8c6d4d0d091c90b4e4a6b70a33e79247b7e770c","before":"f64e8f114159054ab23fc9883b5476feddcfd6ed","commits":[{"sha":"e8c6d4d0d091c90b4e4a6b70a33e79247b7e770c","author":{"email":"fdced6b9ecadb87ee4278610f60ef5876a49575d@gmail.com","name":"Konstantin Gredeskoul"},"message":"Explicitly include ShellOut so ruby is happy\n\nWas getting this error on feed-db200.prod after adding \nfeed-db-replica role.\n\n[2015-01-01T00:54:19+00:00] WARN: Current  service[nad]: /var/chef/cache/cookbooks/nad/recipes/default.rb:135:in `from_file'\n\n  ================================================================================\n  Recipe Compile Error in /var/chef/cache/cookbooks/wanelo-feed/recipes/database_server.rb\n  ================================================================================\n\n  NoMethodError\n  -------------\n  No resource or method named `shell_out' for `Chef::Recipe \"default\"'\n\n  Cookbook Trace:\n  ---------------\n    /var/chef/cache/cookbooks/postmodern/recipes/default.rb:6:in `from_file'\n    /var/chef/cache/cookbooks/wanelo-feed/recipes/database_server.rb:55:in `from_file'","distinct":true,"url":"https://api.github.com/repos/wanelo-chef/postmodern/commits/e8c6d4d0d091c90b4e4a6b70a33e79247b7e770c"}]},"public":true,"created_at":"2015-01-01T01:04:49Z","org":{"id":2664866,"login":"wanelo-chef","gravatar_id":"","url":"https://api.github.com/orgs/wanelo-chef","avatar_url":"https://avatars.githubusercontent.com/u/2664866?"}}
{"id":"2489397920","type":"WatchEvent","actor":{"id":1015032,"login":"miketahani","gravatar_id":"","url":"https://api.github.com/users/miketahani","avatar_url":"https://avatars.githubusercontent.com/u/1015032?"},"repo":{"id":1935061,"name":"sunng87/node-geohash","url":"https://api.github.com/repos/sunng87/node-geohash"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:04:50Z"}
{"id":"2489397936","type":"IssuesEvent","actor":{"id":8218499,"login":"GunZi200","gravatar_id":"","url":"https://api.github.com/users/GunZi200","avatar_url":"https://avatars.githubusercontent.com/u/8218499?"},"repo":{"id":27030606,"name":"GunZi200/Memory-Colour","url":"https://api.github.com/repos/GunZi200/Memory-Colour"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/GunZi200/Memory-Colour/issues/1","labels_url":"https://api.github.com/repos/GunZi200/Memory-Colour/issues/1/labels{/name}","comments_url":"https://api.github.com/repos/GunZi200/Memory-Colour/issues/1/comments","events_url":"https://api.github.com/repos/GunZi200/Memory-Colour/issues/1/events","html_url":"https://github.com/GunZi200/Memory-Colour/issues/1","id":53210268,"number":1,"title":"iPad drawing issue","user":{"login":"GunZi200","id":8218499,"avatar_url":"https://avatars.githubusercontent.com/u/8218499?v=3","gravatar_id":"","url":"https://api.github.com/users/GunZi200","html_url":"https://github.com/GunZi200","followers_url":"https://api.github.com/users/GunZi200/followers","following_url":"https://api.github.com/users/GunZi200/following{/other_user}","gists_url":"https://api.github.com/users/GunZi200/gists{/gist_id}","starred_url":"https://api.github.com/users/GunZi200/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/GunZi200/subscriptions","organizations_url":"https://api.github.com/users/GunZi200/orgs","repos_url":"https://api.github.com/users/GunZi200/repos","events_url":"https://api.github.com/users/GunZi200/events{/privacy}","received_events_url":"https://api.github.com/users/GunZi200/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/GunZi200/Memory-Colour/labels/bug","name":"bug","color":"fc2929"}],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:04:52Z","updated_at":"2015-01-01T01:04:52Z","closed_at":null,"body":"There is a known issue 
I will fix sometime soon. That is the iPad version of Colour Trio.\r\n\r\nThe program prints over the black buttons each time your tap a correct colour. Displaying the start screen... really.\r\n\r\n"}},"public":true,"created_at":"2015-01-01T01:04:52Z"}
{"id":"2489397938","type":"PushEvent","actor":{"id":480938,"login":"hubot","gravatar_id":"","url":"https://api.github.com/users/hubot","avatar_url":"https://avatars.githubusercontent.com/u/480938?"},"repo":{"id":2389274,"name":"eclipse/eclipse.platform.swt","url":"https://api.github.com/repos/eclipse/eclipse.platform.swt"},"payload":{"push_id":536753150,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1d2c32bfdfd0569960bbd941e6670f1e366946a3","before":"231816a5d4318faedbe56a995e907e59c9a91836","commits":[{"sha":"1d2c32bfdfd0569960bbd941e6670f1e366946a3","author":{"email":"7080c0b5db7f1b7254ce7ee1b5cbbb7b6872b877@in.ibm.com","name":"Arun Thondapu"},"message":"v4509","distinct":true,"url":"https://api.github.com/repos/eclipse/eclipse.platform.swt/commits/1d2c32bfdfd0569960bbd941e6670f1e366946a3"}]},"public":true,"created_at":"2015-01-01T01:04:53Z","org":{"id":56974,"login":"eclipse","gravatar_id":"","url":"https://api.github.com/orgs/eclipse","avatar_url":"https://avatars.githubusercontent.com/u/56974?"}}
{"id":"2489397941","type":"PushEvent","actor":{"id":5975070,"login":"marcellodibello","gravatar_id":"","url":"https://api.github.com/users/marcellodibello","avatar_url":"https://avatars.githubusercontent.com/u/5975070?"},"repo":{"id":17580814,"name":"marcellodibello/marcellodibello.github.io","url":"https://api.github.com/repos/marcellodibello/marcellodibello.github.io"},"payload":{"push_id":536753151,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1194cc3417673dbd3baf1a625d7ce4e374fd755a","before":"7995cfd2d91a5b11eff75239ac124fae9af80d6d","commits":[{"sha":"1194cc3417673dbd3baf1a625d7ce4e374fd755a","author":{"email":"babd00909fb78351e79d40af26c77fc37bb4ed59@gmail.com","name":"marcellodibello"},"message":"Update index.html","distinct":true,"url":"https://api.github.com/repos/marcellodibello/marcellodibello.github.io/commits/1194cc3417673dbd3baf1a625d7ce4e374fd755a"}]},"public":true,"created_at":"2015-01-01T01:04:53Z"}
{"id":"2489397944","type":"WatchEvent","actor":{"id":6161385,"login":"mycaule","gravatar_id":"","url":"https://api.github.com/users/mycaule","avatar_url":"https://avatars.githubusercontent.com/u/6161385?"},"repo":{"id":211666,"name":"joyent/node","url":"https://api.github.com/repos/joyent/node"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:04:53Z","org":{"id":10161,"login":"joyent","gravatar_id":"","url":"https://api.github.com/orgs/joyent","avatar_url":"https://avatars.githubusercontent.com/u/10161?"}}
{"id":"2489397946","type":"PushEvent","actor":{"id":1165609,"login":"bleroy","gravatar_id":"","url":"https://api.github.com/users/bleroy","avatar_url":"https://avatars.githubusercontent.com/u/1165609?"},"repo":{"id":28653536,"name":"DecentCMS/DecentCMS","url":"https://api.github.com/repos/DecentCMS/DecentCMS"},"payload":{"push_id":536753152,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"81ac106d21544f7cd0cca46d172c1d3174f7db4a","before":"4c55fad17d09de43a3566d8d77a2999317a671f9","commits":[{"sha":"81ac106d21544f7cd0cca46d172c1d3174f7db4a","author":{"email":"aff71552ea35fa74bb03c867fe0c4cde09895eea@gmail.com","name":"Bertrand Le Roy"},"message":"Rename Winston module to Logging.","distinct":true,"url":"https://api.github.com/repos/DecentCMS/DecentCMS/commits/81ac106d21544f7cd0cca46d172c1d3174f7db4a"}]},"public":true,"created_at":"2015-01-01T01:04:53Z","org":{"id":10110483,"login":"DecentCMS","gravatar_id":"","url":"https://api.github.com/orgs/DecentCMS","avatar_url":"https://avatars.githubusercontent.com/u/10110483?"}}
{"id":"2489397948","type":"PushEvent","actor":{"id":2916016,"login":"TylerSandman","gravatar_id":"","url":"https://api.github.com/users/TylerSandman","avatar_url":"https://avatars.githubusercontent.com/u/2916016?"},"repo":{"id":28609731,"name":"TylerSandman/poro-cv","url":"https://api.github.com/repos/TylerSandman/poro-cv"},"payload":{"push_id":536753153,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e400f73a414aea729b6b5b01ec55a427bc140fd4","before":"a9d9ff7fb436827e80293189d26d864aff80c6e4","commits":[{"sha":"e400f73a414aea729b6b5b01ec55a427bc140fd4","author":{"email":"069eabe48263b36d2b5eab03e90d3687ed30521d@gmail.com","name":"Tyler Sanderson"},"message":"Added result handling after poro detection","distinct":true,"url":"https://api.github.com/repos/TylerSandman/poro-cv/commits/e400f73a414aea729b6b5b01ec55a427bc140fd4"}]},"public":true,"created_at":"2015-01-01T01:04:53Z"}
{"id":"2489397952","type":"CreateEvent","actor":{"id":8890114,"login":"speeldoos","gravatar_id":"","url":"https://api.github.com/users/speeldoos","avatar_url":"https://avatars.githubusercontent.com/u/8890114?"},"repo":{"id":28678093,"name":"speeldoos/hello-world","url":"https://api.github.com/repos/speeldoos/hello-world"},"payload":{"ref":"readme-edits","ref_type":"branch","master_branch":"master","description":"testing testing","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:04:54Z"}
{"id":"2489397954","type":"PushEvent","actor":{"id":2715854,"login":"miguelgrinberg","gravatar_id":"","url":"https://api.github.com/users/miguelgrinberg","avatar_url":"https://avatars.githubusercontent.com/u/2715854?"},"repo":{"id":28583035,"name":"miguelgrinberg/flask-celery-example","url":"https://api.github.com/repos/miguelgrinberg/flask-celery-example"},"payload":{"push_id":536753156,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"968b9d6aa0440d1063237d0d128abbb89961f920","before":"234a991f30f75a7a93e97bd535183f6b81067f2d","commits":[{"sha":"968b9d6aa0440d1063237d0d128abbb89961f920","author":{"email":"867e6f7716cd7d89b2aa6d04c9799a31b0e6903e@gmail.com","name":"Miguel Grinberg"},"message":"initial version","distinct":true,"url":"https://api.github.com/repos/miguelgrinberg/flask-celery-example/commits/968b9d6aa0440d1063237d0d128abbb89961f920"}]},"public":true,"created_at":"2015-01-01T01:04:54Z"}
{"id":"2489397955","type":"GollumEvent","actor":{"id":46323,"login":"paulcon","gravatar_id":"","url":"https://api.github.com/users/paulcon","avatar_url":"https://avatars.githubusercontent.com/u/46323?"},"repo":{"id":28157780,"name":"paulcon/active_subspaces","url":"https://api.github.com/repos/paulcon/active_subspaces"},"payload":{"pages":[{"page_name":"_Footer","title":"_Footer","summary":null,"action":"edited","sha":"ffa925d0740eb5600fc7c2a54271d4b925a8a8f8","html_url":"https://github.com/paulcon/active_subspaces/wiki/_Footer"}]},"public":true,"created_at":"2015-01-01T01:04:54Z"}
{"id":"2489397957","type":"PushEvent","actor":{"id":183517,"login":"troglobit","gravatar_id":"","url":"https://api.github.com/users/troglobit","avatar_url":"https://avatars.githubusercontent.com/u/183517?"},"repo":{"id":5778132,"name":"troglobit/finit","url":"https://api.github.com/repos/troglobit/finit"},"payload":{"push_id":536753159,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"8f1c16a8a5872d87197c7c346957f2e7e7262c5e","before":"b149dbc73e701f4385cb414ba7b87dd58b345b7d","commits":[{"sha":"8f1c16a8a5872d87197c7c346957f2e7e7262c5e","author":{"email":"583c295fd7602c168ad814279bbc3894ba65f5d6@gmail.com","name":"Joachim Nilsson"},"message":"Update TODO with section on Cron.\n\nSigned-off-by: Joachim Nilsson <troglobit@gmail.com>","distinct":true,"url":"https://api.github.com/repos/troglobit/finit/commits/8f1c16a8a5872d87197c7c346957f2e7e7262c5e"}]},"public":true,"created_at":"2015-01-01T01:04:54Z"}
{"id":"2489397960","type":"WatchEvent","actor":{"id":7576774,"login":"lovelybigdata","gravatar_id":"","url":"https://api.github.com/users/lovelybigdata","avatar_url":"https://avatars.githubusercontent.com/u/7576774?"},"repo":{"id":14681876,"name":"codelucas/newspaper","url":"https://api.github.com/repos/codelucas/newspaper"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:04:55Z"}
{"id":"2489397963","type":"PushEvent","actor":{"id":3720783,"login":"designerwebhosting","gravatar_id":"","url":"https://api.github.com/users/designerwebhosting","avatar_url":"https://avatars.githubusercontent.com/u/3720783?"},"repo":{"id":20527117,"name":"designerwebhosting/christopherbyrne.github.io","url":"https://api.github.com/repos/designerwebhosting/christopherbyrne.github.io"},"payload":{"push_id":536753161,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"7e3ee7d19b64e0f0571098be4edb9729d09fb4f4","before":"52997f806edc1645856950072f9919dea680b5a7","commits":[{"sha":"7e3ee7d19b64e0f0571098be4edb9729d09fb4f4","author":{"email":"4bb0acc6ff8c0b6c31e50417877e6e3b3f1c65f0@googlemail.com","name":"Peter Noblee"},"message":"update 'date'","distinct":true,"url":"https://api.github.com/repos/designerwebhosting/christopherbyrne.github.io/commits/7e3ee7d19b64e0f0571098be4edb9729d09fb4f4"}]},"public":true,"created_at":"2015-01-01T01:04:55Z"}
{"id":"2489397964","type":"ReleaseEvent","actor":{"id":3134745,"login":"Vextil","gravatar_id":"","url":"https://api.github.com/users/Vextil","avatar_url":"https://avatars.githubusercontent.com/u/3134745?"},"repo":{"id":28277457,"name":"Vextil/WAMD","url":"https://api.github.com/repos/Vextil/WAMD"},"payload":{"action":"published","release":{"url":"https://api.github.com/repos/Vextil/WAMD/releases/818218","assets_url":"https://api.github.com/repos/Vextil/WAMD/releases/818218/assets","upload_url":"https://uploads.github.com/repos/Vextil/WAMD/releases/818218/assets{?name}","html_url":"https://github.com/Vextil/WAMD/releases/tag/2.1.0-release","id":818218,"tag_name":"2.1.0-release","target_commitish":"master","name":"2.1.0 Release","draft":false,"author":{"login":"Vextil","id":3134745,"avatar_url":"https://avatars.githubusercontent.com/u/3134745?v=3","gravatar_id":"","url":"https://api.github.com/users/Vextil","html_url":"https://github.com/Vextil","followers_url":"https://api.github.com/users/Vextil/followers","following_url":"https://api.github.com/users/Vextil/following{/other_user}","gists_url":"https://api.github.com/users/Vextil/gists{/gist_id}","starred_url":"https://api.github.com/users/Vextil/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Vextil/subscriptions","organizations_url":"https://api.github.com/users/Vextil/orgs","repos_url":"https://api.github.com/users/Vextil/repos","events_url":"https://api.github.com/users/Vextil/events{/privacy}","received_events_url":"https://api.github.com/users/Vextil/received_events","type":"User","site_admin":false},"prerelease":false,"created_at":"2015-01-01T00:40:15Z","published_at":"2015-01-01T01:04:55Z","assets":[{"url":"https://api.github.com/repos/Vextil/WAMD/releases/assets/362005","id":362005,"name":"WhatsAppMD.G_.Google_Emojis.apk","label":null,"uploader":{"login":"Vextil","id":3134745,"avatar_url":"https://avatars.githubusercontent.com/u/3134745?v=3","gravatar_id":"","url":"https://api.gith
ub.com/users/Vextil","html_url":"https://github.com/Vextil","followers_url":"https://api.github.com/users/Vextil/followers","following_url":"https://api.github.com/users/Vextil/following{/other_user}","gists_url":"https://api.github.com/users/Vextil/gists{/gist_id}","starred_url":"https://api.github.com/users/Vextil/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Vextil/subscriptions","organizations_url":"https://api.github.com/users/Vextil/orgs","repos_url":"https://api.github.com/users/Vextil/repos","events_url":"https://api.github.com/users/Vextil/events{/privacy}","received_events_url":"https://api.github.com/users/Vextil/received_events","type":"User","site_admin":false},"content_type":"application/vnd.android.package-archive","state":"uploaded","size":22511638,"download_count":0,"created_at":"2015-01-01T00:59:56Z","updated_at":"2015-01-01T01:01:45Z","browser_download_url":"https://github.com/Vextil/WAMD/releases/download/2.1.0-release/WhatsAppMD.G_.Google_Emojis.apk"},{"url":"https://api.github.com/repos/Vextil/WAMD/releases/assets/362004","id":362004,"name":"WhatsAppMD.S_.Stock_Emojis.apk","label":null,"uploader":{"login":"Vextil","id":3134745,"avatar_url":"https://avatars.githubusercontent.com/u/3134745?v=3","gravatar_id":"","url":"https://api.github.com/users/Vextil","html_url":"https://github.com/Vextil","followers_url":"https://api.github.com/users/Vextil/followers","following_url":"https://api.github.com/users/Vextil/following{/other_user}","gists_url":"https://api.github.com/users/Vextil/gists{/gist_id}","starred_url":"https://api.github.com/users/Vextil/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Vextil/subscriptions","organizations_url":"https://api.github.com/users/Vextil/orgs","repos_url":"https://api.github.com/users/Vextil/repos","events_url":"https://api.github.com/users/Vextil/events{/privacy}","received_events_url":"https://api.github.com/users/Vextil/received_events","type":"User","site_a
dmin":false},"content_type":"application/vnd.android.package-archive","state":"uploaded","size":18707397,"download_count":0,"created_at":"2015-01-01T00:59:56Z","updated_at":"2015-01-01T01:01:07Z","browser_download_url":"https://github.com/Vextil/WAMD/releases/download/2.1.0-release/WhatsAppMD.S_.Stock_Emojis.apk"}],"tarball_url":"https://api.github.com/repos/Vextil/WAMD/tarball/2.1.0-release","zipball_url":"https://api.github.com/repos/Vextil/WAMD/zipball/2.1.0-release","body":"**5.0.0 and up:**\r\n- No specific changes for this version\r\n\r\n**4.4.4 and down:**\r\n- Added tinted statusbar for KitKat\r\n\r\n**All Android versions:**\r\n- Fixed attach menu black background in MDPI\r\n- About screen now shows WhatsAppMD version info too\r\n- Removed camera icon in chat text field\r\n- (For modders) Layout files are more readable\r\n- Improved chat text field design\r\n- The screed now has a dim white overlay when the FAB is opened\r\n- Changed FAB text label design\r\n- FAB no longer stays open when leaving and coming back"}},"public":true,"created_at":"2015-01-01T01:04:55Z"}
{"id":"2489397966","type":"PushEvent","actor":{"id":126935,"login":"theresaanna","gravatar_id":"","url":"https://api.github.com/users/theresaanna","avatar_url":"https://avatars.githubusercontent.com/u/126935?"},"repo":{"id":25273785,"name":"18F/openFEC-web-app","url":"https://api.github.com/repos/18F/openFEC-web-app"},"payload":{"push_id":536753162,"size":1,"distinct_size":1,"ref":"refs/heads/selenium","head":"837d603ad978daad675b2b387500eab3750b5ce1","before":"b213b555b98a97b8ecd7213d2f8148a6d408b006","commits":[{"sha":"837d603ad978daad675b2b387500eab3750b5ce1","author":{"email":"102aa063a04718b7675f2a11275a651f31704f92@gsa.gov","name":"Theresa Summa"},"message":"fixing tests","distinct":true,"url":"https://api.github.com/repos/18F/openFEC-web-app/commits/837d603ad978daad675b2b387500eab3750b5ce1"}]},"public":true,"created_at":"2015-01-01T01:04:55Z","org":{"id":6233994,"login":"18F","gravatar_id":"","url":"https://api.github.com/orgs/18F","avatar_url":"https://avatars.githubusercontent.com/u/6233994?"}}
{"id":"2489397968","type":"CreateEvent","actor":{"id":3134745,"login":"Vextil","gravatar_id":"","url":"https://api.github.com/users/Vextil","avatar_url":"https://avatars.githubusercontent.com/u/3134745?"},"repo":{"id":28277457,"name":"Vextil/WAMD","url":"https://api.github.com/repos/Vextil/WAMD"},"payload":{"ref":"2.1.0-release","ref_type":"tag","master_branch":"master","description":"WAMD is a Material Design mod of the most popular mobile messaging app.","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:04:56Z"}
{"id":"2489397970","type":"PushEvent","actor":{"id":66897,"login":"asad","gravatar_id":"","url":"https://api.github.com/users/asad","avatar_url":"https://avatars.githubusercontent.com/u/66897?"},"repo":{"id":28622285,"name":"asad/ChemBLAST","url":"https://api.github.com/repos/asad/ChemBLAST"},"payload":{"push_id":536753164,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f82c115e656962e0ee327c14a26c586b5da5d53b","before":"4fd33b8625d56ca7dcda0acc38f6f51ec1358c87","commits":[{"sha":"f82c115e656962e0ee327c14a26c586b5da5d53b","author":{"email":"09eb4ce7c91ecff4eff21da1532c566afe7cb66c@gmail.com","name":"Syed Asad Rahman"},"message":"fork and join blast search implemented - 4X speed obtained","distinct":true,"url":"https://api.github.com/repos/asad/ChemBLAST/commits/f82c115e656962e0ee327c14a26c586b5da5d53b"}]},"public":true,"created_at":"2015-01-01T01:04:56Z"}
{"id":"2489397975","type":"WatchEvent","actor":{"id":1177325,"login":"iguto","gravatar_id":"","url":"https://api.github.com/users/iguto","avatar_url":"https://avatars.githubusercontent.com/u/1177325?"},"repo":{"id":26689598,"name":"prakhar1989/awesome-courses","url":"https://api.github.com/repos/prakhar1989/awesome-courses"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:04:57Z"}
{"id":"2489397976","type":"IssueCommentEvent","actor":{"id":790740,"login":"bokmadsen","gravatar_id":"","url":"https://api.github.com/users/bokmadsen","avatar_url":"https://avatars.githubusercontent.com/u/790740?"},"repo":{"id":20463939,"name":"XLabs/Xamarin-Forms-Labs","url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/534","labels_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/534/labels{/name}","comments_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/534/comments","events_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/534/events","html_url":"https://github.com/XLabs/Xamarin-Forms-Labs/pull/534","id":52600191,"number":534,"title":"Added null check in HybridWebView","user":{"login":"bokmadsen","id":790740,"avatar_url":"https://avatars.githubusercontent.com/u/790740?v=3","gravatar_id":"","url":"https://api.github.com/users/bokmadsen","html_url":"https://github.com/bokmadsen","followers_url":"https://api.github.com/users/bokmadsen/followers","following_url":"https://api.github.com/users/bokmadsen/following{/other_user}","gists_url":"https://api.github.com/users/bokmadsen/gists{/gist_id}","starred_url":"https://api.github.com/users/bokmadsen/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/bokmadsen/subscriptions","organizations_url":"https://api.github.com/users/bokmadsen/orgs","repos_url":"https://api.github.com/users/bokmadsen/repos","events_url":"https://api.github.com/users/bokmadsen/events{/privacy}","received_events_url":"https://api.github.com/users/bokmadsen/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2014-12-21T17:00:20Z","updated_at":"2015-01-01T01:04:57Z","closed_at":"2015-01-01T00:59:55Z","pull_request":{"url":"https://api.github.com/repos/XLabs/
Xamarin-Forms-Labs/pulls/534","html_url":"https://github.com/XLabs/Xamarin-Forms-Labs/pull/534","diff_url":"https://github.com/XLabs/Xamarin-Forms-Labs/pull/534.diff","patch_url":"https://github.com/XLabs/Xamarin-Forms-Labs/pull/534.patch"},"body":""},"comment":{"url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/comments/68477321","html_url":"https://github.com/XLabs/Xamarin-Forms-Labs/pull/534#issuecomment-68477321","issue_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/534","id":68477321,"user":{"login":"bokmadsen","id":790740,"avatar_url":"https://avatars.githubusercontent.com/u/790740?v=3","gravatar_id":"","url":"https://api.github.com/users/bokmadsen","html_url":"https://github.com/bokmadsen","followers_url":"https://api.github.com/users/bokmadsen/followers","following_url":"https://api.github.com/users/bokmadsen/following{/other_user}","gists_url":"https://api.github.com/users/bokmadsen/gists{/gist_id}","starred_url":"https://api.github.com/users/bokmadsen/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/bokmadsen/subscriptions","organizations_url":"https://api.github.com/users/bokmadsen/orgs","repos_url":"https://api.github.com/users/bokmadsen/repos","events_url":"https://api.github.com/users/bokmadsen/events{/privacy}","received_events_url":"https://api.github.com/users/bokmadsen/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:04:57Z","updated_at":"2015-01-01T01:04:57Z","body":"Why is this closed? I've a situation where I reload a HybridWebView and it crashed because Element is null"}},"public":true,"created_at":"2015-01-01T01:04:57Z","org":{"id":7787062,"login":"XLabs","gravatar_id":"","url":"https://api.github.com/orgs/XLabs","avatar_url":"https://avatars.githubusercontent.com/u/7787062?"}}
{"id":"2489397981","type":"IssueCommentEvent","actor":{"id":6964047,"login":"TTMTT","gravatar_id":"","url":"https://api.github.com/users/TTMTT","avatar_url":"https://avatars.githubusercontent.com/u/6964047?"},"repo":{"id":26731988,"name":"badrsony/icloudin-support-","url":"https://api.github.com/repos/badrsony/icloudin-support-"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/8","labels_url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/8/labels{/name}","comments_url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/8/comments","events_url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/8/events","html_url":"https://github.com/badrsony/icloudin-support-/issues/8","id":53208937,"number":8,"title":"icloudin support ","user":{"login":"badrsony","id":7895050,"avatar_url":"https://avatars.githubusercontent.com/u/7895050?v=3","gravatar_id":"","url":"https://api.github.com/users/badrsony","html_url":"https://github.com/badrsony","followers_url":"https://api.github.com/users/badrsony/followers","following_url":"https://api.github.com/users/badrsony/following{/other_user}","gists_url":"https://api.github.com/users/badrsony/gists{/gist_id}","starred_url":"https://api.github.com/users/badrsony/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/badrsony/subscriptions","organizations_url":"https://api.github.com/users/badrsony/orgs","repos_url":"https://api.github.com/users/badrsony/repos","events_url":"https://api.github.com/users/badrsony/events{/privacy}","received_events_url":"https://api.github.com/users/badrsony/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":9,"created_at":"2014-12-31T23:58:27Z","updated_at":"2015-01-01T01:04:58Z","closed_at":null,"body":"Originally written by @TTMTT. 
That we hope for him safery and peace\r\n.\r\n\r\nWow, ipod touch 5G (8.1) - iCL0udin v1.0 bypass activation (icloud)\r\n\r\nhttp://youtu.be/tZmEdlDGNu4\r\n\r\niCL0udin v1.0 bypass activation (icloud) - ipad mini 2G (7.1.1)\r\n\r\nhttp://youtu.be/tevYyBN2QCQ\r\n\r\nVideo for bypass icloud (iCL0udin v1.0) for iphone 4 CDMA ..\r\n\r\nhttp://youtu.be/i85-D6N2YLk\r\n\r\nNew video for iCL0udin v1.0 bypass icloud (3 iphones 7.1.2):\r\n\r\nhttp://youtu.be/p51TNlCr7ug\r\n\r\niCL0udin v1.0 -> %98\r\n\r\nRemaining: %2 testing with some people..\r\n\r\nLast Method:\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any ios)\r\nmethod 3 : via (change some string by hex on ELF file << some times i got error)\r\nmethod 4 : via (use apple ssl cert or real ssl in server and change some string in iphone)\r\n\r\niCL0udin v1.0 have this method:\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any 
ios)"},"comment":{"url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/comments/68477322","html_url":"https://github.com/badrsony/icloudin-support-/issues/8#issuecomment-68477322","issue_url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/8","id":68477322,"user":{"login":"TTMTT","id":6964047,"avatar_url":"https://avatars.githubusercontent.com/u/6964047?v=3","gravatar_id":"","url":"https://api.github.com/users/TTMTT","html_url":"https://github.com/TTMTT","followers_url":"https://api.github.com/users/TTMTT/followers","following_url":"https://api.github.com/users/TTMTT/following{/other_user}","gists_url":"https://api.github.com/users/TTMTT/gists{/gist_id}","starred_url":"https://api.github.com/users/TTMTT/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/TTMTT/subscriptions","organizations_url":"https://api.github.com/users/TTMTT/orgs","repos_url":"https://api.github.com/users/TTMTT/repos","events_url":"https://api.github.com/users/TTMTT/events{/privacy}","received_events_url":"https://api.github.com/users/TTMTT/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:04:58Z","updated_at":"2015-01-01T01:04:58Z","body":"@badrsony \r\nexcuse me i open a new discuss for (iCL0udin v1.0):\r\n--------------------------------------------------------\r\nhttps://github.com/TTMTT/iCL0udin/issues/1\r\n--------------------------------------------------------"}},"public":true,"created_at":"2015-01-01T01:04:58Z"}
{"id":"2489397982","type":"ForkEvent","actor":{"id":10361479,"login":"mahlon15","gravatar_id":"","url":"https://api.github.com/users/mahlon15","avatar_url":"https://avatars.githubusercontent.com/u/10361479?"},"repo":{"id":20042152,"name":"nightscout/cgm-remote-monitor","url":"https://api.github.com/repos/nightscout/cgm-remote-monitor"},"payload":{"forkee":{"id":28678265,"name":"cgm-remote-monitor","full_name":"mahlon15/cgm-remote-monitor","owner":{"login":"mahlon15","id":10361479,"avatar_url":"https://avatars.githubusercontent.com/u/10361479?v=3","gravatar_id":"","url":"https://api.github.com/users/mahlon15","html_url":"https://github.com/mahlon15","followers_url":"https://api.github.com/users/mahlon15/followers","following_url":"https://api.github.com/users/mahlon15/following{/other_user}","gists_url":"https://api.github.com/users/mahlon15/gists{/gist_id}","starred_url":"https://api.github.com/users/mahlon15/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/mahlon15/subscriptions","organizations_url":"https://api.github.com/users/mahlon15/orgs","repos_url":"https://api.github.com/users/mahlon15/repos","events_url":"https://api.github.com/users/mahlon15/events{/privacy}","received_events_url":"https://api.github.com/users/mahlon15/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/mahlon15/cgm-remote-monitor","description":"nightscout web 
monitor","fork":true,"url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor","forks_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/forks","keys_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/keys{/key_id}","collaborators_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/teams","hooks_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/hooks","issue_events_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/issues/events{/number}","events_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/events","assignees_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/assignees{/user}","branches_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/branches{/branch}","tags_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/tags","blobs_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/git/refs{/sha}","trees_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/git/trees{/sha}","statuses_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/statuses/{sha}","languages_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/languages","stargazers_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/stargazers","contributors_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/contributors","subscribers_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/subscribers","subscription_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/subscription","commits_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/commits{/sha}","git_commits_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/git/c
ommits{/sha}","comments_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/comments{/number}","issue_comment_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/issues/comments/{number}","contents_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/contents/{+path}","compare_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/compare/{base}...{head}","merges_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/merges","archive_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/downloads","issues_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/issues{/number}","pulls_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/pulls{/number}","milestones_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/milestones{/number}","notifications_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/labels{/name}","releases_url":"https://api.github.com/repos/mahlon15/cgm-remote-monitor/releases{/id}","created_at":"2015-01-01T01:04:58Z","updated_at":"2014-12-30T04:33:26Z","pushed_at":"2014-12-31T18:14:04Z","git_url":"git://github.com/mahlon15/cgm-remote-monitor.git","ssh_url":"git@github.com:mahlon15/cgm-remote-monitor.git","clone_url":"https://github.com/mahlon15/cgm-remote-monitor.git","svn_url":"https://github.com/mahlon15/cgm-remote-monitor","homepage":"","size":9502,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:04:59Z","org":{"id":7661012,"login":"nightscout","gravatar_id":"","url":"https://api.github.c
om/orgs/nightscout","avatar_url":"https://avatars.githubusercontent.com/u/7661012?"}}
{"id":"2489397984","type":"PushEvent","actor":{"id":7377949,"login":"rusefi","gravatar_id":"","url":"https://api.github.com/users/rusefi","avatar_url":"https://avatars.githubusercontent.com/u/7377949?"},"repo":{"id":19047649,"name":"rusefi/rusefi","url":"https://api.github.com/repos/rusefi/rusefi"},"payload":{"push_id":536753170,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"98582a43442ee88c1f3f1ced20131de107e3fd52","before":"6f7687ac1d7ba2adb73b9799dfa2831c9dfbdbf3","commits":[{"sha":"98582a43442ee88c1f3f1ced20131de107e3fd52","author":{"email":"667fbe48699c76efd895fe8014d756c77fa79f0f@gmail.com","name":"rusEfi"},"message":"auto-sync","distinct":true,"url":"https://api.github.com/repos/rusefi/rusefi/commits/98582a43442ee88c1f3f1ced20131de107e3fd52"}]},"public":true,"created_at":"2015-01-01T01:04:59Z"}
{"id":"2489397989","type":"CreateEvent","actor":{"id":995241,"login":"ggkuron","gravatar_id":"","url":"https://api.github.com/users/ggkuron","avatar_url":"https://avatars.githubusercontent.com/u/995241?"},"repo":{"id":12571910,"name":"ggkuron/dotfiles","url":"https://api.github.com/repos/ggkuron/dotfiles"},"payload":{"ref":"x230","ref_type":"branch","master_branch":"master","description":"my dotfiles","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:04:59Z"}
{"id":"2489397990","type":"PushEvent","actor":{"id":4380972,"login":"Camtendo","gravatar_id":"","url":"https://api.github.com/users/Camtendo","avatar_url":"https://avatars.githubusercontent.com/u/4380972?"},"repo":{"id":27618890,"name":"dguenther/web-overlay","url":"https://api.github.com/repos/dguenther/web-overlay"},"payload":{"push_id":536753171,"size":1,"distinct_size":1,"ref":"refs/heads/TwitchImplementation","head":"69a6a3723f7bce2d645d3a2a55d0bc8b019abd18","before":"db1e6eda79253813da6588cf457cd59a238c8ee2","commits":[{"sha":"69a6a3723f7bce2d645d3a2a55d0bc8b019abd18","author":{"email":"aba648f93bc6924c2458971c10c6192365c58b55@gmail.com","name":"Cameron Crockrom"},"message":"Use setTimeout for safety vs. setInterval.","distinct":true,"url":"https://api.github.com/repos/dguenther/web-overlay/commits/69a6a3723f7bce2d645d3a2a55d0bc8b019abd18"}]},"public":true,"created_at":"2015-01-01T01:04:59Z"}
{"id":"2489397992","type":"WatchEvent","actor":{"id":132444,"login":"PlasticLizard","gravatar_id":"","url":"https://api.github.com/users/PlasticLizard","avatar_url":"https://avatars.githubusercontent.com/u/132444?"},"repo":{"id":11225014,"name":"coreos/etcd","url":"https://api.github.com/repos/coreos/etcd"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:05:01Z","org":{"id":3730757,"login":"coreos","gravatar_id":"","url":"https://api.github.com/orgs/coreos","avatar_url":"https://avatars.githubusercontent.com/u/3730757?"}}
{"id":"2489397993","type":"PullRequestReviewCommentEvent","actor":{"id":523287,"login":"j2sol","gravatar_id":"","url":"https://api.github.com/users/j2sol","avatar_url":"https://avatars.githubusercontent.com/u/523287?"},"repo":{"id":11848896,"name":"blueboxgroup/ursula","url":"https://api.github.com/repos/blueboxgroup/ursula"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397288","id":22397288,"diff_hunk":"@@ -1,121 +1,92 @@\n ---\n-- name: install apache\n-  apt: pkg={{ item }}\n-  with_items:\n-    - apache2\n-    - libapache2-mod-wsgi\n-\n - name: lesscpy must be in apache PATH\n   pip: name=lesscpy version=0.9j\n \n - name: get horizon source repo\n-  git: repo={{ openstack.git_mirror }}/horizon.git\n-       dest=/opt/stack/horizon\n-       version={{ horizon.rev }}\n-       update={{ openstack.git_update }}\n+  git: |\n+    repo={{ openstack.git_mirror}}/horizon.git\n+    dest=/opt/stack/horizon\n+    version={{ horizon.rev }}\n+    update={{ openstack.git_update }}\n   notify:\n     - setup horizon venv\n     - compress horizon assets\n \n-- template: src=opt/stack/horizon/hide-external-networks.patch dest=/opt/stack/horizon/hide-external-networks.patch mode=0644\n-- shell: patch -p1 < hide-external-networks.patch chdir=/opt/stack/horizon\n-  notify:\n-    - setup horizon venv\n-\n - name: add python-memcached to horizon requirements\n-  lineinfile: dest=/opt/stack/horizon/requirements.txt\n-              regexp=^python-memcached\n-              line=python-memcached\n+  lineinfile: dest=/opt/stack/horizon/requirements.txt regexp=^python-memcached line=python-memcached\n   notify:\n     - setup horizon venv\n \n-- name: disable apache status\n-  command: a2dismod status\n-  notify:\n-    - restart apache\n-\n-- name: apache ports config\n-  template: src=etc/apache2/ports.conf\n-            dest=/etc/apache2/ports.conf\n-  notify:\n-    - restart apache\n-\n-- name: disable default apache 
site\n-  command: a2dissite 000-default\n+- name: make sure apache knows about horizon ports\n+  lineinfile: dest=/etc/apache2/ports.conf line=\"Listen 8080\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config (12.04)\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard\n+- name: create dashboard virtualhost on precise\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard\n   when: ansible_distribution_version == \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard.conf\n+- name: create dashboard virtualhost on other\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard.conf\n   when: ansible_distribution_version != \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n - name: enable horizon apache site\n-  command: a2ensite openstack_dashboard\n+  apache2_site: state=enabled name=openstack_dashboard\n   notify:\n-    - restart apache\n-\n-- name: static asset directories\n-  file: dest={{ item }}\n-        state=directory\n-        owner=www-data\n-        group=www-data\n-        mode=0755\n+    - reload apache\n+\n+- name: create static asset dirs\n+  file: |\n+    dest={{ item }}\n+    state=directory\n+    owner=www-data\n+    group=www-data\n+    mode=0755\n   with_items:\n     - /opt/stack/horizon/static\n     - /opt/stack/horizon/static/dashboard\n \n-- name: horizon local settings\n-  template: src=opt/stack/horizon/openstack_dashboard/local/local_settings.py\n-            dest=/opt/stack/horizon/openstack_dashboard/local/local_settings.py\n-            
mode=0644\n+- name: dashboard settings\n+  template: |","path":"roles/horizon/tasks/main.yml","position":111,"original_position":111,"commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","original_commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"j2sol","id":523287,"avatar_url":"https://avatars.githubusercontent.com/u/523287?v=3","gravatar_id":"","url":"https://api.github.com/users/j2sol","html_url":"https://github.com/j2sol","followers_url":"https://api.github.com/users/j2sol/followers","following_url":"https://api.github.com/users/j2sol/following{/other_user}","gists_url":"https://api.github.com/users/j2sol/gists{/gist_id}","starred_url":"https://api.github.com/users/j2sol/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/j2sol/subscriptions","organizations_url":"https://api.github.com/users/j2sol/orgs","repos_url":"https://api.github.com/users/j2sol/repos","events_url":"https://api.github.com/users/j2sol/events{/privacy}","received_events_url":"https://api.github.com/users/j2sol/received_events","type":"User","site_admin":false},"body":"?","created_at":"2015-01-01T01:05:00Z","updated_at":"2015-01-01T01:05:00Z","html_url":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397288","pull_request_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397288"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397288"},"pull_request":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"}}},"pull_request":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","id":26738851,"html_url":"https://github.com/blueboxgroup/ursula/pull/705","diff_url":"https://github.com/blueboxgroup/ursula/pull/705.diff","patch_url":"https://github.com/blueboxgroup/ursula/pull/705.patch","issue_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705","number":705,"state"
:"open","locked":false,"title":"WIP:  apache for loadbalancing","user":{"login":"paulczar","id":2488346,"avatar_url":"https://avatars.githubusercontent.com/u/2488346?v=3","gravatar_id":"","url":"https://api.github.com/users/paulczar","html_url":"https://github.com/paulczar","followers_url":"https://api.github.com/users/paulczar/followers","following_url":"https://api.github.com/users/paulczar/following{/other_user}","gists_url":"https://api.github.com/users/paulczar/gists{/gist_id}","starred_url":"https://api.github.com/users/paulczar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/paulczar/subscriptions","organizations_url":"https://api.github.com/users/paulczar/orgs","repos_url":"https://api.github.com/users/paulczar/repos","events_url":"https://api.github.com/users/paulczar/events{/privacy}","received_events_url":"https://api.github.com/users/paulczar/received_events","type":"User","site_admin":false},"body":"This is a quick POC / WIP to demo using apache instead of haproxy for loadbalancing our APIs.\r\n\r\nI think this gives us more flexibiltiy as we can enable in the APIs role itself ( in this case in keystone ) rather than a big monolithic haproxy.conf.      We also already have apache running for horizon, so it could reduce number of services.    apache also has better logging options that haproxy which can only log to syslog. 
","created_at":"2015-01-01T00:04:13Z","updated_at":"2015-01-01T01:05:00Z","closed_at":null,"merged_at":null,"merge_commit_sha":"9b91693f11e166c9ee53836f19697868d412bf76","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits","review_comments_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments","review_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f","head":{"label":"blueboxgroup:use_apache_for_lb","ref":"use_apache_for_lb","sha":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https
://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repo
s/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/comments/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.gi
t","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"base":{"label":"blueboxgroup:master","ref":"master","sha":"34b83c65ff0de2f8b006d8ce4f76919fe0167bbf","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users
/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"
https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/comments/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirr
or_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705"},"issue":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705"},"comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments"},"review_comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments"},"review_comment":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits"},"statuses":{"href":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f"}}}},"public":true,"created_at":"2015-01-01T01:05:00Z","org":{"id":458705,"login":"blueboxgroup","gravatar_id":"","url":"https://api.github.com/orgs/blueboxgroup","avatar_url":"https://avatars.githubusercontent.com/u/458705?"}}
{"id":"2489397994","type":"PushEvent","actor":{"id":280212,"login":"KenanSulayman","gravatar_id":"","url":"https://api.github.com/users/KenanSulayman","avatar_url":"https://avatars.githubusercontent.com/u/280212?"},"repo":{"id":21481110,"name":"KenanSulayman/heartbeat","url":"https://api.github.com/repos/KenanSulayman/heartbeat"},"payload":{"push_id":536753173,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"089c8f0d2bac3da1fec35e110c876455549123ae","before":"f673aef9bc6b115cda55214d362fde50d301ea25","commits":[{"sha":"089c8f0d2bac3da1fec35e110c876455549123ae","author":{"email":"9176253dfc0bc82671a5e984646605f93319147a@sly.mn","name":"Kenan Sulayman"},"message":"1420074298826\n\nIim2uaMEmeYuzjr/BB4HDY5aDAhN4tj3tUKkEefUDNY=","distinct":true,"url":"https://api.github.com/repos/KenanSulayman/heartbeat/commits/089c8f0d2bac3da1fec35e110c876455549123ae"}]},"public":true,"created_at":"2015-01-01T01:05:01Z"}
{"id":"2489397996","type":"PushEvent","actor":{"id":2961036,"login":"codemercenary","gravatar_id":"","url":"https://api.github.com/users/codemercenary","avatar_url":"https://avatars.githubusercontent.com/u/2961036?"},"repo":{"id":22248790,"name":"codemercenary/autowiring","url":"https://api.github.com/repos/codemercenary/autowiring"},"payload":{"push_id":536753175,"size":2,"distinct_size":2,"ref":"refs/heads/fix-autoboost","head":"8f51be0a57b7463e15546b48ef20e07405c4fbcc","before":"36b2b53a58e4725efd0cf1a9823175cd492ad044","commits":[{"sha":"84a8a258066868e409162319da3c48751b136029","author":{"email":"f4b726eb4428c94ec1239af9e3b06d73d64a2f9c@gmail.com","name":"Jason Lokerson"},"message":"Fix header guards","distinct":true,"url":"https://api.github.com/repos/codemercenary/autowiring/commits/84a8a258066868e409162319da3c48751b136029"},{"sha":"8f51be0a57b7463e15546b48ef20e07405c4fbcc","author":{"email":"f4b726eb4428c94ec1239af9e3b06d73d64a2f9c@gmail.com","name":"Jason Lokerson"},"message":"Eliminate placeholder injection","distinct":true,"url":"https://api.github.com/repos/codemercenary/autowiring/commits/8f51be0a57b7463e15546b48ef20e07405c4fbcc"}]},"public":true,"created_at":"2015-01-01T01:05:01Z"}
{"id":"2489397998","type":"PushEvent","actor":{"id":671161,"login":"aimanparvaiz","gravatar_id":"","url":"https://api.github.com/users/aimanparvaiz","avatar_url":"https://avatars.githubusercontent.com/u/671161?"},"repo":{"id":28207723,"name":"akamel001/ssg","url":"https://api.github.com/repos/akamel001/ssg"},"payload":{"push_id":536753176,"size":1,"distinct_size":1,"ref":"refs/heads/redis","head":"97a09d2a39aa88d8a05080f028027071a2aedc77","before":"4be94c06212e79117a33df49c03ffd75742bf5ef","commits":[{"sha":"97a09d2a39aa88d8a05080f028027071a2aedc77","author":{"email":"a36175434507c8d1ff8c192e77af99c0d5cb0179@gmail.com","name":"aimanparvaiz"},"message":"Reverting changes to data_dplit not returning anything","distinct":true,"url":"https://api.github.com/repos/akamel001/ssg/commits/97a09d2a39aa88d8a05080f028027071a2aedc77"}]},"public":true,"created_at":"2015-01-01T01:05:01Z"}
{"id":"2489397999","type":"PushEvent","actor":{"id":2851221,"login":"alkass","gravatar_id":"","url":"https://api.github.com/users/alkass","avatar_url":"https://avatars.githubusercontent.com/u/2851221?"},"repo":{"id":28678233,"name":"alkass/seQre","url":"https://api.github.com/repos/alkass/seQre"},"payload":{"push_id":536753177,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"c205a49edb938d205047779cb9492e125de331ca","before":"3e46496fed34162743f34c34d45cca60df88ba6f","commits":[{"sha":"c205a49edb938d205047779cb9492e125de331ca","author":{"email":"a11a5b354f8e573649b5660989b915a86618a1f4@yahoo.com","name":"Fadi Hanna Al-Kass"},"message":"first commit","distinct":true,"url":"https://api.github.com/repos/alkass/seQre/commits/c205a49edb938d205047779cb9492e125de331ca"}]},"public":true,"created_at":"2015-01-01T01:05:01Z"}
{"id":"2489398007","type":"CreateEvent","actor":{"id":1265899,"login":"lynas","gravatar_id":"","url":"https://api.github.com/users/lynas","avatar_url":"https://avatars.githubusercontent.com/u/1265899?"},"repo":{"id":28678267,"name":"lynas/testforcom","url":"https://api.github.com/repos/lynas/testforcom"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:05:02Z"}
{"id":"2489398010","type":"PushEvent","actor":{"id":1681249,"login":"Toeler","gravatar_id":"","url":"https://api.github.com/users/Toeler","avatar_url":"https://avatars.githubusercontent.com/u/1681249?"},"repo":{"id":28678136,"name":"Toeler/Handmade-Hero","url":"https://api.github.com/repos/Toeler/Handmade-Hero"},"payload":{"push_id":536753180,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"294751cfbc4128f170d1f29059758ddd33fc0215","before":"408100c353fa4aa5b211754d5cfc1d83b8c359a3","commits":[{"sha":"294751cfbc4128f170d1f29059758ddd33fc0215","author":{"email":"1567efe08cf0fe56c7f6c76e22ebfc0c7eb0ca87@gmail.com","name":"Toeler"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/Toeler/Handmade-Hero/commits/294751cfbc4128f170d1f29059758ddd33fc0215"}]},"public":true,"created_at":"2015-01-01T01:05:02Z"}
{"id":"2489398012","type":"PushEvent","actor":{"id":6142965,"login":"toshibo","gravatar_id":"","url":"https://api.github.com/users/toshibo","avatar_url":"https://avatars.githubusercontent.com/u/6142965?"},"repo":{"id":28669825,"name":"toshibo/first_app","url":"https://api.github.com/repos/toshibo/first_app"},"payload":{"push_id":536753181,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"69adeede51123c81ea048177e88a7f0e19cd1dc5","before":"b3289500062ee995801e6d33f9ea834648adbafa","commits":[{"sha":"69adeede51123c81ea048177e88a7f0e19cd1dc5","author":{"email":"4a4dd8a7d0feb6dd182beabd5d78e33952f10637@gmail.com","name":"toshibo"},"message":"Improve the README file","distinct":true,"url":"https://api.github.com/repos/toshibo/first_app/commits/69adeede51123c81ea048177e88a7f0e19cd1dc5"}]},"public":true,"created_at":"2015-01-01T01:05:03Z"}
{"id":"2489398017","type":"PullRequestEvent","actor":{"id":69068,"login":"someara","gravatar_id":"","url":"https://api.github.com/users/someara","avatar_url":"https://avatars.githubusercontent.com/u/69068?"},"repo":{"id":28657951,"name":"hypomonk/slacker-packer","url":"https://api.github.com/repos/hypomonk/slacker-packer"},"payload":{"action":"opened","number":2,"pull_request":{"url":"https://api.github.com/repos/hypomonk/slacker-packer/pulls/2","id":26739453,"html_url":"https://github.com/hypomonk/slacker-packer/pull/2","diff_url":"https://github.com/hypomonk/slacker-packer/pull/2.diff","patch_url":"https://github.com/hypomonk/slacker-packer/pull/2.patch","issue_url":"https://api.github.com/repos/hypomonk/slacker-packer/issues/2","number":2,"state":"open","locked":false,"title":"adding .gitignore and --no-check-certificates","user":{"login":"someara","id":69068,"avatar_url":"https://avatars.githubusercontent.com/u/69068?v=3","gravatar_id":"","url":"https://api.github.com/users/someara","html_url":"https://github.com/someara","followers_url":"https://api.github.com/users/someara/followers","following_url":"https://api.github.com/users/someara/following{/other_user}","gists_url":"https://api.github.com/users/someara/gists{/gist_id}","starred_url":"https://api.github.com/users/someara/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/someara/subscriptions","organizations_url":"https://api.github.com/users/someara/orgs","repos_url":"https://api.github.com/users/someara/repos","events_url":"https://api.github.com/users/someara/events{/privacy}","received_events_url":"https://api.github.com/users/someara/received_events","type":"User","site_admin":false},"body":"","created_at":"2015-01-01T01:05:04Z","updated_at":"2015-01-01T01:05:04Z","closed_at":null,"merged_at":null,"merge_commit_sha":null,"assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/hypomonk/slacker-packer/pulls/2/commits","review_comments_url":"https://api.githu
b.com/repos/hypomonk/slacker-packer/pulls/2/comments","review_comment_url":"https://api.github.com/repos/hypomonk/slacker-packer/pulls/comments/{number}","comments_url":"https://api.github.com/repos/hypomonk/slacker-packer/issues/2/comments","statuses_url":"https://api.github.com/repos/hypomonk/slacker-packer/statuses/a167b8d1405621a26333fda5325d389eeccc05ff","head":{"label":"someara:master","ref":"master","sha":"a167b8d1405621a26333fda5325d389eeccc05ff","user":{"login":"someara","id":69068,"avatar_url":"https://avatars.githubusercontent.com/u/69068?v=3","gravatar_id":"","url":"https://api.github.com/users/someara","html_url":"https://github.com/someara","followers_url":"https://api.github.com/users/someara/followers","following_url":"https://api.github.com/users/someara/following{/other_user}","gists_url":"https://api.github.com/users/someara/gists{/gist_id}","starred_url":"https://api.github.com/users/someara/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/someara/subscriptions","organizations_url":"https://api.github.com/users/someara/orgs","repos_url":"https://api.github.com/users/someara/repos","events_url":"https://api.github.com/users/someara/events{/privacy}","received_events_url":"https://api.github.com/users/someara/received_events","type":"User","site_admin":false},"repo":{"id":28658028,"name":"slacker-packer","full_name":"someara/slacker-packer","owner":{"login":"someara","id":69068,"avatar_url":"https://avatars.githubusercontent.com/u/69068?v=3","gravatar_id":"","url":"https://api.github.com/users/someara","html_url":"https://github.com/someara","followers_url":"https://api.github.com/users/someara/followers","following_url":"https://api.github.com/users/someara/following{/other_user}","gists_url":"https://api.github.com/users/someara/gists{/gist_id}","starred_url":"https://api.github.com/users/someara/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/someara/subscriptions","organizations_url":"https://a
pi.github.com/users/someara/orgs","repos_url":"https://api.github.com/users/someara/repos","events_url":"https://api.github.com/users/someara/events{/privacy}","received_events_url":"https://api.github.com/users/someara/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/someara/slacker-packer","description":"","fork":true,"url":"https://api.github.com/repos/someara/slacker-packer","forks_url":"https://api.github.com/repos/someara/slacker-packer/forks","keys_url":"https://api.github.com/repos/someara/slacker-packer/keys{/key_id}","collaborators_url":"https://api.github.com/repos/someara/slacker-packer/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/someara/slacker-packer/teams","hooks_url":"https://api.github.com/repos/someara/slacker-packer/hooks","issue_events_url":"https://api.github.com/repos/someara/slacker-packer/issues/events{/number}","events_url":"https://api.github.com/repos/someara/slacker-packer/events","assignees_url":"https://api.github.com/repos/someara/slacker-packer/assignees{/user}","branches_url":"https://api.github.com/repos/someara/slacker-packer/branches{/branch}","tags_url":"https://api.github.com/repos/someara/slacker-packer/tags","blobs_url":"https://api.github.com/repos/someara/slacker-packer/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/someara/slacker-packer/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/someara/slacker-packer/git/refs{/sha}","trees_url":"https://api.github.com/repos/someara/slacker-packer/git/trees{/sha}","statuses_url":"https://api.github.com/repos/someara/slacker-packer/statuses/{sha}","languages_url":"https://api.github.com/repos/someara/slacker-packer/languages","stargazers_url":"https://api.github.com/repos/someara/slacker-packer/stargazers","contributors_url":"https://api.github.com/repos/someara/slacker-packer/contributors","subscribers_url":"https://api.github.com/repos/someara/slacker-packer/subscribers","subscrip
tion_url":"https://api.github.com/repos/someara/slacker-packer/subscription","commits_url":"https://api.github.com/repos/someara/slacker-packer/commits{/sha}","git_commits_url":"https://api.github.com/repos/someara/slacker-packer/git/commits{/sha}","comments_url":"https://api.github.com/repos/someara/slacker-packer/comments{/number}","issue_comment_url":"https://api.github.com/repos/someara/slacker-packer/issues/comments/{number}","contents_url":"https://api.github.com/repos/someara/slacker-packer/contents/{+path}","compare_url":"https://api.github.com/repos/someara/slacker-packer/compare/{base}...{head}","merges_url":"https://api.github.com/repos/someara/slacker-packer/merges","archive_url":"https://api.github.com/repos/someara/slacker-packer/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/someara/slacker-packer/downloads","issues_url":"https://api.github.com/repos/someara/slacker-packer/issues{/number}","pulls_url":"https://api.github.com/repos/someara/slacker-packer/pulls{/number}","milestones_url":"https://api.github.com/repos/someara/slacker-packer/milestones{/number}","notifications_url":"https://api.github.com/repos/someara/slacker-packer/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/someara/slacker-packer/labels{/name}","releases_url":"https://api.github.com/repos/someara/slacker-packer/releases{/id}","created_at":"2014-12-31T06:18:22Z","updated_at":"2015-01-01T01:04:37Z","pushed_at":"2015-01-01T01:04:37Z","git_url":"git://github.com/someara/slacker-packer.git","ssh_url":"git@github.com:someara/slacker-packer.git","clone_url":"https://github.com/someara/slacker-packer.git","svn_url":"https://github.com/someara/slacker-packer","homepage":null,"size":0,"stargazers_count":0,"watchers_count":0,"language":"Shell","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"
}},"base":{"label":"hypomonk:master","ref":"master","sha":"09f12c2d299252470229258e6f4a98f439bd025e","user":{"login":"hypomonk","id":6394422,"avatar_url":"https://avatars.githubusercontent.com/u/6394422?v=3","gravatar_id":"","url":"https://api.github.com/users/hypomonk","html_url":"https://github.com/hypomonk","followers_url":"https://api.github.com/users/hypomonk/followers","following_url":"https://api.github.com/users/hypomonk/following{/other_user}","gists_url":"https://api.github.com/users/hypomonk/gists{/gist_id}","starred_url":"https://api.github.com/users/hypomonk/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/hypomonk/subscriptions","organizations_url":"https://api.github.com/users/hypomonk/orgs","repos_url":"https://api.github.com/users/hypomonk/repos","events_url":"https://api.github.com/users/hypomonk/events{/privacy}","received_events_url":"https://api.github.com/users/hypomonk/received_events","type":"User","site_admin":false},"repo":{"id":28657951,"name":"slacker-packer","full_name":"hypomonk/slacker-packer","owner":{"login":"hypomonk","id":6394422,"avatar_url":"https://avatars.githubusercontent.com/u/6394422?v=3","gravatar_id":"","url":"https://api.github.com/users/hypomonk","html_url":"https://github.com/hypomonk","followers_url":"https://api.github.com/users/hypomonk/followers","following_url":"https://api.github.com/users/hypomonk/following{/other_user}","gists_url":"https://api.github.com/users/hypomonk/gists{/gist_id}","starred_url":"https://api.github.com/users/hypomonk/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/hypomonk/subscriptions","organizations_url":"https://api.github.com/users/hypomonk/orgs","repos_url":"https://api.github.com/users/hypomonk/repos","events_url":"https://api.github.com/users/hypomonk/events{/privacy}","received_events_url":"https://api.github.com/users/hypomonk/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/hypomon
k/slacker-packer","description":"","fork":false,"url":"https://api.github.com/repos/hypomonk/slacker-packer","forks_url":"https://api.github.com/repos/hypomonk/slacker-packer/forks","keys_url":"https://api.github.com/repos/hypomonk/slacker-packer/keys{/key_id}","collaborators_url":"https://api.github.com/repos/hypomonk/slacker-packer/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/hypomonk/slacker-packer/teams","hooks_url":"https://api.github.com/repos/hypomonk/slacker-packer/hooks","issue_events_url":"https://api.github.com/repos/hypomonk/slacker-packer/issues/events{/number}","events_url":"https://api.github.com/repos/hypomonk/slacker-packer/events","assignees_url":"https://api.github.com/repos/hypomonk/slacker-packer/assignees{/user}","branches_url":"https://api.github.com/repos/hypomonk/slacker-packer/branches{/branch}","tags_url":"https://api.github.com/repos/hypomonk/slacker-packer/tags","blobs_url":"https://api.github.com/repos/hypomonk/slacker-packer/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/hypomonk/slacker-packer/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/hypomonk/slacker-packer/git/refs{/sha}","trees_url":"https://api.github.com/repos/hypomonk/slacker-packer/git/trees{/sha}","statuses_url":"https://api.github.com/repos/hypomonk/slacker-packer/statuses/{sha}","languages_url":"https://api.github.com/repos/hypomonk/slacker-packer/languages","stargazers_url":"https://api.github.com/repos/hypomonk/slacker-packer/stargazers","contributors_url":"https://api.github.com/repos/hypomonk/slacker-packer/contributors","subscribers_url":"https://api.github.com/repos/hypomonk/slacker-packer/subscribers","subscription_url":"https://api.github.com/repos/hypomonk/slacker-packer/subscription","commits_url":"https://api.github.com/repos/hypomonk/slacker-packer/commits{/sha}","git_commits_url":"https://api.github.com/repos/hypomonk/slacker-packer/git/commits{/sha}","comments_url":"https://api.github.com/repos/hypomo
nk/slacker-packer/comments{/number}","issue_comment_url":"https://api.github.com/repos/hypomonk/slacker-packer/issues/comments/{number}","contents_url":"https://api.github.com/repos/hypomonk/slacker-packer/contents/{+path}","compare_url":"https://api.github.com/repos/hypomonk/slacker-packer/compare/{base}...{head}","merges_url":"https://api.github.com/repos/hypomonk/slacker-packer/merges","archive_url":"https://api.github.com/repos/hypomonk/slacker-packer/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/hypomonk/slacker-packer/downloads","issues_url":"https://api.github.com/repos/hypomonk/slacker-packer/issues{/number}","pulls_url":"https://api.github.com/repos/hypomonk/slacker-packer/pulls{/number}","milestones_url":"https://api.github.com/repos/hypomonk/slacker-packer/milestones{/number}","notifications_url":"https://api.github.com/repos/hypomonk/slacker-packer/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/hypomonk/slacker-packer/labels{/name}","releases_url":"https://api.github.com/repos/hypomonk/slacker-packer/releases{/id}","created_at":"2014-12-31T06:14:56Z","updated_at":"2014-12-31T22:20:37Z","pushed_at":"2014-12-31T22:20:36Z","git_url":"git://github.com/hypomonk/slacker-packer.git","ssh_url":"git@github.com:hypomonk/slacker-packer.git","clone_url":"https://github.com/hypomonk/slacker-packer.git","svn_url":"https://github.com/hypomonk/slacker-packer","homepage":null,"size":0,"stargazers_count":0,"watchers_count":0,"language":"Shell","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":1,"mirror_url":null,"open_issues_count":2,"forks":1,"open_issues":2,"watchers":0,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/hypomonk/slacker-packer/pulls/2"},"html":{"href":"https://github.com/hypomonk/slacker-packer/pull/2"},"issue":{"href":"https://api.github.com/repos/hypomonk/slacker-packer/issues/2"},"comments":{"href":"https://api.github.com/
repos/hypomonk/slacker-packer/issues/2/comments"},"review_comments":{"href":"https://api.github.com/repos/hypomonk/slacker-packer/pulls/2/comments"},"review_comment":{"href":"https://api.github.com/repos/hypomonk/slacker-packer/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/hypomonk/slacker-packer/pulls/2/commits"},"statuses":{"href":"https://api.github.com/repos/hypomonk/slacker-packer/statuses/a167b8d1405621a26333fda5325d389eeccc05ff"}},"merged":false,"mergeable":null,"mergeable_state":"unknown","merged_by":null,"comments":0,"review_comments":0,"commits":1,"additions":18,"deletions":1,"changed_files":2}},"public":true,"created_at":"2015-01-01T01:05:04Z"}
{"id":"2489398019","type":"PushEvent","actor":{"id":4379694,"login":"moongato","gravatar_id":"","url":"https://api.github.com/users/moongato","avatar_url":"https://avatars.githubusercontent.com/u/4379694?"},"repo":{"id":11769015,"name":"moongato/android_frameworks_base","url":"https://api.github.com/repos/moongato/android_frameworks_base"},"payload":{"push_id":536753182,"size":6,"distinct_size":6,"ref":"refs/heads/lp50x","head":"2a724ce90a362e18dc10cd86f99760c5146c1e6a","before":"73c3f8da9962437774cec8442e0da8d431c28fa8","commits":[{"sha":"09ed328c580340d67492f81d855f8e2fe5834bd1","author":{"email":"97bd659605de2dc1baed2f2e8ef4e483c88d27f8@gmail.com","name":"Austin T. Conn"},"message":"volume rocker music controls","distinct":true,"url":"https://api.github.com/repos/moongato/android_frameworks_base/commits/09ed328c580340d67492f81d855f8e2fe5834bd1"},{"sha":"b3c8f58fb81a604be3f1fd2913e005afe300e296","author":{"email":"9defb1d2166fe02be9724618510318ef57e74e91@gmail.com","name":"Michael Bestas"},"message":"Fix volume rocker music controls and wake up\n\n- Forward port code from cm-11.0 and adjust for 5.0\n- Fix not being able to adjust volume when music control is on\n- Disable screen off volume/music control when wake key is enabled","distinct":true,"url":"https://api.github.com/repos/moongato/android_frameworks_base/commits/b3c8f58fb81a604be3f1fd2913e005afe300e296"},{"sha":"8040e4188be23da640d89fc829e33651826a48c0","author":{"email":"238a1843d81dd7fbe80b5c1b99515c4ba8c94d0d@cyngn.com","name":"Roman Birg"},"message":"status bar: improve brightness slider behavior\n\nMimic the brightness slider behavior in the statusbar.\nThis adds logic to make the statusbar slider also work with automatic brightness mode enabled and it will instead adjust the temporary automatic brightness 
overrride.","distinct":true,"url":"https://api.github.com/repos/moongato/android_frameworks_base/commits/8040e4188be23da640d89fc829e33651826a48c0"},{"sha":"58cadbda6cf16389eb849e5d9ed39eafb352d18a","author":{"email":"419b20914ad8ee7cdbbc7674d01c492d53cd267e@gmail.com","name":"Pawit Pornkitprasan"},"message":"status bar brightness: store value as int\n\nNon-automatic brightness value is stored as int, not float.\n\nSymptom: adjust the brightness in the status bar, the brightness slider in the notification bar will always be set to full","distinct":true,"url":"https://api.github.com/repos/moongato/android_frameworks_base/commits/58cadbda6cf16389eb849e5d9ed39eafb352d18a"},{"sha":"e0fb35b9ed52d05ce74b1c1833e20af6cd649f3c","author":{"email":"1e520a49e026effdcbd6ab603708edecd93fc284@gmail.com","name":"Clyde Tan"},"message":"Keep quiet when volume keys are used to wake up device\n\n- Userspace will make a 'beep' with it receives a key up, so  consume that event as well.\n- Removed wake key check in music control code as it will already be disabled here.","distinct":true,"url":"https://api.github.com/repos/moongato/android_frameworks_base/commits/e0fb35b9ed52d05ce74b1c1833e20af6cd649f3c"},{"sha":"2a724ce90a362e18dc10cd86f99760c5146c1e6a","author":{"email":"22e0f38e0fc64da9129ff9b9ef030b39415294a1@ubuntu","name":"moongato"},"message":"Merge remote-tracking branch 'upstream/lollipop-ras-mr1' into lp50x","distinct":true,"url":"https://api.github.com/repos/moongato/android_frameworks_base/commits/2a724ce90a362e18dc10cd86f99760c5146c1e6a"}]},"public":true,"created_at":"2015-01-01T01:05:04Z"}
{"id":"2489398027","type":"ForkEvent","actor":{"id":1449374,"login":"ohyeah521","gravatar_id":"","url":"https://api.github.com/users/ohyeah521","avatar_url":"https://avatars.githubusercontent.com/u/1449374?"},"repo":{"id":28629678,"name":"techbliss/ADB_Helper_For_ida_Pro","url":"https://api.github.com/repos/techbliss/ADB_Helper_For_ida_Pro"},"payload":{"forkee":{"id":28678268,"name":"ADB_Helper_For_ida_Pro","full_name":"ohyeah521/ADB_Helper_For_ida_Pro","owner":{"login":"ohyeah521","id":1449374,"avatar_url":"https://avatars.githubusercontent.com/u/1449374?v=3","gravatar_id":"","url":"https://api.github.com/users/ohyeah521","html_url":"https://github.com/ohyeah521","followers_url":"https://api.github.com/users/ohyeah521/followers","following_url":"https://api.github.com/users/ohyeah521/following{/other_user}","gists_url":"https://api.github.com/users/ohyeah521/gists{/gist_id}","starred_url":"https://api.github.com/users/ohyeah521/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ohyeah521/subscriptions","organizations_url":"https://api.github.com/users/ohyeah521/orgs","repos_url":"https://api.github.com/users/ohyeah521/repos","events_url":"https://api.github.com/users/ohyeah521/events{/privacy}","received_events_url":"https://api.github.com/users/ohyeah521/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/ohyeah521/ADB_Helper_For_ida_Pro","description":"Helps you debugging Android in Ida 
pro","fork":true,"url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro","forks_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/forks","keys_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/keys{/key_id}","collaborators_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/teams","hooks_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/hooks","issue_events_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/issues/events{/number}","events_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/events","assignees_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/assignees{/user}","branches_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/branches{/branch}","tags_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/tags","blobs_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/git/refs{/sha}","trees_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/git/trees{/sha}","statuses_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/statuses/{sha}","languages_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/languages","stargazers_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/stargazers","contributors_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/contributors","subscribers_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/subscribers","subscription_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/subscription","commits_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_Fo
r_ida_Pro/commits{/sha}","git_commits_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/git/commits{/sha}","comments_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/comments{/number}","issue_comment_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/issues/comments/{number}","contents_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/contents/{+path}","compare_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/compare/{base}...{head}","merges_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/merges","archive_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/downloads","issues_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/issues{/number}","pulls_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/pulls{/number}","milestones_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/milestones{/number}","notifications_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/labels{/name}","releases_url":"https://api.github.com/repos/ohyeah521/ADB_Helper_For_ida_Pro/releases{/id}","created_at":"2015-01-01T01:05:06Z","updated_at":"2014-12-31T18:54:05Z","pushed_at":"2014-12-30T12:25:12Z","git_url":"git://github.com/ohyeah521/ADB_Helper_For_ida_Pro.git","ssh_url":"git@github.com:ohyeah521/ADB_Helper_For_ida_Pro.git","clone_url":"https://github.com/ohyeah521/ADB_Helper_For_ida_Pro.git","svn_url":"https://github.com/ohyeah521/ADB_Helper_For_ida_Pro","homepage":null,"size":0,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issue
s":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:05:06Z"}
{"id":"2489398028","type":"CreateEvent","actor":{"id":9505729,"login":"alishadot","gravatar_id":"","url":"https://api.github.com/users/alishadot","avatar_url":"https://avatars.githubusercontent.com/u/9505729?"},"repo":{"id":28678253,"name":"alishadot/keepcloud","url":"https://api.github.com/repos/alishadot/keepcloud"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:05:06Z"}
{"id":"2489398030","type":"PushEvent","actor":{"id":506010,"login":"gabeshaughnessy","gravatar_id":"","url":"https://api.github.com/users/gabeshaughnessy","avatar_url":"https://avatars.githubusercontent.com/u/506010?"},"repo":{"id":13913264,"name":"gabeshaughnessy/augmentedart","url":"https://api.github.com/repos/gabeshaughnessy/augmentedart"},"payload":{"push_id":536753186,"size":1,"distinct_size":1,"ref":"refs/heads/dungeon-hacker","head":"f1d6efa16b35cfe98b4ee3e54c3f333f87612fa1","before":"070da10a642c004ef5bc428b8ce1bf88e410e7b4","commits":[{"sha":"f1d6efa16b35cfe98b4ee3e54c3f333f87612fa1","author":{"email":"a2b2bb6e7f1b10ac88b326d5c10e33af6a8546bc@gmail.com","name":"gabeshaughnessy"},"message":"todo","distinct":true,"url":"https://api.github.com/repos/gabeshaughnessy/augmentedart/commits/f1d6efa16b35cfe98b4ee3e54c3f333f87612fa1"}]},"public":true,"created_at":"2015-01-01T01:05:06Z"}
{"id":"2489398031","type":"PushEvent","actor":{"id":489000,"login":"kwrobot","gravatar_id":"","url":"https://api.github.com/users/kwrobot","avatar_url":"https://avatars.githubusercontent.com/u/489000?"},"repo":{"id":537699,"name":"Kitware/CMake","url":"https://api.github.com/repos/Kitware/CMake"},"payload":{"push_id":536753184,"size":1,"distinct_size":0,"ref":"refs/heads/nightly-master","head":"c2445d3dfd837cd2e372061f5545054317be110a","before":"3b62cb7244716e0bd486d7023bec15d922572ad1","commits":[{"sha":"c2445d3dfd837cd2e372061f5545054317be110a","author":{"email":"29e2a43288125ec45952b67b65b7fb7ef6ca7262@kitware.com","name":"Kitware Robot"},"message":"CMake Nightly Date Stamp","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/c2445d3dfd837cd2e372061f5545054317be110a"}]},"public":true,"created_at":"2015-01-01T01:05:06Z","org":{"id":87549,"login":"Kitware","gravatar_id":"","url":"https://api.github.com/orgs/Kitware","avatar_url":"https://avatars.githubusercontent.com/u/87549?"}}
{"id":"2489398032","type":"IssuesEvent","actor":{"id":3487141,"login":"graig","gravatar_id":"","url":"https://api.github.com/users/graig","avatar_url":"https://avatars.githubusercontent.com/u/3487141?"},"repo":{"id":919161,"name":"arduino/Arduino","url":"https://api.github.com/repos/arduino/Arduino"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/arduino/Arduino/issues/2525","labels_url":"https://api.github.com/repos/arduino/Arduino/issues/2525/labels{/name}","comments_url":"https://api.github.com/repos/arduino/Arduino/issues/2525/comments","events_url":"https://api.github.com/repos/arduino/Arduino/issues/2525/events","html_url":"https://github.com/arduino/Arduino/issues/2525","id":53210273,"number":2525,"title":"broken link - Yun","user":{"login":"graig","id":3487141,"avatar_url":"https://avatars.githubusercontent.com/u/3487141?v=3","gravatar_id":"","url":"https://api.github.com/users/graig","html_url":"https://github.com/graig","followers_url":"https://api.github.com/users/graig/followers","following_url":"https://api.github.com/users/graig/following{/other_user}","gists_url":"https://api.github.com/users/graig/gists{/gist_id}","starred_url":"https://api.github.com/users/graig/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/graig/subscriptions","organizations_url":"https://api.github.com/users/graig/orgs","repos_url":"https://api.github.com/users/graig/repos","events_url":"https://api.github.com/users/graig/events{/privacy}","received_events_url":"https://api.github.com/users/graig/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:05:05Z","updated_at":"2015-01-01T01:05:05Z","closed_at":null,"body":"The link for the Yun schematic works but the file (arduino-Yun-DSN.zip) is named wrong. 
When opened, it actually contains the schematic and board for the Uno, not the Yun."}},"public":true,"created_at":"2015-01-01T01:05:06Z","org":{"id":379109,"login":"arduino","gravatar_id":"","url":"https://api.github.com/orgs/arduino","avatar_url":"https://avatars.githubusercontent.com/u/379109?"}}
{"id":"2489398034","type":"PushEvent","actor":{"id":489000,"login":"kwrobot","gravatar_id":"","url":"https://api.github.com/users/kwrobot","avatar_url":"https://avatars.githubusercontent.com/u/489000?"},"repo":{"id":537699,"name":"Kitware/CMake","url":"https://api.github.com/repos/Kitware/CMake"},"payload":{"push_id":536753187,"size":24,"distinct_size":0,"ref":"refs/heads/nightly","head":"943791ec6b6166448216d2c12d355be291910948","before":"ce73c53c7a64d31432739f434f222cfa904c1aec","commits":[{"sha":"05105d5c13f6662907cfb63fb6723f9f34f4558d","author":{"email":"29e2a43288125ec45952b67b65b7fb7ef6ca7262@kitware.com","name":"Kitware Robot"},"message":"CMake Nightly Date Stamp","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/05105d5c13f6662907cfb63fb6723f9f34f4558d"},{"sha":"2b28e07c02d9f13867d0f518b8341e77f006faa4","author":{"email":"29e2a43288125ec45952b67b65b7fb7ef6ca7262@kitware.com","name":"Kitware Robot"},"message":"CMake Nightly Date Stamp","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/2b28e07c02d9f13867d0f518b8341e77f006faa4"},{"sha":"028cdfb3deaddef510537bbeb1a4202924c1a80b","author":{"email":"29e2a43288125ec45952b67b65b7fb7ef6ca7262@kitware.com","name":"Kitware Robot"},"message":"CMake Nightly Date Stamp","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/028cdfb3deaddef510537bbeb1a4202924c1a80b"},{"sha":"8e6114017873e50817c6961ffcedb3c52a2ed1f1","author":{"email":"29e2a43288125ec45952b67b65b7fb7ef6ca7262@kitware.com","name":"Kitware Robot"},"message":"CMake Nightly Date Stamp","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/8e6114017873e50817c6961ffcedb3c52a2ed1f1"},{"sha":"ca3d08e6b598a7f7d46b3125a0d7ddddf8be8dcd","author":{"email":"29e2a43288125ec45952b67b65b7fb7ef6ca7262@kitware.com","name":"Kitware Robot"},"message":"CMake Nightly Date 
Stamp","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/ca3d08e6b598a7f7d46b3125a0d7ddddf8be8dcd"},{"sha":"3b62cb7244716e0bd486d7023bec15d922572ad1","author":{"email":"29e2a43288125ec45952b67b65b7fb7ef6ca7262@kitware.com","name":"Kitware Robot"},"message":"CMake Nightly Date Stamp","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/3b62cb7244716e0bd486d7023bec15d922572ad1"},{"sha":"c2445d3dfd837cd2e372061f5545054317be110a","author":{"email":"29e2a43288125ec45952b67b65b7fb7ef6ca7262@kitware.com","name":"Kitware Robot"},"message":"CMake Nightly Date Stamp","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/c2445d3dfd837cd2e372061f5545054317be110a"},{"sha":"5e8b4a718169837db825538561ddfd85cf62be43","author":{"email":"fbd1bb53ae91c7d21c5feb88facb5fbef8543d8e@gmail.com","name":"Stephen Kelly"},"message":"SolarisStudio: Use alternative standard library to build CMake.\n\nSolarisStudio ships a very old RogueWave standard library\nimplementation (libCstd) and uses it by default for backward compatibility.\nThe macros defined when building the system libCstd need to be the same as\nthe macros defined when using it for binary compatibility reasons etc.  The\nSolarisStudio compiler driver adds macros such as _RWSTD_NO_MEMBER_TEMPLATES and\n_RWSTD_NO_CLASS_PARTIAL_SPEC etc. These macros disable certain APIs in the\nstandard library headers.\n\nAlthough the compiler supports the features 'member templates' and 'partial\ntemplate specialization', the standard library does not provide APIs which\nrely on those features.  
This means that std::vector::insert in libCStd does\nnot accept a pair of iterators from a different type of container, because\nthat requires member templates, and reverse_iterator<const T> can not\nbe constructed from a reverse_iterator<T> because that requires partial\nspecialization (or at least the _RWSTD_NO_CLASS_PARTIAL_SPEC define) and\nmember templates.\n\nThis causes many problems while building CMake using SolarisStudio, which\nhave not been well understood until now.  The problems are usually\nattributed to compiler limitations, while actually the problem is in\nthe standard library, as in commit v3.0.0-rc1~99^2~1 (Help: Document non-use\nof std::set::insert., 2014-01-24) and commit 107dcac3 (Fix compilation with\nthe Oracle / Sun compiler (#15318), 2014-12-12).\n\nSolarisStudio 12.3 and earlier also ships a version of stlport which may be\nused instead of libCstd by specifying -library=stlport4\n\n https://docs.oracle.com/cd/E18659_01/html/821-1383/bkakg.html\n\nSolarisStudio 12.4 ships a version of libstdc++ from GCC 4.8.2 which may be\nused by specifying -std=c++03 or -std=c++11 etc\n\n http://docs.oracle.com/cd/E37069_01/html/E37075/bkamw.html#OSSCPgnaof\n\nUse these more-capable standard library implementations when building cmake.\nThis will allow more use of 'normal' C++ (such as std::vector::insert), and cause\nfewer surprises resulting from dashboards using SolarisStudio.\n\nBecause cmake is not a library linked against by 3rd parties and does not have\nexternal dependencies, issues related to mixing code using libCStd and libstdc++\ndo not apply.","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/5e8b4a718169837db825538561ddfd85cf62be43"},{"sha":"be77679552dbda01d62b03a85de05ad7e7684862","author":{"email":"fbd1bb53ae91c7d21c5feb88facb5fbef8543d8e@gmail.com","name":"Stephen Kelly"},"message":"Revert \"Misc. 
fixes for the Oracle / Sun compiler.\"\n\nThis reverts commit 97b65f8156734db2adc367b27c822a5fe332d740.","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/be77679552dbda01d62b03a85de05ad7e7684862"},{"sha":"b162e9871e8fabacf6f565ad1ced05a6d234e25b","author":{"email":"fbd1bb53ae91c7d21c5feb88facb5fbef8543d8e@gmail.com","name":"Stephen Kelly"},"message":"Use insert instead of a loop in some cases.\n\nLimit this change to inserting into a vector from a vector.\n\nA follow up change can use insert for inserting into a set.","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/b162e9871e8fabacf6f565ad1ced05a6d234e25b"},{"sha":"57969aebfc5bc3589972b497fc5deb30e292230f","author":{"email":"fbd1bb53ae91c7d21c5feb88facb5fbef8543d8e@gmail.com","name":"Stephen Kelly"},"message":"Use two-iterator std::set::insert where appropriate.","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/57969aebfc5bc3589972b497fc5deb30e292230f"},{"sha":"6c02a443b92ba189288cbe9f01589e00cabfb994","author":{"email":"fbd1bb53ae91c7d21c5feb88facb5fbef8543d8e@gmail.com","name":"Stephen Kelly"},"message":"Help: Remove documented restriction on insert APIs.","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/6c02a443b92ba189288cbe9f01589e00cabfb994"},{"sha":"59aa8d878e69fd694e44af3778e87615804ad53e","author":{"email":"fbd1bb53ae91c7d21c5feb88facb5fbef8543d8e@gmail.com","name":"Stephen Kelly"},"message":"Help: Remove documented restriction on find in conditions.\n\nThe necessary conversion is supported by all CMake host compilers.","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/59aa8d878e69fd694e44af3778e87615804ad53e"},{"sha":"7403759846b9bd34bb425f5e90f6e367b80d1d58","author":{"email":"fbd1bb53ae91c7d21c5feb88facb5fbef8543d8e@gmail.com","name":"Stephen Kelly"},"message":"Help: Remove documented restriction on template 
use.","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/7403759846b9bd34bb425f5e90f6e367b80d1d58"},{"sha":"2e1ea034a804cd1ec61ba5b9817452d49b6d0830","author":{"email":"fbd1bb53ae91c7d21c5feb88facb5fbef8543d8e@gmail.com","name":"Stephen Kelly"},"message":"Merge topic 'sun-better-stdlib' into next\n\n74037598 Help: Remove documented restriction on template use.\n59aa8d87 Help: Remove documented restriction on find in conditions.\n6c02a443 Help: Remove documented restriction on insert APIs.\n57969aeb Use two-iterator std::set::insert where appropriate.\nb162e987 Use insert instead of a loop in some cases.\nbe776795 Revert \"Misc. fixes for the Oracle / Sun compiler.\"\n5e8b4a71 SolarisStudio: Use alternative standard library to build CMake.\n3b62cb72 CMake Nightly Date Stamp\nca3d08e6 CMake Nightly Date Stamp\n8e611401 CMake Nightly Date Stamp\n028cdfb3 CMake Nightly Date Stamp\n2b28e07c CMake Nightly Date Stamp\n05105d5c CMake Nightly Date Stamp","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/2e1ea034a804cd1ec61ba5b9817452d49b6d0830"},{"sha":"29b4f5420922a06cafeaf07c13b5d781790e8646","author":{"email":"fbd1bb53ae91c7d21c5feb88facb5fbef8543d8e@gmail.com","name":"Stephen Kelly"},"message":"RunCMake: Expect empty output by default.\n\nExpect tests to specify stderr content if it is present.\n\nFix the CMP0019 test, which has only been testing the WARN status\nuntil now.  
Specify in the CommandLine and FPHSA tests that content\nis at least one character.\n\nSet policies in the Language and CheckModules tests, which have empty\ntest output, modulo unrelated policies on some platforms.","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/29b4f5420922a06cafeaf07c13b5d781790e8646"},{"sha":"ff99adb80d59dcbe8cb0d9dc12db657a2f58be7e","author":{"email":"fbd1bb53ae91c7d21c5feb88facb5fbef8543d8e@gmail.com","name":"Stephen Kelly"},"message":"Merge topic 'RunCMake-stderr-default' into next\n\n29b4f542 RunCMake: Expect empty output by default.\nc2445d3d CMake Nightly Date Stamp","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/ff99adb80d59dcbe8cb0d9dc12db657a2f58be7e"},{"sha":"2c528f860ff8ea458fbf8ab6c85908aeeaa749e0","author":{"email":"88a2dde5abcebb5c32bd0a2b4aff36eeea918955@kitware.com","name":"Robert Maynard"},"message":"CompileFeatures: NonValidTarget1 now handles not have cxx_final.\n\nPreviously we expanded HAVE_FINAL to determine what the copied_file number\nwould be, but when we don't have cxx_final than HAVE_FINAL is not defined.\nWhat we really want is to use expected_result.","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/2c528f860ff8ea458fbf8ab6c85908aeeaa749e0"},{"sha":"b97c86b5009307e6b089bcc2ddef55d77918f765","author":{"email":"88a2dde5abcebb5c32bd0a2b4aff36eeea918955@kitware.com","name":"Robert Maynard"},"message":"CompileFeatures: Support compilers that don't have version modess.\n\ncompilers such as MSVC have no explicit flags to enable C++11 mode,\nit just is always on. 
So only run the link tests with compilers that require\na flag to specify the language version.","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/b97c86b5009307e6b089bcc2ddef55d77918f765"},{"sha":"8ad33e01d2ed27c9ac136fd19516a21449b4c87b","author":{"email":"88a2dde5abcebb5c32bd0a2b4aff36eeea918955@kitware.com","name":"Robert Maynard"},"message":"Merge topic 'feature_record_msvc' into next\n\nb97c86b5 CompileFeatures: Support compilers that don't have version modess.\n2c528f86 CompileFeatures: NonValidTarget1 now handles not have cxx_final.","distinct":false,"url":"https://api.github.com/repos/Kitware/CMake/commits/8ad33e01d2ed27c9ac136fd19516a21449b4c87b"}]},"public":true,"created_at":"2015-01-01T01:05:06Z","org":{"id":87549,"login":"Kitware","gravatar_id":"","url":"https://api.github.com/orgs/Kitware","avatar_url":"https://avatars.githubusercontent.com/u/87549?"}}
{"id":"2489398039","type":"PushEvent","actor":{"id":452786,"login":"alrieckert","gravatar_id":"","url":"https://api.github.com/users/alrieckert","avatar_url":"https://avatars.githubusercontent.com/u/452786?"},"repo":{"id":6153802,"name":"alrieckert/freepascal","url":"https://api.github.com/repos/alrieckert/freepascal"},"payload":{"push_id":536753192,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"c119967bbbcfba0d00c6bfcf9d4e805272bbc8dd","before":"7688ca531943068f1b199008e7575bfb075729f1","commits":[{"sha":"8596d86916e4754dde940d6934430173218863b9","author":{"email":"3829486b93ec44395f0b980424bae9b6fb07b7bc@3ad0048d-3df7-0310-abae-a5850022a9f2","name":"marco"},"message":" * system unit additions from mantis #27206. Exports some dynarray related RTTI functions.\n\ngit-svn-id: http://svn.freepascal.org/svn/fpc/trunk@29364 3ad0048d-3df7-0310-abae-a5850022a9f2","distinct":true,"url":"https://api.github.com/repos/alrieckert/freepascal/commits/8596d86916e4754dde940d6934430173218863b9"},{"sha":"c119967bbbcfba0d00c6bfcf9d4e805272bbc8dd","author":{"email":"3829486b93ec44395f0b980424bae9b6fb07b7bc@3ad0048d-3df7-0310-abae-a5850022a9f2","name":"marco"},"message":" * Fix for #27228\n\n\ngit-svn-id: http://svn.freepascal.org/svn/fpc/trunk@29365 3ad0048d-3df7-0310-abae-a5850022a9f2","distinct":true,"url":"https://api.github.com/repos/alrieckert/freepascal/commits/c119967bbbcfba0d00c6bfcf9d4e805272bbc8dd"}]},"public":true,"created_at":"2015-01-01T01:05:06Z"}
{"id":"2489398041","type":"PushEvent","actor":{"id":6158630,"login":"greatfire","gravatar_id":"","url":"https://api.github.com/users/greatfire","avatar_url":"https://avatars.githubusercontent.com/u/6158630?"},"repo":{"id":18126008,"name":"greatfire/z","url":"https://api.github.com/repos/greatfire/z"},"payload":{"push_id":536753193,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"67eeb5f55504c0317a0e372e38eed9df2a97370d","before":"1c095ccf0c45826798d494d477eef16082e2919f","commits":[{"sha":"67eeb5f55504c0317a0e372e38eed9df2a97370d","author":{"email":"24bf68e341ce0fbd9259a5d51feed79682ea4eba@greatfire.org","name":"Ubuntu"},"message":"a","distinct":true,"url":"https://api.github.com/repos/greatfire/z/commits/67eeb5f55504c0317a0e372e38eed9df2a97370d"}]},"public":true,"created_at":"2015-01-01T01:05:07Z"}
{"id":"2489398043","type":"PushEvent","actor":{"id":6158630,"login":"greatfire","gravatar_id":"","url":"https://api.github.com/users/greatfire","avatar_url":"https://avatars.githubusercontent.com/u/6158630?"},"repo":{"id":15100395,"name":"greatfire/wiki","url":"https://api.github.com/repos/greatfire/wiki"},"payload":{"push_id":536753194,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"7ce647729785e7cfee67c96e185b8fa8df693623","before":"ba5bb9726f655f8acd29ecb3f89f1ae55305e680","commits":[{"sha":"7ce647729785e7cfee67c96e185b8fa8df693623","author":{"email":"24bf68e341ce0fbd9259a5d51feed79682ea4eba@greatfire.org","name":"Ubuntu"},"message":"a","distinct":true,"url":"https://api.github.com/repos/greatfire/wiki/commits/7ce647729785e7cfee67c96e185b8fa8df693623"}]},"public":true,"created_at":"2015-01-01T01:05:07Z"}
{"id":"2489398045","type":"PushEvent","actor":{"id":6895040,"login":"codertradergambler","gravatar_id":"","url":"https://api.github.com/users/codertradergambler","avatar_url":"https://avatars.githubusercontent.com/u/6895040?"},"repo":{"id":18620619,"name":"chancecoin/chancecoinj","url":"https://api.github.com/repos/chancecoin/chancecoinj"},"payload":{"push_id":536753196,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d9886bb6d61f6f5e1e33b421db90e4c50feabbe2","before":"d4ec65797e8faf2aac84c02007d2ebeb342babd3","commits":[{"sha":"d9886bb6d61f6f5e1e33b421db90e4c50feabbe2","author":{"email":"0ccf54d51d1a5240ad356feb30dfa4d1749f8844@gmail.com","name":"TraderCoderGambler"},"message":"auto-update balances","distinct":true,"url":"https://api.github.com/repos/chancecoin/chancecoinj/commits/d9886bb6d61f6f5e1e33b421db90e4c50feabbe2"}]},"public":true,"created_at":"2015-01-01T01:05:08Z"}
{"id":"2489398046","type":"ForkEvent","actor":{"id":1129530,"login":"jimulabs","gravatar_id":"","url":"https://api.github.com/users/jimulabs","avatar_url":"https://avatars.githubusercontent.com/u/1129530?"},"repo":{"id":14393731,"name":"JakeWharton/u2020","url":"https://api.github.com/repos/JakeWharton/u2020"},"payload":{"forkee":{"id":28678269,"name":"u2020","full_name":"jimulabs/u2020","owner":{"login":"jimulabs","id":1129530,"avatar_url":"https://avatars.githubusercontent.com/u/1129530?v=3","gravatar_id":"","url":"https://api.github.com/users/jimulabs","html_url":"https://github.com/jimulabs","followers_url":"https://api.github.com/users/jimulabs/followers","following_url":"https://api.github.com/users/jimulabs/following{/other_user}","gists_url":"https://api.github.com/users/jimulabs/gists{/gist_id}","starred_url":"https://api.github.com/users/jimulabs/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jimulabs/subscriptions","organizations_url":"https://api.github.com/users/jimulabs/orgs","repos_url":"https://api.github.com/users/jimulabs/repos","events_url":"https://api.github.com/users/jimulabs/events{/privacy}","received_events_url":"https://api.github.com/users/jimulabs/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/jimulabs/u2020","description":"A sample Android app which showcases advanced usage of Dagger among other open source 
libraries.","fork":true,"url":"https://api.github.com/repos/jimulabs/u2020","forks_url":"https://api.github.com/repos/jimulabs/u2020/forks","keys_url":"https://api.github.com/repos/jimulabs/u2020/keys{/key_id}","collaborators_url":"https://api.github.com/repos/jimulabs/u2020/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/jimulabs/u2020/teams","hooks_url":"https://api.github.com/repos/jimulabs/u2020/hooks","issue_events_url":"https://api.github.com/repos/jimulabs/u2020/issues/events{/number}","events_url":"https://api.github.com/repos/jimulabs/u2020/events","assignees_url":"https://api.github.com/repos/jimulabs/u2020/assignees{/user}","branches_url":"https://api.github.com/repos/jimulabs/u2020/branches{/branch}","tags_url":"https://api.github.com/repos/jimulabs/u2020/tags","blobs_url":"https://api.github.com/repos/jimulabs/u2020/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/jimulabs/u2020/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/jimulabs/u2020/git/refs{/sha}","trees_url":"https://api.github.com/repos/jimulabs/u2020/git/trees{/sha}","statuses_url":"https://api.github.com/repos/jimulabs/u2020/statuses/{sha}","languages_url":"https://api.github.com/repos/jimulabs/u2020/languages","stargazers_url":"https://api.github.com/repos/jimulabs/u2020/stargazers","contributors_url":"https://api.github.com/repos/jimulabs/u2020/contributors","subscribers_url":"https://api.github.com/repos/jimulabs/u2020/subscribers","subscription_url":"https://api.github.com/repos/jimulabs/u2020/subscription","commits_url":"https://api.github.com/repos/jimulabs/u2020/commits{/sha}","git_commits_url":"https://api.github.com/repos/jimulabs/u2020/git/commits{/sha}","comments_url":"https://api.github.com/repos/jimulabs/u2020/comments{/number}","issue_comment_url":"https://api.github.com/repos/jimulabs/u2020/issues/comments/{number}","contents_url":"https://api.github.com/repos/jimulabs/u2020/contents/{+path}","compare_url":"https://api.github.
com/repos/jimulabs/u2020/compare/{base}...{head}","merges_url":"https://api.github.com/repos/jimulabs/u2020/merges","archive_url":"https://api.github.com/repos/jimulabs/u2020/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/jimulabs/u2020/downloads","issues_url":"https://api.github.com/repos/jimulabs/u2020/issues{/number}","pulls_url":"https://api.github.com/repos/jimulabs/u2020/pulls{/number}","milestones_url":"https://api.github.com/repos/jimulabs/u2020/milestones{/number}","notifications_url":"https://api.github.com/repos/jimulabs/u2020/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/jimulabs/u2020/labels{/name}","releases_url":"https://api.github.com/repos/jimulabs/u2020/releases{/id}","created_at":"2015-01-01T01:05:08Z","updated_at":"2014-12-30T22:28:31Z","pushed_at":"2014-12-23T00:04:38Z","git_url":"git://github.com/jimulabs/u2020.git","ssh_url":"git@github.com:jimulabs/u2020.git","clone_url":"https://github.com/jimulabs/u2020.git","svn_url":"https://github.com/jimulabs/u2020","homepage":"http://parleys.com/play/529bde2ce4b0e619540cc3ae","size":8391,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:05:08Z"}
{"id":"2489398047","type":"PushEvent","actor":{"id":10225575,"login":"ExclusiveOrange","gravatar_id":"","url":"https://api.github.com/users/ExclusiveOrange","avatar_url":"https://avatars.githubusercontent.com/u/10225575?"},"repo":{"id":28677579,"name":"ExclusiveOrange/synthesizer","url":"https://api.github.com/repos/ExclusiveOrange/synthesizer"},"payload":{"push_id":536753197,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"9221d005a52f784d675044bb14013c0eec6ed795","before":"0e64036d5ac0d9c24b4cbe39bb778570db49caba","commits":[{"sha":"9221d005a52f784d675044bb14013c0eec6ed795","author":{"email":"de3bd7888dcfc4f7d00a4ef606710f57cbba1dbb@hotmail.com","name":"ExclusiveOrange"},"message":"included stuff needed to actually run program","distinct":true,"url":"https://api.github.com/repos/ExclusiveOrange/synthesizer/commits/9221d005a52f784d675044bb14013c0eec6ed795"}]},"public":true,"created_at":"2015-01-01T01:05:08Z"}
{"id":"2489398048","type":"IssueCommentEvent","actor":{"id":716644,"login":"amandaharlin","gravatar_id":"","url":"https://api.github.com/users/amandaharlin","avatar_url":"https://avatars.githubusercontent.com/u/716644?"},"repo":{"id":24870992,"name":"codeforokc/codeforokc","url":"https://api.github.com/repos/codeforokc/codeforokc"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/codeforokc/codeforokc/issues/2","labels_url":"https://api.github.com/repos/codeforokc/codeforokc/issues/2/labels{/name}","comments_url":"https://api.github.com/repos/codeforokc/codeforokc/issues/2/comments","events_url":"https://api.github.com/repos/codeforokc/codeforokc/issues/2/events","html_url":"https://github.com/codeforokc/codeforokc/issues/2","id":52505386,"number":2,"title":"Add an About page","user":{"login":"mkchandler","id":436130,"avatar_url":"https://avatars.githubusercontent.com/u/436130?v=3","gravatar_id":"","url":"https://api.github.com/users/mkchandler","html_url":"https://github.com/mkchandler","followers_url":"https://api.github.com/users/mkchandler/followers","following_url":"https://api.github.com/users/mkchandler/following{/other_user}","gists_url":"https://api.github.com/users/mkchandler/gists{/gist_id}","starred_url":"https://api.github.com/users/mkchandler/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/mkchandler/subscriptions","organizations_url":"https://api.github.com/users/mkchandler/orgs","repos_url":"https://api.github.com/users/mkchandler/repos","events_url":"https://api.github.com/users/mkchandler/events{/privacy}","received_events_url":"https://api.github.com/users/mkchandler/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/codeforokc/codeforokc/labels/enhancement","name":"enhancement","color":"84b6eb"}],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2014-12-19T17:04:48Z","updated_at":"2015-01-01T01:05:08Z","closed
_at":null,"body":"Need to add an \"About\" page to the web site. It should at least include:\r\n\r\n* Summary of the group and what we do\r\n* List of core team members and what each do"},"comment":{"url":"https://api.github.com/repos/codeforokc/codeforokc/issues/comments/68477326","html_url":"https://github.com/codeforokc/codeforokc/issues/2#issuecomment-68477326","issue_url":"https://api.github.com/repos/codeforokc/codeforokc/issues/2","id":68477326,"user":{"login":"amandaharlin","id":716644,"avatar_url":"https://avatars.githubusercontent.com/u/716644?v=3","gravatar_id":"","url":"https://api.github.com/users/amandaharlin","html_url":"https://github.com/amandaharlin","followers_url":"https://api.github.com/users/amandaharlin/followers","following_url":"https://api.github.com/users/amandaharlin/following{/other_user}","gists_url":"https://api.github.com/users/amandaharlin/gists{/gist_id}","starred_url":"https://api.github.com/users/amandaharlin/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/amandaharlin/subscriptions","organizations_url":"https://api.github.com/users/amandaharlin/orgs","repos_url":"https://api.github.com/users/amandaharlin/repos","events_url":"https://api.github.com/users/amandaharlin/events{/privacy}","received_events_url":"https://api.github.com/users/amandaharlin/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:05:08Z","updated_at":"2015-01-01T01:05:08Z","body":"can i get a list of the people & their roles? i only know 3 people so far, which might be all there is rn. "}},"public":true,"created_at":"2015-01-01T01:05:08Z","org":{"id":8738523,"login":"codeforokc","gravatar_id":"","url":"https://api.github.com/orgs/codeforokc","avatar_url":"https://avatars.githubusercontent.com/u/8738523?"}}
{"id":"2489398055","type":"WatchEvent","actor":{"id":2167695,"login":"skylerzhang","gravatar_id":"","url":"https://api.github.com/users/skylerzhang","avatar_url":"https://avatars.githubusercontent.com/u/2167695?"},"repo":{"id":28664808,"name":"cssdream/cssgrace","url":"https://api.github.com/repos/cssdream/cssgrace"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:05:09Z","org":{"id":8910019,"login":"cssdream","gravatar_id":"","url":"https://api.github.com/orgs/cssdream","avatar_url":"https://avatars.githubusercontent.com/u/8910019?"}}
{"id":"2489398058","type":"PushEvent","actor":{"id":185007,"login":"dkirkby","gravatar_id":"","url":"https://api.github.com/users/dkirkby","avatar_url":"https://avatars.githubusercontent.com/u/185007?"},"repo":{"id":8727241,"name":"DarkEnergyScienceCollaboration/WeakLensingDeblending","url":"https://api.github.com/repos/DarkEnergyScienceCollaboration/WeakLensingDeblending"},"payload":{"push_id":536753204,"size":4,"distinct_size":4,"ref":"refs/heads/master","head":"4c8f9d910964133acd0f7eb2958ef7007f638dda","before":"ab294701300b44cd830d6577198084a508da6b31","commits":[{"sha":"8ffdfc613288637871b2cf022763f5d7b3dde5b4","author":{"email":"0e7e4469b1865516968f5f506ba25c60e5bedc8b@uci.edu","name":"David Kirkby"},"message":"Add PSF and cosmic shear parameters to the survey (not used yet).","distinct":true,"url":"https://api.github.com/repos/DarkEnergyScienceCollaboration/WeakLensingDeblending/commits/8ffdfc613288637871b2cf022763f5d7b3dde5b4"},{"sha":"b38651a711e4c240abe4190249b10d0e2eafb71b","author":{"email":"0e7e4469b1865516968f5f506ba25c60e5bedc8b@uci.edu","name":"David Kirkby"},"message":"Add optional shear to atmospheric PSF","distinct":true,"url":"https://api.github.com/repos/DarkEnergyScienceCollaboration/WeakLensingDeblending/commits/b38651a711e4c240abe4190249b10d0e2eafb71b"},{"sha":"fff691186b608876a72a7c6a106f3c0f20e922ac","author":{"email":"0e7e4469b1865516968f5f506ba25c60e5bedc8b@uci.edu","name":"David Kirkby"},"message":"Specify the ellipticity spinor convention we are using","distinct":true,"url":"https://api.github.com/repos/DarkEnergyScienceCollaboration/WeakLensingDeblending/commits/fff691186b608876a72a7c6a106f3c0f20e922ac"},{"sha":"4c8f9d910964133acd0f7eb2958ef7007f638dda","author":{"email":"0e7e4469b1865516968f5f506ba25c60e5bedc8b@uci.edu","name":"David Kirkby"},"message":"Protect against trying to set z scaling with too few 
pixels","distinct":true,"url":"https://api.github.com/repos/DarkEnergyScienceCollaboration/WeakLensingDeblending/commits/4c8f9d910964133acd0f7eb2958ef7007f638dda"}]},"public":true,"created_at":"2015-01-01T01:05:10Z","org":{"id":2731443,"login":"DarkEnergyScienceCollaboration","gravatar_id":"","url":"https://api.github.com/orgs/DarkEnergyScienceCollaboration","avatar_url":"https://avatars.githubusercontent.com/u/2731443?"}}
{"id":"2489398067","type":"PushEvent","actor":{"id":9000293,"login":"diianita","gravatar_id":"","url":"https://api.github.com/users/diianita","avatar_url":"https://avatars.githubusercontent.com/u/9000293?"},"repo":{"id":27146993,"name":"cArLiiToX/dtstore","url":"https://api.github.com/repos/cArLiiToX/dtstore"},"payload":{"push_id":536753208,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"6ce23947a2ec1c89d30f6e8d042154f2c431db86","before":"8cacad9b34f30388789700e5bb81deaa4471de12","commits":[{"sha":"6ce23947a2ec1c89d30f6e8d042154f2c431db86","author":{"email":"ab5e2bca84933118bbc9d48ffaccce3bac4eeb64@xng.bz","name":"cArLiiToX"},"message":"correciones","distinct":true,"url":"https://api.github.com/repos/cArLiiToX/dtstore/commits/6ce23947a2ec1c89d30f6e8d042154f2c431db86"}]},"public":true,"created_at":"2015-01-01T01:05:10Z"}
{"id":"2489398070","type":"WatchEvent","actor":{"id":694034,"login":"dsimmons","gravatar_id":"","url":"https://api.github.com/users/dsimmons","avatar_url":"https://avatars.githubusercontent.com/u/694034?"},"repo":{"id":11180687,"name":"spf13/hugo","url":"https://api.github.com/repos/spf13/hugo"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:05:11Z"}
{"id":"2489398072","type":"PushEvent","actor":{"id":538610,"login":"zachwe","gravatar_id":"","url":"https://api.github.com/users/zachwe","avatar_url":"https://avatars.githubusercontent.com/u/538610?"},"repo":{"id":27940324,"name":"demitrin/listentogithub","url":"https://api.github.com/repos/demitrin/listentogithub"},"payload":{"push_id":536753210,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"edda8fe60cdd61df50c34608f44deeaac96fff62","before":"52f84b1f2d70fd051c27431d728395fc5cc28a76","commits":[{"sha":"edda8fe60cdd61df50c34608f44deeaac96fff62","author":{"email":"1ed83132ba391e321c1866dd62e4c246c89cd84e@gmail.com","name":"zachwe"},"message":"updated package.json","distinct":true,"url":"https://api.github.com/repos/demitrin/listentogithub/commits/edda8fe60cdd61df50c34608f44deeaac96fff62"}]},"public":true,"created_at":"2015-01-01T01:05:11Z"}
{"id":"2489398073","type":"GollumEvent","actor":{"id":6799218,"login":"gyuho","gravatar_id":"","url":"https://api.github.com/users/gyuho","avatar_url":"https://avatars.githubusercontent.com/u/6799218?"},"repo":{"id":23096959,"name":"golang/go","url":"https://api.github.com/repos/golang/go"},"payload":{"pages":[{"page_name":"whygo","title":"whygo","summary":null,"action":"edited","sha":"6beb51564de333d65182ed185c47d8648b76c641","html_url":"https://github.com/golang/go/wiki/whygo"}]},"public":true,"created_at":"2015-01-01T01:05:11Z","org":{"id":4314092,"login":"golang","gravatar_id":"","url":"https://api.github.com/orgs/golang","avatar_url":"https://avatars.githubusercontent.com/u/4314092?"}}
{"id":"2489398076","type":"IssueCommentEvent","actor":{"id":10361228,"login":"Dushku","gravatar_id":"","url":"https://api.github.com/users/Dushku","avatar_url":"https://avatars.githubusercontent.com/u/10361228?"},"repo":{"id":20304390,"name":"Epix37/Hearthstone-Deck-Tracker","url":"https://api.github.com/repos/Epix37/Hearthstone-Deck-Tracker"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/Epix37/Hearthstone-Deck-Tracker/issues/496","labels_url":"https://api.github.com/repos/Epix37/Hearthstone-Deck-Tracker/issues/496/labels{/name}","comments_url":"https://api.github.com/repos/Epix37/Hearthstone-Deck-Tracker/issues/496/comments","events_url":"https://api.github.com/repos/Epix37/Hearthstone-Deck-Tracker/issues/496/events","html_url":"https://github.com/Epix37/Hearthstone-Deck-Tracker/issues/496","id":53208181,"number":496,"title":"export screenshot is cropped","user":{"login":"Dushku","id":10361228,"avatar_url":"https://avatars.githubusercontent.com/u/10361228?v=3","gravatar_id":"","url":"https://api.github.com/users/Dushku","html_url":"https://github.com/Dushku","followers_url":"https://api.github.com/users/Dushku/followers","following_url":"https://api.github.com/users/Dushku/following{/other_user}","gists_url":"https://api.github.com/users/Dushku/gists{/gist_id}","starred_url":"https://api.github.com/users/Dushku/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Dushku/subscriptions","organizations_url":"https://api.github.com/users/Dushku/orgs","repos_url":"https://api.github.com/users/Dushku/repos","events_url":"https://api.github.com/users/Dushku/events{/privacy}","received_events_url":"https://api.github.com/users/Dushku/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2014-12-31T23:28:52Z","updated_at":"2015-01-01T01:05:11Z","closed_at":null,"body":"First post and I just wanted to say: I LOVE this tool! 
Thank you for all the hard work.\r\n\r\n![trump qm](https://cloud.githubusercontent.com/assets/10361228/5591152/9917046e-911a-11e4-9dd5-b5fd9f4b69b1.png)\r\n\r\nExport screenshot always only shows first 16 different cards and crops off the right side. I didn't find any other thread on the subject, so I assume it's my settings, but I can't figure out which. Any help would be appreciated."},"comment":{"url":"https://api.github.com/repos/Epix37/Hearthstone-Deck-Tracker/issues/comments/68477328","html_url":"https://github.com/Epix37/Hearthstone-Deck-Tracker/issues/496#issuecomment-68477328","issue_url":"https://api.github.com/repos/Epix37/Hearthstone-Deck-Tracker/issues/496","id":68477328,"user":{"login":"Dushku","id":10361228,"avatar_url":"https://avatars.githubusercontent.com/u/10361228?v=3","gravatar_id":"","url":"https://api.github.com/users/Dushku","html_url":"https://github.com/Dushku","followers_url":"https://api.github.com/users/Dushku/followers","following_url":"https://api.github.com/users/Dushku/following{/other_user}","gists_url":"https://api.github.com/users/Dushku/gists{/gist_id}","starred_url":"https://api.github.com/users/Dushku/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Dushku/subscriptions","organizations_url":"https://api.github.com/users/Dushku/orgs","repos_url":"https://api.github.com/users/Dushku/repos","events_url":"https://api.github.com/users/Dushku/events{/privacy}","received_events_url":"https://api.github.com/users/Dushku/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:05:11Z","updated_at":"2015-01-01T01:05:11Z","body":"For what it's worth, I was able to hit Print Screen while it rapidly brought up a window in response to the export screenshot command. 
It lists all the cards, but it too drops off the right side.\r\n\r\n![temp](https://cloud.githubusercontent.com/assets/10361228/5591414/3aff5ec2-9128-11e4-8408-92c5a57ed4be.jpg)\r\n"}},"public":true,"created_at":"2015-01-01T01:05:12Z"}
{"id":"2489398077","type":"PushEvent","actor":{"id":616495,"login":"harveyt","gravatar_id":"","url":"https://api.github.com/users/harveyt","avatar_url":"https://avatars.githubusercontent.com/u/616495?"},"repo":{"id":28677911,"name":"harveyt/harveyt.github.io","url":"https://api.github.com/repos/harveyt/harveyt.github.io"},"payload":{"push_id":536753211,"size":1,"distinct_size":1,"ref":"refs/heads/source","head":"8c51961f1332eb509084e9bab9432234b43f8f8f","before":"9f57ade1c98efb400f57d710a69c272464596ba4","commits":[{"sha":"8c51961f1332eb509084e9bab9432234b43f8f8f","author":{"email":"5b18f340f96afc1bfd4fbf498467b8b0cb41ea73@me.com","name":"Harvey Thompson"},"message":"Added ignore of .deploy","distinct":true,"url":"https://api.github.com/repos/harveyt/harveyt.github.io/commits/8c51961f1332eb509084e9bab9432234b43f8f8f"}]},"public":true,"created_at":"2015-01-01T01:05:12Z"}
{"id":"2489398082","type":"PushEvent","actor":{"id":489000,"login":"kwrobot","gravatar_id":"","url":"https://api.github.com/users/kwrobot","avatar_url":"https://avatars.githubusercontent.com/u/489000?"},"repo":{"id":631615,"name":"Kitware/VTK","url":"https://api.github.com/repos/Kitware/VTK"},"payload":{"push_id":536753215,"size":3,"distinct_size":0,"ref":"refs/heads/nightly-master","head":"fc4a4102c54b06f686588b0e3aac9c942c4f3e97","before":"5202a28a0d7d36ed1213dc0576549b7898594891","commits":[{"sha":"ad47d6abc5fee5d4f992fa4e10643e6f58511039","author":{"email":"ad952b69c80b75aa4e9d1e45057b03ba8d1a6fa5@kitware.com","name":"Chuck Atkins"},"message":"ADIOS: Properly handle variable sized data.\n\nRework the ADIOS writer and reader to properly address arrays that change size\nacross timesteps.\n\nChange-Id: I1612308accc36213cb2d21705088a058aba2d591","distinct":false,"url":"https://api.github.com/repos/Kitware/VTK/commits/ad47d6abc5fee5d4f992fa4e10643e6f58511039"},{"sha":"63c22698d5fd7b59ad8e9c7882c5b4b986ab760e","author":{"email":"ad952b69c80b75aa4e9d1e45057b03ba8d1a6fa5@kitware.com","name":"Chuck Atkins"},"message":"ADIOS: Fix memory leaks by adding deletes\n\nChange-Id: I73107bebe60d9b1351b1a0a5818b65b1668f3a81","distinct":false,"url":"https://api.github.com/repos/Kitware/VTK/commits/63c22698d5fd7b59ad8e9c7882c5b4b986ab760e"},{"sha":"fc4a4102c54b06f686588b0e3aac9c942c4f3e97","author":{"email":"ad952b69c80b75aa4e9d1e45057b03ba8d1a6fa5@kitware.com","name":"Chuck Atkins"},"message":"Merge topic 'fix-adios-multistep' into master\n\n63c22698 ADIOS: Fix memory leaks by adding deletes\nad47d6ab ADIOS: Properly handle variable sized data.","distinct":false,"url":"https://api.github.com/repos/Kitware/VTK/commits/fc4a4102c54b06f686588b0e3aac9c942c4f3e97"}]},"public":true,"created_at":"2015-01-01T01:05:12Z","org":{"id":87549,"login":"Kitware","gravatar_id":"","url":"https://api.github.com/orgs/Kitware","avatar_url":"https://avatars.githubusercontent.com/u/87549?"}}
{"id":"2489398083","type":"PushEvent","actor":{"id":3720783,"login":"designerwebhosting","gravatar_id":"","url":"https://api.github.com/users/designerwebhosting","avatar_url":"https://avatars.githubusercontent.com/u/3720783?"},"repo":{"id":20527117,"name":"designerwebhosting/christopherbyrne.github.io","url":"https://api.github.com/repos/designerwebhosting/christopherbyrne.github.io"},"payload":{"push_id":536753216,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"ff9f4da8bd5a71e0db5778bd27e29b075e9c65ac","before":"7e3ee7d19b64e0f0571098be4edb9729d09fb4f4","commits":[{"sha":"ff9f4da8bd5a71e0db5778bd27e29b075e9c65ac","author":{"email":"4bb0acc6ff8c0b6c31e50417877e6e3b3f1c65f0@googlemail.com","name":"Peter Noblee"},"message":"update 'date'","distinct":true,"url":"https://api.github.com/repos/designerwebhosting/christopherbyrne.github.io/commits/ff9f4da8bd5a71e0db5778bd27e29b075e9c65ac"}]},"public":true,"created_at":"2015-01-01T01:05:12Z"}
{"id":"2489398084","type":"PushEvent","actor":{"id":7670309,"login":"CodingMonkeyMonster","gravatar_id":"","url":"https://api.github.com/users/CodingMonkeyMonster","avatar_url":"https://avatars.githubusercontent.com/u/7670309?"},"repo":{"id":28644791,"name":"CodingMonkeyMonster/imageacqusitionfromtwosickrangers","url":"https://api.github.com/repos/CodingMonkeyMonster/imageacqusitionfromtwosickrangers"},"payload":{"push_id":536753217,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"c5db69a606212cc6d486c1f77ca3203cf1bf483f","before":"624b2e2b583755fc41eed2533198c30373c4760a","commits":[{"sha":"c339c869d03501ad837573ed6eaa294ac054586f","author":{"email":"120e3c204246881d0cb497deab877ed54b238a26@gmail.com","name":"CodeMonster"},"message":"Some modifications to incorporate the use of a second camera","distinct":true,"url":"https://api.github.com/repos/CodingMonkeyMonster/imageacqusitionfromtwosickrangers/commits/c339c869d03501ad837573ed6eaa294ac054586f"},{"sha":"c5db69a606212cc6d486c1f77ca3203cf1bf483f","author":{"email":"120e3c204246881d0cb497deab877ed54b238a26@gmail.com","name":"CodeMonster"},"message":"some more modifications before thinking about perhaps using asychronous threads or delegates?","distinct":true,"url":"https://api.github.com/repos/CodingMonkeyMonster/imageacqusitionfromtwosickrangers/commits/c5db69a606212cc6d486c1f77ca3203cf1bf483f"}]},"public":true,"created_at":"2015-01-01T01:05:12Z"}
{"id":"2489398086","type":"PushEvent","actor":{"id":10254849,"login":"NickSanzotta","gravatar_id":"","url":"https://api.github.com/users/NickSanzotta","avatar_url":"https://avatars.githubusercontent.com/u/10254849?"},"repo":{"id":28525122,"name":"NickSanzotta/strategicsec","url":"https://api.github.com/repos/NickSanzotta/strategicsec"},"payload":{"push_id":536753218,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"a018e85ada6048fc90131af5bd149a01712547b2","before":"0e3787e8504eb26395c2dc2e457275e41d56cf2e","commits":[{"sha":"a018e85ada6048fc90131af5bd149a01712547b2","author":{"email":"b49959da48d165fcfc8ebb39ae6132c54ef35404@outlook.com","name":"NickSanzotta"},"message":"domain function added","distinct":true,"url":"https://api.github.com/repos/NickSanzotta/strategicsec/commits/a018e85ada6048fc90131af5bd149a01712547b2"}]},"public":true,"created_at":"2015-01-01T01:05:13Z"}
{"id":"2489398088","type":"ForkEvent","actor":{"id":3356814,"login":"itpcc","gravatar_id":"","url":"https://api.github.com/users/itpcc","avatar_url":"https://avatars.githubusercontent.com/u/3356814?"},"repo":{"id":28064768,"name":"phpinfo-in-th/workshop-webboard","url":"https://api.github.com/repos/phpinfo-in-th/workshop-webboard"},"payload":{"forkee":{"id":28678270,"name":"workshop-webboard","full_name":"itpcc/workshop-webboard","owner":{"login":"itpcc","id":3356814,"avatar_url":"https://avatars.githubusercontent.com/u/3356814?v=3","gravatar_id":"","url":"https://api.github.com/users/itpcc","html_url":"https://github.com/itpcc","followers_url":"https://api.github.com/users/itpcc/followers","following_url":"https://api.github.com/users/itpcc/following{/other_user}","gists_url":"https://api.github.com/users/itpcc/gists{/gist_id}","starred_url":"https://api.github.com/users/itpcc/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/itpcc/subscriptions","organizations_url":"https://api.github.com/users/itpcc/orgs","repos_url":"https://api.github.com/users/itpcc/repos","events_url":"https://api.github.com/users/itpcc/events{/privacy}","received_events_url":"https://api.github.com/users/itpcc/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/itpcc/workshop-webboard","description":"","fork":true,"url":"https://api.github.com/repos/itpcc/workshop-webboard","forks_url":"https://api.github.com/repos/itpcc/workshop-webboard/forks","keys_url":"https://api.github.com/repos/itpcc/workshop-webboard/keys{/key_id}","collaborators_url":"https://api.github.com/repos/itpcc/workshop-webboard/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/itpcc/workshop-webboard/teams","hooks_url":"https://api.github.com/repos/itpcc/workshop-webboard/hooks","issue_events_url":"https://api.github.com/repos/itpcc/workshop-webboard/issues/events{/number}","events_url":"https://api.github.com/repos/itpcc/workshop-w
ebboard/events","assignees_url":"https://api.github.com/repos/itpcc/workshop-webboard/assignees{/user}","branches_url":"https://api.github.com/repos/itpcc/workshop-webboard/branches{/branch}","tags_url":"https://api.github.com/repos/itpcc/workshop-webboard/tags","blobs_url":"https://api.github.com/repos/itpcc/workshop-webboard/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/itpcc/workshop-webboard/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/itpcc/workshop-webboard/git/refs{/sha}","trees_url":"https://api.github.com/repos/itpcc/workshop-webboard/git/trees{/sha}","statuses_url":"https://api.github.com/repos/itpcc/workshop-webboard/statuses/{sha}","languages_url":"https://api.github.com/repos/itpcc/workshop-webboard/languages","stargazers_url":"https://api.github.com/repos/itpcc/workshop-webboard/stargazers","contributors_url":"https://api.github.com/repos/itpcc/workshop-webboard/contributors","subscribers_url":"https://api.github.com/repos/itpcc/workshop-webboard/subscribers","subscription_url":"https://api.github.com/repos/itpcc/workshop-webboard/subscription","commits_url":"https://api.github.com/repos/itpcc/workshop-webboard/commits{/sha}","git_commits_url":"https://api.github.com/repos/itpcc/workshop-webboard/git/commits{/sha}","comments_url":"https://api.github.com/repos/itpcc/workshop-webboard/comments{/number}","issue_comment_url":"https://api.github.com/repos/itpcc/workshop-webboard/issues/comments/{number}","contents_url":"https://api.github.com/repos/itpcc/workshop-webboard/contents/{+path}","compare_url":"https://api.github.com/repos/itpcc/workshop-webboard/compare/{base}...{head}","merges_url":"https://api.github.com/repos/itpcc/workshop-webboard/merges","archive_url":"https://api.github.com/repos/itpcc/workshop-webboard/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/itpcc/workshop-webboard/downloads","issues_url":"https://api.github.com/repos/itpcc/workshop-webboard/issues{/number}","pulls_url":"https:
//api.github.com/repos/itpcc/workshop-webboard/pulls{/number}","milestones_url":"https://api.github.com/repos/itpcc/workshop-webboard/milestones{/number}","notifications_url":"https://api.github.com/repos/itpcc/workshop-webboard/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/itpcc/workshop-webboard/labels{/name}","releases_url":"https://api.github.com/repos/itpcc/workshop-webboard/releases{/id}","created_at":"2015-01-01T01:05:13Z","updated_at":"2014-12-16T01:42:48Z","pushed_at":"2014-12-16T01:42:48Z","git_url":"git://github.com/itpcc/workshop-webboard.git","ssh_url":"git@github.com:itpcc/workshop-webboard.git","clone_url":"https://github.com/itpcc/workshop-webboard.git","svn_url":"https://github.com/itpcc/workshop-webboard","homepage":null,"size":140,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:05:13Z"}
{"id":"2489398089","type":"PushEvent","actor":{"id":106133,"login":"Tiggar","gravatar_id":"","url":"https://api.github.com/users/Tiggar","avatar_url":"https://avatars.githubusercontent.com/u/106133?"},"repo":{"id":27003508,"name":"Tiggar/isp-performance","url":"https://api.github.com/repos/Tiggar/isp-performance"},"payload":{"push_id":536753219,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"2dd68c64ebb4a14935823a00f0ce08df238f6cd5","before":"512ea3ddc142c05f89eaf1b69f5a084ac1f99ba6","commits":[{"sha":"2dd68c64ebb4a14935823a00f0ce08df238f6cd5","author":{"email":"5069df3b8e9785f1eb5e6bda1f2483f61b73e1aa@gmail.com","name":"Jan Michael"},"message":"updates all charts","distinct":true,"url":"https://api.github.com/repos/Tiggar/isp-performance/commits/2dd68c64ebb4a14935823a00f0ce08df238f6cd5"}]},"public":true,"created_at":"2015-01-01T01:05:13Z"}
{"id":"2489398090","type":"PushEvent","actor":{"id":9205456,"login":"Anthony-Dev","gravatar_id":"","url":"https://api.github.com/users/Anthony-Dev","avatar_url":"https://avatars.githubusercontent.com/u/9205456?"},"repo":{"id":28667691,"name":"Anthony-Dev/ModdedMinecraftJar","url":"https://api.github.com/repos/Anthony-Dev/ModdedMinecraftJar"},"payload":{"push_id":536753220,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"3956e0b94a256be19bb61d6c54e4534f03e6f99d","before":"05685975ac219c387b900e0f05665053f8e3a7f6","commits":[{"sha":"3956e0b94a256be19bb61d6c54e4534f03e6f99d","author":{"email":"28580e7b9fd3af655a23a148dc5c207632216f69@outlook.com","name":"Anthony-Dev"},"message":"Launcher Jar 8\n\nUUID Changes to this.id","distinct":true,"url":"https://api.github.com/repos/Anthony-Dev/ModdedMinecraftJar/commits/3956e0b94a256be19bb61d6c54e4534f03e6f99d"}]},"public":true,"created_at":"2015-01-01T01:05:13Z"}
{"id":"2489398095","type":"PushEvent","actor":{"id":1449778,"login":"billperegoy","gravatar_id":"","url":"https://api.github.com/users/billperegoy","avatar_url":"https://avatars.githubusercontent.com/u/1449778?"},"repo":{"id":28676506,"name":"billperegoy/parse_args","url":"https://api.github.com/repos/billperegoy/parse_args"},"payload":{"push_id":536753221,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"dd4eb8719dc48ca7e9bd948ffb9fe7ce492d70de","before":"4fc9773581df0562d3a49040ce00e1ef5c962bd8","commits":[{"sha":"dd4eb8719dc48ca7e9bd948ffb9fe7ce492d70de","author":{"email":"c692d6a10598e0a801576fdd4ecf3c37e45bfbc4@billperegoy.com","name":"billperegoy"},"message":"Added cane quality checks to Rakefile.","distinct":true,"url":"https://api.github.com/repos/billperegoy/parse_args/commits/dd4eb8719dc48ca7e9bd948ffb9fe7ce492d70de"}]},"public":true,"created_at":"2015-01-01T01:05:14Z"}
{"id":"2489398096","type":"WatchEvent","actor":{"id":1534224,"login":"tracyapps","gravatar_id":"","url":"https://api.github.com/users/tracyapps","avatar_url":"https://avatars.githubusercontent.com/u/1534224?"},"repo":{"id":19757917,"name":"maxwellito/vivus","url":"https://api.github.com/repos/maxwellito/vivus"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:05:14Z"}
{"id":"2489398100","type":"WatchEvent","actor":{"id":3421858,"login":"codepreneur","gravatar_id":"","url":"https://api.github.com/users/codepreneur","avatar_url":"https://avatars.githubusercontent.com/u/3421858?"},"repo":{"id":5085231,"name":"WhisperSystems/RedPhone","url":"https://api.github.com/repos/WhisperSystems/RedPhone"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:05:15Z","org":{"id":702459,"login":"WhisperSystems","gravatar_id":"","url":"https://api.github.com/orgs/WhisperSystems","avatar_url":"https://avatars.githubusercontent.com/u/702459?"}}
{"id":"2489398106","type":"PullRequestReviewCommentEvent","actor":{"id":523287,"login":"j2sol","gravatar_id":"","url":"https://api.github.com/users/j2sol","avatar_url":"https://avatars.githubusercontent.com/u/523287?"},"repo":{"id":11848896,"name":"blueboxgroup/ursula","url":"https://api.github.com/repos/blueboxgroup/ursula"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397290","id":22397290,"diff_hunk":"@@ -1,121 +1,92 @@\n ---\n-- name: install apache\n-  apt: pkg={{ item }}\n-  with_items:\n-    - apache2\n-    - libapache2-mod-wsgi\n-\n - name: lesscpy must be in apache PATH\n   pip: name=lesscpy version=0.9j\n \n - name: get horizon source repo\n-  git: repo={{ openstack.git_mirror }}/horizon.git\n-       dest=/opt/stack/horizon\n-       version={{ horizon.rev }}\n-       update={{ openstack.git_update }}\n+  git: |\n+    repo={{ openstack.git_mirror}}/horizon.git\n+    dest=/opt/stack/horizon\n+    version={{ horizon.rev }}\n+    update={{ openstack.git_update }}\n   notify:\n     - setup horizon venv\n     - compress horizon assets\n \n-- template: src=opt/stack/horizon/hide-external-networks.patch dest=/opt/stack/horizon/hide-external-networks.patch mode=0644\n-- shell: patch -p1 < hide-external-networks.patch chdir=/opt/stack/horizon\n-  notify:\n-    - setup horizon venv\n-\n - name: add python-memcached to horizon requirements\n-  lineinfile: dest=/opt/stack/horizon/requirements.txt\n-              regexp=^python-memcached\n-              line=python-memcached\n+  lineinfile: dest=/opt/stack/horizon/requirements.txt regexp=^python-memcached line=python-memcached\n   notify:\n     - setup horizon venv\n \n-- name: disable apache status\n-  command: a2dismod status\n-  notify:\n-    - restart apache\n-\n-- name: apache ports config\n-  template: src=etc/apache2/ports.conf\n-            dest=/etc/apache2/ports.conf\n-  notify:\n-    - restart apache\n-\n-- name: disable default apache 
site\n-  command: a2dissite 000-default\n+- name: make sure apache knows about horizon ports\n+  lineinfile: dest=/etc/apache2/ports.conf line=\"Listen 8080\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config (12.04)\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard\n+- name: create dashboard virtualhost on precise\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard\n   when: ansible_distribution_version == \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard.conf\n+- name: create dashboard virtualhost on other\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard.conf\n   when: ansible_distribution_version != \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n - name: enable horizon apache site\n-  command: a2ensite openstack_dashboard\n+  apache2_site: state=enabled name=openstack_dashboard\n   notify:\n-    - restart apache\n-\n-- name: static asset directories\n-  file: dest={{ item }}\n-        state=directory\n-        owner=www-data\n-        group=www-data\n-        mode=0755\n+    - reload apache\n+\n+- name: create static asset dirs\n+  file: |\n+    dest={{ item }}\n+    state=directory\n+    owner=www-data\n+    group=www-data\n+    mode=0755\n   with_items:\n     - /opt/stack/horizon/static\n     - /opt/stack/horizon/static/dashboard\n \n-- name: horizon local settings\n-  template: src=opt/stack/horizon/openstack_dashboard/local/local_settings.py\n-            dest=/opt/stack/horizon/openstack_dashboard/local/local_settings.py\n-            
mode=0644\n+- name: dashboard settings\n+  template: |\n+    src=opt/stack/horizon/openstack_dashboard/local/local_settings.py\n+    dest=/opt/stack/horizon/openstack_dashboard/local/local_settings.py\n+    mode=0644\n   notify:\n-    - restart apache\n+    - reload apache\n \n - name: custom horizon logo\n-  get_url: url={{ horizon.logo_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo.png\n-           mode=0644 force=yes\n+  get_url: url={{ horizon.logo_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo.png mode=0644 force=yes","path":"roles/horizon/tasks/main.yml","position":123,"original_position":123,"commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","original_commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"j2sol","id":523287,"avatar_url":"https://avatars.githubusercontent.com/u/523287?v=3","gravatar_id":"","url":"https://api.github.com/users/j2sol","html_url":"https://github.com/j2sol","followers_url":"https://api.github.com/users/j2sol/followers","following_url":"https://api.github.com/users/j2sol/following{/other_user}","gists_url":"https://api.github.com/users/j2sol/gists{/gist_id}","starred_url":"https://api.github.com/users/j2sol/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/j2sol/subscriptions","organizations_url":"https://api.github.com/users/j2sol/orgs","repos_url":"https://api.github.com/users/j2sol/repos","events_url":"https://api.github.com/users/j2sol/events{/privacy}","received_events_url":"https://api.github.com/users/j2sol/received_events","type":"User","site_admin":false},"body":"Why did this go single 
line?","created_at":"2015-01-01T01:05:15Z","updated_at":"2015-01-01T01:05:15Z","html_url":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397290","pull_request_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397290"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397290"},"pull_request":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"}}},"pull_request":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","id":26738851,"html_url":"https://github.com/blueboxgroup/ursula/pull/705","diff_url":"https://github.com/blueboxgroup/ursula/pull/705.diff","patch_url":"https://github.com/blueboxgroup/ursula/pull/705.patch","issue_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705","number":705,"state":"open","locked":false,"title":"WIP:  apache for loadbalancing","user":{"login":"paulczar","id":2488346,"avatar_url":"https://avatars.githubusercontent.com/u/2488346?v=3","gravatar_id":"","url":"https://api.github.com/users/paulczar","html_url":"https://github.com/paulczar","followers_url":"https://api.github.com/users/paulczar/followers","following_url":"https://api.github.com/users/paulczar/following{/other_user}","gists_url":"https://api.github.com/users/paulczar/gists{/gist_id}","starred_url":"https://api.github.com/users/paulczar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/paulczar/subscriptions","organizations_url":"https://api.github.com/users/paulczar/orgs","repos_url":"https://api.github.com/users/paulczar/repos","events_url":"https://api.github.com/users/paulczar/events{/privacy}","received_events_url":"https://api.github.com/users/paulczar/received_events","type":"User","site_admin":false},"body":"This is a quick POC / WIP to demo using apache instead of haproxy for loadbalancing our APIs.\r\n\r\nI think this gives us more flexibiltiy as we 
can enable in the APIs role itself ( in this case in keystone ) rather than a big monolithic haproxy.conf.      We also already have apache running for horizon, so it could reduce number of services.    apache also has better logging options that haproxy which can only log to syslog. ","created_at":"2015-01-01T00:04:13Z","updated_at":"2015-01-01T01:05:15Z","closed_at":null,"merged_at":null,"merge_commit_sha":"9b91693f11e166c9ee53836f19697868d412bf76","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits","review_comments_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments","review_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f","head":{"label":"blueboxgroup:use_apache_for_lb","ref":"use_apache_for_lb","sha":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","
site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating 
OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/commen
ts/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"base":{"label":"blueboxgroup:master","ref":"master","sha":"34b83c65ff0de2f8b006d8ce4f76919fe0167bbf","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/fo
llowing{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating 
OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/commen
ts/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705"},"issue":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705"},"comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments"},"review_comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments"},"review_comment":{"href":"https://
api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits"},"statuses":{"href":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f"}}}},"public":true,"created_at":"2015-01-01T01:05:15Z","org":{"id":458705,"login":"blueboxgroup","gravatar_id":"","url":"https://api.github.com/orgs/blueboxgroup","avatar_url":"https://avatars.githubusercontent.com/u/458705?"}}
{"id":"2489398107","type":"IssuesEvent","actor":{"id":2982725,"login":"sharef88","gravatar_id":"","url":"https://api.github.com/users/sharef88","avatar_url":"https://avatars.githubusercontent.com/u/2982725?"},"repo":{"id":22777385,"name":"ChatFawkes/Flux-Galaxy","url":"https://api.github.com/repos/ChatFawkes/Flux-Galaxy"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/ChatFawkes/Flux-Galaxy/issues/66","labels_url":"https://api.github.com/repos/ChatFawkes/Flux-Galaxy/issues/66/labels{/name}","comments_url":"https://api.github.com/repos/ChatFawkes/Flux-Galaxy/issues/66/comments","events_url":"https://api.github.com/repos/ChatFawkes/Flux-Galaxy/issues/66/events","html_url":"https://github.com/ChatFawkes/Flux-Galaxy/issues/66","id":53210275,"number":66,"title":"Crash that I can't figure out","user":{"login":"sharef88","id":2982725,"avatar_url":"https://avatars.githubusercontent.com/u/2982725?v=3","gravatar_id":"","url":"https://api.github.com/users/sharef88","html_url":"https://github.com/sharef88","followers_url":"https://api.github.com/users/sharef88/followers","following_url":"https://api.github.com/users/sharef88/following{/other_user}","gists_url":"https://api.github.com/users/sharef88/gists{/gist_id}","starred_url":"https://api.github.com/users/sharef88/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/sharef88/subscriptions","organizations_url":"https://api.github.com/users/sharef88/orgs","repos_url":"https://api.github.com/users/sharef88/repos","events_url":"https://api.github.com/users/sharef88/events{/privacy}","received_events_url":"https://api.github.com/users/sharef88/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:05:16Z","updated_at":"2015-01-01T01:05:16Z","closed_at":null,"body":"Crash-Report generated by the server.\r\nhttp://pastebin.com/k9z2X98f\r\nI had placed a small compact 
machine about 30m before this crash.  I was removing some mechanisim universal cable with an unenchanted bound pickaxe about 10 blocks away from said compact machine. The machine was inert and empty.  I cant figure out how to fix this.  MCEdit surgery didn't help the matter, nor did removing compact machines mod, or the related file in data/ or the dim.\r\nI'm using pack version 7.3."}},"public":true,"created_at":"2015-01-01T01:05:16Z"}
{"id":"2489398112","type":"PushEvent","actor":{"id":238354,"login":"variousred","gravatar_id":"","url":"https://api.github.com/users/variousred","avatar_url":"https://avatars.githubusercontent.com/u/238354?"},"repo":{"id":6274404,"name":"G5/g5-content-management-system","url":"https://api.github.com/repos/G5/g5-content-management-system"},"payload":{"push_id":536753224,"size":1,"distinct_size":1,"ref":"refs/heads/fix-deep-clone","head":"b16f39b5d6be375e42eef7183ef39ed67077bee0","before":"81baf7738ce7da9084ecd6f657cd3c0e60f888a2","commits":[{"sha":"b16f39b5d6be375e42eef7183ef39ed67077bee0","author":{"email":"16ea8d52c08316685a257e07ddecf7165a502f6d@gmail.com","name":"Michael Mitchell"},"message":" removes pry","distinct":true,"url":"https://api.github.com/repos/G5/g5-content-management-system/commits/b16f39b5d6be375e42eef7183ef39ed67077bee0"}]},"public":true,"created_at":"2015-01-01T01:05:17Z","org":{"id":2396851,"login":"G5","gravatar_id":"","url":"https://api.github.com/orgs/G5","avatar_url":"https://avatars.githubusercontent.com/u/2396851?"}}
{"id":"2489398116","type":"PushEvent","actor":{"id":312301,"login":"davidturner","gravatar_id":"","url":"https://api.github.com/users/davidturner","avatar_url":"https://avatars.githubusercontent.com/u/312301?"},"repo":{"id":26051556,"name":"davidturner/dotfiles","url":"https://api.github.com/repos/davidturner/dotfiles"},"payload":{"push_id":536753226,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"c526773632b35732e3955e054dc4d7248ab49238","before":"65c8456130b0154315b1a3684b2b46c4b0144fa8","commits":[{"sha":"c526773632b35732e3955e054dc4d7248ab49238","author":{"email":"aa743a0aaec8f7d7a1f01442503957f4d7a2d634@davidturner.name","name":"David Turner"},"message":"Streamlining setup process.","distinct":true,"url":"https://api.github.com/repos/davidturner/dotfiles/commits/c526773632b35732e3955e054dc4d7248ab49238"}]},"public":true,"created_at":"2015-01-01T01:05:17Z"}
{"id":"2489398124","type":"WatchEvent","actor":{"id":51633,"login":"marklise","gravatar_id":"","url":"https://api.github.com/users/marklise","avatar_url":"https://avatars.githubusercontent.com/u/51633?"},"repo":{"id":242821,"name":"omz/AppSales-Mobile","url":"https://api.github.com/repos/omz/AppSales-Mobile"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:05:18Z"}
{"id":"2489398131","type":"PushEvent","actor":{"id":939501,"login":"jacebrowning","gravatar_id":"","url":"https://api.github.com/users/jacebrowning","avatar_url":"https://avatars.githubusercontent.com/u/939501?"},"repo":{"id":19165491,"name":"jacebrowning/yorm","url":"https://api.github.com/repos/jacebrowning/yorm"},"payload":{"push_id":536753230,"size":1,"distinct_size":1,"ref":"refs/heads/develop","head":"44343210f475f5d87a70dab541e9158ddc90c397","before":"9e70ef1c7855f04cbcd073c05a3b727e08b8df5f","commits":[{"sha":"44343210f475f5d87a70dab541e9158ddc90c397","author":{"email":"567f1b61689b9d694b4628a3551d98928040e4fd@gmail.com","name":"Jace Browning"},"message":"Add standard types with NoneType defaults","distinct":true,"url":"https://api.github.com/repos/jacebrowning/yorm/commits/44343210f475f5d87a70dab541e9158ddc90c397"}]},"public":true,"created_at":"2015-01-01T01:05:20Z"}
{"id":"2489398136","type":"IssueCommentEvent","actor":{"id":9351018,"login":"lblxh3","gravatar_id":"","url":"https://api.github.com/users/lblxh3","avatar_url":"https://avatars.githubusercontent.com/u/9351018?"},"repo":{"id":28678195,"name":"TTMTT/iCL0udin","url":"https://api.github.com/repos/TTMTT/iCL0udin"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1","labels_url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1/labels{/name}","comments_url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1/comments","events_url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1/events","html_url":"https://github.com/TTMTT/iCL0udin/issues/1","id":53210206,"number":1,"title":"Discuss1","user":{"login":"TTMTT","id":6964047,"avatar_url":"https://avatars.githubusercontent.com/u/6964047?v=3","gravatar_id":"","url":"https://api.github.com/users/TTMTT","html_url":"https://github.com/TTMTT","followers_url":"https://api.github.com/users/TTMTT/followers","following_url":"https://api.github.com/users/TTMTT/following{/other_user}","gists_url":"https://api.github.com/users/TTMTT/gists{/gist_id}","starred_url":"https://api.github.com/users/TTMTT/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/TTMTT/subscriptions","organizations_url":"https://api.github.com/users/TTMTT/orgs","repos_url":"https://api.github.com/users/TTMTT/repos","events_url":"https://api.github.com/users/TTMTT/events{/privacy}","received_events_url":"https://api.github.com/users/TTMTT/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2015-01-01T01:02:34Z","updated_at":"2015-01-01T01:05:21Z","closed_at":null,"body":"Now you can download vresion 1.0 from :\r\n---------------------------------------------------\r\nhttp://www.icloudin.net\r\n-----------------------------\r\nWow, ipod touch 5G (8.1) - iCL0udin v1.0 bypass activation 
(icloud)\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/tZmEdlDGNu4\r\n--------------------------------------\r\niCL0udin v1.0 bypass activation (icloud) - ipad mini 2G (7.1.1)\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/tevYyBN2QCQ\r\n---------------------------------------\r\nVideo for bypass icloud (iCL0udin v1.0) for iphone 4 CDMA ..\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/i85-D6N2YLk\r\n-------------------------------------\r\nNew video for iCL0udin v1.0 bypass icloud (3 iphones 7.1.2):\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/p51TNlCr7ug\r\n-------------------------------------\r\niCL0udin v1.0 -> %100\r\n----------------------------\r\nRemaining: %3 testing with some people..\r\n-----------------------------------------------------\r\nLast Method:\r\n-----------------\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any ios)\r\nmethod 3 : via (change some string by hex on ELF file << some times i got error)\r\nmethod 4 : via (use apple ssl cert or real ssl in server and change some string in iphone)\r\niCL0udin v1.0 have this method:\r\n-----------------------------------------\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any 
ios)"},"comment":{"url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/comments/68477333","html_url":"https://github.com/TTMTT/iCL0udin/issues/1#issuecomment-68477333","issue_url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1","id":68477333,"user":{"login":"lblxh3","id":9351018,"avatar_url":"https://avatars.githubusercontent.com/u/9351018?v=3","gravatar_id":"","url":"https://api.github.com/users/lblxh3","html_url":"https://github.com/lblxh3","followers_url":"https://api.github.com/users/lblxh3/followers","following_url":"https://api.github.com/users/lblxh3/following{/other_user}","gists_url":"https://api.github.com/users/lblxh3/gists{/gist_id}","starred_url":"https://api.github.com/users/lblxh3/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/lblxh3/subscriptions","organizations_url":"https://api.github.com/users/lblxh3/orgs","repos_url":"https://api.github.com/users/lblxh3/repos","events_url":"https://api.github.com/users/lblxh3/events{/privacy}","received_events_url":"https://api.github.com/users/lblxh3/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:05:21Z","updated_at":"2015-01-01T01:05:21Z","body":"love u"}},"public":true,"created_at":"2015-01-01T01:05:21Z"}
{"id":"2489398140","type":"PushEvent","actor":{"id":2812278,"login":"beret595","gravatar_id":"","url":"https://api.github.com/users/beret595","avatar_url":"https://avatars.githubusercontent.com/u/2812278?"},"repo":{"id":28470088,"name":"beret595/Ucar_Operation_Crm_Finance","url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance"},"payload":{"push_id":536753232,"size":6,"distinct_size":1,"ref":"refs/heads/master","head":"4be49692843556bedea40c3fbe6954972dd7beb0","before":"83f3a8e7891270f54d4119a862c57bfaf1db5475","commits":[{"sha":"aa16c2df1091bdf449c6b6a4b4ae02cfde6daa0d","author":{"email":"230ed9215685d4acc3825e7461feafb870abaeb3@163.com","name":"lixi1984"},"message":"保险提醒数据不准确,将搜索结果按照以下字段显示\n\n保险提醒数据不准确,将搜索结果按照以下字段显示 .\n客户 品牌 车型 车牌 保险到期 保险公司 邀约员 生成日期 分配日期 案件状态 操作 查看\n将利润管理单元去掉\n呼叫管理,利润管理,绩效管理下面多了下划线,去掉","distinct":false,"url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/commits/aa16c2df1091bdf449c6b6a4b4ae02cfde6daa0d"},{"sha":"2ff7d33c43d841388406502538cc14f07139a34d","author":{"email":"230ed9215685d4acc3825e7461feafb870abaeb3@163.com","name":"lixi1984"},"message":"Revert \"保险提醒数据不准确,将搜索结果按照以下字段显示\"\n\nThis reverts commit aa16c2df1091bdf449c6b6a4b4ae02cfde6daa0d.","distinct":false,"url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/commits/2ff7d33c43d841388406502538cc14f07139a34d"},{"sha":"eee8c95ea1793f864928a018de1f821428948951","author":{"email":"230ed9215685d4acc3825e7461feafb870abaeb3@163.com","name":"lixi1984"},"message":"Revert \"Revert \"保险提醒数据不准确,将搜索结果按照以下字段显示\"\"\n\nThis reverts commit 
2ff7d33c43d841388406502538cc14f07139a34d.","distinct":false,"url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/commits/eee8c95ea1793f864928a018de1f821428948951"},{"sha":"999eb6abb00d4f80ab2f908ddb75c591dae44e0e","author":{"email":"230ed9215685d4acc3825e7461feafb870abaeb3@163.com","name":"lixi1984"},"message":"动态库更新\n\n动态库更新","distinct":false,"url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/commits/999eb6abb00d4f80ab2f908ddb75c591dae44e0e"},{"sha":"fb9307eefb142d216d38294f23e42779e0aecbea","author":{"email":"230ed9215685d4acc3825e7461feafb870abaeb3@163.com","name":"lixi1984"},"message":"数据备份\n\n数据备份 车辆迁移,人员信息迁移时效验客户编码","distinct":false,"url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/commits/fb9307eefb142d216d38294f23e42779e0aecbea"},{"sha":"4be49692843556bedea40c3fbe6954972dd7beb0","author":{"email":"3218d7ac8ea669170780ae5452d9ed76867b408e@foxmail.com","name":"beret595"},"message":"Merge pull request #1 from beret595/lixi1984\n\nLixi1984","distinct":true,"url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/commits/4be49692843556bedea40c3fbe6954972dd7beb0"}]},"public":true,"created_at":"2015-01-01T01:05:22Z"}
{"id":"2489398141","type":"PullRequestEvent","actor":{"id":2812278,"login":"beret595","gravatar_id":"","url":"https://api.github.com/users/beret595","avatar_url":"https://avatars.githubusercontent.com/u/2812278?"},"repo":{"id":28470088,"name":"beret595/Ucar_Operation_Crm_Finance","url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance"},"payload":{"action":"closed","number":1,"pull_request":{"url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/pulls/1","id":26714507,"html_url":"https://github.com/beret595/Ucar_Operation_Crm_Finance/pull/1","diff_url":"https://github.com/beret595/Ucar_Operation_Crm_Finance/pull/1.diff","patch_url":"https://github.com/beret595/Ucar_Operation_Crm_Finance/pull/1.patch","issue_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/issues/1","number":1,"state":"closed","locked":false,"title":"Lixi1984","user":{"login":"beret595","id":2812278,"avatar_url":"https://avatars.githubusercontent.com/u/2812278?v=3","gravatar_id":"","url":"https://api.github.com/users/beret595","html_url":"https://github.com/beret595","followers_url":"https://api.github.com/users/beret595/followers","following_url":"https://api.github.com/users/beret595/following{/other_user}","gists_url":"https://api.github.com/users/beret595/gists{/gist_id}","starred_url":"https://api.github.com/users/beret595/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/beret595/subscriptions","organizations_url":"https://api.github.com/users/beret595/orgs","repos_url":"https://api.github.com/users/beret595/repos","events_url":"https://api.github.com/users/beret595/events{/privacy}","received_events_url":"https://api.github.com/users/beret595/received_events","type":"User","site_admin":false},"body":"1.业务系统中,客户编号不是7位数字和字母组合的不要上传至邀约系统\r\n2.保养提醒数据不准确,\r\n3.保险提醒数据不准确 
","created_at":"2014-12-31T04:03:10Z","updated_at":"2015-01-01T01:05:21Z","closed_at":"2015-01-01T01:05:21Z","merged_at":"2015-01-01T01:05:21Z","merge_commit_sha":"29b658d7803c1e09eae5558e8c34b52e90e270f0","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/pulls/1/commits","review_comments_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/pulls/1/comments","review_comment_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/pulls/comments/{number}","comments_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/issues/1/comments","statuses_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/statuses/fb9307eefb142d216d38294f23e42779e0aecbea","head":{"label":"beret595:lixi1984","ref":"lixi1984","sha":"fb9307eefb142d216d38294f23e42779e0aecbea","user":{"login":"beret595","id":2812278,"avatar_url":"https://avatars.githubusercontent.com/u/2812278?v=3","gravatar_id":"","url":"https://api.github.com/users/beret595","html_url":"https://github.com/beret595","followers_url":"https://api.github.com/users/beret595/followers","following_url":"https://api.github.com/users/beret595/following{/other_user}","gists_url":"https://api.github.com/users/beret595/gists{/gist_id}","starred_url":"https://api.github.com/users/beret595/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/beret595/subscriptions","organizations_url":"https://api.github.com/users/beret595/orgs","repos_url":"https://api.github.com/users/beret595/repos","events_url":"https://api.github.com/users/beret595/events{/privacy}","received_events_url":"https://api.github.com/users/beret595/received_events","type":"User","site_admin":false},"repo":{"id":28470088,"name":"Ucar_Operation_Crm_Finance","full_name":"beret595/Ucar_Operation_Crm_Finance","owner":{"login":"beret595","id":2812278,"avatar_url":"https://avatars.githubusercontent.com/u/2812278?v=3","gravatar_id":""
,"url":"https://api.github.com/users/beret595","html_url":"https://github.com/beret595","followers_url":"https://api.github.com/users/beret595/followers","following_url":"https://api.github.com/users/beret595/following{/other_user}","gists_url":"https://api.github.com/users/beret595/gists{/gist_id}","starred_url":"https://api.github.com/users/beret595/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/beret595/subscriptions","organizations_url":"https://api.github.com/users/beret595/orgs","repos_url":"https://api.github.com/users/beret595/repos","events_url":"https://api.github.com/users/beret595/events{/privacy}","received_events_url":"https://api.github.com/users/beret595/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/beret595/Ucar_Operation_Crm_Finance","description":null,"fork":false,"url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance","forks_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/forks","keys_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/keys{/key_id}","collaborators_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/teams","hooks_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/hooks","issue_events_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/issues/events{/number}","events_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/events","assignees_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/assignees{/user}","branches_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/branches{/branch}","tags_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/tags","blobs_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/git/blobs{/sha}","git_tags_url":"h
ttps://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/git/refs{/sha}","trees_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/git/trees{/sha}","statuses_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/statuses/{sha}","languages_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/languages","stargazers_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/stargazers","contributors_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/contributors","subscribers_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/subscribers","subscription_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/subscription","commits_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/commits{/sha}","git_commits_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/git/commits{/sha}","comments_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/comments{/number}","issue_comment_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/issues/comments/{number}","contents_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/contents/{+path}","compare_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/compare/{base}...{head}","merges_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/merges","archive_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/downloads","issues_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/issues{/number}","pulls_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/pulls{/number}","milestones_url":"https://api.github.com/repos/beret595/Ucar
_Operation_Crm_Finance/milestones{/number}","notifications_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/labels{/name}","releases_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/releases{/id}","created_at":"2014-12-25T03:53:57Z","updated_at":"2014-12-30T02:22:03Z","pushed_at":"2015-01-01T01:05:21Z","git_url":"git://github.com/beret595/Ucar_Operation_Crm_Finance.git","ssh_url":"git@github.com:beret595/Ucar_Operation_Crm_Finance.git","clone_url":"https://github.com/beret595/Ucar_Operation_Crm_Finance.git","svn_url":"https://github.com/beret595/Ucar_Operation_Crm_Finance","homepage":null,"size":0,"stargazers_count":0,"watchers_count":0,"language":"C#","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"beret595:master","ref":"master","sha":"83f3a8e7891270f54d4119a862c57bfaf1db5475","user":{"login":"beret595","id":2812278,"avatar_url":"https://avatars.githubusercontent.com/u/2812278?v=3","gravatar_id":"","url":"https://api.github.com/users/beret595","html_url":"https://github.com/beret595","followers_url":"https://api.github.com/users/beret595/followers","following_url":"https://api.github.com/users/beret595/following{/other_user}","gists_url":"https://api.github.com/users/beret595/gists{/gist_id}","starred_url":"https://api.github.com/users/beret595/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/beret595/subscriptions","organizations_url":"https://api.github.com/users/beret595/orgs","repos_url":"https://api.github.com/users/beret595/repos","events_url":"https://api.github.com/users/beret595/events{/privacy}","received_events_url":"https://api.github.com/users/beret595/received_events","type":"User","site_admin":false},"
repo":{"id":28470088,"name":"Ucar_Operation_Crm_Finance","full_name":"beret595/Ucar_Operation_Crm_Finance","owner":{"login":"beret595","id":2812278,"avatar_url":"https://avatars.githubusercontent.com/u/2812278?v=3","gravatar_id":"","url":"https://api.github.com/users/beret595","html_url":"https://github.com/beret595","followers_url":"https://api.github.com/users/beret595/followers","following_url":"https://api.github.com/users/beret595/following{/other_user}","gists_url":"https://api.github.com/users/beret595/gists{/gist_id}","starred_url":"https://api.github.com/users/beret595/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/beret595/subscriptions","organizations_url":"https://api.github.com/users/beret595/orgs","repos_url":"https://api.github.com/users/beret595/repos","events_url":"https://api.github.com/users/beret595/events{/privacy}","received_events_url":"https://api.github.com/users/beret595/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/beret595/Ucar_Operation_Crm_Finance","description":null,"fork":false,"url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance","forks_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/forks","keys_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/keys{/key_id}","collaborators_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/teams","hooks_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/hooks","issue_events_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/issues/events{/number}","events_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/events","assignees_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/assignees{/user}","branches_url":"https://api.github.com/repos/beret595/Ucar_Opera
tion_Crm_Finance/branches{/branch}","tags_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/tags","blobs_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/git/refs{/sha}","trees_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/git/trees{/sha}","statuses_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/statuses/{sha}","languages_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/languages","stargazers_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/stargazers","contributors_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/contributors","subscribers_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/subscribers","subscription_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/subscription","commits_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/commits{/sha}","git_commits_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/git/commits{/sha}","comments_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/comments{/number}","issue_comment_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/issues/comments/{number}","contents_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/contents/{+path}","compare_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/compare/{base}...{head}","merges_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/merges","archive_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/downloads","issues_url":"https
://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/issues{/number}","pulls_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/pulls{/number}","milestones_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/milestones{/number}","notifications_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/labels{/name}","releases_url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/releases{/id}","created_at":"2014-12-25T03:53:57Z","updated_at":"2014-12-30T02:22:03Z","pushed_at":"2015-01-01T01:05:21Z","git_url":"git://github.com/beret595/Ucar_Operation_Crm_Finance.git","ssh_url":"git@github.com:beret595/Ucar_Operation_Crm_Finance.git","clone_url":"https://github.com/beret595/Ucar_Operation_Crm_Finance.git","svn_url":"https://github.com/beret595/Ucar_Operation_Crm_Finance","homepage":null,"size":0,"stargazers_count":0,"watchers_count":0,"language":"C#","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/pulls/1"},"html":{"href":"https://github.com/beret595/Ucar_Operation_Crm_Finance/pull/1"},"issue":{"href":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/issues/1"},"comments":{"href":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/issues/1/comments"},"review_comments":{"href":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/pulls/1/comments"},"review_comment":{"href":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance/pulls/1/commits"},"statuses":{"href":"https://api.github.
com/repos/beret595/Ucar_Operation_Crm_Finance/statuses/fb9307eefb142d216d38294f23e42779e0aecbea"}},"merged":true,"mergeable":null,"mergeable_state":"unknown","merged_by":{"login":"beret595","id":2812278,"avatar_url":"https://avatars.githubusercontent.com/u/2812278?v=3","gravatar_id":"","url":"https://api.github.com/users/beret595","html_url":"https://github.com/beret595","followers_url":"https://api.github.com/users/beret595/followers","following_url":"https://api.github.com/users/beret595/following{/other_user}","gists_url":"https://api.github.com/users/beret595/gists{/gist_id}","starred_url":"https://api.github.com/users/beret595/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/beret595/subscriptions","organizations_url":"https://api.github.com/users/beret595/orgs","repos_url":"https://api.github.com/users/beret595/repos","events_url":"https://api.github.com/users/beret595/events{/privacy}","received_events_url":"https://api.github.com/users/beret595/received_events","type":"User","site_admin":false},"comments":0,"review_comments":0,"commits":5,"additions":755,"deletions":44,"changed_files":11}},"public":true,"created_at":"2015-01-01T01:05:22Z"}
{"id":"2489398144","type":"WatchEvent","actor":{"id":1015032,"login":"miketahani","gravatar_id":"","url":"https://api.github.com/users/miketahani","avatar_url":"https://avatars.githubusercontent.com/u/1015032?"},"repo":{"id":4437769,"name":"casatt/html5-videoEditor","url":"https://api.github.com/repos/casatt/html5-videoEditor"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:05:22Z"}
{"id":"2489398151","type":"PushEvent","actor":{"id":6825691,"login":"sogeo","gravatar_id":"","url":"https://api.github.com/users/sogeo","avatar_url":"https://avatars.githubusercontent.com/u/6825691?"},"repo":{"id":17319070,"name":"sogeo/DM01AVSO24","url":"https://api.github.com/repos/sogeo/DM01AVSO24"},"payload":{"push_id":536753235,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"7777eb7c152ff9e2597103295a71bf27496e1292","before":"13bd78547455b9ed0dbe380b1c4e614bd06100b3","commits":[{"sha":"7777eb7c152ff9e2597103295a71bf27496e1292","author":{"email":"afdee6c9fc3dccec54bef9bef15ae27098932d1c@gmail.com","name":"sogeo"},"message":"Wöchentliche Datenlieferung (1 / 1 / 2015-01-01-02.04.39)","distinct":true,"url":"https://api.github.com/repos/sogeo/DM01AVSO24/commits/7777eb7c152ff9e2597103295a71bf27496e1292"}]},"public":true,"created_at":"2015-01-01T01:05:23Z"}
{"id":"2489398152","type":"CreateEvent","actor":{"id":4975721,"login":"macieknajbar","gravatar_id":"","url":"https://api.github.com/users/macieknajbar","avatar_url":"https://avatars.githubusercontent.com/u/4975721?"},"repo":{"id":28678271,"name":"macieknajbar/GYm","url":"https://api.github.com/repos/macieknajbar/GYm"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"A gym supporting application","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:05:23Z"}
{"id":"2489398153","type":"PushEvent","actor":{"id":1671640,"login":"alex6lc","gravatar_id":"","url":"https://api.github.com/users/alex6lc","avatar_url":"https://avatars.githubusercontent.com/u/1671640?"},"repo":{"id":28678262,"name":"alex6lc/material-ui-sass","url":"https://api.github.com/repos/alex6lc/material-ui-sass"},"payload":{"push_id":536753236,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"5c1c07ca7e009f91a0b0f6c953e826a7cb3f7aa8","before":"4caa9114f99ce0215e6db9ab551226d1d02aaf50","commits":[{"sha":"5c1c07ca7e009f91a0b0f6c953e826a7cb3f7aa8","author":{"email":"1154eaf5246093599e182c05c916e7a183e0e00e@gmail.com","name":"alex6lc"},"message":"Remove post install scripts","distinct":true,"url":"https://api.github.com/repos/alex6lc/material-ui-sass/commits/5c1c07ca7e009f91a0b0f6c953e826a7cb3f7aa8"}]},"public":true,"created_at":"2015-01-01T01:05:23Z"}
{"id":"2489398155","type":"IssueCommentEvent","actor":{"id":6964047,"login":"TTMTT","gravatar_id":"","url":"https://api.github.com/users/TTMTT","avatar_url":"https://avatars.githubusercontent.com/u/6964047?"},"repo":{"id":26731988,"name":"badrsony/icloudin-support-","url":"https://api.github.com/repos/badrsony/icloudin-support-"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/4","labels_url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/4/labels{/name}","comments_url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/4/comments","events_url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/4/events","html_url":"https://github.com/badrsony/icloudin-support-/issues/4","id":50920400,"number":4,"title":"icloudin support ","user":{"login":"badrsony","id":7895050,"avatar_url":"https://avatars.githubusercontent.com/u/7895050?v=3","gravatar_id":"","url":"https://api.github.com/users/badrsony","html_url":"https://github.com/badrsony","followers_url":"https://api.github.com/users/badrsony/followers","following_url":"https://api.github.com/users/badrsony/following{/other_user}","gists_url":"https://api.github.com/users/badrsony/gists{/gist_id}","starred_url":"https://api.github.com/users/badrsony/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/badrsony/subscriptions","organizations_url":"https://api.github.com/users/badrsony/orgs","repos_url":"https://api.github.com/users/badrsony/repos","events_url":"https://api.github.com/users/badrsony/events{/privacy}","received_events_url":"https://api.github.com/users/badrsony/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":997,"created_at":"2014-12-04T02:13:39Z","updated_at":"2015-01-01T01:05:23Z","closed_at":"2015-01-01T00:00:32Z","body":"Originally written by @TTMTT. 
That we hope for him safery and peace\r\n.\r\n\r\nWow, ipod touch 5G (8.1) - iCL0udin v1.0 bypass activation (icloud)\r\n\r\nhttp://youtu.be/tZmEdlDGNu4\r\n\r\niCL0udin v1.0 bypass activation (icloud) - ipad mini 2G (7.1.1)\r\n\r\nhttp://youtu.be/tevYyBN2QCQ\r\n\r\nVideo for bypass icloud (iCL0udin v1.0) for iphone 4 CDMA ..\r\n\r\nhttp://youtu.be/i85-D6N2YLk\r\n\r\nNew video for iCL0udin v1.0 bypass icloud (3 iphones 7.1.2):\r\n\r\nhttp://youtu.be/p51TNlCr7ug\r\n\r\niCL0udin v1.0 -> %98\r\n\r\nRemaining: %2 testing with some people..\r\n\r\nLast Method:\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any ios)\r\nmethod 3 : via (change some string by hex on ELF file << some times i got error)\r\nmethod 4 : via (use apple ssl cert or real ssl in server and change some string in iphone)\r\n\r\niCL0udin v1.0 have this method:\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any 
ios)"},"comment":{"url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/comments/68477335","html_url":"https://github.com/badrsony/icloudin-support-/issues/4#issuecomment-68477335","issue_url":"https://api.github.com/repos/badrsony/icloudin-support-/issues/4","id":68477335,"user":{"login":"TTMTT","id":6964047,"avatar_url":"https://avatars.githubusercontent.com/u/6964047?v=3","gravatar_id":"","url":"https://api.github.com/users/TTMTT","html_url":"https://github.com/TTMTT","followers_url":"https://api.github.com/users/TTMTT/followers","following_url":"https://api.github.com/users/TTMTT/following{/other_user}","gists_url":"https://api.github.com/users/TTMTT/gists{/gist_id}","starred_url":"https://api.github.com/users/TTMTT/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/TTMTT/subscriptions","organizations_url":"https://api.github.com/users/TTMTT/orgs","repos_url":"https://api.github.com/users/TTMTT/repos","events_url":"https://api.github.com/users/TTMTT/events{/privacy}","received_events_url":"https://api.github.com/users/TTMTT/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:05:23Z","updated_at":"2015-01-01T01:05:23Z","body":"@badrsony \r\nexcuse me i open a new discuss for (iCL0udin v1.0):\r\n--------------------------------------------------------\r\nhttps://github.com/TTMTT/iCL0udin/issues/1\r\n--------------------------------------------------------"}},"public":true,"created_at":"2015-01-01T01:05:24Z"}
{"id":"2489398158","type":"PullRequestEvent","actor":{"id":5831804,"login":"YueLinHo","gravatar_id":"","url":"https://api.github.com/users/YueLinHo","avatar_url":"https://avatars.githubusercontent.com/u/5831804?"},"repo":{"id":1197206,"name":"TortoiseGit/TortoiseGit","url":"https://api.github.com/repos/TortoiseGit/TortoiseGit"},"payload":{"action":"opened","number":151,"pull_request":{"url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/pulls/151","id":26739456,"html_url":"https://github.com/TortoiseGit/TortoiseGit/pull/151","diff_url":"https://github.com/TortoiseGit/TortoiseGit/pull/151.diff","patch_url":"https://github.com/TortoiseGit/TortoiseGit/pull/151.patch","issue_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/issues/151","number":151,"state":"open","locked":false,"title":"Refresh the status of \"Working dir changes\" of Log dialog by pressing F6","user":{"login":"YueLinHo","id":5831804,"avatar_url":"https://avatars.githubusercontent.com/u/5831804?v=3","gravatar_id":"","url":"https://api.github.com/users/YueLinHo","html_url":"https://github.com/YueLinHo","followers_url":"https://api.github.com/users/YueLinHo/followers","following_url":"https://api.github.com/users/YueLinHo/following{/other_user}","gists_url":"https://api.github.com/users/YueLinHo/gists{/gist_id}","starred_url":"https://api.github.com/users/YueLinHo/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/YueLinHo/subscriptions","organizations_url":"https://api.github.com/users/YueLinHo/orgs","repos_url":"https://api.github.com/users/YueLinHo/repos","events_url":"https://api.github.com/users/YueLinHo/events{/privacy}","received_events_url":"https://api.github.com/users/YueLinHo/received_events","type":"User","site_admin":false},"body":"@lznuaa @csware @ch3cooli \r\nHappy new year to all of you. 
^_______________^","created_at":"2015-01-01T01:05:24Z","updated_at":"2015-01-01T01:05:24Z","closed_at":null,"merged_at":null,"merge_commit_sha":null,"assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/pulls/151/commits","review_comments_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/pulls/151/comments","review_comment_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/pulls/comments/{number}","comments_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/issues/151/comments","statuses_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/statuses/a0af6070519ae3ffae329edd8e6cd1042d396fe0","head":{"label":"YueLinHo:ylh/happy_new_year_2015","ref":"ylh/happy_new_year_2015","sha":"a0af6070519ae3ffae329edd8e6cd1042d396fe0","user":{"login":"YueLinHo","id":5831804,"avatar_url":"https://avatars.githubusercontent.com/u/5831804?v=3","gravatar_id":"","url":"https://api.github.com/users/YueLinHo","html_url":"https://github.com/YueLinHo","followers_url":"https://api.github.com/users/YueLinHo/followers","following_url":"https://api.github.com/users/YueLinHo/following{/other_user}","gists_url":"https://api.github.com/users/YueLinHo/gists{/gist_id}","starred_url":"https://api.github.com/users/YueLinHo/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/YueLinHo/subscriptions","organizations_url":"https://api.github.com/users/YueLinHo/orgs","repos_url":"https://api.github.com/users/YueLinHo/repos","events_url":"https://api.github.com/users/YueLinHo/events{/privacy}","received_events_url":"https://api.github.com/users/YueLinHo/received_events","type":"User","site_admin":false},"repo":{"id":21376277,"name":"TortoiseGit","full_name":"YueLinHo/TortoiseGit","owner":{"login":"YueLinHo","id":5831804,"avatar_url":"https://avatars.githubusercontent.com/u/5831804?v=3","gravatar_id":"","url":"https://api.github.com/users/YueLinHo","html_url":"https://github.com/YueLinHo","followers_url":"https:
//api.github.com/users/YueLinHo/followers","following_url":"https://api.github.com/users/YueLinHo/following{/other_user}","gists_url":"https://api.github.com/users/YueLinHo/gists{/gist_id}","starred_url":"https://api.github.com/users/YueLinHo/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/YueLinHo/subscriptions","organizations_url":"https://api.github.com/users/YueLinHo/orgs","repos_url":"https://api.github.com/users/YueLinHo/repos","events_url":"https://api.github.com/users/YueLinHo/events{/privacy}","received_events_url":"https://api.github.com/users/YueLinHo/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/YueLinHo/TortoiseGit","description":"Windows Explorer Extension to Operate Git; Mirror of GoogleCode repository","fork":true,"url":"https://api.github.com/repos/YueLinHo/TortoiseGit","forks_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/forks","keys_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/keys{/key_id}","collaborators_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/teams","hooks_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/hooks","issue_events_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/issues/events{/number}","events_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/events","assignees_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/assignees{/user}","branches_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/branches{/branch}","tags_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/tags","blobs_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/git/refs{/sha}","trees_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/git/trees{/sha}","statuse
s_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/statuses/{sha}","languages_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/languages","stargazers_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/stargazers","contributors_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/contributors","subscribers_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/subscribers","subscription_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/subscription","commits_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/commits{/sha}","git_commits_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/git/commits{/sha}","comments_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/comments{/number}","issue_comment_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/issues/comments/{number}","contents_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/contents/{+path}","compare_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/compare/{base}...{head}","merges_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/merges","archive_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/downloads","issues_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/issues{/number}","pulls_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/pulls{/number}","milestones_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/milestones{/number}","notifications_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/labels{/name}","releases_url":"https://api.github.com/repos/YueLinHo/TortoiseGit/releases{/id}","created_at":"2014-07-01T05:31:50Z","updated_at":"2014-12-30T09:25:25Z","pushed_at":"2015-01-01T01:04:01Z","git_url":"git://github.com/YueLinHo/TortoiseGit.git","ssh_url":"git@github.com:YueLinHo/TortoiseGit.git","clone_url":"https://
github.com/YueLinHo/TortoiseGit.git","svn_url":"https://github.com/YueLinHo/TortoiseGit","homepage":"http://tortoisegit.org","size":93279,"stargazers_count":0,"watchers_count":0,"language":"C++","has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"TortoiseGit:master","ref":"master","sha":"fa7295b820be9ca368924b8129253df52c189c9d","user":{"login":"TortoiseGit","id":1103929,"avatar_url":"https://avatars.githubusercontent.com/u/1103929?v=3","gravatar_id":"","url":"https://api.github.com/users/TortoiseGit","html_url":"https://github.com/TortoiseGit","followers_url":"https://api.github.com/users/TortoiseGit/followers","following_url":"https://api.github.com/users/TortoiseGit/following{/other_user}","gists_url":"https://api.github.com/users/TortoiseGit/gists{/gist_id}","starred_url":"https://api.github.com/users/TortoiseGit/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/TortoiseGit/subscriptions","organizations_url":"https://api.github.com/users/TortoiseGit/orgs","repos_url":"https://api.github.com/users/TortoiseGit/repos","events_url":"https://api.github.com/users/TortoiseGit/events{/privacy}","received_events_url":"https://api.github.com/users/TortoiseGit/received_events","type":"Organization","site_admin":false},"repo":{"id":1197206,"name":"TortoiseGit","full_name":"TortoiseGit/TortoiseGit","owner":{"login":"TortoiseGit","id":1103929,"avatar_url":"https://avatars.githubusercontent.com/u/1103929?v=3","gravatar_id":"","url":"https://api.github.com/users/TortoiseGit","html_url":"https://github.com/TortoiseGit","followers_url":"https://api.github.com/users/TortoiseGit/followers","following_url":"https://api.github.com/users/TortoiseGit/following{/other_user}","gists_url":"https://api.github.com/users/TortoiseGit/gists{/gist_id}","starred_url":"https://api.github.com/users/TortoiseGit/sta
rred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/TortoiseGit/subscriptions","organizations_url":"https://api.github.com/users/TortoiseGit/orgs","repos_url":"https://api.github.com/users/TortoiseGit/repos","events_url":"https://api.github.com/users/TortoiseGit/events{/privacy}","received_events_url":"https://api.github.com/users/TortoiseGit/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/TortoiseGit/TortoiseGit","description":"Windows Explorer Extension to Operate Git; Mirror of GoogleCode repository","fork":false,"url":"https://api.github.com/repos/TortoiseGit/TortoiseGit","forks_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/forks","keys_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/keys{/key_id}","collaborators_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/teams","hooks_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/hooks","issue_events_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/issues/events{/number}","events_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/events","assignees_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/assignees{/user}","branches_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/branches{/branch}","tags_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/tags","blobs_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/git/refs{/sha}","trees_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/git/trees{/sha}","statuses_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/statuses/{sha}","languages_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/languages","stargazers_url"
:"https://api.github.com/repos/TortoiseGit/TortoiseGit/stargazers","contributors_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/contributors","subscribers_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/subscribers","subscription_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/subscription","commits_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/commits{/sha}","git_commits_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/git/commits{/sha}","comments_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/comments{/number}","issue_comment_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/issues/comments/{number}","contents_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/contents/{+path}","compare_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/compare/{base}...{head}","merges_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/merges","archive_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/downloads","issues_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/issues{/number}","pulls_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/pulls{/number}","milestones_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/milestones{/number}","notifications_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/labels{/name}","releases_url":"https://api.github.com/repos/TortoiseGit/TortoiseGit/releases{/id}","created_at":"2010-12-25T14:10:21Z","updated_at":"2014-12-31T05:00:09Z","pushed_at":"2014-12-31T05:00:09Z","git_url":"git://github.com/TortoiseGit/TortoiseGit.git","ssh_url":"git@github.com:TortoiseGit/TortoiseGit.git","clone_url":"https://github.com/TortoiseGit/TortoiseGit.git","svn_url":"https://github.com/TortoiseGit/TortoiseGit","homepage"
:"http://tortoisegit.org","size":111079,"stargazers_count":193,"watchers_count":193,"language":"C++","has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":80,"mirror_url":null,"open_issues_count":17,"forks":80,"open_issues":17,"watchers":193,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/TortoiseGit/TortoiseGit/pulls/151"},"html":{"href":"https://github.com/TortoiseGit/TortoiseGit/pull/151"},"issue":{"href":"https://api.github.com/repos/TortoiseGit/TortoiseGit/issues/151"},"comments":{"href":"https://api.github.com/repos/TortoiseGit/TortoiseGit/issues/151/comments"},"review_comments":{"href":"https://api.github.com/repos/TortoiseGit/TortoiseGit/pulls/151/comments"},"review_comment":{"href":"https://api.github.com/repos/TortoiseGit/TortoiseGit/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/TortoiseGit/TortoiseGit/pulls/151/commits"},"statuses":{"href":"https://api.github.com/repos/TortoiseGit/TortoiseGit/statuses/a0af6070519ae3ffae329edd8e6cd1042d396fe0"}},"merged":false,"mergeable":null,"mergeable_state":"unknown","merged_by":null,"comments":0,"review_comments":0,"commits":1,"additions":11,"deletions":1,"changed_files":4}},"public":true,"created_at":"2015-01-01T01:05:25Z","org":{"id":1103929,"login":"TortoiseGit","gravatar_id":"","url":"https://api.github.com/orgs/TortoiseGit","avatar_url":"https://avatars.githubusercontent.com/u/1103929?"}}
{"id":"2489398163","type":"PushEvent","actor":{"id":5700937,"login":"darealshinji","gravatar_id":"","url":"https://api.github.com/users/darealshinji","avatar_url":"https://avatars.githubusercontent.com/u/5700937?"},"repo":{"id":26483280,"name":"darealshinji/debian","url":"https://api.github.com/repos/darealshinji/debian"},"payload":{"push_id":536753239,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"69079504019294a505b9c248ba71186190abc0a8","before":"a0457f679a476079cb2ff0cafcff945120af4524","commits":[{"sha":"268b418c00f957794eed7a33f7e6089fb25162f2","author":{"email":"52122a01dfac1c09ea3fc6e6913df9984d0f756a@gmx.de","name":"darealshinji"},"message":"new package: editors/sublime-text-2","distinct":true,"url":"https://api.github.com/repos/darealshinji/debian/commits/268b418c00f957794eed7a33f7e6089fb25162f2"},{"sha":"69079504019294a505b9c248ba71186190abc0a8","author":{"email":"52122a01dfac1c09ea3fc6e6913df9984d0f756a@gmx.de","name":"darealshinji"},"message":"new package: editors/sublime-text-3","distinct":true,"url":"https://api.github.com/repos/darealshinji/debian/commits/69079504019294a505b9c248ba71186190abc0a8"}]},"public":true,"created_at":"2015-01-01T01:05:25Z"}
{"id":"2489398166","type":"PushEvent","actor":{"id":779660,"login":"KonstantinKo","gravatar_id":"","url":"https://api.github.com/users/KonstantinKo","avatar_url":"https://avatars.githubusercontent.com/u/779660?"},"repo":{"id":24053165,"name":"clarat-org/clarat","url":"https://api.github.com/repos/clarat-org/clarat"},"payload":{"push_id":536753242,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f4dab9dbdc4c429106c3480b9f1ad18a5c9808a0","before":"9028d94d202c91452636053bfbd2df6eef61e707","commits":[{"sha":"f4dab9dbdc4c429106c3480b9f1ad18a5c9808a0","author":{"email":"23db271f4238abbd1fb089f3166866050f7291f6@gmail.com","name":"Konstantin K"},"message":"for #58 - ajaxify report overlay (& other ajax improvements and fixes)","distinct":true,"url":"https://api.github.com/repos/clarat-org/clarat/commits/f4dab9dbdc4c429106c3480b9f1ad18a5c9808a0"}]},"public":true,"created_at":"2015-01-01T01:05:25Z","org":{"id":8734408,"login":"clarat-org","gravatar_id":"","url":"https://api.github.com/orgs/clarat-org","avatar_url":"https://avatars.githubusercontent.com/u/8734408?"}}
{"id":"2489398167","type":"PushEvent","actor":{"id":744293,"login":"aatxe","gravatar_id":"","url":"https://api.github.com/users/aatxe","avatar_url":"https://avatars.githubusercontent.com/u/744293?"},"repo":{"id":23890761,"name":"aatxe/irc","url":"https://api.github.com/repos/aatxe/irc"},"payload":{"push_id":536753243,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"a6146bc1357831d76833acf7e0c9d56f55f376c7","before":"202748e7a91a52c2ea0afd033dfd6fe7291c98b7","commits":[{"sha":"a6146bc1357831d76833acf7e0c9d56f55f376c7","author":{"email":"2a84587e183d6a81cbf0d140ef37a969d7915794@gmail.com","name":"Aaron Weiss"},"message":"Clean up after #11, including unit tests.","distinct":true,"url":"https://api.github.com/repos/aatxe/irc/commits/a6146bc1357831d76833acf7e0c9d56f55f376c7"}]},"public":true,"created_at":"2015-01-01T01:05:25Z"}
{"id":"2489398168","type":"PushEvent","actor":{"id":4379694,"login":"moongato","gravatar_id":"","url":"https://api.github.com/users/moongato","avatar_url":"https://avatars.githubusercontent.com/u/4379694?"},"repo":{"id":11769015,"name":"moongato/android_frameworks_base","url":"https://api.github.com/repos/moongato/android_frameworks_base"},"payload":{"push_id":536753244,"size":6,"distinct_size":1,"ref":"refs/heads/lp50x-test","head":"af8fdeaf0cba8a8c0837cdf76121e5e1c3efec34","before":"73c3f8da9962437774cec8442e0da8d431c28fa8","commits":[{"sha":"09ed328c580340d67492f81d855f8e2fe5834bd1","author":{"email":"97bd659605de2dc1baed2f2e8ef4e483c88d27f8@gmail.com","name":"Austin T. Conn"},"message":"volume rocker music controls","distinct":false,"url":"https://api.github.com/repos/moongato/android_frameworks_base/commits/09ed328c580340d67492f81d855f8e2fe5834bd1"},{"sha":"b3c8f58fb81a604be3f1fd2913e005afe300e296","author":{"email":"9defb1d2166fe02be9724618510318ef57e74e91@gmail.com","name":"Michael Bestas"},"message":"Fix volume rocker music controls and wake up\n\n- Forward port code from cm-11.0 and adjust for 5.0\n- Fix not being able to adjust volume when music control is on\n- Disable screen off volume/music control when wake key is enabled","distinct":false,"url":"https://api.github.com/repos/moongato/android_frameworks_base/commits/b3c8f58fb81a604be3f1fd2913e005afe300e296"},{"sha":"8040e4188be23da640d89fc829e33651826a48c0","author":{"email":"238a1843d81dd7fbe80b5c1b99515c4ba8c94d0d@cyngn.com","name":"Roman Birg"},"message":"status bar: improve brightness slider behavior\n\nMimic the brightness slider behavior in the statusbar.\nThis adds logic to make the statusbar slider also work with automatic brightness mode enabled and it will instead adjust the temporary automatic brightness 
overrride.","distinct":false,"url":"https://api.github.com/repos/moongato/android_frameworks_base/commits/8040e4188be23da640d89fc829e33651826a48c0"},{"sha":"58cadbda6cf16389eb849e5d9ed39eafb352d18a","author":{"email":"419b20914ad8ee7cdbbc7674d01c492d53cd267e@gmail.com","name":"Pawit Pornkitprasan"},"message":"status bar brightness: store value as int\n\nNon-automatic brightness value is stored as int, not float.\n\nSymptom: adjust the brightness in the status bar, the brightness slider in the notification bar will always be set to full","distinct":false,"url":"https://api.github.com/repos/moongato/android_frameworks_base/commits/58cadbda6cf16389eb849e5d9ed39eafb352d18a"},{"sha":"e0fb35b9ed52d05ce74b1c1833e20af6cd649f3c","author":{"email":"1e520a49e026effdcbd6ab603708edecd93fc284@gmail.com","name":"Clyde Tan"},"message":"Keep quiet when volume keys are used to wake up device\n\n- Userspace will make a 'beep' with it receives a key up, so  consume that event as well.\n- Removed wake key check in music control code as it will already be disabled here.","distinct":false,"url":"https://api.github.com/repos/moongato/android_frameworks_base/commits/e0fb35b9ed52d05ce74b1c1833e20af6cd649f3c"},{"sha":"af8fdeaf0cba8a8c0837cdf76121e5e1c3efec34","author":{"email":"22e0f38e0fc64da9129ff9b9ef030b39415294a1@ubuntu","name":"moongato"},"message":"Merge remote-tracking branch 'upstream/lollipop-ras-mr1' into lp50x-test","distinct":true,"url":"https://api.github.com/repos/moongato/android_frameworks_base/commits/af8fdeaf0cba8a8c0837cdf76121e5e1c3efec34"}]},"public":true,"created_at":"2015-01-01T01:05:25Z"}
{"id":"2489398175","type":"IssuesEvent","actor":{"id":1217681,"login":"stoeffel","gravatar_id":"","url":"https://api.github.com/users/stoeffel","avatar_url":"https://avatars.githubusercontent.com/u/1217681?"},"repo":{"id":800115,"name":"epeli/underscore.string","url":"https://api.github.com/repos/epeli/underscore.string"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/epeli/underscore.string/issues/306","labels_url":"https://api.github.com/repos/epeli/underscore.string/issues/306/labels{/name}","comments_url":"https://api.github.com/repos/epeli/underscore.string/issues/306/comments","events_url":"https://api.github.com/repos/epeli/underscore.string/issues/306/events","html_url":"https://github.com/epeli/underscore.string/issues/306","id":41565393,"number":306,"title":"._camelize('Sample Text') returning \"SampleText\", not \"sampleText\"","user":{"login":"joshuahiggins","id":879413,"avatar_url":"https://avatars.githubusercontent.com/u/879413?v=3","gravatar_id":"","url":"https://api.github.com/users/joshuahiggins","html_url":"https://github.com/joshuahiggins","followers_url":"https://api.github.com/users/joshuahiggins/followers","following_url":"https://api.github.com/users/joshuahiggins/following{/other_user}","gists_url":"https://api.github.com/users/joshuahiggins/gists{/gist_id}","starred_url":"https://api.github.com/users/joshuahiggins/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/joshuahiggins/subscriptions","organizations_url":"https://api.github.com/users/joshuahiggins/orgs","repos_url":"https://api.github.com/users/joshuahiggins/repos","events_url":"https://api.github.com/users/joshuahiggins/events{/privacy}","received_events_url":"https://api.github.com/users/joshuahiggins/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":{"login":"stoeffel","id":1217681,"avatar_url":"https://avatars.githubusercontent.com/u/1217681?v=3","gravatar_id":"","url":"https
://api.github.com/users/stoeffel","html_url":"https://github.com/stoeffel","followers_url":"https://api.github.com/users/stoeffel/followers","following_url":"https://api.github.com/users/stoeffel/following{/other_user}","gists_url":"https://api.github.com/users/stoeffel/gists{/gist_id}","starred_url":"https://api.github.com/users/stoeffel/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/stoeffel/subscriptions","organizations_url":"https://api.github.com/users/stoeffel/orgs","repos_url":"https://api.github.com/users/stoeffel/repos","events_url":"https://api.github.com/users/stoeffel/events{/privacy}","received_events_url":"https://api.github.com/users/stoeffel/received_events","type":"User","site_admin":false},"milestone":{"url":"https://api.github.com/repos/epeli/underscore.string/milestones/1","labels_url":"https://api.github.com/repos/epeli/underscore.string/milestones/1/labels","id":905496,"number":1,"title":"3.0","description":"CommonJS modularization","creator":{"login":"epeli","id":225712,"avatar_url":"https://avatars.githubusercontent.com/u/225712?v=3","gravatar_id":"","url":"https://api.github.com/users/epeli","html_url":"https://github.com/epeli","followers_url":"https://api.github.com/users/epeli/followers","following_url":"https://api.github.com/users/epeli/following{/other_user}","gists_url":"https://api.github.com/users/epeli/gists{/gist_id}","starred_url":"https://api.github.com/users/epeli/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/epeli/subscriptions","organizations_url":"https://api.github.com/users/epeli/orgs","repos_url":"https://api.github.com/users/epeli/repos","events_url":"https://api.github.com/users/epeli/events{/privacy}","received_events_url":"https://api.github.com/users/epeli/received_events","type":"User","site_admin":false},"open_issues":4,"closed_issues":12,"state":"open","created_at":"2014-12-16T12:21:34Z","updated_at":"2015-01-01T01:05:25Z","due_on":null,"closed_at":null},"comm
ents":11,"created_at":"2014-08-30T15:24:38Z","updated_at":"2015-01-01T01:05:25Z","closed_at":"2015-01-01T01:05:25Z","body":"The documentation is confusing, as it indicates the following (emphasis added):\r\n\r\n> Converts underscored or dasherized string to a camelized one. **Begins with a lower case letter** unless it starts with an underscore or **string**\r\n\r\nThe example that follows shows a dash utilized to prompt a lowercase letter, which is neither an underscore nor a string. Should the documentation read as `underscore or dash`? It wouldn't make sense that it starts with a lower case letter unless it starts with a string.\r\n\r\nCamelizing the phrase \"Sample Text\" should return \"sampleText\", not \"SampleText\". "}},"public":true,"created_at":"2015-01-01T01:05:26Z"}
{"id":"2489398176","type":"PullRequestEvent","actor":{"id":1217681,"login":"stoeffel","gravatar_id":"","url":"https://api.github.com/users/stoeffel","avatar_url":"https://avatars.githubusercontent.com/u/1217681?"},"repo":{"id":800115,"name":"epeli/underscore.string","url":"https://api.github.com/repos/epeli/underscore.string"},"payload":{"action":"closed","number":370,"pull_request":{"url":"https://api.github.com/repos/epeli/underscore.string/pulls/370","id":26636766,"html_url":"https://github.com/epeli/underscore.string/pull/370","diff_url":"https://github.com/epeli/underscore.string/pull/370.diff","patch_url":"https://github.com/epeli/underscore.string/pull/370.patch","issue_url":"https://api.github.com/repos/epeli/underscore.string/issues/370","number":370,"state":"closed","locked":false,"title":"add force lowercase flag to camelize","user":{"login":"stoeffel","id":1217681,"avatar_url":"https://avatars.githubusercontent.com/u/1217681?v=3","gravatar_id":"","url":"https://api.github.com/users/stoeffel","html_url":"https://github.com/stoeffel","followers_url":"https://api.github.com/users/stoeffel/followers","following_url":"https://api.github.com/users/stoeffel/following{/other_user}","gists_url":"https://api.github.com/users/stoeffel/gists{/gist_id}","starred_url":"https://api.github.com/users/stoeffel/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/stoeffel/subscriptions","organizations_url":"https://api.github.com/users/stoeffel/orgs","repos_url":"https://api.github.com/users/stoeffel/repos","events_url":"https://api.github.com/users/stoeffel/events{/privacy}","received_events_url":"https://api.github.com/users/stoeffel/received_events","type":"User","site_admin":false},"body":"- add tests for capitalization of the first letter\r\n- add alias camelback for camelize(str, true)\r\n- add alias camelcase (analoge ruby)\r\n- merge duplicate test suite for camelize\r\n\r\ncloses 
#306","created_at":"2014-12-29T09:15:54Z","updated_at":"2015-01-01T01:05:26Z","closed_at":"2015-01-01T01:05:26Z","merged_at":"2015-01-01T01:05:25Z","merge_commit_sha":"e5ccfbf9637aa84e69ccc2ba26a53170de0cdac6","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/epeli/underscore.string/pulls/370/commits","review_comments_url":"https://api.github.com/repos/epeli/underscore.string/pulls/370/comments","review_comment_url":"https://api.github.com/repos/epeli/underscore.string/pulls/comments/{number}","comments_url":"https://api.github.com/repos/epeli/underscore.string/issues/370/comments","statuses_url":"https://api.github.com/repos/epeli/underscore.string/statuses/9fa0bbce075f82af8a7cd96abac4a6a1ae718611","head":{"label":"epeli:camelize-force-lowercase","ref":"camelize-force-lowercase","sha":"9fa0bbce075f82af8a7cd96abac4a6a1ae718611","user":{"login":"epeli","id":225712,"avatar_url":"https://avatars.githubusercontent.com/u/225712?v=3","gravatar_id":"","url":"https://api.github.com/users/epeli","html_url":"https://github.com/epeli","followers_url":"https://api.github.com/users/epeli/followers","following_url":"https://api.github.com/users/epeli/following{/other_user}","gists_url":"https://api.github.com/users/epeli/gists{/gist_id}","starred_url":"https://api.github.com/users/epeli/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/epeli/subscriptions","organizations_url":"https://api.github.com/users/epeli/orgs","repos_url":"https://api.github.com/users/epeli/repos","events_url":"https://api.github.com/users/epeli/events{/privacy}","received_events_url":"https://api.github.com/users/epeli/received_events","type":"User","site_admin":false},"repo":{"id":800115,"name":"underscore.string","full_name":"epeli/underscore.string","owner":{"login":"epeli","id":225712,"avatar_url":"https://avatars.githubusercontent.com/u/225712?v=3","gravatar_id":"","url":"https://api.github.com/users/epeli","html_url":"https://github.com/epeli","foll
owers_url":"https://api.github.com/users/epeli/followers","following_url":"https://api.github.com/users/epeli/following{/other_user}","gists_url":"https://api.github.com/users/epeli/gists{/gist_id}","starred_url":"https://api.github.com/users/epeli/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/epeli/subscriptions","organizations_url":"https://api.github.com/users/epeli/orgs","repos_url":"https://api.github.com/users/epeli/repos","events_url":"https://api.github.com/users/epeli/events{/privacy}","received_events_url":"https://api.github.com/users/epeli/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/epeli/underscore.string","description":"String manipulation helpers for javascript","fork":false,"url":"https://api.github.com/repos/epeli/underscore.string","forks_url":"https://api.github.com/repos/epeli/underscore.string/forks","keys_url":"https://api.github.com/repos/epeli/underscore.string/keys{/key_id}","collaborators_url":"https://api.github.com/repos/epeli/underscore.string/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/epeli/underscore.string/teams","hooks_url":"https://api.github.com/repos/epeli/underscore.string/hooks","issue_events_url":"https://api.github.com/repos/epeli/underscore.string/issues/events{/number}","events_url":"https://api.github.com/repos/epeli/underscore.string/events","assignees_url":"https://api.github.com/repos/epeli/underscore.string/assignees{/user}","branches_url":"https://api.github.com/repos/epeli/underscore.string/branches{/branch}","tags_url":"https://api.github.com/repos/epeli/underscore.string/tags","blobs_url":"https://api.github.com/repos/epeli/underscore.string/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/epeli/underscore.string/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/epeli/underscore.string/git/refs{/sha}","trees_url":"https://api.github.com/repos/epeli/underscore.string/git/trees{/sha}",
"statuses_url":"https://api.github.com/repos/epeli/underscore.string/statuses/{sha}","languages_url":"https://api.github.com/repos/epeli/underscore.string/languages","stargazers_url":"https://api.github.com/repos/epeli/underscore.string/stargazers","contributors_url":"https://api.github.com/repos/epeli/underscore.string/contributors","subscribers_url":"https://api.github.com/repos/epeli/underscore.string/subscribers","subscription_url":"https://api.github.com/repos/epeli/underscore.string/subscription","commits_url":"https://api.github.com/repos/epeli/underscore.string/commits{/sha}","git_commits_url":"https://api.github.com/repos/epeli/underscore.string/git/commits{/sha}","comments_url":"https://api.github.com/repos/epeli/underscore.string/comments{/number}","issue_comment_url":"https://api.github.com/repos/epeli/underscore.string/issues/comments/{number}","contents_url":"https://api.github.com/repos/epeli/underscore.string/contents/{+path}","compare_url":"https://api.github.com/repos/epeli/underscore.string/compare/{base}...{head}","merges_url":"https://api.github.com/repos/epeli/underscore.string/merges","archive_url":"https://api.github.com/repos/epeli/underscore.string/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/epeli/underscore.string/downloads","issues_url":"https://api.github.com/repos/epeli/underscore.string/issues{/number}","pulls_url":"https://api.github.com/repos/epeli/underscore.string/pulls{/number}","milestones_url":"https://api.github.com/repos/epeli/underscore.string/milestones{/number}","notifications_url":"https://api.github.com/repos/epeli/underscore.string/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/epeli/underscore.string/labels{/name}","releases_url":"https://api.github.com/repos/epeli/underscore.string/releases{/id}","created_at":"2010-07-27T08:01:42Z","updated_at":"2014-12-31T03:37:22Z","pushed_at":"2015-01-01T01:05:25Z","git_url":"git://github.com/epeli/underscore.string.git"
,"ssh_url":"git@github.com:epeli/underscore.string.git","clone_url":"https://github.com/epeli/underscore.string.git","svn_url":"https://github.com/epeli/underscore.string","homepage":"http://epeli.github.com/underscore.string/","size":5116,"stargazers_count":2443,"watchers_count":2443,"language":"JavaScript","has_issues":true,"has_downloads":true,"has_wiki":false,"has_pages":true,"forks_count":307,"mirror_url":null,"open_issues_count":102,"forks":307,"open_issues":102,"watchers":2443,"default_branch":"master"}},"base":{"label":"epeli:master","ref":"master","sha":"244b1724770947430793dc43fb96d610dd045c47","user":{"login":"epeli","id":225712,"avatar_url":"https://avatars.githubusercontent.com/u/225712?v=3","gravatar_id":"","url":"https://api.github.com/users/epeli","html_url":"https://github.com/epeli","followers_url":"https://api.github.com/users/epeli/followers","following_url":"https://api.github.com/users/epeli/following{/other_user}","gists_url":"https://api.github.com/users/epeli/gists{/gist_id}","starred_url":"https://api.github.com/users/epeli/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/epeli/subscriptions","organizations_url":"https://api.github.com/users/epeli/orgs","repos_url":"https://api.github.com/users/epeli/repos","events_url":"https://api.github.com/users/epeli/events{/privacy}","received_events_url":"https://api.github.com/users/epeli/received_events","type":"User","site_admin":false},"repo":{"id":800115,"name":"underscore.string","full_name":"epeli/underscore.string","owner":{"login":"epeli","id":225712,"avatar_url":"https://avatars.githubusercontent.com/u/225712?v=3","gravatar_id":"","url":"https://api.github.com/users/epeli","html_url":"https://github.com/epeli","followers_url":"https://api.github.com/users/epeli/followers","following_url":"https://api.github.com/users/epeli/following{/other_user}","gists_url":"https://api.github.com/users/epeli/gists{/gist_id}","starred_url":"https://api.github.com/users/epeli/starre
d{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/epeli/subscriptions","organizations_url":"https://api.github.com/users/epeli/orgs","repos_url":"https://api.github.com/users/epeli/repos","events_url":"https://api.github.com/users/epeli/events{/privacy}","received_events_url":"https://api.github.com/users/epeli/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/epeli/underscore.string","description":"String manipulation helpers for javascript","fork":false,"url":"https://api.github.com/repos/epeli/underscore.string","forks_url":"https://api.github.com/repos/epeli/underscore.string/forks","keys_url":"https://api.github.com/repos/epeli/underscore.string/keys{/key_id}","collaborators_url":"https://api.github.com/repos/epeli/underscore.string/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/epeli/underscore.string/teams","hooks_url":"https://api.github.com/repos/epeli/underscore.string/hooks","issue_events_url":"https://api.github.com/repos/epeli/underscore.string/issues/events{/number}","events_url":"https://api.github.com/repos/epeli/underscore.string/events","assignees_url":"https://api.github.com/repos/epeli/underscore.string/assignees{/user}","branches_url":"https://api.github.com/repos/epeli/underscore.string/branches{/branch}","tags_url":"https://api.github.com/repos/epeli/underscore.string/tags","blobs_url":"https://api.github.com/repos/epeli/underscore.string/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/epeli/underscore.string/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/epeli/underscore.string/git/refs{/sha}","trees_url":"https://api.github.com/repos/epeli/underscore.string/git/trees{/sha}","statuses_url":"https://api.github.com/repos/epeli/underscore.string/statuses/{sha}","languages_url":"https://api.github.com/repos/epeli/underscore.string/languages","stargazers_url":"https://api.github.com/repos/epeli/underscore.string/stargazers","contr
ibutors_url":"https://api.github.com/repos/epeli/underscore.string/contributors","subscribers_url":"https://api.github.com/repos/epeli/underscore.string/subscribers","subscription_url":"https://api.github.com/repos/epeli/underscore.string/subscription","commits_url":"https://api.github.com/repos/epeli/underscore.string/commits{/sha}","git_commits_url":"https://api.github.com/repos/epeli/underscore.string/git/commits{/sha}","comments_url":"https://api.github.com/repos/epeli/underscore.string/comments{/number}","issue_comment_url":"https://api.github.com/repos/epeli/underscore.string/issues/comments/{number}","contents_url":"https://api.github.com/repos/epeli/underscore.string/contents/{+path}","compare_url":"https://api.github.com/repos/epeli/underscore.string/compare/{base}...{head}","merges_url":"https://api.github.com/repos/epeli/underscore.string/merges","archive_url":"https://api.github.com/repos/epeli/underscore.string/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/epeli/underscore.string/downloads","issues_url":"https://api.github.com/repos/epeli/underscore.string/issues{/number}","pulls_url":"https://api.github.com/repos/epeli/underscore.string/pulls{/number}","milestones_url":"https://api.github.com/repos/epeli/underscore.string/milestones{/number}","notifications_url":"https://api.github.com/repos/epeli/underscore.string/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/epeli/underscore.string/labels{/name}","releases_url":"https://api.github.com/repos/epeli/underscore.string/releases{/id}","created_at":"2010-07-27T08:01:42Z","updated_at":"2014-12-31T03:37:22Z","pushed_at":"2015-01-01T01:05:25Z","git_url":"git://github.com/epeli/underscore.string.git","ssh_url":"git@github.com:epeli/underscore.string.git","clone_url":"https://github.com/epeli/underscore.string.git","svn_url":"https://github.com/epeli/underscore.string","homepage":"http://epeli.github.com/underscore.string/","size":5116,"stargazers_cou
nt":2443,"watchers_count":2443,"language":"JavaScript","has_issues":true,"has_downloads":true,"has_wiki":false,"has_pages":true,"forks_count":307,"mirror_url":null,"open_issues_count":102,"forks":307,"open_issues":102,"watchers":2443,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/epeli/underscore.string/pulls/370"},"html":{"href":"https://github.com/epeli/underscore.string/pull/370"},"issue":{"href":"https://api.github.com/repos/epeli/underscore.string/issues/370"},"comments":{"href":"https://api.github.com/repos/epeli/underscore.string/issues/370/comments"},"review_comments":{"href":"https://api.github.com/repos/epeli/underscore.string/pulls/370/comments"},"review_comment":{"href":"https://api.github.com/repos/epeli/underscore.string/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/epeli/underscore.string/pulls/370/commits"},"statuses":{"href":"https://api.github.com/repos/epeli/underscore.string/statuses/9fa0bbce075f82af8a7cd96abac4a6a1ae718611"}},"merged":true,"mergeable":null,"mergeable_state":"unknown","merged_by":{"login":"stoeffel","id":1217681,"avatar_url":"https://avatars.githubusercontent.com/u/1217681?v=3","gravatar_id":"","url":"https://api.github.com/users/stoeffel","html_url":"https://github.com/stoeffel","followers_url":"https://api.github.com/users/stoeffel/followers","following_url":"https://api.github.com/users/stoeffel/following{/other_user}","gists_url":"https://api.github.com/users/stoeffel/gists{/gist_id}","starred_url":"https://api.github.com/users/stoeffel/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/stoeffel/subscriptions","organizations_url":"https://api.github.com/users/stoeffel/orgs","repos_url":"https://api.github.com/users/stoeffel/repos","events_url":"https://api.github.com/users/stoeffel/events{/privacy}","received_events_url":"https://api.github.com/users/stoeffel/received_events","type":"User","site_admin":false},"comments":9,"review_comments":
0,"commits":1,"additions":55,"deletions":32,"changed_files":4}},"public":true,"created_at":"2015-01-01T01:05:26Z"}
{"id":"2489398183","type":"PushEvent","actor":{"id":745333,"login":"mkeeter","gravatar_id":"","url":"https://api.github.com/users/mkeeter","avatar_url":"https://avatars.githubusercontent.com/u/745333?"},"repo":{"id":15458279,"name":"mkeeter/antimony","url":"https://api.github.com/repos/mkeeter/antimony"},"payload":{"push_id":536753246,"size":3,"distinct_size":3,"ref":"refs/heads/master","head":"af931f7902c93ac10b7f8c5f4bd24130448792da","before":"63294530fca3218ef2e545af86172024100fac7f","commits":[{"sha":"f466d66f8f5e3d3258cfa456221f0d296cb5519d","author":{"email":"b96049b2cf1cc4f51fb34d3c0383273ec5d20919@gmail.com","name":"Matt Keeter"},"message":"Prevent DummyControl from blocking everything behind it","distinct":true,"url":"https://api.github.com/repos/mkeeter/antimony/commits/f466d66f8f5e3d3258cfa456221f0d296cb5519d"},{"sha":"e8c74daafe41860bac6b63829e7488e94e951794","author":{"email":"b96049b2cf1cc4f51fb34d3c0383273ec5d20919@gmail.com","name":"Matt Keeter"},"message":"Make ControlProxies hierarchical (matching Controls)\n\nThis is nice because it makes the raise dialog only find one\nControlProxy when you right-click on something like a triangle's corner\n(where the line and corner point overlap)","distinct":true,"url":"https://api.github.com/repos/mkeeter/antimony/commits/e8c74daafe41860bac6b63829e7488e94e951794"},{"sha":"af931f7902c93ac10b7f8c5f4bd24130448792da","author":{"email":"b96049b2cf1cc4f51fb34d3c0383273ec5d20919@gmail.com","name":"Matt Keeter"},"message":"Only open raise menu if more than one control are overlapping","distinct":true,"url":"https://api.github.com/repos/mkeeter/antimony/commits/af931f7902c93ac10b7f8c5f4bd24130448792da"}]},"public":true,"created_at":"2015-01-01T01:05:26Z"}
{"id":"2489398189","type":"PullRequestReviewCommentEvent","actor":{"id":523287,"login":"j2sol","gravatar_id":"","url":"https://api.github.com/users/j2sol","avatar_url":"https://avatars.githubusercontent.com/u/523287?"},"repo":{"id":11848896,"name":"blueboxgroup/ursula","url":"https://api.github.com/repos/blueboxgroup/ursula"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397291","id":22397291,"diff_hunk":"@@ -1,121 +1,92 @@\n ---\n-- name: install apache\n-  apt: pkg={{ item }}\n-  with_items:\n-    - apache2\n-    - libapache2-mod-wsgi\n-\n - name: lesscpy must be in apache PATH\n   pip: name=lesscpy version=0.9j\n \n - name: get horizon source repo\n-  git: repo={{ openstack.git_mirror }}/horizon.git\n-       dest=/opt/stack/horizon\n-       version={{ horizon.rev }}\n-       update={{ openstack.git_update }}\n+  git: |\n+    repo={{ openstack.git_mirror}}/horizon.git\n+    dest=/opt/stack/horizon\n+    version={{ horizon.rev }}\n+    update={{ openstack.git_update }}\n   notify:\n     - setup horizon venv\n     - compress horizon assets\n \n-- template: src=opt/stack/horizon/hide-external-networks.patch dest=/opt/stack/horizon/hide-external-networks.patch mode=0644\n-- shell: patch -p1 < hide-external-networks.patch chdir=/opt/stack/horizon\n-  notify:\n-    - setup horizon venv\n-\n - name: add python-memcached to horizon requirements\n-  lineinfile: dest=/opt/stack/horizon/requirements.txt\n-              regexp=^python-memcached\n-              line=python-memcached\n+  lineinfile: dest=/opt/stack/horizon/requirements.txt regexp=^python-memcached line=python-memcached\n   notify:\n     - setup horizon venv\n \n-- name: disable apache status\n-  command: a2dismod status\n-  notify:\n-    - restart apache\n-\n-- name: apache ports config\n-  template: src=etc/apache2/ports.conf\n-            dest=/etc/apache2/ports.conf\n-  notify:\n-    - restart apache\n-\n-- name: disable default apache 
site\n-  command: a2dissite 000-default\n+- name: make sure apache knows about horizon ports\n+  lineinfile: dest=/etc/apache2/ports.conf line=\"Listen 8080\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config (12.04)\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard\n+- name: create dashboard virtualhost on precise\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard\n   when: ansible_distribution_version == \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard.conf\n+- name: create dashboard virtualhost on other\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard.conf\n   when: ansible_distribution_version != \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n - name: enable horizon apache site\n-  command: a2ensite openstack_dashboard\n+  apache2_site: state=enabled name=openstack_dashboard\n   notify:\n-    - restart apache\n-\n-- name: static asset directories\n-  file: dest={{ item }}\n-        state=directory\n-        owner=www-data\n-        group=www-data\n-        mode=0755\n+    - reload apache\n+\n+- name: create static asset dirs\n+  file: |\n+    dest={{ item }}\n+    state=directory\n+    owner=www-data\n+    group=www-data\n+    mode=0755\n   with_items:\n     - /opt/stack/horizon/static\n     - /opt/stack/horizon/static/dashboard\n \n-- name: horizon local settings\n-  template: src=opt/stack/horizon/openstack_dashboard/local/local_settings.py\n-            dest=/opt/stack/horizon/openstack_dashboard/local/local_settings.py\n-            
mode=0644\n+- name: dashboard settings\n+  template: |\n+    src=opt/stack/horizon/openstack_dashboard/local/local_settings.py\n+    dest=/opt/stack/horizon/openstack_dashboard/local/local_settings.py\n+    mode=0644\n   notify:\n-    - restart apache\n+    - reload apache\n \n - name: custom horizon logo\n-  get_url: url={{ horizon.logo_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo.png\n-           mode=0644 force=yes\n+  get_url: url={{ horizon.logo_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo.png mode=0644 force=yes\n \n - name: custom horizon splash logo\n-  get_url: url={{ horizon.logo_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo-splash.png\n-           mode=0644 force=yes\n+  get_url: url={{ horizon.logo_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo-splash.png mode=0644 force=yes\n \n - name: custom horizon favicon\n-  get_url: url={{ horizon.favicon_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/favicon.ico\n-           force=yes\n+  get_url: url={{ horizon.favicon_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/favicon.ico 
force=yes","path":"roles/horizon/tasks/main.yml","position":135,"original_position":135,"commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","original_commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"j2sol","id":523287,"avatar_url":"https://avatars.githubusercontent.com/u/523287?v=3","gravatar_id":"","url":"https://api.github.com/users/j2sol","html_url":"https://github.com/j2sol","followers_url":"https://api.github.com/users/j2sol/followers","following_url":"https://api.github.com/users/j2sol/following{/other_user}","gists_url":"https://api.github.com/users/j2sol/gists{/gist_id}","starred_url":"https://api.github.com/users/j2sol/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/j2sol/subscriptions","organizations_url":"https://api.github.com/users/j2sol/orgs","repos_url":"https://api.github.com/users/j2sol/repos","events_url":"https://api.github.com/users/j2sol/events{/privacy}","received_events_url":"https://api.github.com/users/j2sol/received_events","type":"User","site_admin":false},"body":"Same for the other two get_urls 
above.","created_at":"2015-01-01T01:05:27Z","updated_at":"2015-01-01T01:05:27Z","html_url":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397291","pull_request_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397291"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397291"},"pull_request":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"}}},"pull_request":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","id":26738851,"html_url":"https://github.com/blueboxgroup/ursula/pull/705","diff_url":"https://github.com/blueboxgroup/ursula/pull/705.diff","patch_url":"https://github.com/blueboxgroup/ursula/pull/705.patch","issue_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705","number":705,"state":"open","locked":false,"title":"WIP:  apache for loadbalancing","user":{"login":"paulczar","id":2488346,"avatar_url":"https://avatars.githubusercontent.com/u/2488346?v=3","gravatar_id":"","url":"https://api.github.com/users/paulczar","html_url":"https://github.com/paulczar","followers_url":"https://api.github.com/users/paulczar/followers","following_url":"https://api.github.com/users/paulczar/following{/other_user}","gists_url":"https://api.github.com/users/paulczar/gists{/gist_id}","starred_url":"https://api.github.com/users/paulczar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/paulczar/subscriptions","organizations_url":"https://api.github.com/users/paulczar/orgs","repos_url":"https://api.github.com/users/paulczar/repos","events_url":"https://api.github.com/users/paulczar/events{/privacy}","received_events_url":"https://api.github.com/users/paulczar/received_events","type":"User","site_admin":false},"body":"This is a quick POC / WIP to demo using apache instead of haproxy for loadbalancing our APIs.\r\n\r\nI think this gives us more flexibiltiy as 
we can enable in the APIs role itself ( in this case in keystone ) rather than a big monolithic haproxy.conf.      We also already have apache running for horizon, so it could reduce number of services.    apache also has better logging options that haproxy which can only log to syslog. ","created_at":"2015-01-01T00:04:13Z","updated_at":"2015-01-01T01:05:27Z","closed_at":null,"merged_at":null,"merge_commit_sha":"9b91693f11e166c9ee53836f19697868d412bf76","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits","review_comments_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments","review_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f","head":{"label":"blueboxgroup:use_apache_for_lb","ref":"use_apache_for_lb","sha":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization
","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating 
OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/commen
ts/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"base":{"label":"blueboxgroup:master","ref":"master","sha":"34b83c65ff0de2f8b006d8ce4f76919fe0167bbf","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/fo
llowing{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating 
OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/commen
ts/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705"},"issue":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705"},"comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments"},"review_comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments"},"review_comment":{"href":"https://
api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits"},"statuses":{"href":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f"}}}},"public":true,"created_at":"2015-01-01T01:05:27Z","org":{"id":458705,"login":"blueboxgroup","gravatar_id":"","url":"https://api.github.com/orgs/blueboxgroup","avatar_url":"https://avatars.githubusercontent.com/u/458705?"}}
{"id":"2489398191","type":"PushEvent","actor":{"id":7483224,"login":"seann1","gravatar_id":"","url":"https://api.github.com/users/seann1","avatar_url":"https://avatars.githubusercontent.com/u/7483224?"},"repo":{"id":28437213,"name":"seann1/twitterapi-rails","url":"https://api.github.com/repos/seann1/twitterapi-rails"},"payload":{"push_id":536753252,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"9f6d2ffe96a98af38f87ef905762e43893a8c461","before":"7a83e390ab1d5cb5b00d4136c8e01b0e81ae49f9","commits":[{"sha":"9f6d2ffe96a98af38f87ef905762e43893a8c461","author":{"email":"3cea802b5add67a11ab310afda68113858c6259a@gmail.com","name":"Sean"},"message":"dynamically creating bubble divs","distinct":true,"url":"https://api.github.com/repos/seann1/twitterapi-rails/commits/9f6d2ffe96a98af38f87ef905762e43893a8c461"}]},"public":true,"created_at":"2015-01-01T01:05:27Z"}
{"id":"2489398192","type":"GollumEvent","actor":{"id":10245688,"login":"SunyataZero","gravatar_id":"","url":"https://api.github.com/users/SunyataZero","avatar_url":"https://avatars.githubusercontent.com/u/10245688?"},"repo":{"id":28485643,"name":"EmpathyApp/EmpathyApp","url":"https://api.github.com/repos/EmpathyApp/EmpathyApp"},"payload":{"pages":[{"page_name":"Design-tools","title":"Design tools","summary":null,"action":"created","sha":"b8d60e0fc553722c073232af866539a4766571a6","html_url":"https://github.com/EmpathyApp/EmpathyApp/wiki/Design-tools"}]},"public":true,"created_at":"2015-01-01T01:05:27Z","org":{"id":10245750,"login":"EmpathyApp","gravatar_id":"","url":"https://api.github.com/orgs/EmpathyApp","avatar_url":"https://avatars.githubusercontent.com/u/10245750?"}}
{"id":"2489398196","type":"PushEvent","actor":{"id":172753,"login":"oehmiche","gravatar_id":"","url":"https://api.github.com/users/oehmiche","avatar_url":"https://avatars.githubusercontent.com/u/172753?"},"repo":{"id":26650146,"name":"oehmiche/isp-performance","url":"https://api.github.com/repos/oehmiche/isp-performance"},"payload":{"push_id":536753253,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"7cfa6900cc30482ca7d8b579f45af6d8ec90e117","before":"ce82142429c758277343abf359a05a410186264d","commits":[{"sha":"7cfa6900cc30482ca7d8b579f45af6d8ec90e117","author":{"email":"37955833ebc42115603c87ad993837f95227dc9d@raspberry.pi","name":"smokeping.script"},"message":"updates all charts","distinct":true,"url":"https://api.github.com/repos/oehmiche/isp-performance/commits/7cfa6900cc30482ca7d8b579f45af6d8ec90e117"}]},"public":true,"created_at":"2015-01-01T01:05:28Z"}
{"id":"2489398198","type":"PushEvent","actor":{"id":1217681,"login":"stoeffel","gravatar_id":"","url":"https://api.github.com/users/stoeffel","avatar_url":"https://avatars.githubusercontent.com/u/1217681?"},"repo":{"id":800115,"name":"epeli/underscore.string","url":"https://api.github.com/repos/epeli/underscore.string"},"payload":{"push_id":536753254,"size":2,"distinct_size":1,"ref":"refs/heads/master","head":"cebddf40cf2e10f0e9b596d9654edd0a1cfefc15","before":"244b1724770947430793dc43fb96d610dd045c47","commits":[{"sha":"9fa0bbce075f82af8a7cd96abac4a6a1ae718611","author":{"email":"3879ab0c8adeefa545d20a45d877af2f6b5284b0@tocco.ch","name":"Christoph Hermann"},"message":"add force lowercase flag to camelize\n\n- add tests for capitalization of the first letter\n- add alias camelcase (analoge ruby)\n- merge duplicate test suite for camelize\n\ncloses #306","distinct":false,"url":"https://api.github.com/repos/epeli/underscore.string/commits/9fa0bbce075f82af8a7cd96abac4a6a1ae718611"},{"sha":"cebddf40cf2e10f0e9b596d9654edd0a1cfefc15","author":{"email":"02503ea0b8f4cf66a2b1602591dbce46860393b2@gmail.com","name":"Christoph Hermann"},"message":"Merge pull request #370 from epeli/camelize-force-lowercase\n\nadd force lowercase flag to camelize","distinct":true,"url":"https://api.github.com/repos/epeli/underscore.string/commits/cebddf40cf2e10f0e9b596d9654edd0a1cfefc15"}]},"public":true,"created_at":"2015-01-01T01:05:28Z"}
{"id":"2489398199","type":"IssueCommentEvent","actor":{"id":1203825,"login":"huonw","gravatar_id":"","url":"https://api.github.com/users/huonw","avatar_url":"https://avatars.githubusercontent.com/u/1203825?"},"repo":{"id":724712,"name":"rust-lang/rust","url":"https://api.github.com/repos/rust-lang/rust"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/rust-lang/rust/issues/20373","labels_url":"https://api.github.com/repos/rust-lang/rust/issues/20373/labels{/name}","comments_url":"https://api.github.com/repos/rust-lang/rust/issues/20373/comments","events_url":"https://api.github.com/repos/rust-lang/rust/issues/20373/events","html_url":"https://github.com/rust-lang/rust/pull/20373","id":53190761,"number":20373,"title":"Add a lint `unconditional_self_calls` to detect unconditional recursion.","user":{"login":"huonw","id":1203825,"avatar_url":"https://avatars.githubusercontent.com/u/1203825?v=3","gravatar_id":"","url":"https://api.github.com/users/huonw","html_url":"https://github.com/huonw","followers_url":"https://api.github.com/users/huonw/followers","following_url":"https://api.github.com/users/huonw/following{/other_user}","gists_url":"https://api.github.com/users/huonw/gists{/gist_id}","starred_url":"https://api.github.com/users/huonw/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/huonw/subscriptions","organizations_url":"https://api.github.com/users/huonw/orgs","repos_url":"https://api.github.com/users/huonw/repos","events_url":"https://api.github.com/users/huonw/events{/privacy}","received_events_url":"https://api.github.com/users/huonw/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":{"login":"luqmana","id":287063,"avatar_url":"https://avatars.githubusercontent.com/u/287063?v=3","gravatar_id":"","url":"https://api.github.com/users/luqmana","html_url":"https://github.com/luqmana","followers_url":"https://api.github.com/users/luqmana/followers","following_
url":"https://api.github.com/users/luqmana/following{/other_user}","gists_url":"https://api.github.com/users/luqmana/gists{/gist_id}","starred_url":"https://api.github.com/users/luqmana/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/luqmana/subscriptions","organizations_url":"https://api.github.com/users/luqmana/orgs","repos_url":"https://api.github.com/users/luqmana/repos","events_url":"https://api.github.com/users/luqmana/events{/privacy}","received_events_url":"https://api.github.com/users/luqmana/received_events","type":"User","site_admin":false},"milestone":null,"comments":3,"created_at":"2014-12-31T16:18:18Z","updated_at":"2015-01-01T01:05:28Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/rust-lang/rust/pulls/20373","html_url":"https://github.com/rust-lang/rust/pull/20373","diff_url":"https://github.com/rust-lang/rust/pull/20373.diff","patch_url":"https://github.com/rust-lang/rust/pull/20373.patch"},"body":"E.g. `fn foo() { foo() }`, or, more subtlely\r\n\r\n    impl Foo for Box<Foo+'static> {\r\n        fn bar(&self) {\r\n            self.bar();\r\n        }\r\n    }\r\n\r\nThe compiler will warn and point out the points where recursion occurs,\r\nif it determines that the function cannot return without calling itself.\r\n\r\nCloses #17899.\r\n\r\n---\r\n\r\nThis is highly non-perfect, in particular, my wording above is quite precise, and I have some unresolved questions: This currently will warn about\r\n\r\n```rust\r\nfn foo() {\r\n    if bar { loop {} }\r\n\r\n    foo()\r\n}\r\n```\r\n\r\neven though `foo` may never be called (i.e. our apparent \"unconditional\" recursion is actually conditional). 
I don't know if we should handle this case, and ones like it with `panic!()` instead of `loop` (or anything else that \"returns\" `!`).\r\n\r\nHowever, strictly speaking, it seems to me that changing the above to not warn will require changing\r\n\r\n```rust\r\nfn foo() {\r\n    while bar {}\r\n    foo()\r\n}\r\n```\r\n\r\nto also not warn since it could be that the `while` is an infinite loop and doesn't ever hit the `foo`.\r\n\r\nI'm inclined to think we let these cases warn since true edge cases like the first one seem rare, and if they do occur they seem like they would usually be typos in the function call. (I could imagine someone accidentally having code like `fn foo() { assert!(bar()); foo() /* meant to be boo() */ }` which won't warn if the `loop` case is \"fixed\".)\r\n\r\n(Part of the reason this is unresolved is wanting feedback, part of the reason is I couldn't devise a strategy that worked in all cases.)\r\n\r\n---\r\n\r\nThe name `unconditional_self_calls` is kinda clunky; and this reconstructs the CFG for each function that is linted which may or may not be very expensive, I don't 
know."},"comment":{"url":"https://api.github.com/repos/rust-lang/rust/issues/comments/68477337","html_url":"https://github.com/rust-lang/rust/pull/20373#issuecomment-68477337","issue_url":"https://api.github.com/repos/rust-lang/rust/issues/20373","id":68477337,"user":{"login":"huonw","id":1203825,"avatar_url":"https://avatars.githubusercontent.com/u/1203825?v=3","gravatar_id":"","url":"https://api.github.com/users/huonw","html_url":"https://github.com/huonw","followers_url":"https://api.github.com/users/huonw/followers","following_url":"https://api.github.com/users/huonw/following{/other_user}","gists_url":"https://api.github.com/users/huonw/gists{/gist_id}","starred_url":"https://api.github.com/users/huonw/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/huonw/subscriptions","organizations_url":"https://api.github.com/users/huonw/orgs","repos_url":"https://api.github.com/users/huonw/repos","events_url":"https://api.github.com/users/huonw/events{/privacy}","received_events_url":"https://api.github.com/users/huonw/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:05:28Z","updated_at":"2015-01-01T01:05:28Z","body":"@luqmana, speaking prescriptively, \"recurs\" is actually *more* correct than recurses, e.g. http://english.stackexchange.com/questions/163446/does-a-recursive-procedure-recur ; I'm happy to change it if people prefer the recurse version."}},"public":true,"created_at":"2015-01-01T01:05:29Z","org":{"id":5430905,"login":"rust-lang","gravatar_id":"","url":"https://api.github.com/orgs/rust-lang","avatar_url":"https://avatars.githubusercontent.com/u/5430905?"}}
{"id":"2489398200","type":"WatchEvent","actor":{"id":1015032,"login":"miketahani","gravatar_id":"","url":"https://api.github.com/users/miketahani","avatar_url":"https://avatars.githubusercontent.com/u/1015032?"},"repo":{"id":1318988,"name":"Instagram/python-instagram","url":"https://api.github.com/repos/Instagram/python-instagram"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:05:29Z","org":{"id":549085,"login":"Instagram","gravatar_id":"","url":"https://api.github.com/orgs/Instagram","avatar_url":"https://avatars.githubusercontent.com/u/549085?"}}
{"id":"2489398205","type":"PushEvent","actor":{"id":9278781,"login":"Missling","gravatar_id":"","url":"https://api.github.com/users/Missling","avatar_url":"https://avatars.githubusercontent.com/u/9278781?"},"repo":{"id":27950087,"name":"Missling/missling.github.io","url":"https://api.github.com/repos/Missling/missling.github.io"},"payload":{"push_id":536753258,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"837dcc81f2013cbfc2ded2f8e96ed6678e554e11","before":"ac2686d840d1c7edd43896a8170e969483d1a261","commits":[{"sha":"837dcc81f2013cbfc2ded2f8e96ed6678e554e11","author":{"email":"75f3425216d1181ebb16fc73302673da505d7ee1@gmail.com","name":"Ling Giang"},"message":"update website index page and blogcss","distinct":true,"url":"https://api.github.com/repos/Missling/missling.github.io/commits/837dcc81f2013cbfc2ded2f8e96ed6678e554e11"}]},"public":true,"created_at":"2015-01-01T01:05:30Z"}
{"id":"2489398207","type":"PullRequestEvent","actor":{"id":3489773,"login":"captainkirkby","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","avatar_url":"https://avatars.githubusercontent.com/u/3489773?"},"repo":{"id":15461243,"name":"captainkirkby/Gears","url":"https://api.github.com/repos/captainkirkby/Gears"},"payload":{"action":"opened","number":31,"pull_request":{"url":"https://api.github.com/repos/captainkirkby/Gears/pulls/31","id":26739457,"html_url":"https://github.com/captainkirkby/Gears/pull/31","diff_url":"https://github.com/captainkirkby/Gears/pull/31.diff","patch_url":"https://github.com/captainkirkby/Gears/pull/31.patch","issue_url":"https://api.github.com/repos/captainkirkby/Gears/issues/31","number":31,"state":"open","locked":false,"title":"Add simple C program to replay binary file","user":{"login":"captainkirkby","id":3489773,"avatar_url":"https://avatars.githubusercontent.com/u/3489773?v=3","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","html_url":"https://github.com/captainkirkby","followers_url":"https://api.github.com/users/captainkirkby/followers","following_url":"https://api.github.com/users/captainkirkby/following{/other_user}","gists_url":"https://api.github.com/users/captainkirkby/gists{/gist_id}","starred_url":"https://api.github.com/users/captainkirkby/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/captainkirkby/subscriptions","organizations_url":"https://api.github.com/users/captainkirkby/orgs","repos_url":"https://api.github.com/users/captainkirkby/repos","events_url":"https://api.github.com/users/captainkirkby/events{/privacy}","received_events_url":"https://api.github.com/users/captainkirkby/received_events","type":"User","site_admin":false},"body":"Closes issue #30 
","created_at":"2015-01-01T01:05:31Z","updated_at":"2015-01-01T01:05:31Z","closed_at":null,"merged_at":null,"merge_commit_sha":"1937489450eb244357356ec9a4ad968f1d63e23d","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/captainkirkby/Gears/pulls/31/commits","review_comments_url":"https://api.github.com/repos/captainkirkby/Gears/pulls/31/comments","review_comment_url":"https://api.github.com/repos/captainkirkby/Gears/pulls/comments/{number}","comments_url":"https://api.github.com/repos/captainkirkby/Gears/issues/31/comments","statuses_url":"https://api.github.com/repos/captainkirkby/Gears/statuses/0ce69fa19d81de656dd6a74629099a7fa9261d1c","head":{"label":"captainkirkby:#30","ref":"#30","sha":"0ce69fa19d81de656dd6a74629099a7fa9261d1c","user":{"login":"captainkirkby","id":3489773,"avatar_url":"https://avatars.githubusercontent.com/u/3489773?v=3","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","html_url":"https://github.com/captainkirkby","followers_url":"https://api.github.com/users/captainkirkby/followers","following_url":"https://api.github.com/users/captainkirkby/following{/other_user}","gists_url":"https://api.github.com/users/captainkirkby/gists{/gist_id}","starred_url":"https://api.github.com/users/captainkirkby/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/captainkirkby/subscriptions","organizations_url":"https://api.github.com/users/captainkirkby/orgs","repos_url":"https://api.github.com/users/captainkirkby/repos","events_url":"https://api.github.com/users/captainkirkby/events{/privacy}","received_events_url":"https://api.github.com/users/captainkirkby/received_events","type":"User","site_admin":false},"repo":{"id":15461243,"name":"Gears","full_name":"captainkirkby/Gears","owner":{"login":"captainkirkby","id":3489773,"avatar_url":"https://avatars.githubusercontent.com/u/3489773?v=3","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","html_url":"https://github.com/captain
kirkby","followers_url":"https://api.github.com/users/captainkirkby/followers","following_url":"https://api.github.com/users/captainkirkby/following{/other_user}","gists_url":"https://api.github.com/users/captainkirkby/gists{/gist_id}","starred_url":"https://api.github.com/users/captainkirkby/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/captainkirkby/subscriptions","organizations_url":"https://api.github.com/users/captainkirkby/orgs","repos_url":"https://api.github.com/users/captainkirkby/repos","events_url":"https://api.github.com/users/captainkirkby/events{/privacy}","received_events_url":"https://api.github.com/users/captainkirkby/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/captainkirkby/Gears","description":"Set of packages used to measure a mechanical clock.","fork":false,"url":"https://api.github.com/repos/captainkirkby/Gears","forks_url":"https://api.github.com/repos/captainkirkby/Gears/forks","keys_url":"https://api.github.com/repos/captainkirkby/Gears/keys{/key_id}","collaborators_url":"https://api.github.com/repos/captainkirkby/Gears/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/captainkirkby/Gears/teams","hooks_url":"https://api.github.com/repos/captainkirkby/Gears/hooks","issue_events_url":"https://api.github.com/repos/captainkirkby/Gears/issues/events{/number}","events_url":"https://api.github.com/repos/captainkirkby/Gears/events","assignees_url":"https://api.github.com/repos/captainkirkby/Gears/assignees{/user}","branches_url":"https://api.github.com/repos/captainkirkby/Gears/branches{/branch}","tags_url":"https://api.github.com/repos/captainkirkby/Gears/tags","blobs_url":"https://api.github.com/repos/captainkirkby/Gears/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/captainkirkby/Gears/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/captainkirkby/Gears/git/refs{/sha}","trees_url":"https://api.github.com/repos/captain
kirkby/Gears/git/trees{/sha}","statuses_url":"https://api.github.com/repos/captainkirkby/Gears/statuses/{sha}","languages_url":"https://api.github.com/repos/captainkirkby/Gears/languages","stargazers_url":"https://api.github.com/repos/captainkirkby/Gears/stargazers","contributors_url":"https://api.github.com/repos/captainkirkby/Gears/contributors","subscribers_url":"https://api.github.com/repos/captainkirkby/Gears/subscribers","subscription_url":"https://api.github.com/repos/captainkirkby/Gears/subscription","commits_url":"https://api.github.com/repos/captainkirkby/Gears/commits{/sha}","git_commits_url":"https://api.github.com/repos/captainkirkby/Gears/git/commits{/sha}","comments_url":"https://api.github.com/repos/captainkirkby/Gears/comments{/number}","issue_comment_url":"https://api.github.com/repos/captainkirkby/Gears/issues/comments/{number}","contents_url":"https://api.github.com/repos/captainkirkby/Gears/contents/{+path}","compare_url":"https://api.github.com/repos/captainkirkby/Gears/compare/{base}...{head}","merges_url":"https://api.github.com/repos/captainkirkby/Gears/merges","archive_url":"https://api.github.com/repos/captainkirkby/Gears/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/captainkirkby/Gears/downloads","issues_url":"https://api.github.com/repos/captainkirkby/Gears/issues{/number}","pulls_url":"https://api.github.com/repos/captainkirkby/Gears/pulls{/number}","milestones_url":"https://api.github.com/repos/captainkirkby/Gears/milestones{/number}","notifications_url":"https://api.github.com/repos/captainkirkby/Gears/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/captainkirkby/Gears/labels{/name}","releases_url":"https://api.github.com/repos/captainkirkby/Gears/releases{/id}","created_at":"2013-12-26T22:05:51Z","updated_at":"2015-01-01T00:41:54Z","pushed_at":"2015-01-01T01:02:09Z","git_url":"git://github.com/captainkirkby/Gears.git","ssh_url":"git@github.com:captainkirkby/Gears.git","clone
_url":"https://github.com/captainkirkby/Gears.git","svn_url":"https://github.com/captainkirkby/Gears","homepage":"","size":18140,"stargazers_count":1,"watchers_count":1,"language":"C++","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":12,"forks":0,"open_issues":12,"watchers":1,"default_branch":"master"}},"base":{"label":"captainkirkby:master","ref":"master","sha":"b838f0c36403eab209f3565eeb7a10375911d228","user":{"login":"captainkirkby","id":3489773,"avatar_url":"https://avatars.githubusercontent.com/u/3489773?v=3","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","html_url":"https://github.com/captainkirkby","followers_url":"https://api.github.com/users/captainkirkby/followers","following_url":"https://api.github.com/users/captainkirkby/following{/other_user}","gists_url":"https://api.github.com/users/captainkirkby/gists{/gist_id}","starred_url":"https://api.github.com/users/captainkirkby/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/captainkirkby/subscriptions","organizations_url":"https://api.github.com/users/captainkirkby/orgs","repos_url":"https://api.github.com/users/captainkirkby/repos","events_url":"https://api.github.com/users/captainkirkby/events{/privacy}","received_events_url":"https://api.github.com/users/captainkirkby/received_events","type":"User","site_admin":false},"repo":{"id":15461243,"name":"Gears","full_name":"captainkirkby/Gears","owner":{"login":"captainkirkby","id":3489773,"avatar_url":"https://avatars.githubusercontent.com/u/3489773?v=3","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","html_url":"https://github.com/captainkirkby","followers_url":"https://api.github.com/users/captainkirkby/followers","following_url":"https://api.github.com/users/captainkirkby/following{/other_user}","gists_url":"https://api.github.com/users/captainkirkby/gists{/gist_id}","starred_url":"https://api.github.com/users/cap
tainkirkby/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/captainkirkby/subscriptions","organizations_url":"https://api.github.com/users/captainkirkby/orgs","repos_url":"https://api.github.com/users/captainkirkby/repos","events_url":"https://api.github.com/users/captainkirkby/events{/privacy}","received_events_url":"https://api.github.com/users/captainkirkby/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/captainkirkby/Gears","description":"Set of packages used to measure a mechanical clock.","fork":false,"url":"https://api.github.com/repos/captainkirkby/Gears","forks_url":"https://api.github.com/repos/captainkirkby/Gears/forks","keys_url":"https://api.github.com/repos/captainkirkby/Gears/keys{/key_id}","collaborators_url":"https://api.github.com/repos/captainkirkby/Gears/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/captainkirkby/Gears/teams","hooks_url":"https://api.github.com/repos/captainkirkby/Gears/hooks","issue_events_url":"https://api.github.com/repos/captainkirkby/Gears/issues/events{/number}","events_url":"https://api.github.com/repos/captainkirkby/Gears/events","assignees_url":"https://api.github.com/repos/captainkirkby/Gears/assignees{/user}","branches_url":"https://api.github.com/repos/captainkirkby/Gears/branches{/branch}","tags_url":"https://api.github.com/repos/captainkirkby/Gears/tags","blobs_url":"https://api.github.com/repos/captainkirkby/Gears/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/captainkirkby/Gears/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/captainkirkby/Gears/git/refs{/sha}","trees_url":"https://api.github.com/repos/captainkirkby/Gears/git/trees{/sha}","statuses_url":"https://api.github.com/repos/captainkirkby/Gears/statuses/{sha}","languages_url":"https://api.github.com/repos/captainkirkby/Gears/languages","stargazers_url":"https://api.github.com/repos/captainkirkby/Gears/stargazers","contributors_ur
l":"https://api.github.com/repos/captainkirkby/Gears/contributors","subscribers_url":"https://api.github.com/repos/captainkirkby/Gears/subscribers","subscription_url":"https://api.github.com/repos/captainkirkby/Gears/subscription","commits_url":"https://api.github.com/repos/captainkirkby/Gears/commits{/sha}","git_commits_url":"https://api.github.com/repos/captainkirkby/Gears/git/commits{/sha}","comments_url":"https://api.github.com/repos/captainkirkby/Gears/comments{/number}","issue_comment_url":"https://api.github.com/repos/captainkirkby/Gears/issues/comments/{number}","contents_url":"https://api.github.com/repos/captainkirkby/Gears/contents/{+path}","compare_url":"https://api.github.com/repos/captainkirkby/Gears/compare/{base}...{head}","merges_url":"https://api.github.com/repos/captainkirkby/Gears/merges","archive_url":"https://api.github.com/repos/captainkirkby/Gears/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/captainkirkby/Gears/downloads","issues_url":"https://api.github.com/repos/captainkirkby/Gears/issues{/number}","pulls_url":"https://api.github.com/repos/captainkirkby/Gears/pulls{/number}","milestones_url":"https://api.github.com/repos/captainkirkby/Gears/milestones{/number}","notifications_url":"https://api.github.com/repos/captainkirkby/Gears/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/captainkirkby/Gears/labels{/name}","releases_url":"https://api.github.com/repos/captainkirkby/Gears/releases{/id}","created_at":"2013-12-26T22:05:51Z","updated_at":"2015-01-01T00:41:54Z","pushed_at":"2015-01-01T01:02:09Z","git_url":"git://github.com/captainkirkby/Gears.git","ssh_url":"git@github.com:captainkirkby/Gears.git","clone_url":"https://github.com/captainkirkby/Gears.git","svn_url":"https://github.com/captainkirkby/Gears","homepage":"","size":18140,"stargazers_count":1,"watchers_count":1,"language":"C++","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_
url":null,"open_issues_count":12,"forks":0,"open_issues":12,"watchers":1,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/captainkirkby/Gears/pulls/31"},"html":{"href":"https://github.com/captainkirkby/Gears/pull/31"},"issue":{"href":"https://api.github.com/repos/captainkirkby/Gears/issues/31"},"comments":{"href":"https://api.github.com/repos/captainkirkby/Gears/issues/31/comments"},"review_comments":{"href":"https://api.github.com/repos/captainkirkby/Gears/pulls/31/comments"},"review_comment":{"href":"https://api.github.com/repos/captainkirkby/Gears/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/captainkirkby/Gears/pulls/31/commits"},"statuses":{"href":"https://api.github.com/repos/captainkirkby/Gears/statuses/0ce69fa19d81de656dd6a74629099a7fa9261d1c"}},"merged":false,"mergeable":true,"mergeable_state":"clean","merged_by":null,"comments":0,"review_comments":0,"commits":1,"additions":129,"deletions":0,"changed_files":1}},"public":true,"created_at":"2015-01-01T01:05:32Z"}
{"id":"2489398208","type":"WatchEvent","actor":{"id":1817530,"login":"mitchellw","gravatar_id":"","url":"https://api.github.com/users/mitchellw","avatar_url":"https://avatars.githubusercontent.com/u/1817530?"},"repo":{"id":27339405,"name":"QBCo/akemi","url":"https://api.github.com/repos/QBCo/akemi"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:05:32Z","org":{"id":10001822,"login":"QBCo","gravatar_id":"","url":"https://api.github.com/orgs/QBCo","avatar_url":"https://avatars.githubusercontent.com/u/10001822?"}}
{"id":"2489398215","type":"IssuesEvent","actor":{"id":1802542,"login":"ishayyaari","gravatar_id":"","url":"https://api.github.com/users/ishayyaari","avatar_url":"https://avatars.githubusercontent.com/u/1802542?"},"repo":{"id":4967600,"name":"MiYa-Solutions/sbcx","url":"https://api.github.com/repos/MiYa-Solutions/sbcx"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/MiYa-Solutions/sbcx/issues/715","labels_url":"https://api.github.com/repos/MiYa-Solutions/sbcx/issues/715/labels{/name}","comments_url":"https://api.github.com/repos/MiYa-Solutions/sbcx/issues/715/comments","events_url":"https://api.github.com/repos/MiYa-Solutions/sbcx/issues/715/events","html_url":"https://github.com/MiYa-Solutions/sbcx/issues/715","id":53198063,"number":715,"title":"Feedback From Rug Wash Meeting Dec 31 2014","user":{"login":"markmilman","id":1744318,"avatar_url":"https://avatars.githubusercontent.com/u/1744318?v=3","gravatar_id":"","url":"https://api.github.com/users/markmilman","html_url":"https://github.com/markmilman","followers_url":"https://api.github.com/users/markmilman/followers","following_url":"https://api.github.com/users/markmilman/following{/other_user}","gists_url":"https://api.github.com/users/markmilman/gists{/gist_id}","starred_url":"https://api.github.com/users/markmilman/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/markmilman/subscriptions","organizations_url":"https://api.github.com/users/markmilman/orgs","repos_url":"https://api.github.com/users/markmilman/repos","events_url":"https://api.github.com/users/markmilman/events{/privacy}","received_events_url":"https://api.github.com/users/markmilman/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":{"login":"ishayyaari","id":1802542,"avatar_url":"https://avatars.githubusercontent.com/u/1802542?v=3","gravatar_id":"","url":"https://api.github.com/users/ishayyaari","html_url":"https://github.com/ishayyaari","fol
lowers_url":"https://api.github.com/users/ishayyaari/followers","following_url":"https://api.github.com/users/ishayyaari/following{/other_user}","gists_url":"https://api.github.com/users/ishayyaari/gists{/gist_id}","starred_url":"https://api.github.com/users/ishayyaari/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ishayyaari/subscriptions","organizations_url":"https://api.github.com/users/ishayyaari/orgs","repos_url":"https://api.github.com/users/ishayyaari/repos","events_url":"https://api.github.com/users/ishayyaari/events{/privacy}","received_events_url":"https://api.github.com/users/ishayyaari/received_events","type":"User","site_admin":false},"milestone":{"url":"https://api.github.com/repos/MiYa-Solutions/sbcx/milestones/10","labels_url":"https://api.github.com/repos/MiYa-Solutions/sbcx/milestones/10/labels","id":835988,"number":10,"title":"Rug Wash Bug Fixes","description":"Fixes specifically for the rug wash opportunity","creator":{"login":"markmilman","id":1744318,"avatar_url":"https://avatars.githubusercontent.com/u/1744318?v=3","gravatar_id":"","url":"https://api.github.com/users/markmilman","html_url":"https://github.com/markmilman","followers_url":"https://api.github.com/users/markmilman/followers","following_url":"https://api.github.com/users/markmilman/following{/other_user}","gists_url":"https://api.github.com/users/markmilman/gists{/gist_id}","starred_url":"https://api.github.com/users/markmilman/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/markmilman/subscriptions","organizations_url":"https://api.github.com/users/markmilman/orgs","repos_url":"https://api.github.com/users/markmilman/repos","events_url":"https://api.github.com/users/markmilman/events{/privacy}","received_events_url":"https://api.github.com/users/markmilman/received_events","type":"User","site_admin":false},"open_issues":6,"closed_issues":37,"state":"open","created_at":"2014-10-22T14:08:56Z","updated_at":"2015-01-01T01:05:32Z","d
ue_on":"2014-11-11T08:00:00Z","closed_at":null},"comments":0,"created_at":"2014-12-31T18:58:02Z","updated_at":"2015-01-01T01:05:32Z","closed_at":"2015-01-01T01:05:32Z","body":"* Show the Project Number (Order Number)\r\n* Include Job #  in the invoice"}},"public":true,"created_at":"2015-01-01T01:05:32Z","org":{"id":1788572,"login":"MiYa-Solutions","gravatar_id":"","url":"https://api.github.com/orgs/MiYa-Solutions","avatar_url":"https://avatars.githubusercontent.com/u/1788572?"}}
{"id":"2489398217","type":"PushEvent","actor":{"id":433707,"login":"ile","gravatar_id":"","url":"https://api.github.com/users/ile","avatar_url":"https://avatars.githubusercontent.com/u/433707?"},"repo":{"id":26847132,"name":"kantele/k-templates","url":"https://api.github.com/repos/kantele/k-templates"},"payload":{"push_id":536753264,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"ca0474a33dcc125aa7204b517dd7cef8003db346","before":"a2211fba71212268a1c0f0b3dc4ddb1412bf72b6","commits":[{"sha":"ca0474a33dcc125aa7204b517dd7cef8003db346","author":{"email":"4f3407de78bccc8cc160ee4d278d5efe7162e6b5@nateps.com","name":"Nate Smith"},"message":"0.2.1\n\nConflicts:\n\tpackage.json","distinct":true,"url":"https://api.github.com/repos/kantele/k-templates/commits/ca0474a33dcc125aa7204b517dd7cef8003db346"}]},"public":true,"created_at":"2015-01-01T01:05:32Z","org":{"id":5687585,"login":"kantele","gravatar_id":"","url":"https://api.github.com/orgs/kantele","avatar_url":"https://avatars.githubusercontent.com/u/5687585?"}}
{"id":"2489398218","type":"PushEvent","actor":{"id":1802542,"login":"ishayyaari","gravatar_id":"","url":"https://api.github.com/users/ishayyaari","avatar_url":"https://avatars.githubusercontent.com/u/1802542?"},"repo":{"id":4967600,"name":"MiYa-Solutions/sbcx","url":"https://api.github.com/repos/MiYa-Solutions/sbcx"},"payload":{"push_id":536753265,"size":1,"distinct_size":1,"ref":"refs/heads/development","head":"ead55f938ace15919d2bd2b15f1cde4ef5105ced","before":"3f21c270c34c90f4c7c43cf053dde0edd3841782","commits":[{"sha":"ead55f938ace15919d2bd2b15f1cde4ef5105ced","author":{"email":"9534b3c0ec96f8059b6f52efee60e93b9c6b42be","name":"ishayyaari"},"message":"Feedback From Rug Wash Meeting Dec 31 2014\n\nFixed #715","distinct":true,"url":"https://api.github.com/repos/MiYa-Solutions/sbcx/commits/ead55f938ace15919d2bd2b15f1cde4ef5105ced"}]},"public":true,"created_at":"2015-01-01T01:05:32Z","org":{"id":1788572,"login":"MiYa-Solutions","gravatar_id":"","url":"https://api.github.com/orgs/MiYa-Solutions","avatar_url":"https://avatars.githubusercontent.com/u/1788572?"}}
{"id":"2489398219","type":"PushEvent","actor":{"id":1133652,"login":"keum","gravatar_id":"","url":"https://api.github.com/users/keum","avatar_url":"https://avatars.githubusercontent.com/u/1133652?"},"repo":{"id":18115347,"name":"keum/data_display","url":"https://api.github.com/repos/keum/data_display"},"payload":{"push_id":536753266,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"a6eee972e4e07e37d6731216a5d653016c300784","before":"4e4c11b0947a21977b8eb995000a211cc06fa070","commits":[{"sha":"a6eee972e4e07e37d6731216a5d653016c300784","author":{"email":"77be1f27789ed5ba740c04e6493c37160e58f28c@gmail.com","name":"Peter Keum"},"message":"\"Data Upload: 2014-12-31 05:05:29 PM\"","distinct":true,"url":"https://api.github.com/repos/keum/data_display/commits/a6eee972e4e07e37d6731216a5d653016c300784"}]},"public":true,"created_at":"2015-01-01T01:05:32Z"}
{"id":"2489398220","type":"PullRequestEvent","actor":{"id":19792,"login":"wiredfool","gravatar_id":"","url":"https://api.github.com/users/wiredfool","avatar_url":"https://avatars.githubusercontent.com/u/19792?"},"repo":{"id":5171600,"name":"python-pillow/Pillow","url":"https://api.github.com/repos/python-pillow/Pillow"},"payload":{"action":"opened","number":1062,"pull_request":{"url":"https://api.github.com/repos/python-pillow/Pillow/pulls/1062","id":26739458,"html_url":"https://github.com/python-pillow/Pillow/pull/1062","diff_url":"https://github.com/python-pillow/Pillow/pull/1062.diff","patch_url":"https://github.com/python-pillow/Pillow/pull/1062.patch","issue_url":"https://api.github.com/repos/python-pillow/Pillow/issues/1062","number":1062,"state":"open","locked":false,"title":"Png text decompression dos fix, for 2.6.x","user":{"login":"wiredfool","id":19792,"avatar_url":"https://avatars.githubusercontent.com/u/19792?v=3","gravatar_id":"","url":"https://api.github.com/users/wiredfool","html_url":"https://github.com/wiredfool","followers_url":"https://api.github.com/users/wiredfool/followers","following_url":"https://api.github.com/users/wiredfool/following{/other_user}","gists_url":"https://api.github.com/users/wiredfool/gists{/gist_id}","starred_url":"https://api.github.com/users/wiredfool/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/wiredfool/subscriptions","organizations_url":"https://api.github.com/users/wiredfool/orgs","repos_url":"https://api.github.com/users/wiredfool/repos","events_url":"https://api.github.com/users/wiredfool/events{/privacy}","received_events_url":"https://api.github.com/users/wiredfool/received_events","type":"User","site_admin":false},"body":"Same as in master, but for 
2.6.x","created_at":"2015-01-01T01:05:32Z","updated_at":"2015-01-01T01:05:32Z","closed_at":null,"merged_at":null,"merge_commit_sha":null,"assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/python-pillow/Pillow/pulls/1062/commits","review_comments_url":"https://api.github.com/repos/python-pillow/Pillow/pulls/1062/comments","review_comment_url":"https://api.github.com/repos/python-pillow/Pillow/pulls/comments/{number}","comments_url":"https://api.github.com/repos/python-pillow/Pillow/issues/1062/comments","statuses_url":"https://api.github.com/repos/python-pillow/Pillow/statuses/cf880329a755f5b5c81df661990105593adf4a37","head":{"label":"wiredfool:png-dos-2.6.1","ref":"png-dos-2.6.1","sha":"cf880329a755f5b5c81df661990105593adf4a37","user":{"login":"wiredfool","id":19792,"avatar_url":"https://avatars.githubusercontent.com/u/19792?v=3","gravatar_id":"","url":"https://api.github.com/users/wiredfool","html_url":"https://github.com/wiredfool","followers_url":"https://api.github.com/users/wiredfool/followers","following_url":"https://api.github.com/users/wiredfool/following{/other_user}","gists_url":"https://api.github.com/users/wiredfool/gists{/gist_id}","starred_url":"https://api.github.com/users/wiredfool/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/wiredfool/subscriptions","organizations_url":"https://api.github.com/users/wiredfool/orgs","repos_url":"https://api.github.com/users/wiredfool/repos","events_url":"https://api.github.com/users/wiredfool/events{/privacy}","received_events_url":"https://api.github.com/users/wiredfool/received_events","type":"User","site_admin":false},"repo":{"id":8664379,"name":"Pillow","full_name":"wiredfool/Pillow","owner":{"login":"wiredfool","id":19792,"avatar_url":"https://avatars.githubusercontent.com/u/19792?v=3","gravatar_id":"","url":"https://api.github.com/users/wiredfool","html_url":"https://github.com/wiredfool","followers_url":"https://api.github.com/users/wiredfool/followers","f
ollowing_url":"https://api.github.com/users/wiredfool/following{/other_user}","gists_url":"https://api.github.com/users/wiredfool/gists{/gist_id}","starred_url":"https://api.github.com/users/wiredfool/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/wiredfool/subscriptions","organizations_url":"https://api.github.com/users/wiredfool/orgs","repos_url":"https://api.github.com/users/wiredfool/repos","events_url":"https://api.github.com/users/wiredfool/events{/privacy}","received_events_url":"https://api.github.com/users/wiredfool/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/wiredfool/Pillow","description":"Pillow is the \"friendly\" PIL fork","fork":true,"url":"https://api.github.com/repos/wiredfool/Pillow","forks_url":"https://api.github.com/repos/wiredfool/Pillow/forks","keys_url":"https://api.github.com/repos/wiredfool/Pillow/keys{/key_id}","collaborators_url":"https://api.github.com/repos/wiredfool/Pillow/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/wiredfool/Pillow/teams","hooks_url":"https://api.github.com/repos/wiredfool/Pillow/hooks","issue_events_url":"https://api.github.com/repos/wiredfool/Pillow/issues/events{/number}","events_url":"https://api.github.com/repos/wiredfool/Pillow/events","assignees_url":"https://api.github.com/repos/wiredfool/Pillow/assignees{/user}","branches_url":"https://api.github.com/repos/wiredfool/Pillow/branches{/branch}","tags_url":"https://api.github.com/repos/wiredfool/Pillow/tags","blobs_url":"https://api.github.com/repos/wiredfool/Pillow/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/wiredfool/Pillow/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/wiredfool/Pillow/git/refs{/sha}","trees_url":"https://api.github.com/repos/wiredfool/Pillow/git/trees{/sha}","statuses_url":"https://api.github.com/repos/wiredfool/Pillow/statuses/{sha}","languages_url":"https://api.github.com/repos/wiredfool/Pillow/languag
es","stargazers_url":"https://api.github.com/repos/wiredfool/Pillow/stargazers","contributors_url":"https://api.github.com/repos/wiredfool/Pillow/contributors","subscribers_url":"https://api.github.com/repos/wiredfool/Pillow/subscribers","subscription_url":"https://api.github.com/repos/wiredfool/Pillow/subscription","commits_url":"https://api.github.com/repos/wiredfool/Pillow/commits{/sha}","git_commits_url":"https://api.github.com/repos/wiredfool/Pillow/git/commits{/sha}","comments_url":"https://api.github.com/repos/wiredfool/Pillow/comments{/number}","issue_comment_url":"https://api.github.com/repos/wiredfool/Pillow/issues/comments/{number}","contents_url":"https://api.github.com/repos/wiredfool/Pillow/contents/{+path}","compare_url":"https://api.github.com/repos/wiredfool/Pillow/compare/{base}...{head}","merges_url":"https://api.github.com/repos/wiredfool/Pillow/merges","archive_url":"https://api.github.com/repos/wiredfool/Pillow/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/wiredfool/Pillow/downloads","issues_url":"https://api.github.com/repos/wiredfool/Pillow/issues{/number}","pulls_url":"https://api.github.com/repos/wiredfool/Pillow/pulls{/number}","milestones_url":"https://api.github.com/repos/wiredfool/Pillow/milestones{/number}","notifications_url":"https://api.github.com/repos/wiredfool/Pillow/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/wiredfool/Pillow/labels{/name}","releases_url":"https://api.github.com/repos/wiredfool/Pillow/releases{/id}","created_at":"2013-03-09T03:12:08Z","updated_at":"2014-12-31T23:15:11Z","pushed_at":"2015-01-01T00:37:45Z","git_url":"git://github.com/wiredfool/Pillow.git","ssh_url":"git@github.com:wiredfool/Pillow.git","clone_url":"https://github.com/wiredfool/Pillow.git","svn_url":"https://github.com/wiredfool/Pillow","homepage":"http://python-imaging.github.com","size":14870,"stargazers_count":1,"watchers_count":1,"language":"Python","has_issues":false,"has_download
s":true,"has_wiki":false,"has_pages":true,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":1,"default_branch":"master"}},"base":{"label":"python-pillow:2.6.x","ref":"2.6.x","sha":"4a8471dea18f6196161e4444ce5625f46cecd1e1","user":{"login":"python-pillow","id":2036701,"avatar_url":"https://avatars.githubusercontent.com/u/2036701?v=3","gravatar_id":"","url":"https://api.github.com/users/python-pillow","html_url":"https://github.com/python-pillow","followers_url":"https://api.github.com/users/python-pillow/followers","following_url":"https://api.github.com/users/python-pillow/following{/other_user}","gists_url":"https://api.github.com/users/python-pillow/gists{/gist_id}","starred_url":"https://api.github.com/users/python-pillow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/python-pillow/subscriptions","organizations_url":"https://api.github.com/users/python-pillow/orgs","repos_url":"https://api.github.com/users/python-pillow/repos","events_url":"https://api.github.com/users/python-pillow/events{/privacy}","received_events_url":"https://api.github.com/users/python-pillow/received_events","type":"Organization","site_admin":false},"repo":{"id":5171600,"name":"Pillow","full_name":"python-pillow/Pillow","owner":{"login":"python-pillow","id":2036701,"avatar_url":"https://avatars.githubusercontent.com/u/2036701?v=3","gravatar_id":"","url":"https://api.github.com/users/python-pillow","html_url":"https://github.com/python-pillow","followers_url":"https://api.github.com/users/python-pillow/followers","following_url":"https://api.github.com/users/python-pillow/following{/other_user}","gists_url":"https://api.github.com/users/python-pillow/gists{/gist_id}","starred_url":"https://api.github.com/users/python-pillow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/python-pillow/subscriptions","organizations_url":"https://api.github.com/users/python-pillow/orgs","repos_url":"https://api.git
hub.com/users/python-pillow/repos","events_url":"https://api.github.com/users/python-pillow/events{/privacy}","received_events_url":"https://api.github.com/users/python-pillow/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/python-pillow/Pillow","description":"The friendly PIL fork","fork":false,"url":"https://api.github.com/repos/python-pillow/Pillow","forks_url":"https://api.github.com/repos/python-pillow/Pillow/forks","keys_url":"https://api.github.com/repos/python-pillow/Pillow/keys{/key_id}","collaborators_url":"https://api.github.com/repos/python-pillow/Pillow/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/python-pillow/Pillow/teams","hooks_url":"https://api.github.com/repos/python-pillow/Pillow/hooks","issue_events_url":"https://api.github.com/repos/python-pillow/Pillow/issues/events{/number}","events_url":"https://api.github.com/repos/python-pillow/Pillow/events","assignees_url":"https://api.github.com/repos/python-pillow/Pillow/assignees{/user}","branches_url":"https://api.github.com/repos/python-pillow/Pillow/branches{/branch}","tags_url":"https://api.github.com/repos/python-pillow/Pillow/tags","blobs_url":"https://api.github.com/repos/python-pillow/Pillow/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/python-pillow/Pillow/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/python-pillow/Pillow/git/refs{/sha}","trees_url":"https://api.github.com/repos/python-pillow/Pillow/git/trees{/sha}","statuses_url":"https://api.github.com/repos/python-pillow/Pillow/statuses/{sha}","languages_url":"https://api.github.com/repos/python-pillow/Pillow/languages","stargazers_url":"https://api.github.com/repos/python-pillow/Pillow/stargazers","contributors_url":"https://api.github.com/repos/python-pillow/Pillow/contributors","subscribers_url":"https://api.github.com/repos/python-pillow/Pillow/subscribers","subscription_url":"https://api.github.com/repos/python-pillow/Pi
llow/subscription","commits_url":"https://api.github.com/repos/python-pillow/Pillow/commits{/sha}","git_commits_url":"https://api.github.com/repos/python-pillow/Pillow/git/commits{/sha}","comments_url":"https://api.github.com/repos/python-pillow/Pillow/comments{/number}","issue_comment_url":"https://api.github.com/repos/python-pillow/Pillow/issues/comments/{number}","contents_url":"https://api.github.com/repos/python-pillow/Pillow/contents/{+path}","compare_url":"https://api.github.com/repos/python-pillow/Pillow/compare/{base}...{head}","merges_url":"https://api.github.com/repos/python-pillow/Pillow/merges","archive_url":"https://api.github.com/repos/python-pillow/Pillow/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/python-pillow/Pillow/downloads","issues_url":"https://api.github.com/repos/python-pillow/Pillow/issues{/number}","pulls_url":"https://api.github.com/repos/python-pillow/Pillow/pulls{/number}","milestones_url":"https://api.github.com/repos/python-pillow/Pillow/milestones{/number}","notifications_url":"https://api.github.com/repos/python-pillow/Pillow/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/python-pillow/Pillow/labels{/name}","releases_url":"https://api.github.com/repos/python-pillow/Pillow/releases{/id}","created_at":"2012-07-24T21:38:39Z","updated_at":"2014-12-31T22:44:33Z","pushed_at":"2014-12-31T22:44:33Z","git_url":"git://github.com/python-pillow/Pillow.git","ssh_url":"git@github.com:python-pillow/Pillow.git","clone_url":"https://github.com/python-pillow/Pillow.git","svn_url":"https://github.com/python-pillow/Pillow","homepage":"http://python-pillow.github.io/","size":20365,"stargazers_count":1391,"watchers_count":1391,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":319,"mirror_url":null,"open_issues_count":65,"forks":319,"open_issues":65,"watchers":1391,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.c
om/repos/python-pillow/Pillow/pulls/1062"},"html":{"href":"https://github.com/python-pillow/Pillow/pull/1062"},"issue":{"href":"https://api.github.com/repos/python-pillow/Pillow/issues/1062"},"comments":{"href":"https://api.github.com/repos/python-pillow/Pillow/issues/1062/comments"},"review_comments":{"href":"https://api.github.com/repos/python-pillow/Pillow/pulls/1062/comments"},"review_comment":{"href":"https://api.github.com/repos/python-pillow/Pillow/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/python-pillow/Pillow/pulls/1062/commits"},"statuses":{"href":"https://api.github.com/repos/python-pillow/Pillow/statuses/cf880329a755f5b5c81df661990105593adf4a37"}},"merged":false,"mergeable":null,"mergeable_state":"unknown","merged_by":null,"comments":0,"review_comments":0,"commits":6,"additions":95,"deletions":12,"changed_files":9}},"public":true,"created_at":"2015-01-01T01:05:32Z","org":{"id":2036701,"login":"python-pillow","gravatar_id":"","url":"https://api.github.com/orgs/python-pillow","avatar_url":"https://avatars.githubusercontent.com/u/2036701?"}}
{"id":"2489398223","type":"ReleaseEvent","actor":{"id":99359,"login":"llinder","gravatar_id":"","url":"https://api.github.com/users/llinder","avatar_url":"https://avatars.githubusercontent.com/u/99359?"},"repo":{"id":28669941,"name":"llinder/salt","url":"https://api.github.com/repos/llinder/salt"},"payload":{"action":"published","release":{"url":"https://api.github.com/repos/llinder/salt/releases/818220","assets_url":"https://api.github.com/repos/llinder/salt/releases/818220/assets","upload_url":"https://uploads.github.com/repos/llinder/salt/releases/818220/assets{?name}","html_url":"https://github.com/llinder/salt/releases/tag/v2014.7.0.1","id":818220,"tag_name":"v2014.7.0.1","target_commitish":"2014.7","name":"","draft":false,"author":{"login":"llinder","id":99359,"avatar_url":"https://avatars.githubusercontent.com/u/99359?v=3","gravatar_id":"","url":"https://api.github.com/users/llinder","html_url":"https://github.com/llinder","followers_url":"https://api.github.com/users/llinder/followers","following_url":"https://api.github.com/users/llinder/following{/other_user}","gists_url":"https://api.github.com/users/llinder/gists{/gist_id}","starred_url":"https://api.github.com/users/llinder/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/llinder/subscriptions","organizations_url":"https://api.github.com/users/llinder/orgs","repos_url":"https://api.github.com/users/llinder/repos","events_url":"https://api.github.com/users/llinder/events{/privacy}","received_events_url":"https://api.github.com/users/llinder/received_events","type":"User","site_admin":false},"prerelease":false,"created_at":"2014-12-31T17:03:50Z","published_at":"2015-01-01T01:05:32Z","assets":[],"tarball_url":"https://api.github.com/repos/llinder/salt/tarball/v2014.7.0.1","zipball_url":"https://api.github.com/repos/llinder/salt/zipball/v2014.7.0.1","body":""}},"public":true,"created_at":"2015-01-01T01:05:32Z"}
{"id":"2489398224","type":"PushEvent","actor":{"id":1402662,"login":"jamcar23","gravatar_id":"","url":"https://api.github.com/users/jamcar23","avatar_url":"https://avatars.githubusercontent.com/u/1402662?"},"repo":{"id":28678215,"name":"jamcar23/TextSecure","url":"https://api.github.com/repos/jamcar23/TextSecure"},"payload":{"push_id":536753268,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"cacd2d4c08275da40253cba2e5e8e1dd067e6535","before":"b6822b310ee8a480f9fa2ceab46e3cb7df3b011b","commits":[{"sha":"cacd2d4c08275da40253cba2e5e8e1dd067e6535","author":{"email":"7d57d41adbb4b81194decc0d3895cf6be7ed6b28@gmail.com","name":"jamcar23"},"message":"Added support for larger text such as a PGP key","distinct":true,"url":"https://api.github.com/repos/jamcar23/TextSecure/commits/cacd2d4c08275da40253cba2e5e8e1dd067e6535"}]},"public":true,"created_at":"2015-01-01T01:05:32Z"}
{"id":"2489398225","type":"CreateEvent","actor":{"id":99359,"login":"llinder","gravatar_id":"","url":"https://api.github.com/users/llinder","avatar_url":"https://avatars.githubusercontent.com/u/99359?"},"repo":{"id":28669941,"name":"llinder/salt","url":"https://api.github.com/repos/llinder/salt"},"payload":{"ref":"v2014.7.0.1","ref_type":"tag","master_branch":"develop","description":"Infrastructure automation and management system","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:05:32Z"}
{"id":"2489398232","type":"PushEvent","actor":{"id":1685551,"login":"nyankosoft","gravatar_id":"","url":"https://api.github.com/users/nyankosoft","avatar_url":"https://avatars.githubusercontent.com/u/1685551?"},"repo":{"id":4159713,"name":"nyankosoft/amorphous","url":"https://api.github.com/repos/nyankosoft/amorphous"},"payload":{"push_id":536753272,"size":10,"distinct_size":10,"ref":"refs/heads/master","head":"2080d2aa6a72a59832291f76b4e231b6bc27e2a9","before":"c4b5499bcc5d1f7c079e725c46fcd83d207fd86d","commits":[{"sha":"61fa0705992c0fab00e967469558305e68692664","author":{"email":"1e6e52750314f7db47451c08146cd425ed21ff15@gmail.com","name":"wanko"},"message":"updated: the skeletal mesh demo","distinct":true,"url":"https://api.github.com/repos/nyankosoft/amorphous/commits/61fa0705992c0fab00e967469558305e68692664"},{"sha":"ff50592dc05c087b16fcc889cc6331bb5d994a32","author":{"email":"1e6e52750314f7db47451c08146cd425ed21ff15@gmail.com","name":"wanko"},"message":"updated: VC++ project files.","distinct":true,"url":"https://api.github.com/repos/nyankosoft/amorphous/commits/ff50592dc05c087b16fcc889cc6331bb5d994a32"},{"sha":"148aee80cc188f10752f48bd01fbd3216112a75a","author":{"email":"1e6e52750314f7db47451c08146cd425ed21ff15@gmail.com","name":"wanko"},"message":"changed: the EoL characters to LFs.","distinct":true,"url":"https://api.github.com/repos/nyankosoft/amorphous/commits/148aee80cc188f10752f48bd01fbd3216112a75a"},{"sha":"464a6c62cad68b1213b939e8a745ecf47892e644","author":{"email":"1e6e52750314f7db47451c08146cd425ed21ff15@gmail.com","name":"wanko"},"message":"changed: class and file names from *Test to *Demo","distinct":true,"url":"https://api.github.com/repos/nyankosoft/amorphous/commits/464a6c62cad68b1213b939e8a745ecf47892e644"},{"sha":"90037f3c6af4acf4a67f8dae86463a71e1d9d373","author":{"email":"1e6e52750314f7db47451c08146cd425ed21ff15@gmail.com","name":"wanko"},"message":"changed: CGraphicsTestBase and other related source 
code.","distinct":true,"url":"https://api.github.com/repos/nyankosoft/amorphous/commits/90037f3c6af4acf4a67f8dae86463a71e1d9d373"},{"sha":"8731317418a36f1fe0f757dff00179e86f04dee5","author":{"email":"1e6e52750314f7db47451c08146cd425ed21ff15@gmail.com","name":"wanko"},"message":"fixed: file and class names","distinct":true,"url":"https://api.github.com/repos/nyankosoft/amorphous/commits/8731317418a36f1fe0f757dff00179e86f04dee5"},{"sha":"b59668a84490521c59af648c0759652c392fb6db","author":{"email":"1e6e52750314f7db47451c08146cd425ed21ff15@gmail.com","name":"wanko"},"message":"updated: VC++ project files","distinct":true,"url":"https://api.github.com/repos/nyankosoft/amorphous/commits/b59668a84490521c59af648c0759652c392fb6db"},{"sha":"545bd334f01905514efe81b594850cd93c5869b6","author":{"email":"1e6e52750314f7db47451c08146cd425ed21ff15@gmail.com","name":"wanko"},"message":"added: the Windows executable of MeshViewer","distinct":true,"url":"https://api.github.com/repos/nyankosoft/amorphous/commits/545bd334f01905514efe81b594850cd93c5869b6"},{"sha":"2721bd332fbda951f2ef1c0f581fe049d105273e","author":{"email":"1e6e52750314f7db47451c08146cd425ed21ff15@gmail.com","name":"wanko"},"message":"added: the Windows executable of MeshModelCompiler.exe","distinct":true,"url":"https://api.github.com/repos/nyankosoft/amorphous/commits/2721bd332fbda951f2ef1c0f581fe049d105273e"},{"sha":"2080d2aa6a72a59832291f76b4e231b6bc27e2a9","author":{"email":"1e6e52750314f7db47451c08146cd425ed21ff15@gmail.com","name":"wanko"},"message":"updated: a VC++ project file","distinct":true,"url":"https://api.github.com/repos/nyankosoft/amorphous/commits/2080d2aa6a72a59832291f76b4e231b6bc27e2a9"}]},"public":true,"created_at":"2015-01-01T01:05:33Z"}
{"id":"2489398233","type":"PushEvent","actor":{"id":4535554,"login":"Kflash","gravatar_id":"","url":"https://api.github.com/users/Kflash","avatar_url":"https://avatars.githubusercontent.com/u/4535554?"},"repo":{"id":28209294,"name":"ugma/ugma","url":"https://api.github.com/repos/ugma/ugma"},"payload":{"push_id":536753273,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"c55f37f14e2c6098ed43ec4ced1b8cce898ebc01","before":"958106c2bdc1af4ad5dcded148254f60ee0be0a2","commits":[{"sha":"c55f37f14e2c6098ed43ec4ced1b8cce898ebc01","author":{"email":"fedd6aa74861a001db1cce23d0a3b62b20a9d469@gmail.com","name":"KFlash"},"message":"removed minor bugs","distinct":true,"url":"https://api.github.com/repos/ugma/ugma/commits/c55f37f14e2c6098ed43ec4ced1b8cce898ebc01"}]},"public":true,"created_at":"2015-01-01T01:05:33Z","org":{"id":10238638,"login":"ugma","gravatar_id":"","url":"https://api.github.com/orgs/ugma","avatar_url":"https://avatars.githubusercontent.com/u/10238638?"}}
{"id":"2489398234","type":"PushEvent","actor":{"id":8471028,"login":"tejp","gravatar_id":"","url":"https://api.github.com/users/tejp","avatar_url":"https://avatars.githubusercontent.com/u/8471028?"},"repo":{"id":23040963,"name":"tejp/tejp.github.io","url":"https://api.github.com/repos/tejp/tejp.github.io"},"payload":{"push_id":536753274,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"363dbe560e3cff95e59fbdd48cf2332966d221c7","before":"d573ac05334c6d1d703ba4159a9910a3446a9209","commits":[{"sha":"363dbe560e3cff95e59fbdd48cf2332966d221c7","author":{"email":"d9c605cae73349f701ec912308096793b72cdc83@gmail.com","name":"tejp"},"message":"fix a setting","distinct":true,"url":"https://api.github.com/repos/tejp/tejp.github.io/commits/363dbe560e3cff95e59fbdd48cf2332966d221c7"}]},"public":true,"created_at":"2015-01-01T01:05:33Z"}
{"id":"2489398235","type":"DeleteEvent","actor":{"id":1217681,"login":"stoeffel","gravatar_id":"","url":"https://api.github.com/users/stoeffel","avatar_url":"https://avatars.githubusercontent.com/u/1217681?"},"repo":{"id":800115,"name":"epeli/underscore.string","url":"https://api.github.com/repos/epeli/underscore.string"},"payload":{"ref":"camelize-force-lowercase","ref_type":"branch","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:05:34Z"}
{"id":"2489398237","type":"PullRequestReviewCommentEvent","actor":{"id":523287,"login":"j2sol","gravatar_id":"","url":"https://api.github.com/users/j2sol","avatar_url":"https://avatars.githubusercontent.com/u/523287?"},"repo":{"id":11848896,"name":"blueboxgroup/ursula","url":"https://api.github.com/repos/blueboxgroup/ursula"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397292","id":22397292,"diff_hunk":"@@ -1,121 +1,92 @@\n ---\n-- name: install apache\n-  apt: pkg={{ item }}\n-  with_items:\n-    - apache2\n-    - libapache2-mod-wsgi\n-\n - name: lesscpy must be in apache PATH\n   pip: name=lesscpy version=0.9j\n \n - name: get horizon source repo\n-  git: repo={{ openstack.git_mirror }}/horizon.git\n-       dest=/opt/stack/horizon\n-       version={{ horizon.rev }}\n-       update={{ openstack.git_update }}\n+  git: |\n+    repo={{ openstack.git_mirror}}/horizon.git\n+    dest=/opt/stack/horizon\n+    version={{ horizon.rev }}\n+    update={{ openstack.git_update }}\n   notify:\n     - setup horizon venv\n     - compress horizon assets\n \n-- template: src=opt/stack/horizon/hide-external-networks.patch dest=/opt/stack/horizon/hide-external-networks.patch mode=0644\n-- shell: patch -p1 < hide-external-networks.patch chdir=/opt/stack/horizon\n-  notify:\n-    - setup horizon venv\n-\n - name: add python-memcached to horizon requirements\n-  lineinfile: dest=/opt/stack/horizon/requirements.txt\n-              regexp=^python-memcached\n-              line=python-memcached\n+  lineinfile: dest=/opt/stack/horizon/requirements.txt regexp=^python-memcached line=python-memcached\n   notify:\n     - setup horizon venv\n \n-- name: disable apache status\n-  command: a2dismod status\n-  notify:\n-    - restart apache\n-\n-- name: apache ports config\n-  template: src=etc/apache2/ports.conf\n-            dest=/etc/apache2/ports.conf\n-  notify:\n-    - restart apache\n-\n-- name: disable default apache 
site\n-  command: a2dissite 000-default\n+- name: make sure apache knows about horizon ports\n+  lineinfile: dest=/etc/apache2/ports.conf line=\"Listen 8080\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config (12.04)\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard\n+- name: create dashboard virtualhost on precise\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard\n   when: ansible_distribution_version == \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard.conf\n+- name: create dashboard virtualhost on other\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard.conf\n   when: ansible_distribution_version != \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n - name: enable horizon apache site\n-  command: a2ensite openstack_dashboard\n+  apache2_site: state=enabled name=openstack_dashboard\n   notify:\n-    - restart apache\n-\n-- name: static asset directories\n-  file: dest={{ item }}\n-        state=directory\n-        owner=www-data\n-        group=www-data\n-        mode=0755\n+    - reload apache\n+\n+- name: create static asset dirs\n+  file: |\n+    dest={{ item }}\n+    state=directory\n+    owner=www-data\n+    group=www-data\n+    mode=0755\n   with_items:\n     - /opt/stack/horizon/static\n     - /opt/stack/horizon/static/dashboard\n \n-- name: horizon local settings\n-  template: src=opt/stack/horizon/openstack_dashboard/local/local_settings.py\n-            dest=/opt/stack/horizon/openstack_dashboard/local/local_settings.py\n-            
mode=0644\n+- name: dashboard settings\n+  template: |\n+    src=opt/stack/horizon/openstack_dashboard/local/local_settings.py\n+    dest=/opt/stack/horizon/openstack_dashboard/local/local_settings.py\n+    mode=0644\n   notify:\n-    - restart apache\n+    - reload apache\n \n - name: custom horizon logo\n-  get_url: url={{ horizon.logo_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo.png\n-           mode=0644 force=yes\n+  get_url: url={{ horizon.logo_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo.png mode=0644 force=yes\n \n - name: custom horizon splash logo\n-  get_url: url={{ horizon.logo_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo-splash.png\n-           mode=0644 force=yes\n+  get_url: url={{ horizon.logo_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo-splash.png mode=0644 force=yes\n \n - name: custom horizon favicon\n-  get_url: url={{ horizon.favicon_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/favicon.ico\n-           force=yes\n+  get_url: url={{ horizon.favicon_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/favicon.ico force=yes\n \n - name: put images and fonts where apache can find them\n-  file: src=/opt/stack/horizon/openstack_dashboard/static/dashboard/{{ item }}\n-        dest=/opt/stack/horizon/static/dashboard/{{ item }}\n-        state=link\n-        owner=www-data\n-        group=www-data\n+  file: 
|","path":"roles/horizon/tasks/main.yml","position":143,"original_position":143,"commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","original_commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"j2sol","id":523287,"avatar_url":"https://avatars.githubusercontent.com/u/523287?v=3","gravatar_id":"","url":"https://api.github.com/users/j2sol","html_url":"https://github.com/j2sol","followers_url":"https://api.github.com/users/j2sol/followers","following_url":"https://api.github.com/users/j2sol/following{/other_user}","gists_url":"https://api.github.com/users/j2sol/gists{/gist_id}","starred_url":"https://api.github.com/users/j2sol/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/j2sol/subscriptions","organizations_url":"https://api.github.com/users/j2sol/orgs","repos_url":"https://api.github.com/users/j2sol/repos","events_url":"https://api.github.com/users/j2sol/events{/privacy}","received_events_url":"https://api.github.com/users/j2sol/received_events","type":"User","site_admin":false},"body":"?","created_at":"2015-01-01T01:05:34Z","updated_at":"2015-01-01T01:05:34Z","html_url":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397292","pull_request_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397292"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397292"},"pull_request":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"}}},"pull_request":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","id":26738851,"html_url":"https://github.com/blueboxgroup/ursula/pull/705","diff_url":"https://github.com/blueboxgroup/ursula/pull/705.diff","patch_url":"https://github.com/blueboxgroup/ursula/pull/705.patch","issue_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705","number":705,"state":"open","locked":false,"title":"WIP:  apache for 
loadbalancing","user":{"login":"paulczar","id":2488346,"avatar_url":"https://avatars.githubusercontent.com/u/2488346?v=3","gravatar_id":"","url":"https://api.github.com/users/paulczar","html_url":"https://github.com/paulczar","followers_url":"https://api.github.com/users/paulczar/followers","following_url":"https://api.github.com/users/paulczar/following{/other_user}","gists_url":"https://api.github.com/users/paulczar/gists{/gist_id}","starred_url":"https://api.github.com/users/paulczar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/paulczar/subscriptions","organizations_url":"https://api.github.com/users/paulczar/orgs","repos_url":"https://api.github.com/users/paulczar/repos","events_url":"https://api.github.com/users/paulczar/events{/privacy}","received_events_url":"https://api.github.com/users/paulczar/received_events","type":"User","site_admin":false},"body":"This is a quick POC / WIP to demo using apache instead of haproxy for loadbalancing our APIs.\r\n\r\nI think this gives us more flexibiltiy as we can enable in the APIs role itself ( in this case in keystone ) rather than a big monolithic haproxy.conf.      We also already have apache running for horizon, so it could reduce number of services.    apache also has better logging options that haproxy which can only log to syslog. 
","created_at":"2015-01-01T00:04:13Z","updated_at":"2015-01-01T01:05:34Z","closed_at":null,"merged_at":null,"merge_commit_sha":"9b91693f11e166c9ee53836f19697868d412bf76","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits","review_comments_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments","review_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f","head":{"label":"blueboxgroup:use_apache_for_lb","ref":"use_apache_for_lb","sha":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https
://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repo
s/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/comments/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.gi
t","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"base":{"label":"blueboxgroup:master","ref":"master","sha":"34b83c65ff0de2f8b006d8ce4f76919fe0167bbf","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users
/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"
https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/comments/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirr
or_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705"},"issue":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705"},"comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments"},"review_comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments"},"review_comment":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits"},"statuses":{"href":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f"}}}},"public":true,"created_at":"2015-01-01T01:05:34Z","org":{"id":458705,"login":"blueboxgroup","gravatar_id":"","url":"https://api.github.com/orgs/blueboxgroup","avatar_url":"https://avatars.githubusercontent.com/u/458705?"}}
{"id":"2489398243","type":"GollumEvent","actor":{"id":4620127,"login":"husathap","gravatar_id":"","url":"https://api.github.com/users/husathap","avatar_url":"https://avatars.githubusercontent.com/u/4620127?"},"repo":{"id":28579680,"name":"husathap/Inuvik","url":"https://api.github.com/repos/husathap/Inuvik"},"payload":{"pages":[{"page_name":"Tutorial-#1:-Creating-a-New-Room","title":"Tutorial #1: Creating a New Room","summary":null,"action":"created","sha":"11ee43f60ec85b1d5774e1d953b95a636a1bb0ff","html_url":"https://github.com/husathap/Inuvik/wiki/Tutorial-%231%3A-Creating-a-New-Room"}]},"public":true,"created_at":"2015-01-01T01:05:35Z"}
{"id":"2489398245","type":"GollumEvent","actor":{"id":4620127,"login":"husathap","gravatar_id":"","url":"https://api.github.com/users/husathap","avatar_url":"https://avatars.githubusercontent.com/u/4620127?"},"repo":{"id":28579680,"name":"husathap/Inuvik","url":"https://api.github.com/repos/husathap/Inuvik"},"payload":{"pages":[{"page_name":"Home","title":"Home","summary":null,"action":"created","sha":"ce6911e660816c3f4a6332848564fc52f58c63dd","html_url":"https://github.com/husathap/Inuvik/wiki/Home"}]},"public":true,"created_at":"2015-01-01T01:05:35Z"}
{"id":"2489398246","type":"PushEvent","actor":{"id":6484805,"login":"Piera","gravatar_id":"","url":"https://api.github.com/users/Piera","avatar_url":"https://avatars.githubusercontent.com/u/6484805?"},"repo":{"id":28613203,"name":"Piera/Project-U-C","url":"https://api.github.com/repos/Piera/Project-U-C"},"payload":{"push_id":536753277,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"ddf094f1c87680288341b667cefa0713155f656e","before":"7dd7b441f592a632d520a6493c91bf378de8a366","commits":[{"sha":"ddf094f1c87680288341b667cefa0713155f656e","author":{"email":"d4f798d7370ce072daf8219b0f67a9bac5ebb111@gmail.com","name":"Piera Damonte"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/Piera/Project-U-C/commits/ddf094f1c87680288341b667cefa0713155f656e"}]},"public":true,"created_at":"2015-01-01T01:05:35Z"}
{"id":"2489398247","type":"PushEvent","actor":{"id":3599988,"login":"wesdizzle","gravatar_id":"","url":"https://api.github.com/users/wesdizzle","avatar_url":"https://avatars.githubusercontent.com/u/3599988?"},"repo":{"id":28250120,"name":"wesdizzle/gagglelog","url":"https://api.github.com/repos/wesdizzle/gagglelog"},"payload":{"push_id":536753278,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d04cbec8b68d0e66cf87c078862065645e181086","before":"fc86231b5063c1b8f2ed07b8d1ae887580869fcf","commits":[{"sha":"d04cbec8b68d0e66cf87c078862065645e181086","author":{"email":"baaa01a5d45f86e3d8f7008866cf0d37bea55570@gmail.com","name":"Wesley Miller"},"message":"added Index value to Games for multiple games in a series released simultaneously","distinct":true,"url":"https://api.github.com/repos/wesdizzle/gagglelog/commits/d04cbec8b68d0e66cf87c078862065645e181086"}]},"public":true,"created_at":"2015-01-01T01:05:35Z"}
{"id":"2489398248","type":"IssueCommentEvent","actor":{"id":663212,"login":"tdas","gravatar_id":"","url":"https://api.github.com/users/tdas","avatar_url":"https://avatars.githubusercontent.com/u/663212?"},"repo":{"id":17165658,"name":"apache/spark","url":"https://api.github.com/repos/apache/spark"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/apache/spark/issues/3237","labels_url":"https://api.github.com/repos/apache/spark/issues/3237/labels{/name}","comments_url":"https://api.github.com/repos/apache/spark/issues/3237/comments","events_url":"https://api.github.com/repos/apache/spark/issues/3237/events","html_url":"https://github.com/apache/spark/pull/3237","id":48591711,"number":3237,"title":"[SPARK-3325][Streaming] Add a parameter to the method print in class DStream.","user":{"login":"watermen","id":1400819,"avatar_url":"https://avatars.githubusercontent.com/u/1400819?v=3","gravatar_id":"","url":"https://api.github.com/users/watermen","html_url":"https://github.com/watermen","followers_url":"https://api.github.com/users/watermen/followers","following_url":"https://api.github.com/users/watermen/following{/other_user}","gists_url":"https://api.github.com/users/watermen/gists{/gist_id}","starred_url":"https://api.github.com/users/watermen/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/watermen/subscriptions","organizations_url":"https://api.github.com/users/watermen/orgs","repos_url":"https://api.github.com/users/watermen/repos","events_url":"https://api.github.com/users/watermen/events{/privacy}","received_events_url":"https://api.github.com/users/watermen/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":56,"created_at":"2014-11-13T02:52:35Z","updated_at":"2015-01-01T01:05:34Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/apache/spark/pulls/3237","html_url":"https://github.com/apache/spark/pull/3237"
,"diff_url":"https://github.com/apache/spark/pull/3237.diff","patch_url":"https://github.com/apache/spark/pull/3237.patch"},"body":"I have deleted the repository with mistake, so I create a new PR. old PR:https://github.com/apache/spark/pull/2216\r\n\r\n```scala\r\ndef print(num: Int = 10)\r\n```\r\nUser can control the number of elements which to print."},"comment":{"url":"https://api.github.com/repos/apache/spark/issues/comments/68477338","html_url":"https://github.com/apache/spark/pull/3237#issuecomment-68477338","issue_url":"https://api.github.com/repos/apache/spark/issues/3237","id":68477338,"user":{"login":"tdas","id":663212,"avatar_url":"https://avatars.githubusercontent.com/u/663212?v=3","gravatar_id":"","url":"https://api.github.com/users/tdas","html_url":"https://github.com/tdas","followers_url":"https://api.github.com/users/tdas/followers","following_url":"https://api.github.com/users/tdas/following{/other_user}","gists_url":"https://api.github.com/users/tdas/gists{/gist_id}","starred_url":"https://api.github.com/users/tdas/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/tdas/subscriptions","organizations_url":"https://api.github.com/users/tdas/orgs","repos_url":"https://api.github.com/users/tdas/repos","events_url":"https://api.github.com/users/tdas/events{/privacy}","received_events_url":"https://api.github.com/users/tdas/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:05:34Z","updated_at":"2015-01-01T01:05:34Z","body":"Oops sorry, my bad. I created another merge conflict by merging another PR. Let me fix that for you."}},"public":true,"created_at":"2015-01-01T01:05:35Z","org":{"id":47359,"login":"apache","gravatar_id":"","url":"https://api.github.com/orgs/apache","avatar_url":"https://avatars.githubusercontent.com/u/47359?"}}
{"id":"2489398252","type":"PushEvent","actor":{"id":476440,"login":"sjkingo","gravatar_id":"","url":"https://api.github.com/users/sjkingo","avatar_url":"https://avatars.githubusercontent.com/u/476440?"},"repo":{"id":28647308,"name":"sjkingo/python-freshdesk","url":"https://api.github.com/repos/sjkingo/python-freshdesk"},"payload":{"push_id":536753279,"size":4,"distinct_size":4,"ref":"refs/heads/master","head":"58bac92e3df2218a325fc9237e2d9feff50fde02","before":"6d7bfadd2498b86848624affb47b921b0ef1fe9c","commits":[{"sha":"70602ce48ce709d6bef7ad009d487cca502cbc0e","author":{"email":"f16bed56189e249fe4ca8ed10a1ecae60e8ceac0@sjkwi.com.au","name":"Sam Kingston"},"message":"Handle API rate-limit gracefully","distinct":true,"url":"https://api.github.com/repos/sjkingo/python-freshdesk/commits/70602ce48ce709d6bef7ad009d487cca502cbc0e"},{"sha":"90bf419dd59a82753edc02bfe967b6dbb9bc215c","author":{"email":"f16bed56189e249fe4ca8ed10a1ecae60e8ceac0@sjkwi.com.au","name":"Sam Kingston"},"message":"Add tests for Comments","distinct":true,"url":"https://api.github.com/repos/sjkingo/python-freshdesk/commits/90bf419dd59a82753edc02bfe967b6dbb9bc215c"},{"sha":"4ecc96b5bb285f9a57df9ab46c06122847771890","author":{"email":"f16bed56189e249fe4ca8ed10a1ecae60e8ceac0@sjkwi.com.au","name":"Sam Kingston"},"message":"Add missing tests for str and repr methods on Ticket","distinct":true,"url":"https://api.github.com/repos/sjkingo/python-freshdesk/commits/4ecc96b5bb285f9a57df9ab46c06122847771890"},{"sha":"58bac92e3df2218a325fc9237e2d9feff50fde02","author":{"email":"f16bed56189e249fe4ca8ed10a1ecae60e8ceac0@sjkwi.com.au","name":"Sam Kingston"},"message":"Refactor tests to tidy","distinct":true,"url":"https://api.github.com/repos/sjkingo/python-freshdesk/commits/58bac92e3df2218a325fc9237e2d9feff50fde02"}]},"public":true,"created_at":"2015-01-01T01:05:36Z"}
{"id":"2489398254","type":"CreateEvent","actor":{"id":5226301,"login":"JoshSGman","gravatar_id":"","url":"https://api.github.com/users/JoshSGman","avatar_url":"https://avatars.githubusercontent.com/u/5226301?"},"repo":{"id":28678272,"name":"JoshSGman/itunesDataViz","url":"https://api.github.com/repos/JoshSGman/itunesDataViz"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"A visualization library for itunes data","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:05:37Z"}
{"id":"2489398255","type":"IssuesEvent","actor":{"id":108040,"login":"jamesmintram","gravatar_id":"","url":"https://api.github.com/users/jamesmintram","avatar_url":"https://avatars.githubusercontent.com/u/108040?"},"repo":{"id":28670077,"name":"jamesmintram/LoomSDK","url":"https://api.github.com/repos/jamesmintram/LoomSDK"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/jamesmintram/LoomSDK/issues/1","labels_url":"https://api.github.com/repos/jamesmintram/LoomSDK/issues/1/labels{/name}","comments_url":"https://api.github.com/repos/jamesmintram/LoomSDK/issues/1/comments","events_url":"https://api.github.com/repos/jamesmintram/LoomSDK/issues/1/events","html_url":"https://github.com/jamesmintram/LoomSDK/issues/1","id":53210283,"number":1,"title":"Retina OSX nativeStageHeight incorrect","user":{"login":"jamesmintram","id":108040,"avatar_url":"https://avatars.githubusercontent.com/u/108040?v=3","gravatar_id":"","url":"https://api.github.com/users/jamesmintram","html_url":"https://github.com/jamesmintram","followers_url":"https://api.github.com/users/jamesmintram/followers","following_url":"https://api.github.com/users/jamesmintram/following{/other_user}","gists_url":"https://api.github.com/users/jamesmintram/gists{/gist_id}","starred_url":"https://api.github.com/users/jamesmintram/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/jamesmintram/subscriptions","organizations_url":"https://api.github.com/users/jamesmintram/orgs","repos_url":"https://api.github.com/users/jamesmintram/repos","events_url":"https://api.github.com/users/jamesmintram/events{/privacy}","received_events_url":"https://api.github.com/users/jamesmintram/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:05:37Z","updated_at":"2015-01-01T01:05:37Z","closed_at":null,"body":"It appears that stage.nativeStageWidth and stage.nativeStageHeight 
do not take into account the scale factor on OSX."}},"public":true,"created_at":"2015-01-01T01:05:37Z"}
{"id":"2489398262","type":"WatchEvent","actor":{"id":117788,"login":"nyarla","gravatar_id":"","url":"https://api.github.com/users/nyarla","avatar_url":"https://avatars.githubusercontent.com/u/117788?"},"repo":{"id":15659140,"name":"clbr/urlmatch","url":"https://api.github.com/repos/clbr/urlmatch"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:05:37Z"}
{"id":"2489398266","type":"PushEvent","actor":{"id":2127465,"login":"gizmo385","gravatar_id":"","url":"https://api.github.com/users/gizmo385","avatar_url":"https://avatars.githubusercontent.com/u/2127465?"},"repo":{"id":25680223,"name":"gizmo385/LearningClojure","url":"https://api.github.com/repos/gizmo385/LearningClojure"},"payload":{"push_id":536753285,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"b183587e912c016d78339ce2a24d72561f22ea85","before":"cc88f9406f34d5a0256154003b4d9a96aa2d6428","commits":[{"sha":"32224fa783d11f07e04e908eb5be765b4dbe4db6","author":{"email":"aed2c4d01960864cfdbeee7b4c5891b1ffa98b04@gmail.com","name":"Christopher Chapline"},"message":"Updated readme","distinct":true,"url":"https://api.github.com/repos/gizmo385/LearningClojure/commits/32224fa783d11f07e04e908eb5be765b4dbe4db6"},{"sha":"b183587e912c016d78339ce2a24d72561f22ea85","author":{"email":"aed2c4d01960864cfdbeee7b4c5891b1ffa98b04@gmail.com","name":"Christopher Chapline"},"message":"New graph implementation based on protocols. SimpleGraph, Network, and Digraph implemented.","distinct":true,"url":"https://api.github.com/repos/gizmo385/LearningClojure/commits/b183587e912c016d78339ce2a24d72561f22ea85"}]},"public":true,"created_at":"2015-01-01T01:05:38Z"}
{"id":"2489398267","type":"PushEvent","actor":{"id":8941027,"login":"MarvAmBass","gravatar_id":"","url":"https://api.github.com/users/MarvAmBass","avatar_url":"https://avatars.githubusercontent.com/u/8941027?"},"repo":{"id":28630141,"name":"MarvAmBass/py-media.ccc-congress-crawler","url":"https://api.github.com/repos/MarvAmBass/py-media.ccc-congress-crawler"},"payload":{"push_id":536753286,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b2f2a15104dd3784e9ca3e3c50305f09a0c732ca","before":"7e54b606cd5632cc34efc10e7842b72eeb3205b3","commits":[{"sha":"b2f2a15104dd3784e9ca3e3c50305f09a0c732ca","author":{"email":"78cbc2e9669f4cea46806632e080ee9166740ed9@gmail.com","name":"MarvAmBass"},"message":"complete rewrite","distinct":true,"url":"https://api.github.com/repos/MarvAmBass/py-media.ccc-congress-crawler/commits/b2f2a15104dd3784e9ca3e3c50305f09a0c732ca"}]},"public":true,"created_at":"2015-01-01T01:05:38Z"}
{"id":"2489398269","type":"CreateEvent","actor":{"id":10173890,"login":"daiguangfa","gravatar_id":"","url":"https://api.github.com/users/daiguangfa","avatar_url":"https://avatars.githubusercontent.com/u/10173890?"},"repo":{"id":28678274,"name":"daiguangfa/python_tutorial","url":"https://api.github.com/repos/daiguangfa/python_tutorial"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"Python入门","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:05:40Z"}
{"id":"2489398280","type":"PullRequestEvent","actor":{"id":3489773,"login":"captainkirkby","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","avatar_url":"https://avatars.githubusercontent.com/u/3489773?"},"repo":{"id":15461243,"name":"captainkirkby/Gears","url":"https://api.github.com/repos/captainkirkby/Gears"},"payload":{"action":"closed","number":31,"pull_request":{"url":"https://api.github.com/repos/captainkirkby/Gears/pulls/31","id":26739457,"html_url":"https://github.com/captainkirkby/Gears/pull/31","diff_url":"https://github.com/captainkirkby/Gears/pull/31.diff","patch_url":"https://github.com/captainkirkby/Gears/pull/31.patch","issue_url":"https://api.github.com/repos/captainkirkby/Gears/issues/31","number":31,"state":"closed","locked":false,"title":"Add simple C program to replay binary file","user":{"login":"captainkirkby","id":3489773,"avatar_url":"https://avatars.githubusercontent.com/u/3489773?v=3","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","html_url":"https://github.com/captainkirkby","followers_url":"https://api.github.com/users/captainkirkby/followers","following_url":"https://api.github.com/users/captainkirkby/following{/other_user}","gists_url":"https://api.github.com/users/captainkirkby/gists{/gist_id}","starred_url":"https://api.github.com/users/captainkirkby/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/captainkirkby/subscriptions","organizations_url":"https://api.github.com/users/captainkirkby/orgs","repos_url":"https://api.github.com/users/captainkirkby/repos","events_url":"https://api.github.com/users/captainkirkby/events{/privacy}","received_events_url":"https://api.github.com/users/captainkirkby/received_events","type":"User","site_admin":false},"body":"Closes issue #30 
","created_at":"2015-01-01T01:05:31Z","updated_at":"2015-01-01T01:05:41Z","closed_at":"2015-01-01T01:05:41Z","merged_at":"2015-01-01T01:05:41Z","merge_commit_sha":"1937489450eb244357356ec9a4ad968f1d63e23d","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/captainkirkby/Gears/pulls/31/commits","review_comments_url":"https://api.github.com/repos/captainkirkby/Gears/pulls/31/comments","review_comment_url":"https://api.github.com/repos/captainkirkby/Gears/pulls/comments/{number}","comments_url":"https://api.github.com/repos/captainkirkby/Gears/issues/31/comments","statuses_url":"https://api.github.com/repos/captainkirkby/Gears/statuses/0ce69fa19d81de656dd6a74629099a7fa9261d1c","head":{"label":"captainkirkby:#30","ref":"#30","sha":"0ce69fa19d81de656dd6a74629099a7fa9261d1c","user":{"login":"captainkirkby","id":3489773,"avatar_url":"https://avatars.githubusercontent.com/u/3489773?v=3","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","html_url":"https://github.com/captainkirkby","followers_url":"https://api.github.com/users/captainkirkby/followers","following_url":"https://api.github.com/users/captainkirkby/following{/other_user}","gists_url":"https://api.github.com/users/captainkirkby/gists{/gist_id}","starred_url":"https://api.github.com/users/captainkirkby/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/captainkirkby/subscriptions","organizations_url":"https://api.github.com/users/captainkirkby/orgs","repos_url":"https://api.github.com/users/captainkirkby/repos","events_url":"https://api.github.com/users/captainkirkby/events{/privacy}","received_events_url":"https://api.github.com/users/captainkirkby/received_events","type":"User","site_admin":false},"repo":{"id":15461243,"name":"Gears","full_name":"captainkirkby/Gears","owner":{"login":"captainkirkby","id":3489773,"avatar_url":"https://avatars.githubusercontent.com/u/3489773?v=3","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","h
tml_url":"https://github.com/captainkirkby","followers_url":"https://api.github.com/users/captainkirkby/followers","following_url":"https://api.github.com/users/captainkirkby/following{/other_user}","gists_url":"https://api.github.com/users/captainkirkby/gists{/gist_id}","starred_url":"https://api.github.com/users/captainkirkby/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/captainkirkby/subscriptions","organizations_url":"https://api.github.com/users/captainkirkby/orgs","repos_url":"https://api.github.com/users/captainkirkby/repos","events_url":"https://api.github.com/users/captainkirkby/events{/privacy}","received_events_url":"https://api.github.com/users/captainkirkby/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/captainkirkby/Gears","description":"Set of packages used to measure a mechanical clock.","fork":false,"url":"https://api.github.com/repos/captainkirkby/Gears","forks_url":"https://api.github.com/repos/captainkirkby/Gears/forks","keys_url":"https://api.github.com/repos/captainkirkby/Gears/keys{/key_id}","collaborators_url":"https://api.github.com/repos/captainkirkby/Gears/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/captainkirkby/Gears/teams","hooks_url":"https://api.github.com/repos/captainkirkby/Gears/hooks","issue_events_url":"https://api.github.com/repos/captainkirkby/Gears/issues/events{/number}","events_url":"https://api.github.com/repos/captainkirkby/Gears/events","assignees_url":"https://api.github.com/repos/captainkirkby/Gears/assignees{/user}","branches_url":"https://api.github.com/repos/captainkirkby/Gears/branches{/branch}","tags_url":"https://api.github.com/repos/captainkirkby/Gears/tags","blobs_url":"https://api.github.com/repos/captainkirkby/Gears/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/captainkirkby/Gears/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/captainkirkby/Gears/git/refs{/sha}","trees_url":"
https://api.github.com/repos/captainkirkby/Gears/git/trees{/sha}","statuses_url":"https://api.github.com/repos/captainkirkby/Gears/statuses/{sha}","languages_url":"https://api.github.com/repos/captainkirkby/Gears/languages","stargazers_url":"https://api.github.com/repos/captainkirkby/Gears/stargazers","contributors_url":"https://api.github.com/repos/captainkirkby/Gears/contributors","subscribers_url":"https://api.github.com/repos/captainkirkby/Gears/subscribers","subscription_url":"https://api.github.com/repos/captainkirkby/Gears/subscription","commits_url":"https://api.github.com/repos/captainkirkby/Gears/commits{/sha}","git_commits_url":"https://api.github.com/repos/captainkirkby/Gears/git/commits{/sha}","comments_url":"https://api.github.com/repos/captainkirkby/Gears/comments{/number}","issue_comment_url":"https://api.github.com/repos/captainkirkby/Gears/issues/comments/{number}","contents_url":"https://api.github.com/repos/captainkirkby/Gears/contents/{+path}","compare_url":"https://api.github.com/repos/captainkirkby/Gears/compare/{base}...{head}","merges_url":"https://api.github.com/repos/captainkirkby/Gears/merges","archive_url":"https://api.github.com/repos/captainkirkby/Gears/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/captainkirkby/Gears/downloads","issues_url":"https://api.github.com/repos/captainkirkby/Gears/issues{/number}","pulls_url":"https://api.github.com/repos/captainkirkby/Gears/pulls{/number}","milestones_url":"https://api.github.com/repos/captainkirkby/Gears/milestones{/number}","notifications_url":"https://api.github.com/repos/captainkirkby/Gears/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/captainkirkby/Gears/labels{/name}","releases_url":"https://api.github.com/repos/captainkirkby/Gears/releases{/id}","created_at":"2013-12-26T22:05:51Z","updated_at":"2015-01-01T00:41:54Z","pushed_at":"2015-01-01T01:05:41Z","git_url":"git://github.com/captainkirkby/Gears.git","ssh_url":"git@github
.com:captainkirkby/Gears.git","clone_url":"https://github.com/captainkirkby/Gears.git","svn_url":"https://github.com/captainkirkby/Gears","homepage":"","size":18140,"stargazers_count":1,"watchers_count":1,"language":"C++","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":11,"forks":0,"open_issues":11,"watchers":1,"default_branch":"master"}},"base":{"label":"captainkirkby:master","ref":"master","sha":"b838f0c36403eab209f3565eeb7a10375911d228","user":{"login":"captainkirkby","id":3489773,"avatar_url":"https://avatars.githubusercontent.com/u/3489773?v=3","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","html_url":"https://github.com/captainkirkby","followers_url":"https://api.github.com/users/captainkirkby/followers","following_url":"https://api.github.com/users/captainkirkby/following{/other_user}","gists_url":"https://api.github.com/users/captainkirkby/gists{/gist_id}","starred_url":"https://api.github.com/users/captainkirkby/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/captainkirkby/subscriptions","organizations_url":"https://api.github.com/users/captainkirkby/orgs","repos_url":"https://api.github.com/users/captainkirkby/repos","events_url":"https://api.github.com/users/captainkirkby/events{/privacy}","received_events_url":"https://api.github.com/users/captainkirkby/received_events","type":"User","site_admin":false},"repo":{"id":15461243,"name":"Gears","full_name":"captainkirkby/Gears","owner":{"login":"captainkirkby","id":3489773,"avatar_url":"https://avatars.githubusercontent.com/u/3489773?v=3","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","html_url":"https://github.com/captainkirkby","followers_url":"https://api.github.com/users/captainkirkby/followers","following_url":"https://api.github.com/users/captainkirkby/following{/other_user}","gists_url":"https://api.github.com/users/captainkirkby/gists{/gist_id}","starred_ur
l":"https://api.github.com/users/captainkirkby/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/captainkirkby/subscriptions","organizations_url":"https://api.github.com/users/captainkirkby/orgs","repos_url":"https://api.github.com/users/captainkirkby/repos","events_url":"https://api.github.com/users/captainkirkby/events{/privacy}","received_events_url":"https://api.github.com/users/captainkirkby/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/captainkirkby/Gears","description":"Set of packages used to measure a mechanical clock.","fork":false,"url":"https://api.github.com/repos/captainkirkby/Gears","forks_url":"https://api.github.com/repos/captainkirkby/Gears/forks","keys_url":"https://api.github.com/repos/captainkirkby/Gears/keys{/key_id}","collaborators_url":"https://api.github.com/repos/captainkirkby/Gears/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/captainkirkby/Gears/teams","hooks_url":"https://api.github.com/repos/captainkirkby/Gears/hooks","issue_events_url":"https://api.github.com/repos/captainkirkby/Gears/issues/events{/number}","events_url":"https://api.github.com/repos/captainkirkby/Gears/events","assignees_url":"https://api.github.com/repos/captainkirkby/Gears/assignees{/user}","branches_url":"https://api.github.com/repos/captainkirkby/Gears/branches{/branch}","tags_url":"https://api.github.com/repos/captainkirkby/Gears/tags","blobs_url":"https://api.github.com/repos/captainkirkby/Gears/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/captainkirkby/Gears/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/captainkirkby/Gears/git/refs{/sha}","trees_url":"https://api.github.com/repos/captainkirkby/Gears/git/trees{/sha}","statuses_url":"https://api.github.com/repos/captainkirkby/Gears/statuses/{sha}","languages_url":"https://api.github.com/repos/captainkirkby/Gears/languages","stargazers_url":"https://api.github.com/repos/captainkirkb
y/Gears/stargazers","contributors_url":"https://api.github.com/repos/captainkirkby/Gears/contributors","subscribers_url":"https://api.github.com/repos/captainkirkby/Gears/subscribers","subscription_url":"https://api.github.com/repos/captainkirkby/Gears/subscription","commits_url":"https://api.github.com/repos/captainkirkby/Gears/commits{/sha}","git_commits_url":"https://api.github.com/repos/captainkirkby/Gears/git/commits{/sha}","comments_url":"https://api.github.com/repos/captainkirkby/Gears/comments{/number}","issue_comment_url":"https://api.github.com/repos/captainkirkby/Gears/issues/comments/{number}","contents_url":"https://api.github.com/repos/captainkirkby/Gears/contents/{+path}","compare_url":"https://api.github.com/repos/captainkirkby/Gears/compare/{base}...{head}","merges_url":"https://api.github.com/repos/captainkirkby/Gears/merges","archive_url":"https://api.github.com/repos/captainkirkby/Gears/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/captainkirkby/Gears/downloads","issues_url":"https://api.github.com/repos/captainkirkby/Gears/issues{/number}","pulls_url":"https://api.github.com/repos/captainkirkby/Gears/pulls{/number}","milestones_url":"https://api.github.com/repos/captainkirkby/Gears/milestones{/number}","notifications_url":"https://api.github.com/repos/captainkirkby/Gears/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/captainkirkby/Gears/labels{/name}","releases_url":"https://api.github.com/repos/captainkirkby/Gears/releases{/id}","created_at":"2013-12-26T22:05:51Z","updated_at":"2015-01-01T00:41:54Z","pushed_at":"2015-01-01T01:05:41Z","git_url":"git://github.com/captainkirkby/Gears.git","ssh_url":"git@github.com:captainkirkby/Gears.git","clone_url":"https://github.com/captainkirkby/Gears.git","svn_url":"https://github.com/captainkirkby/Gears","homepage":"","size":18140,"stargazers_count":1,"watchers_count":1,"language":"C++","has_issues":true,"has_downloads":true,"has_wiki":true,"has_p
ages":false,"forks_count":0,"mirror_url":null,"open_issues_count":11,"forks":0,"open_issues":11,"watchers":1,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/captainkirkby/Gears/pulls/31"},"html":{"href":"https://github.com/captainkirkby/Gears/pull/31"},"issue":{"href":"https://api.github.com/repos/captainkirkby/Gears/issues/31"},"comments":{"href":"https://api.github.com/repos/captainkirkby/Gears/issues/31/comments"},"review_comments":{"href":"https://api.github.com/repos/captainkirkby/Gears/pulls/31/comments"},"review_comment":{"href":"https://api.github.com/repos/captainkirkby/Gears/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/captainkirkby/Gears/pulls/31/commits"},"statuses":{"href":"https://api.github.com/repos/captainkirkby/Gears/statuses/0ce69fa19d81de656dd6a74629099a7fa9261d1c"}},"merged":true,"mergeable":null,"mergeable_state":"unknown","merged_by":{"login":"captainkirkby","id":3489773,"avatar_url":"https://avatars.githubusercontent.com/u/3489773?v=3","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","html_url":"https://github.com/captainkirkby","followers_url":"https://api.github.com/users/captainkirkby/followers","following_url":"https://api.github.com/users/captainkirkby/following{/other_user}","gists_url":"https://api.github.com/users/captainkirkby/gists{/gist_id}","starred_url":"https://api.github.com/users/captainkirkby/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/captainkirkby/subscriptions","organizations_url":"https://api.github.com/users/captainkirkby/orgs","repos_url":"https://api.github.com/users/captainkirkby/repos","events_url":"https://api.github.com/users/captainkirkby/events{/privacy}","received_events_url":"https://api.github.com/users/captainkirkby/received_events","type":"User","site_admin":false},"comments":0,"review_comments":0,"commits":1,"additions":129,"deletions":0,"changed_files":1}},"public":true,"created_at":"2015-01-01T
01:05:42Z"}
{"id":"2489398281","type":"PushEvent","actor":{"id":2110113,"login":"wiczerd","gravatar_id":"","url":"https://api.github.com/users/wiczerd","avatar_url":"https://avatars.githubusercontent.com/u/2110113?"},"repo":{"id":22581949,"name":"wiczerd/GKTW_empirical","url":"https://api.github.com/repos/wiczerd/GKTW_empirical"},"payload":{"push_id":536753289,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"3e6b0090163506b70aa0a443f97730d4836a743d","before":"1821290f1d7a8846cc7832431b01c14aaa777c44","commits":[{"sha":"3e6b0090163506b70aa0a443f97730d4836a743d","author":{"email":"078c0c67d55661fe08d5d1ec3da0bf82da0133d7@gmail.com","name":"David Wiczer"},"message":"changes to l_phys_neg l_phys_pos needed for where regressions","distinct":true,"url":"https://api.github.com/repos/wiczerd/GKTW_empirical/commits/3e6b0090163506b70aa0a443f97730d4836a743d"}]},"public":true,"created_at":"2015-01-01T01:05:42Z"}
{"id":"2489398282","type":"PushEvent","actor":{"id":3489773,"login":"captainkirkby","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","avatar_url":"https://avatars.githubusercontent.com/u/3489773?"},"repo":{"id":15461243,"name":"captainkirkby/Gears","url":"https://api.github.com/repos/captainkirkby/Gears"},"payload":{"push_id":536753290,"size":2,"distinct_size":1,"ref":"refs/heads/master","head":"3a977b38b570126097e52fc850332efc76fe7efe","before":"b838f0c36403eab209f3565eeb7a10375911d228","commits":[{"sha":"0ce69fa19d81de656dd6a74629099a7fa9261d1c","author":{"email":"4d1902cf1aefa3df01c59cbb9ae7db3045be42ae@gmail.com","name":"Dylan Kirkby"},"message":"Add simple C program to replay binary file","distinct":false,"url":"https://api.github.com/repos/captainkirkby/Gears/commits/0ce69fa19d81de656dd6a74629099a7fa9261d1c"},{"sha":"3a977b38b570126097e52fc850332efc76fe7efe","author":{"email":"4d1902cf1aefa3df01c59cbb9ae7db3045be42ae@gmail.com","name":"Dylan Kirkby"},"message":"Merge pull request #31 from captainkirkby/#30\n\nAdd simple C program to replay binary file","distinct":true,"url":"https://api.github.com/repos/captainkirkby/Gears/commits/3a977b38b570126097e52fc850332efc76fe7efe"}]},"public":true,"created_at":"2015-01-01T01:05:42Z"}
{"id":"2489398289","type":"PushEvent","actor":{"id":965430,"login":"waltzofpearls","gravatar_id":"","url":"https://api.github.com/users/waltzofpearls","avatar_url":"https://avatars.githubusercontent.com/u/965430?"},"repo":{"id":28505561,"name":"waltzofpearls/dotfiles","url":"https://api.github.com/repos/waltzofpearls/dotfiles"},"payload":{"push_id":536753294,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d7d714784919d48e92ed72486d1cbfd5dd4c896b","before":"d5a1f77ab903cdcf1d2ae292c7f0f259c6e32211","commits":[{"sha":"d7d714784919d48e92ed72486d1cbfd5dd4c896b","author":{"email":"c514db49330801e4e831feeacd2b70f6f55a5048@gmail.com","name":"Rollie Ma"},"message":"Changed alias d to d1 and dd to d2 to avoid possible command conflicts","distinct":true,"url":"https://api.github.com/repos/waltzofpearls/dotfiles/commits/d7d714784919d48e92ed72486d1cbfd5dd4c896b"}]},"public":true,"created_at":"2015-01-01T01:05:43Z"}
{"id":"2489398293","type":"WatchEvent","actor":{"id":4030056,"login":"alexFranka","gravatar_id":"","url":"https://api.github.com/users/alexFranka","avatar_url":"https://avatars.githubusercontent.com/u/4030056?"},"repo":{"id":5294540,"name":"Stereobit/dragend","url":"https://api.github.com/repos/Stereobit/dragend"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:05:43Z"}
{"id":"2489398296","type":"DeleteEvent","actor":{"id":3489773,"login":"captainkirkby","gravatar_id":"","url":"https://api.github.com/users/captainkirkby","avatar_url":"https://avatars.githubusercontent.com/u/3489773?"},"repo":{"id":15461243,"name":"captainkirkby/Gears","url":"https://api.github.com/repos/captainkirkby/Gears"},"payload":{"ref":"#30","ref_type":"branch","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:05:43Z"}
{"id":"2489398297","type":"CreateEvent","actor":{"id":790100,"login":"mbutterworth","gravatar_id":"","url":"https://api.github.com/users/mbutterworth","avatar_url":"https://avatars.githubusercontent.com/u/790100?"},"repo":{"id":28678199,"name":"mbutterworth/menu-test","url":"https://api.github.com/repos/mbutterworth/menu-test"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:05:43Z"}
{"id":"2489398309","type":"WatchEvent","actor":{"id":1075965,"login":"takuan-osho","gravatar_id":"","url":"https://api.github.com/users/takuan-osho","avatar_url":"https://avatars.githubusercontent.com/u/1075965?"},"repo":{"id":28081156,"name":"lexrus/VPNOn","url":"https://api.github.com/repos/lexrus/VPNOn"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:05:44Z"}
{"id":"2489398314","type":"PushEvent","actor":{"id":92735,"login":"sorear","gravatar_id":"","url":"https://api.github.com/users/sorear","avatar_url":"https://avatars.githubusercontent.com/u/92735?"},"repo":{"id":5104661,"name":"sorear/perl-DBR","url":"https://api.github.com/repos/sorear/perl-DBR"},"payload":{"push_id":536753304,"size":3,"distinct_size":0,"ref":"refs/heads/master","head":"ed1f9a08a0da68a67022b1df5e087e306a147a1c","before":"89749b9eea501807ca432473798ca70f504d1693","commits":[{"sha":"5d087526d37083ad04d5d9d830de31f8f441883c","author":{"email":"3d0f3b9ddcacec30c4008c5e030e6c13a478cb4f@gudtech.com","name":"Daniel Norman"},"message":"bugfix","distinct":false,"url":"https://api.github.com/repos/sorear/perl-DBR/commits/5d087526d37083ad04d5d9d830de31f8f441883c"},{"sha":"2d8c69c9fd8c008a2fd787b9eda342dbc0099ec9","author":{"email":"fed0578406081f3c3a132b2ffaa2b378514d6fc0@cox.net","name":"Stefan O'Rear"},"message":"Merge branch 'master' of github.com:dnorman/perl-DBR","distinct":false,"url":"https://api.github.com/repos/sorear/perl-DBR/commits/2d8c69c9fd8c008a2fd787b9eda342dbc0099ec9"},{"sha":"ed1f9a08a0da68a67022b1df5e087e306a147a1c","author":{"email":"fed0578406081f3c3a132b2ffaa2b378514d6fc0@cox.net","name":"Stefan O'Rear"},"message":"avoid generating nulls in IN-lists","distinct":false,"url":"https://api.github.com/repos/sorear/perl-DBR/commits/ed1f9a08a0da68a67022b1df5e087e306a147a1c"}]},"public":true,"created_at":"2015-01-01T01:05:45Z"}
{"id":"2489398316","type":"PushEvent","actor":{"id":280212,"login":"KenanSulayman","gravatar_id":"","url":"https://api.github.com/users/KenanSulayman","avatar_url":"https://avatars.githubusercontent.com/u/280212?"},"repo":{"id":21481110,"name":"KenanSulayman/heartbeat","url":"https://api.github.com/repos/KenanSulayman/heartbeat"},"payload":{"push_id":536753305,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"4a08cf46a835742f49c5272d70f3210529dbb819","before":"089c8f0d2bac3da1fec35e110c876455549123ae","commits":[{"sha":"4a08cf46a835742f49c5272d70f3210529dbb819","author":{"email":"9176253dfc0bc82671a5e984646605f93319147a@sly.mn","name":"Kenan Sulayman"},"message":"1420074344264\n\nYdoxe8jvlupoYjDMdaz3MuTJYDArYhC8zsnVTxc3DhA=","distinct":true,"url":"https://api.github.com/repos/KenanSulayman/heartbeat/commits/4a08cf46a835742f49c5272d70f3210529dbb819"}]},"public":true,"created_at":"2015-01-01T01:05:45Z"}
{"id":"2489398322","type":"PushEvent","actor":{"id":7282584,"login":"suhasgaddam","gravatar_id":"","url":"https://api.github.com/users/suhasgaddam","avatar_url":"https://avatars.githubusercontent.com/u/7282584?"},"repo":{"id":22023128,"name":"suhasgaddam/suhasgaddam","url":"https://api.github.com/repos/suhasgaddam/suhasgaddam"},"payload":{"push_id":536753308,"size":10,"distinct_size":1,"ref":"refs/heads/master","head":"8770d45468f7a35e3523dcd2c953e98495f7f9e1","before":"87857d97c47ccc77fddec314b222eca1c5b4c3d3","commits":[{"sha":"91a07bfa95c2dd01114091ec46b69029c5482c3a","author":{"email":"8941c16c0c424ea999586f4432f75bdae83bd66f@gmail.com","name":"Suhas Gaddam"},"message":"Update portfolio view","distinct":false,"url":"https://api.github.com/repos/suhasgaddam/suhasgaddam/commits/91a07bfa95c2dd01114091ec46b69029c5482c3a"},{"sha":"d086fe0560ede399831c0e939539048a8cf769d9","author":{"email":"8941c16c0c424ea999586f4432f75bdae83bd66f@gmail.com","name":"Suhas Gaddam"},"message":"Update ansible roles for larabook","distinct":false,"url":"https://api.github.com/repos/suhasgaddam/suhasgaddam/commits/d086fe0560ede399831c0e939539048a8cf769d9"},{"sha":"519f55acfccaff462e8d3c8b509c22e2978b6964","author":{"email":"8941c16c0c424ea999586f4432f75bdae83bd66f@gmail.com","name":"Suhas Gaddam"},"message":"Update composer dependencies","distinct":false,"url":"https://api.github.com/repos/suhasgaddam/suhasgaddam/commits/519f55acfccaff462e8d3c8b509c22e2978b6964"},{"sha":"a758b8a21b2eb691bfc6a8f7f81120c3c5ac00b4","author":{"email":"8941c16c0c424ea999586f4432f75bdae83bd66f@gmail.com","name":"Suhas Gaddam"},"message":"Update ansible roles","distinct":false,"url":"https://api.github.com/repos/suhasgaddam/suhasgaddam/commits/a758b8a21b2eb691bfc6a8f7f81120c3c5ac00b4"},{"sha":"44a91286a792f3176b23784d922ec67006ce1ae5","author":{"email":"8941c16c0c424ea999586f4432f75bdae83bd66f@gmail.com","name":"Suhas Gaddam"},"message":"Update ansible roles for larabook and 
ssl","distinct":false,"url":"https://api.github.com/repos/suhasgaddam/suhasgaddam/commits/44a91286a792f3176b23784d922ec67006ce1ae5"},{"sha":"906796e966cf00d3e4f95c725893bed23c780fe8","author":{"email":"8941c16c0c424ea999586f4432f75bdae83bd66f@gmail.com","name":"Suhas Gaddam"},"message":"Update GitHub API service class","distinct":false,"url":"https://api.github.com/repos/suhasgaddam/suhasgaddam/commits/906796e966cf00d3e4f95c725893bed23c780fe8"},{"sha":"1360cc3c364c6658990df6890ee74fa36bd0da80","author":{"email":"8941c16c0c424ea999586f4432f75bdae83bd66f@gmail.com","name":"Suhas Gaddam"},"message":"Organize ansible folder","distinct":false,"url":"https://api.github.com/repos/suhasgaddam/suhasgaddam/commits/1360cc3c364c6658990df6890ee74fa36bd0da80"},{"sha":"5fc4d906b4d59212f594ce267acceafd11b214a7","author":{"email":"8941c16c0c424ea999586f4432f75bdae83bd66f@gmail.com","name":"Suhas Gaddam"},"message":"Update ansible roles to use environment variables","distinct":false,"url":"https://api.github.com/repos/suhasgaddam/suhasgaddam/commits/5fc4d906b4d59212f594ce267acceafd11b214a7"},{"sha":"7d478f4562713035d6950734a9a92c0cfa891bb0","author":{"email":"8941c16c0c424ea999586f4432f75bdae83bd66f@gmail.com","name":"Suhas Gaddam"},"message":"Fix nginx template for www subdomain","distinct":false,"url":"https://api.github.com/repos/suhasgaddam/suhasgaddam/commits/7d478f4562713035d6950734a9a92c0cfa891bb0"},{"sha":"8770d45468f7a35e3523dcd2c953e98495f7f9e1","author":{"email":"8941c16c0c424ea999586f4432f75bdae83bd66f@gmail.com","name":"Suhas Gaddam"},"message":"Merge branch 'develop'","distinct":true,"url":"https://api.github.com/repos/suhasgaddam/suhasgaddam/commits/8770d45468f7a35e3523dcd2c953e98495f7f9e1"}]},"public":true,"created_at":"2015-01-01T01:05:47Z"}
{"id":"2489398328","type":"PushEvent","actor":{"id":3407942,"login":"pnlbwh","gravatar_id":"","url":"https://api.github.com/users/pnlbwh","avatar_url":"https://avatars.githubusercontent.com/u/3407942?"},"repo":{"id":25606127,"name":"pnlbwh/diskusage-logging","url":"https://api.github.com/repos/pnlbwh/diskusage-logging"},"payload":{"push_id":536753313,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"fee82b7c06761155df5d1bd78b5b6b485edd1923","before":"4dba9fc71445e445cbef290e486b3265ba7b283f","commits":[{"sha":"fee82b7c06761155df5d1bd78b5b6b485edd1923","author":{"email":"ea6edc91e6ce6eaff9d772be660c2fa0a7b1e60f@bwh.harvard.edu","name":"reckbo"},"message":"ENH: Add remote paths, and generic report","distinct":true,"url":"https://api.github.com/repos/pnlbwh/diskusage-logging/commits/fee82b7c06761155df5d1bd78b5b6b485edd1923"}]},"public":true,"created_at":"2015-01-01T01:05:47Z"}
{"id":"2489398330","type":"PushEvent","actor":{"id":995241,"login":"ggkuron","gravatar_id":"","url":"https://api.github.com/users/ggkuron","avatar_url":"https://avatars.githubusercontent.com/u/995241?"},"repo":{"id":12571910,"name":"ggkuron/dotfiles","url":"https://api.github.com/repos/ggkuron/dotfiles"},"payload":{"push_id":536753315,"size":6,"distinct_size":0,"ref":"refs/heads/X230","head":"09214bd8722793af81c66a913d8f72b55b48036e","before":"4e3621cd80a6ac39d4a3d069d3f7ceed47cb4670","commits":[{"sha":"b223857d2dc4d4d1be233b266c90e021c713eb4e","author":{"email":"a5d06a406de0a33fcbcafe77084f41b3871f8b1f@gmail.com","name":"ggkuron"},"message":"x230 wifi setting","distinct":false,"url":"https://api.github.com/repos/ggkuron/dotfiles/commits/b223857d2dc4d4d1be233b266c90e021c713eb4e"},{"sha":"40160aede782fbd7e6267f0ddf97b1106a67e614","author":{"email":"a5d06a406de0a33fcbcafe77084f41b3871f8b1f@gmail.com","name":"ggkuron"},"message":"migrate to xkb from xmodmap setting","distinct":false,"url":"https://api.github.com/repos/ggkuron/dotfiles/commits/40160aede782fbd7e6267f0ddf97b1106a67e614"},{"sha":"fff4016764a0d5d6129a6855e8c068b92c3f61e1","author":{"email":"a5d06a406de0a33fcbcafe77084f41b3871f8b1f@gmail.com","name":"ggkuron"},"message":"gnome-power-manager init again","distinct":false,"url":"https://api.github.com/repos/ggkuron/dotfiles/commits/fff4016764a0d5d6129a6855e8c068b92c3f61e1"},{"sha":"0dc458f8e32336cc2cc4998adbae510cfab67c0e","author":{"email":"a5d06a406de0a33fcbcafe77084f41b3871f8b1f@gmail.com","name":"ggkuron"},"message":"update vimrc :<","distinct":false,"url":"https://api.github.com/repos/ggkuron/dotfiles/commits/0dc458f8e32336cc2cc4998adbae510cfab67c0e"},{"sha":"284cc12097bb43d8f40f0b6b39b40508c01ee3cd","author":{"email":"a5d06a406de0a33fcbcafe77084f41b3871f8b1f@gmail.com","name":"ggkuron"},"message":"fix tmux copy 
pipe","distinct":false,"url":"https://api.github.com/repos/ggkuron/dotfiles/commits/284cc12097bb43d8f40f0b6b39b40508c01ee3cd"},{"sha":"09214bd8722793af81c66a913d8f72b55b48036e","author":{"email":"a5d06a406de0a33fcbcafe77084f41b3871f8b1f@gmail.com","name":"ggkuron"},"message":"gvimrc font bigger","distinct":false,"url":"https://api.github.com/repos/ggkuron/dotfiles/commits/09214bd8722793af81c66a913d8f72b55b48036e"}]},"public":true,"created_at":"2015-01-01T01:05:48Z"}
{"id":"2489398331","type":"PullRequestReviewCommentEvent","actor":{"id":706947,"login":"d3athrow","gravatar_id":"","url":"https://api.github.com/users/d3athrow","avatar_url":"https://avatars.githubusercontent.com/u/706947?"},"repo":{"id":10441188,"name":"d3athrow/vgstation13","url":"https://api.github.com/repos/d3athrow/vgstation13"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/comments/22397293","id":22397293,"diff_hunk":"@@ -8,6 +8,7 @@\n \tmax_heat_protection_temperature = FIRE_HELMET_MAX_HEAT_PROTECITON_TEMPERATURE\n \tvar/obj/machinery/camera/camera\n \tspecies_restricted = list(\"exclude\",\"Vox\")\n+\tflags = PLASMAGUARD","path":"code/modules/clothing/spacesuits/ert.dm","position":4,"original_position":4,"commit_id":"b93293990c4d927f30a1f048939d427ee591e4a6","original_commit_id":"b93293990c4d927f30a1f048939d427ee591e4a6","user":{"login":"d3athrow","id":706947,"avatar_url":"https://avatars.githubusercontent.com/u/706947?v=3","gravatar_id":"","url":"https://api.github.com/users/d3athrow","html_url":"https://github.com/d3athrow","followers_url":"https://api.github.com/users/d3athrow/followers","following_url":"https://api.github.com/users/d3athrow/following{/other_user}","gists_url":"https://api.github.com/users/d3athrow/gists{/gist_id}","starred_url":"https://api.github.com/users/d3athrow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/d3athrow/subscriptions","organizations_url":"https://api.github.com/users/d3athrow/orgs","repos_url":"https://api.github.com/users/d3athrow/repos","events_url":"https://api.github.com/users/d3athrow/events{/privacy}","received_events_url":"https://api.github.com/users/d3athrow/received_events","type":"User","site_admin":false},"body":"flages = FPRINT | TABLEPASS | HEADCOVERSEYES | BLOCKHAIR | STOPSPRESSUREDMAGE | 
PLASMAGUARD","created_at":"2015-01-01T01:05:48Z","updated_at":"2015-01-01T01:05:48Z","html_url":"https://github.com/d3athrow/vgstation13/pull/2405#discussion_r22397293","pull_request_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405","_links":{"self":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/comments/22397293"},"html":{"href":"https://github.com/d3athrow/vgstation13/pull/2405#discussion_r22397293"},"pull_request":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405"}}},"pull_request":{"url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405","id":26675841,"html_url":"https://github.com/d3athrow/vgstation13/pull/2405","diff_url":"https://github.com/d3athrow/vgstation13/pull/2405.diff","patch_url":"https://github.com/d3athrow/vgstation13/pull/2405.patch","issue_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/2405","number":2405,"state":"open","locked":false,"title":"Added PLASMAGUARD flag to some spacesuits","user":{"login":"Rei1226","id":4923426,"avatar_url":"https://avatars.githubusercontent.com/u/4923426?v=3","gravatar_id":"","url":"https://api.github.com/users/Rei1226","html_url":"https://github.com/Rei1226","followers_url":"https://api.github.com/users/Rei1226/followers","following_url":"https://api.github.com/users/Rei1226/following{/other_user}","gists_url":"https://api.github.com/users/Rei1226/gists{/gist_id}","starred_url":"https://api.github.com/users/Rei1226/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Rei1226/subscriptions","organizations_url":"https://api.github.com/users/Rei1226/orgs","repos_url":"https://api.github.com/users/Rei1226/repos","events_url":"https://api.github.com/users/Rei1226/events{/privacy}","received_events_url":"https://api.github.com/users/Rei1226/received_events","type":"User","site_admin":false},"body":"Added the PLASMAGUARD flag to ERT suits, deathsquad suits, and CE/Atmos suits as requested in 
\r\n\r\nhttps://github.com/d3athrow/vgstation13/issues/2369","created_at":"2014-12-30T07:18:28Z","updated_at":"2015-01-01T01:05:48Z","closed_at":null,"merged_at":null,"merge_commit_sha":"fff34ea0a38796d850e3f5aba53410e1b7bde9c8","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405/commits","review_comments_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405/comments","review_comment_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/comments/{number}","comments_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/2405/comments","statuses_url":"https://api.github.com/repos/d3athrow/vgstation13/statuses/b93293990c4d927f30a1f048939d427ee591e4a6","head":{"label":"Rei1226:ratdicks","ref":"ratdicks","sha":"b93293990c4d927f30a1f048939d427ee591e4a6","user":{"login":"Rei1226","id":4923426,"avatar_url":"https://avatars.githubusercontent.com/u/4923426?v=3","gravatar_id":"","url":"https://api.github.com/users/Rei1226","html_url":"https://github.com/Rei1226","followers_url":"https://api.github.com/users/Rei1226/followers","following_url":"https://api.github.com/users/Rei1226/following{/other_user}","gists_url":"https://api.github.com/users/Rei1226/gists{/gist_id}","starred_url":"https://api.github.com/users/Rei1226/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Rei1226/subscriptions","organizations_url":"https://api.github.com/users/Rei1226/orgs","repos_url":"https://api.github.com/users/Rei1226/repos","events_url":"https://api.github.com/users/Rei1226/events{/privacy}","received_events_url":"https://api.github.com/users/Rei1226/received_events","type":"User","site_admin":false},"repo":{"id":19230658,"name":"vgstation13","full_name":"Rei1226/vgstation13","owner":{"login":"Rei1226","id":4923426,"avatar_url":"https://avatars.githubusercontent.com/u/4923426?v=3","gravatar_id":"","url":"https://api.github.com/users/Rei1226","html_url":"https://github.com/Rei1226","f
ollowers_url":"https://api.github.com/users/Rei1226/followers","following_url":"https://api.github.com/users/Rei1226/following{/other_user}","gists_url":"https://api.github.com/users/Rei1226/gists{/gist_id}","starred_url":"https://api.github.com/users/Rei1226/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Rei1226/subscriptions","organizations_url":"https://api.github.com/users/Rei1226/orgs","repos_url":"https://api.github.com/users/Rei1226/repos","events_url":"https://api.github.com/users/Rei1226/events{/privacy}","received_events_url":"https://api.github.com/users/Rei1226/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/Rei1226/vgstation13","description":"This is the vgstation's fork of baystation12's code.","fork":true,"url":"https://api.github.com/repos/Rei1226/vgstation13","forks_url":"https://api.github.com/repos/Rei1226/vgstation13/forks","keys_url":"https://api.github.com/repos/Rei1226/vgstation13/keys{/key_id}","collaborators_url":"https://api.github.com/repos/Rei1226/vgstation13/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/Rei1226/vgstation13/teams","hooks_url":"https://api.github.com/repos/Rei1226/vgstation13/hooks","issue_events_url":"https://api.github.com/repos/Rei1226/vgstation13/issues/events{/number}","events_url":"https://api.github.com/repos/Rei1226/vgstation13/events","assignees_url":"https://api.github.com/repos/Rei1226/vgstation13/assignees{/user}","branches_url":"https://api.github.com/repos/Rei1226/vgstation13/branches{/branch}","tags_url":"https://api.github.com/repos/Rei1226/vgstation13/tags","blobs_url":"https://api.github.com/repos/Rei1226/vgstation13/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/Rei1226/vgstation13/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/Rei1226/vgstation13/git/refs{/sha}","trees_url":"https://api.github.com/repos/Rei1226/vgstation13/git/trees{/sha}","statuses_url":"https://api.github
.com/repos/Rei1226/vgstation13/statuses/{sha}","languages_url":"https://api.github.com/repos/Rei1226/vgstation13/languages","stargazers_url":"https://api.github.com/repos/Rei1226/vgstation13/stargazers","contributors_url":"https://api.github.com/repos/Rei1226/vgstation13/contributors","subscribers_url":"https://api.github.com/repos/Rei1226/vgstation13/subscribers","subscription_url":"https://api.github.com/repos/Rei1226/vgstation13/subscription","commits_url":"https://api.github.com/repos/Rei1226/vgstation13/commits{/sha}","git_commits_url":"https://api.github.com/repos/Rei1226/vgstation13/git/commits{/sha}","comments_url":"https://api.github.com/repos/Rei1226/vgstation13/comments{/number}","issue_comment_url":"https://api.github.com/repos/Rei1226/vgstation13/issues/comments/{number}","contents_url":"https://api.github.com/repos/Rei1226/vgstation13/contents/{+path}","compare_url":"https://api.github.com/repos/Rei1226/vgstation13/compare/{base}...{head}","merges_url":"https://api.github.com/repos/Rei1226/vgstation13/merges","archive_url":"https://api.github.com/repos/Rei1226/vgstation13/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/Rei1226/vgstation13/downloads","issues_url":"https://api.github.com/repos/Rei1226/vgstation13/issues{/number}","pulls_url":"https://api.github.com/repos/Rei1226/vgstation13/pulls{/number}","milestones_url":"https://api.github.com/repos/Rei1226/vgstation13/milestones{/number}","notifications_url":"https://api.github.com/repos/Rei1226/vgstation13/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/Rei1226/vgstation13/labels{/name}","releases_url":"https://api.github.com/repos/Rei1226/vgstation13/releases{/id}","created_at":"2014-04-28T07:36:48Z","updated_at":"2014-12-30T08:33:17Z","pushed_at":"2014-12-30T08:33:10Z","git_url":"git://github.com/Rei1226/vgstation13.git","ssh_url":"git@github.com:Rei1226/vgstation13.git","clone_url":"https://github.com/Rei1226/vgstation13.git","svn_url":"ht
tps://github.com/Rei1226/vgstation13","homepage":"","size":722996,"stargazers_count":0,"watchers_count":0,"language":"DM","has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"d3athrow:Bleeding-Edge","ref":"Bleeding-Edge","sha":"ea27b58dbac4fdb65119b09648f3f4f2395125de","user":{"login":"d3athrow","id":706947,"avatar_url":"https://avatars.githubusercontent.com/u/706947?v=3","gravatar_id":"","url":"https://api.github.com/users/d3athrow","html_url":"https://github.com/d3athrow","followers_url":"https://api.github.com/users/d3athrow/followers","following_url":"https://api.github.com/users/d3athrow/following{/other_user}","gists_url":"https://api.github.com/users/d3athrow/gists{/gist_id}","starred_url":"https://api.github.com/users/d3athrow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/d3athrow/subscriptions","organizations_url":"https://api.github.com/users/d3athrow/orgs","repos_url":"https://api.github.com/users/d3athrow/repos","events_url":"https://api.github.com/users/d3athrow/events{/privacy}","received_events_url":"https://api.github.com/users/d3athrow/received_events","type":"User","site_admin":false},"repo":{"id":10441188,"name":"vgstation13","full_name":"d3athrow/vgstation13","owner":{"login":"d3athrow","id":706947,"avatar_url":"https://avatars.githubusercontent.com/u/706947?v=3","gravatar_id":"","url":"https://api.github.com/users/d3athrow","html_url":"https://github.com/d3athrow","followers_url":"https://api.github.com/users/d3athrow/followers","following_url":"https://api.github.com/users/d3athrow/following{/other_user}","gists_url":"https://api.github.com/users/d3athrow/gists{/gist_id}","starred_url":"https://api.github.com/users/d3athrow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/d3athrow/subscriptions","organizations_url":"https://api.githu
b.com/users/d3athrow/orgs","repos_url":"https://api.github.com/users/d3athrow/repos","events_url":"https://api.github.com/users/d3athrow/events{/privacy}","received_events_url":"https://api.github.com/users/d3athrow/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/d3athrow/vgstation13","description":"This is the vgstation's fork of baystation12's code.","fork":true,"url":"https://api.github.com/repos/d3athrow/vgstation13","forks_url":"https://api.github.com/repos/d3athrow/vgstation13/forks","keys_url":"https://api.github.com/repos/d3athrow/vgstation13/keys{/key_id}","collaborators_url":"https://api.github.com/repos/d3athrow/vgstation13/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/d3athrow/vgstation13/teams","hooks_url":"https://api.github.com/repos/d3athrow/vgstation13/hooks","issue_events_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/events{/number}","events_url":"https://api.github.com/repos/d3athrow/vgstation13/events","assignees_url":"https://api.github.com/repos/d3athrow/vgstation13/assignees{/user}","branches_url":"https://api.github.com/repos/d3athrow/vgstation13/branches{/branch}","tags_url":"https://api.github.com/repos/d3athrow/vgstation13/tags","blobs_url":"https://api.github.com/repos/d3athrow/vgstation13/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/d3athrow/vgstation13/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/d3athrow/vgstation13/git/refs{/sha}","trees_url":"https://api.github.com/repos/d3athrow/vgstation13/git/trees{/sha}","statuses_url":"https://api.github.com/repos/d3athrow/vgstation13/statuses/{sha}","languages_url":"https://api.github.com/repos/d3athrow/vgstation13/languages","stargazers_url":"https://api.github.com/repos/d3athrow/vgstation13/stargazers","contributors_url":"https://api.github.com/repos/d3athrow/vgstation13/contributors","subscribers_url":"https://api.github.com/repos/d3athrow/vgstation13/subscribers","su
bscription_url":"https://api.github.com/repos/d3athrow/vgstation13/subscription","commits_url":"https://api.github.com/repos/d3athrow/vgstation13/commits{/sha}","git_commits_url":"https://api.github.com/repos/d3athrow/vgstation13/git/commits{/sha}","comments_url":"https://api.github.com/repos/d3athrow/vgstation13/comments{/number}","issue_comment_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/comments/{number}","contents_url":"https://api.github.com/repos/d3athrow/vgstation13/contents/{+path}","compare_url":"https://api.github.com/repos/d3athrow/vgstation13/compare/{base}...{head}","merges_url":"https://api.github.com/repos/d3athrow/vgstation13/merges","archive_url":"https://api.github.com/repos/d3athrow/vgstation13/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/d3athrow/vgstation13/downloads","issues_url":"https://api.github.com/repos/d3athrow/vgstation13/issues{/number}","pulls_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls{/number}","milestones_url":"https://api.github.com/repos/d3athrow/vgstation13/milestones{/number}","notifications_url":"https://api.github.com/repos/d3athrow/vgstation13/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/d3athrow/vgstation13/labels{/name}","releases_url":"https://api.github.com/repos/d3athrow/vgstation13/releases{/id}","created_at":"2013-06-02T19:39:54Z","updated_at":"2014-12-31T20:06:46Z","pushed_at":"2015-01-01T01:04:27Z","git_url":"git://github.com/d3athrow/vgstation13.git","ssh_url":"git@github.com:d3athrow/vgstation13.git","clone_url":"https://github.com/d3athrow/vgstation13.git","svn_url":"https://github.com/d3athrow/vgstation13","homepage":"","size":937605,"stargazers_count":45,"watchers_count":45,"language":"DM","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":135,"mirror_url":null,"open_issues_count":259,"forks":135,"open_issues":259,"watchers":45,"default_branch":"master"}},"_links":{"self":{"hr
ef":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405"},"html":{"href":"https://github.com/d3athrow/vgstation13/pull/2405"},"issue":{"href":"https://api.github.com/repos/d3athrow/vgstation13/issues/2405"},"comments":{"href":"https://api.github.com/repos/d3athrow/vgstation13/issues/2405/comments"},"review_comments":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405/comments"},"review_comment":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405/commits"},"statuses":{"href":"https://api.github.com/repos/d3athrow/vgstation13/statuses/b93293990c4d927f30a1f048939d427ee591e4a6"}}}},"public":true,"created_at":"2015-01-01T01:05:48Z"}
{"id":"2489398337","type":"IssuesEvent","actor":{"id":726063,"login":"coder543","gravatar_id":"","url":"https://api.github.com/users/coder543","avatar_url":"https://avatars.githubusercontent.com/u/726063?"},"repo":{"id":12176600,"name":"AngryLawyer/rust-sdl2","url":"https://api.github.com/repos/AngryLawyer/rust-sdl2"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/AngryLawyer/rust-sdl2/issues/248","labels_url":"https://api.github.com/repos/AngryLawyer/rust-sdl2/issues/248/labels{/name}","comments_url":"https://api.github.com/repos/AngryLawyer/rust-sdl2/issues/248/comments","events_url":"https://api.github.com/repos/AngryLawyer/rust-sdl2/issues/248/events","html_url":"https://github.com/AngryLawyer/rust-sdl2/issues/248","id":53210284,"number":248,"title":"Unneccessary line in demo.rs?","user":{"login":"coder543","id":726063,"avatar_url":"https://avatars.githubusercontent.com/u/726063?v=3","gravatar_id":"","url":"https://api.github.com/users/coder543","html_url":"https://github.com/coder543","followers_url":"https://api.github.com/users/coder543/followers","following_url":"https://api.github.com/users/coder543/following{/other_user}","gists_url":"https://api.github.com/users/coder543/gists{/gist_id}","starred_url":"https://api.github.com/users/coder543/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/coder543/subscriptions","organizations_url":"https://api.github.com/users/coder543/orgs","repos_url":"https://api.github.com/users/coder543/repos","events_url":"https://api.github.com/users/coder543/events{/privacy}","received_events_url":"https://api.github.com/users/coder543/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:05:48Z","updated_at":"2015-01-01T01:05:48Z","closed_at":null,"body":"[This line of 
code](https://github.com/AngryLawyer/rust-sdl2/blob/84e67fbece4c9f92fd5635b19805eb47f271c432/examples/demo.rs#L30) doesn't seem to accomplish anything. In fact, I think the whole inner 'event loop could probably be done away with, just based on playing with the code a little. Could someone with more experience explain to me why that inner loop is there, and what line 30 is accomplishing? I'm really new to Rust, so I may just be missing something."}},"public":true,"created_at":"2015-01-01T01:05:48Z"}
{"id":"2489398342","type":"IssueCommentEvent","actor":{"id":49391,"login":"myronmarston","gravatar_id":"","url":"https://api.github.com/users/myronmarston","avatar_url":"https://avatars.githubusercontent.com/u/49391?"},"repo":{"id":238983,"name":"rspec/rspec-mocks","url":"https://api.github.com/repos/rspec/rspec-mocks"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/rspec/rspec-mocks/issues/854","labels_url":"https://api.github.com/repos/rspec/rspec-mocks/issues/854/labels{/name}","comments_url":"https://api.github.com/repos/rspec/rspec-mocks/issues/854/comments","events_url":"https://api.github.com/repos/rspec/rspec-mocks/issues/854/events","html_url":"https://github.com/rspec/rspec-mocks/issues/854","id":53194690,"number":854,"title":"mock_of? to check types on doubles (to avoid unnecessary coercions)","user":{"login":"maxlinc","id":896878,"avatar_url":"https://avatars.githubusercontent.com/u/896878?v=3","gravatar_id":"","url":"https://api.github.com/users/maxlinc","html_url":"https://github.com/maxlinc","followers_url":"https://api.github.com/users/maxlinc/followers","following_url":"https://api.github.com/users/maxlinc/following{/other_user}","gists_url":"https://api.github.com/users/maxlinc/gists{/gist_id}","starred_url":"https://api.github.com/users/maxlinc/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/maxlinc/subscriptions","organizations_url":"https://api.github.com/users/maxlinc/orgs","repos_url":"https://api.github.com/users/maxlinc/repos","events_url":"https://api.github.com/users/maxlinc/events{/privacy}","received_events_url":"https://api.github.com/users/maxlinc/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":5,"created_at":"2014-12-31T17:42:16Z","updated_at":"2015-01-01T01:05:50Z","closed_at":null,"body":"I have a feature request similar to #794 (instance_double not matching the same class it is mocking) but 
I have a more specific use-case and solving for it doesn't necessary require stubbing `#===`.\r\n\r\nThere are many Ruby gems that support type coercion, like:\r\n- https://github.com/intridea/hashie#coercion\r\n- https://github.com/solnic/virtus\r\n- https://github.com/solnic/coercible\r\n- https://github.com/apotonick/representable#coercion\r\n\r\nI believe they all do a type check to avoid unnecessary coercions. In the case of Hashie, coercion is skipped if the value is already the target class:\r\n\r\n```ruby\r\n  it 'skips unnecessary coercions' do\r\n      subject.coerce_key :foo, Coercable\r\n\r\n      object = Coercable.new('bar')\r\n      instance[:foo] = object\r\n      expect(instance[:foo]).to eq(object)\r\n    end\r\n```\r\n\r\nHowever, if the value is an double of the target class than it will be coerced:\r\n```ruby\r\n    it 'skips unnecessary coercions (RSpec instance_double)' do\r\n      subject.coerce_key :foo, Coercable\r\n\r\n      object = instance_double(Coercable)\r\n      instance[:foo] = object\r\n      expect(instance[:foo]).to eq(object)\r\n    end\r\n```\r\n\r\n```\r\nFailures:\r\n\r\n  1) Hashie::Extensions::Coercion#coerce_key skips unnecessary coercions (RSpec instance_double)\r\n     Failure/Error: expect(instance[:foo]).to eq(object)\r\n\r\n       expected: #<RSpec::Mocks::InstanceVerifyingDouble:0x3fe5cdd89080 @name=\"Coercable (instance)\">\r\n            got: #<Coercable:0x007fcb9bb11de0 @coerced=true, @value=\"RSpec::Mocks::InstanceVerifyingDouble\">\r\n\r\n       (compared using ==)\r\n\r\n       Diff:\r\n       @@ -1,2 +1,4 @@\r\n       -#<RSpec::Mocks::InstanceVerifyingDouble:0x3fe5cdd89080 @name=\"Coercable (instance)\">\r\n       +#<Coercable:0x007fcb9bb11de0\r\n       + @coerced=true,\r\n       + @value=\"RSpec::Mocks::InstanceVerifyingDouble\">\r\n```\r\n\r\nI'd like to be able to avoid that coercion. 
Rather than stubbing `#kind_of?` or `#===` something like `#mock_of?` that behaves similar to `#kind_of?` on the doubled class would be useful."},"comment":{"url":"https://api.github.com/repos/rspec/rspec-mocks/issues/comments/68477339","html_url":"https://github.com/rspec/rspec-mocks/issues/854#issuecomment-68477339","issue_url":"https://api.github.com/repos/rspec/rspec-mocks/issues/854","id":68477339,"user":{"login":"myronmarston","id":49391,"avatar_url":"https://avatars.githubusercontent.com/u/49391?v=3","gravatar_id":"","url":"https://api.github.com/users/myronmarston","html_url":"https://github.com/myronmarston","followers_url":"https://api.github.com/users/myronmarston/followers","following_url":"https://api.github.com/users/myronmarston/following{/other_user}","gists_url":"https://api.github.com/users/myronmarston/gists{/gist_id}","starred_url":"https://api.github.com/users/myronmarston/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/myronmarston/subscriptions","organizations_url":"https://api.github.com/users/myronmarston/orgs","repos_url":"https://api.github.com/users/myronmarston/repos","events_url":"https://api.github.com/users/myronmarston/events{/privacy}","received_events_url":"https://api.github.com/users/myronmarston/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:05:50Z","updated_at":"2015-01-01T01:05:50Z","body":"> I'd appreciate a method to find out what is being doubled (`@doubled_module.const_to_replace`). It's not public, so right now I can only find out via monkeypatching or instance_variable_get.\r\n\r\nI definitely want to provide an API for your use.  One possibility is what is being added in #832, although as a callback API that might not fit your needs.  
We could also add something like `doubled_module` to verifying doubles, although that has a couple of issues:\r\n\r\n* The doubled module may not be loaded, so it would have to return `nil` in that case which gives you no information.\r\n* As I mentioned above, I want to limit the number of built-in methods defined on doubles.\r\n\r\nI'm thinking that we may want to go a more functional route where you would call `RSpec::Mocks.doubled_module_for(dbl)` instead.  (That would solve the latter problem).  For the former problem, we may want to make the API return a module reference (similar to what #832 is going) instead of the actual module.  But then we should call the method something different.\r\n\r\nWhat would meet your needs?"}},"public":true,"created_at":"2015-01-01T01:05:50Z","org":{"id":22388,"login":"rspec","gravatar_id":"","url":"https://api.github.com/orgs/rspec","avatar_url":"https://avatars.githubusercontent.com/u/22388?"}}
{"id":"2489398345","type":"IssueCommentEvent","actor":{"id":8890867,"login":"willgabriel","gravatar_id":"","url":"https://api.github.com/users/willgabriel","avatar_url":"https://avatars.githubusercontent.com/u/8890867?"},"repo":{"id":28678195,"name":"TTMTT/iCL0udin","url":"https://api.github.com/repos/TTMTT/iCL0udin"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1","labels_url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1/labels{/name}","comments_url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1/comments","events_url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1/events","html_url":"https://github.com/TTMTT/iCL0udin/issues/1","id":53210206,"number":1,"title":"Discuss1","user":{"login":"TTMTT","id":6964047,"avatar_url":"https://avatars.githubusercontent.com/u/6964047?v=3","gravatar_id":"","url":"https://api.github.com/users/TTMTT","html_url":"https://github.com/TTMTT","followers_url":"https://api.github.com/users/TTMTT/followers","following_url":"https://api.github.com/users/TTMTT/following{/other_user}","gists_url":"https://api.github.com/users/TTMTT/gists{/gist_id}","starred_url":"https://api.github.com/users/TTMTT/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/TTMTT/subscriptions","organizations_url":"https://api.github.com/users/TTMTT/orgs","repos_url":"https://api.github.com/users/TTMTT/repos","events_url":"https://api.github.com/users/TTMTT/events{/privacy}","received_events_url":"https://api.github.com/users/TTMTT/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2015-01-01T01:02:34Z","updated_at":"2015-01-01T01:05:51Z","closed_at":null,"body":"Now you can download vresion 1.0 from :\r\n---------------------------------------------------\r\nhttp://www.icloudin.net\r\n-----------------------------\r\nWow, ipod touch 5G (8.1) - iCL0udin v1.0 bypass 
activation (icloud)\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/tZmEdlDGNu4\r\n--------------------------------------\r\niCL0udin v1.0 bypass activation (icloud) - ipad mini 2G (7.1.1)\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/tevYyBN2QCQ\r\n---------------------------------------\r\nVideo for bypass icloud (iCL0udin v1.0) for iphone 4 CDMA ..\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/i85-D6N2YLk\r\n-------------------------------------\r\nNew video for iCL0udin v1.0 bypass icloud (3 iphones 7.1.2):\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/p51TNlCr7ug\r\n-------------------------------------\r\niCL0udin v1.0 -> %100\r\n----------------------------\r\nRemaining: %3 testing with some people..\r\n-----------------------------------------------------\r\nLast Method:\r\n-----------------\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any ios)\r\nmethod 3 : via (change some string by hex on ELF file << some times i got error)\r\nmethod 4 : via (use apple ssl cert or real ssl in server and change some string in iphone)\r\niCL0udin v1.0 have this method:\r\n-----------------------------------------\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any 
ios)"},"comment":{"url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/comments/68477341","html_url":"https://github.com/TTMTT/iCL0udin/issues/1#issuecomment-68477341","issue_url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1","id":68477341,"user":{"login":"willgabriel","id":8890867,"avatar_url":"https://avatars.githubusercontent.com/u/8890867?v=3","gravatar_id":"","url":"https://api.github.com/users/willgabriel","html_url":"https://github.com/willgabriel","followers_url":"https://api.github.com/users/willgabriel/followers","following_url":"https://api.github.com/users/willgabriel/following{/other_user}","gists_url":"https://api.github.com/users/willgabriel/gists{/gist_id}","starred_url":"https://api.github.com/users/willgabriel/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/willgabriel/subscriptions","organizations_url":"https://api.github.com/users/willgabriel/orgs","repos_url":"https://api.github.com/users/willgabriel/repos","events_url":"https://api.github.com/users/willgabriel/events{/privacy}","received_events_url":"https://api.github.com/users/willgabriel/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:05:50Z","updated_at":"2015-01-01T01:05:50Z","body":"ok bro"}},"public":true,"created_at":"2015-01-01T01:05:51Z"}
{"id":"2489398347","type":"PushEvent","actor":{"id":8323759,"login":"MozillaPootleL10nBot","gravatar_id":"","url":"https://api.github.com/users/MozillaPootleL10nBot","avatar_url":"https://avatars.githubusercontent.com/u/8323759?"},"repo":{"id":6078190,"name":"translate/mozilla-lang","url":"https://api.github.com/repos/translate/mozilla-lang"},"payload":{"push_id":536753320,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f468205040a01ee5ffed377ec4f2b2a6be35c687","before":"2df4901774321d656e6e60150051a66dc87cefcb","commits":[{"sha":"f468205040a01ee5ffed377ec4f2b2a6be35c687","author":{"email":"f02c4b7f151600c94fb4d6f03844f716aeaa6d62@translate.org.za","name":"Mozilla Pootle L10n Robot"},"message":"[son] pull from Pootle","distinct":true,"url":"https://api.github.com/repos/translate/mozilla-lang/commits/f468205040a01ee5ffed377ec4f2b2a6be35c687"}]},"public":true,"created_at":"2015-01-01T01:05:51Z","org":{"id":1538178,"login":"translate","gravatar_id":"","url":"https://api.github.com/orgs/translate","avatar_url":"https://avatars.githubusercontent.com/u/1538178?"}}
{"id":"2489398355","type":"PushEvent","actor":{"id":506010,"login":"gabeshaughnessy","gravatar_id":"","url":"https://api.github.com/users/gabeshaughnessy","avatar_url":"https://avatars.githubusercontent.com/u/506010?"},"repo":{"id":13913264,"name":"gabeshaughnessy/augmentedart","url":"https://api.github.com/repos/gabeshaughnessy/augmentedart"},"payload":{"push_id":536753322,"size":1,"distinct_size":1,"ref":"refs/heads/dungeon-hacker","head":"1855adda47047b9a781de334f4616c312ec65dc6","before":"f1d6efa16b35cfe98b4ee3e54c3f333f87612fa1","commits":[{"sha":"1855adda47047b9a781de334f4616c312ec65dc6","author":{"email":"a2b2bb6e7f1b10ac88b326d5c10e33af6a8546bc@gmail.com","name":"gabeshaughnessy"},"message":"task list","distinct":true,"url":"https://api.github.com/repos/gabeshaughnessy/augmentedart/commits/1855adda47047b9a781de334f4616c312ec65dc6"}]},"public":true,"created_at":"2015-01-01T01:05:53Z"}
{"id":"2489398362","type":"GollumEvent","actor":{"id":10245688,"login":"SunyataZero","gravatar_id":"","url":"https://api.github.com/users/SunyataZero","avatar_url":"https://avatars.githubusercontent.com/u/10245688?"},"repo":{"id":28485643,"name":"EmpathyApp/EmpathyApp","url":"https://api.github.com/repos/EmpathyApp/EmpathyApp"},"payload":{"pages":[{"page_name":"Design-tools","title":"Design tools","summary":null,"action":"edited","sha":"39fe159c9630870c8f3da7f55774c6ea773d45be","html_url":"https://github.com/EmpathyApp/EmpathyApp/wiki/Design-tools"}]},"public":true,"created_at":"2015-01-01T01:05:54Z","org":{"id":10245750,"login":"EmpathyApp","gravatar_id":"","url":"https://api.github.com/orgs/EmpathyApp","avatar_url":"https://avatars.githubusercontent.com/u/10245750?"}}
{"id":"2489398364","type":"CreateEvent","actor":{"id":6955935,"login":"wfrizzell","gravatar_id":"","url":"https://api.github.com/users/wfrizzell","avatar_url":"https://avatars.githubusercontent.com/u/6955935?"},"repo":{"id":28678275,"name":"wfrizzell/Completed-Target-Model-Table-Documentation","url":"https://api.github.com/repos/wfrizzell/Completed-Target-Model-Table-Documentation"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:05:55Z"}
{"id":"2489398368","type":"PushEvent","actor":{"id":486234,"login":"dubinsky","gravatar_id":"","url":"https://api.github.com/users/dubinsky","avatar_url":"https://avatars.githubusercontent.com/u/486234?"},"repo":{"id":28631502,"name":"dubinsky/19-kislev-archive","url":"https://api.github.com/repos/dubinsky/19-kislev-archive"},"payload":{"push_id":536753326,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"c805962cac1cf5f6d5f408079c05213ed0d738a8","before":"34816ca67b9ed5364ea6e0bfeaacd594ac89e04f","commits":[{"sha":"c805962cac1cf5f6d5f408079c05213ed0d738a8","author":{"email":"1ca4b28513c5e015ce705bdc97bba1a9e4624b16@podval.org","name":"Leonid Dubinsky"},"message":"Sync.","distinct":true,"url":"https://api.github.com/repos/dubinsky/19-kislev-archive/commits/c805962cac1cf5f6d5f408079c05213ed0d738a8"}]},"public":true,"created_at":"2015-01-01T01:05:56Z"}
{"id":"2489398369","type":"PushEvent","actor":{"id":698770,"login":"johnnovak","gravatar_id":"","url":"https://api.github.com/users/johnnovak","avatar_url":"https://avatars.githubusercontent.com/u/698770?"},"repo":{"id":17473666,"name":"johnnovak/dotfiles","url":"https://api.github.com/repos/johnnovak/dotfiles"},"payload":{"push_id":536753327,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"a84040736d0e942689cd5444100dc91ae7661ba8","before":"c03d592c8fa1a6638cce9d972cfdb65ad89f26e6","commits":[{"sha":"a84040736d0e942689cd5444100dc91ae7661ba8","author":{"email":"a51dda7c7ff50b61eaea0444371f4a6a9301e501@johnnovak.net","name":"John Novak"},"message":"vimrc: cleanup","distinct":true,"url":"https://api.github.com/repos/johnnovak/dotfiles/commits/a84040736d0e942689cd5444100dc91ae7661ba8"}]},"public":true,"created_at":"2015-01-01T01:05:56Z"}
{"id":"2489398370","type":"CommitCommentEvent","actor":{"id":1497508,"login":"simon816","gravatar_id":"","url":"https://api.github.com/users/simon816","avatar_url":"https://avatars.githubusercontent.com/u/1497508?"},"repo":{"id":23774298,"name":"SpongePowered/Sponge","url":"https://api.github.com/repos/SpongePowered/Sponge"},"payload":{"comment":{"url":"https://api.github.com/repos/SpongePowered/Sponge/comments/9131367","html_url":"https://github.com/SpongePowered/Sponge/commit/b0c96c3f67ffd4830420b7c62edd8db816fc3d64#commitcomment-9131367","id":9131367,"user":{"login":"simon816","id":1497508,"avatar_url":"https://avatars.githubusercontent.com/u/1497508?v=3","gravatar_id":"","url":"https://api.github.com/users/simon816","html_url":"https://github.com/simon816","followers_url":"https://api.github.com/users/simon816/followers","following_url":"https://api.github.com/users/simon816/following{/other_user}","gists_url":"https://api.github.com/users/simon816/gists{/gist_id}","starred_url":"https://api.github.com/users/simon816/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/simon816/subscriptions","organizations_url":"https://api.github.com/users/simon816/orgs","repos_url":"https://api.github.com/users/simon816/repos","events_url":"https://api.github.com/users/simon816/events{/privacy}","received_events_url":"https://api.github.com/users/simon816/received_events","type":"User","site_admin":false},"position":130,"line":176,"path":"src/main/java/org/spongepowered/mod/registry/SpongeGameRegistry.java","commit_id":"b0c96c3f67ffd4830420b7c62edd8db816fc3d64","created_at":"2015-01-01T01:05:55Z","updated_at":"2015-01-01T01:05:55Z","body":"This should be `ARMOR_STAND`"}},"public":true,"created_at":"2015-01-01T01:05:55Z","org":{"id":8683473,"login":"SpongePowered","gravatar_id":"","url":"https://api.github.com/orgs/SpongePowered","avatar_url":"https://avatars.githubusercontent.com/u/8683473?"}}
{"id":"2489398372","type":"PullRequestEvent","actor":{"id":447804,"login":"tfoote","gravatar_id":"","url":"https://api.github.com/users/tfoote","avatar_url":"https://avatars.githubusercontent.com/u/447804?"},"repo":{"id":3149845,"name":"ros/rosdistro","url":"https://api.github.com/repos/ros/rosdistro"},"payload":{"action":"opened","number":6732,"pull_request":{"url":"https://api.github.com/repos/ros/rosdistro/pulls/6732","id":26739460,"html_url":"https://github.com/ros/rosdistro/pull/6732","diff_url":"https://github.com/ros/rosdistro/pull/6732.diff","patch_url":"https://github.com/ros/rosdistro/pull/6732.patch","issue_url":"https://api.github.com/repos/ros/rosdistro/issues/6732","number":6732,"state":"open","locked":false,"title":"adding bullet rosdep rules for utopic and vivid","user":{"login":"tfoote","id":447804,"avatar_url":"https://avatars.githubusercontent.com/u/447804?v=3","gravatar_id":"","url":"https://api.github.com/users/tfoote","html_url":"https://github.com/tfoote","followers_url":"https://api.github.com/users/tfoote/followers","following_url":"https://api.github.com/users/tfoote/following{/other_user}","gists_url":"https://api.github.com/users/tfoote/gists{/gist_id}","starred_url":"https://api.github.com/users/tfoote/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/tfoote/subscriptions","organizations_url":"https://api.github.com/users/tfoote/orgs","repos_url":"https://api.github.com/users/tfoote/repos","events_url":"https://api.github.com/users/tfoote/events{/privacy}","received_events_url":"https://api.github.com/users/tfoote/received_events","type":"User","site_admin":false},"body":"","created_at":"2015-01-01T01:05:55Z","updated_at":"2015-01-01T01:05:55Z","closed_at":null,"merged_at":null,"merge_commit_sha":null,"assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/ros/rosdistro/pulls/6732/commits","review_comments_url":"https://api.github.com/repos/ros/rosdistro/pulls/6732/comments","review_comment_ur
l":"https://api.github.com/repos/ros/rosdistro/pulls/comments/{number}","comments_url":"https://api.github.com/repos/ros/rosdistro/issues/6732/comments","statuses_url":"https://api.github.com/repos/ros/rosdistro/statuses/aa0e8faf57abed8143ce567ceb6c45736946d0cd","head":{"label":"ros:bullet_UV","ref":"bullet_UV","sha":"aa0e8faf57abed8143ce567ceb6c45736946d0cd","user":{"login":"ros","id":547448,"avatar_url":"https://avatars.githubusercontent.com/u/547448?v=3","gravatar_id":"","url":"https://api.github.com/users/ros","html_url":"https://github.com/ros","followers_url":"https://api.github.com/users/ros/followers","following_url":"https://api.github.com/users/ros/following{/other_user}","gists_url":"https://api.github.com/users/ros/gists{/gist_id}","starred_url":"https://api.github.com/users/ros/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ros/subscriptions","organizations_url":"https://api.github.com/users/ros/orgs","repos_url":"https://api.github.com/users/ros/repos","events_url":"https://api.github.com/users/ros/events{/privacy}","received_events_url":"https://api.github.com/users/ros/received_events","type":"Organization","site_admin":false},"repo":{"id":3149845,"name":"rosdistro","full_name":"ros/rosdistro","owner":{"login":"ros","id":547448,"avatar_url":"https://avatars.githubusercontent.com/u/547448?v=3","gravatar_id":"","url":"https://api.github.com/users/ros","html_url":"https://github.com/ros","followers_url":"https://api.github.com/users/ros/followers","following_url":"https://api.github.com/users/ros/following{/other_user}","gists_url":"https://api.github.com/users/ros/gists{/gist_id}","starred_url":"https://api.github.com/users/ros/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ros/subscriptions","organizations_url":"https://api.github.com/users/ros/orgs","repos_url":"https://api.github.com/users/ros/repos","events_url":"https://api.github.com/users/ros/events{/privacy}","received_events_url":"https://a
pi.github.com/users/ros/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/ros/rosdistro","description":"This repo maintains a lists of repositories for each ROS distribution","fork":false,"url":"https://api.github.com/repos/ros/rosdistro","forks_url":"https://api.github.com/repos/ros/rosdistro/forks","keys_url":"https://api.github.com/repos/ros/rosdistro/keys{/key_id}","collaborators_url":"https://api.github.com/repos/ros/rosdistro/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/ros/rosdistro/teams","hooks_url":"https://api.github.com/repos/ros/rosdistro/hooks","issue_events_url":"https://api.github.com/repos/ros/rosdistro/issues/events{/number}","events_url":"https://api.github.com/repos/ros/rosdistro/events","assignees_url":"https://api.github.com/repos/ros/rosdistro/assignees{/user}","branches_url":"https://api.github.com/repos/ros/rosdistro/branches{/branch}","tags_url":"https://api.github.com/repos/ros/rosdistro/tags","blobs_url":"https://api.github.com/repos/ros/rosdistro/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/ros/rosdistro/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/ros/rosdistro/git/refs{/sha}","trees_url":"https://api.github.com/repos/ros/rosdistro/git/trees{/sha}","statuses_url":"https://api.github.com/repos/ros/rosdistro/statuses/{sha}","languages_url":"https://api.github.com/repos/ros/rosdistro/languages","stargazers_url":"https://api.github.com/repos/ros/rosdistro/stargazers","contributors_url":"https://api.github.com/repos/ros/rosdistro/contributors","subscribers_url":"https://api.github.com/repos/ros/rosdistro/subscribers","subscription_url":"https://api.github.com/repos/ros/rosdistro/subscription","commits_url":"https://api.github.com/repos/ros/rosdistro/commits{/sha}","git_commits_url":"https://api.github.com/repos/ros/rosdistro/git/commits{/sha}","comments_url":"https://api.github.com/repos/ros/rosdistro/comments{/number}","issue_
comment_url":"https://api.github.com/repos/ros/rosdistro/issues/comments/{number}","contents_url":"https://api.github.com/repos/ros/rosdistro/contents/{+path}","compare_url":"https://api.github.com/repos/ros/rosdistro/compare/{base}...{head}","merges_url":"https://api.github.com/repos/ros/rosdistro/merges","archive_url":"https://api.github.com/repos/ros/rosdistro/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/ros/rosdistro/downloads","issues_url":"https://api.github.com/repos/ros/rosdistro/issues{/number}","pulls_url":"https://api.github.com/repos/ros/rosdistro/pulls{/number}","milestones_url":"https://api.github.com/repos/ros/rosdistro/milestones{/number}","notifications_url":"https://api.github.com/repos/ros/rosdistro/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/ros/rosdistro/labels{/name}","releases_url":"https://api.github.com/repos/ros/rosdistro/releases{/id}","created_at":"2012-01-11T00:13:17Z","updated_at":"2014-12-31T23:39:13Z","pushed_at":"2015-01-01T00:27:02Z","git_url":"git://github.com/ros/rosdistro.git","ssh_url":"git@github.com:ros/rosdistro.git","clone_url":"https://github.com/ros/rosdistro.git","svn_url":"https://github.com/ros/rosdistro","homepage":"","size":40338,"stargazers_count":107,"watchers_count":107,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":459,"mirror_url":null,"open_issues_count":29,"forks":459,"open_issues":29,"watchers":107,"default_branch":"master"}},"base":{"label":"ros:master","ref":"master","sha":"c92186717af0766aa2b4dc6adf216ee610a4ed1e","user":{"login":"ros","id":547448,"avatar_url":"https://avatars.githubusercontent.com/u/547448?v=3","gravatar_id":"","url":"https://api.github.com/users/ros","html_url":"https://github.com/ros","followers_url":"https://api.github.com/users/ros/followers","following_url":"https://api.github.com/users/ros/following{/other_user}","gists_url":"https://api.github.com/users/ros/gi
sts{/gist_id}","starred_url":"https://api.github.com/users/ros/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ros/subscriptions","organizations_url":"https://api.github.com/users/ros/orgs","repos_url":"https://api.github.com/users/ros/repos","events_url":"https://api.github.com/users/ros/events{/privacy}","received_events_url":"https://api.github.com/users/ros/received_events","type":"Organization","site_admin":false},"repo":{"id":3149845,"name":"rosdistro","full_name":"ros/rosdistro","owner":{"login":"ros","id":547448,"avatar_url":"https://avatars.githubusercontent.com/u/547448?v=3","gravatar_id":"","url":"https://api.github.com/users/ros","html_url":"https://github.com/ros","followers_url":"https://api.github.com/users/ros/followers","following_url":"https://api.github.com/users/ros/following{/other_user}","gists_url":"https://api.github.com/users/ros/gists{/gist_id}","starred_url":"https://api.github.com/users/ros/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ros/subscriptions","organizations_url":"https://api.github.com/users/ros/orgs","repos_url":"https://api.github.com/users/ros/repos","events_url":"https://api.github.com/users/ros/events{/privacy}","received_events_url":"https://api.github.com/users/ros/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/ros/rosdistro","description":"This repo maintains a lists of repositories for each ROS 
distribution","fork":false,"url":"https://api.github.com/repos/ros/rosdistro","forks_url":"https://api.github.com/repos/ros/rosdistro/forks","keys_url":"https://api.github.com/repos/ros/rosdistro/keys{/key_id}","collaborators_url":"https://api.github.com/repos/ros/rosdistro/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/ros/rosdistro/teams","hooks_url":"https://api.github.com/repos/ros/rosdistro/hooks","issue_events_url":"https://api.github.com/repos/ros/rosdistro/issues/events{/number}","events_url":"https://api.github.com/repos/ros/rosdistro/events","assignees_url":"https://api.github.com/repos/ros/rosdistro/assignees{/user}","branches_url":"https://api.github.com/repos/ros/rosdistro/branches{/branch}","tags_url":"https://api.github.com/repos/ros/rosdistro/tags","blobs_url":"https://api.github.com/repos/ros/rosdistro/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/ros/rosdistro/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/ros/rosdistro/git/refs{/sha}","trees_url":"https://api.github.com/repos/ros/rosdistro/git/trees{/sha}","statuses_url":"https://api.github.com/repos/ros/rosdistro/statuses/{sha}","languages_url":"https://api.github.com/repos/ros/rosdistro/languages","stargazers_url":"https://api.github.com/repos/ros/rosdistro/stargazers","contributors_url":"https://api.github.com/repos/ros/rosdistro/contributors","subscribers_url":"https://api.github.com/repos/ros/rosdistro/subscribers","subscription_url":"https://api.github.com/repos/ros/rosdistro/subscription","commits_url":"https://api.github.com/repos/ros/rosdistro/commits{/sha}","git_commits_url":"https://api.github.com/repos/ros/rosdistro/git/commits{/sha}","comments_url":"https://api.github.com/repos/ros/rosdistro/comments{/number}","issue_comment_url":"https://api.github.com/repos/ros/rosdistro/issues/comments/{number}","contents_url":"https://api.github.com/repos/ros/rosdistro/contents/{+path}","compare_url":"https://api.github.com/repos/ros/rosdistro
/compare/{base}...{head}","merges_url":"https://api.github.com/repos/ros/rosdistro/merges","archive_url":"https://api.github.com/repos/ros/rosdistro/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/ros/rosdistro/downloads","issues_url":"https://api.github.com/repos/ros/rosdistro/issues{/number}","pulls_url":"https://api.github.com/repos/ros/rosdistro/pulls{/number}","milestones_url":"https://api.github.com/repos/ros/rosdistro/milestones{/number}","notifications_url":"https://api.github.com/repos/ros/rosdistro/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/ros/rosdistro/labels{/name}","releases_url":"https://api.github.com/repos/ros/rosdistro/releases{/id}","created_at":"2012-01-11T00:13:17Z","updated_at":"2014-12-31T23:39:13Z","pushed_at":"2015-01-01T00:27:02Z","git_url":"git://github.com/ros/rosdistro.git","ssh_url":"git@github.com:ros/rosdistro.git","clone_url":"https://github.com/ros/rosdistro.git","svn_url":"https://github.com/ros/rosdistro","homepage":"","size":40338,"stargazers_count":107,"watchers_count":107,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":459,"mirror_url":null,"open_issues_count":29,"forks":459,"open_issues":29,"watchers":107,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/ros/rosdistro/pulls/6732"},"html":{"href":"https://github.com/ros/rosdistro/pull/6732"},"issue":{"href":"https://api.github.com/repos/ros/rosdistro/issues/6732"},"comments":{"href":"https://api.github.com/repos/ros/rosdistro/issues/6732/comments"},"review_comments":{"href":"https://api.github.com/repos/ros/rosdistro/pulls/6732/comments"},"review_comment":{"href":"https://api.github.com/repos/ros/rosdistro/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/ros/rosdistro/pulls/6732/commits"},"statuses":{"href":"https://api.github.com/repos/ros/rosdistro/statuses/aa0e8faf57abed8143ce567ceb6c45736946d0cd"}
},"merged":false,"mergeable":null,"mergeable_state":"unknown","merged_by":null,"comments":0,"review_comments":0,"commits":1,"additions":6,"deletions":0,"changed_files":1}},"public":true,"created_at":"2015-01-01T01:05:56Z","org":{"id":547448,"login":"ros","gravatar_id":"","url":"https://api.github.com/orgs/ros","avatar_url":"https://avatars.githubusercontent.com/u/547448?"}}
{"id":"2489398374","type":"IssuesEvent","actor":{"id":1312880,"login":"cmwwebfx","gravatar_id":"","url":"https://api.github.com/users/cmwwebfx","avatar_url":"https://avatars.githubusercontent.com/u/1312880?"},"repo":{"id":8194553,"name":"michaeluno/admin-page-framework","url":"https://api.github.com/repos/michaeluno/admin-page-framework"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/michaeluno/admin-page-framework/issues/180","labels_url":"https://api.github.com/repos/michaeluno/admin-page-framework/issues/180/labels{/name}","comments_url":"https://api.github.com/repos/michaeluno/admin-page-framework/issues/180/comments","events_url":"https://api.github.com/repos/michaeluno/admin-page-framework/issues/180/events","html_url":"https://github.com/michaeluno/admin-page-framework/issues/180","id":53210287,"number":180,"title":"Flexible content field group","user":{"login":"cmwwebfx","id":1312880,"avatar_url":"https://avatars.githubusercontent.com/u/1312880?v=3","gravatar_id":"","url":"https://api.github.com/users/cmwwebfx","html_url":"https://github.com/cmwwebfx","followers_url":"https://api.github.com/users/cmwwebfx/followers","following_url":"https://api.github.com/users/cmwwebfx/following{/other_user}","gists_url":"https://api.github.com/users/cmwwebfx/gists{/gist_id}","starred_url":"https://api.github.com/users/cmwwebfx/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/cmwwebfx/subscriptions","organizations_url":"https://api.github.com/users/cmwwebfx/orgs","repos_url":"https://api.github.com/users/cmwwebfx/repos","events_url":"https://api.github.com/users/cmwwebfx/events{/privacy}","received_events_url":"https://api.github.com/users/cmwwebfx/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:05:57Z","updated_at":"2015-01-01T01:05:57Z","closed_at":null,"body":"Hi Michael,\r\n\r\nHappy new 
year..\r\n\r\nI have used a plugin before for creating custom fields for a small project, and it was called ACF (Advanced Custom Fields) by Elliot Condon.\r\n\r\nWhile I used this plugin for creating a simple layout, I explored the options they had available in the PRO version. What I really loved was something called \"Flexible Content Field\". \r\n\r\nhttp://www.advancedcustomfields.com/resources/flexible-content/\r\n\r\nThis was really awesome since it allowed me to make a set of grouped fields, then add them to this area that I wanted. I used this to make a pretty complex , yet easy to use selection of groups for the end user.\r\n\r\nIs this something you might consider to add to Admin Page Framework? Here are some screenshots of how I have used it, and you can see how this is quite beneficial to have such an option.\r\n\r\n![add a flexible content field](https://cloud.githubusercontent.com/assets/1312880/5591413/18e8920e-91aa-11e4-9744-8630fcc2eb81.jpg)\r\n\r\n![flexible content field](https://cloud.githubusercontent.com/assets/1312880/5591415/36f2ef60-91aa-11e4-92b3-a4d749d4afe5.jpg)\r\n\r\n![flexible content field dragable](https://cloud.githubusercontent.com/assets/1312880/5591416/3a79ee2c-91aa-11e4-9656-f9ae00f86776.jpg)\r\n\r\n"}},"public":true,"created_at":"2015-01-01T01:05:57Z"}
{"id":"2489398377","type":"PushEvent","actor":{"id":1220541,"login":"orthez","gravatar_id":"","url":"https://api.github.com/users/orthez","avatar_url":"https://avatars.githubusercontent.com/u/1220541?"},"repo":{"id":24684211,"name":"orthez/workspace-homology","url":"https://api.github.com/repos/orthez/workspace-homology"},"payload":{"push_id":536753331,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"4bb77a864087fb80e8990a3983133898439fd0b1","before":"d688fe2f3b340b3512afb14060097d6152fb56d7","commits":[{"sha":"d1b825e541f55691602a4091f5db1338cc634fa9","author":{"email":"f357ae49b6cf16f864ac544048626472d25113dd@gmx.de","name":"Andreas Orthey"},"message":"xspace computation module","distinct":true,"url":"https://api.github.com/repos/orthez/workspace-homology/commits/d1b825e541f55691602a4091f5db1338cc634fa9"},{"sha":"4bb77a864087fb80e8990a3983133898439fd0b1","author":{"email":"f357ae49b6cf16f864ac544048626472d25113dd@gmx.de","name":"Andreas Orthey"},"message":"plot module for cspace | readjusted robot parameters","distinct":true,"url":"https://api.github.com/repos/orthez/workspace-homology/commits/4bb77a864087fb80e8990a3983133898439fd0b1"}]},"public":true,"created_at":"2015-01-01T01:05:57Z"}
{"id":"2489398379","type":"PushEvent","actor":{"id":433707,"login":"ile","gravatar_id":"","url":"https://api.github.com/users/ile","avatar_url":"https://avatars.githubusercontent.com/u/433707?"},"repo":{"id":26847132,"name":"kantele/k-templates","url":"https://api.github.com/repos/kantele/k-templates"},"payload":{"push_id":536753332,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"6630db87e4ed496f67a88bf24f22332c67e9792d","before":"ca0474a33dcc125aa7204b517dd7cef8003db346","commits":[{"sha":"6630db87e4ed496f67a88bf24f22332c67e9792d","author":{"email":"4f3407de78bccc8cc160ee4d278d5efe7162e6b5@nateps.com","name":"Nate Smith"},"message":"fix bug in detecting which bindings are list items","distinct":true,"url":"https://api.github.com/repos/kantele/k-templates/commits/6630db87e4ed496f67a88bf24f22332c67e9792d"}]},"public":true,"created_at":"2015-01-01T01:05:57Z","org":{"id":5687585,"login":"kantele","gravatar_id":"","url":"https://api.github.com/orgs/kantele","avatar_url":"https://avatars.githubusercontent.com/u/5687585?"}}
{"id":"2489398380","type":"DeleteEvent","actor":{"id":99359,"login":"llinder","gravatar_id":"","url":"https://api.github.com/users/llinder","avatar_url":"https://avatars.githubusercontent.com/u/99359?"},"repo":{"id":28669941,"name":"llinder/salt","url":"https://api.github.com/repos/llinder/salt"},"payload":{"ref":"v2014.7.0_1","ref_type":"tag","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:05:57Z"}
{"id":"2489398388","type":"PushEvent","actor":{"id":21060,"login":"taladar","gravatar_id":"","url":"https://api.github.com/users/taladar","avatar_url":"https://avatars.githubusercontent.com/u/21060?"},"repo":{"id":6124150,"name":"taladar/portage","url":"https://api.github.com/repos/taladar/portage"},"payload":{"push_id":536753336,"size":1,"distinct_size":1,"ref":"refs/heads/gentoo.org","head":"a887ddbd472af412c458a84e61675debb6a4703b","before":"bb37d9cff8757360f30e14e7046bfd7da864872b","commits":[{"sha":"a887ddbd472af412c458a84e61675debb6a4703b","author":{"email":"dc76e9f0c0006e8f919e0c515c66dbba3982f785@root2.taladar.net","name":"root2.taladar.net root"},"message":"Portage rsync://rsync.de.gentoo.org/gentoo-portage at 2015-01-01 02:05:36","distinct":true,"url":"https://api.github.com/repos/taladar/portage/commits/a887ddbd472af412c458a84e61675debb6a4703b"}]},"public":true,"created_at":"2015-01-01T01:05:58Z"}
{"id":"2489398389","type":"PushEvent","actor":{"id":815193,"login":"aquach","gravatar_id":"","url":"https://api.github.com/users/aquach","avatar_url":"https://avatars.githubusercontent.com/u/815193?"},"repo":{"id":4950386,"name":"aquach/miner","url":"https://api.github.com/repos/aquach/miner"},"payload":{"push_id":536753337,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f4ad3cb3d0e30ce311b8b032cf6923544eca80a0","before":"93759971a2c59562d5413a0d236663435fb5e442","commits":[{"sha":"f4ad3cb3d0e30ce311b8b032cf6923544eca80a0","author":{"email":"60c6d277a8bd81de7fdde19201bf9c58a3df08f4@clinkle.com","name":"Alex Quach"},"message":"Delete unnecessary stuff and kill medical skill/sickbays. Can't find a use for it.","distinct":true,"url":"https://api.github.com/repos/aquach/miner/commits/f4ad3cb3d0e30ce311b8b032cf6923544eca80a0"}]},"public":true,"created_at":"2015-01-01T01:05:58Z"}
{"id":"2489398391","type":"CreateEvent","actor":{"id":4440858,"login":"maynarddemmon","gravatar_id":"","url":"https://api.github.com/users/maynarddemmon","avatar_url":"https://avatars.githubusercontent.com/u/4440858?"},"repo":{"id":19410013,"name":"teem2/dreem","url":"https://api.github.com/repos/teem2/dreem"},"payload":{"ref":"sizetodom","ref_type":"branch","master_branch":"master","description":"A prototyping language for multiscreen multidevice UX","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:05:58Z","org":{"id":7244222,"login":"teem2","gravatar_id":"","url":"https://api.github.com/orgs/teem2","avatar_url":"https://avatars.githubusercontent.com/u/7244222?"}}
{"id":"2489398395","type":"IssuesEvent","actor":{"id":5497952,"login":"g19-mr","gravatar_id":"","url":"https://api.github.com/users/g19-mr","avatar_url":"https://avatars.githubusercontent.com/u/5497952?"},"repo":{"id":25435487,"name":"g19-mr/azh","url":"https://api.github.com/repos/g19-mr/azh"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/g19-mr/azh/issues/83","labels_url":"https://api.github.com/repos/g19-mr/azh/issues/83/labels{/name}","comments_url":"https://api.github.com/repos/g19-mr/azh/issues/83/comments","events_url":"https://api.github.com/repos/g19-mr/azh/issues/83/events","html_url":"https://github.com/g19-mr/azh/issues/83","id":53210289,"number":83,"title":"Add icons to the left of the text on About screen buttons","user":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/g19-mr/azh/labels/improvement","name":"improvement","color":"84b6eb"}],"state":"open","locked":false,"assignee":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"http
s://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"milestone":{"url":"https://api.github.com/repos/g19-mr/azh/milestones/2","labels_url":"https://api.github.com/repos/g19-mr/azh/milestones/2/labels","id":873798,"number":2,"title":"Android 1.0.1","description":null,"creator":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"open_issues":6,"closed_issues":11,"state":"open","created_at":"2014-11-20T05:20:02Z","updated_at":"2015-01-01T01:05:59Z","due_on":null,"closed_at":null},"comments":0,"created_at":"2015-01-01T01:05:59Z","updated_at":"2015-01-01T01:05:59Z","closed_at":null,"body":"Related icons aligned to the 
left on the buttons on about screen"}},"public":true,"created_at":"2015-01-01T01:05:59Z"}
{"id":"2489398402","type":"IssueCommentEvent","actor":{"id":1813305,"login":"Bart39","gravatar_id":"","url":"https://api.github.com/users/Bart39","avatar_url":"https://avatars.githubusercontent.com/u/1813305?"},"repo":{"id":9683876,"name":"nZEDb/nZEDb","url":"https://api.github.com/repos/nZEDb/nZEDb"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/nZEDb/nZEDb/issues/1572","labels_url":"https://api.github.com/repos/nZEDb/nZEDb/issues/1572/labels{/name}","comments_url":"https://api.github.com/repos/nZEDb/nZEDb/issues/1572/comments","events_url":"https://api.github.com/repos/nZEDb/nZEDb/issues/1572/events","html_url":"https://github.com/nZEDb/nZEDb/issues/1572","id":53191494,"number":1572,"title":"Trakt IMDB search url format changed","user":{"login":"RickDB","id":347084,"avatar_url":"https://avatars.githubusercontent.com/u/347084?v=3","gravatar_id":"","url":"https://api.github.com/users/RickDB","html_url":"https://github.com/RickDB","followers_url":"https://api.github.com/users/RickDB/followers","following_url":"https://api.github.com/users/RickDB/following{/other_user}","gists_url":"https://api.github.com/users/RickDB/gists{/gist_id}","starred_url":"https://api.github.com/users/RickDB/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/RickDB/subscriptions","organizations_url":"https://api.github.com/users/RickDB/orgs","repos_url":"https://api.github.com/users/RickDB/repos","events_url":"https://api.github.com/users/RickDB/events{/privacy}","received_events_url":"https://api.github.com/users/RickDB/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2014-12-31T16:34:10Z","updated_at":"2015-01-01T01:06:00Z","closed_at":"2015-01-01T01:06:00Z","body":"Trakt launched their new site and among other things the URL format for searching based on IMDB id has changed 
from:\r\n\r\nhttp://trakt.tv/search/imdb?q=tt2395427/\r\n\r\nto:\r\n\r\nhttp://trakt.tv/search/imdb/tt2395427/\r\n\r\nThis affects the movie template but might be used in other areas as well, pretty easy fix but though I let you guys know."},"comment":{"url":"https://api.github.com/repos/nZEDb/nZEDb/issues/comments/68477343","html_url":"https://github.com/nZEDb/nZEDb/issues/1572#issuecomment-68477343","issue_url":"https://api.github.com/repos/nZEDb/nZEDb/issues/1572","id":68477343,"user":{"login":"Bart39","id":1813305,"avatar_url":"https://avatars.githubusercontent.com/u/1813305?v=3","gravatar_id":"","url":"https://api.github.com/users/Bart39","html_url":"https://github.com/Bart39","followers_url":"https://api.github.com/users/Bart39/followers","following_url":"https://api.github.com/users/Bart39/following{/other_user}","gists_url":"https://api.github.com/users/Bart39/gists{/gist_id}","starred_url":"https://api.github.com/users/Bart39/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Bart39/subscriptions","organizations_url":"https://api.github.com/users/Bart39/orgs","repos_url":"https://api.github.com/users/Bart39/repos","events_url":"https://api.github.com/users/Bart39/events{/privacy}","received_events_url":"https://api.github.com/users/Bart39/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:00Z","updated_at":"2015-01-01T01:06:00Z","body":"merged to dev #1573 "}},"public":true,"created_at":"2015-01-01T01:06:01Z","org":{"id":4260270,"login":"nZEDb","gravatar_id":"","url":"https://api.github.com/orgs/nZEDb","avatar_url":"https://avatars.githubusercontent.com/u/4260270?"}}
{"id":"2489398403","type":"IssuesEvent","actor":{"id":1813305,"login":"Bart39","gravatar_id":"","url":"https://api.github.com/users/Bart39","avatar_url":"https://avatars.githubusercontent.com/u/1813305?"},"repo":{"id":9683876,"name":"nZEDb/nZEDb","url":"https://api.github.com/repos/nZEDb/nZEDb"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/nZEDb/nZEDb/issues/1572","labels_url":"https://api.github.com/repos/nZEDb/nZEDb/issues/1572/labels{/name}","comments_url":"https://api.github.com/repos/nZEDb/nZEDb/issues/1572/comments","events_url":"https://api.github.com/repos/nZEDb/nZEDb/issues/1572/events","html_url":"https://github.com/nZEDb/nZEDb/issues/1572","id":53191494,"number":1572,"title":"Trakt IMDB search url format changed","user":{"login":"RickDB","id":347084,"avatar_url":"https://avatars.githubusercontent.com/u/347084?v=3","gravatar_id":"","url":"https://api.github.com/users/RickDB","html_url":"https://github.com/RickDB","followers_url":"https://api.github.com/users/RickDB/followers","following_url":"https://api.github.com/users/RickDB/following{/other_user}","gists_url":"https://api.github.com/users/RickDB/gists{/gist_id}","starred_url":"https://api.github.com/users/RickDB/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/RickDB/subscriptions","organizations_url":"https://api.github.com/users/RickDB/orgs","repos_url":"https://api.github.com/users/RickDB/repos","events_url":"https://api.github.com/users/RickDB/events{/privacy}","received_events_url":"https://api.github.com/users/RickDB/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2014-12-31T16:34:10Z","updated_at":"2015-01-01T01:06:00Z","closed_at":"2015-01-01T01:06:00Z","body":"Trakt launched their new site and among other things the URL format for searching based on IMDB id has changed 
from:\r\n\r\nhttp://trakt.tv/search/imdb?q=tt2395427/\r\n\r\nto:\r\n\r\nhttp://trakt.tv/search/imdb/tt2395427/\r\n\r\nThis affects the movie template but might be used in other areas as well, pretty easy fix but though I let you guys know."}},"public":true,"created_at":"2015-01-01T01:06:01Z","org":{"id":4260270,"login":"nZEDb","gravatar_id":"","url":"https://api.github.com/orgs/nZEDb","avatar_url":"https://avatars.githubusercontent.com/u/4260270?"}}
{"id":"2489398405","type":"IssueCommentEvent","actor":{"id":2354108,"login":"coveralls","gravatar_id":"","url":"https://api.github.com/users/coveralls","avatar_url":"https://avatars.githubusercontent.com/u/2354108?"},"repo":{"id":20897533,"name":"OCA/vertical-travel","url":"https://api.github.com/repos/OCA/vertical-travel"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/OCA/vertical-travel/issues/19","labels_url":"https://api.github.com/repos/OCA/vertical-travel/issues/19/labels{/name}","comments_url":"https://api.github.com/repos/OCA/vertical-travel/issues/19/comments","events_url":"https://api.github.com/repos/OCA/vertical-travel/issues/19/events","html_url":"https://github.com/OCA/vertical-travel/pull/19","id":53210017,"number":19,"title":"[IMP] Relax ACLs to access the reports","user":{"login":"joaoalf","id":840120,"avatar_url":"https://avatars.githubusercontent.com/u/840120?v=3","gravatar_id":"","url":"https://api.github.com/users/joaoalf","html_url":"https://github.com/joaoalf","followers_url":"https://api.github.com/users/joaoalf/followers","following_url":"https://api.github.com/users/joaoalf/following{/other_user}","gists_url":"https://api.github.com/users/joaoalf/gists{/gist_id}","starred_url":"https://api.github.com/users/joaoalf/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/joaoalf/subscriptions","organizations_url":"https://api.github.com/users/joaoalf/orgs","repos_url":"https://api.github.com/users/joaoalf/repos","events_url":"https://api.github.com/users/joaoalf/events{/privacy}","received_events_url":"https://api.github.com/users/joaoalf/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2015-01-01T00:51:32Z","updated_at":"2015-01-01T01:06:00Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/OCA/vertical-travel/pulls/19","html_url":"https://github.com/OCA/vertical-travel/pul
l/19","diff_url":"https://github.com/OCA/vertical-travel/pull/19.diff","patch_url":"https://github.com/OCA/vertical-travel/pull/19.patch"},"body":"Another PR in the ACL series"},"comment":{"url":"https://api.github.com/repos/OCA/vertical-travel/issues/comments/68477344","html_url":"https://github.com/OCA/vertical-travel/pull/19#issuecomment-68477344","issue_url":"https://api.github.com/repos/OCA/vertical-travel/issues/19","id":68477344,"user":{"login":"coveralls","id":2354108,"avatar_url":"https://avatars.githubusercontent.com/u/2354108?v=3","gravatar_id":"","url":"https://api.github.com/users/coveralls","html_url":"https://github.com/coveralls","followers_url":"https://api.github.com/users/coveralls/followers","following_url":"https://api.github.com/users/coveralls/following{/other_user}","gists_url":"https://api.github.com/users/coveralls/gists{/gist_id}","starred_url":"https://api.github.com/users/coveralls/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/coveralls/subscriptions","organizations_url":"https://api.github.com/users/coveralls/orgs","repos_url":"https://api.github.com/users/coveralls/repos","events_url":"https://api.github.com/users/coveralls/events{/privacy}","received_events_url":"https://api.github.com/users/coveralls/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:00Z","updated_at":"2015-01-01T01:06:00Z","body":"\n[![Coverage Status](https://coveralls.io/builds/1679499/badge)](https://coveralls.io/builds/1679499)\n\nCoverage remained the same when pulling **68ea6d231ce88e56db8bc2e6eb1e7553e205207f on savoirfairelinux:7.0_travel_journey_acl** into **552b843dcfc28878480cbf4159c5b941c89fdf6d on OCA:7.0**.\n"}},"public":true,"created_at":"2015-01-01T01:06:01Z","org":{"id":7600578,"login":"OCA","gravatar_id":"","url":"https://api.github.com/orgs/OCA","avatar_url":"https://avatars.githubusercontent.com/u/7600578?"}}
{"id":"2489398409","type":"DeleteEvent","actor":{"id":995241,"login":"ggkuron","gravatar_id":"","url":"https://api.github.com/users/ggkuron","avatar_url":"https://avatars.githubusercontent.com/u/995241?"},"repo":{"id":12571910,"name":"ggkuron/dotfiles","url":"https://api.github.com/repos/ggkuron/dotfiles"},"payload":{"ref":"x230","ref_type":"branch","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:06:01Z"}
{"id":"2489398408","type":"IssueCommentEvent","actor":{"id":1138857,"login":"peterkc","gravatar_id":"","url":"https://api.github.com/users/peterkc","avatar_url":"https://avatars.githubusercontent.com/u/1138857?"},"repo":{"id":24388525,"name":"box/leche","url":"https://api.github.com/repos/box/leche"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/box/leche/issues/5","labels_url":"https://api.github.com/repos/box/leche/issues/5/labels{/name}","comments_url":"https://api.github.com/repos/box/leche/issues/5/comments","events_url":"https://api.github.com/repos/box/leche/issues/5/events","html_url":"https://github.com/box/leche/pull/5","id":53209954,"number":5,"title":"Update dependencies in package.json to latest and add peerDependencies","user":{"login":"peterkc","id":1138857,"avatar_url":"https://avatars.githubusercontent.com/u/1138857?v=3","gravatar_id":"","url":"https://api.github.com/users/peterkc","html_url":"https://github.com/peterkc","followers_url":"https://api.github.com/users/peterkc/followers","following_url":"https://api.github.com/users/peterkc/following{/other_user}","gists_url":"https://api.github.com/users/peterkc/gists{/gist_id}","starred_url":"https://api.github.com/users/peterkc/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/peterkc/subscriptions","organizations_url":"https://api.github.com/users/peterkc/orgs","repos_url":"https://api.github.com/users/peterkc/repos","events_url":"https://api.github.com/users/peterkc/events{/privacy}","received_events_url":"https://api.github.com/users/peterkc/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2015-01-01T00:47:14Z","updated_at":"2015-01-01T01:06:00Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/box/leche/pulls/5","html_url":"https://github.com/box/leche/pull/5","diff_url":"https://github.com/box/leche/pull/5.diff","patch_u
rl":"https://github.com/box/leche/pull/5.patch"},"body":"Updating dependencies (#4) also required fixing some lint issues (#3) in leche.js"},"comment":{"url":"https://api.github.com/repos/box/leche/issues/comments/68477345","html_url":"https://github.com/box/leche/pull/5#issuecomment-68477345","issue_url":"https://api.github.com/repos/box/leche/issues/5","id":68477345,"user":{"login":"peterkc","id":1138857,"avatar_url":"https://avatars.githubusercontent.com/u/1138857?v=3","gravatar_id":"","url":"https://api.github.com/users/peterkc","html_url":"https://github.com/peterkc","followers_url":"https://api.github.com/users/peterkc/followers","following_url":"https://api.github.com/users/peterkc/following{/other_user}","gists_url":"https://api.github.com/users/peterkc/gists{/gist_id}","starred_url":"https://api.github.com/users/peterkc/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/peterkc/subscriptions","organizations_url":"https://api.github.com/users/peterkc/orgs","repos_url":"https://api.github.com/users/peterkc/repos","events_url":"https://api.github.com/users/peterkc/events{/privacy}","received_events_url":"https://api.github.com/users/peterkc/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:00Z","updated_at":"2015-01-01T01:06:00Z","body":"CLA signed"}},"public":true,"created_at":"2015-01-01T01:06:01Z","org":{"id":23900,"login":"box","gravatar_id":"","url":"https://api.github.com/orgs/box","avatar_url":"https://avatars.githubusercontent.com/u/23900?"}}
{"id":"2489398410","type":"CreateEvent","actor":{"id":6955935,"login":"wfrizzell","gravatar_id":"","url":"https://api.github.com/users/wfrizzell","avatar_url":"https://avatars.githubusercontent.com/u/6955935?"},"repo":{"id":28678275,"name":"wfrizzell/Completed-Target-Model-Table-Documentation","url":"https://api.github.com/repos/wfrizzell/Completed-Target-Model-Table-Documentation"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:06:01Z"}
{"id":"2489398411","type":"PushEvent","actor":{"id":2074134,"login":"jtbdevelopment","gravatar_id":"","url":"https://api.github.com/users/jtbdevelopment","avatar_url":"https://avatars.githubusercontent.com/u/2074134?"},"repo":{"id":25750775,"name":"jtbdevelopment/TwistedHangman","url":"https://api.github.com/repos/jtbdevelopment/TwistedHangman"},"payload":{"push_id":536753342,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"ffb0188d246564af4993cbe840261401c90ed312","before":"12941ba32ad8534239d2b94382938978fd5865b4","commits":[{"sha":"ffb0188d246564af4993cbe840261401c90ed312","author":{"email":"3fbaf13ce556021e810d7c5980db29812a1bff3d@gmail.com","name":"JTB Development"},"message":"starting an FB friend invite screen","distinct":true,"url":"https://api.github.com/repos/jtbdevelopment/TwistedHangman/commits/ffb0188d246564af4993cbe840261401c90ed312"}]},"public":true,"created_at":"2015-01-01T01:06:01Z"}
{"id":"2489398421","type":"CreateEvent","actor":{"id":2829718,"login":"phister","gravatar_id":"","url":"https://api.github.com/users/phister","avatar_url":"https://avatars.githubusercontent.com/u/2829718?"},"repo":{"id":28678276,"name":"phister/CollegeFootballPlayoff","url":"https://api.github.com/repos/phister/CollegeFootballPlayoff"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":null,"pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:06:02Z"}
{"id":"2489398424","type":"PushEvent","actor":{"id":10225575,"login":"ExclusiveOrange","gravatar_id":"","url":"https://api.github.com/users/ExclusiveOrange","avatar_url":"https://avatars.githubusercontent.com/u/10225575?"},"repo":{"id":28677579,"name":"ExclusiveOrange/synthesizer","url":"https://api.github.com/repos/ExclusiveOrange/synthesizer"},"payload":{"push_id":536753349,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"cec30520f9eb65d16e63f8d5efdd251204a519ca","before":"9221d005a52f784d675044bb14013c0eec6ed795","commits":[{"sha":"cec30520f9eb65d16e63f8d5efdd251204a519ca","author":{"email":"de3bd7888dcfc4f7d00a4ef606710f57cbba1dbb@hotmail.com","name":"ExclusiveOrange"},"message":"removed old stuff","distinct":true,"url":"https://api.github.com/repos/ExclusiveOrange/synthesizer/commits/cec30520f9eb65d16e63f8d5efdd251204a519ca"}]},"public":true,"created_at":"2015-01-01T01:06:02Z"}
{"id":"2489398426","type":"IssueCommentEvent","actor":{"id":1932804,"login":"coldmind","gravatar_id":"","url":"https://api.github.com/users/coldmind","avatar_url":"https://avatars.githubusercontent.com/u/1932804?"},"repo":{"id":4164482,"name":"django/django","url":"https://api.github.com/repos/django/django"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/django/django/issues/3821","labels_url":"https://api.github.com/repos/django/django/issues/3821/labels{/name}","comments_url":"https://api.github.com/repos/django/django/issues/3821/comments","events_url":"https://api.github.com/repos/django/django/issues/3821/events","html_url":"https://github.com/django/django/pull/3821","id":53200969,"number":3821,"title":"[WIP] Fixed #24064 - Prevented database access in compile time in spatialite models","user":{"login":"coldmind","id":1932804,"avatar_url":"https://avatars.githubusercontent.com/u/1932804?v=3","gravatar_id":"","url":"https://api.github.com/users/coldmind","html_url":"https://github.com/coldmind","followers_url":"https://api.github.com/users/coldmind/followers","following_url":"https://api.github.com/users/coldmind/following{/other_user}","gists_url":"https://api.github.com/users/coldmind/gists{/gist_id}","starred_url":"https://api.github.com/users/coldmind/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/coldmind/subscriptions","organizations_url":"https://api.github.com/users/coldmind/orgs","repos_url":"https://api.github.com/users/coldmind/repos","events_url":"https://api.github.com/users/coldmind/events{/privacy}","received_events_url":"https://api.github.com/users/coldmind/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":5,"created_at":"2014-12-31T20:02:17Z","updated_at":"2015-01-01T01:06:01Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/django/django/pulls/3821","html_url":"https://github.com/d
jango/django/pull/3821","diff_url":"https://github.com/django/django/pull/3821.diff","patch_url":"https://github.com/django/django/pull/3821.patch"},"body":"Here is the patch that can fix problem.\r\nIdeas about improvements are welcome."},"comment":{"url":"https://api.github.com/repos/django/django/issues/comments/68477346","html_url":"https://github.com/django/django/pull/3821#issuecomment-68477346","issue_url":"https://api.github.com/repos/django/django/issues/3821","id":68477346,"user":{"login":"coldmind","id":1932804,"avatar_url":"https://avatars.githubusercontent.com/u/1932804?v=3","gravatar_id":"","url":"https://api.github.com/users/coldmind","html_url":"https://github.com/coldmind","followers_url":"https://api.github.com/users/coldmind/followers","following_url":"https://api.github.com/users/coldmind/following{/other_user}","gists_url":"https://api.github.com/users/coldmind/gists{/gist_id}","starred_url":"https://api.github.com/users/coldmind/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/coldmind/subscriptions","organizations_url":"https://api.github.com/users/coldmind/orgs","repos_url":"https://api.github.com/users/coldmind/repos","events_url":"https://api.github.com/users/coldmind/events{/privacy}","received_events_url":"https://api.github.com/users/coldmind/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:01Z","updated_at":"2015-01-01T01:06:01Z","body":"buildbot, test this please."}},"public":true,"created_at":"2015-01-01T01:06:02Z","org":{"id":27804,"login":"django","gravatar_id":"","url":"https://api.github.com/orgs/django","avatar_url":"https://avatars.githubusercontent.com/u/27804?"}}
{"id":"2489398428","type":"CreateEvent","actor":{"id":5249918,"login":"ehnmark","gravatar_id":"","url":"https://api.github.com/users/ehnmark","avatar_url":"https://avatars.githubusercontent.com/u/5249918?"},"repo":{"id":28678277,"name":"ehnmark/housing","url":"https://api.github.com/repos/ehnmark/housing"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:06:03Z"}
{"id":"2489398429","type":"PushEvent","actor":{"id":10182579,"login":"Hyftar","gravatar_id":"","url":"https://api.github.com/users/Hyftar","avatar_url":"https://avatars.githubusercontent.com/u/10182579?"},"repo":{"id":28678188,"name":"Hyftar/blah","url":"https://api.github.com/repos/Hyftar/blah"},"payload":{"push_id":536753350,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"382bf507dbf58ef02b9daac86377895787d90e1d","before":"b8125f82b3ca1d038368cfd44882b5f68413a3b0","commits":[{"sha":"382bf507dbf58ef02b9daac86377895787d90e1d","author":{"email":"03d2ba3a5d0bf707f7f3c852ae80a60d66351e89@ymail.com","name":"Hyftar"},"message":"First commit","distinct":true,"url":"https://api.github.com/repos/Hyftar/blah/commits/382bf507dbf58ef02b9daac86377895787d90e1d"}]},"public":true,"created_at":"2015-01-01T01:06:03Z"}
{"id":"2489398433","type":"ForkEvent","actor":{"id":2875366,"login":"k6dsp","gravatar_id":"","url":"https://api.github.com/users/k6dsp","avatar_url":"https://avatars.githubusercontent.com/u/2875366?"},"repo":{"id":19836773,"name":"DigilentInc/Linux-Digilent-Dev","url":"https://api.github.com/repos/DigilentInc/Linux-Digilent-Dev"},"payload":{"forkee":{"id":28678278,"name":"Linux-Digilent-Dev","full_name":"k6dsp/Linux-Digilent-Dev","owner":{"login":"k6dsp","id":2875366,"avatar_url":"https://avatars.githubusercontent.com/u/2875366?v=3","gravatar_id":"","url":"https://api.github.com/users/k6dsp","html_url":"https://github.com/k6dsp","followers_url":"https://api.github.com/users/k6dsp/followers","following_url":"https://api.github.com/users/k6dsp/following{/other_user}","gists_url":"https://api.github.com/users/k6dsp/gists{/gist_id}","starred_url":"https://api.github.com/users/k6dsp/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/k6dsp/subscriptions","organizations_url":"https://api.github.com/users/k6dsp/orgs","repos_url":"https://api.github.com/users/k6dsp/repos","events_url":"https://api.github.com/users/k6dsp/events{/privacy}","received_events_url":"https://api.github.com/users/k6dsp/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/k6dsp/Linux-Digilent-Dev","description":"The official Linux kernel from 
Xilinx","fork":true,"url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev","forks_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/forks","keys_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/keys{/key_id}","collaborators_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/teams","hooks_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/hooks","issue_events_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/issues/events{/number}","events_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/events","assignees_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/assignees{/user}","branches_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/branches{/branch}","tags_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/tags","blobs_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/git/refs{/sha}","trees_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/git/trees{/sha}","statuses_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/statuses/{sha}","languages_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/languages","stargazers_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/stargazers","contributors_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/contributors","subscribers_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/subscribers","subscription_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/subscription","commits_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/commits{/sha}","git_commits_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/git/commits{/sha}","comments_url":"https://api.github.com/repos/k6dsp/Linux
-Digilent-Dev/comments{/number}","issue_comment_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/issues/comments/{number}","contents_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/contents/{+path}","compare_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/compare/{base}...{head}","merges_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/merges","archive_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/downloads","issues_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/issues{/number}","pulls_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/pulls{/number}","milestones_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/milestones{/number}","notifications_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/labels{/name}","releases_url":"https://api.github.com/repos/k6dsp/Linux-Digilent-Dev/releases{/id}","created_at":"2015-01-01T01:06:03Z","updated_at":"2014-09-07T23:09:11Z","pushed_at":"2014-05-23T19:19:11Z","git_url":"git://github.com/k6dsp/Linux-Digilent-Dev.git","ssh_url":"git@github.com:k6dsp/Linux-Digilent-Dev.git","clone_url":"https://github.com/k6dsp/Linux-Digilent-Dev.git","svn_url":"https://github.com/k6dsp/Linux-Digilent-Dev","homepage":"","size":890055,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:06:03Z","org":{"id":7597005,"login":"DigilentInc","gravatar_id":"","url":"https://api.github.com/orgs/DigilentInc","avatar_url":"https://avatars.githubusercontent.com/u/7597005?"}}
{"id":"2489398434","type":"IssueCommentEvent","actor":{"id":6845864,"login":"boxcla","gravatar_id":"","url":"https://api.github.com/users/boxcla","avatar_url":"https://avatars.githubusercontent.com/u/6845864?"},"repo":{"id":24388525,"name":"box/leche","url":"https://api.github.com/repos/box/leche"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/box/leche/issues/5","labels_url":"https://api.github.com/repos/box/leche/issues/5/labels{/name}","comments_url":"https://api.github.com/repos/box/leche/issues/5/comments","events_url":"https://api.github.com/repos/box/leche/issues/5/events","html_url":"https://github.com/box/leche/pull/5","id":53209954,"number":5,"title":"Update dependencies in package.json to latest and add peerDependencies","user":{"login":"peterkc","id":1138857,"avatar_url":"https://avatars.githubusercontent.com/u/1138857?v=3","gravatar_id":"","url":"https://api.github.com/users/peterkc","html_url":"https://github.com/peterkc","followers_url":"https://api.github.com/users/peterkc/followers","following_url":"https://api.github.com/users/peterkc/following{/other_user}","gists_url":"https://api.github.com/users/peterkc/gists{/gist_id}","starred_url":"https://api.github.com/users/peterkc/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/peterkc/subscriptions","organizations_url":"https://api.github.com/users/peterkc/orgs","repos_url":"https://api.github.com/users/peterkc/repos","events_url":"https://api.github.com/users/peterkc/events{/privacy}","received_events_url":"https://api.github.com/users/peterkc/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":3,"created_at":"2015-01-01T00:47:14Z","updated_at":"2015-01-01T01:06:03Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/box/leche/pulls/5","html_url":"https://github.com/box/leche/pull/5","diff_url":"https://github.com/box/leche/pull/5.diff","patch_url
":"https://github.com/box/leche/pull/5.patch"},"body":"Updating dependencies (#4) also required fixing some lint issues (#3) in leche.js"},"comment":{"url":"https://api.github.com/repos/box/leche/issues/comments/68477348","html_url":"https://github.com/box/leche/pull/5#issuecomment-68477348","issue_url":"https://api.github.com/repos/box/leche/issues/5","id":68477348,"user":{"login":"boxcla","id":6845864,"avatar_url":"https://avatars.githubusercontent.com/u/6845864?v=3","gravatar_id":"","url":"https://api.github.com/users/boxcla","html_url":"https://github.com/boxcla","followers_url":"https://api.github.com/users/boxcla/followers","following_url":"https://api.github.com/users/boxcla/following{/other_user}","gists_url":"https://api.github.com/users/boxcla/gists{/gist_id}","starred_url":"https://api.github.com/users/boxcla/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/boxcla/subscriptions","organizations_url":"https://api.github.com/users/boxcla/orgs","repos_url":"https://api.github.com/users/boxcla/repos","events_url":"https://api.github.com/users/boxcla/events{/privacy}","received_events_url":"https://api.github.com/users/boxcla/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:03Z","updated_at":"2015-01-01T01:06:03Z","body":"Verified that @peterkc has just signed the CLA. Thanks, and we look forward to your contribution."}},"public":true,"created_at":"2015-01-01T01:06:03Z","org":{"id":23900,"login":"box","gravatar_id":"","url":"https://api.github.com/orgs/box","avatar_url":"https://avatars.githubusercontent.com/u/23900?"}}
{"id":"2489398437","type":"IssueCommentEvent","actor":{"id":646600,"login":"mikeshulman","gravatar_id":"","url":"https://api.github.com/users/mikeshulman","avatar_url":"https://avatars.githubusercontent.com/u/646600?"},"repo":{"id":6569872,"name":"HoTT/book","url":"https://api.github.com/repos/HoTT/book"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/HoTT/book/issues/744","labels_url":"https://api.github.com/repos/HoTT/book/issues/744/labels{/name}","comments_url":"https://api.github.com/repos/HoTT/book/issues/744/comments","events_url":"https://api.github.com/repos/HoTT/book/issues/744/events","html_url":"https://github.com/HoTT/book/issues/744","id":51177378,"number":744,"title":"Proofs of Lems. 7.2.9 and 7.3.1","user":{"login":"kristinas","id":1341988,"avatar_url":"https://avatars.githubusercontent.com/u/1341988?v=3","gravatar_id":"","url":"https://api.github.com/users/kristinas","html_url":"https://github.com/kristinas","followers_url":"https://api.github.com/users/kristinas/followers","following_url":"https://api.github.com/users/kristinas/following{/other_user}","gists_url":"https://api.github.com/users/kristinas/gists{/gist_id}","starred_url":"https://api.github.com/users/kristinas/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/kristinas/subscriptions","organizations_url":"https://api.github.com/users/kristinas/orgs","repos_url":"https://api.github.com/users/kristinas/repos","events_url":"https://api.github.com/users/kristinas/events{/privacy}","received_events_url":"https://api.github.com/users/kristinas/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/HoTT/book/labels/math+question","name":"math question","color":"5319e7"}],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":3,"created_at":"2014-12-06T09:36:05Z","updated_at":"2015-01-01T01:06:04Z","closed_at":null,"body":"Dear all,\r\n\r\nI do not quite see what is going on in the 
proofs of lemmas 7.2.9 and 7.3.1.\r\n\r\nThe first lemma states that for n>= -1, A is an n-type iff the iterated loop space \\omega^{n+1}(A,a) is contractible for all a :A. Let us consider an equivalent statement instead, which says that for n>= -1, is-n-type(A) is equivalent to\r\n\\Pi{a:A} is-contr(\\omega^{n+1}(A,a)).\r\n\r\nThe base case when n = -1 is Exercise 3.5, as in the current proof. For the inductive case it suffices to prove the logical equivalence between the two types, as they are both mere props. We have that is-(n+1)-type(A) is by definition\r\n\\Pi{x,y:A} is-n-type(x=y). By induction, this is equivalent to \\Pi{x,y:A} \\Pi{p:x=y} is-contr(\\omega^{n+1}(x=y,p)). On the other hand, \\Pi{x:A} is-contr(\\omega^{n+2}(A,x)) is definitionally equal to \\Pi{x:A} is-contr(\\omega^{n+1}(x=x,refl(x))).\r\nIt remains to show that the two types \\Pi{x,y:A} \\Pi{p:x=y} is-contr(\\omega^{n+1}(x=y,p)) and\r\n\\Pi{x:A} is-contr(\\omega^{n+1}(x=x,refl(x))) are logically equivalent. Going from left to right is obvious and from right to left is just path induction on p. So we are done. No?\r\n\r\nLemma 7.3.1 states that the n-truncation of A is an n-type. When reading the section on truncations for the first time, I was very confused by the motivation given via iterated loop spaces and maps of pointed types. Eventually I gave up and tried to understand it in a different way.\r\nFor example, we can first prove a lemma which says that for n >= -1, the statement that X is an n-type is equivalent to saying that, loosely speaking, any function from S^{n+1} to X is 'constant' (I am putting it in quotes since people like to argue about the terminology). Formally, for n >= -1, is-n-type(X) is equivalent to\r\n\\Pi{r: S^{n+1} \\to X} \\Sigma {h : X} \\Pi{z: S^{n+1}} r(z) = h. There is a simple proof by induction on n. 
I am not sure if this lemma might be useful in other places as a general characteristic of an n-type, but at the very least one direction of it is used in Theorem 7.3.2 without explicit justification.\r\nOf course, once we have the lemma the motivation for defining the truncation as we did, as well as the subsequent proof that the truncation is really an n-type, is trivial.\r\n\r\nPlease let me know what you think.\r\n\r\nKristina\r\n\r\n\r\n\r\n\r\n\r\n\r\n\r\n"},"comment":{"url":"https://api.github.com/repos/HoTT/book/issues/comments/68477349","html_url":"https://github.com/HoTT/book/issues/744#issuecomment-68477349","issue_url":"https://api.github.com/repos/HoTT/book/issues/744","id":68477349,"user":{"login":"mikeshulman","id":646600,"avatar_url":"https://avatars.githubusercontent.com/u/646600?v=3","gravatar_id":"","url":"https://api.github.com/users/mikeshulman","html_url":"https://github.com/mikeshulman","followers_url":"https://api.github.com/users/mikeshulman/followers","following_url":"https://api.github.com/users/mikeshulman/following{/other_user}","gists_url":"https://api.github.com/users/mikeshulman/gists{/gist_id}","starred_url":"https://api.github.com/users/mikeshulman/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/mikeshulman/subscriptions","organizations_url":"https://api.github.com/users/mikeshulman/orgs","repos_url":"https://api.github.com/users/mikeshulman/repos","events_url":"https://api.github.com/users/mikeshulman/events{/privacy}","received_events_url":"https://api.github.com/users/mikeshulman/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:04Z","updated_at":"2015-01-01T01:06:04Z","body":"There's no a priori reason the proofs in the book are the simplest ones; they're just the ones that whoever was writing that chapter thought of at the 
time."}},"public":true,"created_at":"2015-01-01T01:06:04Z","org":{"id":692156,"login":"HoTT","gravatar_id":"","url":"https://api.github.com/orgs/HoTT","avatar_url":"https://avatars.githubusercontent.com/u/692156?"}}
{"id":"2489398439","type":"CreateEvent","actor":{"id":9402134,"login":"kesiena115","gravatar_id":"","url":"https://api.github.com/users/kesiena115","avatar_url":"https://avatars.githubusercontent.com/u/9402134?"},"repo":{"id":28678279,"name":"kesiena115/R1","url":"https://api.github.com/repos/kesiena115/R1"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"Project Repository","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:06:06Z"}
{"id":"2489398441","type":"PushEvent","actor":{"id":734484,"login":"smcelhinney","gravatar_id":"","url":"https://api.github.com/users/smcelhinney","avatar_url":"https://avatars.githubusercontent.com/u/734484?"},"repo":{"id":28406073,"name":"smcelhinney/fireblog","url":"https://api.github.com/repos/smcelhinney/fireblog"},"payload":{"push_id":536753352,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"875e125f1d832fd1d4b917d905c44ccf209ec632","before":"c86fb3faded34b9979276557ee83beb0dc414b59","commits":[{"sha":"875e125f1d832fd1d4b917d905c44ccf209ec632","author":{"email":"9be487b550ce83311cfee6c22e48907b229f1a73@tcd.ie","name":"smcelhinney"},"message":"Fixed some JSHINT stuff.","distinct":true,"url":"https://api.github.com/repos/smcelhinney/fireblog/commits/875e125f1d832fd1d4b917d905c44ccf209ec632"}]},"public":true,"created_at":"2015-01-01T01:06:06Z"}
{"id":"2489398442","type":"IssueCommentEvent","actor":{"id":12637,"login":"rwjblue","gravatar_id":"","url":"https://api.github.com/users/rwjblue","avatar_url":"https://avatars.githubusercontent.com/u/12637?"},"repo":{"id":14089735,"name":"ember-cli/ember-cli","url":"https://api.github.com/repos/ember-cli/ember-cli"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/ember-cli/ember-cli/issues/2091","labels_url":"https://api.github.com/repos/ember-cli/ember-cli/issues/2091/labels{/name}","comments_url":"https://api.github.com/repos/ember-cli/ember-cli/issues/2091/comments","events_url":"https://api.github.com/repos/ember-cli/ember-cli/issues/2091/events","html_url":"https://github.com/ember-cli/ember-cli/issues/2091","id":43685212,"number":2091,"title":"How to create or keep a symlink in dist","user":{"login":"pradius-fut","id":1803477,"avatar_url":"https://avatars.githubusercontent.com/u/1803477?v=3","gravatar_id":"","url":"https://api.github.com/users/pradius-fut","html_url":"https://github.com/pradius-fut","followers_url":"https://api.github.com/users/pradius-fut/followers","following_url":"https://api.github.com/users/pradius-fut/following{/other_user}","gists_url":"https://api.github.com/users/pradius-fut/gists{/gist_id}","starred_url":"https://api.github.com/users/pradius-fut/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/pradius-fut/subscriptions","organizations_url":"https://api.github.com/users/pradius-fut/orgs","repos_url":"https://api.github.com/users/pradius-fut/repos","events_url":"https://api.github.com/users/pradius-fut/events{/privacy}","received_events_url":"https://api.github.com/users/pradius-fut/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":7,"created_at":"2014-09-23T21:16:23Z","updated_at":"2015-01-01T01:06:05Z","closed_at":"2014-10-12T15:17:47Z","body":"i would like to have a symlink `/api` in the dist 
folder to an api webroot outside the ember app root.\r\nHow can i create this symlink during the build process, or make sure it stays in the dist dir (when i create it manually).\r\n\r\nI'm testing ember and ember-cli, i have the same setup for the application in backbone/grunt where this is working fine."},"comment":{"url":"https://api.github.com/repos/ember-cli/ember-cli/issues/comments/68477351","html_url":"https://github.com/ember-cli/ember-cli/issues/2091#issuecomment-68477351","issue_url":"https://api.github.com/repos/ember-cli/ember-cli/issues/2091","id":68477351,"user":{"login":"rwjblue","id":12637,"avatar_url":"https://avatars.githubusercontent.com/u/12637?v=3","gravatar_id":"","url":"https://api.github.com/users/rwjblue","html_url":"https://github.com/rwjblue","followers_url":"https://api.github.com/users/rwjblue/followers","following_url":"https://api.github.com/users/rwjblue/following{/other_user}","gists_url":"https://api.github.com/users/rwjblue/gists{/gist_id}","starred_url":"https://api.github.com/users/rwjblue/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/rwjblue/subscriptions","organizations_url":"https://api.github.com/users/rwjblue/orgs","repos_url":"https://api.github.com/users/rwjblue/repos","events_url":"https://api.github.com/users/rwjblue/events{/privacy}","received_events_url":"https://api.github.com/users/rwjblue/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:05Z","updated_at":"2015-01-01T01:06:05Z","body":"@ef4: Its possible that it was always wrong, but I believe that at the time I wrote it we were using `broccoli-export-tree` so the `results.directory` was actually `dist/`.   Either way you are right, and it is incorrect today.  The general concept is sound though (making a symlink inside the `postBuild` hook).\r\n\r\nIt does seem that we should expose the `builder` model's `this.outputPath` to the hook though.  
Otherwise, you would be assuming `dist/` which is not guaranteed."}},"public":true,"created_at":"2015-01-01T01:06:06Z","org":{"id":10262982,"login":"ember-cli","gravatar_id":"","url":"https://api.github.com/orgs/ember-cli","avatar_url":"https://avatars.githubusercontent.com/u/10262982?"}}
{"id":"2489398443","type":"PushEvent","actor":{"id":5240798,"login":"hxwang","gravatar_id":"","url":"https://api.github.com/users/hxwang","avatar_url":"https://avatars.githubusercontent.com/u/5240798?"},"repo":{"id":20258812,"name":"hxwang/Leetcode","url":"https://api.github.com/repos/hxwang/Leetcode"},"payload":{"push_id":536753353,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e67f3471c2ea1c6556ff18137af91f8d92e5e39d","before":"3b594d10e300b52c24bffed44d66ea7aae8e7639","commits":[{"sha":"e67f3471c2ea1c6556ff18137af91f8d92e5e39d","author":{"email":"320cb2ff8e2e195f7d4e5cd3b27b690e919d61e5@gmail.com","name":"Huangxin"},"message":"Update Implement-strStr.java","distinct":true,"url":"https://api.github.com/repos/hxwang/Leetcode/commits/e67f3471c2ea1c6556ff18137af91f8d92e5e39d"}]},"public":true,"created_at":"2015-01-01T01:06:06Z"}
{"id":"2489398444","type":"PushEvent","actor":{"id":296116,"login":"raorao","gravatar_id":"","url":"https://api.github.com/users/raorao","avatar_url":"https://avatars.githubusercontent.com/u/296116?"},"repo":{"id":28544148,"name":"raorao/groceries","url":"https://api.github.com/repos/raorao/groceries"},"payload":{"push_id":536753354,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"c7a2701ccbe6ce99648377c56a826e0446d44ff9","before":"2cbbf1b1c59eac0c09118d8bbf2465b5d8113959","commits":[{"sha":"c7a2701ccbe6ce99648377c56a826e0446d44ff9","author":{"email":"4c1374f3c4f425d5dc04034017c8940e6ba2f209@gmail.com","name":"raorao"},"message":"adds explicit body-parser dependency","distinct":true,"url":"https://api.github.com/repos/raorao/groceries/commits/c7a2701ccbe6ce99648377c56a826e0446d44ff9"}]},"public":true,"created_at":"2015-01-01T01:06:06Z"}
{"id":"2489398445","type":"PushEvent","actor":{"id":2874368,"login":"janie177","gravatar_id":"","url":"https://api.github.com/users/janie177","avatar_url":"https://avatars.githubusercontent.com/u/2874368?"},"repo":{"id":28406300,"name":"janie177/MGRacesRedone","url":"https://api.github.com/repos/janie177/MGRacesRedone"},"payload":{"push_id":536753355,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"73f1823a1a9f25ba53c15b7ec32607e1bed77e09","before":"d1da31bff6f19d84613fa5ef6afb9124ca12d28c","commits":[{"sha":"73f1823a1a9f25ba53c15b7ec32607e1bed77e09","author":{"email":"56d775a7c13bb3dbfe56eb5fa7074a17cc2db31c@hotmail.com","name":"Jan"},"message":"Minor adjustments.\nFixed potion effects and amplifiers being switched for mobs.","distinct":true,"url":"https://api.github.com/repos/janie177/MGRacesRedone/commits/73f1823a1a9f25ba53c15b7ec32607e1bed77e09"}]},"public":true,"created_at":"2015-01-01T01:06:06Z"}
{"id":"2489398447","type":"PushEvent","actor":{"id":248290,"login":"lexmag","gravatar_id":"","url":"https://api.github.com/users/lexmag","avatar_url":"https://avatars.githubusercontent.com/u/248290?"},"repo":{"id":20156619,"name":"lexmag/tty2048","url":"https://api.github.com/repos/lexmag/tty2048"},"payload":{"push_id":536753356,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d9cb70b865980e3ddba854ac4d08d791957304ee","before":"5fc470c05be7c489aa9d865205e663bc8d2c33f6","commits":[{"sha":"d9cb70b865980e3ddba854ac4d08d791957304ee","author":{"email":"24e2170222e81d4e3239eb4676aa506f230bfdd9@me.com","name":"Aleksei Magusev"},"message":"Do not rely on the Crypto application","distinct":true,"url":"https://api.github.com/repos/lexmag/tty2048/commits/d9cb70b865980e3ddba854ac4d08d791957304ee"}]},"public":true,"created_at":"2015-01-01T01:06:06Z"}
{"id":"2489398449","type":"PushEvent","actor":{"id":3112493,"login":"djstroky","gravatar_id":"","url":"https://api.github.com/users/djstroky","avatar_url":"https://avatars.githubusercontent.com/u/3112493?"},"repo":{"id":28258658,"name":"djstroky/backbone-google-calendar","url":"https://api.github.com/repos/djstroky/backbone-google-calendar"},"payload":{"push_id":536753358,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"293361e1dc564daae89ebb389032fb076a89e459","before":"e2c85077a3ea6dd238684e62e049d68fb686c497","commits":[{"sha":"293361e1dc564daae89ebb389032fb076a89e459","author":{"email":"b9600dec4a2cd1f0ecf0c56887050a58cde1ff86@yahoo.com","name":"djstroky"},"message":"fixed misspelling","distinct":true,"url":"https://api.github.com/repos/djstroky/backbone-google-calendar/commits/293361e1dc564daae89ebb389032fb076a89e459"}]},"public":true,"created_at":"2015-01-01T01:06:06Z"}
{"id":"2489398458","type":"PushEvent","actor":{"id":7336721,"login":"aow1980","gravatar_id":"","url":"https://api.github.com/users/aow1980","avatar_url":"https://avatars.githubusercontent.com/u/7336721?"},"repo":{"id":28617444,"name":"aow1980/kernel_lge_hammerhead","url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead"},"payload":{"push_id":536753361,"size":33,"distinct_size":33,"ref":"refs/heads/lp5.0","head":"754847ec691ce0d45103f052e86aafe744cddc81","before":"a4e247102c297d001cc6b1e564060ae3fe7d174b","commits":[{"sha":"6adbdc70a8846302e95d7c637d4d601848072264","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"block: row: Fix crash when adding a new field in bio struct\n\nWhen adding new field to struct bio there is a crash in the removed\ncode lines. This issue was introduced by commit\n80a8f0f87bee18283e9ca0a8966ec97ad9f084e5  \"block: row-iosched idling\ntriggered by readahead pages\"\n\n(Partly) reverting this patch till root cause is fixed (on FS level).\n\nChange-Id: Idce180802227aaab495bf0723768ba4cb437bcab\nSigned-off-by: Tanya Brokhman <tlinder@codeaurora.org>\nSigned-off-by: engstk <eng.stk@sapo.pt>\nSigned-off-by: flar2 <asegaert@gmail.com>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/6adbdc70a8846302e95d7c637d4d601848072264"},{"sha":"cc6449f427439b647e8e521db660d15d1d20ed73","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"block: introduce the BFQ-v6 I/O sched for 3.4\n\nAdd the BFQ-v6 I/O scheduler to 3.4.\nThe general structure is borrowed from CFQ, as much code. A (bfq_)queue is\nassociated to each task doing I/O on a device, and each time a scheduling\ndecision has to be made a queue is selected and served until it expires.\n\n    - Slices are given in the service domain: tasks are assigned budgets,\n      measured in number of sectors. 
Once got the disk, a task must\n      however consume its assigned budget within a configurable maximum time\n      (by default, the maximum possible value of the budgets is automatically\n      computed to comply with this timeout). This allows the desired latency\n      vs \"throughput boosting\" tradeoff to be set.\n\n    - Budgets are scheduled according to a variant of WF2Q+, implemented\n      using an augmented rb-tree to take eligibility into account while\n      preserving an O(log N) overall complexity.\n\n    - A low-latency tunable is provided; if enabled, both interactive and soft\n      real-time applications are guaranteed very low latency.\n\n    - Latency guarantees are preserved also in presence of NCQ.\n\n    - Also with flash-based devices, a high throughput is achieved while\n      still preserving latency guarantees.\n\n    - A useful feature borrowed from CFQ: static fallback queue for OOM.\n\n    - Differently from CFQ, BFQ uses a unified mechanism (Early Queue Merge,\n      EQM) to get a sequential read pattern, and hence a high throughput,\n      with any set of processes performing interleaved I/O. EQM also\n      preserves low latency. The code for detecting whether two queues have\n      to be merged is a slightly modified version of the CFQ code for\n      detecting whether two queues belong to cooperating processes and whether\n      the service of a queue should be preempted to boost the throughput.\n\n    - BFQ supports full hierarchical scheduling, exporting a cgroups\n      interface.  
Each node has a full scheduler, so each group can\n      be assigned its own ioprio (mapped to a weight, see next point)\n      and an ioprio_class.\n\n    - If the cgroups interface is used, weights can be explictly assigned,\n      otherwise ioprio values are mapped to weights using the relation\n      weight = IOPRIO_BE_NR - ioprio.\n\n    - ioprio classes are served in strict priority order, i.e., lower\n      priority queues are not served as long as there are higher priority\n      queues.  Among queues in the same class the bandwidth is distributed\n      in proportion to the weight of each queue. A very thin extra bandwidth\n      is however guaranteed to the Idle class, to prevent it from starving.\n\nChange-Id: Iae219b7532e7c41a88601a77f86f8f20211c30da\nSigned-off-by: Paolo Valente <paolo.valente@unimore.it>\nSigned-off-by: Arianna Avanzini <avanzini.arianna@gmail.com>\nSigned-off-by: flar2 <asegaert@gmail.com>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/cc6449f427439b647e8e521db660d15d1d20ed73"},{"sha":"831b6b7d7b89efd711eef2e14eb8b9f46b4916c5","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"block: cgroups, kconfig, build bits for BFQ-v6-3.4\n\nUpdate Kconfig.iosched and do the related Makefile changes to include\nkernel configuration options for BFQ. 
Also add the bfqio controller\nto the cgroups subsystem.\n\nChange-Id: I51837750d0a3ac5da9c5adc0e3dcff5894bf1fc8\nSigned-off-by: Paolo Valente <paolo.valente@unimore.it>\nSigned-off-by: Arianna Avanzini <avanzini.arianna@gmail.com>\nSigned-off-by: flar2 <asegaert@gmail.com>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/831b6b7d7b89efd711eef2e14eb8b9f46b4916c5"},{"sha":"ecdda7ef938d5aa2db8dc8aa4da733328d6ea836","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"remove Defconfigs I don't use\n\nChange-Id: I507046245020147e89f11c33414ebf72e25df61a","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/ecdda7ef938d5aa2db8dc8aa4da733328d6ea836"},{"sha":"d43565d19aeb25eb8432c8636bf7c4d0a18fc974","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"Add BFQ I/O Scheduler\n\nChange-Id: I1a415a3f3f35fbdc03d6737e4cfd5ba0deddde28","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/d43565d19aeb25eb8432c8636bf7c4d0a18fc974"},{"sha":"d3c5b34d36f3ea86b8d73555659edad098f2e06e","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"net: fix info leak in compat dev_ifconf()\n\nThe implementation of dev_ifconf() for the compat ioctl interface uses\nan intermediate ifc structure allocated in userland for the duration of\nthe syscall. Though, it fails to initialize the padding bytes inserted\nfor alignment and that for leaks four bytes of kernel stack. Add an\nexplicit memset(0) before filling the structure to avoid the info leak.\n\nSigned-off-by: Mathias Krause <minipli@googlemail.com>\nSigned-off-by: David S. 
Miller <davem@davemloft.net>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>\nnet: Block MSG_CMSG_COMPAT in send(m)msg and recv(m)msg\n\nMSG_CMSG_COMPAT is (AFAIK) not intended to be part of the API --\nit's a hack that steals a bit to indicate to other networking code\nthat a compat entry was used.  So don't allow it from a non-compat\nsyscall.\n\nThis prevents an oops when running this code:\n\nint main()\n{\n\tint s;\n\tstruct sockaddr_in addr;\n\tstruct msghdr *hdr;\n\n\tchar *highpage = mmap((void*)(TASK_SIZE_MAX - 4096), 4096,\n\t                      PROT_READ | PROT_WRITE,\n\t                      MAP_PRIVATE | MAP_ANONYMOUS | MAP_FIXED, -1, 0);\n\tif (highpage == MAP_FAILED)\n\t\terr(1, \"mmap\");\n\n\ts = socket(AF_INET, SOCK_DGRAM, IPPROTO_UDP);\n\tif (s == -1)\n\t\terr(1, \"socket\");\n\n        addr.sin_family = AF_INET;\n        addr.sin_port = htons(1);\n        addr.sin_addr.s_addr = htonl(INADDR_LOOPBACK);\n\tif (connect(s, (struct sockaddr*)&addr, sizeof(addr)) != 0)\n\t\terr(1, \"connect\");\n\n\tvoid *evil = highpage + 4096 - COMPAT_MSGHDR_SIZE;\n\tprintf(\"Evil address is %p\\n\", evil);\n\n\tif (syscall(__NR_sendmmsg, s, evil, 1, MSG_CMSG_COMPAT) < 0)\n\t\terr(1, \"sendmmsg\");\n\n\treturn 0;\n}\n\nSigned-off-by: Andy Lutomirski <luto@amacapital.net>\nCc: David S. Miller <davem@davemloft.net>\nSigned-off-by: David S. Miller <davem@davemloft.net>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>\nnet: heap overflow in __audit_sockaddr()\n\nWe need to cap ->msg_namelen or it leads to a buffer overflow when we\nto the memcpy() in __audit_sockaddr().  
It requires CAP_AUDIT_CONTROL to\nexploit this bug.\n\nThe call tree is:\n___sys_recvmsg()\n  move_addr_to_user()\n    audit_sockaddr()\n      __audit_sockaddr()\n\nReported-by: Jüri Aedla <juri.aedla@gmail.com>\nSigned-off-by: Dan Carpenter <dan.carpenter@oracle.com>\nSigned-off-by: David S. Miller <davem@davemloft.net>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>\nnet: add BUG_ON if kernel advertises msg_namelen > sizeof(struct sockaddr_storage)\n\nIn that case it is probable that kernel code overwrote part of the\nstack. So we should bail out loudly here.\n\nThe BUG_ON may be removed in future if we are sure all protocols are\nconformant.\n\nSuggested-by: Eric Dumazet <eric.dumazet@gmail.com>\nSigned-off-by: Hannes Frederic Sowa <hannes@stressinduktion.org>\nSigned-off-by: David S. Miller <davem@davemloft.net>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>\nnet: clamp ->msg_namelen instead of returning an error\n\nIf kmsg->msg_namelen > sizeof(struct sockaddr_storage) then in the\noriginal code that would lead to memory corruption in the kernel if you\nhad audit configured.  If you didn't have audit configured it was\nharmless.\n\nThere are some programs such as beta versions of Ruby which use too\nlarge of a buffer and returning an error code breaks them.  We should\nclamp the ->msg_namelen value instead.\n\nFixes: 1661bf364ae9 (\"net: heap overflow in __audit_sockaddr()\")\nReported-by: Eric Wong <normalperson@yhbt.net>\nSigned-off-by: Dan Carpenter <dan.carpenter@oracle.com>\nTested-by: Eric Wong <normalperson@yhbt.net>\nAcked-by: Eric Dumazet <edumazet@google.com>\nSigned-off-by: David S. 
Miller <davem@davemloft.net>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>\nnet: socket: error on a negative msg_namelen\n\nWhen copying in a struct msghdr from the user, if the user has set the\nmsg_namelen parameter to a negative value it gets clamped to a valid\nsize due to a comparison between signed and unsigned values.\n\nEnsure the syscall errors when the user passes in a negative value.\n\nSigned-off-by: Matthew Leach <matthew.leach@arm.com>\nSigned-off-by: David S. Miller <davem@davemloft.net>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>\nnet: Fix references to out-of-scope variables in put_cmsg_compat()\n\nIn net/compat.c::put_cmsg_compat() we may assign 'data' the address of\neither the 'ctv' or 'cts' local variables inside the 'if\n(!COMPAT_USE_64BIT_TIME)' branch.\n\nThose variables go out of scope at the end of the 'if' statement, so\nwhen we use 'data' further down in 'copy_to_user(CMSG_COMPAT_DATA(cm),\ndata, cmlen - sizeof(struct compat_cmsghdr))' there's no telling what\nit may be refering to - not good.\n\nFix the problem by simply giving 'ctv' and 'cts' function scope.\n\nChange-Id: I8ebc2efb0ae5d1009804698bebefb16a2b5fd2dd\nSigned-off-by: Jesper Juhl <jj@chaosbits.net>\nSigned-off-by: David S. 
Miller <davem@davemloft.net>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/d3c5b34d36f3ea86b8d73555659edad098f2e06e"},{"sha":"ec249eef47eeef64595c1d8a12ac530e1884d6c8","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"Fix order of arguments to compat_put_time[spec|val]\n\nCommit 644595f89620 (\"compat: Handle COMPAT_USE_64BIT_TIME in\nnet/socket.c\") introduced a bug where the helper functions to take\neither a 64-bit or compat time[spec|val] got the arguments in the wrong\norder, passing the kernel stack pointer off as a user pointer (and vice\nversa).\n\nBecause of the user address range check, that in turn then causes an\nEFAULT due to the user pointer range checking failing for the kernel\naddress.  Incorrectly resuling in a failed system call for 32-bit\nprocesses with a 64-bit kernel.\n\nOn odder architectures like HP-PA (with separate user/kernel address\nspaces), it can be used read kernel memory.\n\nChange-Id: I012dfbe26f92558e2203ae36db662bf33deb4329\nSigned-off-by: Mikulas Patocka <mpatocka@redhat.com>\nSigned-off-by: Linus Torvalds <torvalds@linux-foundation.org>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>\nSigned-off-by: engstk <eng.stk@sapo.pt>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/ec249eef47eeef64595c1d8a12ac530e1884d6c8"},{"sha":"c434ee7f4a569336e1790f39ce1bc018e16197d0","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"af_key: fix info leaks in notify messages\n\nkey_notify_sa_flush() and key_notify_policy_flush() miss to initialize\nthe sadb_msg_reserved member of the broadcasted message and thereby\nleak 2 bytes of heap memory to listeners. 
Fix that.\n\nSigned-off-by: Mathias Krause <minipli@googlemail.com>\nCc: Steffen Klassert <steffen.klassert@secunet.com>\nCc: \"David S. Miller\" <davem@davemloft.net>\nCc: Herbert Xu <herbert@gondor.apana.org.au>\nSigned-off-by: David S. Miller <davem@davemloft.net>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>\nSigned-off-by: engstk <eng.stk@sapo.pt>\naf_key: more info leaks in pfkey messages\n\nThis is inspired by a5cc68f3d6 \"af_key: fix info leaks in notify\nmessages\".  There are some struct members which don't get initialized\nand could disclose small amounts of private information.\n\nAcked-by: Mathias Krause <minipli@googlemail.com>\nSigned-off-by: Dan Carpenter <dan.carpenter@oracle.com>\nAcked-by: Steffen Klassert <steffen.klassert@secunet.com>\nSigned-off-by: David S. Miller <davem@davemloft.net>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>\nSigned-off-by: engstk <eng.stk@sapo.pt>\naf_key: initialize satype in key_notify_policy_flush()\n\nThis field was left uninitialized. 
Some user daemons perform check against this\nfield.\n\nChange-Id: I747fca7338e0441afdd418fba5dfec51aa94f1c4\nSigned-off-by: Nicolas Dichtel <nicolas.dichtel@6wind.com>\nSigned-off-by: Steffen Klassert <steffen.klassert@secunet.com>\nCc: Luis Henriques <luis.henriques@canonical.com>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>\nSigned-off-by: engstk <eng.stk@sapo.pt>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/c434ee7f4a569336e1790f39ce1bc018e16197d0"},{"sha":"f54b415df6c0a73280bc28a7c572ae748b588bc2","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"Fix blocking allocations called very early during bootup\n\nDuring early boot, when the scheduler hasn't really been fully set up,\nwe really can't do blocking allocations because with certain (dubious)\nconfigurations the \"might_resched()\" calls can actually result in\nscheduling events.\n\nWe could just make such users always use GFP_ATOMIC, but quite often the\ncode that does the allocation isn't really aware of the fact that the\nscheduler isn't up yet, and forcing that kind of random knowledge on the\ninitialization code is just annoying and not good for anybody.\n\nAnd we actually have a the 'gfp_allowed_mask' exactly for this reason:\nit's just that the kernel init sequence happens to set it to allow\nblocking allocations much too early.\n\nSo move the 'gfp_allowed_mask' initialization from 'start_kernel()'\n(which is some of the earliest init code, and runs with preemption\ndisabled for good reasons) into 'kernel_init()'.  
kernel_init() is run\nin the newly created thread that will become the 'init' process, as\nopposed to the early startup code that runs within the context of what\nwill be the first idle thread.\n\nSo by the time we reach 'kernel_init()', we know that the scheduler must\nbe at least limping along, because we've already scheduled from the idle\nthread into the init thread.\n\nReported-by: Steven Rostedt <rostedt@goodmis.org>\nCc: David Rientjes <rientjes@google.com>\nSigned-off-by: Linus Torvalds <torvalds@linux-foundation.org>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>\nSigned-off-by: engstk <eng.stk@sapo.pt>\nmodule_param: stop double-calling parameters.\n\nCommit 026cee0086fe1df4cf74691cf273062cc769617d \"params:\n<level>_initcall-like kernel parameters\" set old-style module\nparameters to level 0.  And we call those level 0 calls where we used\nto, early in start_kernel().\n\nWe also loop through the initcall levels and call the levelled\nmodule_params before the corresponding initcall.  Unfortunately level\n0 is early_init(), so we call the standard module_param calls twice.\n\n(Turns out most things don't care, but at least ubi.mtd does).\n\nChange the level to -1 for standard module_param calls.\n\nReported-by: Benoît Thébaudeau <benoit.thebaudeau@advansee.com>\nSigned-off-by: Rusty Russell <rusty@rustcorp.com.au>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>\nSigned-off-by: engstk <eng.stk@sapo.pt>\nof: fdt: fix memory initialization for expanded DT\n\nAlready existing property flags are filled wrong for properties created from\ninitial FDT. This could cause problems if this DYNAMIC device-tree functions\nare used later, i.e. properties are attached/detached/replaced. 
Simply dumping\nflags from the running system show, that some initial static (not allocated via\nkzmalloc()) nodes are marked as dynamic.\n\nI putted some debug extensions to property_proc_show(..) :\n..\n+       if (OF_IS_DYNAMIC(pp))\n+               pr_err(\"DEBUG: xxx : OF_IS_DYNAMIC\\n\");\n+       if (OF_IS_DETACHED(pp))\n+               pr_err(\"DEBUG: xxx : OF_IS_DETACHED\\n\");\n\nwhen you operate on the nodes (e.g.: ~$ cat /proc/device-tree/*some_node*) you\nwill see that those flags are filled wrong, basically in most cases it will dump\na DYNAMIC or DETACHED status, which is in not true.\n(BTW. this OF_IS_DETACHED is a own define for debug purposes which which just\nmake a test_bit(OF_DETACHED, &x->_flags)\n\nIf nodes are dynamic kernel is allowed to kfree() them. But it will crash\nattempting to do so on the nodes from FDT -- they are not allocated via\nkzmalloc().\n\nSigned-off-by: Wladislav Wiebe <wladislav.kw@gmail.com>\nAcked-by: Alexander Sverdlin <alexander.sverdlin@nsn.com>\nSigned-off-by: Rob Herring <rob.herring@calxeda.com>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>\nSigned-off-by: engstk <eng.stk@sapo.pt>\nof: Fix missing memory initialization on FDT unflattening\n\nAny calls to dt_alloc() need to be zeroed. This is a temporary fix, but\nthe allocation function itself needs to zero memory before returning\nit. 
This is a follow up to patch 9e4012752, \"of: fdt: fix memory\ninitialization for expanded DT\" which fixed one call site but missed\nanother.\n\nSigned-off-by: Grant Likely <grant.likely@linaro.org>\nAcked-by: Wladislav Wiebe <wladislav.kw@gmail.com>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>\nSigned-off-by: engstk <eng.stk@sapo.pt>\nregulator: core: Release regulator-regulator supplies on error\n\nIf we fail while registering a regulator make sure we release the supply\nfor the regulator if there is one.\n\nChange-Id: Icfa3c3087d9d91ee2272fa77614302e15fa0b247\nSigned-off-by: Mark Brown <broonie@opensource.wolfsonmicro.com>\nAcked-by: Liam Girdwood <lrg@ti.com>\nSigned-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>\nSigned-off-by: Pranav Vashi <neobuddy89@gmail.com>\nSigned-off-by: engstk <eng.stk@sapo.pt>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/f54b415df6c0a73280bc28a7c572ae748b588bc2"},{"sha":"76cdc5eff4f5f89aaa761726e0199d682db23183","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"msm: thermal: add my msm thermal code.\n\nChange-Id: I081bef136e4066aec962c1600e27cf96a213119d\nSigned-off-by: franciscofranco <franciscofranco.1990@gmail.com>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/76cdc5eff4f5f89aaa761726e0199d682db23183"},{"sha":"ef7789edd4f11fb87d4c44f4e5d98acb32954a96","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"msm: thermal: no need for this check.\n\nSigned-off-by: franciscofranco <franciscofranco.1990@gmail.com>\nmsm: thermal: the wq can freezes during freezer phase.\n\nSigned-off-by: franciscofranco <franciscofranco.1990@gmail.com>\nmsm: thermal: improve some codes.\n\nSigned-off-by: franciscofranco <franciscofranco.1990@gmail.com>\ndrivers: thermal: back to 70C throttle 
point.\n\nChange-Id: Ice0bf89b16e2b5c3adec59dedbc90dcaf3e01658\nSigned-off-by: franciscofranco <franciscofranco.1990@gmail.com>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/ef7789edd4f11fb87d4c44f4e5d98acb32954a96"},{"sha":"dae1230cfafa03edcf45ac45d655368060253345","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"thermal: add a 5C threshold to prevent throttled/unthrottled to be triggered a lot when the CPU temp dwells close to the temp threshold.\n\nSigned-off-by: franciscofranco <franciscofranco.1990@gmail.com>\nmsm: thermal: Update thermal subsystem\n\nThis is a squash of the following commits:\n\n4bc738d2 msm: thermal: Set vdd restriction initialize level to -1\n5daeff0f msm: thermal: Clean up msm cpufreq function calls\n6b21cae8 thermal: tsens: Fix invalid set temperature check\nc473c9dd Revert \"msm: thermal: Clean up msm cpufreq function calls\"\nbb646211 thermal: Add sensor API to allow any driver to set thresholds\n718bf641 thermal: msm: tsens: Notify thermal framework on threshold cross\n4ff40944 msm: thermal: Enable hotplug support in kernel\n3af26db0 thermal: Fix sensor thresholds not accounted correctly\nd8b1e1ec Revert \"Revert \"msm: thermal: Clean up msm cpufreq function calls\"\"\nb2f16712 thermal: Add Support for enabling and disabling tsens trip\n81c1b0b7 msm: thermal: Don't initialize hotplug thread when not configured\n89961312 msm: thermal: Add support for emergency frequency mitigation\n6460392a msm: thermal: Add IOCTL interface support to Kernel Thermal Monitor\n\nBug: 14139855\nConflicts:\n\tdrivers/thermal/msm_thermal.c\nSigned-off-by: Naveen Ramaraj <nramaraj@codeaurora.org>\n\nChange-Id: 
I22911e6ffe1a9f553b1c721341fbe530e03eec6c","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/dae1230cfafa03edcf45ac45d655368060253345"},{"sha":"2cb3f5da76a724cd78ba57184fbc11ed2a529957","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"msm: thermal: refactor the code.\n\nChange-Id: I313980b5ed2abd9761307db0bf40c08af96e7dc2\nSigned-off-by: franciscofranco <franciscofranco.1990@gmail.com>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/2cb3f5da76a724cd78ba57184fbc11ed2a529957"},{"sha":"a58513ad8a06c5bf56b0577026678eab08128aca","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"msm: thermal: there's no need to ask for a policy, we can simply lift the limit with LONG_MAX. Also queue only on cpu0.\n\nChange-Id: I41559724a44f3e9b8bbce22aa4f15b254dfd73cb\nSigned-off-by: franciscofranco <franciscofranco.1990@gmail.com>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/a58513ad8a06c5bf56b0577026678eab08128aca"},{"sha":"9bc3ecbd3e5f1819321286d96979d95d6234f3c6","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"msm: thermal: make sure we actually want to go through with the policy adjust since this can be triggered by any policy update with the cPUFREQ_ADJUST flag.\n\nSigned-off-by: franciscofranco <franciscofranco.1990@gmail.com>\nmsm: thermal: change the init sequence.\n\nChange-Id: I6a3b8ad7f80bcb2484f2f69effd5d1105073e73b\nSigned-off-by: franciscofranco <franciscofranco.1990@gmail.com>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/9bc3ecbd3e5f1819321286d96979d95d6234f3c6"},{"sha":"d024894241a20ad55a57280127becf3d4013a628","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"msm: thermal: add my Thermal 
solution\n\nChange-Id: I5fc653d6bcacf97b36f4f8ec63ccdf8dd94e1999\nSigned-off-by: franciscofranco <franciscofranco.1990@gmail.com>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/d024894241a20ad55a57280127becf3d4013a628"},{"sha":"036a45f062aea6b8abb9bb0bbfc64f436d68d5ff","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"msm: rq_stats: Calculate load based on current freq limit\n\nPrior to this patch, load has been calculated based on an\ninitial value of policy.cpuinfo.max_freq. This value may\nchange for several reasons: userspace settings or thermal\nthrottling (hello hammerhead!). This results in unreliable\ncalculations that confuse mpdecision which accesses\n/sys/devices/system/cpu/cpu0/rq-stats/* for stats info.\nConsider current policy.max to fix this behaviour.\n\nChange-Id: Iae1f2fc7f4aa470f7e80371c1ebcf7be423f51ca\nSigned-off-by: engstk <eng.stk@sapo.pt>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/036a45f062aea6b8abb9bb0bbfc64f436d68d5ff"},{"sha":"a025c1d886c10249118d2e16abed161c39d501cf","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"thermal: raise thermal frequency throttle limits\n\nChange-Id: I83f9a590ce30d965534426e517b566c0f704ab00\nSigned-off-by: engstk <eng.stk@sapo.pt>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/a025c1d886c10249118d2e16abed161c39d501cf"},{"sha":"a6b0b481b5f9808b4ff5777e67392f38978df6f8","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"Switch to Franco Thermal control\n\nChange-Id: 
I08eada544f6d1fb5cbbbf01e89978346760bceef","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/a6b0b481b5f9808b4ff5777e67392f38978df6f8"},{"sha":"88698edd466cabc71f5523640a07d9bd22409cce","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"writeback: fix race that cause writeback hung\n\nThere is a race between mark inode dirty and writeback thread, see the\nfollowing scenario.  In this case, writeback thread will not run though\nthere is dirty_io.\n\n__mark_inode_dirty()                                          bdi_writeback_workfn()\n\t...                                                       \t...\n\tspin_lock(&inode->i_lock);\n\t...\n\tif (bdi_cap_writeback_dirty(bdi)) {\n\t    <<< assume wb has dirty_io, so wakeup_bdi is false.\n\t    <<< the following inode_dirty also have wakeup_bdi false.\n\t    if (!wb_has_dirty_io(&bdi->wb))\n\t\t    wakeup_bdi = true;\n\t}\n\tspin_unlock(&inode->i_lock);\n\t                                                            <<< assume last dirty_io is removed here.\n\t                                                            pages_written = wb_do_writeback(wb);\n\t                                                            ...\n\t                                                            <<< work_list empty and wb has no dirty_io,\n\t                                                            <<< delayed_work will not be queued.\n\t                                                            if (!list_empty(&bdi->work_list) ||\n\t                                                                (wb_has_dirty_io(wb) && dirty_writeback_interval))\n\t                                                                queue_delayed_work(bdi_wq, &wb->dwork,\n\t                                                                    msecs_to_jiffies(dirty_writeback_interval * 10));\n\tspin_lock(&bdi->wb.list_lock);\n\tinode->dirtied_when = jiffies;\n\t<<< new 
dirty_io is added.\n\tlist_move(&inode->i_wb_list, &bdi->wb.b_dirty);\n\tspin_unlock(&bdi->wb.list_lock);\n\n\t<<< though there is dirty_io, but wakeup_bdi is false,\n\t<<< so writeback thread will not be waked up and\n\t<<< the new dirty_io will not be flushed.\n\tif (wakeup_bdi)\n\t    bdi_wakeup_thread_delayed(bdi);\n\nWriteback will run until there is a new flush work queued.  This may cause\na lot of dirty pages stay in memory for a long time.\n\nChange-Id: I4f25c8878d0aabcc3408af017f2948776565fead\nSigned-off-by: Junxiao Bi <junxiao.bi@oracle.com>\nReviewed-by: Jan Kara <jack@suse.cz>\nCc: Fengguang Wu <fengguang.wu@intel.com>\nSigned-off-by: Andrew Morton <akpm@linux-foundation.org>\nSigned-off-by: Linus Torvalds <torvalds@linux-foundation.org>\nSigned-off-by: Francisco Franco <franciscofranco.1990@gmail.com>\nSigned-off-by: Chet Kener <Cl3Kener@gmail.com>","distinct":true,"url":"https://api.github.com/repos/aow1980/kernel_lge_hammerhead/commits/88698edd466cabc71f5523640a07d9bd22409cce"}]},"public":true,"created_at":"2015-01-01T01:06:07Z"}
{"id":"2489398459","type":"IssueCommentEvent","actor":{"id":1235097,"login":"rmarinho","gravatar_id":"","url":"https://api.github.com/users/rmarinho","avatar_url":"https://avatars.githubusercontent.com/u/1235097?"},"repo":{"id":20463939,"name":"XLabs/Xamarin-Forms-Labs","url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/543","labels_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/543/labels{/name}","comments_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/543/comments","events_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/543/events","html_url":"https://github.com/XLabs/Xamarin-Forms-Labs/issues/543","id":53118143,"number":543,"title":"Update Nuget build process","user":{"login":"ravensorb","id":2222472,"avatar_url":"https://avatars.githubusercontent.com/u/2222472?v=3","gravatar_id":"","url":"https://api.github.com/users/ravensorb","html_url":"https://github.com/ravensorb","followers_url":"https://api.github.com/users/ravensorb/followers","following_url":"https://api.github.com/users/ravensorb/following{/other_user}","gists_url":"https://api.github.com/users/ravensorb/gists{/gist_id}","starred_url":"https://api.github.com/users/ravensorb/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ravensorb/subscriptions","organizations_url":"https://api.github.com/users/ravensorb/orgs","repos_url":"https://api.github.com/users/ravensorb/repos","events_url":"https://api.github.com/users/ravensorb/events{/privacy}","received_events_url":"https://api.github.com/users/ravensorb/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/labels/enhancement","name":"enhancement","color":"84b6eb"}],"state":"open","locked":false,"assignee":{"login":"ravensorb","id":2222472,"avatar_url":"https://avatars.githubusercontent.com
/u/2222472?v=3","gravatar_id":"","url":"https://api.github.com/users/ravensorb","html_url":"https://github.com/ravensorb","followers_url":"https://api.github.com/users/ravensorb/followers","following_url":"https://api.github.com/users/ravensorb/following{/other_user}","gists_url":"https://api.github.com/users/ravensorb/gists{/gist_id}","starred_url":"https://api.github.com/users/ravensorb/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ravensorb/subscriptions","organizations_url":"https://api.github.com/users/ravensorb/orgs","repos_url":"https://api.github.com/users/ravensorb/repos","events_url":"https://api.github.com/users/ravensorb/events{/privacy}","received_events_url":"https://api.github.com/users/ravensorb/received_events","type":"User","site_admin":false},"milestone":null,"comments":20,"created_at":"2014-12-30T14:17:00Z","updated_at":"2015-01-01T01:06:07Z","closed_at":null,"body":"Now that we have the main work done for porting to the new structure, we should probably update the nuget build process.  
Anyone interested in taking this one?"},"comment":{"url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/comments/68477353","html_url":"https://github.com/XLabs/Xamarin-Forms-Labs/issues/543#issuecomment-68477353","issue_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/543","id":68477353,"user":{"login":"rmarinho","id":1235097,"avatar_url":"https://avatars.githubusercontent.com/u/1235097?v=3","gravatar_id":"","url":"https://api.github.com/users/rmarinho","html_url":"https://github.com/rmarinho","followers_url":"https://api.github.com/users/rmarinho/followers","following_url":"https://api.github.com/users/rmarinho/following{/other_user}","gists_url":"https://api.github.com/users/rmarinho/gists{/gist_id}","starred_url":"https://api.github.com/users/rmarinho/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/rmarinho/subscriptions","organizations_url":"https://api.github.com/users/rmarinho/orgs","repos_url":"https://api.github.com/users/rmarinho/repos","events_url":"https://api.github.com/users/rmarinho/events{/privacy}","received_events_url":"https://api.github.com/users/rmarinho/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:07Z","updated_at":"2015-01-01T01:06:07Z","body":"hey guys, great work, i m not having the time i wanted to help you guys.. but here are my 2 cents.. \r\n\r\nWe have decided before that XLabs next release will be 2.0, i think we should launch 2.0-pre1 where we don't have unified support, and we will launch the final version of 2.0 when Xamarin releases unified on stable. \r\n\r\nWe still need to put the packages as pre to see issues others can find in our new structure.\r\n\r\n@ravensorb  is the nuget process the same?  build everything for the release folder and nuget picks up from there? 
\r\n\r\nwe should also look and this is the time to remove obsolete or properties that are now covered on Xamarin Core, like stuff related to fonts (extended label if i recall)"}},"public":true,"created_at":"2015-01-01T01:06:08Z","org":{"id":7787062,"login":"XLabs","gravatar_id":"","url":"https://api.github.com/orgs/XLabs","avatar_url":"https://avatars.githubusercontent.com/u/7787062?"}}
{"id":"2489398461","type":"PushEvent","actor":{"id":6241554,"login":"leo-yuriev","gravatar_id":"","url":"https://api.github.com/users/leo-yuriev","avatar_url":"https://avatars.githubusercontent.com/u/6241554?"},"repo":{"id":23696666,"name":"leo-yuriev/openldap-lmdb-challenge","url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge"},"payload":{"push_id":536753363,"size":14,"distinct_size":14,"ref":"refs/heads/2.4-devel","head":"3c4005e809a729cc9f6b63e39ee26e39b3f10fe8","before":"f705475af08e6b50420a8ff22b71cfbe45cea409","commits":[{"sha":"0fd73aa27bb25ed790d723ceaca16c4bf228a691","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"ps-build.sh","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/0fd73aa27bb25ed790d723ceaca16c4bf228a691"},{"sha":"3b9f7bf005eb43645b2dfb3c1eb1341912ea39ca","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"qt-creator project","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/3b9f7bf005eb43645b2dfb3c1eb1341912ea39ca"},{"sha":"677cefedf3d6f46ae74b7b25db28b53d32788c3e","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix debug marco","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/677cefedf3d6f46ae74b7b25db28b53d32788c3e"},{"sha":"0ab01722504df3e913a7c7559a2f06ba54820470","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: using strerror_r()","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/0ab01722504df3e913a7c7559a2f06ba54820470"},{"sha":"c32f6ea113ddac0cdd1a7dd1944994714d45863b","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: read/write ignored 
result.","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/c32f6ea113ddac0cdd1a7dd1944994714d45863b"},{"sha":"dccc7ef0254abe37e3e91d527032dd8120249859","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: check getcmd() result","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/dccc7ef0254abe37e3e91d527032dd8120249859"},{"sha":"c20b58e144515fcb25c821d5bf2fd5a58eea3055","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: printf unused agrv[0] in main()","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/c20b58e144515fcb25c821d5bf2fd5a58eea3055"},{"sha":"0bf7975dc8489f33e5f8a7331308fc3885e17aa6","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: printf %d without arg in main()","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/0bf7975dc8489f33e5f8a7331308fc3885e17aa6"},{"sha":"d26104515ccff47d3a81465b5b033fe8fe3bb548","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: warning-errors for configure","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/d26104515ccff47d3a81465b5b033fe8fe3bb548"},{"sha":"cb104588617e0ee1754e0a9f96d93cb32a537725","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: build-warnings (most 'unused')","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/cb104588617e0ee1754e0a9f96d93cb32a537725"},{"sha":"da05f7f43f784f81f0a1fae8f86561a73eb83534","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: 
const","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/da05f7f43f784f81f0a1fae8f86561a73eb83534"},{"sha":"9bab6ea187c7633769858bbb70bb156ed2fd1fa8","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix: warnings (uninitialized)","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/9bab6ea187c7633769858bbb70bb156ed2fd1fa8"},{"sha":"6db3f1d5b7860f1d3e95d12cce171d9db699e51d","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"sasl callback's typecast","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/6db3f1d5b7860f1d3e95d12cce171d9db699e51d"},{"sha":"3c4005e809a729cc9f6b63e39ee26e39b3f10fe8","author":{"email":"1f0a51c36efaa0f44e4899c26d2028681997c8ea@yuriev.ru","name":"Leo Yuriev"},"message":"fix warnings (unused, uninitialized, misc);","distinct":true,"url":"https://api.github.com/repos/leo-yuriev/openldap-lmdb-challenge/commits/3c4005e809a729cc9f6b63e39ee26e39b3f10fe8"}]},"public":true,"created_at":"2015-01-01T01:06:08Z"}
{"id":"2489398466","type":"PushEvent","actor":{"id":1579058,"login":"cessen","gravatar_id":"","url":"https://api.github.com/users/cessen","avatar_url":"https://avatars.githubusercontent.com/u/1579058?"},"repo":{"id":28025559,"name":"cessen/led","url":"https://api.github.com/repos/cessen/led"},"payload":{"push_id":536753365,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"95d6d3fd3eb8d1771e46c900cc04b1eeb6b8b3e4","before":"28a4da97a7ea7ba7c9e99c0ebc160cceb70ba495","commits":[{"sha":"95d6d3fd3eb8d1771e46c900cc04b1eeb6b8b3e4","author":{"email":"49beb02aed03d4c7798ad211ffd5f7674b731bcb@cessen.com","name":"Nathan Vegdahl"},"message":"Got remove_text() working.\n\nAt least, based on the unit tests so far.","distinct":true,"url":"https://api.github.com/repos/cessen/led/commits/95d6d3fd3eb8d1771e46c900cc04b1eeb6b8b3e4"}]},"public":true,"created_at":"2015-01-01T01:06:08Z"}
{"id":"2489398467","type":"IssueCommentEvent","actor":{"id":3103764,"login":"carymrobbins","gravatar_id":"","url":"https://api.github.com/users/carymrobbins","avatar_url":"https://avatars.githubusercontent.com/u/3103764?"},"repo":{"id":15573192,"name":"carymrobbins/intellij-haskforce","url":"https://api.github.com/repos/carymrobbins/intellij-haskforce"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/105","labels_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/105/labels{/name}","comments_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/105/comments","events_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/105/events","html_url":"https://github.com/carymrobbins/intellij-haskforce/pull/105","id":52960360,"number":105,"title":"Issue90 type information","user":{"login":"KasperJanssens","id":5415995,"avatar_url":"https://avatars.githubusercontent.com/u/5415995?v=3","gravatar_id":"","url":"https://api.github.com/users/KasperJanssens","html_url":"https://github.com/KasperJanssens","followers_url":"https://api.github.com/users/KasperJanssens/followers","following_url":"https://api.github.com/users/KasperJanssens/following{/other_user}","gists_url":"https://api.github.com/users/KasperJanssens/gists{/gist_id}","starred_url":"https://api.github.com/users/KasperJanssens/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/KasperJanssens/subscriptions","organizations_url":"https://api.github.com/users/KasperJanssens/orgs","repos_url":"https://api.github.com/users/KasperJanssens/repos","events_url":"https://api.github.com/users/KasperJanssens/events{/privacy}","received_events_url":"https://api.github.com/users/KasperJanssens/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2014-12-27T16:19:07Z","updated_at":"2015-01
-01T01:06:08Z","closed_at":null,"pull_request":{"url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/pulls/105","html_url":"https://github.com/carymrobbins/intellij-haskforce/pull/105","diff_url":"https://github.com/carymrobbins/intellij-haskforce/pull/105.diff","patch_url":"https://github.com/carymrobbins/intellij-haskforce/pull/105.patch"},"body":"Cary,\r\n\r\nFirst try of the type information. It seems quite stable, been using it for a few days (provided the configuration is correct, I suppose, didn't test what happens when ghc-modi is not correctly configured).\r\n\r\nI bound the type info call to the DocumentationProvider as well as to an action (alt - equals, like scala). I prefer the action, I think the documentation provider doesn't work so well. There are tests of the parsing of the output of ghc-modi, but not really of the documentationprovider, basically because of the abundance of static calls and the fact that I think they can only be mocked while testing, and statics can only be mocked through Powermock if I recall correctly, which would mean an extra test dependency and so on and so forth, so I left that to be your call.\r\n\r\nAlso, there is a weird behaviour that getting the editor creates a stack trace of around 5 kilometers long, something that seems like a threading issue, but the function seems to work. I don't really know why the stack trace happens, all the more because it only happens when calling the type information through the documentation provider (same code path is used when the action is called, but no stack trace). 
Maybe you know more what could go wrong, it looks like something intellij-related.\r\n\r\nSo, consider this a \"request for comment\" more than a pull request ;-)\r\n\r\nKasper"},"comment":{"url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/comments/68477354","html_url":"https://github.com/carymrobbins/intellij-haskforce/pull/105#issuecomment-68477354","issue_url":"https://api.github.com/repos/carymrobbins/intellij-haskforce/issues/105","id":68477354,"user":{"login":"carymrobbins","id":3103764,"avatar_url":"https://avatars.githubusercontent.com/u/3103764?v=3","gravatar_id":"","url":"https://api.github.com/users/carymrobbins","html_url":"https://github.com/carymrobbins","followers_url":"https://api.github.com/users/carymrobbins/followers","following_url":"https://api.github.com/users/carymrobbins/following{/other_user}","gists_url":"https://api.github.com/users/carymrobbins/gists{/gist_id}","starred_url":"https://api.github.com/users/carymrobbins/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/carymrobbins/subscriptions","organizations_url":"https://api.github.com/users/carymrobbins/orgs","repos_url":"https://api.github.com/users/carymrobbins/repos","events_url":"https://api.github.com/users/carymrobbins/events{/privacy}","received_events_url":"https://api.github.com/users/carymrobbins/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:08Z","updated_at":"2015-01-01T01:06:08Z","body":"Nice work @KasperJanssens!  Sorry, barely getting around to trying this out.\r\n\r\nI've updated the **Files Changed** tab with comments and questions.  Overall, this is really good stuff.  I'm glad that you have tests, you've refactored some crufty stuff, and tapped into popups to provide a custom UI."}},"public":true,"created_at":"2015-01-01T01:06:08Z"}
{"id":"2489398469","type":"WatchEvent","actor":{"id":1093204,"login":"mlnlover11","gravatar_id":"","url":"https://api.github.com/users/mlnlover11","avatar_url":"https://avatars.githubusercontent.com/u/1093204?"},"repo":{"id":15789289,"name":"KJCracks/Clutch","url":"https://api.github.com/repos/KJCracks/Clutch"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:06:08Z","org":{"id":2375988,"login":"KJCracks","gravatar_id":"","url":"https://api.github.com/orgs/KJCracks","avatar_url":"https://avatars.githubusercontent.com/u/2375988?"}}
{"id":"2489398473","type":"CreateEvent","actor":{"id":2829718,"login":"phister","gravatar_id":"","url":"https://api.github.com/users/phister","avatar_url":"https://avatars.githubusercontent.com/u/2829718?"},"repo":{"id":28678276,"name":"phister/CollegeFootballPlayoff","url":"https://api.github.com/repos/phister/CollegeFootballPlayoff"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":null,"pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:06:09Z"}
{"id":"2489398478","type":"PullRequestReviewCommentEvent","actor":{"id":706947,"login":"d3athrow","gravatar_id":"","url":"https://api.github.com/users/d3athrow","avatar_url":"https://avatars.githubusercontent.com/u/706947?"},"repo":{"id":10441188,"name":"d3athrow/vgstation13","url":"https://api.github.com/repos/d3athrow/vgstation13"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/comments/22397297","id":22397297,"diff_hunk":"@@ -36,6 +37,7 @@\n \t/obj/item/weapon/screwdriver, /obj/item/weapon/weldingtool, /obj/item/weapon/wirecutters, /obj/item/weapon/wrench, /obj/item/device/multitool, \\\n \t/obj/item/device/radio, /obj/item/device/analyzer, /obj/item/weapon/gun/energy/laser, /obj/item/weapon/gun/energy/pulse_rifle, \\\n \t/obj/item/weapon/gun/energy/taser, /obj/item/weapon/melee/baton, /obj/item/weapon/gun/energy/gun)\n+\tflags = PLASMAGUARD","path":"code/modules/clothing/spacesuits/ert.dm","position":12,"original_position":12,"commit_id":"b93293990c4d927f30a1f048939d427ee591e4a6","original_commit_id":"b93293990c4d927f30a1f048939d427ee591e4a6","user":{"login":"d3athrow","id":706947,"avatar_url":"https://avatars.githubusercontent.com/u/706947?v=3","gravatar_id":"","url":"https://api.github.com/users/d3athrow","html_url":"https://github.com/d3athrow","followers_url":"https://api.github.com/users/d3athrow/followers","following_url":"https://api.github.com/users/d3athrow/following{/other_user}","gists_url":"https://api.github.com/users/d3athrow/gists{/gist_id}","starred_url":"https://api.github.com/users/d3athrow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/d3athrow/subscriptions","organizations_url":"https://api.github.com/users/d3athrow/orgs","repos_url":"https://api.github.com/users/d3athrow/repos","events_url":"https://api.github.com/users/d3athrow/events{/privacy}","received_events_url":"https://api.github.com/users/d3athrow/received_events","type":"User","site_admin":false},"b
ody":"flags = FPRINT | TABLEPASS | STOPSPRESSUREDMAGE | PLASMAGUARD","created_at":"2015-01-01T01:06:11Z","updated_at":"2015-01-01T01:06:11Z","html_url":"https://github.com/d3athrow/vgstation13/pull/2405#discussion_r22397297","pull_request_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405","_links":{"self":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/comments/22397297"},"html":{"href":"https://github.com/d3athrow/vgstation13/pull/2405#discussion_r22397297"},"pull_request":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405"}}},"pull_request":{"url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405","id":26675841,"html_url":"https://github.com/d3athrow/vgstation13/pull/2405","diff_url":"https://github.com/d3athrow/vgstation13/pull/2405.diff","patch_url":"https://github.com/d3athrow/vgstation13/pull/2405.patch","issue_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/2405","number":2405,"state":"open","locked":false,"title":"Added PLASMAGUARD flag to some spacesuits","user":{"login":"Rei1226","id":4923426,"avatar_url":"https://avatars.githubusercontent.com/u/4923426?v=3","gravatar_id":"","url":"https://api.github.com/users/Rei1226","html_url":"https://github.com/Rei1226","followers_url":"https://api.github.com/users/Rei1226/followers","following_url":"https://api.github.com/users/Rei1226/following{/other_user}","gists_url":"https://api.github.com/users/Rei1226/gists{/gist_id}","starred_url":"https://api.github.com/users/Rei1226/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Rei1226/subscriptions","organizations_url":"https://api.github.com/users/Rei1226/orgs","repos_url":"https://api.github.com/users/Rei1226/repos","events_url":"https://api.github.com/users/Rei1226/events{/privacy}","received_events_url":"https://api.github.com/users/Rei1226/received_events","type":"User","site_admin":false},"body":"Added the PLASMAGUARD flag to ERT suits, deathsquad suits, and 
CE/Atmos suits as requested in \r\n\r\nhttps://github.com/d3athrow/vgstation13/issues/2369","created_at":"2014-12-30T07:18:28Z","updated_at":"2015-01-01T01:06:11Z","closed_at":null,"merged_at":null,"merge_commit_sha":"fff34ea0a38796d850e3f5aba53410e1b7bde9c8","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405/commits","review_comments_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405/comments","review_comment_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls/comments/{number}","comments_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/2405/comments","statuses_url":"https://api.github.com/repos/d3athrow/vgstation13/statuses/b93293990c4d927f30a1f048939d427ee591e4a6","head":{"label":"Rei1226:ratdicks","ref":"ratdicks","sha":"b93293990c4d927f30a1f048939d427ee591e4a6","user":{"login":"Rei1226","id":4923426,"avatar_url":"https://avatars.githubusercontent.com/u/4923426?v=3","gravatar_id":"","url":"https://api.github.com/users/Rei1226","html_url":"https://github.com/Rei1226","followers_url":"https://api.github.com/users/Rei1226/followers","following_url":"https://api.github.com/users/Rei1226/following{/other_user}","gists_url":"https://api.github.com/users/Rei1226/gists{/gist_id}","starred_url":"https://api.github.com/users/Rei1226/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Rei1226/subscriptions","organizations_url":"https://api.github.com/users/Rei1226/orgs","repos_url":"https://api.github.com/users/Rei1226/repos","events_url":"https://api.github.com/users/Rei1226/events{/privacy}","received_events_url":"https://api.github.com/users/Rei1226/received_events","type":"User","site_admin":false},"repo":{"id":19230658,"name":"vgstation13","full_name":"Rei1226/vgstation13","owner":{"login":"Rei1226","id":4923426,"avatar_url":"https://avatars.githubusercontent.com/u/4923426?v=3","gravatar_id":"","url":"https://api.github.com/users/Rei1226","html_url":
"https://github.com/Rei1226","followers_url":"https://api.github.com/users/Rei1226/followers","following_url":"https://api.github.com/users/Rei1226/following{/other_user}","gists_url":"https://api.github.com/users/Rei1226/gists{/gist_id}","starred_url":"https://api.github.com/users/Rei1226/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Rei1226/subscriptions","organizations_url":"https://api.github.com/users/Rei1226/orgs","repos_url":"https://api.github.com/users/Rei1226/repos","events_url":"https://api.github.com/users/Rei1226/events{/privacy}","received_events_url":"https://api.github.com/users/Rei1226/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/Rei1226/vgstation13","description":"This is the vgstation's fork of baystation12's code.","fork":true,"url":"https://api.github.com/repos/Rei1226/vgstation13","forks_url":"https://api.github.com/repos/Rei1226/vgstation13/forks","keys_url":"https://api.github.com/repos/Rei1226/vgstation13/keys{/key_id}","collaborators_url":"https://api.github.com/repos/Rei1226/vgstation13/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/Rei1226/vgstation13/teams","hooks_url":"https://api.github.com/repos/Rei1226/vgstation13/hooks","issue_events_url":"https://api.github.com/repos/Rei1226/vgstation13/issues/events{/number}","events_url":"https://api.github.com/repos/Rei1226/vgstation13/events","assignees_url":"https://api.github.com/repos/Rei1226/vgstation13/assignees{/user}","branches_url":"https://api.github.com/repos/Rei1226/vgstation13/branches{/branch}","tags_url":"https://api.github.com/repos/Rei1226/vgstation13/tags","blobs_url":"https://api.github.com/repos/Rei1226/vgstation13/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/Rei1226/vgstation13/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/Rei1226/vgstation13/git/refs{/sha}","trees_url":"https://api.github.com/repos/Rei1226/vgstation13/git/trees{/sha}","st
atuses_url":"https://api.github.com/repos/Rei1226/vgstation13/statuses/{sha}","languages_url":"https://api.github.com/repos/Rei1226/vgstation13/languages","stargazers_url":"https://api.github.com/repos/Rei1226/vgstation13/stargazers","contributors_url":"https://api.github.com/repos/Rei1226/vgstation13/contributors","subscribers_url":"https://api.github.com/repos/Rei1226/vgstation13/subscribers","subscription_url":"https://api.github.com/repos/Rei1226/vgstation13/subscription","commits_url":"https://api.github.com/repos/Rei1226/vgstation13/commits{/sha}","git_commits_url":"https://api.github.com/repos/Rei1226/vgstation13/git/commits{/sha}","comments_url":"https://api.github.com/repos/Rei1226/vgstation13/comments{/number}","issue_comment_url":"https://api.github.com/repos/Rei1226/vgstation13/issues/comments/{number}","contents_url":"https://api.github.com/repos/Rei1226/vgstation13/contents/{+path}","compare_url":"https://api.github.com/repos/Rei1226/vgstation13/compare/{base}...{head}","merges_url":"https://api.github.com/repos/Rei1226/vgstation13/merges","archive_url":"https://api.github.com/repos/Rei1226/vgstation13/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/Rei1226/vgstation13/downloads","issues_url":"https://api.github.com/repos/Rei1226/vgstation13/issues{/number}","pulls_url":"https://api.github.com/repos/Rei1226/vgstation13/pulls{/number}","milestones_url":"https://api.github.com/repos/Rei1226/vgstation13/milestones{/number}","notifications_url":"https://api.github.com/repos/Rei1226/vgstation13/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/Rei1226/vgstation13/labels{/name}","releases_url":"https://api.github.com/repos/Rei1226/vgstation13/releases{/id}","created_at":"2014-04-28T07:36:48Z","updated_at":"2014-12-30T08:33:17Z","pushed_at":"2014-12-30T08:33:10Z","git_url":"git://github.com/Rei1226/vgstation13.git","ssh_url":"git@github.com:Rei1226/vgstation13.git","clone_url":"https://github.com/Rei1226
/vgstation13.git","svn_url":"https://github.com/Rei1226/vgstation13","homepage":"","size":722996,"stargazers_count":0,"watchers_count":0,"language":"DM","has_issues":false,"has_downloads":true,"has_wiki":false,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"d3athrow:Bleeding-Edge","ref":"Bleeding-Edge","sha":"ea27b58dbac4fdb65119b09648f3f4f2395125de","user":{"login":"d3athrow","id":706947,"avatar_url":"https://avatars.githubusercontent.com/u/706947?v=3","gravatar_id":"","url":"https://api.github.com/users/d3athrow","html_url":"https://github.com/d3athrow","followers_url":"https://api.github.com/users/d3athrow/followers","following_url":"https://api.github.com/users/d3athrow/following{/other_user}","gists_url":"https://api.github.com/users/d3athrow/gists{/gist_id}","starred_url":"https://api.github.com/users/d3athrow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/d3athrow/subscriptions","organizations_url":"https://api.github.com/users/d3athrow/orgs","repos_url":"https://api.github.com/users/d3athrow/repos","events_url":"https://api.github.com/users/d3athrow/events{/privacy}","received_events_url":"https://api.github.com/users/d3athrow/received_events","type":"User","site_admin":false},"repo":{"id":10441188,"name":"vgstation13","full_name":"d3athrow/vgstation13","owner":{"login":"d3athrow","id":706947,"avatar_url":"https://avatars.githubusercontent.com/u/706947?v=3","gravatar_id":"","url":"https://api.github.com/users/d3athrow","html_url":"https://github.com/d3athrow","followers_url":"https://api.github.com/users/d3athrow/followers","following_url":"https://api.github.com/users/d3athrow/following{/other_user}","gists_url":"https://api.github.com/users/d3athrow/gists{/gist_id}","starred_url":"https://api.github.com/users/d3athrow/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/d3athrow/subscriptions","organi
zations_url":"https://api.github.com/users/d3athrow/orgs","repos_url":"https://api.github.com/users/d3athrow/repos","events_url":"https://api.github.com/users/d3athrow/events{/privacy}","received_events_url":"https://api.github.com/users/d3athrow/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/d3athrow/vgstation13","description":"This is the vgstation's fork of baystation12's code.","fork":true,"url":"https://api.github.com/repos/d3athrow/vgstation13","forks_url":"https://api.github.com/repos/d3athrow/vgstation13/forks","keys_url":"https://api.github.com/repos/d3athrow/vgstation13/keys{/key_id}","collaborators_url":"https://api.github.com/repos/d3athrow/vgstation13/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/d3athrow/vgstation13/teams","hooks_url":"https://api.github.com/repos/d3athrow/vgstation13/hooks","issue_events_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/events{/number}","events_url":"https://api.github.com/repos/d3athrow/vgstation13/events","assignees_url":"https://api.github.com/repos/d3athrow/vgstation13/assignees{/user}","branches_url":"https://api.github.com/repos/d3athrow/vgstation13/branches{/branch}","tags_url":"https://api.github.com/repos/d3athrow/vgstation13/tags","blobs_url":"https://api.github.com/repos/d3athrow/vgstation13/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/d3athrow/vgstation13/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/d3athrow/vgstation13/git/refs{/sha}","trees_url":"https://api.github.com/repos/d3athrow/vgstation13/git/trees{/sha}","statuses_url":"https://api.github.com/repos/d3athrow/vgstation13/statuses/{sha}","languages_url":"https://api.github.com/repos/d3athrow/vgstation13/languages","stargazers_url":"https://api.github.com/repos/d3athrow/vgstation13/stargazers","contributors_url":"https://api.github.com/repos/d3athrow/vgstation13/contributors","subscribers_url":"https://api.github.com/repos/d3athr
ow/vgstation13/subscribers","subscription_url":"https://api.github.com/repos/d3athrow/vgstation13/subscription","commits_url":"https://api.github.com/repos/d3athrow/vgstation13/commits{/sha}","git_commits_url":"https://api.github.com/repos/d3athrow/vgstation13/git/commits{/sha}","comments_url":"https://api.github.com/repos/d3athrow/vgstation13/comments{/number}","issue_comment_url":"https://api.github.com/repos/d3athrow/vgstation13/issues/comments/{number}","contents_url":"https://api.github.com/repos/d3athrow/vgstation13/contents/{+path}","compare_url":"https://api.github.com/repos/d3athrow/vgstation13/compare/{base}...{head}","merges_url":"https://api.github.com/repos/d3athrow/vgstation13/merges","archive_url":"https://api.github.com/repos/d3athrow/vgstation13/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/d3athrow/vgstation13/downloads","issues_url":"https://api.github.com/repos/d3athrow/vgstation13/issues{/number}","pulls_url":"https://api.github.com/repos/d3athrow/vgstation13/pulls{/number}","milestones_url":"https://api.github.com/repos/d3athrow/vgstation13/milestones{/number}","notifications_url":"https://api.github.com/repos/d3athrow/vgstation13/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/d3athrow/vgstation13/labels{/name}","releases_url":"https://api.github.com/repos/d3athrow/vgstation13/releases{/id}","created_at":"2013-06-02T19:39:54Z","updated_at":"2014-12-31T20:06:46Z","pushed_at":"2015-01-01T01:04:27Z","git_url":"git://github.com/d3athrow/vgstation13.git","ssh_url":"git@github.com:d3athrow/vgstation13.git","clone_url":"https://github.com/d3athrow/vgstation13.git","svn_url":"https://github.com/d3athrow/vgstation13","homepage":"","size":937605,"stargazers_count":45,"watchers_count":45,"language":"DM","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":135,"mirror_url":null,"open_issues_count":259,"forks":135,"open_issues":259,"watchers":45,"default_branch":"
master"}},"_links":{"self":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405"},"html":{"href":"https://github.com/d3athrow/vgstation13/pull/2405"},"issue":{"href":"https://api.github.com/repos/d3athrow/vgstation13/issues/2405"},"comments":{"href":"https://api.github.com/repos/d3athrow/vgstation13/issues/2405/comments"},"review_comments":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405/comments"},"review_comment":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/d3athrow/vgstation13/pulls/2405/commits"},"statuses":{"href":"https://api.github.com/repos/d3athrow/vgstation13/statuses/b93293990c4d927f30a1f048939d427ee591e4a6"}}}},"public":true,"created_at":"2015-01-01T01:06:11Z"}
{"id":"2489398480","type":"IssueCommentEvent","actor":{"id":5497952,"login":"g19-mr","gravatar_id":"","url":"https://api.github.com/users/g19-mr","avatar_url":"https://avatars.githubusercontent.com/u/5497952?"},"repo":{"id":25435487,"name":"g19-mr/azh","url":"https://api.github.com/repos/g19-mr/azh"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/g19-mr/azh/issues/83","labels_url":"https://api.github.com/repos/g19-mr/azh/issues/83/labels{/name}","comments_url":"https://api.github.com/repos/g19-mr/azh/issues/83/comments","events_url":"https://api.github.com/repos/g19-mr/azh/issues/83/events","html_url":"https://github.com/g19-mr/azh/issues/83","id":53210289,"number":83,"title":"Add icons to the left of the text on About screen buttons","user":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/g19-mr/azh/labels/improvement","name":"improvement","color":"84b6eb"}],"state":"closed","locked":false,"assignee":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_u
rl":"https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"milestone":{"url":"https://api.github.com/repos/g19-mr/azh/milestones/2","labels_url":"https://api.github.com/repos/g19-mr/azh/milestones/2/labels","id":873798,"number":2,"title":"Android 1.0.1","description":null,"creator":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"open_issues":5,"closed_issues":12,"state":"open","created_at":"2014-11-20T05:20:02Z","updated_at":"2015-01-01T01:06:12Z","due_on":null,"closed_at":null},"comments":1,"created_at":"2015-01-01T01:05:59Z","updated_at":"2015-01-01T01:06:12Z","closed_at":"2015-01-01T01:06:12Z","body":"Relat
ed icons aligned to the left on the buttons on about screen"},"comment":{"url":"https://api.github.com/repos/g19-mr/azh/issues/comments/68477355","html_url":"https://github.com/g19-mr/azh/issues/83#issuecomment-68477355","issue_url":"https://api.github.com/repos/g19-mr/azh/issues/83","id":68477355,"user":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:12Z","updated_at":"2015-01-01T01:06:12Z","body":"Added icons to about screen buttons"}},"public":true,"created_at":"2015-01-01T01:06:12Z"}
{"id":"2489398481","type":"IssuesEvent","actor":{"id":5497952,"login":"g19-mr","gravatar_id":"","url":"https://api.github.com/users/g19-mr","avatar_url":"https://avatars.githubusercontent.com/u/5497952?"},"repo":{"id":25435487,"name":"g19-mr/azh","url":"https://api.github.com/repos/g19-mr/azh"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/g19-mr/azh/issues/83","labels_url":"https://api.github.com/repos/g19-mr/azh/issues/83/labels{/name}","comments_url":"https://api.github.com/repos/g19-mr/azh/issues/83/comments","events_url":"https://api.github.com/repos/g19-mr/azh/issues/83/events","html_url":"https://github.com/g19-mr/azh/issues/83","id":53210289,"number":83,"title":"Add icons to the left of the text on About screen buttons","user":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/g19-mr/azh/labels/improvement","name":"improvement","color":"84b6eb"}],"state":"closed","locked":false,"assignee":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"ht
tps://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"milestone":{"url":"https://api.github.com/repos/g19-mr/azh/milestones/2","labels_url":"https://api.github.com/repos/g19-mr/azh/milestones/2/labels","id":873798,"number":2,"title":"Android 1.0.1","description":null,"creator":{"login":"g19-mr","id":5497952,"avatar_url":"https://avatars.githubusercontent.com/u/5497952?v=3","gravatar_id":"","url":"https://api.github.com/users/g19-mr","html_url":"https://github.com/g19-mr","followers_url":"https://api.github.com/users/g19-mr/followers","following_url":"https://api.github.com/users/g19-mr/following{/other_user}","gists_url":"https://api.github.com/users/g19-mr/gists{/gist_id}","starred_url":"https://api.github.com/users/g19-mr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/g19-mr/subscriptions","organizations_url":"https://api.github.com/users/g19-mr/orgs","repos_url":"https://api.github.com/users/g19-mr/repos","events_url":"https://api.github.com/users/g19-mr/events{/privacy}","received_events_url":"https://api.github.com/users/g19-mr/received_events","type":"User","site_admin":false},"open_issues":5,"closed_issues":12,"state":"open","created_at":"2014-11-20T05:20:02Z","updated_at":"2015-01-01T01:06:12Z","due_on":null,"closed_at":null},"comments":1,"created_at":"2015-01-01T01:05:59Z","updated_at":"2015-01-01T01:06:12Z","closed_at":"2015-01-01T01:06:12Z","body":"Related 
icons aligned to the left on the buttons on about screen"}},"public":true,"created_at":"2015-01-01T01:06:12Z"}
{"id":"2489398482","type":"PushEvent","actor":{"id":3299558,"login":"jonlai","gravatar_id":"","url":"https://api.github.com/users/jonlai","avatar_url":"https://avatars.githubusercontent.com/u/3299558?"},"repo":{"id":24589839,"name":"jonlai/personal-website","url":"https://api.github.com/repos/jonlai/personal-website"},"payload":{"push_id":536753371,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"cb8c22571f6e99bd45efa105692f9c25d9fa616e","before":"b292f784b928993eb5d993b54f9db897a1d6ae89","commits":[{"sha":"cb8c22571f6e99bd45efa105692f9c25d9fa616e","author":{"email":"3692bfa45759a67d83aedf0045f6cb635a966abf@jonlai.com","name":"jonlai"},"message":"Add mobile-menu functionality","distinct":true,"url":"https://api.github.com/repos/jonlai/personal-website/commits/cb8c22571f6e99bd45efa105692f9c25d9fa616e"}]},"public":true,"created_at":"2015-01-01T01:06:12Z"}
{"id":"2489398483","type":"IssueCommentEvent","actor":{"id":585534,"login":"gorhill","gravatar_id":"","url":"https://api.github.com/users/gorhill","avatar_url":"https://avatars.githubusercontent.com/u/585534?"},"repo":{"id":21108956,"name":"gorhill/uBlock","url":"https://api.github.com/repos/gorhill/uBlock"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/gorhill/uBlock/issues/452","labels_url":"https://api.github.com/repos/gorhill/uBlock/issues/452/labels{/name}","comments_url":"https://api.github.com/repos/gorhill/uBlock/issues/452/comments","events_url":"https://api.github.com/repos/gorhill/uBlock/issues/452/events","html_url":"https://github.com/gorhill/uBlock/issues/452","id":53199774,"number":452,"title":"Github Issue","user":{"login":"gpedro","id":2898638,"avatar_url":"https://avatars.githubusercontent.com/u/2898638?v=3","gravatar_id":"","url":"https://api.github.com/users/gpedro","html_url":"https://github.com/gpedro","followers_url":"https://api.github.com/users/gpedro/followers","following_url":"https://api.github.com/users/gpedro/following{/other_user}","gists_url":"https://api.github.com/users/gpedro/gists{/gist_id}","starred_url":"https://api.github.com/users/gpedro/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/gpedro/subscriptions","organizations_url":"https://api.github.com/users/gpedro/orgs","repos_url":"https://api.github.com/users/gpedro/repos","events_url":"https://api.github.com/users/gpedro/events{/privacy}","received_events_url":"https://api.github.com/users/gpedro/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":7,"created_at":"2014-12-31T19:34:09Z","updated_at":"2015-01-01T01:06:12Z","closed_at":null,"body":"![gh problems](http://i.imgur.com/DjNwMiq.png)\r\n\r\nI've tested and is caused by uBlock \r\n\r\nI'm using Chrome 39.0.2171.95 (64-bit), OSX 
10.9.5"},"comment":{"url":"https://api.github.com/repos/gorhill/uBlock/issues/comments/68477356","html_url":"https://github.com/gorhill/uBlock/issues/452#issuecomment-68477356","issue_url":"https://api.github.com/repos/gorhill/uBlock/issues/452","id":68477356,"user":{"login":"gorhill","id":585534,"avatar_url":"https://avatars.githubusercontent.com/u/585534?v=3","gravatar_id":"","url":"https://api.github.com/users/gorhill","html_url":"https://github.com/gorhill","followers_url":"https://api.github.com/users/gorhill/followers","following_url":"https://api.github.com/users/gorhill/following{/other_user}","gists_url":"https://api.github.com/users/gorhill/gists{/gist_id}","starred_url":"https://api.github.com/users/gorhill/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/gorhill/subscriptions","organizations_url":"https://api.github.com/users/gorhill/orgs","repos_url":"https://api.github.com/users/gorhill/repos","events_url":"https://api.github.com/users/gorhill/events{/privacy}","received_events_url":"https://api.github.com/users/gorhill/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:12Z","updated_at":"2015-01-01T01:06:12Z","body":"Ok I can reproduce on my very old laptop, I can investigate now."}},"public":true,"created_at":"2015-01-01T01:06:12Z"}
{"id":"2489398486","type":"PushEvent","actor":{"id":6693944,"login":"Eternaldoom","gravatar_id":"","url":"https://api.github.com/users/Eternaldoom","avatar_url":"https://avatars.githubusercontent.com/u/6693944?"},"repo":{"id":28652181,"name":"BossLetsPlays/WaffleMod","url":"https://api.github.com/repos/BossLetsPlays/WaffleMod"},"payload":{"push_id":536753374,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"19f0e5ca1ba35f901a5934705fddaecad5f7a49d","before":"7fd8147512d920a40a0e36752cff63ce832fd57d","commits":[{"sha":"19f0e5ca1ba35f901a5934705fddaecad5f7a49d","author":{"email":"ec291313f6147c66cfacc4177a9e43f07db94e06@icloud.com","name":"Eternaldoom"},"message":"waffle texture","distinct":true,"url":"https://api.github.com/repos/BossLetsPlays/WaffleMod/commits/19f0e5ca1ba35f901a5934705fddaecad5f7a49d"}]},"public":true,"created_at":"2015-01-01T01:06:12Z"}
{"id":"2489398495","type":"PushEvent","actor":{"id":9539839,"login":"nathanpanchal","gravatar_id":"","url":"https://api.github.com/users/nathanpanchal","avatar_url":"https://avatars.githubusercontent.com/u/9539839?"},"repo":{"id":28327047,"name":"nathanpanchal/rep","url":"https://api.github.com/repos/nathanpanchal/rep"},"payload":{"push_id":536753378,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"4cc6c3bf7c84c0e045b0c28d17fbb185ba167a7f","before":"48660b086b03fd3fa0932a7028e59c60c195c183","commits":[{"sha":"7a6f155b740a17645f8a7c3c0753e7babd61a18b","author":{"email":"ea7a0c1525d0377387a689662b80f80209af162b@gmail.com","name":"Nathan Panchal"},"message":"np - updated solutions and spelling","distinct":true,"url":"https://api.github.com/repos/nathanpanchal/rep/commits/7a6f155b740a17645f8a7c3c0753e7babd61a18b"},{"sha":"4cc6c3bf7c84c0e045b0c28d17fbb185ba167a7f","author":{"email":"ea7a0c1525d0377387a689662b80f80209af162b@gmail.com","name":"Nathan Panchal"},"message":"np - initial upload","distinct":true,"url":"https://api.github.com/repos/nathanpanchal/rep/commits/4cc6c3bf7c84c0e045b0c28d17fbb185ba167a7f"}]},"public":true,"created_at":"2015-01-01T01:06:14Z"}
{"id":"2489398497","type":"PushEvent","actor":{"id":2012806,"login":"aconley","gravatar_id":"","url":"https://api.github.com/users/aconley","avatar_url":"https://avatars.githubusercontent.com/u/2012806?"},"repo":{"id":18895528,"name":"aconley/MachineLearning","url":"https://api.github.com/repos/aconley/MachineLearning"},"payload":{"push_id":536753379,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"4847438e4f4f82c3f466820f18ef92480b220ff7","before":"ea0c13da5d0cfea3c77fa92d3489580516353378","commits":[{"sha":"4847438e4f4f82c3f466820f18ef92480b220ff7","author":{"email":"da6b13ae5bc1edd63fbaa421fd5ef5233ae76713@colorado.edu","name":"Alexander Conley"},"message":"First 2 problems in BDA chap 2, added header sizes to all notes.","distinct":true,"url":"https://api.github.com/repos/aconley/MachineLearning/commits/4847438e4f4f82c3f466820f18ef92480b220ff7"}]},"public":true,"created_at":"2015-01-01T01:06:14Z"}
{"id":"2489398498","type":"PushEvent","actor":{"id":826422,"login":"devhd","gravatar_id":"","url":"https://api.github.com/users/devhd","avatar_url":"https://avatars.githubusercontent.com/u/826422?"},"repo":{"id":28672269,"name":"devhd/rulus","url":"https://api.github.com/repos/devhd/rulus"},"payload":{"push_id":536753370,"size":1000,"distinct_size":4394,"ref":"refs/heads/corporate-commit","head":"e4f8c39db38c3dc14d9f069b61226a731a173287","before":"24a33a4632530cbe66971c91a3f73fed71285b45","commits":[{"sha":"811baf9c467324f1a1f05ce6af51caeb4b7dd414","author":{"email":"01142e84179254d983577d421939de6325fe05f7@users.noreply.github.com","name":"devhd"},"message":"commit from Rulus company with internal id 793e827461e3","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/811baf9c467324f1a1f05ce6af51caeb4b7dd414"},{"sha":"c7f3b24506c5cf593063910449656fa9d6fc1ca5","author":{"email":"01142e84179254d983577d421939de6325fe05f7@users.noreply.github.com","name":"devhd"},"message":"commit from Rulus company with internal id eacaf6e3b4e1","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/c7f3b24506c5cf593063910449656fa9d6fc1ca5"},{"sha":"eaf754ef5e7290a91fb7954fcc0330c59b6bab0e","author":{"email":"01142e84179254d983577d421939de6325fe05f7@users.noreply.github.com","name":"devhd"},"message":"commit from Rulus company with internal id b3b085e89e1e","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/eaf754ef5e7290a91fb7954fcc0330c59b6bab0e"},{"sha":"052de2fa7f8150056a3c39d1d05737573f54d18c","author":{"email":"99c668761d020b9679555123ba53755f7c2ea5a5@rulus.com","name":"rulus-employee-57e138dc"},"message":"commit from Rulus company with internal id 
57e138dcfafe","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/052de2fa7f8150056a3c39d1d05737573f54d18c"},{"sha":"ceb4f1d74e9cbf34e6f99127e9effa4976a5b4c1","author":{"email":"24e8d9567bae12b60ea2fef0579698e2123b7bd1@rulus.com","name":"rulus-employee-b06e52c4"},"message":"commit from Rulus company with internal id b06e52c4824d","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/ceb4f1d74e9cbf34e6f99127e9effa4976a5b4c1"},{"sha":"568d72b46c7f649f4fe8d1811e6c86ba9d0fc480","author":{"email":"77d6b0ff6d4b9c1d3ecd8ab24e4f8a9753205217@rulus.com","name":"rulus-employee-9df85673"},"message":"commit from Rulus company with internal id 9df856735928","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/568d72b46c7f649f4fe8d1811e6c86ba9d0fc480"},{"sha":"4f755c68cc64918713db129373ad9f65bb2c53ae","author":{"email":"46a809052e8a001d8aaafdfd30a3674055ad8b31@rulus.com","name":"rulus-employee-2631fc20"},"message":"commit from Rulus company with internal id 2631fc203a38","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/4f755c68cc64918713db129373ad9f65bb2c53ae"},{"sha":"e6621ee719c52fecafa1b238908bde9ecc8db8c7","author":{"email":"f3967c3031d56cde0eb96f865167fad108cab328@users.noreply.github.com","name":"andrejev"},"message":"commit from Rulus company with internal id 1ed5468637be","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/e6621ee719c52fecafa1b238908bde9ecc8db8c7"},{"sha":"4a2fcd7a274a99dbc8437c717556d3cf71042028","author":{"email":"f3967c3031d56cde0eb96f865167fad108cab328@users.noreply.github.com","name":"andrejev"},"message":"commit from Rulus company with internal id a08651cf2f5e","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/4a2fcd7a274a99dbc8437c717556d3cf71042028"},{"sha":"b28669116dc6f7e84824d2fb0f6133f15e2fdc2a","author":{"email":"f3967c3031d56cde0eb96f865167fad108cab328@users.noreply.github.com","name":"andrejev"},"message":"commit from 
Rulus company with internal id b0b95077dbb4","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/b28669116dc6f7e84824d2fb0f6133f15e2fdc2a"},{"sha":"b2a01f646ae7c0a50d6fa259d33c63a547600b42","author":{"email":"f3967c3031d56cde0eb96f865167fad108cab328@users.noreply.github.com","name":"andrejev"},"message":"commit from Rulus company with internal id 62719714ae42","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/b2a01f646ae7c0a50d6fa259d33c63a547600b42"},{"sha":"ab19a3f469c89e4736784a0c38f5cd0697864a47","author":{"email":"573d675efc8ed21e4a661e8897d95a5b47d57ea6@rulus.com","name":"rulus-employee-65181a44"},"message":"commit from Rulus company with internal id 65181a441879","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/ab19a3f469c89e4736784a0c38f5cd0697864a47"},{"sha":"a3cb09199efb10ae4ed77dc1c7e80a1031cb7de1","author":{"email":"aad584ac7ca8bed03f673f16c0cb6a2c032ed207@rulus.com","name":"rulus-employee-05bfe041"},"message":"commit from Rulus company with internal id 05bfe0411e85","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/a3cb09199efb10ae4ed77dc1c7e80a1031cb7de1"},{"sha":"0b8277cd37d19e227542237aa4f776f6ca29efce","author":{"email":"f3967c3031d56cde0eb96f865167fad108cab328@users.noreply.github.com","name":"andrejev"},"message":"commit from Rulus company with internal id 92d839c3e65c","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/0b8277cd37d19e227542237aa4f776f6ca29efce"},{"sha":"d509539f990f0ec2a2792e5d39ef66cef0180f6d","author":{"email":"fe6f8e15c3e6fbb8a40a2ce6e98848853603f68a@users.noreply.github.com","name":"ntklim"},"message":"commit from Rulus company with internal id 
f01b994a77bb","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/d509539f990f0ec2a2792e5d39ef66cef0180f6d"},{"sha":"46ca565baaf416978396bdfd68d22afb40c5ac93","author":{"email":"fe6f8e15c3e6fbb8a40a2ce6e98848853603f68a@users.noreply.github.com","name":"ntklim"},"message":"commit from Rulus company with internal id e6d067cb8ba9","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/46ca565baaf416978396bdfd68d22afb40c5ac93"},{"sha":"eecdefff74d967f8715d7933e8766c8338ab7992","author":{"email":"8f3457924a1eb5af6fd611493be2bd7ad154a1fb@rulus.com","name":"rulus-employee-d955c736"},"message":"commit from Rulus company with internal id d955c736e585","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/eecdefff74d967f8715d7933e8766c8338ab7992"},{"sha":"72c4c5f9d3477157fead5059599b6b3cf96a4b03","author":{"email":"8ccf6737f7ac752e448572e9e5a7850e406ff3a9@rulus.com","name":"rulus-employee-124d5850"},"message":"commit from Rulus company with internal id 124d58504f69","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/72c4c5f9d3477157fead5059599b6b3cf96a4b03"},{"sha":"fa78e9ad82b8af64f51df9c7350aac3b17d84c58","author":{"email":"a25961e887882f8dec7b0ecf28bf20814085f77f@rulus.com","name":"rulus-employee-f0be14e7"},"message":"commit from Rulus company with internal id f0be14e7607c","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/fa78e9ad82b8af64f51df9c7350aac3b17d84c58"},{"sha":"c7c085cab4770b7ef6ac34da7537527558f86cf0","author":{"email":"78dccec6bff894326f4b4d70c6de378e286bb775@rulus.com","name":"rulus-employee-8e066744"},"message":"commit from Rulus company with internal id 8e0667447802","distinct":true,"url":"https://api.github.com/repos/devhd/rulus/commits/c7c085cab4770b7ef6ac34da7537527558f86cf0"}]},"public":true,"created_at":"2015-01-01T01:06:15Z"}
{"id":"2489398506","type":"WatchEvent","actor":{"id":9970148,"login":"bchoomnuan","gravatar_id":"","url":"https://api.github.com/users/bchoomnuan","avatar_url":"https://avatars.githubusercontent.com/u/9970148?"},"repo":{"id":24993905,"name":"socketplane/socketplane","url":"https://api.github.com/repos/socketplane/socketplane"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:06:15Z","org":{"id":9063170,"login":"socketplane","gravatar_id":"","url":"https://api.github.com/orgs/socketplane","avatar_url":"https://avatars.githubusercontent.com/u/9063170?"}}
{"id":"2489398510","type":"PushEvent","actor":{"id":1687477,"login":"kllmctrl","gravatar_id":"","url":"https://api.github.com/users/kllmctrl","avatar_url":"https://avatars.githubusercontent.com/u/1687477?"},"repo":{"id":22713199,"name":"kllmctrl/blog","url":"https://api.github.com/repos/kllmctrl/blog"},"payload":{"push_id":536753382,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"542fa01a5cb21e143fb434dbbe4962b0dad7f075","before":"e530ef5a1f5d42a38cef0c14bbd2692a16ebdfd0","commits":[{"sha":"542fa01a5cb21e143fb434dbbe4962b0dad7f075","author":{"email":"f80e4117476d2980d2730856b4e57c1491ba28a9@gmail.com","name":"KC"},"message":"Update 2014-12-31-me-summary2014.md","distinct":true,"url":"https://api.github.com/repos/kllmctrl/blog/commits/542fa01a5cb21e143fb434dbbe4962b0dad7f075"}]},"public":true,"created_at":"2015-01-01T01:06:16Z"}
{"id":"2489398519","type":"WatchEvent","actor":{"id":117788,"login":"nyarla","gravatar_id":"","url":"https://api.github.com/users/nyarla","avatar_url":"https://avatars.githubusercontent.com/u/117788?"},"repo":{"id":9267658,"name":"kisielk/vigo","url":"https://api.github.com/repos/kisielk/vigo"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:06:17Z"}
{"id":"2489398527","type":"PushEvent","actor":{"id":1308363,"login":"paymonp","gravatar_id":"","url":"https://api.github.com/users/paymonp","avatar_url":"https://avatars.githubusercontent.com/u/1308363?"},"repo":{"id":28678242,"name":"paymonp/forecast_wrapper","url":"https://api.github.com/repos/paymonp/forecast_wrapper"},"payload":{"push_id":536753388,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"9b9757b748dd98f06c2517a9af376e7515716a6a","before":"a6f19abd10df22698f53704cd60bb245961a6365","commits":[{"sha":"9b9757b748dd98f06c2517a9af376e7515716a6a","author":{"email":"fc8885f78a23392efbab2637290a95a3fe38d9fa@team.curious.com","name":"Paymon"},"message":"Create README.md","distinct":true,"url":"https://api.github.com/repos/paymonp/forecast_wrapper/commits/9b9757b748dd98f06c2517a9af376e7515716a6a"}]},"public":true,"created_at":"2015-01-01T01:06:18Z"}
{"id":"2489398531","type":"PushEvent","actor":{"id":9201970,"login":"qdm","gravatar_id":"","url":"https://api.github.com/users/qdm","avatar_url":"https://avatars.githubusercontent.com/u/9201970?"},"repo":{"id":25173910,"name":"qdm/qdm.github.io","url":"https://api.github.com/repos/qdm/qdm.github.io"},"payload":{"push_id":536753389,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d4b8f56130659dbd132ba75208e1812a0233dadb","before":"dbcd229108e512d575dcd1e4595183ce055f8e2f","commits":[{"sha":"d4b8f56130659dbd132ba75208e1812a0233dadb","author":{"email":"de163e90d3aeef9f404d1de71c48e234a211e3c3@gmail.com","name":"KT"},"message":"Update","distinct":true,"url":"https://api.github.com/repos/qdm/qdm.github.io/commits/d4b8f56130659dbd132ba75208e1812a0233dadb"}]},"public":true,"created_at":"2015-01-01T01:06:18Z"}
{"id":"2489398534","type":"PushEvent","actor":{"id":5378975,"login":"shk33","gravatar_id":"","url":"https://api.github.com/users/shk33","avatar_url":"https://avatars.githubusercontent.com/u/5378975?"},"repo":{"id":27845488,"name":"shk33/RailsTuto","url":"https://api.github.com/repos/shk33/RailsTuto"},"payload":{"push_id":536753393,"size":1,"distinct_size":1,"ref":"refs/heads/posts","head":"bae94f8a9a33209c890f220f30632b4f5a6bf192","before":"8741a4f19d72e935c30ecdd60fe4408d71b2bb27","commits":[{"sha":"bae94f8a9a33209c890f220f30632b4f5a6bf192","author":{"email":"5c080636567f0cafe2deca0ef026947600762c71@gmail.com","name":"shk33"},"message":"Add image resize","distinct":true,"url":"https://api.github.com/repos/shk33/RailsTuto/commits/bae94f8a9a33209c890f220f30632b4f5a6bf192"}]},"public":true,"created_at":"2015-01-01T01:06:18Z"}
{"id":"2489398535","type":"PushEvent","actor":{"id":4153853,"login":"jlumijarvi","gravatar_id":"","url":"https://api.github.com/users/jlumijarvi","avatar_url":"https://avatars.githubusercontent.com/u/4153853?"},"repo":{"id":28678176,"name":"jlumijarvi/csv2xml","url":"https://api.github.com/repos/jlumijarvi/csv2xml"},"payload":{"push_id":536753392,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"191be1eb12b72eac931815f4d9dc022ec9d4ef22","before":"44f7054077780dd70b8ad070b9b04640a65282ec","commits":[{"sha":"191be1eb12b72eac931815f4d9dc022ec9d4ef22","author":{"email":"40e6fc59d2535c98bfd5d19357e20df6e95cef64@gmail.com","name":"jlumijarvi"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/jlumijarvi/csv2xml/commits/191be1eb12b72eac931815f4d9dc022ec9d4ef22"}]},"public":true,"created_at":"2015-01-01T01:06:18Z"}
{"id":"2489398537","type":"DeleteEvent","actor":{"id":2812278,"login":"beret595","gravatar_id":"","url":"https://api.github.com/users/beret595","avatar_url":"https://avatars.githubusercontent.com/u/2812278?"},"repo":{"id":28470088,"name":"beret595/Ucar_Operation_Crm_Finance","url":"https://api.github.com/repos/beret595/Ucar_Operation_Crm_Finance"},"payload":{"ref":"Ocean","ref_type":"branch","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:06:18Z"}
{"id":"2489398541","type":"PushEvent","actor":{"id":7336721,"login":"aow1980","gravatar_id":"","url":"https://api.github.com/users/aow1980","avatar_url":"https://avatars.githubusercontent.com/u/7336721?"},"repo":{"id":27033479,"name":"aow1980/android_system_core","url":"https://api.github.com/repos/aow1980/android_system_core"},"payload":{"push_id":536753397,"size":12,"distinct_size":12,"ref":"refs/heads/lp5.0","head":"e32edbcdc6851baf2e9fdb9586b19c9503436db2","before":"ce1744ba2e2bb8731621c1cdc4aa0663a83eb972","commits":[{"sha":"4b2626f0f43973b445a167370caf9fe9df834e7d","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"healthd: Reinitialize mChargerNames for every battery update\n\nBooting up the device without the usb sets the usb power supply\ntype as UNKNOWN. Due to this mChargerNames gets incorrectly\ninitialized at bootup. The value of usb power supply type changes\nat run-time. So it makes sense to update mChargerNames everytime\nwe have a battery related update.\n\nChange-Id: I2ec9f9a420ca61814d43c316b418ce94de3691bc","distinct":true,"url":"https://api.github.com/repos/aow1980/android_system_core/commits/4b2626f0f43973b445a167370caf9fe9df834e7d"},{"sha":"78215b970e26959e1ad7f4129f84d8879e43ad35","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"audio: Add 24-bit offload format to audio_bytes_per_sample\n\nChange-Id: I238f302beadf8ba7705ffcb70639fb32be4ff2c4","distinct":true,"url":"https://api.github.com/repos/aow1980/android_system_core/commits/78215b970e26959e1ad7f4129f84d8879e43ad35"},{"sha":"0f6f929147dad895bf830989d491beab7513e93a","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"Healthd: charger: allow override of LED/BACKLIGHT paths\n\nChange-Id: 
Ib7372e441d554e16ffc20ce43993ee78cdc5b187","distinct":true,"url":"https://api.github.com/repos/aow1980/android_system_core/commits/0f6f929147dad895bf830989d491beab7513e93a"},{"sha":"b0e263832d9eb57b2705f36200c170c9b7274e8d","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"healthd: Detect power supply type for all charger devices\n\nPower supply type is not determined via the device name,\nhence iterate over all available devices in the subsystem\nnode and read the type from device file.\n\n  shell@hammerhead:/ $ ls /sys/class/power_supply\n  ac\n  batt_therm\n  battery\n  touch\n  usb\n  wireless\n\n<4>[ 3184.867782] healthd: touch: Unknown power supply type\n<4>[ 3184.868039] healthd: batt_therm: Unknown power supply type\n<6>[ 3184.880506] healthd: battery l=89 v=4181 t=25.5 h=2 st=2 c=-288 chg=u\n<4>[ 3184.890362] healthd: touch: Unknown power supply type\n<4>[ 3184.890549] healthd: batt_therm: Unknown power supply type\n<6>[ 3184.899419] healthd: battery l=89 v=4181 t=25.5 h=2 st=2 c=-59 chg=u\n<4>[ 3184.908756] healthd: touch: Unknown power supply type\n<4>[ 3184.908984] healthd: batt_therm: Unknown power supply type\n<6>[ 3184.919672] healthd: battery l=89 v=4181 t=25.6 h=2 st=2 c=-25 chg=u\n\nChange-Id: I863bfab95193899460237b51997e0418eeb4ee2c","distinct":true,"url":"https://api.github.com/repos/aow1980/android_system_core/commits/b0e263832d9eb57b2705f36200c170c9b7274e8d"},{"sha":"e95c00ae6b23f31a356549e69cbc271db674ec29","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"adb: host: Provide better sideload status\n\n * Show data transfer in MB and in multiple of the file size.\n\n * Show a spinner to indicate liveness, which is updated at least once\n   per second regardless of data transfer.\n\n * Do not allow sideload of zero sized files.\n\nChange-Id: 
I1bd0df6a8183fad5a502fc26a7e789c27d24f71a","distinct":true,"url":"https://api.github.com/repos/aow1980/android_system_core/commits/e95c00ae6b23f31a356549e69cbc271db674ec29"},{"sha":"322799474a0e0492dbdfcbb029dc724b99d972f3","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"adb: Fix host build\n\nChange-Id: I173e920aa836bb0327bfae235022de011f3e2b99","distinct":true,"url":"https://api.github.com/repos/aow1980/android_system_core/commits/322799474a0e0492dbdfcbb029dc724b99d972f3"},{"sha":"16057b3eb88144955a86e9591c5517af7447da53","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"set /system/etc/init.d/* permissions\n\nported from CM7\n\nChange-Id: I3422c392248673fd7a8c8b45f34678097e553b5b","distinct":true,"url":"https://api.github.com/repos/aow1980/android_system_core/commits/16057b3eb88144955a86e9591c5517af7447da53"},{"sha":"fe4cc92ac754b3a3787f56563c1123a1086931c9","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"init: create symlinks to mtd block device nodes\n\nGiven a device in the form of \"/devices/virtual/mtd/mtd0/mtdblock0\":\n* Creates symlinks for mtd block devices in\n  /dev/block/mtd/mtd<partition number>\n* Creates symlinks based on partition name in\n  /dev/block/mtd/by-name/<partition name>\n\nChange-Id: Id8d61be88935a0ef83297d1d5e453d8ba0d586de","distinct":true,"url":"https://api.github.com/repos/aow1980/android_system_core/commits/fe4cc92ac754b3a3787f56563c1123a1086931c9"},{"sha":"9f694a70b15ad0dfb84b176e542c95ce811af8c0","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"fastboot: Add missing fastboot USB IDs\n\nChange-Id: 
I1616e9e6a57652aa919f979833c0e19479343966","distinct":true,"url":"https://api.github.com/repos/aow1980/android_system_core/commits/9f694a70b15ad0dfb84b176e542c95ce811af8c0"},{"sha":"3d9f73c94d78cc3a445d9040bf8b948ca5636f78","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"libcutils: Do not use the kernel headers\n\nNo idea why this is here, but it breaks arm64 builds. bionic's signal.h\nmust be used on those\n\nChange-Id: Id4f07a9b13a32c563fda6e96e4a87b8b97d125fd","distinct":true,"url":"https://api.github.com/repos/aow1980/android_system_core/commits/3d9f73c94d78cc3a445d9040bf8b948ca5636f78"},{"sha":"2269774631b7e39c832c79406b1aa587954ff294","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"libsysutils: Do not use the kernel headers\n\nNo idea why this is here, but it breaks arm64 builds. bionic's signal.h\nmust be used on those\n\nChange-Id: I64f71565b179af38345fcf1496274ee5858abb05","distinct":true,"url":"https://api.github.com/repos/aow1980/android_system_core/commits/2269774631b7e39c832c79406b1aa587954ff294"},{"sha":"e32edbcdc6851baf2e9fdb9586b19c9503436db2","author":{"email":"457cfb837588e6491cbd81701614a2c9f7081d84@gmail.com","name":"aow1980"},"message":"Forward-port mkbootimg / unpackbootimg support\n\n * Mostly from Koush and Seth Shelnutt\n\nunpackbootimg (squashed)\n\nunpackbootimg ported forward from eclair\n\nChange-Id: I74d2df0b47d40e7105cc58c2b05f8f383dc7f8a0\n\nport forward pagesize arg from eclair\n\nChange-Id: Ia789a4f392a3890aa0efa7efb42032482b48beb0\n\nunpackbootimg should output BOARD_PAGE_SIZE\n\nChange-Id: Ieb5cda01943a33da97eee4d025f56c2c6e7560e8\n\noutput page size in mkbootimg\n\nadd an option to override the pagesize for boot images created by nubs. ie, acer liquid mkliquidbootimg.\n\nChange-Id: Ie0c7e67edf5ae59019517e72b9be8c0b81388e41\n\nUpdate unpackbootimg to verify the Android boot image magic value. 
It will also search the first 512 bytes for padding.\n\nChange-Id: I490cba05f2bb616a3f64e3271ecaa61eb9e64be8\n\nunpackbootimg: Fix up the padding search in case the magic does not fall on a 8 byte boundary.\n\nChange-Id: I57471f9c2117cd7965b6958ea0aa88e356436da6\n\nunpackbootimg: Fix magic search.\n\nChange-Id: I68470b637556a08e48ff72b7ef8811cba13b04ad\n\nunpackbootimg: apparently mkbootimg no longer accepts hex values\n\nChange-Id: I95a33f7b40470e4500d418d863a65a75e7aa8499\n\nunpackbootimg: Need to also update the written file.\n\nChange-Id: I45faddbae85273c79b2837f97933634b6e70546f\n\nramdiskaddr is now ramdisk_offset\n\nChange-Id: I3bf83af5f7001f581506dc7fd9b1eb653334ad35\n\nunpackbootimg: remove host LOCAL_MODULE_TAG\n\nChange-Id: I199d680dc5ab8bf50f5be65c29095bf3adade695\n\nunpackbootimg: Add support for device trees\n\nChange-Id: I340eed99d2274a2f4cbaf5a9f27726ff3a9302e5\n\nunpackbootimg: Add support for detecting lz4 compressed ramdisks\n\nThis will check for lz4 magic, and if found change the extension of the\nfile. Else it'll fall back to the default behavior of assuming gzip. This has\nbeen tested with stock LS980 boot images and LS970 boot images for lz4\nand gzip respectively.\n\nChange-Id: If2139ff172397b6db079ffb7ab9cb61897c38fb3\n\nunpackbootimg: Add support for dumping ramdisk offset\n\nChange-Id: Ic62b9fe61db4435ecbc52b66db5ffc9b9d79cbb4\n\nunpackbootimg: Add support for second, second_offset and tags_offset.\n\nChange-Id: Ia7ef7f00191dbf2c44736c4e4d980f72afa8c253","distinct":true,"url":"https://api.github.com/repos/aow1980/android_system_core/commits/e32edbcdc6851baf2e9fdb9586b19c9503436db2"}]},"public":true,"created_at":"2015-01-01T01:06:18Z"}
{"id":"2489398543","type":"PushEvent","actor":{"id":10263666,"login":"katiekroik","gravatar_id":"","url":"https://api.github.com/users/katiekroik","avatar_url":"https://avatars.githubusercontent.com/u/10263666?"},"repo":{"id":28677679,"name":"jl4282/swirlwebsite","url":"https://api.github.com/repos/jl4282/swirlwebsite"},"payload":{"push_id":536753398,"size":1,"distinct_size":1,"ref":"refs/heads/develop","head":"53bc894d93b396c5cc3c224311421a017ceac40e","before":"bd278f438aba4582c30eb8d42e7b52740b739e5b","commits":[{"sha":"53bc894d93b396c5cc3c224311421a017ceac40e","author":{"email":"fdb375617daf85f650fdf56bce778da925caee49@nyu.edu","name":"katiekroik"},"message":"Updated README","distinct":true,"url":"https://api.github.com/repos/jl4282/swirlwebsite/commits/53bc894d93b396c5cc3c224311421a017ceac40e"}]},"public":true,"created_at":"2015-01-01T01:06:18Z"}
{"id":"2489398544","type":"GollumEvent","actor":{"id":4620127,"login":"husathap","gravatar_id":"","url":"https://api.github.com/users/husathap","avatar_url":"https://avatars.githubusercontent.com/u/4620127?"},"repo":{"id":28579680,"name":"husathap/Inuvik","url":"https://api.github.com/repos/husathap/Inuvik"},"payload":{"pages":[{"page_name":"Tutorial-#1:-Creating-a-New-Room","title":"Tutorial #1: Creating a New Room","summary":null,"action":"edited","sha":"dc5f3f3a5cd37352810747bce11e48dc9c0541ee","html_url":"https://github.com/husathap/Inuvik/wiki/Tutorial-%231%3A-Creating-a-New-Room"}]},"public":true,"created_at":"2015-01-01T01:06:18Z"}
{"id":"2489398545","type":"PushEvent","actor":{"id":1745861,"login":"topaztee","gravatar_id":"","url":"https://api.github.com/users/topaztee","avatar_url":"https://avatars.githubusercontent.com/u/1745861?"},"repo":{"id":28677407,"name":"topaztee/topaztee.github.io","url":"https://api.github.com/repos/topaztee/topaztee.github.io"},"payload":{"push_id":536753399,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"3f5e524f47baf10eafc7deecb718ff84dab8d25a","before":"70a7d7ee278b87fbcbe0c785d3ec3c1dcb12a8d4","commits":[{"sha":"3f5e524f47baf10eafc7deecb718ff84dab8d25a","author":{"email":"f74c82d708bb42a372674042ebc8a1411fbc9344@192-168-1-2.tpgi.com.au","name":"topaztur@gmail.com"},"message":"Blog update at 2015-01-01 01:06:09","distinct":true,"url":"https://api.github.com/repos/topaztee/topaztee.github.io/commits/3f5e524f47baf10eafc7deecb718ff84dab8d25a"}]},"public":true,"created_at":"2015-01-01T01:06:18Z"}
{"id":"2489398553","type":"WatchEvent","actor":{"id":1391558,"login":"UndefinedOffset","gravatar_id":"","url":"https://api.github.com/users/UndefinedOffset","avatar_url":"https://avatars.githubusercontent.com/u/1391558?"},"repo":{"id":1030566,"name":"furf/jquery-ui-touch-punch","url":"https://api.github.com/repos/furf/jquery-ui-touch-punch"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:06:22Z"}
{"id":"2489398558","type":"WatchEvent","actor":{"id":117788,"login":"nyarla","gravatar_id":"","url":"https://api.github.com/users/nyarla","avatar_url":"https://avatars.githubusercontent.com/u/117788?"},"repo":{"id":28428729,"name":"wasabeef/awesome-android-ui","url":"https://api.github.com/repos/wasabeef/awesome-android-ui"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:06:23Z"}
{"id":"2489398559","type":"PushEvent","actor":{"id":9038488,"login":"martindevnow","gravatar_id":"","url":"https://api.github.com/users/martindevnow","avatar_url":"https://avatars.githubusercontent.com/u/9038488?"},"repo":{"id":28460218,"name":"martindevnow/larabook","url":"https://api.github.com/repos/martindevnow/larabook"},"payload":{"push_id":536753400,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"247a3c2ba8b1d067c146dfa23587614f564b2c2f","before":"b4d8b51987660e73ac233d8d34fa8c25001af5a5","commits":[{"sha":"247a3c2ba8b1d067c146dfa23587614f564b2c2f","author":{"email":"e4fb5da29019c84509153dcdcc3d610b56ae63a4@gmail.com","name":"Ben Martin (Cooler-PC)"},"message":"Products","distinct":true,"url":"https://api.github.com/repos/martindevnow/larabook/commits/247a3c2ba8b1d067c146dfa23587614f564b2c2f"}]},"public":true,"created_at":"2015-01-01T01:06:23Z"}
{"id":"2489398561","type":"PushEvent","actor":{"id":433707,"login":"ile","gravatar_id":"","url":"https://api.github.com/users/ile","avatar_url":"https://avatars.githubusercontent.com/u/433707?"},"repo":{"id":26847132,"name":"kantele/k-templates","url":"https://api.github.com/repos/kantele/k-templates"},"payload":{"push_id":536753401,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"274cca1b2adc063b47d558ac9bafa0dce7a05abb","before":"6630db87e4ed496f67a88bf24f22332c67e9792d","commits":[{"sha":"274cca1b2adc063b47d558ac9bafa0dce7a05abb","author":{"email":"4f3407de78bccc8cc160ee4d278d5efe7162e6b5@nateps.com","name":"Nate Smith"},"message":"null check expression.meta","distinct":true,"url":"https://api.github.com/repos/kantele/k-templates/commits/274cca1b2adc063b47d558ac9bafa0dce7a05abb"}]},"public":true,"created_at":"2015-01-01T01:06:23Z","org":{"id":5687585,"login":"kantele","gravatar_id":"","url":"https://api.github.com/orgs/kantele","avatar_url":"https://avatars.githubusercontent.com/u/5687585?"}}
{"id":"2489398566","type":"PushEvent","actor":{"id":5606771,"login":"rchoetzlein","gravatar_id":"","url":"https://api.github.com/users/rchoetzlein","avatar_url":"https://avatars.githubusercontent.com/u/5606771?"},"repo":{"id":28014200,"name":"rchoetzlein/luna","url":"https://api.github.com/repos/rchoetzlein/luna"},"payload":{"push_id":536753407,"size":2,"distinct_size":1,"ref":"refs/heads/release","head":"0406bbe059f3d0121cff67e5e2afeb2510b97dfc","before":"ea9868cd5999171ed66ccca64f33db74c4901104","commits":[{"sha":"6ae249b814f81055c160ea612e3817a582a819f0","author":{"email":"8b97780f57e4074b50b20f54327dcaeef1063a29@gmail.com","name":"Rama Hoetzlein"},"message":"testing","distinct":false,"url":"https://api.github.com/repos/rchoetzlein/luna/commits/6ae249b814f81055c160ea612e3817a582a819f0"},{"sha":"0406bbe059f3d0121cff67e5e2afeb2510b97dfc","author":{"email":"8b97780f57e4074b50b20f54327dcaeef1063a29@gmail.com","name":"Rama Hoetzlein"},"message":"Merge branch 'rama' into release","distinct":true,"url":"https://api.github.com/repos/rchoetzlein/luna/commits/0406bbe059f3d0121cff67e5e2afeb2510b97dfc"}]},"public":true,"created_at":"2015-01-01T01:06:23Z"}
{"id":"2489398569","type":"PushEvent","actor":{"id":4379694,"login":"moongato","gravatar_id":"","url":"https://api.github.com/users/moongato","avatar_url":"https://avatars.githubusercontent.com/u/4379694?"},"repo":{"id":11769101,"name":"moongato/android_packages_apps_settings","url":"https://api.github.com/repos/moongato/android_packages_apps_settings"},"payload":{"push_id":536753409,"size":3,"distinct_size":3,"ref":"refs/heads/lp50x-test","head":"5b4781c9b6ff5d41e22f14aaac8d384ed85d0c19","before":"56646a94c0aedc577d5db224058fb9be4c927786","commits":[{"sha":"e53c63b3254c37b69e9fcf05b69a1b2fb7f1858c","author":{"email":"0fdcc473619717889ce3a7389c2487333487bab5@gmail.com","name":"rascarlo"},"message":"volume rocker music controls","distinct":true,"url":"https://api.github.com/repos/moongato/android_packages_apps_settings/commits/e53c63b3254c37b69e9fcf05b69a1b2fb7f1858c"},{"sha":"bebb75fdaa4a085c814ea6d2551899593454440d","author":{"email":"0fdcc473619717889ce3a7389c2487333487bab5@gmail.com","name":"rascarlo"},"message":"status bar brightness control edits.\n\nremove check for SCREEN_BRIGHTNESS_MODE_AUTOMATIC","distinct":true,"url":"https://api.github.com/repos/moongato/android_packages_apps_settings/commits/bebb75fdaa4a085c814ea6d2551899593454440d"},{"sha":"5b4781c9b6ff5d41e22f14aaac8d384ed85d0c19","author":{"email":"22e0f38e0fc64da9129ff9b9ef030b39415294a1@ubuntu","name":"moongato"},"message":"Merge remote-tracking branch 'upstream/lollipop-ras-mr1' into lp50x-test","distinct":true,"url":"https://api.github.com/repos/moongato/android_packages_apps_settings/commits/5b4781c9b6ff5d41e22f14aaac8d384ed85d0c19"}]},"public":true,"created_at":"2015-01-01T01:06:23Z"}
{"id":"2489398571","type":"PushEvent","actor":{"id":10355660,"login":"nomadturk","gravatar_id":"","url":"https://api.github.com/users/nomadturk","avatar_url":"https://avatars.githubusercontent.com/u/10355660?"},"repo":{"id":28657737,"name":"nomadturk/nginx-conf","url":"https://api.github.com/repos/nomadturk/nginx-conf"},"payload":{"push_id":536753411,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f560a8bd7c3d688fd6b99a5976e3518fbbfd68a3","before":"5c897fb95e40e2b52b31c71de5eaed81d9989c6d","commits":[{"sha":"f560a8bd7c3d688fd6b99a5976e3518fbbfd68a3","author":{"email":"90283840d90de49b8e7984bd99b47fee0d4bd50d@cokh.net","name":"nomadturk"},"message":"Update pagespeed.add","distinct":true,"url":"https://api.github.com/repos/nomadturk/nginx-conf/commits/f560a8bd7c3d688fd6b99a5976e3518fbbfd68a3"}]},"public":true,"created_at":"2015-01-01T01:06:24Z"}
{"id":"2489398573","type":"PushEvent","actor":{"id":5674054,"login":"winsphinx","gravatar_id":"","url":"https://api.github.com/users/winsphinx","avatar_url":"https://avatars.githubusercontent.com/u/5674054?"},"repo":{"id":24920694,"name":"winsphinx/MyDesktop","url":"https://api.github.com/repos/winsphinx/MyDesktop"},"payload":{"push_id":536753412,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e9598c0de93d13ac89e00771bbdd1ac0cadaa6c4","before":"a76c17c45cc8caf929cfeb0ccd1ebf88d5eb9773","commits":[{"sha":"e9598c0de93d13ac89e00771bbdd1ac0cadaa6c4","author":{"email":"fcb6a490c5f10779ac384c021b9111357615f586@gmail.com","name":"winsphinx"},"message":"add notepad2","distinct":true,"url":"https://api.github.com/repos/winsphinx/MyDesktop/commits/e9598c0de93d13ac89e00771bbdd1ac0cadaa6c4"}]},"public":true,"created_at":"2015-01-01T01:06:24Z"}
{"id":"2489398574","type":"PullRequestReviewCommentEvent","actor":{"id":523287,"login":"j2sol","gravatar_id":"","url":"https://api.github.com/users/j2sol","avatar_url":"https://avatars.githubusercontent.com/u/523287?"},"repo":{"id":11848896,"name":"blueboxgroup/ursula","url":"https://api.github.com/repos/blueboxgroup/ursula"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397298","id":22397298,"diff_hunk":"@@ -1,121 +1,92 @@\n ---\n-- name: install apache\n-  apt: pkg={{ item }}\n-  with_items:\n-    - apache2\n-    - libapache2-mod-wsgi\n-\n - name: lesscpy must be in apache PATH\n   pip: name=lesscpy version=0.9j\n \n - name: get horizon source repo\n-  git: repo={{ openstack.git_mirror }}/horizon.git\n-       dest=/opt/stack/horizon\n-       version={{ horizon.rev }}\n-       update={{ openstack.git_update }}\n+  git: |\n+    repo={{ openstack.git_mirror}}/horizon.git\n+    dest=/opt/stack/horizon\n+    version={{ horizon.rev }}\n+    update={{ openstack.git_update }}\n   notify:\n     - setup horizon venv\n     - compress horizon assets\n \n-- template: src=opt/stack/horizon/hide-external-networks.patch dest=/opt/stack/horizon/hide-external-networks.patch mode=0644\n-- shell: patch -p1 < hide-external-networks.patch chdir=/opt/stack/horizon\n-  notify:\n-    - setup horizon venv\n-\n - name: add python-memcached to horizon requirements\n-  lineinfile: dest=/opt/stack/horizon/requirements.txt\n-              regexp=^python-memcached\n-              line=python-memcached\n+  lineinfile: dest=/opt/stack/horizon/requirements.txt regexp=^python-memcached line=python-memcached\n   notify:\n     - setup horizon venv\n \n-- name: disable apache status\n-  command: a2dismod status\n-  notify:\n-    - restart apache\n-\n-- name: apache ports config\n-  template: src=etc/apache2/ports.conf\n-            dest=/etc/apache2/ports.conf\n-  notify:\n-    - restart apache\n-\n-- name: disable default apache 
site\n-  command: a2dissite 000-default\n+- name: make sure apache knows about horizon ports\n+  lineinfile: dest=/etc/apache2/ports.conf line=\"Listen 8080\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config (12.04)\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard\n+- name: create dashboard virtualhost on precise\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard\n   when: ansible_distribution_version == \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard.conf\n+- name: create dashboard virtualhost on other\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard.conf\n   when: ansible_distribution_version != \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n - name: enable horizon apache site\n-  command: a2ensite openstack_dashboard\n+  apache2_site: state=enabled name=openstack_dashboard\n   notify:\n-    - restart apache\n-\n-- name: static asset directories\n-  file: dest={{ item }}\n-        state=directory\n-        owner=www-data\n-        group=www-data\n-        mode=0755\n+    - reload apache\n+\n+- name: create static asset dirs\n+  file: |\n+    dest={{ item }}\n+    state=directory\n+    owner=www-data\n+    group=www-data\n+    mode=0755\n   with_items:\n     - /opt/stack/horizon/static\n     - /opt/stack/horizon/static/dashboard\n \n-- name: horizon local settings\n-  template: src=opt/stack/horizon/openstack_dashboard/local/local_settings.py\n-            dest=/opt/stack/horizon/openstack_dashboard/local/local_settings.py\n-            
mode=0644\n+- name: dashboard settings\n+  template: |\n+    src=opt/stack/horizon/openstack_dashboard/local/local_settings.py\n+    dest=/opt/stack/horizon/openstack_dashboard/local/local_settings.py\n+    mode=0644\n   notify:\n-    - restart apache\n+    - reload apache\n \n - name: custom horizon logo\n-  get_url: url={{ horizon.logo_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo.png\n-           mode=0644 force=yes\n+  get_url: url={{ horizon.logo_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo.png mode=0644 force=yes\n \n - name: custom horizon splash logo\n-  get_url: url={{ horizon.logo_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo-splash.png\n-           mode=0644 force=yes\n+  get_url: url={{ horizon.logo_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo-splash.png mode=0644 force=yes\n \n - name: custom horizon favicon\n-  get_url: url={{ horizon.favicon_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/favicon.ico\n-           force=yes\n+  get_url: url={{ horizon.favicon_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/favicon.ico force=yes\n \n - name: put images and fonts where apache can find them\n-  file: src=/opt/stack/horizon/openstack_dashboard/static/dashboard/{{ item }}\n-        dest=/opt/stack/horizon/static/dashboard/{{ item }}\n-        state=link\n-        owner=www-data\n-        group=www-data\n+  file: |\n+    src=/opt/stack/horizon/openstack_dashboard/static/dashboard/{{ item }}\n+    dest=/opt/stack/horizon/static/dashboard/{{ item }}\n+    state=link\n+    owner=www-data\n+    group=www-data\n   with_items:\n     - img\n     - fonts\n \n-# flush before ensuring apache running, saves immediate restart\n-- meta: flush_handlers\n-\n-- name: ensure apache started\n+- name: ensure apache is 
running","path":"roles/horizon/tasks/main.yml","position":157,"original_position":157,"commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","original_commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"j2sol","id":523287,"avatar_url":"https://avatars.githubusercontent.com/u/523287?v=3","gravatar_id":"","url":"https://api.github.com/users/j2sol","html_url":"https://github.com/j2sol","followers_url":"https://api.github.com/users/j2sol/followers","following_url":"https://api.github.com/users/j2sol/following{/other_user}","gists_url":"https://api.github.com/users/j2sol/gists{/gist_id}","starred_url":"https://api.github.com/users/j2sol/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/j2sol/subscriptions","organizations_url":"https://api.github.com/users/j2sol/orgs","repos_url":"https://api.github.com/users/j2sol/repos","events_url":"https://api.github.com/users/j2sol/events{/privacy}","received_events_url":"https://api.github.com/users/j2sol/received_events","type":"User","site_admin":false},"body":"Now you have a start followed by an immediate reload. 
Will apache be okay with that?","created_at":"2015-01-01T01:06:24Z","updated_at":"2015-01-01T01:06:24Z","html_url":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397298","pull_request_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397298"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397298"},"pull_request":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"}}},"pull_request":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","id":26738851,"html_url":"https://github.com/blueboxgroup/ursula/pull/705","diff_url":"https://github.com/blueboxgroup/ursula/pull/705.diff","patch_url":"https://github.com/blueboxgroup/ursula/pull/705.patch","issue_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705","number":705,"state":"open","locked":false,"title":"WIP:  apache for loadbalancing","user":{"login":"paulczar","id":2488346,"avatar_url":"https://avatars.githubusercontent.com/u/2488346?v=3","gravatar_id":"","url":"https://api.github.com/users/paulczar","html_url":"https://github.com/paulczar","followers_url":"https://api.github.com/users/paulczar/followers","following_url":"https://api.github.com/users/paulczar/following{/other_user}","gists_url":"https://api.github.com/users/paulczar/gists{/gist_id}","starred_url":"https://api.github.com/users/paulczar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/paulczar/subscriptions","organizations_url":"https://api.github.com/users/paulczar/orgs","repos_url":"https://api.github.com/users/paulczar/repos","events_url":"https://api.github.com/users/paulczar/events{/privacy}","received_events_url":"https://api.github.com/users/paulczar/received_events","type":"User","site_admin":false},"body":"This is a quick POC / WIP to demo using apache instead of haproxy for loadbalancing our APIs.\r\n\r\nI think this gives 
us more flexibiltiy as we can enable in the APIs role itself ( in this case in keystone ) rather than a big monolithic haproxy.conf.      We also already have apache running for horizon, so it could reduce number of services.    apache also has better logging options that haproxy which can only log to syslog. ","created_at":"2015-01-01T00:04:13Z","updated_at":"2015-01-01T01:06:24Z","closed_at":null,"merged_at":null,"merge_commit_sha":"9b91693f11e166c9ee53836f19697868d412bf76","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits","review_comments_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments","review_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f","head":{"label":"blueboxgroup:use_apache_for_lb","ref":"use_apache_for_lb","sha":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_event
s","type":"Organization","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating 
OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/commen
ts/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"base":{"label":"blueboxgroup:master","ref":"master","sha":"34b83c65ff0de2f8b006d8ce4f76919fe0167bbf","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/fo
llowing{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating 
OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/commen
ts/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705"},"issue":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705"},"comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments"},"review_comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments"},"review_comment":{"href":"https://
api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits"},"statuses":{"href":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f"}}}},"public":true,"created_at":"2015-01-01T01:06:24Z","org":{"id":458705,"login":"blueboxgroup","gravatar_id":"","url":"https://api.github.com/orgs/blueboxgroup","avatar_url":"https://avatars.githubusercontent.com/u/458705?"}}
{"id":"2489398577","type":"IssueCommentEvent","actor":{"id":993322,"login":"qiangxue","gravatar_id":"","url":"https://api.github.com/users/qiangxue","avatar_url":"https://avatars.githubusercontent.com/u/993322?"},"repo":{"id":3431193,"name":"yiisoft/yii2","url":"https://api.github.com/repos/yiisoft/yii2"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/yiisoft/yii2/issues/6708","labels_url":"https://api.github.com/repos/yiisoft/yii2/issues/6708/labels{/name}","comments_url":"https://api.github.com/repos/yiisoft/yii2/issues/6708/comments","events_url":"https://api.github.com/repos/yiisoft/yii2/issues/6708/events","html_url":"https://github.com/yiisoft/yii2/issues/6708","id":53187446,"number":6708,"title":"PHP Notice when working with related records","user":{"login":"SDKiller","id":2150916,"avatar_url":"https://avatars.githubusercontent.com/u/2150916?v=3","gravatar_id":"","url":"https://api.github.com/users/SDKiller","html_url":"https://github.com/SDKiller","followers_url":"https://api.github.com/users/SDKiller/followers","following_url":"https://api.github.com/users/SDKiller/following{/other_user}","gists_url":"https://api.github.com/users/SDKiller/gists{/gist_id}","starred_url":"https://api.github.com/users/SDKiller/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/SDKiller/subscriptions","organizations_url":"https://api.github.com/users/SDKiller/orgs","repos_url":"https://api.github.com/users/SDKiller/repos","events_url":"https://api.github.com/users/SDKiller/events{/privacy}","received_events_url":"https://api.github.com/users/SDKiller/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/yiisoft/yii2/labels/status%3Aneed+more+info","name":"status:need more info","color":"d4c5f9"}],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":4,"created_at":"2014-12-31T15:04:22Z","updated_at":"2015-01-01T01:06:23Z","closed_at":null,"body":"```\r\nPHP Notice 
– yii\\base\\ErrorException\r\nIndirect modification of overloaded property common\\models\\catalog\\Categories::$subCategories has no effect\r\n```\r\n\r\nBut if I supress error reporting - everything works fine, related records are processed as expected.\r\nAm I doing something wrong or it is a drawback of relations `magic`?\r\n\r\n\r\nin controller:\r\n```\r\n    ....\r\n        $category = Categories::find()\r\n            ->where($condition)\r\n            ->with('subCategories')\r\n            ->one();\r\n\r\n        $category->buildPaths();\r\n    ...\r\n```\r\n\r\n\r\nin `Categories` model\r\n```\r\n...\r\n    /**\r\n     * Relation with \\common\\models\\catalog\\Categories to retrieve sub-categories\r\n     */\r\n    public function getSubCategories()\r\n    {\r\n        return $this->hasMany(Categories::className(), ['parent' => '_id'])\r\n            ->where(['published' => 1])\r\n            ->orderBy(['ordering' => SORT_ASC, 'name' => SORT_ASC]);\r\n    }\r\n\r\n    ...\r\n\r\n    public function buildPaths()\r\n    {\r\n        if (!empty($this->subCategories)) {\r\n            foreach ($this->subCategories as &$subCategory) {\r\n                $subCategory->setPath($this->path . '/' . 
$subCategory->alias);\r\n            }\r\n        }\r\n    }\r\n...\r\n```"},"comment":{"url":"https://api.github.com/repos/yiisoft/yii2/issues/comments/68477358","html_url":"https://github.com/yiisoft/yii2/issues/6708#issuecomment-68477358","issue_url":"https://api.github.com/repos/yiisoft/yii2/issues/6708","id":68477358,"user":{"login":"qiangxue","id":993322,"avatar_url":"https://avatars.githubusercontent.com/u/993322?v=3","gravatar_id":"","url":"https://api.github.com/users/qiangxue","html_url":"https://github.com/qiangxue","followers_url":"https://api.github.com/users/qiangxue/followers","following_url":"https://api.github.com/users/qiangxue/following{/other_user}","gists_url":"https://api.github.com/users/qiangxue/gists{/gist_id}","starred_url":"https://api.github.com/users/qiangxue/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/qiangxue/subscriptions","organizations_url":"https://api.github.com/users/qiangxue/orgs","repos_url":"https://api.github.com/users/qiangxue/repos","events_url":"https://api.github.com/users/qiangxue/events{/privacy}","received_events_url":"https://api.github.com/users/qiangxue/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:23Z","updated_at":"2015-01-01T01:06:23Z","body":"Why do you use `&$subCategory`?"}},"public":true,"created_at":"2015-01-01T01:06:24Z","org":{"id":993323,"login":"yiisoft","gravatar_id":"","url":"https://api.github.com/orgs/yiisoft","avatar_url":"https://avatars.githubusercontent.com/u/993323?"}}
{"id":"2489398578","type":"PushEvent","actor":{"id":1684950,"login":"naijaping","gravatar_id":"","url":"https://api.github.com/users/naijaping","avatar_url":"https://avatars.githubusercontent.com/u/1684950?"},"repo":{"id":28650038,"name":"naijaping/awonlist","url":"https://api.github.com/repos/naijaping/awonlist"},"payload":{"push_id":536753415,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"7f482e40c0e163ac46ddcfc1c206c6a851e0b62b","before":"f454a5a195625a9128fddb04b192fcc457e82091","commits":[{"sha":"7f482e40c0e163ac46ddcfc1c206c6a851e0b62b","author":{"email":"8a1440b218d23a283d388025f7c9dc3555009ec5@gmail.com","name":"naijaping"},"message":"Update uk","distinct":true,"url":"https://api.github.com/repos/naijaping/awonlist/commits/7f482e40c0e163ac46ddcfc1c206c6a851e0b62b"}]},"public":true,"created_at":"2015-01-01T01:06:24Z"}
{"id":"2489398579","type":"CreateEvent","actor":{"id":3960243,"login":"wp-plugins-user","gravatar_id":"","url":"https://api.github.com/users/wp-plugins-user","avatar_url":"https://avatars.githubusercontent.com/u/3960243?"},"repo":{"id":22870574,"name":"wp-plugins/chamber-dashboard-business-directory","url":"https://api.github.com/repos/wp-plugins/chamber-dashboard-business-directory"},"payload":{"ref":"1.9","ref_type":"tag","master_branch":"master","description":"WordPress.org Plugin Mirror","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:06:24Z","org":{"id":2996849,"login":"wp-plugins","gravatar_id":"","url":"https://api.github.com/orgs/wp-plugins","avatar_url":"https://avatars.githubusercontent.com/u/2996849?"}}
{"id":"2489398580","type":"PushEvent","actor":{"id":739622,"login":"treydock","gravatar_id":"","url":"https://api.github.com/users/treydock","avatar_url":"https://avatars.githubusercontent.com/u/739622?"},"repo":{"id":23934080,"name":"idhmc-tamu/emop-dashboard","url":"https://api.github.com/repos/idhmc-tamu/emop-dashboard"},"payload":{"push_id":536753416,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f26c3459c2f4116b0a267740239059c68bdf9995","before":"668e7ea0bdfc797da70795b9b9ae61bead37b3fb","commits":[{"sha":"f26c3459c2f4116b0a267740239059c68bdf9995","author":{"email":"ea4a4ed01189a93e0c88f9f6e05a922974b21422@tamu.edu","name":"Trey Dockendorf"},"message":"Update FontsController\n* Use ActiveRecord methods for performing queries to database rather than raw SQL\n* Streamline much of the code to be simpler\n* Correct indentation issue to be 2-spaces to indent\n* Add unit tests\n\nModel updates\n* Associate PrintFront and Work models\n* Validate that a PrintFront instance's name value (pf_name) is unique\n* Add instance method to Font model that generates the traineddata path rather than creating the path in controllers","distinct":true,"url":"https://api.github.com/repos/idhmc-tamu/emop-dashboard/commits/f26c3459c2f4116b0a267740239059c68bdf9995"}]},"public":true,"created_at":"2015-01-01T01:06:24Z","org":{"id":4932222,"login":"idhmc-tamu","gravatar_id":"","url":"https://api.github.com/orgs/idhmc-tamu","avatar_url":"https://avatars.githubusercontent.com/u/4932222?"}}
{"id":"2489398582","type":"PushEvent","actor":{"id":3960243,"login":"wp-plugins-user","gravatar_id":"","url":"https://api.github.com/users/wp-plugins-user","avatar_url":"https://avatars.githubusercontent.com/u/3960243?"},"repo":{"id":22870574,"name":"wp-plugins/chamber-dashboard-business-directory","url":"https://api.github.com/repos/wp-plugins/chamber-dashboard-business-directory"},"payload":{"push_id":536753417,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"52cd22ebee5fa319aa244d232c376aec6865ba16","before":"17c18938eaf97feb2c3f55eb276b6c1145e86969","commits":[{"sha":"52cd22ebee5fa319aa244d232c376aec6865ba16","author":{"email":"ce123eae784bf8ff0a0dbf80492a59e7c0a2bfbf@b8457f37-d9ea-0310-8a92-e5e31aec5664","name":"Gwendydd"},"message":"added social media fields\n\ngit-svn-id: https://plugins.svn.wordpress.org/chamber-dashboard-business-directory/trunk@1057716 b8457f37-d9ea-0310-8a92-e5e31aec5664","distinct":true,"url":"https://api.github.com/repos/wp-plugins/chamber-dashboard-business-directory/commits/52cd22ebee5fa319aa244d232c376aec6865ba16"}]},"public":true,"created_at":"2015-01-01T01:06:24Z","org":{"id":2996849,"login":"wp-plugins","gravatar_id":"","url":"https://api.github.com/orgs/wp-plugins","avatar_url":"https://avatars.githubusercontent.com/u/2996849?"}}
{"id":"2489398584","type":"PushEvent","actor":{"id":2453862,"login":"schloo","gravatar_id":"","url":"https://api.github.com/users/schloo","avatar_url":"https://avatars.githubusercontent.com/u/2453862?"},"repo":{"id":28160579,"name":"azilnik/phetch","url":"https://api.github.com/repos/azilnik/phetch"},"payload":{"push_id":536753420,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"672e3213d883f8d100f0e2d38b1c739ecc39acf5","before":"1b32d9c513558f8cc57ed88edff23b0d45610363","commits":[{"sha":"672e3213d883f8d100f0e2d38b1c739ecc39acf5","author":{"email":"03cd939e5e01f81bd3cbeb1977c82e3d0109cf43@Michelles-Air.home","name":"schloo"},"message":"oops moar","distinct":true,"url":"https://api.github.com/repos/azilnik/phetch/commits/672e3213d883f8d100f0e2d38b1c739ecc39acf5"}]},"public":true,"created_at":"2015-01-01T01:06:24Z"}
{"id":"2489398586","type":"PushEvent","actor":{"id":1445198,"login":"FleurDeLuce","gravatar_id":"","url":"https://api.github.com/users/FleurDeLuce","avatar_url":"https://avatars.githubusercontent.com/u/1445198?"},"repo":{"id":18230007,"name":"FleurDeLuce/Leetcode","url":"https://api.github.com/repos/FleurDeLuce/Leetcode"},"payload":{"push_id":536753422,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"153fe4cc6aeb387647e30f5c67b7572763439d0c","before":"d0dbdf0f946b052673cbe4ea6f9c385788e155c7","commits":[{"sha":"153fe4cc6aeb387647e30f5c67b7572763439d0c","author":{"email":"b8ad7a82476ffa543a8614f8b96f97e16135a3b6@gmail.com","name":"FleurDeLuce"},"message":"factorial trailing zeroes solution added","distinct":true,"url":"https://api.github.com/repos/FleurDeLuce/Leetcode/commits/153fe4cc6aeb387647e30f5c67b7572763439d0c"}]},"public":true,"created_at":"2015-01-01T01:06:25Z"}
{"id":"2489398592","type":"IssueCommentEvent","actor":{"id":4192725,"login":"yangarbiter","gravatar_id":"","url":"https://api.github.com/users/yangarbiter","avatar_url":"https://avatars.githubusercontent.com/u/4192725?"},"repo":{"id":13980094,"name":"botonchou/libdnn","url":"https://api.github.com/repos/botonchou/libdnn"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/botonchou/libdnn/issues/8","labels_url":"https://api.github.com/repos/botonchou/libdnn/issues/8/labels{/name}","comments_url":"https://api.github.com/repos/botonchou/libdnn/issues/8/comments","events_url":"https://api.github.com/repos/botonchou/libdnn/issues/8/events","html_url":"https://github.com/botonchou/libdnn/issues/8","id":53170772,"number":8,"title":"How to lower the total needed shared memory?","user":{"login":"yangarbiter","id":4192725,"avatar_url":"https://avatars.githubusercontent.com/u/4192725?v=3","gravatar_id":"","url":"https://api.github.com/users/yangarbiter","html_url":"https://github.com/yangarbiter","followers_url":"https://api.github.com/users/yangarbiter/followers","following_url":"https://api.github.com/users/yangarbiter/following{/other_user}","gists_url":"https://api.github.com/users/yangarbiter/gists{/gist_id}","starred_url":"https://api.github.com/users/yangarbiter/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/yangarbiter/subscriptions","organizations_url":"https://api.github.com/users/yangarbiter/orgs","repos_url":"https://api.github.com/users/yangarbiter/repos","events_url":"https://api.github.com/users/yangarbiter/events{/privacy}","received_events_url":"https://api.github.com/users/yangarbiter/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/botonchou/libdnn/labels/question","name":"question","color":"cc317c"}],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":4,"created_at":"2014-12-31T06:59:09Z","updated_at":"2015-01-01T01:06:26Z","closed_at":
null,"body":"Hi Chou,\r\n\r\nI am encountering the following problem when trying to run convolutional neural network.\r\n```\r\nterminate called after throwing an instance of 'std::runtime_error'\r\n  what():  [Error] In function \"getSuitableShmConfig\" (at src/cnn-utility.cu:418): Exceeds maximum shared memory available. (49152 bytes)\r\nkernel = (100, 92), grids = (8, 8, 40), threads = (4, 4, 1)  => 75940 bytes of shared memory needed.\r\n```\r\nWhat is the standard way to fix this problem if I really don't have that much memory? (ex. lowering thread count)\r\n\r\nThanks in advance."},"comment":{"url":"https://api.github.com/repos/botonchou/libdnn/issues/comments/68477359","html_url":"https://github.com/botonchou/libdnn/issues/8#issuecomment-68477359","issue_url":"https://api.github.com/repos/botonchou/libdnn/issues/8","id":68477359,"user":{"login":"yangarbiter","id":4192725,"avatar_url":"https://avatars.githubusercontent.com/u/4192725?v=3","gravatar_id":"","url":"https://api.github.com/users/yangarbiter","html_url":"https://github.com/yangarbiter","followers_url":"https://api.github.com/users/yangarbiter/followers","following_url":"https://api.github.com/users/yangarbiter/following{/other_user}","gists_url":"https://api.github.com/users/yangarbiter/gists{/gist_id}","starred_url":"https://api.github.com/users/yangarbiter/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/yangarbiter/subscriptions","organizations_url":"https://api.github.com/users/yangarbiter/orgs","repos_url":"https://api.github.com/users/yangarbiter/repos","events_url":"https://api.github.com/users/yangarbiter/events{/privacy}","received_events_url":"https://api.github.com/users/yangarbiter/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:26Z","updated_at":"2015-01-01T01:06:26Z","body":"Actually the kernel size 23*14 is able to be run on my computer using theano. I am still wondering about what Caffe have done to get the 7% error rate. 
I can only achieve around 15% error rate with Lenet implemented by theano.\r\n\r\nBTW, I found out the the nn-init would crash without any error message when the format of input training data is wrong. (I accidentally start my array from zero) \r\n\r\n"}},"public":true,"created_at":"2015-01-01T01:06:27Z"}
{"id":"2489398593","type":"PushEvent","actor":{"id":1779595,"login":"dcbaker","gravatar_id":"","url":"https://api.github.com/users/dcbaker","avatar_url":"https://avatars.githubusercontent.com/u/1779595?"},"repo":{"id":8488437,"name":"dcbaker/piglit","url":"https://api.github.com/repos/dcbaker/piglit"},"payload":{"push_id":536753426,"size":1,"distinct_size":1,"ref":"refs/heads/wip/command-list-only-v5","head":"4664b69bd21c2dc875eb7ac03be904a6eb371d9c","before":"cf5cf7224385c3c3d086762b5bc1d8f7df031ae7","commits":[{"sha":"4664b69bd21c2dc875eb7ac03be904a6eb371d9c","author":{"email":"c26a678a04c601e0311b0d6006e67eee6ed19a8e@intel.com","name":"Dylan Baker"},"message":"fixup! fixup! all.py: Replace some string concatenation with str.format()","distinct":true,"url":"https://api.github.com/repos/dcbaker/piglit/commits/4664b69bd21c2dc875eb7ac03be904a6eb371d9c"}]},"public":true,"created_at":"2015-01-01T01:06:27Z"}
{"id":"2489398596","type":"PushEvent","actor":{"id":3960243,"login":"wp-plugins-user","gravatar_id":"","url":"https://api.github.com/users/wp-plugins-user","avatar_url":"https://avatars.githubusercontent.com/u/3960243?"},"repo":{"id":27287395,"name":"wp-plugins/spam-hammer","url":"https://api.github.com/repos/wp-plugins/spam-hammer"},"payload":{"push_id":536753429,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"5c71935c5b32807aedcc9533e4e9105b7bf38947","before":"df54c7e1ab24d713b54f4c3660c186982d6cae95","commits":[{"sha":"5c71935c5b32807aedcc9533e4e9105b7bf38947","author":{"email":"8177b3ca125b2874291549da03b6ae3b620b0c28@b8457f37-d9ea-0310-8a92-e5e31aec5664","name":"wpspamhammer"},"message":"Readme.txt Update.  Total Spam Attacks: 15,150,841\n\ngit-svn-id: https://plugins.svn.wordpress.org/spam-hammer/trunk@1057715 b8457f37-d9ea-0310-8a92-e5e31aec5664","distinct":true,"url":"https://api.github.com/repos/wp-plugins/spam-hammer/commits/5c71935c5b32807aedcc9533e4e9105b7bf38947"}]},"public":true,"created_at":"2015-01-01T01:06:27Z","org":{"id":2996849,"login":"wp-plugins","gravatar_id":"","url":"https://api.github.com/orgs/wp-plugins","avatar_url":"https://avatars.githubusercontent.com/u/2996849?"}}
{"id":"2489398600","type":"IssuesEvent","actor":{"id":23202,"login":"aduros","gravatar_id":"","url":"https://api.github.com/users/aduros","avatar_url":"https://avatars.githubusercontent.com/u/23202?"},"repo":{"id":10282042,"name":"HaxeFoundation/haxe","url":"https://api.github.com/repos/HaxeFoundation/haxe"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/HaxeFoundation/haxe/issues/3730","labels_url":"https://api.github.com/repos/HaxeFoundation/haxe/issues/3730/labels{/name}","comments_url":"https://api.github.com/repos/HaxeFoundation/haxe/issues/3730/comments","events_url":"https://api.github.com/repos/HaxeFoundation/haxe/issues/3730/events","html_url":"https://github.com/HaxeFoundation/haxe/issues/3730","id":53210295,"number":3730,"title":"#file support","user":{"login":"aduros","id":23202,"avatar_url":"https://avatars.githubusercontent.com/u/23202?v=3","gravatar_id":"","url":"https://api.github.com/users/aduros","html_url":"https://github.com/aduros","followers_url":"https://api.github.com/users/aduros/followers","following_url":"https://api.github.com/users/aduros/following{/other_user}","gists_url":"https://api.github.com/users/aduros/gists{/gist_id}","starred_url":"https://api.github.com/users/aduros/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/aduros/subscriptions","organizations_url":"https://api.github.com/users/aduros/orgs","repos_url":"https://api.github.com/users/aduros/repos","events_url":"https://api.github.com/users/aduros/events{/privacy}","received_events_url":"https://api.github.com/users/aduros/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:06:27Z","updated_at":"2015-01-01T01:06:27Z","closed_at":null,"body":"#line is pretty useful for compilers that translate to Haxe. 
Would it be possible to also support something like #file to pass the source filename?\r\n\r\nWould be helpful for a project I'm working on, but if it's not an easy change no worries :)\r\n\r\nMight also be useful to @tardisgo?"}},"public":true,"created_at":"2015-01-01T01:06:28Z","org":{"id":3826779,"login":"HaxeFoundation","gravatar_id":"","url":"https://api.github.com/orgs/HaxeFoundation","avatar_url":"https://avatars.githubusercontent.com/u/3826779?"}}
{"id":"2489398601","type":"PushEvent","actor":{"id":4170616,"login":"cmsbuild","gravatar_id":"","url":"https://api.github.com/users/cmsbuild","avatar_url":"https://avatars.githubusercontent.com/u/4170616?"},"repo":{"id":20482496,"name":"cms-sw/cms-sw.github.io","url":"https://api.github.com/repos/cms-sw/cms-sw.github.io"},"payload":{"push_id":536753430,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"714d9b5ebc2cb4242ac08affaf1a0cbce8d02218","before":"e473bfee29d1543bd1dba301d6c1a3ef60dc1248","commits":[{"sha":"714d9b5ebc2cb4242ac08affaf1a0cbce8d02218","author":{"email":"5a25e995b53ac7cd7cc4edf867580fb423e22fde@cern.ch","name":"CMS Build"},"message":"New report generated 20150101-0206","distinct":true,"url":"https://api.github.com/repos/cms-sw/cms-sw.github.io/commits/714d9b5ebc2cb4242ac08affaf1a0cbce8d02218"}]},"public":true,"created_at":"2015-01-01T01:06:28Z","org":{"id":3863500,"login":"cms-sw","gravatar_id":"","url":"https://api.github.com/orgs/cms-sw","avatar_url":"https://avatars.githubusercontent.com/u/3863500?"}}
{"id":"2489398602","type":"PushEvent","actor":{"id":106511,"login":"andrewrk","gravatar_id":"","url":"https://api.github.com/users/andrewrk","avatar_url":"https://avatars.githubusercontent.com/u/106511?"},"repo":{"id":28373474,"name":"thejoshwolfe/nethack","url":"https://api.github.com/repos/thejoshwolfe/nethack"},"payload":{"push_id":536753431,"size":1,"distinct_size":1,"ref":"refs/heads/it-is-time","head":"3231a8162f90ce411af8c23d67cc04584f0ed7fa","before":"b0821d5e5d69c4b72114e3426b6c2b34be07356a","commits":[{"sha":"3231a8162f90ce411af8c23d67cc04584f0ed7fa","author":{"email":"af99923804d57df769e1fbdbabc16e1c5dd902e2@gmail.com","name":"Andrew Kelley"},"message":"bones.c","distinct":true,"url":"https://api.github.com/repos/thejoshwolfe/nethack/commits/3231a8162f90ce411af8c23d67cc04584f0ed7fa"}]},"public":true,"created_at":"2015-01-01T01:06:28Z"}
{"id":"2489398604","type":"WatchEvent","actor":{"id":1570089,"login":"sirvon","gravatar_id":"","url":"https://api.github.com/users/sirvon","avatar_url":"https://avatars.githubusercontent.com/u/1570089?"},"repo":{"id":4605713,"name":"stackmagic/bitly-api-client","url":"https://api.github.com/repos/stackmagic/bitly-api-client"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:06:29Z"}
{"id":"2489398610","type":"ForkEvent","actor":{"id":7791006,"login":"hlk2014","gravatar_id":"","url":"https://api.github.com/users/hlk2014","avatar_url":"https://avatars.githubusercontent.com/u/7791006?"},"repo":{"id":15464223,"name":"linuxdeepin/deepin-emacs","url":"https://api.github.com/repos/linuxdeepin/deepin-emacs"},"payload":{"forkee":{"id":28678280,"name":"deepin-emacs","full_name":"hlk2014/deepin-emacs","owner":{"login":"hlk2014","id":7791006,"avatar_url":"https://avatars.githubusercontent.com/u/7791006?v=3","gravatar_id":"","url":"https://api.github.com/users/hlk2014","html_url":"https://github.com/hlk2014","followers_url":"https://api.github.com/users/hlk2014/followers","following_url":"https://api.github.com/users/hlk2014/following{/other_user}","gists_url":"https://api.github.com/users/hlk2014/gists{/gist_id}","starred_url":"https://api.github.com/users/hlk2014/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/hlk2014/subscriptions","organizations_url":"https://api.github.com/users/hlk2014/orgs","repos_url":"https://api.github.com/users/hlk2014/repos","events_url":"https://api.github.com/users/hlk2014/events{/privacy}","received_events_url":"https://api.github.com/users/hlk2014/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/hlk2014/deepin-emacs","description":"Deepin 
emacs","fork":true,"url":"https://api.github.com/repos/hlk2014/deepin-emacs","forks_url":"https://api.github.com/repos/hlk2014/deepin-emacs/forks","keys_url":"https://api.github.com/repos/hlk2014/deepin-emacs/keys{/key_id}","collaborators_url":"https://api.github.com/repos/hlk2014/deepin-emacs/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/hlk2014/deepin-emacs/teams","hooks_url":"https://api.github.com/repos/hlk2014/deepin-emacs/hooks","issue_events_url":"https://api.github.com/repos/hlk2014/deepin-emacs/issues/events{/number}","events_url":"https://api.github.com/repos/hlk2014/deepin-emacs/events","assignees_url":"https://api.github.com/repos/hlk2014/deepin-emacs/assignees{/user}","branches_url":"https://api.github.com/repos/hlk2014/deepin-emacs/branches{/branch}","tags_url":"https://api.github.com/repos/hlk2014/deepin-emacs/tags","blobs_url":"https://api.github.com/repos/hlk2014/deepin-emacs/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/hlk2014/deepin-emacs/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/hlk2014/deepin-emacs/git/refs{/sha}","trees_url":"https://api.github.com/repos/hlk2014/deepin-emacs/git/trees{/sha}","statuses_url":"https://api.github.com/repos/hlk2014/deepin-emacs/statuses/{sha}","languages_url":"https://api.github.com/repos/hlk2014/deepin-emacs/languages","stargazers_url":"https://api.github.com/repos/hlk2014/deepin-emacs/stargazers","contributors_url":"https://api.github.com/repos/hlk2014/deepin-emacs/contributors","subscribers_url":"https://api.github.com/repos/hlk2014/deepin-emacs/subscribers","subscription_url":"https://api.github.com/repos/hlk2014/deepin-emacs/subscription","commits_url":"https://api.github.com/repos/hlk2014/deepin-emacs/commits{/sha}","git_commits_url":"https://api.github.com/repos/hlk2014/deepin-emacs/git/commits{/sha}","comments_url":"https://api.github.com/repos/hlk2014/deepin-emacs/comments{/number}","issue_comment_url":"https://api.github.com/repos/hlk2014/deepin
-emacs/issues/comments/{number}","contents_url":"https://api.github.com/repos/hlk2014/deepin-emacs/contents/{+path}","compare_url":"https://api.github.com/repos/hlk2014/deepin-emacs/compare/{base}...{head}","merges_url":"https://api.github.com/repos/hlk2014/deepin-emacs/merges","archive_url":"https://api.github.com/repos/hlk2014/deepin-emacs/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/hlk2014/deepin-emacs/downloads","issues_url":"https://api.github.com/repos/hlk2014/deepin-emacs/issues{/number}","pulls_url":"https://api.github.com/repos/hlk2014/deepin-emacs/pulls{/number}","milestones_url":"https://api.github.com/repos/hlk2014/deepin-emacs/milestones{/number}","notifications_url":"https://api.github.com/repos/hlk2014/deepin-emacs/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/hlk2014/deepin-emacs/labels{/name}","releases_url":"https://api.github.com/repos/hlk2014/deepin-emacs/releases{/id}","created_at":"2015-01-01T01:06:30Z","updated_at":"2014-12-13T11:28:12Z","pushed_at":"2014-10-18T01:10:59Z","git_url":"git://github.com/hlk2014/deepin-emacs.git","ssh_url":"git@github.com:hlk2014/deepin-emacs.git","clone_url":"https://github.com/hlk2014/deepin-emacs.git","svn_url":"https://github.com/hlk2014/deepin-emacs","homepage":null,"size":57006,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:06:30Z","org":{"id":1592697,"login":"linuxdeepin","gravatar_id":"","url":"https://api.github.com/orgs/linuxdeepin","avatar_url":"https://avatars.githubusercontent.com/u/1592697?"}}
{"id":"2489398617","type":"IssueCommentEvent","actor":{"id":1802542,"login":"ishayyaari","gravatar_id":"","url":"https://api.github.com/users/ishayyaari","avatar_url":"https://avatars.githubusercontent.com/u/1802542?"},"repo":{"id":4967600,"name":"MiYa-Solutions/sbcx","url":"https://api.github.com/repos/MiYa-Solutions/sbcx"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/MiYa-Solutions/sbcx/issues/708","labels_url":"https://api.github.com/repos/MiYa-Solutions/sbcx/issues/708/labels{/name}","comments_url":"https://api.github.com/repos/MiYa-Solutions/sbcx/issues/708/comments","events_url":"https://api.github.com/repos/MiYa-Solutions/sbcx/issues/708/events","html_url":"https://github.com/MiYa-Solutions/sbcx/issues/708","id":53092805,"number":708,"title":"Mobile: Projects","user":{"login":"ishayyaari","id":1802542,"avatar_url":"https://avatars.githubusercontent.com/u/1802542?v=3","gravatar_id":"","url":"https://api.github.com/users/ishayyaari","html_url":"https://github.com/ishayyaari","followers_url":"https://api.github.com/users/ishayyaari/followers","following_url":"https://api.github.com/users/ishayyaari/following{/other_user}","gists_url":"https://api.github.com/users/ishayyaari/gists{/gist_id}","starred_url":"https://api.github.com/users/ishayyaari/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ishayyaari/subscriptions","organizations_url":"https://api.github.com/users/ishayyaari/orgs","repos_url":"https://api.github.com/users/ishayyaari/repos","events_url":"https://api.github.com/users/ishayyaari/events{/privacy}","received_events_url":"https://api.github.com/users/ishayyaari/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/MiYa-Solutions/sbcx/labels/High","name":"High","color":"FF0000"},{"url":"https://api.github.com/repos/MiYa-Solutions/sbcx/labels/UI+Feature","name":"UI 
Feature","color":"02e10c"}],"state":"open","locked":false,"assignee":{"login":"ishayyaari","id":1802542,"avatar_url":"https://avatars.githubusercontent.com/u/1802542?v=3","gravatar_id":"","url":"https://api.github.com/users/ishayyaari","html_url":"https://github.com/ishayyaari","followers_url":"https://api.github.com/users/ishayyaari/followers","following_url":"https://api.github.com/users/ishayyaari/following{/other_user}","gists_url":"https://api.github.com/users/ishayyaari/gists{/gist_id}","starred_url":"https://api.github.com/users/ishayyaari/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/ishayyaari/subscriptions","organizations_url":"https://api.github.com/users/ishayyaari/orgs","repos_url":"https://api.github.com/users/ishayyaari/repos","events_url":"https://api.github.com/users/ishayyaari/events{/privacy}","received_events_url":"https://api.github.com/users/ishayyaari/received_events","type":"User","site_admin":false},"milestone":{"url":"https://api.github.com/repos/MiYa-Solutions/sbcx/milestones/10","labels_url":"https://api.github.com/repos/MiYa-Solutions/sbcx/milestones/10/labels","id":835988,"number":10,"title":"Rug Wash Bug Fixes","description":"Fixes specifically for the rug wash 
opportunity","creator":{"login":"markmilman","id":1744318,"avatar_url":"https://avatars.githubusercontent.com/u/1744318?v=3","gravatar_id":"","url":"https://api.github.com/users/markmilman","html_url":"https://github.com/markmilman","followers_url":"https://api.github.com/users/markmilman/followers","following_url":"https://api.github.com/users/markmilman/following{/other_user}","gists_url":"https://api.github.com/users/markmilman/gists{/gist_id}","starred_url":"https://api.github.com/users/markmilman/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/markmilman/subscriptions","organizations_url":"https://api.github.com/users/markmilman/orgs","repos_url":"https://api.github.com/users/markmilman/repos","events_url":"https://api.github.com/users/markmilman/events{/privacy}","received_events_url":"https://api.github.com/users/markmilman/received_events","type":"User","site_admin":false},"open_issues":6,"closed_issues":37,"state":"open","created_at":"2014-10-22T14:08:56Z","updated_at":"2015-01-01T01:05:32Z","due_on":"2014-11-11T08:00:00Z","closed_at":null},"comments":1,"created_at":"2014-12-30T04:38:31Z","updated_at":"2015-01-01T01:06:31Z","closed_at":null,"body":"\r\n\r\n"},"comment":{"url":"https://api.github.com/repos/MiYa-Solutions/sbcx/issues/comments/68477360","html_url":"https://github.com/MiYa-Solutions/sbcx/issues/708#issuecomment-68477360","issue_url":"https://api.github.com/repos/MiYa-Solutions/sbcx/issues/708","id":68477360,"user":{"login":"ishayyaari","id":1802542,"avatar_url":"https://avatars.githubusercontent.com/u/1802542?v=3","gravatar_id":"","url":"https://api.github.com/users/ishayyaari","html_url":"https://github.com/ishayyaari","followers_url":"https://api.github.com/users/ishayyaari/followers","following_url":"https://api.github.com/users/ishayyaari/following{/other_user}","gists_url":"https://api.github.com/users/ishayyaari/gists{/gist_id}","starred_url":"https://api.github.com/users/ishayyaari/starred{/owner}{/repo}","subsc
riptions_url":"https://api.github.com/users/ishayyaari/subscriptions","organizations_url":"https://api.github.com/users/ishayyaari/orgs","repos_url":"https://api.github.com/users/ishayyaari/repos","events_url":"https://api.github.com/users/ishayyaari/events{/privacy}","received_events_url":"https://api.github.com/users/ishayyaari/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:31Z","updated_at":"2015-01-01T01:06:31Z","body":"Add link - new project\r\nDesign screen:\r\nnew project\r\nproject show\r\nprojects index\r\n\r\nAdd link to New Job\r\n"}},"public":true,"created_at":"2015-01-01T01:06:32Z","org":{"id":1788572,"login":"MiYa-Solutions","gravatar_id":"","url":"https://api.github.com/orgs/MiYa-Solutions","avatar_url":"https://avatars.githubusercontent.com/u/1788572?"}}
{"id":"2489398618","type":"PushEvent","actor":{"id":280212,"login":"KenanSulayman","gravatar_id":"","url":"https://api.github.com/users/KenanSulayman","avatar_url":"https://avatars.githubusercontent.com/u/280212?"},"repo":{"id":21481110,"name":"KenanSulayman/heartbeat","url":"https://api.github.com/repos/KenanSulayman/heartbeat"},"payload":{"push_id":536753434,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"cf281dd3839c3e07ed867a2eb77aa4965a2a1400","before":"4a08cf46a835742f49c5272d70f3210529dbb819","commits":[{"sha":"cf281dd3839c3e07ed867a2eb77aa4965a2a1400","author":{"email":"9176253dfc0bc82671a5e984646605f93319147a@sly.mn","name":"Kenan Sulayman"},"message":"1420074389244\n\nnRgGIKdriEl0S2qJGXnQVTH0OZV30N+8iE2Gf95JgnQ=","distinct":true,"url":"https://api.github.com/repos/KenanSulayman/heartbeat/commits/cf281dd3839c3e07ed867a2eb77aa4965a2a1400"}]},"public":true,"created_at":"2015-01-01T01:06:33Z"}
{"id":"2489398619","type":"PushEvent","actor":{"id":5240798,"login":"hxwang","gravatar_id":"","url":"https://api.github.com/users/hxwang","avatar_url":"https://avatars.githubusercontent.com/u/5240798?"},"repo":{"id":20258812,"name":"hxwang/Leetcode","url":"https://api.github.com/repos/hxwang/Leetcode"},"payload":{"push_id":536753435,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"628e4f129b5723f944d1a7887509c737762b2821","before":"e67f3471c2ea1c6556ff18137af91f8d92e5e39d","commits":[{"sha":"628e4f129b5723f944d1a7887509c737762b2821","author":{"email":"320cb2ff8e2e195f7d4e5cd3b27b690e919d61e5@gmail.com","name":"Huangxin"},"message":"Update summary-types.md","distinct":true,"url":"https://api.github.com/repos/hxwang/Leetcode/commits/628e4f129b5723f944d1a7887509c737762b2821"}]},"public":true,"created_at":"2015-01-01T01:06:33Z"}
{"id":"2489398634","type":"WatchEvent","actor":{"id":117788,"login":"nyarla","gravatar_id":"","url":"https://api.github.com/users/nyarla","avatar_url":"https://avatars.githubusercontent.com/u/117788?"},"repo":{"id":28594887,"name":"opennota/macro","url":"https://api.github.com/repos/opennota/macro"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:06:34Z"}
{"id":"2489398636","type":"PushEvent","actor":{"id":9882658,"login":"sw1308","gravatar_id":"","url":"https://api.github.com/users/sw1308","avatar_url":"https://avatars.githubusercontent.com/u/9882658?"},"repo":{"id":27245135,"name":"sw1308/Programming","url":"https://api.github.com/repos/sw1308/Programming"},"payload":{"push_id":536753444,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"64297900b95bff1508a18a31e53ff9f25a89b7f7","before":"6d0cc02640c6ad8a909736a0415cf95f8e43f693","commits":[{"sha":"64297900b95bff1508a18a31e53ff9f25a89b7f7","author":{"email":"4c225d032373d049685b78ca1f2e87cbde7ff0e2@york.ac.uk","name":"sw1308"},"message":"Created new files for graphics testing","distinct":true,"url":"https://api.github.com/repos/sw1308/Programming/commits/64297900b95bff1508a18a31e53ff9f25a89b7f7"}]},"public":true,"created_at":"2015-01-01T01:06:34Z"}
{"id":"2489398638","type":"WatchEvent","actor":{"id":30923,"login":"digitalsanctum","gravatar_id":"","url":"https://api.github.com/users/digitalsanctum","avatar_url":"https://avatars.githubusercontent.com/u/30923?"},"repo":{"id":16621659,"name":"real-logic/Aeron","url":"https://api.github.com/repos/real-logic/Aeron"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:06:37Z","org":{"id":5371471,"login":"real-logic","gravatar_id":"","url":"https://api.github.com/orgs/real-logic","avatar_url":"https://avatars.githubusercontent.com/u/5371471?"}}
{"id":"2489398640","type":"IssuesEvent","actor":{"id":8218499,"login":"GunZi200","gravatar_id":"","url":"https://api.github.com/users/GunZi200","avatar_url":"https://avatars.githubusercontent.com/u/8218499?"},"repo":{"id":27030606,"name":"GunZi200/Memory-Colour","url":"https://api.github.com/repos/GunZi200/Memory-Colour"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/GunZi200/Memory-Colour/issues/2","labels_url":"https://api.github.com/repos/GunZi200/Memory-Colour/issues/2/labels{/name}","comments_url":"https://api.github.com/repos/GunZi200/Memory-Colour/issues/2/comments","events_url":"https://api.github.com/repos/GunZi200/Memory-Colour/issues/2/events","html_url":"https://github.com/GunZi200/Memory-Colour/issues/2","id":53210296,"number":2,"title":"Heart is rendered incorrectly","user":{"login":"GunZi200","id":8218499,"avatar_url":"https://avatars.githubusercontent.com/u/8218499?v=3","gravatar_id":"","url":"https://api.github.com/users/GunZi200","html_url":"https://github.com/GunZi200","followers_url":"https://api.github.com/users/GunZi200/followers","following_url":"https://api.github.com/users/GunZi200/following{/other_user}","gists_url":"https://api.github.com/users/GunZi200/gists{/gist_id}","starred_url":"https://api.github.com/users/GunZi200/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/GunZi200/subscriptions","organizations_url":"https://api.github.com/users/GunZi200/orgs","repos_url":"https://api.github.com/users/GunZi200/repos","events_url":"https://api.github.com/users/GunZi200/events{/privacy}","received_events_url":"https://api.github.com/users/GunZi200/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/GunZi200/Memory-Colour/labels/bug","name":"bug","color":"fc2929"}],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:06:35Z","updated_at":"2015-01-01T01:06:35Z","closed_at":null,"body":"On some 
devices(at least iPhone), the two circles and diamond that make up the heart can be seen clearly. Displaying sharp edges and not a smooth heart icon.\r\n\r\nThis will me fixed soon."}},"public":true,"created_at":"2015-01-01T01:06:37Z"}
{"id":"2489398646","type":"PushEvent","actor":{"id":506010,"login":"gabeshaughnessy","gravatar_id":"","url":"https://api.github.com/users/gabeshaughnessy","avatar_url":"https://avatars.githubusercontent.com/u/506010?"},"repo":{"id":13913264,"name":"gabeshaughnessy/augmentedart","url":"https://api.github.com/repos/gabeshaughnessy/augmentedart"},"payload":{"push_id":536753451,"size":1,"distinct_size":1,"ref":"refs/heads/dungeon-hacker","head":"dcb8b8efe59d396379657ae1d6884406e628fbdb","before":"1855adda47047b9a781de334f4616c312ec65dc6","commits":[{"sha":"dcb8b8efe59d396379657ae1d6884406e628fbdb","author":{"email":"a2b2bb6e7f1b10ac88b326d5c10e33af6a8546bc@gmail.com","name":"gabeshaughnessy"},"message":"task list","distinct":true,"url":"https://api.github.com/repos/gabeshaughnessy/augmentedart/commits/dcb8b8efe59d396379657ae1d6884406e628fbdb"}]},"public":true,"created_at":"2015-01-01T01:06:38Z"}
{"id":"2489398647","type":"PushEvent","actor":{"id":433707,"login":"ile","gravatar_id":"","url":"https://api.github.com/users/ile","avatar_url":"https://avatars.githubusercontent.com/u/433707?"},"repo":{"id":26847132,"name":"kantele/k-templates","url":"https://api.github.com/repos/kantele/k-templates"},"payload":{"push_id":536753448,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"bd9e3811383e5c3fc3bbd2b9ddd90047df70e7c5","before":"274cca1b2adc063b47d558ac9bafa0dce7a05abb","commits":[{"sha":"bd9e3811383e5c3fc3bbd2b9ddd90047df70e7c5","author":{"email":"4f3407de78bccc8cc160ee4d278d5efe7162e6b5@nateps.com","name":"Nate Smith"},"message":"fix relative paths inside of views to return parent","distinct":true,"url":"https://api.github.com/repos/kantele/k-templates/commits/bd9e3811383e5c3fc3bbd2b9ddd90047df70e7c5"}]},"public":true,"created_at":"2015-01-01T01:06:38Z","org":{"id":5687585,"login":"kantele","gravatar_id":"","url":"https://api.github.com/orgs/kantele","avatar_url":"https://avatars.githubusercontent.com/u/5687585?"}}
{"id":"2489398653","type":"PushEvent","actor":{"id":4729139,"login":"poschengband","gravatar_id":"","url":"https://api.github.com/users/poschengband","avatar_url":"https://avatars.githubusercontent.com/u/4729139?"},"repo":{"id":10765478,"name":"poschengband/poschengband","url":"https://api.github.com/repos/poschengband/poschengband"},"payload":{"push_id":536753455,"size":1,"distinct_size":1,"ref":"refs/heads/develop","head":"a3a5ea26c7a02f84e24b2866eadc12f00ff681d1","before":"de2d3a235737a729201a3b0578f9bfc73731dc20","commits":[{"sha":"a3a5ea26c7a02f84e24b2866eadc12f00ff681d1","author":{"email":"59f8025d5107eab2ad159f3dd097ebc035e401a3@gmail.com","name":"poschengband"},"message":"Possessor: Playtesting","distinct":true,"url":"https://api.github.com/repos/poschengband/poschengband/commits/a3a5ea26c7a02f84e24b2866eadc12f00ff681d1"}]},"public":true,"created_at":"2015-01-01T01:06:38Z"}
{"id":"2489398659","type":"PushEvent","actor":{"id":1588951,"login":"TAGC","gravatar_id":"","url":"https://api.github.com/users/TAGC","avatar_url":"https://avatars.githubusercontent.com/u/1588951?"},"repo":{"id":28516105,"name":"TAGC/Semver","url":"https://api.github.com/repos/TAGC/Semver"},"payload":{"push_id":536753456,"size":6,"distinct_size":6,"ref":"refs/heads/develop","head":"9bc9f01848ee531b14b2ba1faefbd1f58fc105fc","before":"c14bd6aeef1be553879694e2c3ba8535749f5380","commits":[{"sha":"1dfd6b42e9c69b76f8953e87f09b28bcdfb523f2","author":{"email":"ff51050dd5988c994d7cae2035c2292721cc7625@gmail.com","name":"David"},"message":"Configured cobertura","distinct":true,"url":"https://api.github.com/repos/TAGC/Semver/commits/1dfd6b42e9c69b76f8953e87f09b28bcdfb523f2"},{"sha":"f90418a9a618f5d7ff8781046a920fb892b2bbf8","author":{"email":"ff51050dd5988c994d7cae2035c2292721cc7625@gmail.com","name":"David"},"message":"Configure codenarc","distinct":true,"url":"https://api.github.com/repos/TAGC/Semver/commits/f90418a9a618f5d7ff8781046a920fb892b2bbf8"},{"sha":"227c645edb028aa30e09a80f40febcdb6d872e31","author":{"email":"ff51050dd5988c994d7cae2035c2292721cc7625@gmail.com","name":"David"},"message":"Additional codenarc configuration","distinct":true,"url":"https://api.github.com/repos/TAGC/Semver/commits/227c645edb028aa30e09a80f40febcdb6d872e31"},{"sha":"50c650626bb7df42b8bb388bff84abaf0efd6b1d","author":{"email":"ff51050dd5988c994d7cae2035c2292721cc7625@gmail.com","name":"David"},"message":"Additional configuration in build script","distinct":true,"url":"https://api.github.com/repos/TAGC/Semver/commits/50c650626bb7df42b8bb388bff84abaf0efd6b1d"},{"sha":"8c50d4f13932c7ccf3a78fa2fc7b9db5395bc809","author":{"email":"ff51050dd5988c994d7cae2035c2292721cc7625@gmail.com","name":"David"},"message":"Merge branch 'feature/configure/codenarc' into 
develop","distinct":true,"url":"https://api.github.com/repos/TAGC/Semver/commits/8c50d4f13932c7ccf3a78fa2fc7b9db5395bc809"},{"sha":"9bc9f01848ee531b14b2ba1faefbd1f58fc105fc","author":{"email":"ff51050dd5988c994d7cae2035c2292721cc7625@gmail.com","name":"David"},"message":"Merge branch 'develop' of https://github.com/TAGC/Semver into develop","distinct":true,"url":"https://api.github.com/repos/TAGC/Semver/commits/9bc9f01848ee531b14b2ba1faefbd1f58fc105fc"}]},"public":true,"created_at":"2015-01-01T01:06:39Z"}
{"id":"2489398660","type":"PushEvent","actor":{"id":1580785,"login":"gmilligan","gravatar_id":"","url":"https://api.github.com/users/gmilligan","avatar_url":"https://avatars.githubusercontent.com/u/1580785?"},"repo":{"id":28199368,"name":"gmilligan/gmilligan.github.io","url":"https://api.github.com/repos/gmilligan/gmilligan.github.io"},"payload":{"push_id":536753457,"size":5,"distinct_size":5,"ref":"refs/heads/development","head":"2424cedc72a4b31e9feb52fb0c73c610b29f255b","before":"d11816d799c6a50f019dd22eaf9852ac2a80e2cb","commits":[{"sha":"099396797049f59a65b1c67089a9bd9809d9257c","author":{"email":"b4b508b1a3018069c698b5419b143ce95eea496c@gmail.com","name":"Greg Milligan"},"message":"lint and DI fixes for production build","distinct":true,"url":"https://api.github.com/repos/gmilligan/gmilligan.github.io/commits/099396797049f59a65b1c67089a9bd9809d9257c"},{"sha":"e5e753c4280c77241f6935193df429d89db25872","author":{"email":"b4b508b1a3018069c698b5419b143ce95eea496c@gmail.com","name":"Greg Milligan"},"message":"less to css changes","distinct":true,"url":"https://api.github.com/repos/gmilligan/gmilligan.github.io/commits/e5e753c4280c77241f6935193df429d89db25872"},{"sha":"da058848e25979191312fbd394572403990ffb8d","author":{"email":"b4b508b1a3018069c698b5419b143ce95eea496c@gmail.com","name":"Greg Milligan"},"message":"add Gulp production automation","distinct":true,"url":"https://api.github.com/repos/gmilligan/gmilligan.github.io/commits/da058848e25979191312fbd394572403990ffb8d"},{"sha":"d9c959104e576ab4ef20c92c468c8d0b513b9f52","author":{"email":"b4b508b1a3018069c698b5419b143ce95eea496c@gmail.com","name":"Greg Milligan"},"message":"gulp automation edits","distinct":true,"url":"https://api.github.com/repos/gmilligan/gmilligan.github.io/commits/d9c959104e576ab4ef20c92c468c8d0b513b9f52"},{"sha":"2424cedc72a4b31e9feb52fb0c73c610b29f255b","author":{"email":"b4b508b1a3018069c698b5419b143ce95eea496c@gmail.com","name":"Greg Milligan"},"message":"remove mdeium sized 
images","distinct":true,"url":"https://api.github.com/repos/gmilligan/gmilligan.github.io/commits/2424cedc72a4b31e9feb52fb0c73c610b29f255b"}]},"public":true,"created_at":"2015-01-01T01:06:39Z"}
{"id":"2489398661","type":"PushEvent","actor":{"id":2209144,"login":"bwbaugh","gravatar_id":"","url":"https://api.github.com/users/bwbaugh","avatar_url":"https://avatars.githubusercontent.com/u/2209144?"},"repo":{"id":28676842,"name":"bwbaugh/dotfiles","url":"https://api.github.com/repos/bwbaugh/dotfiles"},"payload":{"push_id":536753458,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"006ae1000b628dfbc2e7b57fc44486c10236512e","before":"24dd5a64192f7855318b0d050f8e1954f9a603e9","commits":[{"sha":"006ae1000b628dfbc2e7b57fc44486c10236512e","author":{"email":"564269323e6a7fccff1f236f3209e6b63492d40b","name":"Wesley Baugh"},"message":"Add path for macports","distinct":true,"url":"https://api.github.com/repos/bwbaugh/dotfiles/commits/006ae1000b628dfbc2e7b57fc44486c10236512e"}]},"public":true,"created_at":"2015-01-01T01:06:39Z"}
{"id":"2489398664","type":"PushEvent","actor":{"id":7122850,"login":"sararibeiro","gravatar_id":"","url":"https://api.github.com/users/sararibeiro","avatar_url":"https://avatars.githubusercontent.com/u/7122850?"},"repo":{"id":21713999,"name":"sararibeiro/gtg","url":"https://api.github.com/repos/sararibeiro/gtg"},"payload":{"push_id":536753459,"size":1,"distinct_size":1,"ref":"refs/heads/calendar-plugin","head":"95cdec6034a10610bbe827b43689a5ed0f9dfb6e","before":"b1a0be746888e62c067e26df65f8ab0c0bfe7add","commits":[{"sha":"95cdec6034a10610bbe827b43689a5ed0f9dfb6e","author":{"email":"f90fb4f31eb6dfae57fef64f6d1adbd053837f59@gmail.com","name":"Sara Ribeiro"},"message":"Fixing issues pointed by Izidor's code review.\n* Removed FIXME that were left on the code.\n* Added copyright to all the files.\n* Fixed small bug that happened when transitioning from December 31st to\n  January.\n* Listed calendar view as an available plugin on userdocs.","distinct":true,"url":"https://api.github.com/repos/sararibeiro/gtg/commits/95cdec6034a10610bbe827b43689a5ed0f9dfb6e"}]},"public":true,"created_at":"2015-01-01T01:06:40Z"}
{"id":"2489398668","type":"IssueCommentEvent","actor":{"id":99834,"login":"FCO","gravatar_id":"","url":"https://api.github.com/users/FCO","avatar_url":"https://avatars.githubusercontent.com/u/99834?"},"repo":{"id":26700916,"name":"FCO/Dispatcher","url":"https://api.github.com/repos/FCO/Dispatcher"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/FCO/Dispatcher/issues/19","labels_url":"https://api.github.com/repos/FCO/Dispatcher/issues/19/labels{/name}","comments_url":"https://api.github.com/repos/FCO/Dispatcher/issues/19/comments","events_url":"https://api.github.com/repos/FCO/Dispatcher/issues/19/events","html_url":"https://github.com/FCO/Dispatcher/issues/19","id":52033743,"number":19,"title":"cookie","user":{"login":"FCO","id":99834,"avatar_url":"https://avatars.githubusercontent.com/u/99834?v=3","gravatar_id":"","url":"https://api.github.com/users/FCO","html_url":"https://github.com/FCO","followers_url":"https://api.github.com/users/FCO/followers","following_url":"https://api.github.com/users/FCO/following{/other_user}","gists_url":"https://api.github.com/users/FCO/gists{/gist_id}","starred_url":"https://api.github.com/users/FCO/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/FCO/subscriptions","organizations_url":"https://api.github.com/users/FCO/orgs","repos_url":"https://api.github.com/users/FCO/repos","events_url":"https://api.github.com/users/FCO/events{/privacy}","received_events_url":"https://api.github.com/users/FCO/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":{"login":"FCO","id":99834,"avatar_url":"https://avatars.githubusercontent.com/u/99834?v=3","gravatar_id":"","url":"https://api.github.com/users/FCO","html_url":"https://github.com/FCO","followers_url":"https://api.github.com/users/FCO/followers","following_url":"https://api.github.com/users/FCO/following{/other_user}","gists_url":"https://api.github.com/users/FCO/gists{/gist_id}","starr
ed_url":"https://api.github.com/users/FCO/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/FCO/subscriptions","organizations_url":"https://api.github.com/users/FCO/orgs","repos_url":"https://api.github.com/users/FCO/repos","events_url":"https://api.github.com/users/FCO/events{/privacy}","received_events_url":"https://api.github.com/users/FCO/received_events","type":"User","site_admin":false},"milestone":null,"comments":1,"created_at":"2014-12-15T20:21:40Z","updated_at":"2015-01-01T01:06:41Z","closed_at":"2015-01-01T01:06:41Z","body":""},"comment":{"url":"https://api.github.com/repos/FCO/Dispatcher/issues/comments/68477365","html_url":"https://github.com/FCO/Dispatcher/issues/19#issuecomment-68477365","issue_url":"https://api.github.com/repos/FCO/Dispatcher/issues/19","id":68477365,"user":{"login":"FCO","id":99834,"avatar_url":"https://avatars.githubusercontent.com/u/99834?v=3","gravatar_id":"","url":"https://api.github.com/users/FCO","html_url":"https://github.com/FCO","followers_url":"https://api.github.com/users/FCO/followers","following_url":"https://api.github.com/users/FCO/following{/other_user}","gists_url":"https://api.github.com/users/FCO/gists{/gist_id}","starred_url":"https://api.github.com/users/FCO/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/FCO/subscriptions","organizations_url":"https://api.github.com/users/FCO/orgs","repos_url":"https://api.github.com/users/FCO/repos","events_url":"https://api.github.com/users/FCO/events{/privacy}","received_events_url":"https://api.github.com/users/FCO/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:40Z","updated_at":"2015-01-01T01:06:40Z","body":"Not done"}},"public":true,"created_at":"2015-01-01T01:06:43Z"}
{"id":"2489398669","type":"IssuesEvent","actor":{"id":99834,"login":"FCO","gravatar_id":"","url":"https://api.github.com/users/FCO","avatar_url":"https://avatars.githubusercontent.com/u/99834?"},"repo":{"id":26700916,"name":"FCO/Dispatcher","url":"https://api.github.com/repos/FCO/Dispatcher"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/FCO/Dispatcher/issues/19","labels_url":"https://api.github.com/repos/FCO/Dispatcher/issues/19/labels{/name}","comments_url":"https://api.github.com/repos/FCO/Dispatcher/issues/19/comments","events_url":"https://api.github.com/repos/FCO/Dispatcher/issues/19/events","html_url":"https://github.com/FCO/Dispatcher/issues/19","id":52033743,"number":19,"title":"cookie","user":{"login":"FCO","id":99834,"avatar_url":"https://avatars.githubusercontent.com/u/99834?v=3","gravatar_id":"","url":"https://api.github.com/users/FCO","html_url":"https://github.com/FCO","followers_url":"https://api.github.com/users/FCO/followers","following_url":"https://api.github.com/users/FCO/following{/other_user}","gists_url":"https://api.github.com/users/FCO/gists{/gist_id}","starred_url":"https://api.github.com/users/FCO/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/FCO/subscriptions","organizations_url":"https://api.github.com/users/FCO/orgs","repos_url":"https://api.github.com/users/FCO/repos","events_url":"https://api.github.com/users/FCO/events{/privacy}","received_events_url":"https://api.github.com/users/FCO/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":{"login":"FCO","id":99834,"avatar_url":"https://avatars.githubusercontent.com/u/99834?v=3","gravatar_id":"","url":"https://api.github.com/users/FCO","html_url":"https://github.com/FCO","followers_url":"https://api.github.com/users/FCO/followers","following_url":"https://api.github.com/users/FCO/following{/other_user}","gists_url":"https://api.github.com/users/FCO/gists{/gist_id}","starred_url"
:"https://api.github.com/users/FCO/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/FCO/subscriptions","organizations_url":"https://api.github.com/users/FCO/orgs","repos_url":"https://api.github.com/users/FCO/repos","events_url":"https://api.github.com/users/FCO/events{/privacy}","received_events_url":"https://api.github.com/users/FCO/received_events","type":"User","site_admin":false},"milestone":null,"comments":1,"created_at":"2014-12-15T20:21:40Z","updated_at":"2015-01-01T01:06:41Z","closed_at":"2015-01-01T01:06:41Z","body":""}},"public":true,"created_at":"2015-01-01T01:06:43Z"}
{"id":"2489398672","type":"ForkEvent","actor":{"id":7151313,"login":"theTechnoKid","gravatar_id":"","url":"https://api.github.com/users/theTechnoKid","avatar_url":"https://avatars.githubusercontent.com/u/7151313?"},"repo":{"id":11571950,"name":"spywhere/Monopoly","url":"https://api.github.com/repos/spywhere/Monopoly"},"payload":{"forkee":{"id":28678282,"name":"Monopoly","full_name":"theTechnoKid/Monopoly","owner":{"login":"theTechnoKid","id":7151313,"avatar_url":"https://avatars.githubusercontent.com/u/7151313?v=3","gravatar_id":"","url":"https://api.github.com/users/theTechnoKid","html_url":"https://github.com/theTechnoKid","followers_url":"https://api.github.com/users/theTechnoKid/followers","following_url":"https://api.github.com/users/theTechnoKid/following{/other_user}","gists_url":"https://api.github.com/users/theTechnoKid/gists{/gist_id}","starred_url":"https://api.github.com/users/theTechnoKid/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/theTechnoKid/subscriptions","organizations_url":"https://api.github.com/users/theTechnoKid/orgs","repos_url":"https://api.github.com/users/theTechnoKid/repos","events_url":"https://api.github.com/users/theTechnoKid/events{/privacy}","received_events_url":"https://api.github.com/users/theTechnoKid/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/theTechnoKid/Monopoly","description":"Project for Object-Oriented 
Computing","fork":true,"url":"https://api.github.com/repos/theTechnoKid/Monopoly","forks_url":"https://api.github.com/repos/theTechnoKid/Monopoly/forks","keys_url":"https://api.github.com/repos/theTechnoKid/Monopoly/keys{/key_id}","collaborators_url":"https://api.github.com/repos/theTechnoKid/Monopoly/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/theTechnoKid/Monopoly/teams","hooks_url":"https://api.github.com/repos/theTechnoKid/Monopoly/hooks","issue_events_url":"https://api.github.com/repos/theTechnoKid/Monopoly/issues/events{/number}","events_url":"https://api.github.com/repos/theTechnoKid/Monopoly/events","assignees_url":"https://api.github.com/repos/theTechnoKid/Monopoly/assignees{/user}","branches_url":"https://api.github.com/repos/theTechnoKid/Monopoly/branches{/branch}","tags_url":"https://api.github.com/repos/theTechnoKid/Monopoly/tags","blobs_url":"https://api.github.com/repos/theTechnoKid/Monopoly/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/theTechnoKid/Monopoly/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/theTechnoKid/Monopoly/git/refs{/sha}","trees_url":"https://api.github.com/repos/theTechnoKid/Monopoly/git/trees{/sha}","statuses_url":"https://api.github.com/repos/theTechnoKid/Monopoly/statuses/{sha}","languages_url":"https://api.github.com/repos/theTechnoKid/Monopoly/languages","stargazers_url":"https://api.github.com/repos/theTechnoKid/Monopoly/stargazers","contributors_url":"https://api.github.com/repos/theTechnoKid/Monopoly/contributors","subscribers_url":"https://api.github.com/repos/theTechnoKid/Monopoly/subscribers","subscription_url":"https://api.github.com/repos/theTechnoKid/Monopoly/subscription","commits_url":"https://api.github.com/repos/theTechnoKid/Monopoly/commits{/sha}","git_commits_url":"https://api.github.com/repos/theTechnoKid/Monopoly/git/commits{/sha}","comments_url":"https://api.github.com/repos/theTechnoKid/Monopoly/comments{/number}","issue_comment_url":"https://api.git
hub.com/repos/theTechnoKid/Monopoly/issues/comments/{number}","contents_url":"https://api.github.com/repos/theTechnoKid/Monopoly/contents/{+path}","compare_url":"https://api.github.com/repos/theTechnoKid/Monopoly/compare/{base}...{head}","merges_url":"https://api.github.com/repos/theTechnoKid/Monopoly/merges","archive_url":"https://api.github.com/repos/theTechnoKid/Monopoly/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/theTechnoKid/Monopoly/downloads","issues_url":"https://api.github.com/repos/theTechnoKid/Monopoly/issues{/number}","pulls_url":"https://api.github.com/repos/theTechnoKid/Monopoly/pulls{/number}","milestones_url":"https://api.github.com/repos/theTechnoKid/Monopoly/milestones{/number}","notifications_url":"https://api.github.com/repos/theTechnoKid/Monopoly/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/theTechnoKid/Monopoly/labels{/name}","releases_url":"https://api.github.com/repos/theTechnoKid/Monopoly/releases{/id}","created_at":"2015-01-01T01:06:41Z","updated_at":"2013-10-15T12:29:53Z","pushed_at":"2013-07-22T08:34:18Z","git_url":"git://github.com/theTechnoKid/Monopoly.git","ssh_url":"git@github.com:theTechnoKid/Monopoly.git","clone_url":"https://github.com/theTechnoKid/Monopoly.git","svn_url":"https://github.com/theTechnoKid/Monopoly","homepage":null,"size":564,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:06:43Z"}
{"id":"2489398676","type":"CreateEvent","actor":{"id":1734986,"login":"Adamwgoh","gravatar_id":"","url":"https://api.github.com/users/Adamwgoh","avatar_url":"https://avatars.githubusercontent.com/u/1734986?"},"repo":{"id":28678222,"name":"Adamwgoh/Laura","url":"https://api.github.com/repos/Adamwgoh/Laura"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"G52GRP re-upload","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:06:43Z"}
{"id":"2489398678","type":"PushEvent","actor":{"id":3794984,"login":"abustamam","gravatar_id":"","url":"https://api.github.com/users/abustamam","avatar_url":"https://avatars.githubusercontent.com/u/3794984?"},"repo":{"id":25110710,"name":"abustamam/Udacity-Portfolio","url":"https://api.github.com/repos/abustamam/Udacity-Portfolio"},"payload":{"push_id":536753462,"size":4,"distinct_size":0,"ref":"refs/heads/gh-pages","head":"5776bf9082fbc389cc986d9159e7367cc2fcdf20","before":"781f999ab1214e4ca396fe3bdb7721ec5e81d208","commits":[{"sha":"585271ef771aad13ac3cdc7ba5aeb766e843e972","author":{"email":"1f8e819f7c9fbaadfc4b5b78cc4be161892e8692@gmail.com","name":"Rasheed Bustamam"},"message":"Resize photos, change cover image","distinct":false,"url":"https://api.github.com/repos/abustamam/Udacity-Portfolio/commits/585271ef771aad13ac3cdc7ba5aeb766e843e972"},{"sha":"b39e5ac9096f3ddcc10a485bd9df8dbedcfda5ef","author":{"email":"1f8e819f7c9fbaadfc4b5b78cc4be161892e8692@gmail.com","name":"Rasheed Bustamam"},"message":"Update README.md","distinct":false,"url":"https://api.github.com/repos/abustamam/Udacity-Portfolio/commits/b39e5ac9096f3ddcc10a485bd9df8dbedcfda5ef"},{"sha":"e323ac3bd7451b41388d083ec83e1dc3a4d94022","author":{"email":"1f8e819f7c9fbaadfc4b5b78cc4be161892e8692@gmail.com","name":"Rasheed Bustamam"},"message":"Change project 1 img","distinct":false,"url":"https://api.github.com/repos/abustamam/Udacity-Portfolio/commits/e323ac3bd7451b41388d083ec83e1dc3a4d94022"},{"sha":"5776bf9082fbc389cc986d9159e7367cc2fcdf20","author":{"email":"1f8e819f7c9fbaadfc4b5b78cc4be161892e8692@gmail.com","name":"Rasheed Bustamam"},"message":"Merge branch 'master' of github.com:abustamam/Udacity-Portfolio\n\nPull readme","distinct":false,"url":"https://api.github.com/repos/abustamam/Udacity-Portfolio/commits/5776bf9082fbc389cc986d9159e7367cc2fcdf20"}]},"public":true,"created_at":"2015-01-01T01:06:43Z"}
{"id":"2489398680","type":"PushEvent","actor":{"id":7275188,"login":"mxcapo","gravatar_id":"","url":"https://api.github.com/users/mxcapo","avatar_url":"https://avatars.githubusercontent.com/u/7275188?"},"repo":{"id":27788033,"name":"mxcapo/mxcapo.github.io","url":"https://api.github.com/repos/mxcapo/mxcapo.github.io"},"payload":{"push_id":536753464,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"14c4f783a8d62d81b30c3268deca41ae4d4f1133","before":"8dc39e5aa797d7f340d56ba94bc51e83374fc90a","commits":[{"sha":"14c4f783a8d62d81b30c3268deca41ae4d4f1133","author":{"email":"a7f48bd5c86f435aba4630eb6fad8b467d5719b5@gmail.com","name":"mxcapo"},"message":"tweak","distinct":true,"url":"https://api.github.com/repos/mxcapo/mxcapo.github.io/commits/14c4f783a8d62d81b30c3268deca41ae4d4f1133"}]},"public":true,"created_at":"2015-01-01T01:06:43Z"}
{"id":"2489398681","type":"PushEvent","actor":{"id":676533,"login":"501st-alpha1","gravatar_id":"","url":"https://api.github.com/users/501st-alpha1","avatar_url":"https://avatars.githubusercontent.com/u/676533?"},"repo":{"id":15497204,"name":"501st-alpha1/emacs-init","url":"https://api.github.com/repos/501st-alpha1/emacs-init"},"payload":{"push_id":536753465,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"a56556f9b33872e0ed4aca1fdf773e24215afdd3","before":"8ac7f1e49e1a9b29f4243b3c126aab766ff7d95c","commits":[{"sha":"a56556f9b33872e0ed4aca1fdf773e24215afdd3","author":{"email":"625600233cb3bcab32268c17610882e0fdaed295@scott-weldon.com","name":"Scott Weldon"},"message":"Allow setting auto-revert-mode in .dir-locals.el","distinct":true,"url":"https://api.github.com/repos/501st-alpha1/emacs-init/commits/a56556f9b33872e0ed4aca1fdf773e24215afdd3"}]},"public":true,"created_at":"2015-01-01T01:06:43Z"}
{"id":"2489398683","type":"PushEvent","actor":{"id":76367,"login":"md5","gravatar_id":"","url":"https://api.github.com/users/md5","avatar_url":"https://avatars.githubusercontent.com/u/76367?"},"repo":{"id":28625804,"name":"astrifex/astrifex","url":"https://api.github.com/repos/astrifex/astrifex"},"payload":{"push_id":536753466,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1aadb40fa78ff80d4e60a403d2819af18fd1d119","before":"ddb58acdb8e1ed67dbcbe45d76fee55d09a29577","commits":[{"sha":"1aadb40fa78ff80d4e60a403d2819af18fd1d119","author":{"email":"a17fed27eaa842282862ff7c1b9c8395a26ac320@embody.org","name":"Mike Dillon"},"message":"Add size","distinct":true,"url":"https://api.github.com/repos/astrifex/astrifex/commits/1aadb40fa78ff80d4e60a403d2819af18fd1d119"}]},"public":true,"created_at":"2015-01-01T01:06:43Z","org":{"id":10359906,"login":"astrifex","gravatar_id":"","url":"https://api.github.com/orgs/astrifex","avatar_url":"https://avatars.githubusercontent.com/u/10359906?"}}
{"id":"2489398684","type":"PushEvent","actor":{"id":1785816,"login":"natashavlahakis","gravatar_id":"","url":"https://api.github.com/users/natashavlahakis","avatar_url":"https://avatars.githubusercontent.com/u/1785816?"},"repo":{"id":27246389,"name":"natashavlahakis/figtree","url":"https://api.github.com/repos/natashavlahakis/figtree"},"payload":{"push_id":536753467,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"9791f481f66b12d027b824e5d13771451e1ad28a","before":"03e086487f01d5fff1574e9906ad4a4e06082211","commits":[{"sha":"9791f481f66b12d027b824e5d13771451e1ad28a","author":{"email":"84a888d1cdc9202fb22178d441aabd7da0eefd07@gmail.com","name":"Natasha Vlahakis"},"message":"added row","distinct":true,"url":"https://api.github.com/repos/natashavlahakis/figtree/commits/9791f481f66b12d027b824e5d13771451e1ad28a"}]},"public":true,"created_at":"2015-01-01T01:06:43Z"}
{"id":"2489398685","type":"PushEvent","actor":{"id":166301,"login":"bcomnes","gravatar_id":"","url":"https://api.github.com/users/bcomnes","avatar_url":"https://avatars.githubusercontent.com/u/166301?"},"repo":{"id":6861308,"name":"bcomnes/bcomnes.github.io","url":"https://api.github.com/repos/bcomnes/bcomnes.github.io"},"payload":{"push_id":536753468,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f75503acf7e511ce91c18a99ce1042cc2e1e650b","before":"821968b470015bf7a6d5f86aeea8d739dd1aadbe","commits":[{"sha":"f75503acf7e511ce91c18a99ce1042cc2e1e650b","author":{"email":"6df4fba95631fe4f4c4337307cda4e0fc4c27d16@gmail.com","name":"Bret Comnes"},"message":"Update 2015-01-01-shell-art.md","distinct":true,"url":"https://api.github.com/repos/bcomnes/bcomnes.github.io/commits/f75503acf7e511ce91c18a99ce1042cc2e1e650b"}]},"public":true,"created_at":"2015-01-01T01:06:43Z"}
{"id":"2489398686","type":"ForkEvent","actor":{"id":880050,"login":"kazutomi","gravatar_id":"","url":"https://api.github.com/users/kazutomi","avatar_url":"https://avatars.githubusercontent.com/u/880050?"},"repo":{"id":115341,"name":"alexvollmer/daemon-spawn","url":"https://api.github.com/repos/alexvollmer/daemon-spawn"},"payload":{"forkee":{"id":28678283,"name":"daemon-spawn","full_name":"kazutomi/daemon-spawn","owner":{"login":"kazutomi","id":880050,"avatar_url":"https://avatars.githubusercontent.com/u/880050?v=3","gravatar_id":"","url":"https://api.github.com/users/kazutomi","html_url":"https://github.com/kazutomi","followers_url":"https://api.github.com/users/kazutomi/followers","following_url":"https://api.github.com/users/kazutomi/following{/other_user}","gists_url":"https://api.github.com/users/kazutomi/gists{/gist_id}","starred_url":"https://api.github.com/users/kazutomi/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/kazutomi/subscriptions","organizations_url":"https://api.github.com/users/kazutomi/orgs","repos_url":"https://api.github.com/users/kazutomi/repos","events_url":"https://api.github.com/users/kazutomi/events{/privacy}","received_events_url":"https://api.github.com/users/kazutomi/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/kazutomi/daemon-spawn","description":"A simple, flexible daemon management 
library.","fork":true,"url":"https://api.github.com/repos/kazutomi/daemon-spawn","forks_url":"https://api.github.com/repos/kazutomi/daemon-spawn/forks","keys_url":"https://api.github.com/repos/kazutomi/daemon-spawn/keys{/key_id}","collaborators_url":"https://api.github.com/repos/kazutomi/daemon-spawn/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/kazutomi/daemon-spawn/teams","hooks_url":"https://api.github.com/repos/kazutomi/daemon-spawn/hooks","issue_events_url":"https://api.github.com/repos/kazutomi/daemon-spawn/issues/events{/number}","events_url":"https://api.github.com/repos/kazutomi/daemon-spawn/events","assignees_url":"https://api.github.com/repos/kazutomi/daemon-spawn/assignees{/user}","branches_url":"https://api.github.com/repos/kazutomi/daemon-spawn/branches{/branch}","tags_url":"https://api.github.com/repos/kazutomi/daemon-spawn/tags","blobs_url":"https://api.github.com/repos/kazutomi/daemon-spawn/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/kazutomi/daemon-spawn/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/kazutomi/daemon-spawn/git/refs{/sha}","trees_url":"https://api.github.com/repos/kazutomi/daemon-spawn/git/trees{/sha}","statuses_url":"https://api.github.com/repos/kazutomi/daemon-spawn/statuses/{sha}","languages_url":"https://api.github.com/repos/kazutomi/daemon-spawn/languages","stargazers_url":"https://api.github.com/repos/kazutomi/daemon-spawn/stargazers","contributors_url":"https://api.github.com/repos/kazutomi/daemon-spawn/contributors","subscribers_url":"https://api.github.com/repos/kazutomi/daemon-spawn/subscribers","subscription_url":"https://api.github.com/repos/kazutomi/daemon-spawn/subscription","commits_url":"https://api.github.com/repos/kazutomi/daemon-spawn/commits{/sha}","git_commits_url":"https://api.github.com/repos/kazutomi/daemon-spawn/git/commits{/sha}","comments_url":"https://api.github.com/repos/kazutomi/daemon-spawn/comments{/number}","issue_comment_url":"https://api.gith
ub.com/repos/kazutomi/daemon-spawn/issues/comments/{number}","contents_url":"https://api.github.com/repos/kazutomi/daemon-spawn/contents/{+path}","compare_url":"https://api.github.com/repos/kazutomi/daemon-spawn/compare/{base}...{head}","merges_url":"https://api.github.com/repos/kazutomi/daemon-spawn/merges","archive_url":"https://api.github.com/repos/kazutomi/daemon-spawn/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/kazutomi/daemon-spawn/downloads","issues_url":"https://api.github.com/repos/kazutomi/daemon-spawn/issues{/number}","pulls_url":"https://api.github.com/repos/kazutomi/daemon-spawn/pulls{/number}","milestones_url":"https://api.github.com/repos/kazutomi/daemon-spawn/milestones{/number}","notifications_url":"https://api.github.com/repos/kazutomi/daemon-spawn/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/kazutomi/daemon-spawn/labels{/name}","releases_url":"https://api.github.com/repos/kazutomi/daemon-spawn/releases{/id}","created_at":"2015-01-01T01:06:43Z","updated_at":"2014-12-29T02:27:27Z","pushed_at":"2012-11-21T17:14:36Z","git_url":"git://github.com/kazutomi/daemon-spawn.git","ssh_url":"git@github.com:kazutomi/daemon-spawn.git","clone_url":"https://github.com/kazutomi/daemon-spawn.git","svn_url":"https://github.com/kazutomi/daemon-spawn","homepage":"http://www.evri.com","size":155,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master","public":true}},"public":true,"created_at":"2015-01-01T01:06:43Z"}
{"id":"2489398687","type":"PushEvent","actor":{"id":5090808,"login":"iderioja","gravatar_id":"","url":"https://api.github.com/users/iderioja","avatar_url":"https://avatars.githubusercontent.com/u/5090808?"},"repo":{"id":16545715,"name":"iderioja/base_datos_geografica","url":"https://api.github.com/repos/iderioja/base_datos_geografica"},"payload":{"push_id":536753469,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"101f98a1fb0221d38c432fe06e223ea3c08926fb","before":"0f5909f48c0a61d3151203b4662ed2d0c34a9b5d","commits":[{"sha":"101f98a1fb0221d38c432fe06e223ea3c08926fb","author":{"email":"0c9edb4bafa26e2cc6fb9112520016fa2774e8ce@wamba.larioja.org","name":"fmeserver"},"message":"Actualización geoJSON desde tablas Oracle con FME. 20150101020635","distinct":true,"url":"https://api.github.com/repos/iderioja/base_datos_geografica/commits/101f98a1fb0221d38c432fe06e223ea3c08926fb"}]},"public":true,"created_at":"2015-01-01T01:06:43Z"}
{"id":"2489398689","type":"PushEvent","actor":{"id":380021,"login":"wolf31o2","gravatar_id":"","url":"https://api.github.com/users/wolf31o2","avatar_url":"https://avatars.githubusercontent.com/u/380021?"},"repo":{"id":17919097,"name":"caskdata/coopr","url":"https://api.github.com/repos/caskdata/coopr"},"payload":{"push_id":536753471,"size":1,"distinct_size":1,"ref":"refs/heads/feature/dockerfile","head":"026cc002d2379d68209f00d609d56448e66bcb15","before":"3b77a6638a992f0b8f605aab3d44ce9987b78741","commits":[{"sha":"026cc002d2379d68209f00d609d56448e66bcb15","author":{"email":"711c73f64afdce07b7e38039a96d2224209e9a6c@cask.co","name":"Chris Gianelloni"},"message":"Do not use localhost for any externally-exposed ports","distinct":true,"url":"https://api.github.com/repos/caskdata/coopr/commits/026cc002d2379d68209f00d609d56448e66bcb15"}]},"public":true,"created_at":"2015-01-01T01:06:43Z","org":{"id":8123023,"login":"caskdata","gravatar_id":"","url":"https://api.github.com/orgs/caskdata","avatar_url":"https://avatars.githubusercontent.com/u/8123023?"}}
{"id":"2489398690","type":"PushEvent","actor":{"id":960411,"login":"fauxfiction","gravatar_id":"","url":"https://api.github.com/users/fauxfiction","avatar_url":"https://avatars.githubusercontent.com/u/960411?"},"repo":{"id":28618969,"name":"fauxfiction/Sick-Beard","url":"https://api.github.com/repos/fauxfiction/Sick-Beard"},"payload":{"push_id":536753472,"size":1,"distinct_size":1,"ref":"refs/heads/fix-newznab-response-xpath","head":"5f6888811bcc778c8832b4d77f05d047013c38ba","before":"69817a46a431c25adc66c236fca351e3d904b389","commits":[{"sha":"5f6888811bcc778c8832b4d77f05d047013c38ba","author":{"email":"64b2b6d12bfe4baae7dad3d018f8cbf6b0e7a044@fauxfiction.com","name":"fauxfiction"},"message":"Iterate over XML etree nodes in newznab provider\n\nInstead of using XPath queries which are not supported prior to Python\n2.7, grab an iterator to collect nodes of interest.","distinct":true,"url":"https://api.github.com/repos/fauxfiction/Sick-Beard/commits/5f6888811bcc778c8832b4d77f05d047013c38ba"}]},"public":true,"created_at":"2015-01-01T01:06:43Z"}
{"id":"2489398696","type":"WatchEvent","actor":{"id":1170642,"login":"niofis","gravatar_id":"","url":"https://api.github.com/users/niofis","avatar_url":"https://avatars.githubusercontent.com/u/1170642?"},"repo":{"id":11541598,"name":"hermanhermitage/videocoreiv-qpu","url":"https://api.github.com/repos/hermanhermitage/videocoreiv-qpu"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:06:44Z"}
{"id":"2489398698","type":"PushEvent","actor":{"id":1515006,"login":"LordPsychoMaster","gravatar_id":"","url":"https://api.github.com/users/LordPsychoMaster","avatar_url":"https://avatars.githubusercontent.com/u/1515006?"},"repo":{"id":28061377,"name":"LordPsychoMaster/SchitEngine","url":"https://api.github.com/repos/LordPsychoMaster/SchitEngine"},"payload":{"push_id":536753473,"size":3,"distinct_size":3,"ref":"refs/heads/master","head":"54d4858b59afff9fd288692a97b22ed45cdbe7bc","before":"8c90925c3d2e0d6fb7d96e29ff671667232ba26f","commits":[{"sha":"4c64252c67e7b0ec6728c68e273a7e4226673750","author":{"email":"52153f19f64cb8f0c20cf48997f6dcb5cc4cb401@gmail.com","name":"Jonathan Jao"},"message":"cleacleaned up directory","distinct":true,"url":"https://api.github.com/repos/LordPsychoMaster/SchitEngine/commits/4c64252c67e7b0ec6728c68e273a7e4226673750"},{"sha":"8bca8506bac64aa2036237cb31447883f00d8249","author":{"email":"52153f19f64cb8f0c20cf48997f6dcb5cc4cb401@gmail.com","name":"Jonathan Jao"},"message":"Back and Forth Sockets handshake done","distinct":true,"url":"https://api.github.com/repos/LordPsychoMaster/SchitEngine/commits/8bca8506bac64aa2036237cb31447883f00d8249"},{"sha":"54d4858b59afff9fd288692a97b22ed45cdbe7bc","author":{"email":"52153f19f64cb8f0c20cf48997f6dcb5cc4cb401@gmail.com","name":"Jonathan Jao"},"message":"test","distinct":true,"url":"https://api.github.com/repos/LordPsychoMaster/SchitEngine/commits/54d4858b59afff9fd288692a97b22ed45cdbe7bc"}]},"public":true,"created_at":"2015-01-01T01:06:44Z"}
{"id":"2489398699","type":"PushEvent","actor":{"id":10349906,"login":"noobfish","gravatar_id":"","url":"https://api.github.com/users/noobfish","avatar_url":"https://avatars.githubusercontent.com/u/10349906?"},"repo":{"id":28634881,"name":"noobfish/simple","url":"https://api.github.com/repos/noobfish/simple"},"payload":{"push_id":536753474,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"fb2725e3511b36d1762f388e4a38d43c46d3a3fd","before":"b4ed23be12698cdc458884d79f406d551330b2d1","commits":[{"sha":"fb2725e3511b36d1762f388e4a38d43c46d3a3fd","author":{"email":"f4576d39c25ca3a0435d50421190b319ce2c2dd7@users.noreply.github.com","name":"noobfish"},"message":"Update main.json","distinct":true,"url":"https://api.github.com/repos/noobfish/simple/commits/fb2725e3511b36d1762f388e4a38d43c46d3a3fd"}]},"public":true,"created_at":"2015-01-01T01:06:44Z"}
{"id":"2489398700","type":"WatchEvent","actor":{"id":6190487,"login":"Tommy-Geenexus","gravatar_id":"","url":"https://api.github.com/users/Tommy-Geenexus","avatar_url":"https://avatars.githubusercontent.com/u/6190487?"},"repo":{"id":14080264,"name":"faux123/Nexus_5","url":"https://api.github.com/repos/faux123/Nexus_5"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:06:45Z"}
{"id":"2489398701","type":"GollumEvent","actor":{"id":7797609,"login":"ivanwfr","gravatar_id":"","url":"https://api.github.com/users/ivanwfr","avatar_url":"https://avatars.githubusercontent.com/u/7797609?"},"repo":{"id":808316,"name":"cswetenham/tabspace2.1","url":"https://api.github.com/repos/cswetenham/tabspace2.1"},"payload":{"pages":[{"page_name":"Brandon-Craig-Rhodes-TabSpace-Chords-Colored","title":"Brandon Craig Rhodes TabSpace Chords Colored","summary":null,"action":"edited","sha":"d09c2420a64f21b7a0778ef7d3245689239eea08","html_url":"https://github.com/cswetenham/tabspace2.1/wiki/Brandon-Craig-Rhodes-TabSpace-Chords-Colored"}]},"public":true,"created_at":"2015-01-01T01:06:45Z"}
{"id":"2489398702","type":"PushEvent","actor":{"id":3022197,"login":"liuyang1","gravatar_id":"","url":"https://api.github.com/users/liuyang1","avatar_url":"https://avatars.githubusercontent.com/u/3022197?"},"repo":{"id":26949326,"name":"liuyang1/test","url":"https://api.github.com/repos/liuyang1/test"},"payload":{"push_id":536753475,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"8837445c1174eede953b25f754b128a924ee1b84","before":"0376a5169b1e0d40ba945bbe9b991b6bd142b2ff","commits":[{"sha":"355f7490539ead559764f294aade43d904ba5aa7","author":{"email":"35a72eefb2bfb2a974e000ff4a69ccb41ad11391@mail.ustc.edu.cn","name":"liuyang1"},"message":"dynamic Macro add timestamp","distinct":true,"url":"https://api.github.com/repos/liuyang1/test/commits/355f7490539ead559764f294aade43d904ba5aa7"},{"sha":"8837445c1174eede953b25f754b128a924ee1b84","author":{"email":"35a72eefb2bfb2a974e000ff4a69ccb41ad11391@mail.ustc.edu.cn","name":"liuyang1"},"message":"Merge branch 'master' of github.com:liuyang1/test","distinct":true,"url":"https://api.github.com/repos/liuyang1/test/commits/8837445c1174eede953b25f754b128a924ee1b84"}]},"public":true,"created_at":"2015-01-01T01:06:45Z"}
{"id":"2489398703","type":"PushEvent","actor":{"id":9101573,"login":"megantmcginley","gravatar_id":"","url":"https://api.github.com/users/megantmcginley","avatar_url":"https://avatars.githubusercontent.com/u/9101573?"},"repo":{"id":25549968,"name":"megantmcginley/megantmcginley.github.io","url":"https://api.github.com/repos/megantmcginley/megantmcginley.github.io"},"payload":{"push_id":536753476,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1cfb7c3568cd96f4d5233c1ca07f94a0d6a56762","before":"1ac2c938f5436c6ff9576e262b80ccbced4586a8","commits":[{"sha":"1cfb7c3568cd96f4d5233c1ca07f94a0d6a56762","author":{"email":"92f56e51255edbb80c74150d0115560b34c2bc35@users.noreply.github.com","name":"megantmcginley"},"message":"Update about.html","distinct":true,"url":"https://api.github.com/repos/megantmcginley/megantmcginley.github.io/commits/1cfb7c3568cd96f4d5233c1ca07f94a0d6a56762"}]},"public":true,"created_at":"2015-01-01T01:06:45Z"}
{"id":"2489398704","type":"PushEvent","actor":{"id":376203,"login":"JoshEngebretson","gravatar_id":"","url":"https://api.github.com/users/JoshEngebretson","avatar_url":"https://avatars.githubusercontent.com/u/376203?"},"repo":{"id":26557148,"name":"AtomicGameEngine/AtomicRuntime","url":"https://api.github.com/repos/AtomicGameEngine/AtomicRuntime"},"payload":{"push_id":536753477,"size":1,"distinct_size":1,"ref":"refs/heads/atomic_light2d","head":"b2bca32f071f0b1d396834006324c09719f92353","before":"1d650fe0e4ee13049f9e32fd7ad8d650f99b13d2","commits":[{"sha":"b2bca32f071f0b1d396834006324c09719f92353","author":{"email":"c028c213ed5efcf30c3f4fc7361dbde0c893c5b7@galaxyfarfaraway.com","name":"Josh Engebretson"},"message":"Light2D Fix silly error","distinct":true,"url":"https://api.github.com/repos/AtomicGameEngine/AtomicRuntime/commits/b2bca32f071f0b1d396834006324c09719f92353"}]},"public":true,"created_at":"2015-01-01T01:06:45Z","org":{"id":9641691,"login":"AtomicGameEngine","gravatar_id":"","url":"https://api.github.com/orgs/AtomicGameEngine","avatar_url":"https://avatars.githubusercontent.com/u/9641691?"}}
{"id":"2489398706","type":"PushEvent","actor":{"id":7606292,"login":"simplicit","gravatar_id":"","url":"https://api.github.com/users/simplicit","avatar_url":"https://avatars.githubusercontent.com/u/7606292?"},"repo":{"id":27554172,"name":"lenovo-a3-dev/android_frameworks_opt_telephony","url":"https://api.github.com/repos/lenovo-a3-dev/android_frameworks_opt_telephony"},"payload":{"push_id":536753478,"size":1,"distinct_size":1,"ref":"refs/heads/cm-11.0","head":"29b19bfb6baee32941b09a186caca194f3c1756f","before":"9e20514b298ee1cdf909084c9d1a56e8663d132a","commits":[{"sha":"29b19bfb6baee32941b09a186caca194f3c1756f","author":{"email":"c692d6a10598e0a801576fdd4ecf3c37e45bfbc4@cs.pitt.edu","name":"William C. Garrison III"},"message":"Telephony: If no wrapped message, originating address is null\n\nA Verizon HTC m8 user reported this error:\n\nhttp://pastebin.com/3LaYGB6X\n\nwhich means that mWrappedSmsMessage is null, meaning it wasn't created\nsuccessfully by createFromPdu(pdu, format). Let's let getOriginatingAddress()\nreport this as a null, and see if createFromPdu(pdu) can create the wrapped\nmessage properly.\n\nEven if it's still a null, TextUtils.isEmpty will return true, meaning the\nmessage's address won't be returned (better than crashing com.process.phone).\n\nChange-Id: I419bc3e6045b0cf7d62a348a0be02555e0f7b76e","distinct":true,"url":"https://api.github.com/repos/lenovo-a3-dev/android_frameworks_opt_telephony/commits/29b19bfb6baee32941b09a186caca194f3c1756f"}]},"public":true,"created_at":"2015-01-01T01:06:47Z","org":{"id":6270737,"login":"lenovo-a3-dev","gravatar_id":"","url":"https://api.github.com/orgs/lenovo-a3-dev","avatar_url":"https://avatars.githubusercontent.com/u/6270737?"}}
{"id":"2489398707","type":"PushEvent","actor":{"id":10263666,"login":"katiekroik","gravatar_id":"","url":"https://api.github.com/users/katiekroik","avatar_url":"https://avatars.githubusercontent.com/u/10263666?"},"repo":{"id":28677679,"name":"jl4282/swirlwebsite","url":"https://api.github.com/repos/jl4282/swirlwebsite"},"payload":{"push_id":536753479,"size":1,"distinct_size":1,"ref":"refs/heads/develop","head":"0b72a0bb1292ee07b8309774bdcc4165db322c26","before":"53bc894d93b396c5cc3c224311421a017ceac40e","commits":[{"sha":"0b72a0bb1292ee07b8309774bdcc4165db322c26","author":{"email":"fdb375617daf85f650fdf56bce778da925caee49@nyu.edu","name":"katiekroik"},"message":"Updated README","distinct":true,"url":"https://api.github.com/repos/jl4282/swirlwebsite/commits/0b72a0bb1292ee07b8309774bdcc4165db322c26"}]},"public":true,"created_at":"2015-01-01T01:06:47Z"}
{"id":"2489398715","type":"PushEvent","actor":{"id":3020337,"login":"ads04r","gravatar_id":"","url":"https://api.github.com/users/ads04r","avatar_url":"https://avatars.githubusercontent.com/u/3020337?"},"repo":{"id":7232953,"name":"ads04r/imouto","url":"https://api.github.com/repos/ads04r/imouto"},"payload":{"push_id":536753483,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"957618358c63acb1bdd466c1ca5236c5027d6298","before":"85c3e84ba948391cfe558c49d6a7468ead1101f2","commits":[{"sha":"957618358c63acb1bdd466c1ca5236c5027d6298","author":{"email":"0ccde024171faa98768fb1f17761d5e2335a31b4@ecs.soton.ac.uk","name":"Ash"},"message":"Some basic queries for generating yearly summaries\n\nWill be removed and integrated properly soon, I just wanted them in\nchange control sooner rather than later.","distinct":true,"url":"https://api.github.com/repos/ads04r/imouto/commits/957618358c63acb1bdd466c1ca5236c5027d6298"}]},"public":true,"created_at":"2015-01-01T01:06:47Z"}
{"id":"2489398721","type":"PushEvent","actor":{"id":458892,"login":"Havanna","gravatar_id":"","url":"https://api.github.com/users/Havanna","avatar_url":"https://avatars.githubusercontent.com/u/458892?"},"repo":{"id":22987680,"name":"Ihavee/ihavee.github.io","url":"https://api.github.com/repos/Ihavee/ihavee.github.io"},"payload":{"push_id":536753486,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b51e29b184d6b5c13c71376a6f7e75c42c364759","before":"44190b8c058537664c002a93b6db1d47dd7f6bb2","commits":[{"sha":"b51e29b184d6b5c13c71376a6f7e75c42c364759","author":{"email":"8743e28f8544a53faec3c88031aa3516d5d474c9@yeah.net","name":"Havanna"},"message":"update image","distinct":true,"url":"https://api.github.com/repos/Ihavee/ihavee.github.io/commits/b51e29b184d6b5c13c71376a6f7e75c42c364759"}]},"public":true,"created_at":"2015-01-01T01:06:49Z","org":{"id":1856466,"login":"Ihavee","gravatar_id":"","url":"https://api.github.com/orgs/Ihavee","avatar_url":"https://avatars.githubusercontent.com/u/1856466?"}}
{"id":"2489398730","type":"IssueCommentEvent","actor":{"id":1682199,"login":"JayBeavers","gravatar_id":"","url":"https://api.github.com/users/JayBeavers","avatar_url":"https://avatars.githubusercontent.com/u/1682199?"},"repo":{"id":21885551,"name":"erikringsmuth/app-router","url":"https://api.github.com/repos/erikringsmuth/app-router"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/erikringsmuth/app-router/issues/60","labels_url":"https://api.github.com/repos/erikringsmuth/app-router/issues/60/labels{/name}","comments_url":"https://api.github.com/repos/erikringsmuth/app-router/issues/60/comments","events_url":"https://api.github.com/repos/erikringsmuth/app-router/issues/60/events","html_url":"https://github.com/erikringsmuth/app-router/issues/60","id":53166608,"number":60,"title":"Test instructions in readme out of date?","user":{"login":"JayBeavers","id":1682199,"avatar_url":"https://avatars.githubusercontent.com/u/1682199?v=3","gravatar_id":"","url":"https://api.github.com/users/JayBeavers","html_url":"https://github.com/JayBeavers","followers_url":"https://api.github.com/users/JayBeavers/followers","following_url":"https://api.github.com/users/JayBeavers/following{/other_user}","gists_url":"https://api.github.com/users/JayBeavers/gists{/gist_id}","starred_url":"https://api.github.com/users/JayBeavers/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JayBeavers/subscriptions","organizations_url":"https://api.github.com/users/JayBeavers/orgs","repos_url":"https://api.github.com/users/JayBeavers/repos","events_url":"https://api.github.com/users/JayBeavers/events{/privacy}","received_events_url":"https://api.github.com/users/JayBeavers/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":5,"created_at":"2014-12-31T04:25:55Z","updated_at":"2015-01-01T01:06:50Z","closed_at":"2015-01-01T01:06:50Z","body":"At [build, test, and 
debug](https://github.com/erikringsmuth/app-router/#build-test-and-debug-) it says to:\r\n\r\n    Manually run functional tests in the browser by starting a static content server\r\n    (node http-server or python -m SimpleHTTPServer) and open\r\n    http://localhost:8080/tests/functional-tests/\r\n\r\nBut this gets you a 404.  Perhaps you meant\r\n\r\n    http://localhost:8080/tests/SpecRunner.html\r\n\r\nBut I *think* this is taken care of by gulp."},"comment":{"url":"https://api.github.com/repos/erikringsmuth/app-router/issues/comments/68477366","html_url":"https://github.com/erikringsmuth/app-router/issues/60#issuecomment-68477366","issue_url":"https://api.github.com/repos/erikringsmuth/app-router/issues/60","id":68477366,"user":{"login":"JayBeavers","id":1682199,"avatar_url":"https://avatars.githubusercontent.com/u/1682199?v=3","gravatar_id":"","url":"https://api.github.com/users/JayBeavers","html_url":"https://github.com/JayBeavers","followers_url":"https://api.github.com/users/JayBeavers/followers","following_url":"https://api.github.com/users/JayBeavers/following{/other_user}","gists_url":"https://api.github.com/users/JayBeavers/gists{/gist_id}","starred_url":"https://api.github.com/users/JayBeavers/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JayBeavers/subscriptions","organizations_url":"https://api.github.com/users/JayBeavers/orgs","repos_url":"https://api.github.com/users/JayBeavers/repos","events_url":"https://api.github.com/users/JayBeavers/events{/privacy}","received_events_url":"https://api.github.com/users/JayBeavers/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:06:50Z","updated_at":"2015-01-01T01:06:50Z","body":"Closing.  Would offer to PR the docs, but you're moving towards an automated approach instead."}},"public":true,"created_at":"2015-01-01T01:06:51Z"}
{"id":"2489398731","type":"IssuesEvent","actor":{"id":1682199,"login":"JayBeavers","gravatar_id":"","url":"https://api.github.com/users/JayBeavers","avatar_url":"https://avatars.githubusercontent.com/u/1682199?"},"repo":{"id":21885551,"name":"erikringsmuth/app-router","url":"https://api.github.com/repos/erikringsmuth/app-router"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/erikringsmuth/app-router/issues/60","labels_url":"https://api.github.com/repos/erikringsmuth/app-router/issues/60/labels{/name}","comments_url":"https://api.github.com/repos/erikringsmuth/app-router/issues/60/comments","events_url":"https://api.github.com/repos/erikringsmuth/app-router/issues/60/events","html_url":"https://github.com/erikringsmuth/app-router/issues/60","id":53166608,"number":60,"title":"Test instructions in readme out of date?","user":{"login":"JayBeavers","id":1682199,"avatar_url":"https://avatars.githubusercontent.com/u/1682199?v=3","gravatar_id":"","url":"https://api.github.com/users/JayBeavers","html_url":"https://github.com/JayBeavers","followers_url":"https://api.github.com/users/JayBeavers/followers","following_url":"https://api.github.com/users/JayBeavers/following{/other_user}","gists_url":"https://api.github.com/users/JayBeavers/gists{/gist_id}","starred_url":"https://api.github.com/users/JayBeavers/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/JayBeavers/subscriptions","organizations_url":"https://api.github.com/users/JayBeavers/orgs","repos_url":"https://api.github.com/users/JayBeavers/repos","events_url":"https://api.github.com/users/JayBeavers/events{/privacy}","received_events_url":"https://api.github.com/users/JayBeavers/received_events","type":"User","site_admin":false},"labels":[],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":5,"created_at":"2014-12-31T04:25:55Z","updated_at":"2015-01-01T01:06:50Z","closed_at":"2015-01-01T01:06:50Z","body":"At [build, test, and 
debug](https://github.com/erikringsmuth/app-router/#build-test-and-debug-) it says to:\r\n\r\n    Manually run functional tests in the browser by starting a static content server\r\n    (node http-server or python -m SimpleHTTPServer) and open\r\n    http://localhost:8080/tests/functional-tests/\r\n\r\nBut this gets you a 404.  Perhaps you meant\r\n\r\n    http://localhost:8080/tests/SpecRunner.html\r\n\r\nBut I *think* this is taken care of by gulp."}},"public":true,"created_at":"2015-01-01T01:06:51Z"}
{"id":"2489398735","type":"PushEvent","actor":{"id":9828988,"login":"alexformagio","gravatar_id":"","url":"https://api.github.com/users/alexformagio","avatar_url":"https://avatars.githubusercontent.com/u/9828988?"},"repo":{"id":28678021,"name":"alexformagio/python30min","url":"https://api.github.com/repos/alexformagio/python30min"},"payload":{"push_id":536753490,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"94076cb80620e00f80a01fb228e6f01bbcaf550e","before":"6148df2e7babc92c0568cc452deae2b683a041da","commits":[{"sha":"94076cb80620e00f80a01fb228e6f01bbcaf550e","author":{"email":"eb51c250a6d7f2b7307829ec95405c85965e34b2@gmail.com","name":"alex_formagio"},"message":"uploa file3","distinct":true,"url":"https://api.github.com/repos/alexformagio/python30min/commits/94076cb80620e00f80a01fb228e6f01bbcaf550e"}]},"public":true,"created_at":"2015-01-01T01:06:51Z"}
{"id":"2489398736","type":"PushEvent","actor":{"id":3332598,"login":"pgruenbacher","gravatar_id":"","url":"https://api.github.com/users/pgruenbacher","avatar_url":"https://avatars.githubusercontent.com/u/3332598?"},"repo":{"id":28670009,"name":"pgruenbacher/mydrive5","url":"https://api.github.com/repos/pgruenbacher/mydrive5"},"payload":{"push_id":536753491,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"397ed4267dcdbff8c52324a3f66776a87495da02","before":"9237ed0f2b971ef413bd50e748dc8579e2323a5c","commits":[{"sha":"397ed4267dcdbff8c52324a3f66776a87495da02","author":{"email":"6f5c7f15036059ac7b25472c8812708bfb22b1eb@gmail.com","name":"Paul Gruenbacher"},"message":"palette","distinct":true,"url":"https://api.github.com/repos/pgruenbacher/mydrive5/commits/397ed4267dcdbff8c52324a3f66776a87495da02"}]},"public":true,"created_at":"2015-01-01T01:06:51Z"}
{"id":"2489398743","type":"PushEvent","actor":{"id":10355660,"login":"nomadturk","gravatar_id":"","url":"https://api.github.com/users/nomadturk","avatar_url":"https://avatars.githubusercontent.com/u/10355660?"},"repo":{"id":28657737,"name":"nomadturk/nginx-conf","url":"https://api.github.com/repos/nomadturk/nginx-conf"},"payload":{"push_id":536753494,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"035679b2f50ea9d689bba803906d5b1ee3418062","before":"f560a8bd7c3d688fd6b99a5976e3518fbbfd68a3","commits":[{"sha":"035679b2f50ea9d689bba803906d5b1ee3418062","author":{"email":"90283840d90de49b8e7984bd99b47fee0d4bd50d@cokh.net","name":"nomadturk"},"message":"Create pagespeed-all-settings.add","distinct":true,"url":"https://api.github.com/repos/nomadturk/nginx-conf/commits/035679b2f50ea9d689bba803906d5b1ee3418062"}]},"public":true,"created_at":"2015-01-01T01:06:53Z"}
{"id":"2489398744","type":"PushEvent","actor":{"id":3105201,"login":"beh68030","gravatar_id":"","url":"https://api.github.com/users/beh68030","avatar_url":"https://avatars.githubusercontent.com/u/3105201?"},"repo":{"id":22865608,"name":"beh68030/twitch_lookup","url":"https://api.github.com/repos/beh68030/twitch_lookup"},"payload":{"push_id":536753495,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"2e8582db72d4c53a2627aa9fb700aa56c9689bf9","before":"18fabca10abfd73c080a73db05759fa14d98dfa6","commits":[{"sha":"2e8582db72d4c53a2627aa9fb700aa56c9689bf9","author":{"email":"3e061f68f73b3319b5773c9f6054f99a9369e4cb@users.noreply.github.com","name":"beh68030"},"message":"Update search.lisp","distinct":true,"url":"https://api.github.com/repos/beh68030/twitch_lookup/commits/2e8582db72d4c53a2627aa9fb700aa56c9689bf9"}]},"public":true,"created_at":"2015-01-01T01:06:53Z"}
{"id":"2489398750","type":"PushEvent","actor":{"id":32421,"login":"damonallison","gravatar_id":"","url":"https://api.github.com/users/damonallison","avatar_url":"https://avatars.githubusercontent.com/u/32421?"},"repo":{"id":28276966,"name":"damonallison/git-test","url":"https://api.github.com/repos/damonallison/git-test"},"payload":{"push_id":536753497,"size":5,"distinct_size":4,"ref":"refs/heads/damon2","head":"3e58f93effeb21baf088c66ac7ba4db6565f832e","before":"096de29c8100f5a960060052b04f5ef4902355cd","commits":[{"sha":"0cd38185bffd3af3513d0763ced55fb8916f6072","author":{"email":"a836250b7333a571ccf7c31c8a50a83778615420@code42.com","name":"Damon Allison"},"message":"damon","distinct":true,"url":"https://api.github.com/repos/damonallison/git-test/commits/0cd38185bffd3af3513d0763ced55fb8916f6072"},{"sha":"a0241b998058d49fe5ec6b1732d32f4269d4de30","author":{"email":"a836250b7333a571ccf7c31c8a50a83778615420@code42.com","name":"Damon Allison"},"message":"master","distinct":false,"url":"https://api.github.com/repos/damonallison/git-test/commits/a0241b998058d49fe5ec6b1732d32f4269d4de30"},{"sha":"eb2b6231b59cda41629ce12b4750d55e5946b6d5","author":{"email":"a836250b7333a571ccf7c31c8a50a83778615420@code42.com","name":"Damon Allison"},"message":"more on damon2","distinct":true,"url":"https://api.github.com/repos/damonallison/git-test/commits/eb2b6231b59cda41629ce12b4750d55e5946b6d5"},{"sha":"df69472afe16ac49d94618598ae40f9bde0b50b9","author":{"email":"a836250b7333a571ccf7c31c8a50a83778615420@code42.com","name":"Damon Allison"},"message":"more(2) on damon2","distinct":true,"url":"https://api.github.com/repos/damonallison/git-test/commits/df69472afe16ac49d94618598ae40f9bde0b50b9"},{"sha":"3e58f93effeb21baf088c66ac7ba4db6565f832e","author":{"email":"a836250b7333a571ccf7c31c8a50a83778615420@code42.com","name":"Damon Allison"},"message":"Merge branch 'master' into 
damon2","distinct":true,"url":"https://api.github.com/repos/damonallison/git-test/commits/3e58f93effeb21baf088c66ac7ba4db6565f832e"}]},"public":true,"created_at":"2015-01-01T01:06:53Z"}
{"id":"2489398752","type":"PushEvent","actor":{"id":9271233,"login":"Nexusty","gravatar_id":"","url":"https://api.github.com/users/Nexusty","avatar_url":"https://avatars.githubusercontent.com/u/9271233?"},"repo":{"id":28494954,"name":"Nexusty/open_exoplanet_catalogue","url":"https://api.github.com/repos/Nexusty/open_exoplanet_catalogue"},"payload":{"push_id":536753498,"size":3,"distinct_size":3,"ref":"refs/heads/master","head":"6fde6be1e4178a9268ad735ca4bc12edb9f66290","before":"1c76a1af7971f4fcc693b147bbf70c75d7352617","commits":[{"sha":"da3f398815f136e62b18be313e10dc5317d27a72","author":{"email":"898dba66b7f38fdb797b262b137097fc973d6485@hanno-rein.de","name":"Hanno Rein"},"message":"Merge pull request #434 from Nexusty/master\n\nWASP-84 b","distinct":true,"url":"https://api.github.com/repos/Nexusty/open_exoplanet_catalogue/commits/da3f398815f136e62b18be313e10dc5317d27a72"},{"sha":"ab6d6080cd03d5aaa863bfba2944f7e006b1e186","author":{"email":"7108125947c1f9f50408652b4c345d19fd23e566@users.noreply.github.com","name":"Christian Sturm"},"message":"Added hot Jupiter\n\nCloses #435","distinct":true,"url":"https://api.github.com/repos/Nexusty/open_exoplanet_catalogue/commits/ab6d6080cd03d5aaa863bfba2944f7e006b1e186"},{"sha":"6fde6be1e4178a9268ad735ca4bc12edb9f66290","author":{"email":"898dba66b7f38fdb797b262b137097fc973d6485@hanno-rein.de","name":"Hanno Rein"},"message":"Merge pull request #436 from Sol-d/patch-6\n\nAdded hot Jupiter","distinct":true,"url":"https://api.github.com/repos/Nexusty/open_exoplanet_catalogue/commits/6fde6be1e4178a9268ad735ca4bc12edb9f66290"}]},"public":true,"created_at":"2015-01-01T01:06:53Z"}
{"id":"2489398760","type":"PushEvent","actor":{"id":660054,"login":"MarkAYoder","gravatar_id":"","url":"https://api.github.com/users/MarkAYoder","avatar_url":"https://avatars.githubusercontent.com/u/660054?"},"repo":{"id":5111513,"name":"MarkAYoder/BeagleBoard-exercises","url":"https://api.github.com/repos/MarkAYoder/BeagleBoard-exercises"},"payload":{"push_id":536753503,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"ab3d6b980de5ba3c23f61a4645efb701fbbde1a2","before":"ebc1e32f6e6e373f1d46fa4d0b532eba4ec7c497","commits":[{"sha":"ab3d6b980de5ba3c23f61a4645efb701fbbde1a2","author":{"email":"9068e990bc2a9df3bc663b2b11b19718c2490ef5@Rose-Hulman.edu","name":"Mark A. Yoder"},"message":"Added STRING_LEN and color-names","distinct":true,"url":"https://api.github.com/repos/MarkAYoder/BeagleBoard-exercises/commits/ab3d6b980de5ba3c23f61a4645efb701fbbde1a2"}]},"public":true,"created_at":"2015-01-01T01:06:55Z"}
{"id":"2489398762","type":"PushEvent","actor":{"id":433707,"login":"ile","gravatar_id":"","url":"https://api.github.com/users/ile","avatar_url":"https://avatars.githubusercontent.com/u/433707?"},"repo":{"id":26847132,"name":"kantele/k-templates","url":"https://api.github.com/repos/kantele/k-templates"},"payload":{"push_id":536753504,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"2250e5e1294fae3c21d3fa9b19bd162c40c29a6c","before":"bd9e3811383e5c3fc3bbd2b9ddd90047df70e7c5","commits":[{"sha":"2250e5e1294fae3c21d3fa9b19bd162c40c29a6c","author":{"email":"4f3407de78bccc8cc160ee4d278d5efe7162e6b5@nateps.com","name":"Nate Smith"},"message":"always make dynamic views optional\n\ninstead of throwing an error when a dynamic lookup fails and optional\nis not specified, just always render a blank template","distinct":true,"url":"https://api.github.com/repos/kantele/k-templates/commits/2250e5e1294fae3c21d3fa9b19bd162c40c29a6c"}]},"public":true,"created_at":"2015-01-01T01:06:55Z","org":{"id":5687585,"login":"kantele","gravatar_id":"","url":"https://api.github.com/orgs/kantele","avatar_url":"https://avatars.githubusercontent.com/u/5687585?"}}
{"id":"2489398767","type":"PushEvent","actor":{"id":1308363,"login":"paymonp","gravatar_id":"","url":"https://api.github.com/users/paymonp","avatar_url":"https://avatars.githubusercontent.com/u/1308363?"},"repo":{"id":28678242,"name":"paymonp/forecast_wrapper","url":"https://api.github.com/repos/paymonp/forecast_wrapper"},"payload":{"push_id":536753505,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"cfa67c6a84faaa2bddc78c69075b5d1c9ebb42fd","before":"9b9757b748dd98f06c2517a9af376e7515716a6a","commits":[{"sha":"cfa67c6a84faaa2bddc78c69075b5d1c9ebb42fd","author":{"email":"fc8885f78a23392efbab2637290a95a3fe38d9fa@team.curious.com","name":"Paymon"},"message":"Update README.md","distinct":true,"url":"https://api.github.com/repos/paymonp/forecast_wrapper/commits/cfa67c6a84faaa2bddc78c69075b5d1c9ebb42fd"}]},"public":true,"created_at":"2015-01-01T01:06:57Z"}
{"id":"2489398768","type":"CreateEvent","actor":{"id":10214932,"login":"jplarida","gravatar_id":"","url":"https://api.github.com/users/jplarida","avatar_url":"https://avatars.githubusercontent.com/u/10214932?"},"repo":{"id":28678286,"name":"jplarida/testgit","url":"https://api.github.com/repos/jplarida/testgit"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"this is a test","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:06:58Z"}
{"id":"2489398769","type":"IssuesEvent","actor":{"id":1737635,"login":"waltervr","gravatar_id":"","url":"https://api.github.com/users/waltervr","avatar_url":"https://avatars.githubusercontent.com/u/1737635?"},"repo":{"id":28369326,"name":"waltervr/mejengol","url":"https://api.github.com/repos/waltervr/mejengol"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/waltervr/mejengol/issues/6","labels_url":"https://api.github.com/repos/waltervr/mejengol/issues/6/labels{/name}","comments_url":"https://api.github.com/repos/waltervr/mejengol/issues/6/comments","events_url":"https://api.github.com/repos/waltervr/mejengol/issues/6/events","html_url":"https://github.com/waltervr/mejengol/issues/6","id":53210298,"number":6,"title":"Use a single button for start/stop chronometer.","user":{"login":"waltervr","id":1737635,"avatar_url":"https://avatars.githubusercontent.com/u/1737635?v=3","gravatar_id":"","url":"https://api.github.com/users/waltervr","html_url":"https://github.com/waltervr","followers_url":"https://api.github.com/users/waltervr/followers","following_url":"https://api.github.com/users/waltervr/following{/other_user}","gists_url":"https://api.github.com/users/waltervr/gists{/gist_id}","starred_url":"https://api.github.com/users/waltervr/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/waltervr/subscriptions","organizations_url":"https://api.github.com/users/waltervr/orgs","repos_url":"https://api.github.com/users/waltervr/repos","events_url":"https://api.github.com/users/waltervr/events{/privacy}","received_events_url":"https://api.github.com/users/waltervr/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:06:57Z","updated_at":"2015-01-01T01:06:57Z","closed_at":null,"body":"Use a single button for start/stop chronometer."}},"public":true,"created_at":"2015-01-01T01:06:58Z"}
{"id":"2489398771","type":"PushEvent","actor":{"id":777062,"login":"MikeLorenz","gravatar_id":"","url":"https://api.github.com/users/MikeLorenz","avatar_url":"https://avatars.githubusercontent.com/u/777062?"},"repo":{"id":28676253,"name":"MikeLorenz/Spoon-Knife","url":"https://api.github.com/repos/MikeLorenz/Spoon-Knife"},"payload":{"push_id":536753506,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"5e43e91af613860fc38ce4e2f77272bfd60cc143","before":"d0dd1f61b33d64e29d8bc1372a94ef6a2fee76a9","commits":[{"sha":"5e43e91af613860fc38ce4e2f77272bfd60cc143","author":{"email":"a17fed27eaa842282862ff7c1b9c8395a26ac320@mikelorenz.com","name":"Mike Lorenz"},"message":"Changed the outgoing text.","distinct":true,"url":"https://api.github.com/repos/MikeLorenz/Spoon-Knife/commits/5e43e91af613860fc38ce4e2f77272bfd60cc143"}]},"public":true,"created_at":"2015-01-01T01:06:58Z"}
{"id":"2489398778","type":"PushEvent","actor":{"id":8683432,"login":"wkcool","gravatar_id":"","url":"https://api.github.com/users/wkcool","avatar_url":"https://avatars.githubusercontent.com/u/8683432?"},"repo":{"id":27059641,"name":"wkcool/wkcool.github.com","url":"https://api.github.com/repos/wkcool/wkcool.github.com"},"payload":{"push_id":536753510,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"9f6584f5fa96346a20b148f340fbfd055dd70e7e","before":"48d6c11b675a084cfa0321b7b14c00241e423044","commits":[{"sha":"9f6584f5fa96346a20b148f340fbfd055dd70e7e","author":{"email":"ddd2d39a843d8ae129b2e2fc6f13669f44116bd1@gmail.com","name":"wenkrcool"},"message":"提交","distinct":true,"url":"https://api.github.com/repos/wkcool/wkcool.github.com/commits/9f6584f5fa96346a20b148f340fbfd055dd70e7e"}]},"public":true,"created_at":"2015-01-01T01:06:59Z"}
{"id":"2489398785","type":"PushEvent","actor":{"id":1714830,"login":"davidsavagejr","gravatar_id":"","url":"https://api.github.com/users/davidsavagejr","avatar_url":"https://avatars.githubusercontent.com/u/1714830?"},"repo":{"id":28677976,"name":"davidsavagejr/NSBTransactionPerformance","url":"https://api.github.com/repos/davidsavagejr/NSBTransactionPerformance"},"payload":{"push_id":536753515,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"142bcdb815e594a389be04a10fa12465d9de7699","before":"a15ad161b2efd7821dadfe429d641b349ebeb65f","commits":[{"sha":"142bcdb815e594a389be04a10fa12465d9de7699","author":{"email":"aa743a0aaec8f7d7a1f01442503957f4d7a2d634@headspring.com","name":"David Savage"},"message":"Couple cleanup items and added sql file","distinct":true,"url":"https://api.github.com/repos/davidsavagejr/NSBTransactionPerformance/commits/142bcdb815e594a389be04a10fa12465d9de7699"}]},"public":true,"created_at":"2015-01-01T01:07:00Z"}
{"id":"2489398787","type":"IssueCommentEvent","actor":{"id":10238253,"login":"DasCode","gravatar_id":"","url":"https://api.github.com/users/DasCode","avatar_url":"https://avatars.githubusercontent.com/u/10238253?"},"repo":{"id":24246283,"name":"trydis/FIFA-Ultimate-Team-2015-Toolkit","url":"https://api.github.com/repos/trydis/FIFA-Ultimate-Team-2015-Toolkit"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/trydis/FIFA-Ultimate-Team-2015-Toolkit/issues/73","labels_url":"https://api.github.com/repos/trydis/FIFA-Ultimate-Team-2015-Toolkit/issues/73/labels{/name}","comments_url":"https://api.github.com/repos/trydis/FIFA-Ultimate-Team-2015-Toolkit/issues/73/comments","events_url":"https://api.github.com/repos/trydis/FIFA-Ultimate-Team-2015-Toolkit/issues/73/events","html_url":"https://github.com/trydis/FIFA-Ultimate-Team-2015-Toolkit/issues/73","id":47828562,"number":73,"title":"[Question] Check in Watchlist, if I'm overbid?","user":{"login":"Taggardos","id":7068808,"avatar_url":"https://avatars.githubusercontent.com/u/7068808?v=3","gravatar_id":"","url":"https://api.github.com/users/Taggardos","html_url":"https://github.com/Taggardos","followers_url":"https://api.github.com/users/Taggardos/followers","following_url":"https://api.github.com/users/Taggardos/following{/other_user}","gists_url":"https://api.github.com/users/Taggardos/gists{/gist_id}","starred_url":"https://api.github.com/users/Taggardos/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Taggardos/subscriptions","organizations_url":"https://api.github.com/users/Taggardos/orgs","repos_url":"https://api.github.com/users/Taggardos/repos","events_url":"https://api.github.com/users/Taggardos/events{/privacy}","received_events_url":"https://api.github.com/users/Taggardos/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":1,"created_at":"2014-11-05T12:00:50Z","updated_at":"2015-01-
01T01:07:00Z","closed_at":null,"body":"Hello,\r\nthe Topic says it all?\r\nIs it possible to check, if I am overbidded by someone else with the Toolkit?\r\n"},"comment":{"url":"https://api.github.com/repos/trydis/FIFA-Ultimate-Team-2015-Toolkit/issues/comments/68477369","html_url":"https://github.com/trydis/FIFA-Ultimate-Team-2015-Toolkit/issues/73#issuecomment-68477369","issue_url":"https://api.github.com/repos/trydis/FIFA-Ultimate-Team-2015-Toolkit/issues/73","id":68477369,"user":{"login":"DasCode","id":10238253,"avatar_url":"https://avatars.githubusercontent.com/u/10238253?v=3","gravatar_id":"","url":"https://api.github.com/users/DasCode","html_url":"https://github.com/DasCode","followers_url":"https://api.github.com/users/DasCode/followers","following_url":"https://api.github.com/users/DasCode/following{/other_user}","gists_url":"https://api.github.com/users/DasCode/gists{/gist_id}","starred_url":"https://api.github.com/users/DasCode/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/DasCode/subscriptions","organizations_url":"https://api.github.com/users/DasCode/orgs","repos_url":"https://api.github.com/users/DasCode/repos","events_url":"https://api.github.com/users/DasCode/events{/privacy}","received_events_url":"https://api.github.com/users/DasCode/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:07:00Z","updated_at":"2015-01-01T01:07:00Z","body":"As with anything, try it with the real web app, observe what happens in fiddler, and then use that to figure it out.\r\nIn this case if you bidState is \"outbid\""}},"public":true,"created_at":"2015-01-01T01:07:00Z"}
{"id":"2489398789","type":"CreateEvent","actor":{"id":804014,"login":"ry5n","gravatar_id":"","url":"https://api.github.com/users/ry5n","avatar_url":"https://avatars.githubusercontent.com/u/804014?"},"repo":{"id":28678287,"name":"ry5n/sass-inline-svg","url":"https://api.github.com/repos/ry5n/sass-inline-svg"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"Inline an SVG as a CSS data URI. Allows recoloring paths.","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:07:00Z"}
{"id":"2489398793","type":"WatchEvent","actor":{"id":5554477,"login":"errolgrannum","gravatar_id":"","url":"https://api.github.com/users/errolgrannum","avatar_url":"https://avatars.githubusercontent.com/u/5554477?"},"repo":{"id":8845569,"name":"adamw523/simple_pyobjc_cocoa_xib","url":"https://api.github.com/repos/adamw523/simple_pyobjc_cocoa_xib"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:07:01Z"}
{"id":"2489398795","type":"PushEvent","actor":{"id":3259988,"login":"Chaldron","gravatar_id":"","url":"https://api.github.com/users/Chaldron","avatar_url":"https://avatars.githubusercontent.com/u/3259988?"},"repo":{"id":28620299,"name":"Chaldron/chaldron.github.io","url":"https://api.github.com/repos/Chaldron/chaldron.github.io"},"payload":{"push_id":536753517,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"95f51364ae4ffa6d8c05ac103f6673b582aee33f","before":"bbae0256bd9a39b68421f3b8f57e1d1f2c82e44a","commits":[{"sha":"95f51364ae4ffa6d8c05ac103f6673b582aee33f","author":{"email":"201d29e73a9d86ccd769ab841a6a1fabfaeec39b@me.com","name":"Aditya"},"message":"Replace master branch with page content via GitHub","distinct":true,"url":"https://api.github.com/repos/Chaldron/chaldron.github.io/commits/95f51364ae4ffa6d8c05ac103f6673b582aee33f"}]},"public":true,"created_at":"2015-01-01T01:07:01Z"}
{"id":"2489398800","type":"PushEvent","actor":{"id":5728403,"login":"patrick-hudson","gravatar_id":"","url":"https://api.github.com/users/patrick-hudson","avatar_url":"https://avatars.githubusercontent.com/u/5728403?"},"repo":{"id":25392255,"name":"patrick-hudson/EggDrop","url":"https://api.github.com/repos/patrick-hudson/EggDrop"},"payload":{"push_id":536753519,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"0976103a68d57ef5dfd23ce0b13166ed29505f57","before":"84116936c4f6805f56a1e643eb9898ebdc854334","commits":[{"sha":"0976103a68d57ef5dfd23ce0b13166ed29505f57","author":{"email":"cbb7353e6d953ef360baf960c122346276c6e320@hudson.bz","name":"Patrick Hudson"},"message":"Scripted auto-commit on change (2014-12-31 20:07:00) by gitwatch.sh","distinct":true,"url":"https://api.github.com/repos/patrick-hudson/EggDrop/commits/0976103a68d57ef5dfd23ce0b13166ed29505f57"}]},"public":true,"created_at":"2015-01-01T01:07:02Z"}
{"id":"2489398801","type":"WatchEvent","actor":{"id":7682325,"login":"humanrocker","gravatar_id":"","url":"https://api.github.com/users/humanrocker","avatar_url":"https://avatars.githubusercontent.com/u/7682325?"},"repo":{"id":168370,"name":"jruby/jruby","url":"https://api.github.com/repos/jruby/jruby"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:07:02Z","org":{"id":55687,"login":"jruby","gravatar_id":"","url":"https://api.github.com/orgs/jruby","avatar_url":"https://avatars.githubusercontent.com/u/55687?"}}
{"id":"2489398802","type":"CreateEvent","actor":{"id":2357415,"login":"neeleshbagga","gravatar_id":"","url":"https://api.github.com/users/neeleshbagga","avatar_url":"https://avatars.githubusercontent.com/u/2357415?"},"repo":{"id":28678288,"name":"neeleshbagga/CS2110QA","url":"https://api.github.com/repos/neeleshbagga/CS2110QA"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"An interactive Q&A tool built in Java","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:07:02Z"}
{"id":"2489398803","type":"PushEvent","actor":{"id":8965687,"login":"Gawainus","gravatar_id":"","url":"https://api.github.com/users/Gawainus","avatar_url":"https://avatars.githubusercontent.com/u/8965687?"},"repo":{"id":27628356,"name":"Gawainus/Systems","url":"https://api.github.com/repos/Gawainus/Systems"},"payload":{"push_id":536753520,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"fd9c66e6d94ab09f42e0986e8eecf075dc637f82","before":"04808fff427dd5bc90f3da6faa7abd58a3975139","commits":[{"sha":"fd9c66e6d94ab09f42e0986e8eecf075dc637f82","author":{"email":"95ac278ea19f44ce11e50f5f7e263294f31b7bb2@gmail.com","name":"Yumen Cao"},"message":"Malloc added","distinct":true,"url":"https://api.github.com/repos/Gawainus/Systems/commits/fd9c66e6d94ab09f42e0986e8eecf075dc637f82"}]},"public":true,"created_at":"2015-01-01T01:07:02Z"}
{"id":"2489398804","type":"WatchEvent","actor":{"id":1043930,"login":"hsw0","gravatar_id":"","url":"https://api.github.com/users/hsw0","avatar_url":"https://avatars.githubusercontent.com/u/1043930?"},"repo":{"id":330414,"name":"h2o/picohttpparser","url":"https://api.github.com/repos/h2o/picohttpparser"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:07:03Z","org":{"id":9275116,"login":"h2o","gravatar_id":"","url":"https://api.github.com/orgs/h2o","avatar_url":"https://avatars.githubusercontent.com/u/9275116?"}}
{"id":"2489398809","type":"PushEvent","actor":{"id":6955935,"login":"wfrizzell","gravatar_id":"","url":"https://api.github.com/users/wfrizzell","avatar_url":"https://avatars.githubusercontent.com/u/6955935?"},"repo":{"id":28678275,"name":"wfrizzell/Completed-Target-Model-Table-Documentation","url":"https://api.github.com/repos/wfrizzell/Completed-Target-Model-Table-Documentation"},"payload":{"push_id":536753521,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d030634f4bd8d8dc6d305cbe2afd05acefdacbd0","before":"265ddc64dff3dbbdaa2ce6021056a64b95b36c06","commits":[{"sha":"d030634f4bd8d8dc6d305cbe2afd05acefdacbd0","author":{"email":"e965d2ed358da94c7eb620090099fbbbcd752703@mphasis.com","name":"Bill Frizzell"},"message":"Target Model Entity Documentation","distinct":true,"url":"https://api.github.com/repos/wfrizzell/Completed-Target-Model-Table-Documentation/commits/d030634f4bd8d8dc6d305cbe2afd05acefdacbd0"}]},"public":true,"created_at":"2015-01-01T01:07:03Z"}
{"id":"2489398811","type":"PushEvent","actor":{"id":19571,"login":"lizadaly","gravatar_id":"","url":"https://api.github.com/users/lizadaly","avatar_url":"https://avatars.githubusercontent.com/u/19571?"},"repo":{"id":28673562,"name":"lizadaly/surrealisme","url":"https://api.github.com/repos/lizadaly/surrealisme"},"payload":{"push_id":536753523,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"748cde8726a87a0ca8102578e8bf0e1380b5bc92","before":"5bd3db7045dc3b1a231978c8b0ba17438a05436d","commits":[{"sha":"748cde8726a87a0ca8102578e8bf0e1380b5bc92","author":{"email":"7e31b076c038116b711593886947b7ee669cdd6a@safaribooksonline.com","name":"Liza Daly"},"message":"Some code","distinct":true,"url":"https://api.github.com/repos/lizadaly/surrealisme/commits/748cde8726a87a0ca8102578e8bf0e1380b5bc92"}]},"public":true,"created_at":"2015-01-01T01:07:03Z"}
{"id":"2489398815","type":"PushEvent","actor":{"id":4379694,"login":"moongato","gravatar_id":"","url":"https://api.github.com/users/moongato","avatar_url":"https://avatars.githubusercontent.com/u/4379694?"},"repo":{"id":11769101,"name":"moongato/android_packages_apps_settings","url":"https://api.github.com/repos/moongato/android_packages_apps_settings"},"payload":{"push_id":536753526,"size":3,"distinct_size":1,"ref":"refs/heads/lp50x","head":"a9d6ccf56bd0f57c043d30e57bf4aa9dde0f27ad","before":"56646a94c0aedc577d5db224058fb9be4c927786","commits":[{"sha":"e53c63b3254c37b69e9fcf05b69a1b2fb7f1858c","author":{"email":"0fdcc473619717889ce3a7389c2487333487bab5@gmail.com","name":"rascarlo"},"message":"volume rocker music controls","distinct":false,"url":"https://api.github.com/repos/moongato/android_packages_apps_settings/commits/e53c63b3254c37b69e9fcf05b69a1b2fb7f1858c"},{"sha":"bebb75fdaa4a085c814ea6d2551899593454440d","author":{"email":"0fdcc473619717889ce3a7389c2487333487bab5@gmail.com","name":"rascarlo"},"message":"status bar brightness control edits.\n\nremove check for SCREEN_BRIGHTNESS_MODE_AUTOMATIC","distinct":false,"url":"https://api.github.com/repos/moongato/android_packages_apps_settings/commits/bebb75fdaa4a085c814ea6d2551899593454440d"},{"sha":"a9d6ccf56bd0f57c043d30e57bf4aa9dde0f27ad","author":{"email":"22e0f38e0fc64da9129ff9b9ef030b39415294a1@ubuntu","name":"moongato"},"message":"Merge remote-tracking branch 'upstream/lollipop-ras-mr1' into lp50x","distinct":true,"url":"https://api.github.com/repos/moongato/android_packages_apps_settings/commits/a9d6ccf56bd0f57c043d30e57bf4aa9dde0f27ad"}]},"public":true,"created_at":"2015-01-01T01:07:04Z"}
{"id":"2489398818","type":"PushEvent","actor":{"id":3964764,"login":"elliekimpot","gravatar_id":"","url":"https://api.github.com/users/elliekimpot","avatar_url":"https://avatars.githubusercontent.com/u/3964764?"},"repo":{"id":28625867,"name":"elliekimpot/msm","url":"https://api.github.com/repos/elliekimpot/msm"},"payload":{"push_id":536753528,"size":7,"distinct_size":0,"ref":"refs/heads/base","head":"6393887f2296f3e7d7820ceefa0177003261ec68","before":"0011b847c3b6a0082306b3b29077bdc9550c6dda","commits":[{"sha":"8facc7f43ff2a8292656bf436f369b9455c1ab3a","author":{"email":"c6c610d4ed4672366596341ac49b62c9256ebf55@gmail.com","name":"Ellie"},"message":"pantech/debug: Drop PANTECH_PS_WIFI_COM_PREF_LOGGING\n\nSigned-off-by: Ellie <elliekimpot@gmail.com>","distinct":false,"url":"https://api.github.com/repos/elliekimpot/msm/commits/8facc7f43ff2a8292656bf436f369b9455c1ab3a"},{"sha":"9bfea860d1057c466a88f9a78bf28bf11b0fb221","author":{"email":"c6c610d4ed4672366596341ac49b62c9256ebf55@gmail.com","name":"Ellie"},"message":"pantech/debug: Drop PANTECH_SELINUX_DENIAL_LOG\n\nSigned-off-by: Ellie <elliekimpot@gmail.com>","distinct":false,"url":"https://api.github.com/repos/elliekimpot/msm/commits/9bfea860d1057c466a88f9a78bf28bf11b0fb221"},{"sha":"8ae5cba2d0c6e13cdbb3682fa7cc70960cd95246","author":{"email":"c6c610d4ed4672366596341ac49b62c9256ebf55@gmail.com","name":"Ellie"},"message":"pantech/debug: Drop PANTECH_MORE_DEBUGGING_INFO_ON_KERNEL\n\nSigned-off-by: Ellie <elliekimpot@gmail.com>","distinct":false,"url":"https://api.github.com/repos/elliekimpot/msm/commits/8ae5cba2d0c6e13cdbb3682fa7cc70960cd95246"},{"sha":"1fae68014e73cfc3a32fa5eca33505b011ebb7b4","author":{"email":"c6c610d4ed4672366596341ac49b62c9256ebf55@gmail.com","name":"Ellie"},"message":"Revert \"add basic CFLAGS for Krait\"\n\nThis reverts commit 
0011b847c3b6a0082306b3b29077bdc9550c6dda.","distinct":false,"url":"https://api.github.com/repos/elliekimpot/msm/commits/1fae68014e73cfc3a32fa5eca33505b011ebb7b4"},{"sha":"ff109d56f2b1b87aada770208ba471ef9d085a70","author":{"email":"c6c610d4ed4672366596341ac49b62c9256ebf55@gmail.com","name":"Ellie"},"message":"pantech/debug: Drop PANTECH_DEBUG\n\nDrop following features\n* PANTECH_DEBUG_ON\n* PANTECH_DEBUG\n* PANTECH_DEBUG_SCHED_LOG\n* PANTECH_DEBUG_IRQ_LOG\n* PANTECH_DEBUG_DCVS_LOG\n* PANTECH_DEBUG_RPM_LOG\n\nSigned-off-by: Ellie <elliekimpot@gmail.com>","distinct":false,"url":"https://api.github.com/repos/elliekimpot/msm/commits/ff109d56f2b1b87aada770208ba471ef9d085a70"},{"sha":"c3d59ecafe5fda8c6776139e45c6c76eecbf046d","author":{"email":"c6c610d4ed4672366596341ac49b62c9256ebf55@gmail.com","name":"Ellie"},"message":"pantech/debug: Drop PANTECH_FS_AUTO_REPAIR\n\nSigned-off-by: Ellie <elliekimpot@gmail.com>","distinct":false,"url":"https://api.github.com/repos/elliekimpot/msm/commits/c3d59ecafe5fda8c6776139e45c6c76eecbf046d"},{"sha":"6393887f2296f3e7d7820ceefa0177003261ec68","author":{"email":"c6c610d4ed4672366596341ac49b62c9256ebf55@gmail.com","name":"Ellie"},"message":"pantech/debug: Drop PANTECH_ERR_CRASH_LOGGING\n\nDrop PANTECH_ERR_CRASH_LOGGING and introduce PANTECH_SYS\ndue to proper build (Solve error/mipi_sony_incell.c).\n\nSigned-off-by: Ellie <elliekimpot@gmail.com>","distinct":false,"url":"https://api.github.com/repos/elliekimpot/msm/commits/6393887f2296f3e7d7820ceefa0177003261ec68"}]},"public":true,"created_at":"2015-01-01T01:07:05Z"}
{"id":"2489398830","type":"PushEvent","actor":{"id":4438295,"login":"ezzye","gravatar_id":"","url":"https://api.github.com/users/ezzye","avatar_url":"https://avatars.githubusercontent.com/u/4438295?"},"repo":{"id":28522532,"name":"ezzye/mean_example1","url":"https://api.github.com/repos/ezzye/mean_example1"},"payload":{"push_id":536753530,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"429b580df6f07fa1d998c1561bfe07ce99c2ab70","before":"71b3fb787d28aab581c80fa04e8330d0ea965c75","commits":[{"sha":"429b580df6f07fa1d998c1561bfe07ce99c2ab70","author":{"email":"60004a400d96d28036d21c59f517f0e3e3a6150f@gmail.com","name":"ezzye"},"message":"sort entires by dates","distinct":true,"url":"https://api.github.com/repos/ezzye/mean_example1/commits/429b580df6f07fa1d998c1561bfe07ce99c2ab70"}]},"public":true,"created_at":"2015-01-01T01:07:07Z"}
{"id":"2489398831","type":"PushEvent","actor":{"id":201997,"login":"gridaphobe","gravatar_id":"","url":"https://api.github.com/users/gridaphobe","avatar_url":"https://avatars.githubusercontent.com/u/201997?"},"repo":{"id":16334926,"name":"gridaphobe/target","url":"https://api.github.com/repos/gridaphobe/target"},"payload":{"push_id":536753531,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"25d0127dba9df025f3f7c927abf018118b072816","before":"7da2460eba860a739db8aa61898015081bb1f77c","commits":[{"sha":"25d0127dba9df025f3f7c927abf018118b072816","author":{"email":"7c47fb8c5e263626481b146af46f62cf5772922e@gmail.com","name":"Eric Seidel"},"message":"a bit more docs","distinct":true,"url":"https://api.github.com/repos/gridaphobe/target/commits/25d0127dba9df025f3f7c927abf018118b072816"}]},"public":true,"created_at":"2015-01-01T01:07:07Z"}
{"id":"2489398834","type":"PushEvent","actor":{"id":447569,"login":"tom-henderson","gravatar_id":"","url":"https://api.github.com/users/tom-henderson","avatar_url":"https://avatars.githubusercontent.com/u/447569?"},"repo":{"id":23275671,"name":"tom-henderson/django-template","url":"https://api.github.com/repos/tom-henderson/django-template"},"payload":{"push_id":536753533,"size":3,"distinct_size":3,"ref":"refs/heads/master","head":"8dc1ec4089bb639884f24fd4a5f7e7693099a5d9","before":"5e058c0e862a71ad83228c96c56bae766cbd8f4b","commits":[{"sha":"4ebf23c0aefef609187114e9a18b88b15ccac618","author":{"email":"06d851666d407f85c6c32c8197898614a9ec61fa@mac.com","name":"Tom Henderson"},"message":"Ignore .sqlite3 files.","distinct":true,"url":"https://api.github.com/repos/tom-henderson/django-template/commits/4ebf23c0aefef609187114e9a18b88b15ccac618"},{"sha":"8cd6c73216a0aa3d3377ed32827c3a9bf2b51c1c","author":{"email":"06d851666d407f85c6c32c8197898614a9ec61fa@mac.com","name":"Tom Henderson"},"message":"Support collectstatic.","distinct":true,"url":"https://api.github.com/repos/tom-henderson/django-template/commits/8cd6c73216a0aa3d3377ed32827c3a9bf2b51c1c"},{"sha":"8dc1ec4089bb639884f24fd4a5f7e7693099a5d9","author":{"email":"06d851666d407f85c6c32c8197898614a9ec61fa@mac.com","name":"Tom Henderson"},"message":"Define THIRD_PARTY_APPS separtely from LOCAL and CORE.","distinct":true,"url":"https://api.github.com/repos/tom-henderson/django-template/commits/8dc1ec4089bb639884f24fd4a5f7e7693099a5d9"}]},"public":true,"created_at":"2015-01-01T01:07:07Z"}
{"id":"2489398836","type":"PushEvent","actor":{"id":32421,"login":"damonallison","gravatar_id":"","url":"https://api.github.com/users/damonallison","avatar_url":"https://avatars.githubusercontent.com/u/32421?"},"repo":{"id":28276966,"name":"damonallison/git-test","url":"https://api.github.com/repos/damonallison/git-test"},"payload":{"push_id":536753535,"size":4,"distinct_size":0,"ref":"refs/heads/master","head":"3e58f93effeb21baf088c66ac7ba4db6565f832e","before":"a0241b998058d49fe5ec6b1732d32f4269d4de30","commits":[{"sha":"0cd38185bffd3af3513d0763ced55fb8916f6072","author":{"email":"a836250b7333a571ccf7c31c8a50a83778615420@code42.com","name":"Damon Allison"},"message":"damon","distinct":false,"url":"https://api.github.com/repos/damonallison/git-test/commits/0cd38185bffd3af3513d0763ced55fb8916f6072"},{"sha":"eb2b6231b59cda41629ce12b4750d55e5946b6d5","author":{"email":"a836250b7333a571ccf7c31c8a50a83778615420@code42.com","name":"Damon Allison"},"message":"more on damon2","distinct":false,"url":"https://api.github.com/repos/damonallison/git-test/commits/eb2b6231b59cda41629ce12b4750d55e5946b6d5"},{"sha":"df69472afe16ac49d94618598ae40f9bde0b50b9","author":{"email":"a836250b7333a571ccf7c31c8a50a83778615420@code42.com","name":"Damon Allison"},"message":"more(2) on damon2","distinct":false,"url":"https://api.github.com/repos/damonallison/git-test/commits/df69472afe16ac49d94618598ae40f9bde0b50b9"},{"sha":"3e58f93effeb21baf088c66ac7ba4db6565f832e","author":{"email":"a836250b7333a571ccf7c31c8a50a83778615420@code42.com","name":"Damon Allison"},"message":"Merge branch 'master' into damon2","distinct":false,"url":"https://api.github.com/repos/damonallison/git-test/commits/3e58f93effeb21baf088c66ac7ba4db6565f832e"}]},"public":true,"created_at":"2015-01-01T01:07:07Z"}
{"id":"2489398837","type":"PushEvent","actor":{"id":10144074,"login":"carodew","gravatar_id":"","url":"https://api.github.com/users/carodew","avatar_url":"https://avatars.githubusercontent.com/u/10144074?"},"repo":{"id":27844858,"name":"carodew/carodew.github.io","url":"https://api.github.com/repos/carodew/carodew.github.io"},"payload":{"push_id":536753536,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"01e87433331ac75e4e42724f13368f9178b3a44e","before":"62bd3e248d57b48720930200d73b4273993a2e66","commits":[{"sha":"01e87433331ac75e4e42724f13368f9178b3a44e","author":{"email":"6e3c6f0214740e9061d9ca5c79eb6e0ff9cc1741@unknown542696dd77af.gateway.pace.com","name":"Carolyn"},"message":"update h2 styles on homepage","distinct":true,"url":"https://api.github.com/repos/carodew/carodew.github.io/commits/01e87433331ac75e4e42724f13368f9178b3a44e"}]},"public":true,"created_at":"2015-01-01T01:07:07Z"}
{"id":"2489398838","type":"WatchEvent","actor":{"id":4433943,"login":"jkrmr","gravatar_id":"","url":"https://api.github.com/users/jkrmr","avatar_url":"https://avatars.githubusercontent.com/u/4433943?"},"repo":{"id":19797857,"name":"rsense/rsense","url":"https://api.github.com/repos/rsense/rsense"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:07:07Z","org":{"id":7576243,"login":"rsense","gravatar_id":"","url":"https://api.github.com/orgs/rsense","avatar_url":"https://avatars.githubusercontent.com/u/7576243?"}}
{"id":"2489398840","type":"CreateEvent","actor":{"id":932999,"login":"loyos","gravatar_id":"","url":"https://api.github.com/users/loyos","avatar_url":"https://avatars.githubusercontent.com/u/932999?"},"repo":{"id":28678289,"name":"loyos/cemento","url":"https://api.github.com/repos/loyos/cemento"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:07:08Z"}
{"id":"2489398845","type":"CreateEvent","actor":{"id":2357415,"login":"neeleshbagga","gravatar_id":"","url":"https://api.github.com/users/neeleshbagga","avatar_url":"https://avatars.githubusercontent.com/u/2357415?"},"repo":{"id":28678288,"name":"neeleshbagga/CS2110QA","url":"https://api.github.com/repos/neeleshbagga/CS2110QA"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"An interactive Q&A tool built in Java","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:07:09Z"}
{"id":"2489398851","type":"IssueCommentEvent","actor":{"id":5404873,"login":"RuslanIsrafilov","gravatar_id":"","url":"https://api.github.com/users/RuslanIsrafilov","avatar_url":"https://avatars.githubusercontent.com/u/5404873?"},"repo":{"id":24333720,"name":"antonlarin/aNiMated-batman","url":"https://api.github.com/repos/antonlarin/aNiMated-batman"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/antonlarin/aNiMated-batman/issues/41","labels_url":"https://api.github.com/repos/antonlarin/aNiMated-batman/issues/41/labels{/name}","comments_url":"https://api.github.com/repos/antonlarin/aNiMated-batman/issues/41/comments","events_url":"https://api.github.com/repos/antonlarin/aNiMated-batman/issues/41/events","html_url":"https://github.com/antonlarin/aNiMated-batman/issues/41","id":53209423,"number":41,"title":"Не работает изменение режима счёта (все слои/счёт на установление)","user":{"login":"RuslanIsrafilov","id":5404873,"avatar_url":"https://avatars.githubusercontent.com/u/5404873?v=3","gravatar_id":"","url":"https://api.github.com/users/RuslanIsrafilov","html_url":"https://github.com/RuslanIsrafilov","followers_url":"https://api.github.com/users/RuslanIsrafilov/followers","following_url":"https://api.github.com/users/RuslanIsrafilov/following{/other_user}","gists_url":"https://api.github.com/users/RuslanIsrafilov/gists{/gist_id}","starred_url":"https://api.github.com/users/RuslanIsrafilov/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/RuslanIsrafilov/subscriptions","organizations_url":"https://api.github.com/users/RuslanIsrafilov/orgs","repos_url":"https://api.github.com/users/RuslanIsrafilov/repos","events_url":"https://api.github.com/users/RuslanIsrafilov/events{/privacy}","received_events_url":"https://api.github.com/users/RuslanIsrafilov/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/antonlarin/aNiMated-batman/labels/Bug","name":"Bug","color":"eb6420"}],"state
":"open","locked":false,"assignee":{"login":"antonlarin","id":1180097,"avatar_url":"https://avatars.githubusercontent.com/u/1180097?v=3","gravatar_id":"","url":"https://api.github.com/users/antonlarin","html_url":"https://github.com/antonlarin","followers_url":"https://api.github.com/users/antonlarin/followers","following_url":"https://api.github.com/users/antonlarin/following{/other_user}","gists_url":"https://api.github.com/users/antonlarin/gists{/gist_id}","starred_url":"https://api.github.com/users/antonlarin/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/antonlarin/subscriptions","organizations_url":"https://api.github.com/users/antonlarin/orgs","repos_url":"https://api.github.com/users/antonlarin/repos","events_url":"https://api.github.com/users/antonlarin/events{/privacy}","received_events_url":"https://api.github.com/users/antonlarin/received_events","type":"User","site_admin":false},"milestone":null,"comments":1,"created_at":"2015-01-01T00:19:34Z","updated_at":"2015-01-01T01:07:10Z","closed_at":null,"body":"Проблема следующая.\r\nПри выбранной явной схеме нажимаю \"Вычисление всех слоёв\", \"Счёт на установление\" - работает всё как надо. 
Потом выбираю неявную схему и запускаю тоже самое, в результате работает либо \"Вычисление всех слоёв\" либо \"Счёт на установление\", в независимости от нажатой кнопки."},"comment":{"url":"https://api.github.com/repos/antonlarin/aNiMated-batman/issues/comments/68477373","html_url":"https://github.com/antonlarin/aNiMated-batman/issues/41#issuecomment-68477373","issue_url":"https://api.github.com/repos/antonlarin/aNiMated-batman/issues/41","id":68477373,"user":{"login":"RuslanIsrafilov","id":5404873,"avatar_url":"https://avatars.githubusercontent.com/u/5404873?v=3","gravatar_id":"","url":"https://api.github.com/users/RuslanIsrafilov","html_url":"https://github.com/RuslanIsrafilov","followers_url":"https://api.github.com/users/RuslanIsrafilov/followers","following_url":"https://api.github.com/users/RuslanIsrafilov/following{/other_user}","gists_url":"https://api.github.com/users/RuslanIsrafilov/gists{/gist_id}","starred_url":"https://api.github.com/users/RuslanIsrafilov/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/RuslanIsrafilov/subscriptions","organizations_url":"https://api.github.com/users/RuslanIsrafilov/orgs","repos_url":"https://api.github.com/users/RuslanIsrafilov/repos","events_url":"https://api.github.com/users/RuslanIsrafilov/events{/privacy}","received_events_url":"https://api.github.com/users/RuslanIsrafilov/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:07:10Z","updated_at":"2015-01-01T01:07:10Z","body":"Сам нашёл, сам пофиксил - всё правильно."}},"public":true,"created_at":"2015-01-01T01:07:10Z"}
{"id":"2489398852","type":"PushEvent","actor":{"id":109048,"login":"bestian","gravatar_id":"","url":"https://api.github.com/users/bestian","avatar_url":"https://avatars.githubusercontent.com/u/109048?"},"repo":{"id":27702247,"name":"g0v/goban","url":"https://api.github.com/repos/g0v/goban"},"payload":{"push_id":536753540,"size":1,"distinct_size":1,"ref":"refs/heads/gh-pages","head":"7ced4bb306188a4505e541d1f9d198116bf1f7e6","before":"42001fdc8ab4af516c60229fbacffa082215f195","commits":[{"sha":"7ced4bb306188a4505e541d1f9d198116bf1f7e6","author":{"email":"295c90327d3df30c5845123db2f48facf2356138@gmail.com","name":"Bestian Tang"},"message":"responsive init & sass partialized init","distinct":true,"url":"https://api.github.com/repos/g0v/goban/commits/7ced4bb306188a4505e541d1f9d198116bf1f7e6"}]},"public":true,"created_at":"2015-01-01T01:07:10Z","org":{"id":2668086,"login":"g0v","gravatar_id":"","url":"https://api.github.com/orgs/g0v","avatar_url":"https://avatars.githubusercontent.com/u/2668086?"}}
{"id":"2489398855","type":"CreateEvent","actor":{"id":4193711,"login":"CorruptingAcid","gravatar_id":"","url":"https://api.github.com/users/CorruptingAcid","avatar_url":"https://avatars.githubusercontent.com/u/4193711?"},"repo":{"id":28678290,"name":"CorruptingAcid/UltimatePnP","url":"https://api.github.com/repos/CorruptingAcid/UltimatePnP"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"Table top RPG assistant","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:07:13Z"}
{"id":"2489398859","type":"PushEvent","actor":{"id":458272,"login":"tomalexander","gravatar_id":"","url":"https://api.github.com/users/tomalexander","avatar_url":"https://avatars.githubusercontent.com/u/458272?"},"repo":{"id":28367645,"name":"tomalexander/basic_multi_bot","url":"https://api.github.com/repos/tomalexander/basic_multi_bot"},"payload":{"push_id":536753541,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b67d4bddd9a6134aae5378deedb1e311410fff75","before":"bcc7dd7ee5550ef6d71e14b4d4c587477f71a3dc","commits":[{"sha":"b67d4bddd9a6134aae5378deedb1e311410fff75","author":{"email":"a09a620e88c0ebee24434030b77c3b58d8242b71@gmail.com","name":"Tom Alexander"},"message":"restricting echo delegate to rooms","distinct":true,"url":"https://api.github.com/repos/tomalexander/basic_multi_bot/commits/b67d4bddd9a6134aae5378deedb1e311410fff75"}]},"public":true,"created_at":"2015-01-01T01:07:13Z"}
{"id":"2489398860","type":"PushEvent","actor":{"id":2581100,"login":"shy2850","gravatar_id":"","url":"https://api.github.com/users/shy2850","avatar_url":"https://avatars.githubusercontent.com/u/2581100?"},"repo":{"id":27001976,"name":"shy2850/wfQuery","url":"https://api.github.com/repos/shy2850/wfQuery"},"payload":{"push_id":536753542,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"31332f6a51d87ff80d88c3c6efe2a444ce052401","before":"92b2fb9133de9d3f6a2dca59cb19a7f27af4d70b","commits":[{"sha":"31332f6a51d87ff80d88c3c6efe2a444ce052401","author":{"email":"ebf030c1b185fb81f6efcfbca2fa8563b9c94d00@163.com","name":"shy2850"},"message":"变量名错误","distinct":true,"url":"https://api.github.com/repos/shy2850/wfQuery/commits/31332f6a51d87ff80d88c3c6efe2a444ce052401"}]},"public":true,"created_at":"2015-01-01T01:07:13Z"}
{"id":"2489398861","type":"CreateEvent","actor":{"id":1283090,"login":"crablar","gravatar_id":"","url":"https://api.github.com/users/crablar","avatar_url":"https://avatars.githubusercontent.com/u/1283090?"},"repo":{"id":28651964,"name":"crablar/betwork","url":"https://api.github.com/repos/crablar/betwork"},"payload":{"ref":"prototype_1.0","ref_type":"branch","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:07:13Z"}
{"id":"2489398863","type":"PushEvent","actor":{"id":2829718,"login":"phister","gravatar_id":"","url":"https://api.github.com/users/phister","avatar_url":"https://avatars.githubusercontent.com/u/2829718?"},"repo":{"id":28678276,"name":"phister/CollegeFootballPlayoff","url":"https://api.github.com/repos/phister/CollegeFootballPlayoff"},"payload":{"push_id":536753545,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"d7a35a79bb69f3b7af0ac8853378c2dfe1461a2a","before":"34349317ec4f9b2f261e99f17d81805200fc683e","commits":[{"sha":"d7a35a79bb69f3b7af0ac8853378c2dfe1461a2a","author":{"email":"370890631c3d0bc00dab48c12621618666e9b595@gmail.com","name":"phister"},"message":"Create README.md","distinct":true,"url":"https://api.github.com/repos/phister/CollegeFootballPlayoff/commits/d7a35a79bb69f3b7af0ac8853378c2dfe1461a2a"}]},"public":true,"created_at":"2015-01-01T01:07:13Z"}
{"id":"2489398869","type":"PushEvent","actor":{"id":1879074,"login":"harrisonchu","gravatar_id":"","url":"https://api.github.com/users/harrisonchu","avatar_url":"https://avatars.githubusercontent.com/u/1879074?"},"repo":{"id":28490067,"name":"harrisonchu/loan-prediction","url":"https://api.github.com/repos/harrisonchu/loan-prediction"},"payload":{"push_id":536753548,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"5a4515521d2d84d8a8001c13aa237b2f8a6b62ad","before":"9955146fc381664d8875645f3742e51040b460e2","commits":[{"sha":"5a4515521d2d84d8a8001c13aa237b2f8a6b62ad","author":{"email":"b04e62e2ee017ce4cef87d37556bac84d980acce@gmail.com","name":"harrisonchu"},"message":"Ignore loans that are 16-30 days late","distinct":true,"url":"https://api.github.com/repos/harrisonchu/loan-prediction/commits/5a4515521d2d84d8a8001c13aa237b2f8a6b62ad"}]},"public":true,"created_at":"2015-01-01T01:07:14Z"}
{"id":"2489398870","type":"PushEvent","actor":{"id":778342,"login":"TimSimpson","gravatar_id":"","url":"https://api.github.com/users/TimSimpson","avatar_url":"https://avatars.githubusercontent.com/u/778342?"},"repo":{"id":1989449,"name":"TimSimpson/Macaroni","url":"https://api.github.com/repos/TimSimpson/Macaroni"},"payload":{"push_id":536753549,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"7317b25b23c37d9c1bb106562a0dd4735dbca7ec","before":"373f2f8ebc0df3720c559ccbd9b331f567a069d2","commits":[{"sha":"7317b25b23c37d9c1bb106562a0dd4735dbca7ec","author":{"email":"feea1c853491a2fddb2990fb677e02f9e81b17e1@gmail.com","name":"Tim Simpson"},"message":"Fixes bug with default arguments introduced last commit\n\nDidn't see this until I had to build Macaroni. I guess no Next tests\nexpose this feature? :|","distinct":true,"url":"https://api.github.com/repos/TimSimpson/Macaroni/commits/7317b25b23c37d9c1bb106562a0dd4735dbca7ec"}]},"public":true,"created_at":"2015-01-01T01:07:14Z"}
{"id":"2489398874","type":"PushEvent","actor":{"id":5270855,"login":"eldu","gravatar_id":"","url":"https://api.github.com/users/eldu","avatar_url":"https://avatars.githubusercontent.com/u/5270855?"},"repo":{"id":28463663,"name":"eldu/eldu.github.io","url":"https://api.github.com/repos/eldu/eldu.github.io"},"payload":{"push_id":536753553,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"2f689d094f352e88e819fd13f457641c86656d6a","before":"cb4809d26eb05e24e47320cc3ad5e9f632cf2e80","commits":[{"sha":"2f689d094f352e88e819fd13f457641c86656d6a","author":{"email":"fd52f7af8af1b4e2d32bf7ccd950e86bb247229e@seas.upenn.edu","name":"Ellen Duong"},"message":"front page cover no scroll","distinct":true,"url":"https://api.github.com/repos/eldu/eldu.github.io/commits/2f689d094f352e88e819fd13f457641c86656d6a"}]},"public":true,"created_at":"2015-01-01T01:07:14Z"}
{"id":"2489398876","type":"PushEvent","actor":{"id":5240798,"login":"hxwang","gravatar_id":"","url":"https://api.github.com/users/hxwang","avatar_url":"https://avatars.githubusercontent.com/u/5240798?"},"repo":{"id":20258812,"name":"hxwang/Leetcode","url":"https://api.github.com/repos/hxwang/Leetcode"},"payload":{"push_id":536753555,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"7c1a0709545f66143c404db812f52c94af769564","before":"628e4f129b5723f944d1a7887509c737762b2821","commits":[{"sha":"7c1a0709545f66143c404db812f52c94af769564","author":{"email":"320cb2ff8e2e195f7d4e5cd3b27b690e919d61e5@gmail.com","name":"Huangxin"},"message":"Update toDiscuss.md","distinct":true,"url":"https://api.github.com/repos/hxwang/Leetcode/commits/7c1a0709545f66143c404db812f52c94af769564"}]},"public":true,"created_at":"2015-01-01T01:07:15Z"}
{"id":"2489398877","type":"PushEvent","actor":{"id":532414,"login":"piranna","gravatar_id":"","url":"https://api.github.com/users/piranna","avatar_url":"https://avatars.githubusercontent.com/u/532414?"},"repo":{"id":11572519,"name":"NodeOS/NodeOS","url":"https://api.github.com/repos/NodeOS/NodeOS"},"payload":{"push_id":536753554,"size":1,"distinct_size":1,"ref":"refs/heads/cross-compiler-musl","head":"59f050d7225d702ab8d2f7aed19a1a3459603c5f","before":"72df1b3e62fc8ee59c984b5587800a587aebc1fd","commits":[{"sha":"59f050d7225d702ab8d2f7aed19a1a3459603c5f","author":{"email":"fe61b926b190bf24488e9bedf4bfb97c0e528d9b@gmail.com","name":"Jesús Leganés Combarro \"piranna"},"message":"Clean-up of cross-toolchain installer","distinct":true,"url":"https://api.github.com/repos/NodeOS/NodeOS/commits/59f050d7225d702ab8d2f7aed19a1a3459603c5f"}]},"public":true,"created_at":"2015-01-01T01:07:15Z","org":{"id":5056162,"login":"NodeOS","gravatar_id":"","url":"https://api.github.com/orgs/NodeOS","avatar_url":"https://avatars.githubusercontent.com/u/5056162?"}}
{"id":"2489398880","type":"WatchEvent","actor":{"id":170299,"login":"MatthewMueller","gravatar_id":"","url":"https://api.github.com/users/MatthewMueller","avatar_url":"https://avatars.githubusercontent.com/u/170299?"},"repo":{"id":10697613,"name":"Netflix/ice","url":"https://api.github.com/repos/Netflix/ice"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:07:15Z","org":{"id":913567,"login":"Netflix","gravatar_id":"","url":"https://api.github.com/orgs/Netflix","avatar_url":"https://avatars.githubusercontent.com/u/913567?"}}
{"id":"2489398882","type":"CreateEvent","actor":{"id":6781905,"login":"pw5a29","gravatar_id":"","url":"https://api.github.com/users/pw5a29","avatar_url":"https://avatars.githubusercontent.com/u/6781905?"},"repo":{"id":28678291,"name":"pw5a29/rawbatt","url":"https://api.github.com/repos/pw5a29/rawbatt"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:07:15Z"}
{"id":"2489398883","type":"IssueCommentEvent","actor":{"id":6903751,"login":"bkenobi","gravatar_id":"","url":"https://api.github.com/users/bkenobi","avatar_url":"https://avatars.githubusercontent.com/u/6903751?"},"repo":{"id":17072697,"name":"genielabs/HomeGenie","url":"https://api.github.com/repos/genielabs/HomeGenie"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/genielabs/HomeGenie/issues/80","labels_url":"https://api.github.com/repos/genielabs/HomeGenie/issues/80/labels{/name}","comments_url":"https://api.github.com/repos/genielabs/HomeGenie/issues/80/comments","events_url":"https://api.github.com/repos/genielabs/HomeGenie/issues/80/events","html_url":"https://github.com/genielabs/HomeGenie/issues/80","id":52930124,"number":80,"title":"Scripts (C# at least) produce unpredictable results due to run order","user":{"login":"bkenobi","id":6903751,"avatar_url":"https://avatars.githubusercontent.com/u/6903751?v=3","gravatar_id":"","url":"https://api.github.com/users/bkenobi","html_url":"https://github.com/bkenobi","followers_url":"https://api.github.com/users/bkenobi/followers","following_url":"https://api.github.com/users/bkenobi/following{/other_user}","gists_url":"https://api.github.com/users/bkenobi/gists{/gist_id}","starred_url":"https://api.github.com/users/bkenobi/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/bkenobi/subscriptions","organizations_url":"https://api.github.com/users/bkenobi/orgs","repos_url":"https://api.github.com/users/bkenobi/repos","events_url":"https://api.github.com/users/bkenobi/events{/privacy}","received_events_url":"https://api.github.com/users/bkenobi/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2014-12-26T16:14:46Z","updated_at":"2015-01-01T01:07:15Z","closed_at":null,"body":"I have several programs that rely on each other.  
One of these (LastEvent) watches for events using the When.ModuleParameterIsChanging event and keeps several new parameters up to date (LastEvent, LastEventUpdateTime, LastOn, LastOnUpdateTime, LastOff, LastOffUpdateTime).  If the other scripts that rely on the LastEvent module run first, everything works correctly.  If the LastEvent module runs first, I run into problems with what exactly the values of these new parameters will be.\r\n\r\nI believe (but cannot confirm) that the execution order is based on the programID.  This was working acceptably until I had to replace my main code with a new instance during testing.  When this happened, the programID of the main code shifted from 1001 to 1016.  Since the LastEvent module reamained 1004, I believe this would cause it to execute prior to 1016.\r\n\r\nThere are 2 solutions I have come up with.\r\n1)  Provide some means to control the order that programs are executed.\r\n2)  Build these new parameter values (or equivalent) into the core HG code.\r\n\r\nExecution order could be something simple like a priority field where the user selects 1-5 which would then give a programID of the next available 1000, 2000, 3000, etc.  Or, something within the code itself specifying a priority.  Or, maybe allow the user to reorder the scripts in the interface and that order is the order of execution of the user codes.  
I personally would think something that combines these would be best.\r\n\r\nI don't know how often this issue would occur, so I don't know how much effort is needed to correct it."},"comment":{"url":"https://api.github.com/repos/genielabs/HomeGenie/issues/comments/68477374","html_url":"https://github.com/genielabs/HomeGenie/issues/80#issuecomment-68477374","issue_url":"https://api.github.com/repos/genielabs/HomeGenie/issues/80","id":68477374,"user":{"login":"bkenobi","id":6903751,"avatar_url":"https://avatars.githubusercontent.com/u/6903751?v=3","gravatar_id":"","url":"https://api.github.com/users/bkenobi","html_url":"https://github.com/bkenobi","followers_url":"https://api.github.com/users/bkenobi/followers","following_url":"https://api.github.com/users/bkenobi/following{/other_user}","gists_url":"https://api.github.com/users/bkenobi/gists{/gist_id}","starred_url":"https://api.github.com/users/bkenobi/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/bkenobi/subscriptions","organizations_url":"https://api.github.com/users/bkenobi/orgs","repos_url":"https://api.github.com/users/bkenobi/repos","events_url":"https://api.github.com/users/bkenobi/events{/privacy}","received_events_url":"https://api.github.com/users/bkenobi/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:07:15Z","updated_at":"2015-01-01T01:07:15Z","body":"This might work, I'll have to try.  I'm still concerned about the potentially large delay in response due to each pause command.  Even if the modifications I make don't make it into the main code, it would be nice to understand why my code isn't working.\r\n\r\nhttp://www.homegenie.it/forum/index.php?topic=575.0"}},"public":true,"created_at":"2015-01-01T01:07:15Z"}
{"id":"2489398884","type":"PushEvent","actor":{"id":280212,"login":"KenanSulayman","gravatar_id":"","url":"https://api.github.com/users/KenanSulayman","avatar_url":"https://avatars.githubusercontent.com/u/280212?"},"repo":{"id":21481110,"name":"KenanSulayman/heartbeat","url":"https://api.github.com/repos/KenanSulayman/heartbeat"},"payload":{"push_id":536753557,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"fdc821da59a881d40eea62001b4af4cbc2c1e232","before":"cf281dd3839c3e07ed867a2eb77aa4965a2a1400","commits":[{"sha":"fdc821da59a881d40eea62001b4af4cbc2c1e232","author":{"email":"9176253dfc0bc82671a5e984646605f93319147a@sly.mn","name":"Kenan Sulayman"},"message":"1420074434565\n\nZsR8phvzSvI+8KOpooE0RB0FXC78yt7CZDcUB+WKRnQ=","distinct":true,"url":"https://api.github.com/repos/KenanSulayman/heartbeat/commits/fdc821da59a881d40eea62001b4af4cbc2c1e232"}]},"public":true,"created_at":"2015-01-01T01:07:16Z"}
{"id":"2489398891","type":"IssuesEvent","actor":{"id":9265995,"login":"remlei","gravatar_id":"","url":"https://api.github.com/users/remlei","avatar_url":"https://avatars.githubusercontent.com/u/9265995?"},"repo":{"id":22003267,"name":"tarampampam/nod32-update-mirror","url":"https://api.github.com/repos/tarampampam/nod32-update-mirror"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/tarampampam/nod32-update-mirror/issues/14","labels_url":"https://api.github.com/repos/tarampampam/nod32-update-mirror/issues/14/labels{/name}","comments_url":"https://api.github.com/repos/tarampampam/nod32-update-mirror/issues/14/comments","events_url":"https://api.github.com/repos/tarampampam/nod32-update-mirror/issues/14/events","html_url":"https://github.com/tarampampam/nod32-update-mirror/issues/14","id":53210304,"number":14,"title":"Needs further improvements.","user":{"login":"remlei","id":9265995,"avatar_url":"https://avatars.githubusercontent.com/u/9265995?v=3","gravatar_id":"","url":"https://api.github.com/users/remlei","html_url":"https://github.com/remlei","followers_url":"https://api.github.com/users/remlei/followers","following_url":"https://api.github.com/users/remlei/following{/other_user}","gists_url":"https://api.github.com/users/remlei/gists{/gist_id}","starred_url":"https://api.github.com/users/remlei/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/remlei/subscriptions","organizations_url":"https://api.github.com/users/remlei/orgs","repos_url":"https://api.github.com/users/remlei/repos","events_url":"https://api.github.com/users/remlei/events{/privacy}","received_events_url":"https://api.github.com/users/remlei/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:07:17Z","updated_at":"2015-01-01T01:07:17Z","closed_at":null,"body":"There's no issue on the script and it works but it downloads a lot of junk 
in process and it waste CPU cycle at start parsing the update.ver (taking it a while to process the update to download) this also it needs to improve the following:\r\n\r\n- able to select what type of product to cache the updates (eg, Antivirus or Smart Security)\r\n- able to bypass other language packs (we are downloading about 1gigs of junk versus a 120mb of important files)\r\n- learn to use sed to parse and check the if the file currently downloaded is updated or not. Instead of parsing the update.ver before downloads. It can check the version on the fly by checking the \"versionid=\" on the nup files and one from update.ver; if didnt match then it downloads.\r\n\r\nAll of those issues are not present using this script from a russian forum: http://wl500g.info/showthread.php?7877-NOD32-update-server . It runs in every linux flavor as long as you had the depencies installed (sed, unrar, touch-coreutils)\r\n\r\nIt does do the job and with minor editing on the main script file to accept downloads on v6,v7 and v8 eset products."}},"public":true,"created_at":"2015-01-01T01:07:18Z"}
{"id":"2489398892","type":"IssueCommentEvent","actor":{"id":1235097,"login":"rmarinho","gravatar_id":"","url":"https://api.github.com/users/rmarinho","avatar_url":"https://avatars.githubusercontent.com/u/1235097?"},"repo":{"id":20463939,"name":"XLabs/Xamarin-Forms-Labs","url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/545","labels_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/545/labels{/name}","comments_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/545/comments","events_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/545/events","html_url":"https://github.com/XLabs/Xamarin-Forms-Labs/issues/545","id":53205036,"number":545,"title":"ContentPresenter view","user":{"login":"onovotny","id":1427284,"avatar_url":"https://avatars.githubusercontent.com/u/1427284?v=3","gravatar_id":"","url":"https://api.github.com/users/onovotny","html_url":"https://github.com/onovotny","followers_url":"https://api.github.com/users/onovotny/followers","following_url":"https://api.github.com/users/onovotny/following{/other_user}","gists_url":"https://api.github.com/users/onovotny/gists{/gist_id}","starred_url":"https://api.github.com/users/onovotny/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/onovotny/subscriptions","organizations_url":"https://api.github.com/users/onovotny/orgs","repos_url":"https://api.github.com/users/onovotny/repos","events_url":"https://api.github.com/users/onovotny/events{/privacy}","received_events_url":"https://api.github.com/users/onovotny/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":2,"created_at":"2014-12-31T21:48:29Z","updated_at":"2015-01-01T01:07:17Z","closed_at":null,"body":"I've blogged about it 
[here](http://blog.novotny.org/2014/12/31/contentpresenter-for-xamarin-forms/) but I'd be happy to submit a PR with this.\r\n\r\nThoughts, interest?"},"comment":{"url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/comments/68477375","html_url":"https://github.com/XLabs/Xamarin-Forms-Labs/issues/545#issuecomment-68477375","issue_url":"https://api.github.com/repos/XLabs/Xamarin-Forms-Labs/issues/545","id":68477375,"user":{"login":"rmarinho","id":1235097,"avatar_url":"https://avatars.githubusercontent.com/u/1235097?v=3","gravatar_id":"","url":"https://api.github.com/users/rmarinho","html_url":"https://github.com/rmarinho","followers_url":"https://api.github.com/users/rmarinho/followers","following_url":"https://api.github.com/users/rmarinho/following{/other_user}","gists_url":"https://api.github.com/users/rmarinho/gists{/gist_id}","starred_url":"https://api.github.com/users/rmarinho/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/rmarinho/subscriptions","organizations_url":"https://api.github.com/users/rmarinho/orgs","repos_url":"https://api.github.com/users/rmarinho/repos","events_url":"https://api.github.com/users/rmarinho/events{/privacy}","received_events_url":"https://api.github.com/users/rmarinho/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:07:17Z","updated_at":"2015-01-01T01:07:17Z","body":"Yes i use your aproach and a PR of it will be welcome :) "}},"public":true,"created_at":"2015-01-01T01:07:18Z","org":{"id":7787062,"login":"XLabs","gravatar_id":"","url":"https://api.github.com/orgs/XLabs","avatar_url":"https://avatars.githubusercontent.com/u/7787062?"}}
{"id":"2489398894","type":"GollumEvent","actor":{"id":226687,"login":"cfalguiere","gravatar_id":"","url":"https://api.github.com/users/cfalguiere","avatar_url":"https://avatars.githubusercontent.com/u/226687?"},"repo":{"id":28568493,"name":"cfalguiere/BrickInventory","url":"https://api.github.com/repos/cfalguiere/BrickInventory"},"payload":{"pages":[{"page_name":"LeMakingOf J2#01 Objectif","title":"LeMakingOf J2#01 Objectif","summary":null,"action":"created","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2301-Objectif"},{"page_name":"LeMakingOf J2#02 Design","title":"LeMakingOf J2#02 Design","summary":null,"action":"created","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2302-Design"},{"page_name":"LeMakingOf J2#03 Refactoring","title":"LeMakingOf J2#03 Refactoring","summary":null,"action":"created","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2303-Refactoring"},{"page_name":"LeMakingOf J2#04 Première factory","title":"LeMakingOf J2#04 Première factory","summary":null,"action":"created","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2304-Premi%C3%A8re-factory"},{"page_name":"LeMakingOf J2#05 Tests unitaires","title":"LeMakingOf J2#05 Tests unitaires","summary":null,"action":"created","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2305-Tests-unitaires"},{"page_name":"LeMakingOf J2#06 Retour des tests unitaires","title":"LeMakingOf J2#06 Retour des tests unitaires","summary":null,"action":"created","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2306-Retour-des-tests-unitaires"},{"page_name":"LeMakingOf 
J2#07 Retour du retour des tests unitaires","title":"LeMakingOf J2#07 Retour du retour des tests unitaires","summary":null,"action":"created","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2307-Retour-du-retour-des-tests-unitaires"},{"page_name":"LeMakingOf J2#08 Test Reloaded","title":"LeMakingOf J2#08 Test Reloaded","summary":null,"action":"created","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2308-Test-Reloaded"},{"page_name":"LeMakingOf J2#10 Les formes","title":"LeMakingOf J2#10 Les formes","summary":null,"action":"created","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2310-Les-formes"},{"page_name":"LeMakingOf J2#11 Ajout de la colonne","title":"LeMakingOf J2#11 Ajout de la colonne","summary":null,"action":"created","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2311-Ajout-de-la-colonne"},{"page_name":"LeMakingOf J2#12 Le filtre","title":"LeMakingOf J2#12 Le filtre","summary":null,"action":"created","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2312-Le-filtre"},{"page_name":"LeMakingOf J2#13 Premier service","title":"LeMakingOf J2#13 Premier service","summary":null,"action":"created","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2313-Premier-service"},{"page_name":"LeMakingOf J2#14 Intégration","title":"LeMakingOf J2#14 Intégration","summary":null,"action":"created","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2314-Int%C3%A9gration"},{"page_name":"LeMakingOf J2#15 Les couleurs","title":"LeMakingOf J2#15 Les 
couleurs","summary":null,"action":"created","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2315-Les-couleurs"},{"page_name":"LeMakingOf J2#16 Le bilan","title":"LeMakingOf J2#16 Le bilan","summary":null,"action":"created","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2316-Le-bilan"},{"page_name":"LeMakingOf J1#12 Les modules","title":"LeMakingOf J1#12 Les modules","summary":null,"action":"edited","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J1%2312-Les-modules"},{"page_name":"LeMakingOf J1#14 Le controller","title":"LeMakingOf J1#14 Le controller","summary":null,"action":"edited","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J1%2314-Le-controller"},{"page_name":"LeMakingOf J1#19 Le bilan","title":"LeMakingOf J1#19 Le bilan","summary":null,"action":"edited","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J1%2319-Le-bilan"},{"page_name":"LeMakingOf J2#09 Test de la factory","title":"LeMakingOf J2#09 Test de la factory","summary":null,"action":"edited","sha":"078a1257c89da10fdb31de9b29bf48494d761c83","html_url":"https://github.com/cfalguiere/BrickInventory/wiki/LeMakingOf-J2%2309-Test-de-la-factory"}]},"public":true,"created_at":"2015-01-01T01:07:18Z"}
{"id":"2489398895","type":"PushEvent","actor":{"id":4644601,"login":"GLolol","gravatar_id":"","url":"https://api.github.com/users/GLolol","avatar_url":"https://avatars.githubusercontent.com/u/4644601?"},"repo":{"id":28604112,"name":"GLolol/Crackbot","url":"https://api.github.com/repos/GLolol/Crackbot"},"payload":{"push_id":536753559,"size":1,"distinct_size":1,"ref":"refs/heads/devel","head":"f5b144c834362b41505427167aff8d4b98fa657e","before":"d34e47b3932ca6ee93229c59e5a4c7bcf7acf5be","commits":[{"sha":"f5b144c834362b41505427167aff8d4b98fa657e","author":{"email":"1d63ba34440ccf4049662a35916618df27a8f853@overdrive.pw","name":"GLolol"},"message":"commands.lua: bugfix (\"./help\" without arguments should call \"./help help\")","distinct":true,"url":"https://api.github.com/repos/GLolol/Crackbot/commits/f5b144c834362b41505427167aff8d4b98fa657e"}]},"public":true,"created_at":"2015-01-01T01:07:18Z"}
{"id":"2489398897","type":"PushEvent","actor":{"id":163915,"login":"fponticelli","gravatar_id":"","url":"https://api.github.com/users/fponticelli","avatar_url":"https://avatars.githubusercontent.com/u/163915?"},"repo":{"id":25146353,"name":"thxlib/thxlib.github.io","url":"https://api.github.com/repos/thxlib/thxlib.github.io"},"payload":{"push_id":536753561,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"b68cc956373b5339237f1564f1ef8fec91337dd0","before":"d0f110895e656633828c806023799bab1cbbd083","commits":[{"sha":"b68cc956373b5339237f1564f1ef8fec91337dd0","author":{"email":"05a4419b3ba135c9a2552a2fac2f13cfe3d22f12@gmail.com","name":"Franco Ponticelli"},"message":"updated thx.core and thx.color","distinct":true,"url":"https://api.github.com/repos/thxlib/thxlib.github.io/commits/b68cc956373b5339237f1564f1ef8fec91337dd0"}]},"public":true,"created_at":"2015-01-01T01:07:18Z","org":{"id":8933789,"login":"thxlib","gravatar_id":"","url":"https://api.github.com/orgs/thxlib","avatar_url":"https://avatars.githubusercontent.com/u/8933789?"}}
{"id":"2489398899","type":"CreateEvent","actor":{"id":5249918,"login":"ehnmark","gravatar_id":"","url":"https://api.github.com/users/ehnmark","avatar_url":"https://avatars.githubusercontent.com/u/5249918?"},"repo":{"id":28678277,"name":"ehnmark/housing","url":"https://api.github.com/repos/ehnmark/housing"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:07:18Z"}
{"id":"2489398900","type":"PushEvent","actor":{"id":8020662,"login":"freethlua","gravatar_id":"","url":"https://api.github.com/users/freethlua","avatar_url":"https://avatars.githubusercontent.com/u/8020662?"},"repo":{"id":22790186,"name":"freethlua/.dotfiles","url":"https://api.github.com/repos/freethlua/.dotfiles"},"payload":{"push_id":536753563,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"0ec37f77b8811a07ca6c6df79622541d8fa40c0a","before":"233774f844d59ff89420037609cf3e0cba985e9a","commits":[{"sha":"0ec37f77b8811a07ca6c6df79622541d8fa40c0a","author":{"email":"11f6ad8ec52a2984abaafd7c3b516503785c2072","name":"x"},"message":".","distinct":true,"url":"https://api.github.com/repos/freethlua/.dotfiles/commits/0ec37f77b8811a07ca6c6df79622541d8fa40c0a"}]},"public":true,"created_at":"2015-01-01T01:07:18Z"}
{"id":"2489398902","type":"IssuesEvent","actor":{"id":10361486,"login":"AceTheGmodGeek","gravatar_id":"","url":"https://api.github.com/users/AceTheGmodGeek","avatar_url":"https://avatars.githubusercontent.com/u/10361486?"},"repo":{"id":20768404,"name":"vrondakis/Leveling-System","url":"https://api.github.com/repos/vrondakis/Leveling-System"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/vrondakis/Leveling-System/issues/11","labels_url":"https://api.github.com/repos/vrondakis/Leveling-System/issues/11/labels{/name}","comments_url":"https://api.github.com/repos/vrondakis/Leveling-System/issues/11/comments","events_url":"https://api.github.com/repos/vrondakis/Leveling-System/issues/11/events","html_url":"https://github.com/vrondakis/Leveling-System/issues/11","id":53210305,"number":11,"title":"Books","user":{"login":"AceTheGmodGeek","id":10361486,"avatar_url":"https://avatars.githubusercontent.com/u/10361486?v=3","gravatar_id":"","url":"https://api.github.com/users/AceTheGmodGeek","html_url":"https://github.com/AceTheGmodGeek","followers_url":"https://api.github.com/users/AceTheGmodGeek/followers","following_url":"https://api.github.com/users/AceTheGmodGeek/following{/other_user}","gists_url":"https://api.github.com/users/AceTheGmodGeek/gists{/gist_id}","starred_url":"https://api.github.com/users/AceTheGmodGeek/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/AceTheGmodGeek/subscriptions","organizations_url":"https://api.github.com/users/AceTheGmodGeek/orgs","repos_url":"https://api.github.com/users/AceTheGmodGeek/repos","events_url":"https://api.github.com/users/AceTheGmodGeek/events{/privacy}","received_events_url":"https://api.github.com/users/AceTheGmodGeek/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:07:19Z","updated_at":"2015-01-01T01:07:19Z","closed_at":null,"body":"I have your level 
system with your prestige. When I add books to the books.lua, It doesnt pop up. Many people are having problems with this. Help?"}},"public":true,"created_at":"2015-01-01T01:07:19Z"}
{"id":"2489398905","type":"PullRequestReviewCommentEvent","actor":{"id":523287,"login":"j2sol","gravatar_id":"","url":"https://api.github.com/users/j2sol","avatar_url":"https://avatars.githubusercontent.com/u/523287?"},"repo":{"id":11848896,"name":"blueboxgroup/ursula","url":"https://api.github.com/repos/blueboxgroup/ursula"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397307","id":22397307,"diff_hunk":"@@ -1,121 +1,92 @@\n ---\n-- name: install apache\n-  apt: pkg={{ item }}\n-  with_items:\n-    - apache2\n-    - libapache2-mod-wsgi\n-\n - name: lesscpy must be in apache PATH\n   pip: name=lesscpy version=0.9j\n \n - name: get horizon source repo\n-  git: repo={{ openstack.git_mirror }}/horizon.git\n-       dest=/opt/stack/horizon\n-       version={{ horizon.rev }}\n-       update={{ openstack.git_update }}\n+  git: |\n+    repo={{ openstack.git_mirror}}/horizon.git\n+    dest=/opt/stack/horizon\n+    version={{ horizon.rev }}\n+    update={{ openstack.git_update }}\n   notify:\n     - setup horizon venv\n     - compress horizon assets\n \n-- template: src=opt/stack/horizon/hide-external-networks.patch dest=/opt/stack/horizon/hide-external-networks.patch mode=0644\n-- shell: patch -p1 < hide-external-networks.patch chdir=/opt/stack/horizon\n-  notify:\n-    - setup horizon venv\n-\n - name: add python-memcached to horizon requirements\n-  lineinfile: dest=/opt/stack/horizon/requirements.txt\n-              regexp=^python-memcached\n-              line=python-memcached\n+  lineinfile: dest=/opt/stack/horizon/requirements.txt regexp=^python-memcached line=python-memcached\n   notify:\n     - setup horizon venv\n \n-- name: disable apache status\n-  command: a2dismod status\n-  notify:\n-    - restart apache\n-\n-- name: apache ports config\n-  template: src=etc/apache2/ports.conf\n-            dest=/etc/apache2/ports.conf\n-  notify:\n-    - restart apache\n-\n-- name: disable default apache 
site\n-  command: a2dissite 000-default\n+- name: make sure apache knows about horizon ports\n+  lineinfile: dest=/etc/apache2/ports.conf line=\"Listen 8080\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config (12.04)\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard\n+- name: create dashboard virtualhost on precise\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard\n   when: ansible_distribution_version == \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard.conf\n+- name: create dashboard virtualhost on other\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard.conf\n   when: ansible_distribution_version != \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n - name: enable horizon apache site\n-  command: a2ensite openstack_dashboard\n+  apache2_site: state=enabled name=openstack_dashboard\n   notify:\n-    - restart apache\n-\n-- name: static asset directories\n-  file: dest={{ item }}\n-        state=directory\n-        owner=www-data\n-        group=www-data\n-        mode=0755\n+    - reload apache\n+\n+- name: create static asset dirs\n+  file: |\n+    dest={{ item }}\n+    state=directory\n+    owner=www-data\n+    group=www-data\n+    mode=0755\n   with_items:\n     - /opt/stack/horizon/static\n     - /opt/stack/horizon/static/dashboard\n \n-- name: horizon local settings\n-  template: src=opt/stack/horizon/openstack_dashboard/local/local_settings.py\n-            dest=/opt/stack/horizon/openstack_dashboard/local/local_settings.py\n-            
mode=0644\n+- name: dashboard settings\n+  template: |\n+    src=opt/stack/horizon/openstack_dashboard/local/local_settings.py\n+    dest=/opt/stack/horizon/openstack_dashboard/local/local_settings.py\n+    mode=0644\n   notify:\n-    - restart apache\n+    - reload apache\n \n - name: custom horizon logo\n-  get_url: url={{ horizon.logo_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo.png\n-           mode=0644 force=yes\n+  get_url: url={{ horizon.logo_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo.png mode=0644 force=yes\n \n - name: custom horizon splash logo\n-  get_url: url={{ horizon.logo_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo-splash.png\n-           mode=0644 force=yes\n+  get_url: url={{ horizon.logo_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo-splash.png mode=0644 force=yes\n \n - name: custom horizon favicon\n-  get_url: url={{ horizon.favicon_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/favicon.ico\n-           force=yes\n+  get_url: url={{ horizon.favicon_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/favicon.ico force=yes\n \n - name: put images and fonts where apache can find them\n-  file: src=/opt/stack/horizon/openstack_dashboard/static/dashboard/{{ item }}\n-        dest=/opt/stack/horizon/static/dashboard/{{ item }}\n-        state=link\n-        owner=www-data\n-        group=www-data\n+  file: |\n+    src=/opt/stack/horizon/openstack_dashboard/static/dashboard/{{ item }}\n+    dest=/opt/stack/horizon/static/dashboard/{{ item }}\n+    state=link\n+    owner=www-data\n+    group=www-data\n   with_items:\n     - img\n     - fonts\n \n-# flush before ensuring apache running, saves immediate restart\n-- meta: flush_handlers\n-\n-- name: ensure apache started\n+- name: ensure apache is running\n   service: name=apache2 state=started\n 
\n-- name: Permit HTTP and HTTPS\n-  ufw: rule=allow to_port={{ item }} proto=tcp\n-  with_items:\n-  - 80\n-  - 443\n+- name: Permit HTTP (redirect to HTTPS for Horizon)\n+  command: ufw allow 80/tcp\n \n-- include: monitoring.yml tags=monitoring,common","path":"roles/horizon/tasks/main.yml","position":168,"original_position":168,"commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","original_commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"j2sol","id":523287,"avatar_url":"https://avatars.githubusercontent.com/u/523287?v=3","gravatar_id":"","url":"https://api.github.com/users/j2sol","html_url":"https://github.com/j2sol","followers_url":"https://api.github.com/users/j2sol/followers","following_url":"https://api.github.com/users/j2sol/following{/other_user}","gists_url":"https://api.github.com/users/j2sol/gists{/gist_id}","starred_url":"https://api.github.com/users/j2sol/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/j2sol/subscriptions","organizations_url":"https://api.github.com/users/j2sol/orgs","repos_url":"https://api.github.com/users/j2sol/repos","events_url":"https://api.github.com/users/j2sol/events{/privacy}","received_events_url":"https://api.github.com/users/j2sol/received_events","type":"User","site_admin":false},"body":"What happened to the monitoring 
tasks?","created_at":"2015-01-01T01:07:19Z","updated_at":"2015-01-01T01:07:19Z","html_url":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397307","pull_request_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397307"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397307"},"pull_request":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"}}},"pull_request":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","id":26738851,"html_url":"https://github.com/blueboxgroup/ursula/pull/705","diff_url":"https://github.com/blueboxgroup/ursula/pull/705.diff","patch_url":"https://github.com/blueboxgroup/ursula/pull/705.patch","issue_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705","number":705,"state":"open","locked":false,"title":"WIP:  apache for loadbalancing","user":{"login":"paulczar","id":2488346,"avatar_url":"https://avatars.githubusercontent.com/u/2488346?v=3","gravatar_id":"","url":"https://api.github.com/users/paulczar","html_url":"https://github.com/paulczar","followers_url":"https://api.github.com/users/paulczar/followers","following_url":"https://api.github.com/users/paulczar/following{/other_user}","gists_url":"https://api.github.com/users/paulczar/gists{/gist_id}","starred_url":"https://api.github.com/users/paulczar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/paulczar/subscriptions","organizations_url":"https://api.github.com/users/paulczar/orgs","repos_url":"https://api.github.com/users/paulczar/repos","events_url":"https://api.github.com/users/paulczar/events{/privacy}","received_events_url":"https://api.github.com/users/paulczar/received_events","type":"User","site_admin":false},"body":"This is a quick POC / WIP to demo using apache instead of haproxy for loadbalancing our APIs.\r\n\r\nI think this gives us more flexibiltiy as 
we can enable in the APIs role itself ( in this case in keystone ) rather than a big monolithic haproxy.conf.      We also already have apache running for horizon, so it could reduce number of services.    apache also has better logging options that haproxy which can only log to syslog. ","created_at":"2015-01-01T00:04:13Z","updated_at":"2015-01-01T01:07:19Z","closed_at":null,"merged_at":null,"merge_commit_sha":"9b91693f11e166c9ee53836f19697868d412bf76","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits","review_comments_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments","review_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f","head":{"label":"blueboxgroup:use_apache_for_lb","ref":"use_apache_for_lb","sha":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization
","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating 
OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/commen
ts/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"base":{"label":"blueboxgroup:master","ref":"master","sha":"34b83c65ff0de2f8b006d8ce4f76919fe0167bbf","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/fo
llowing{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating 
OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/commen
ts/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705"},"issue":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705"},"comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments"},"review_comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments"},"review_comment":{"href":"https://
api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits"},"statuses":{"href":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f"}}}},"public":true,"created_at":"2015-01-01T01:07:19Z","org":{"id":458705,"login":"blueboxgroup","gravatar_id":"","url":"https://api.github.com/orgs/blueboxgroup","avatar_url":"https://avatars.githubusercontent.com/u/458705?"}}
{"id":"2489398906","type":"PullRequestReviewCommentEvent","actor":{"id":860034,"login":"Renelvon","gravatar_id":"","url":"https://api.github.com/users/Renelvon","avatar_url":"https://avatars.githubusercontent.com/u/860034?"},"repo":{"id":19147609,"name":"OpenBazaar/OpenBazaar","url":"https://api.github.com/repos/OpenBazaar/OpenBazaar"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/pulls/comments/22397308","id":22397308,"diff_hunk":"@@ -39,3 +41,19 @@ def get_history():\n \n def get_global(guid, callback):\n     get_unspent(burnaddr_from_guid(guid), callback)\n+\n+\n+def is_valid_namecoin(namecoin, guid):\n+    if not namecoin or not guid:\n+        return False\n+\n+    server = DNSChainServer.Server(constants.DNSCHAIN_SERVER_IP, \"\")\n+    _log.info(\"Looking up namecoin id: %s\", namecoin)\n+    try:\n+        data = server.lookup(\"id/\"+namecoin)","path":"node/trust.py","position":22,"original_position":22,"commit_id":"a84a18a43e1e6c91ca2bf58a2ab951268cf43f51","original_commit_id":"a84a18a43e1e6c91ca2bf58a2ab951268cf43f51","user":{"login":"Renelvon","id":860034,"avatar_url":"https://avatars.githubusercontent.com/u/860034?v=3","gravatar_id":"","url":"https://api.github.com/users/Renelvon","html_url":"https://github.com/Renelvon","followers_url":"https://api.github.com/users/Renelvon/followers","following_url":"https://api.github.com/users/Renelvon/following{/other_user}","gists_url":"https://api.github.com/users/Renelvon/gists{/gist_id}","starred_url":"https://api.github.com/users/Renelvon/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Renelvon/subscriptions","organizations_url":"https://api.github.com/users/Renelvon/orgs","repos_url":"https://api.github.com/users/Renelvon/repos","events_url":"https://api.github.com/users/Renelvon/events{/privacy}","received_events_url":"https://api.github.com/users/Renelvon/received_events","type":"User","site_admin":false},"body":"To be fair, I 
can't see any PEP8 issue here, save for the spaces around `+`. Is that it?","created_at":"2015-01-01T01:07:19Z","updated_at":"2015-01-01T01:07:19Z","html_url":"https://github.com/OpenBazaar/OpenBazaar/pull/1105#discussion_r22397308","pull_request_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/pulls/1105","_links":{"self":{"href":"https://api.github.com/repos/OpenBazaar/OpenBazaar/pulls/comments/22397308"},"html":{"href":"https://github.com/OpenBazaar/OpenBazaar/pull/1105#discussion_r22397308"},"pull_request":{"href":"https://api.github.com/repos/OpenBazaar/OpenBazaar/pulls/1105"}}},"pull_request":{"url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/pulls/1105","id":25621449,"html_url":"https://github.com/OpenBazaar/OpenBazaar/pull/1105","diff_url":"https://github.com/OpenBazaar/OpenBazaar/pull/1105.diff","patch_url":"https://github.com/OpenBazaar/OpenBazaar/pull/1105.patch","issue_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/issues/1105","number":1105,"state":"open","locked":false,"title":"[WIP]Issue #485 Relay namecoin id to other nodes","user":{"login":"charapod","id":6865935,"avatar_url":"https://avatars.githubusercontent.com/u/6865935?v=3","gravatar_id":"","url":"https://api.github.com/users/charapod","html_url":"https://github.com/charapod","followers_url":"https://api.github.com/users/charapod/followers","following_url":"https://api.github.com/users/charapod/following{/other_user}","gists_url":"https://api.github.com/users/charapod/gists{/gist_id}","starred_url":"https://api.github.com/users/charapod/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/charapod/subscriptions","organizations_url":"https://api.github.com/users/charapod/orgs","repos_url":"https://api.github.com/users/charapod/repos","events_url":"https://api.github.com/users/charapod/events{/privacy}","received_events_url":"https://api.github.com/users/charapod/received_events","type":"User","site_admin":false},"body":"1) As requested in #957, we 
changed namecoin_id column to lowercase. \r\n\r\nBut! Someone who had already upgraded their database with the old migration scripts will still have their column named with a capital, and there's no easy way to get rid of it since sqlite does not support DROP COLUMN (issue #955). New databases created will work fine of course, and rerunning the migration4.py script will probably do it as well. Let us know if you want us to cancel this modification.\r\n\r\n2) We begun working on issue #485 by @dionyziz . We added the namecoin of the sender to the rest of the information in the 'start_handshake' and 'send' methods in CryptoPeerConnection and we also stored the namecoin the user entered with the rest of his info in CryptoTrasportLayer. Is this the right way to do it? Should we change anything else? We need a little feedback here @gubatron , @hoffmabc :) \r\n\r\n3) As it is now, TransportLayer does not have a 'namecoin' field. Should we add a namecoin field in there, and treat it in the same manner as nickname?\r\n\r\n4)Should we add the namecoin to the 'ok_msg' in transport.py (line 136)?\r\n\r\n5)We see that you sign the information *before* you encrypt it. Is that intended? 
afaik this is not secure...","created_at":"2014-12-06T17:47:55Z","updated_at":"2015-01-01T01:07:19Z","closed_at":null,"merged_at":null,"merge_commit_sha":"3ef89a9529be958a544b49a90605c5cb1f351931","assignee":{"login":"dionyziz","id":544572,"avatar_url":"https://avatars.githubusercontent.com/u/544572?v=3","gravatar_id":"","url":"https://api.github.com/users/dionyziz","html_url":"https://github.com/dionyziz","followers_url":"https://api.github.com/users/dionyziz/followers","following_url":"https://api.github.com/users/dionyziz/following{/other_user}","gists_url":"https://api.github.com/users/dionyziz/gists{/gist_id}","starred_url":"https://api.github.com/users/dionyziz/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/dionyziz/subscriptions","organizations_url":"https://api.github.com/users/dionyziz/orgs","repos_url":"https://api.github.com/users/dionyziz/repos","events_url":"https://api.github.com/users/dionyziz/events{/privacy}","received_events_url":"https://api.github.com/users/dionyziz/received_events","type":"User","site_admin":false},"milestone":null,"commits_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/pulls/1105/commits","review_comments_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/pulls/1105/comments","review_comment_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/pulls/comments/{number}","comments_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/issues/1105/comments","statuses_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/statuses/a84a18a43e1e6c91ca2bf58a2ab951268cf43f51","head":{"label":"charapod:namecoin","ref":"namecoin","sha":"a84a18a43e1e6c91ca2bf58a2ab951268cf43f51","user":{"login":"charapod","id":6865935,"avatar_url":"https://avatars.githubusercontent.com/u/6865935?v=3","gravatar_id":"","url":"https://api.github.com/users/charapod","html_url":"https://github.com/charapod","followers_url":"https://api.github.com/users/charapod/followers","following_url":"https://api.github.com
/users/charapod/following{/other_user}","gists_url":"https://api.github.com/users/charapod/gists{/gist_id}","starred_url":"https://api.github.com/users/charapod/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/charapod/subscriptions","organizations_url":"https://api.github.com/users/charapod/orgs","repos_url":"https://api.github.com/users/charapod/repos","events_url":"https://api.github.com/users/charapod/events{/privacy}","received_events_url":"https://api.github.com/users/charapod/received_events","type":"User","site_admin":false},"repo":{"id":26178277,"name":"OpenBazaar","full_name":"charapod/OpenBazaar","owner":{"login":"charapod","id":6865935,"avatar_url":"https://avatars.githubusercontent.com/u/6865935?v=3","gravatar_id":"","url":"https://api.github.com/users/charapod","html_url":"https://github.com/charapod","followers_url":"https://api.github.com/users/charapod/followers","following_url":"https://api.github.com/users/charapod/following{/other_user}","gists_url":"https://api.github.com/users/charapod/gists{/gist_id}","starred_url":"https://api.github.com/users/charapod/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/charapod/subscriptions","organizations_url":"https://api.github.com/users/charapod/orgs","repos_url":"https://api.github.com/users/charapod/repos","events_url":"https://api.github.com/users/charapod/events{/privacy}","received_events_url":"https://api.github.com/users/charapod/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/charapod/OpenBazaar","description":"A decentralized 
marketplace","fork":true,"url":"https://api.github.com/repos/charapod/OpenBazaar","forks_url":"https://api.github.com/repos/charapod/OpenBazaar/forks","keys_url":"https://api.github.com/repos/charapod/OpenBazaar/keys{/key_id}","collaborators_url":"https://api.github.com/repos/charapod/OpenBazaar/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/charapod/OpenBazaar/teams","hooks_url":"https://api.github.com/repos/charapod/OpenBazaar/hooks","issue_events_url":"https://api.github.com/repos/charapod/OpenBazaar/issues/events{/number}","events_url":"https://api.github.com/repos/charapod/OpenBazaar/events","assignees_url":"https://api.github.com/repos/charapod/OpenBazaar/assignees{/user}","branches_url":"https://api.github.com/repos/charapod/OpenBazaar/branches{/branch}","tags_url":"https://api.github.com/repos/charapod/OpenBazaar/tags","blobs_url":"https://api.github.com/repos/charapod/OpenBazaar/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/charapod/OpenBazaar/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/charapod/OpenBazaar/git/refs{/sha}","trees_url":"https://api.github.com/repos/charapod/OpenBazaar/git/trees{/sha}","statuses_url":"https://api.github.com/repos/charapod/OpenBazaar/statuses/{sha}","languages_url":"https://api.github.com/repos/charapod/OpenBazaar/languages","stargazers_url":"https://api.github.com/repos/charapod/OpenBazaar/stargazers","contributors_url":"https://api.github.com/repos/charapod/OpenBazaar/contributors","subscribers_url":"https://api.github.com/repos/charapod/OpenBazaar/subscribers","subscription_url":"https://api.github.com/repos/charapod/OpenBazaar/subscription","commits_url":"https://api.github.com/repos/charapod/OpenBazaar/commits{/sha}","git_commits_url":"https://api.github.com/repos/charapod/OpenBazaar/git/commits{/sha}","comments_url":"https://api.github.com/repos/charapod/OpenBazaar/comments{/number}","issue_comment_url":"https://api.github.com/repos/charapod/OpenBazaar/issues/comme
nts/{number}","contents_url":"https://api.github.com/repos/charapod/OpenBazaar/contents/{+path}","compare_url":"https://api.github.com/repos/charapod/OpenBazaar/compare/{base}...{head}","merges_url":"https://api.github.com/repos/charapod/OpenBazaar/merges","archive_url":"https://api.github.com/repos/charapod/OpenBazaar/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/charapod/OpenBazaar/downloads","issues_url":"https://api.github.com/repos/charapod/OpenBazaar/issues{/number}","pulls_url":"https://api.github.com/repos/charapod/OpenBazaar/pulls{/number}","milestones_url":"https://api.github.com/repos/charapod/OpenBazaar/milestones{/number}","notifications_url":"https://api.github.com/repos/charapod/OpenBazaar/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/charapod/OpenBazaar/labels{/name}","releases_url":"https://api.github.com/repos/charapod/OpenBazaar/releases{/id}","created_at":"2014-11-04T16:42:59Z","updated_at":"2014-11-09T20:18:11Z","pushed_at":"2014-12-27T12:44:05Z","git_url":"git://github.com/charapod/OpenBazaar.git","ssh_url":"git@github.com:charapod/OpenBazaar.git","clone_url":"https://github.com/charapod/OpenBazaar.git","svn_url":"https://github.com/charapod/OpenBazaar","homepage":"http://forum.openbazaar.org","size":17333,"stargazers_count":0,"watchers_count":0,"language":null,"has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"OpenBazaar:develop","ref":"develop","sha":"e0eb864694ae8041e17c4a350102de77b59e9a68","user":{"login":"OpenBazaar","id":7438770,"avatar_url":"https://avatars.githubusercontent.com/u/7438770?v=3","gravatar_id":"","url":"https://api.github.com/users/OpenBazaar","html_url":"https://github.com/OpenBazaar","followers_url":"https://api.github.com/users/OpenBazaar/followers","following_url":"https://api.github.com/users/OpenB
azaar/following{/other_user}","gists_url":"https://api.github.com/users/OpenBazaar/gists{/gist_id}","starred_url":"https://api.github.com/users/OpenBazaar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/OpenBazaar/subscriptions","organizations_url":"https://api.github.com/users/OpenBazaar/orgs","repos_url":"https://api.github.com/users/OpenBazaar/repos","events_url":"https://api.github.com/users/OpenBazaar/events{/privacy}","received_events_url":"https://api.github.com/users/OpenBazaar/received_events","type":"Organization","site_admin":false},"repo":{"id":19147609,"name":"OpenBazaar","full_name":"OpenBazaar/OpenBazaar","owner":{"login":"OpenBazaar","id":7438770,"avatar_url":"https://avatars.githubusercontent.com/u/7438770?v=3","gravatar_id":"","url":"https://api.github.com/users/OpenBazaar","html_url":"https://github.com/OpenBazaar","followers_url":"https://api.github.com/users/OpenBazaar/followers","following_url":"https://api.github.com/users/OpenBazaar/following{/other_user}","gists_url":"https://api.github.com/users/OpenBazaar/gists{/gist_id}","starred_url":"https://api.github.com/users/OpenBazaar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/OpenBazaar/subscriptions","organizations_url":"https://api.github.com/users/OpenBazaar/orgs","repos_url":"https://api.github.com/users/OpenBazaar/repos","events_url":"https://api.github.com/users/OpenBazaar/events{/privacy}","received_events_url":"https://api.github.com/users/OpenBazaar/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/OpenBazaar/OpenBazaar","description":"A decentralized 
marketplace","fork":false,"url":"https://api.github.com/repos/OpenBazaar/OpenBazaar","forks_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/forks","keys_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/keys{/key_id}","collaborators_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/teams","hooks_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/hooks","issue_events_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/issues/events{/number}","events_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/events","assignees_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/assignees{/user}","branches_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/branches{/branch}","tags_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/tags","blobs_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/git/refs{/sha}","trees_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/git/trees{/sha}","statuses_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/statuses/{sha}","languages_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/languages","stargazers_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/stargazers","contributors_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/contributors","subscribers_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/subscribers","subscription_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/subscription","commits_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/commits{/sha}","git_commits_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/git/commits{/sha}","comments_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/comments{/number}","issue_comment_url":"https://api.
github.com/repos/OpenBazaar/OpenBazaar/issues/comments/{number}","contents_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/contents/{+path}","compare_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/compare/{base}...{head}","merges_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/merges","archive_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/downloads","issues_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/issues{/number}","pulls_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/pulls{/number}","milestones_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/milestones{/number}","notifications_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/labels{/name}","releases_url":"https://api.github.com/repos/OpenBazaar/OpenBazaar/releases{/id}","created_at":"2014-04-25T13:49:36Z","updated_at":"2014-12-31T19:56:51Z","pushed_at":"2014-12-30T10:37:28Z","git_url":"git://github.com/OpenBazaar/OpenBazaar.git","ssh_url":"git@github.com:OpenBazaar/OpenBazaar.git","clone_url":"https://github.com/OpenBazaar/OpenBazaar.git","svn_url":"https://github.com/OpenBazaar/OpenBazaar","homepage":"http://www.reddit.com/r/OpenBazaar/","size":31718,"stargazers_count":1115,"watchers_count":1115,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":290,"mirror_url":null,"open_issues_count":248,"forks":290,"open_issues":248,"watchers":1115,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/OpenBazaar/OpenBazaar/pulls/1105"},"html":{"href":"https://github.com/OpenBazaar/OpenBazaar/pull/1105"},"issue":{"href":"https://api.github.com/repos/OpenBazaar/OpenBazaar/issues/1105"},"comments":{"href":"https://api.github.com/repos/OpenBazaar/OpenBazaar/issues/1105/comme
nts"},"review_comments":{"href":"https://api.github.com/repos/OpenBazaar/OpenBazaar/pulls/1105/comments"},"review_comment":{"href":"https://api.github.com/repos/OpenBazaar/OpenBazaar/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/OpenBazaar/OpenBazaar/pulls/1105/commits"},"statuses":{"href":"https://api.github.com/repos/OpenBazaar/OpenBazaar/statuses/a84a18a43e1e6c91ca2bf58a2ab951268cf43f51"}}}},"public":true,"created_at":"2015-01-01T01:07:19Z","org":{"id":7438770,"login":"OpenBazaar","gravatar_id":"","url":"https://api.github.com/orgs/OpenBazaar","avatar_url":"https://avatars.githubusercontent.com/u/7438770?"}}
{"id":"2489398907","type":"CreateEvent","actor":{"id":51458,"login":"hlapp","gravatar_id":"","url":"https://api.github.com/users/hlapp","avatar_url":"https://avatars.githubusercontent.com/u/51458?"},"repo":{"id":11856817,"name":"ropensci/RNeXML","url":"https://api.github.com/repos/ropensci/RNeXML"},"payload":{"ref":"hl-refmt-appnote-1","ref_type":"branch","master_branch":"master","description":"Implementing semantically rich NeXML I/O in R","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:07:20Z","org":{"id":1200269,"login":"ropensci","gravatar_id":"","url":"https://api.github.com/orgs/ropensci","avatar_url":"https://avatars.githubusercontent.com/u/1200269?"}}
{"id":"2489398912","type":"WatchEvent","actor":{"id":898282,"login":"jzajac","gravatar_id":"","url":"https://api.github.com/users/jzajac","avatar_url":"https://avatars.githubusercontent.com/u/898282?"},"repo":{"id":20537104,"name":"google/cayley","url":"https://api.github.com/repos/google/cayley"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:07:23Z","org":{"id":1342004,"login":"google","gravatar_id":"","url":"https://api.github.com/orgs/google","avatar_url":"https://avatars.githubusercontent.com/u/1342004?"}}
{"id":"2489398916","type":"PushEvent","actor":{"id":6462036,"login":"samhillman","gravatar_id":"","url":"https://api.github.com/users/samhillman","avatar_url":"https://avatars.githubusercontent.com/u/6462036?"},"repo":{"id":28253700,"name":"samhillman/newdotcom","url":"https://api.github.com/repos/samhillman/newdotcom"},"payload":{"push_id":536753566,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"0a4a5c67d0671000171574a0f928f0b2236522e3","before":"eb166d0e9ff48e250e0b322ef42013d02dca159c","commits":[{"sha":"0a4a5c67d0671000171574a0f928f0b2236522e3","author":{"email":"3f12132dd817f39877292097b6071939bf5ccbcd@cvbay.co.uk","name":"Sam Hillman"},"message":"removed unneeded page","distinct":true,"url":"https://api.github.com/repos/samhillman/newdotcom/commits/0a4a5c67d0671000171574a0f928f0b2236522e3"}]},"public":true,"created_at":"2015-01-01T01:07:23Z"}
{"id":"2489398917","type":"PushEvent","actor":{"id":3599988,"login":"wesdizzle","gravatar_id":"","url":"https://api.github.com/users/wesdizzle","avatar_url":"https://avatars.githubusercontent.com/u/3599988?"},"repo":{"id":28250120,"name":"wesdizzle/gagglelog","url":"https://api.github.com/repos/wesdizzle/gagglelog"},"payload":{"push_id":536753567,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"da61d76888db710591e7a0b68ca5e8d273569e9c","before":"d04cbec8b68d0e66cf87c078862065645e181086","commits":[{"sha":"da61d76888db710591e7a0b68ca5e8d273569e9c","author":{"email":"baaa01a5d45f86e3d8f7008866cf0d37bea55570@gmail.com","name":"Wesley Miller"},"message":"added Index value to Expansions","distinct":true,"url":"https://api.github.com/repos/wesdizzle/gagglelog/commits/da61d76888db710591e7a0b68ca5e8d273569e9c"}]},"public":true,"created_at":"2015-01-01T01:07:23Z"}
{"id":"2489398920","type":"PushEvent","actor":{"id":2523987,"login":"laggingreflex","gravatar_id":"","url":"https://api.github.com/users/laggingreflex","avatar_url":"https://avatars.githubusercontent.com/u/2523987?"},"repo":{"id":22790173,"name":"laggingreflex/.dotfiles","url":"https://api.github.com/repos/laggingreflex/.dotfiles"},"payload":{"push_id":536753569,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"0ec37f77b8811a07ca6c6df79622541d8fa40c0a","before":"233774f844d59ff89420037609cf3e0cba985e9a","commits":[{"sha":"0ec37f77b8811a07ca6c6df79622541d8fa40c0a","author":{"email":"11f6ad8ec52a2984abaafd7c3b516503785c2072","name":"x"},"message":".","distinct":true,"url":"https://api.github.com/repos/laggingreflex/.dotfiles/commits/0ec37f77b8811a07ca6c6df79622541d8fa40c0a"}]},"public":true,"created_at":"2015-01-01T01:07:24Z"}
{"id":"2489398921","type":"PushEvent","actor":{"id":3315647,"login":"shaunoneill","gravatar_id":"","url":"https://api.github.com/users/shaunoneill","avatar_url":"https://avatars.githubusercontent.com/u/3315647?"},"repo":{"id":28667121,"name":"GreenUmbrellaSoftware/website","url":"https://api.github.com/repos/GreenUmbrellaSoftware/website"},"payload":{"push_id":536753570,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"f028ffa984eb28fb783a7c1df7364eca3bfb7f4d","before":"6eafa085f08d3506a09df4b15649686a2eeeedc4","commits":[{"sha":"f028ffa984eb28fb783a7c1df7364eca3bfb7f4d","author":{"email":"a2bb892f7d3d0e9e81f56035b4467ebbc2c5d2cd@greenumbrellasoftware.com","name":"shaun"},"message":"updated the pages","distinct":true,"url":"https://api.github.com/repos/GreenUmbrellaSoftware/website/commits/f028ffa984eb28fb783a7c1df7364eca3bfb7f4d"}]},"public":true,"created_at":"2015-01-01T01:07:24Z","org":{"id":2716713,"login":"GreenUmbrellaSoftware","gravatar_id":"","url":"https://api.github.com/orgs/GreenUmbrellaSoftware","avatar_url":"https://avatars.githubusercontent.com/u/2716713?"}}
{"id":"2489398924","type":"IssueCommentEvent","actor":{"id":134455,"login":"whit537","gravatar_id":"","url":"https://api.github.com/users/whit537","avatar_url":"https://avatars.githubusercontent.com/u/134455?"},"repo":{"id":16488998,"name":"gratipay/inside.gratipay.com","url":"https://api.github.com/repos/gratipay/inside.gratipay.com"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/gratipay/inside.gratipay.com/issues/93","labels_url":"https://api.github.com/repos/gratipay/inside.gratipay.com/issues/93/labels{/name}","comments_url":"https://api.github.com/repos/gratipay/inside.gratipay.com/issues/93/comments","events_url":"https://api.github.com/repos/gratipay/inside.gratipay.com/issues/93/events","html_url":"https://github.com/gratipay/inside.gratipay.com/issues/93","id":45497806,"number":93,"title":"pin down retreat schedule","user":{"login":"clone1018","id":226638,"avatar_url":"https://avatars.githubusercontent.com/u/226638?v=3","gravatar_id":"","url":"https://api.github.com/users/clone1018","html_url":"https://github.com/clone1018","followers_url":"https://api.github.com/users/clone1018/followers","following_url":"https://api.github.com/users/clone1018/following{/other_user}","gists_url":"https://api.github.com/users/clone1018/gists{/gist_id}","starred_url":"https://api.github.com/users/clone1018/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/clone1018/subscriptions","organizations_url":"https://api.github.com/users/clone1018/orgs","repos_url":"https://api.github.com/users/clone1018/repos","events_url":"https://api.github.com/users/clone1018/events{/privacy}","received_events_url":"https://api.github.com/users/clone1018/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":{"url":"https://api.github.com/repos/gratipay/inside.gratipay.com/milestones/2","labels_url":"https://api.github.com/repos/gratipay/inside.gratipay.com/milestones/2/labels",
"id":782050,"number":2,"title":"Gratipay Retreat 2015","description":"This is an encompassing milestone for planning the Gratipay Retreat. ","creator":{"login":"clone1018","id":226638,"avatar_url":"https://avatars.githubusercontent.com/u/226638?v=3","gravatar_id":"","url":"https://api.github.com/users/clone1018","html_url":"https://github.com/clone1018","followers_url":"https://api.github.com/users/clone1018/followers","following_url":"https://api.github.com/users/clone1018/following{/other_user}","gists_url":"https://api.github.com/users/clone1018/gists{/gist_id}","starred_url":"https://api.github.com/users/clone1018/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/clone1018/subscriptions","organizations_url":"https://api.github.com/users/clone1018/orgs","repos_url":"https://api.github.com/users/clone1018/repos","events_url":"https://api.github.com/users/clone1018/events{/privacy}","received_events_url":"https://api.github.com/users/clone1018/received_events","type":"User","site_admin":false},"open_issues":2,"closed_issues":1,"state":"open","created_at":"2014-09-08T13:35:41Z","updated_at":"2015-01-01T00:49:37Z","due_on":"2015-01-02T08:00:00Z","closed_at":null},"comments":11,"created_at":"2014-10-10T16:18:37Z","updated_at":"2015-01-01T01:07:24Z","closed_at":null,"body":""},"comment":{"url":"https://api.github.com/repos/gratipay/inside.gratipay.com/issues/comments/68477376","html_url":"https://github.com/gratipay/inside.gratipay.com/issues/93#issuecomment-68477376","issue_url":"https://api.github.com/repos/gratipay/inside.gratipay.com/issues/93","id":68477376,"user":{"login":"whit537","id":134455,"avatar_url":"https://avatars.githubusercontent.com/u/134455?v=3","gravatar_id":"","url":"https://api.github.com/users/whit537","html_url":"https://github.com/whit537","followers_url":"https://api.github.com/users/whit537/followers","following_url":"https://api.github.com/users/whit537/following{/other_user}","gists_url":"https://api.github.com/users
/whit537/gists{/gist_id}","starred_url":"https://api.github.com/users/whit537/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/whit537/subscriptions","organizations_url":"https://api.github.com/users/whit537/orgs","repos_url":"https://api.github.com/users/whit537/repos","events_url":"https://api.github.com/users/whit537/events{/privacy}","received_events_url":"https://api.github.com/users/whit537/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:07:24Z","updated_at":"2015-01-01T01:07:24Z","body":"Obviously we're going to have to spend time on #118. What are our expectations there in terms of what we'll be able to accomplish while we're together? At this point I feel like we need to be more or less open ended, take it as it comes once we're together.\r\n\r\nWhat else do we want to have on the agenda? #89 comes to mind."}},"public":true,"created_at":"2015-01-01T01:07:24Z","org":{"id":1744073,"login":"gratipay","gravatar_id":"","url":"https://api.github.com/orgs/gratipay","avatar_url":"https://avatars.githubusercontent.com/u/1744073?"}}
{"id":"2489398926","type":"PushEvent","actor":{"id":6278300,"login":"VacioExistencial","gravatar_id":"","url":"https://api.github.com/users/VacioExistencial","avatar_url":"https://avatars.githubusercontent.com/u/6278300?"},"repo":{"id":28678151,"name":"VacioExistencial/pong","url":"https://api.github.com/repos/VacioExistencial/pong"},"payload":{"push_id":536753571,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"60300f7ad699ac99855ebd2357502afb834dfe1c","before":"978cb4883e834db8b30b6ec2edca30e231b42658","commits":[{"sha":"60300f7ad699ac99855ebd2357502afb834dfe1c","author":{"email":"44bdaf3b26e8e183b1d41341b9fe1b680910844f@outlook.com","name":"Alex"},"message":"migrado a SDL2\n\nNo hice grandes cambios, y falta mucho por hacer.","distinct":true,"url":"https://api.github.com/repos/VacioExistencial/pong/commits/60300f7ad699ac99855ebd2357502afb834dfe1c"}]},"public":true,"created_at":"2015-01-01T01:07:24Z"}
{"id":"2489398928","type":"IssuesEvent","actor":{"id":2748277,"login":"vinhkhoa","gravatar_id":"","url":"https://api.github.com/users/vinhkhoa","avatar_url":"https://avatars.githubusercontent.com/u/2748277?"},"repo":{"id":28330560,"name":"vinhkhoa/AthTracker","url":"https://api.github.com/repos/vinhkhoa/AthTracker"},"payload":{"action":"closed","issue":{"url":"https://api.github.com/repos/vinhkhoa/AthTracker/issues/10","labels_url":"https://api.github.com/repos/vinhkhoa/AthTracker/issues/10/labels{/name}","comments_url":"https://api.github.com/repos/vinhkhoa/AthTracker/issues/10/comments","events_url":"https://api.github.com/repos/vinhkhoa/AthTracker/issues/10/events","html_url":"https://github.com/vinhkhoa/AthTracker/issues/10","id":52690026,"number":10,"title":"Extra profile fields","user":{"login":"vinhkhoa","id":2748277,"avatar_url":"https://avatars.githubusercontent.com/u/2748277?v=3","gravatar_id":"","url":"https://api.github.com/users/vinhkhoa","html_url":"https://github.com/vinhkhoa","followers_url":"https://api.github.com/users/vinhkhoa/followers","following_url":"https://api.github.com/users/vinhkhoa/following{/other_user}","gists_url":"https://api.github.com/users/vinhkhoa/gists{/gist_id}","starred_url":"https://api.github.com/users/vinhkhoa/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/vinhkhoa/subscriptions","organizations_url":"https://api.github.com/users/vinhkhoa/orgs","repos_url":"https://api.github.com/users/vinhkhoa/repos","events_url":"https://api.github.com/users/vinhkhoa/events{/privacy}","received_events_url":"https://api.github.com/users/vinhkhoa/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/vinhkhoa/AthTracker/labels/requirement","name":"requirement","color":"207de5"}],"state":"closed","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2014-12-22T21:22:37Z","updated_at":"2015-01-01T01:07:24Z","closed_at":"2015-01-01T01:07:24Z","body":""}},
"public":true,"created_at":"2015-01-01T01:07:24Z"}
{"id":"2489398929","type":"WatchEvent","actor":{"id":451828,"login":"minirop","gravatar_id":"","url":"https://api.github.com/users/minirop","avatar_url":"https://avatars.githubusercontent.com/u/451828?"},"repo":{"id":4106171,"name":"lioncash/ExtractData","url":"https://api.github.com/repos/lioncash/ExtractData"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:07:25Z"}
{"id":"2489398934","type":"PushEvent","actor":{"id":8819701,"login":"r-ggraham","gravatar_id":"","url":"https://api.github.com/users/r-ggraham","avatar_url":"https://avatars.githubusercontent.com/u/8819701?"},"repo":{"id":28678173,"name":"r-ggraham/Crumpet_Bot","url":"https://api.github.com/repos/r-ggraham/Crumpet_Bot"},"payload":{"push_id":536753574,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"5c6c899b455693ca53377520b3f0c73442ce97f9","before":"ee45c3d188e25fa5ee1d0d5a8a9f3646854ccbc7","commits":[{"sha":"5c6c899b455693ca53377520b3f0c73442ce97f9","author":{"email":"f2f9dd43aa4244d32208a2ccfa0c7c9e9c48f7e7@uni.worc.ac.uk","name":"Rob G"},"message":"Instructions","distinct":true,"url":"https://api.github.com/repos/r-ggraham/Crumpet_Bot/commits/5c6c899b455693ca53377520b3f0c73442ce97f9"}]},"public":true,"created_at":"2015-01-01T01:07:25Z"}
{"id":"2489398940","type":"MemberEvent","actor":{"id":932999,"login":"loyos","gravatar_id":"","url":"https://api.github.com/users/loyos","avatar_url":"https://avatars.githubusercontent.com/u/932999?"},"repo":{"id":28678289,"name":"loyos/cemento","url":"https://api.github.com/repos/loyos/cemento"},"payload":{"member":{"login":"yennifergrau","id":10153477,"avatar_url":"https://avatars.githubusercontent.com/u/10153477?v=3","gravatar_id":"","url":"https://api.github.com/users/yennifergrau","html_url":"https://github.com/yennifergrau","followers_url":"https://api.github.com/users/yennifergrau/followers","following_url":"https://api.github.com/users/yennifergrau/following{/other_user}","gists_url":"https://api.github.com/users/yennifergrau/gists{/gist_id}","starred_url":"https://api.github.com/users/yennifergrau/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/yennifergrau/subscriptions","organizations_url":"https://api.github.com/users/yennifergrau/orgs","repos_url":"https://api.github.com/users/yennifergrau/repos","events_url":"https://api.github.com/users/yennifergrau/events{/privacy}","received_events_url":"https://api.github.com/users/yennifergrau/received_events","type":"User","site_admin":false},"action":"added"},"public":true,"created_at":"2015-01-01T01:07:28Z"}
{"id":"2489398943","type":"WatchEvent","actor":{"id":1013892,"login":"jarofghosts","gravatar_id":"","url":"https://api.github.com/users/jarofghosts","avatar_url":"https://avatars.githubusercontent.com/u/1013892?"},"repo":{"id":6853358,"name":"substack/tape","url":"https://api.github.com/repos/substack/tape"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:07:28Z"}
{"id":"2489398944","type":"IssueCommentEvent","actor":{"id":9020086,"login":"HERO4903","gravatar_id":"","url":"https://api.github.com/users/HERO4903","avatar_url":"https://avatars.githubusercontent.com/u/9020086?"},"repo":{"id":28678195,"name":"TTMTT/iCL0udin","url":"https://api.github.com/repos/TTMTT/iCL0udin"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1","labels_url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1/labels{/name}","comments_url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1/comments","events_url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1/events","html_url":"https://github.com/TTMTT/iCL0udin/issues/1","id":53210206,"number":1,"title":"Discuss1","user":{"login":"TTMTT","id":6964047,"avatar_url":"https://avatars.githubusercontent.com/u/6964047?v=3","gravatar_id":"","url":"https://api.github.com/users/TTMTT","html_url":"https://github.com/TTMTT","followers_url":"https://api.github.com/users/TTMTT/followers","following_url":"https://api.github.com/users/TTMTT/following{/other_user}","gists_url":"https://api.github.com/users/TTMTT/gists{/gist_id}","starred_url":"https://api.github.com/users/TTMTT/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/TTMTT/subscriptions","organizations_url":"https://api.github.com/users/TTMTT/orgs","repos_url":"https://api.github.com/users/TTMTT/repos","events_url":"https://api.github.com/users/TTMTT/events{/privacy}","received_events_url":"https://api.github.com/users/TTMTT/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":3,"created_at":"2015-01-01T01:02:34Z","updated_at":"2015-01-01T01:07:27Z","closed_at":null,"body":"Now you can download vresion 1.0 from :\r\n---------------------------------------------------\r\nhttp://www.icloudin.net\r\n-----------------------------\r\nWow, ipod touch 5G (8.1) - iCL0udin v1.0 bypass activation 
(icloud)\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/tZmEdlDGNu4\r\n--------------------------------------\r\niCL0udin v1.0 bypass activation (icloud) - ipad mini 2G (7.1.1)\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/tevYyBN2QCQ\r\n---------------------------------------\r\nVideo for bypass icloud (iCL0udin v1.0) for iphone 4 CDMA ..\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/i85-D6N2YLk\r\n-------------------------------------\r\nNew video for iCL0udin v1.0 bypass icloud (3 iphones 7.1.2):\r\n-------------------------------------------------------------------------------------\r\nhttp://youtu.be/p51TNlCr7ug\r\n-------------------------------------\r\niCL0udin v1.0 -> %100\r\n----------------------------\r\nRemaining: %3 testing with some people..\r\n-----------------------------------------------------\r\nLast Method:\r\n-----------------\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any ios)\r\nmethod 3 : via (change some string by hex on ELF file << some times i got error)\r\nmethod 4 : via (use apple ssl cert or real ssl in server and change some string in iphone)\r\niCL0udin v1.0 have this method:\r\n-----------------------------------------\r\n\r\nmethod 1 : via (other xml not to deviceservices - exploit)\r\nmethod 2 : via (apple cert & key and i can downgrade to any 
ios)"},"comment":{"url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/comments/68477378","html_url":"https://github.com/TTMTT/iCL0udin/issues/1#issuecomment-68477378","issue_url":"https://api.github.com/repos/TTMTT/iCL0udin/issues/1","id":68477378,"user":{"login":"HERO4903","id":9020086,"avatar_url":"https://avatars.githubusercontent.com/u/9020086?v=3","gravatar_id":"","url":"https://api.github.com/users/HERO4903","html_url":"https://github.com/HERO4903","followers_url":"https://api.github.com/users/HERO4903/followers","following_url":"https://api.github.com/users/HERO4903/following{/other_user}","gists_url":"https://api.github.com/users/HERO4903/gists{/gist_id}","starred_url":"https://api.github.com/users/HERO4903/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/HERO4903/subscriptions","organizations_url":"https://api.github.com/users/HERO4903/orgs","repos_url":"https://api.github.com/users/HERO4903/repos","events_url":"https://api.github.com/users/HERO4903/events{/privacy}","received_events_url":"https://api.github.com/users/HERO4903/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:07:27Z","updated_at":"2015-01-01T01:07:27Z","body":"TTMTT hola una pregunta será posible que se solucione la sobrecarga en las próximas horas"}},"public":true,"created_at":"2015-01-01T01:07:28Z"}
{"id":"2489398947","type":"CreateEvent","actor":{"id":5491765,"login":"loganrice","gravatar_id":"","url":"https://api.github.com/users/loganrice","avatar_url":"https://avatars.githubusercontent.com/u/5491765?"},"repo":{"id":26188359,"name":"loganrice/bkisystem","url":"https://api.github.com/repos/loganrice/bkisystem"},"payload":{"ref":"commission","ref_type":"branch","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:07:28Z"}
{"id":"2489398950","type":"PushEvent","actor":{"id":1577452,"login":"perrupa","gravatar_id":"","url":"https://api.github.com/users/perrupa","avatar_url":"https://avatars.githubusercontent.com/u/1577452?"},"repo":{"id":19949182,"name":"perrupa/perrupa.github.io","url":"https://api.github.com/repos/perrupa/perrupa.github.io"},"payload":{"push_id":536753578,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"e3376d7b903228eb56abd1bde81bf4c3af3f21e7","before":"6558647e1ac00710c0ddbbd2c080c4645be187a2","commits":[{"sha":"e3376d7b903228eb56abd1bde81bf4c3af3f21e7","author":{"email":"9a70e3eb66414f9b662fb64558a83b5e48ee973f@achievers.com","name":"Chris Marlow"},"message":"Added package info","distinct":true,"url":"https://api.github.com/repos/perrupa/perrupa.github.io/commits/e3376d7b903228eb56abd1bde81bf4c3af3f21e7"}]},"public":true,"created_at":"2015-01-01T01:07:28Z"}
{"id":"2489398951","type":"PushEvent","actor":{"id":1265899,"login":"lynas","gravatar_id":"","url":"https://api.github.com/users/lynas","avatar_url":"https://avatars.githubusercontent.com/u/1265899?"},"repo":{"id":28678234,"name":"lynas/springsecurity3.2","url":"https://api.github.com/repos/lynas/springsecurity3.2"},"payload":{"push_id":536753580,"size":2,"distinct_size":2,"ref":"refs/heads/master","head":"b562d8b720ffb29b808f5846ae87cbe39cd23fe6","before":"97d11dfb3e36a479593c4dbd68087b23778161ac","commits":[{"sha":"dbc9006b01fb370ed8949bd825ae6e86f7302e25","author":{"email":"286cad8d9475283cbc1d36806a52beb3fd9db73b@gmail.com","name":"lynas"},"message":"initial commit","distinct":true,"url":"https://api.github.com/repos/lynas/springsecurity3.2/commits/dbc9006b01fb370ed8949bd825ae6e86f7302e25"},{"sha":"b562d8b720ffb29b808f5846ae87cbe39cd23fe6","author":{"email":"286cad8d9475283cbc1d36806a52beb3fd9db73b@gmail.com","name":"lynas"},"message":"Merge branch 'master' of https://github.com/lynas/springsecurity3.2","distinct":true,"url":"https://api.github.com/repos/lynas/springsecurity3.2/commits/b562d8b720ffb29b808f5846ae87cbe39cd23fe6"}]},"public":true,"created_at":"2015-01-01T01:07:28Z"}
{"id":"2489398952","type":"IssueCommentEvent","actor":{"id":312296,"login":"cqcallaw","gravatar_id":"","url":"https://api.github.com/users/cqcallaw","avatar_url":"https://avatars.githubusercontent.com/u/312296?"},"repo":{"id":14712850,"name":"syncthing/syncthing","url":"https://api.github.com/repos/syncthing/syncthing"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/syncthing/syncthing/issues/1113","labels_url":"https://api.github.com/repos/syncthing/syncthing/issues/1113/labels{/name}","comments_url":"https://api.github.com/repos/syncthing/syncthing/issues/1113/comments","events_url":"https://api.github.com/repos/syncthing/syncthing/issues/1113/events","html_url":"https://github.com/syncthing/syncthing/issues/1113","id":51872359,"number":1113,"title":"Flaky UPnP","user":{"login":"AudriusButkevicius","id":1144861,"avatar_url":"https://avatars.githubusercontent.com/u/1144861?v=3","gravatar_id":"","url":"https://api.github.com/users/AudriusButkevicius","html_url":"https://github.com/AudriusButkevicius","followers_url":"https://api.github.com/users/AudriusButkevicius/followers","following_url":"https://api.github.com/users/AudriusButkevicius/following{/other_user}","gists_url":"https://api.github.com/users/AudriusButkevicius/gists{/gist_id}","starred_url":"https://api.github.com/users/AudriusButkevicius/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/AudriusButkevicius/subscriptions","organizations_url":"https://api.github.com/users/AudriusButkevicius/orgs","repos_url":"https://api.github.com/users/AudriusButkevicius/repos","events_url":"https://api.github.com/users/AudriusButkevicius/events{/privacy}","received_events_url":"https://api.github.com/users/AudriusButkevicius/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/syncthing/syncthing/labels/bug","name":"bug","color":"fc2929"}],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":15,"created_
at":"2014-12-13T01:51:45Z","updated_at":"2015-01-01T01:07:26Z","closed_at":null,"body":"I've managed to reproduce this weird case where UPnP does not work.\r\nFired up wireshark, and I can see discovery packets leaving, but I cannot see UPnP MSEARCH packets leaving my machine.\r\n\r\nI changed the broadcast address to something else within my subnet, and it starts working, meaning that either Go or Windows doesn't like the address.\r\n\r\nGiven I ran a different UPnP utility and it works, it makes me think there is something wrong with Go's stuff.\r\n"},"comment":{"url":"https://api.github.com/repos/syncthing/syncthing/issues/comments/68477377","html_url":"https://github.com/syncthing/syncthing/issues/1113#issuecomment-68477377","issue_url":"https://api.github.com/repos/syncthing/syncthing/issues/1113","id":68477377,"user":{"login":"cqcallaw","id":312296,"avatar_url":"https://avatars.githubusercontent.com/u/312296?v=3","gravatar_id":"","url":"https://api.github.com/users/cqcallaw","html_url":"https://github.com/cqcallaw","followers_url":"https://api.github.com/users/cqcallaw/followers","following_url":"https://api.github.com/users/cqcallaw/following{/other_user}","gists_url":"https://api.github.com/users/cqcallaw/gists{/gist_id}","starred_url":"https://api.github.com/users/cqcallaw/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/cqcallaw/subscriptions","organizations_url":"https://api.github.com/users/cqcallaw/orgs","repos_url":"https://api.github.com/users/cqcallaw/repos","events_url":"https://api.github.com/users/cqcallaw/events{/privacy}","received_events_url":"https://api.github.com/users/cqcallaw/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:07:26Z","updated_at":"2015-01-01T01:07:26Z","body":"Interesting, I did a test with the [latest commit](https://github.com/syncthing/syncthing/tree/e94bd90782c25ef1a65cc0fe375bcafd1d398275 of syncthing) of syncthing, and the port mapping worked fine--and the 
discovery packets showed up in Wireshark! I really don't know what changed, but this issue doesn't seem reproducible enough to keep open. I vote to close the issue until someone can reliable reproduce it."}},"public":true,"created_at":"2015-01-01T01:07:28Z","org":{"id":7628018,"login":"syncthing","gravatar_id":"","url":"https://api.github.com/orgs/syncthing","avatar_url":"https://avatars.githubusercontent.com/u/7628018?"}}
{"id":"2489398954","type":"IssueCommentEvent","actor":{"id":253237,"login":"Jamesking56","gravatar_id":"","url":"https://api.github.com/users/Jamesking56","avatar_url":"https://avatars.githubusercontent.com/u/253237?"},"repo":{"id":26730195,"name":"cachethq/Cachet","url":"https://api.github.com/repos/cachethq/Cachet"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/cachethq/Cachet/issues/173","labels_url":"https://api.github.com/repos/cachethq/Cachet/issues/173/labels{/name}","comments_url":"https://api.github.com/repos/cachethq/Cachet/issues/173/comments","events_url":"https://api.github.com/repos/cachethq/Cachet/issues/173/events","html_url":"https://github.com/cachethq/Cachet/issues/173","id":53210024,"number":173,"title":"Bug: Forms let you submit multiple times","user":{"login":"Jamesking56","id":253237,"avatar_url":"https://avatars.githubusercontent.com/u/253237?v=3","gravatar_id":"","url":"https://api.github.com/users/Jamesking56","html_url":"https://github.com/Jamesking56","followers_url":"https://api.github.com/users/Jamesking56/followers","following_url":"https://api.github.com/users/Jamesking56/following{/other_user}","gists_url":"https://api.github.com/users/Jamesking56/gists{/gist_id}","starred_url":"https://api.github.com/users/Jamesking56/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Jamesking56/subscriptions","organizations_url":"https://api.github.com/users/Jamesking56/orgs","repos_url":"https://api.github.com/users/Jamesking56/repos","events_url":"https://api.github.com/users/Jamesking56/events{/privacy}","received_events_url":"https://api.github.com/users/Jamesking56/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":6,"created_at":"2015-01-01T00:52:06Z","updated_at":"2015-01-01T01:07:28Z","closed_at":null,"body":"When adding a new incident, I noticed a weird bug.\r\n\r\nIf you fill in the form as normal, 
then click the submit button twice really quickly, it'll create __TWO__ identical new incidents!\r\n\r\nThis could be a bit annoying, a simple fix is using a bit of JS that on submit, disables the submit button so that once clicked, it cannot be clicked again."},"comment":{"url":"https://api.github.com/repos/cachethq/Cachet/issues/comments/68477379","html_url":"https://github.com/cachethq/Cachet/issues/173#issuecomment-68477379","issue_url":"https://api.github.com/repos/cachethq/Cachet/issues/173","id":68477379,"user":{"login":"Jamesking56","id":253237,"avatar_url":"https://avatars.githubusercontent.com/u/253237?v=3","gravatar_id":"","url":"https://api.github.com/users/Jamesking56","html_url":"https://github.com/Jamesking56","followers_url":"https://api.github.com/users/Jamesking56/followers","following_url":"https://api.github.com/users/Jamesking56/following{/other_user}","gists_url":"https://api.github.com/users/Jamesking56/gists{/gist_id}","starred_url":"https://api.github.com/users/Jamesking56/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/Jamesking56/subscriptions","organizations_url":"https://api.github.com/users/Jamesking56/orgs","repos_url":"https://api.github.com/users/Jamesking56/repos","events_url":"https://api.github.com/users/Jamesking56/events{/privacy}","received_events_url":"https://api.github.com/users/Jamesking56/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:07:28Z","updated_at":"2015-01-01T01:07:28Z","body":"Thanks for clarifying that :+1:"}},"public":true,"created_at":"2015-01-01T01:07:28Z","org":{"id":9951502,"login":"cachethq","gravatar_id":"","url":"https://api.github.com/orgs/cachethq","avatar_url":"https://avatars.githubusercontent.com/u/9951502?"}}
{"id":"2489398955","type":"PushEvent","actor":{"id":8210807,"login":"nodepoker","gravatar_id":"","url":"https://api.github.com/users/nodepoker","avatar_url":"https://avatars.githubusercontent.com/u/8210807?"},"repo":{"id":22790212,"name":"nodepoker/.dotfiles","url":"https://api.github.com/repos/nodepoker/.dotfiles"},"payload":{"push_id":536753583,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"0ec37f77b8811a07ca6c6df79622541d8fa40c0a","before":"233774f844d59ff89420037609cf3e0cba985e9a","commits":[{"sha":"0ec37f77b8811a07ca6c6df79622541d8fa40c0a","author":{"email":"11f6ad8ec52a2984abaafd7c3b516503785c2072","name":"x"},"message":".","distinct":true,"url":"https://api.github.com/repos/nodepoker/.dotfiles/commits/0ec37f77b8811a07ca6c6df79622541d8fa40c0a"}]},"public":true,"created_at":"2015-01-01T01:07:29Z"}
{"id":"2489398958","type":"PushEvent","actor":{"id":5230439,"login":"movie002","gravatar_id":"","url":"https://api.github.com/users/movie002","avatar_url":"https://avatars.githubusercontent.com/u/5230439?"},"repo":{"id":16878288,"name":"movie002/v","url":"https://api.github.com/repos/movie002/v"},"payload":{"push_id":536753585,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"19defc0e03ee140ce0ba3a929b5f35272bb2bc72","before":"b5231af35019ee3489580e002c607e36c9fe78ab","commits":[{"sha":"19defc0e03ee140ce0ba3a929b5f35272bb2bc72","author":{"email":"e3ba41eb4a8a8591712f6252059288965f65b851@qq.com","name":"movie002"},"message":"","distinct":true,"url":"https://api.github.com/repos/movie002/v/commits/19defc0e03ee140ce0ba3a929b5f35272bb2bc72"}]},"public":true,"created_at":"2015-01-01T01:07:31Z"}
{"id":"2489398963","type":"IssueCommentEvent","actor":{"id":4566,"login":"nathany","gravatar_id":"","url":"https://api.github.com/users/nathany","avatar_url":"https://avatars.githubusercontent.com/u/4566?"},"repo":{"id":27928684,"name":"go-amz/amz","url":"https://api.github.com/repos/go-amz/amz"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/go-amz/amz/issues/5","labels_url":"https://api.github.com/repos/go-amz/amz/issues/5/labels{/name}","comments_url":"https://api.github.com/repos/go-amz/amz/issues/5/comments","events_url":"https://api.github.com/repos/go-amz/amz/issues/5/events","html_url":"https://github.com/go-amz/amz/issues/5","id":53086813,"number":5,"title":"I'm so confused by all the forks","user":{"login":"nathany","id":4566,"avatar_url":"https://avatars.githubusercontent.com/u/4566?v=3","gravatar_id":"","url":"https://api.github.com/users/nathany","html_url":"https://github.com/nathany","followers_url":"https://api.github.com/users/nathany/followers","following_url":"https://api.github.com/users/nathany/following{/other_user}","gists_url":"https://api.github.com/users/nathany/gists{/gist_id}","starred_url":"https://api.github.com/users/nathany/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/nathany/subscriptions","organizations_url":"https://api.github.com/users/nathany/orgs","repos_url":"https://api.github.com/users/nathany/repos","events_url":"https://api.github.com/users/nathany/events{/privacy}","received_events_url":"https://api.github.com/users/nathany/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":14,"created_at":"2014-12-30T01:44:20Z","updated_at":"2015-01-01T01:07:31Z","closed_at":null,"body":"I want to add CloudFront cache invalidation, but to where?\r\n\r\nhttps://github.com/goamz/goamz already has some CloudFront stuff\r\n\r\nhttps://github.com/mitchellh/goamz I've been using this fork up until now 
(due to #4).\r\n\r\nalso https://github.com/crowdmob/goamz"},"comment":{"url":"https://api.github.com/repos/go-amz/amz/issues/comments/68477381","html_url":"https://github.com/go-amz/amz/issues/5#issuecomment-68477381","issue_url":"https://api.github.com/repos/go-amz/amz/issues/5","id":68477381,"user":{"login":"nathany","id":4566,"avatar_url":"https://avatars.githubusercontent.com/u/4566?v=3","gravatar_id":"","url":"https://api.github.com/users/nathany","html_url":"https://github.com/nathany","followers_url":"https://api.github.com/users/nathany/followers","following_url":"https://api.github.com/users/nathany/following{/other_user}","gists_url":"https://api.github.com/users/nathany/gists{/gist_id}","starred_url":"https://api.github.com/users/nathany/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/nathany/subscriptions","organizations_url":"https://api.github.com/users/nathany/orgs","repos_url":"https://api.github.com/users/nathany/repos","events_url":"https://api.github.com/users/nathany/events{/privacy}","received_events_url":"https://api.github.com/users/nathany/received_events","type":"User","site_admin":false},"created_at":"2015-01-01T01:07:31Z","updated_at":"2015-01-01T01:07:31Z","body":"Thanks @dimitern.\r\n\r\nIt may be worth looking into https://www.clahub.com/ (disclaimer, I am also just a developer) or at least having a solid CONTRIBUTING.md file. Revel has a good example of [CONTRIBUTING](https://github.com/revel/revel/blob/master/CONTRIBUTING.md)."}},"public":true,"created_at":"2015-01-01T01:07:31Z","org":{"id":8137365,"login":"go-amz","gravatar_id":"","url":"https://api.github.com/orgs/go-amz","avatar_url":"https://avatars.githubusercontent.com/u/8137365?"}}
{"id":"2489398968","type":"PushEvent","actor":{"id":416575,"login":"frewsxcv","gravatar_id":"","url":"https://api.github.com/users/frewsxcv","avatar_url":"https://avatars.githubusercontent.com/u/416575?"},"repo":{"id":28678263,"name":"frewsxcv/Wicket","url":"https://api.github.com/repos/frewsxcv/Wicket"},"payload":{"push_id":536753591,"size":1,"distinct_size":1,"ref":"refs/heads/patch-1","head":"b1050c9a81013c77f4dc3e266c8606e130d7b23c","before":"ea75ffd844987843158fcdee9d98d242e962b2e2","commits":[{"sha":"b1050c9a81013c77f4dc3e266c8606e130d7b23c","author":{"email":"16aea3ed30350b1f4b4dfc1111a05a38e3d681b3@rwell.org","name":"Corey Farwell"},"message":"Enable syntax highlighting in README","distinct":true,"url":"https://api.github.com/repos/frewsxcv/Wicket/commits/b1050c9a81013c77f4dc3e266c8606e130d7b23c"}]},"public":true,"created_at":"2015-01-01T01:07:31Z"}
{"id":"2489398971","type":"CreateEvent","actor":{"id":804014,"login":"ry5n","gravatar_id":"","url":"https://api.github.com/users/ry5n","avatar_url":"https://avatars.githubusercontent.com/u/804014?"},"repo":{"id":28678287,"name":"ry5n/sass-inline-svg","url":"https://api.github.com/repos/ry5n/sass-inline-svg"},"payload":{"ref":"master","ref_type":"branch","master_branch":"master","description":"Inline an SVG as a CSS data URI. Allows recoloring paths.","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:07:33Z"}
{"id":"2489398972","type":"PushEvent","actor":{"id":433707,"login":"ile","gravatar_id":"","url":"https://api.github.com/users/ile","avatar_url":"https://avatars.githubusercontent.com/u/433707?"},"repo":{"id":26847132,"name":"kantele/k-templates","url":"https://api.github.com/repos/kantele/k-templates"},"payload":{"push_id":536753592,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"cb1fa82b87d8144f298b3a69ba3e41788e3c4130","before":"2250e5e1294fae3c21d3fa9b19bd162c40c29a6c","commits":[{"sha":"cb1fa82b87d8144f298b3a69ba3e41788e3c4130","author":{"email":"4f3407de78bccc8cc160ee4d278d5efe7162e6b5@nateps.com","name":"Nate Smith"},"message":"0.2.5\n\nConflicts:\n\tpackage.json","distinct":true,"url":"https://api.github.com/repos/kantele/k-templates/commits/cb1fa82b87d8144f298b3a69ba3e41788e3c4130"}]},"public":true,"created_at":"2015-01-01T01:07:33Z","org":{"id":5687585,"login":"kantele","gravatar_id":"","url":"https://api.github.com/orgs/kantele","avatar_url":"https://avatars.githubusercontent.com/u/5687585?"}}
{"id":"2489398975","type":"WatchEvent","actor":{"id":1015032,"login":"miketahani","gravatar_id":"","url":"https://api.github.com/users/miketahani","avatar_url":"https://avatars.githubusercontent.com/u/1015032?"},"repo":{"id":26293258,"name":"ThatcherC/Terrain2STL","url":"https://api.github.com/repos/ThatcherC/Terrain2STL"},"payload":{"action":"started"},"public":true,"created_at":"2015-01-01T01:07:33Z"}
{"id":"2489398980","type":"CreateEvent","actor":{"id":8396786,"login":"barr-code","gravatar_id":"","url":"https://api.github.com/users/barr-code","avatar_url":"https://avatars.githubusercontent.com/u/8396786?"},"repo":{"id":28678294,"name":"barr-code/craftsy","url":"https://api.github.com/repos/barr-code/craftsy"},"payload":{"ref":null,"ref_type":"repository","master_branch":"master","description":"","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:07:33Z"}
{"id":"2489398985","type":"PushEvent","actor":{"id":10237784,"login":"garylocke","gravatar_id":"","url":"https://api.github.com/users/garylocke","avatar_url":"https://avatars.githubusercontent.com/u/10237784?"},"repo":{"id":28205420,"name":"garylocke/ngkarma","url":"https://api.github.com/repos/garylocke/ngkarma"},"payload":{"push_id":536753602,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"da80da5ad685e455c3b6552b06cade3cfe3d1faf","before":"9429d660ddb0db02b87c2e27710359812da71082","commits":[{"sha":"da80da5ad685e455c3b6552b06cade3cfe3d1faf","author":{"email":"eb1c831f82e9d7475fabb08c6ce27c71c685a278@Garys-MacBook-Pro.local","name":"Gary Locke"},"message":"Removed robots.txt","distinct":true,"url":"https://api.github.com/repos/garylocke/ngkarma/commits/da80da5ad685e455c3b6552b06cade3cfe3d1faf"}]},"public":true,"created_at":"2015-01-01T01:07:34Z"}
{"id":"2489398988","type":"CreateEvent","actor":{"id":109109,"login":"rade","gravatar_id":"","url":"https://api.github.com/users/rade","avatar_url":"https://avatars.githubusercontent.com/u/109109?"},"repo":{"id":25579630,"name":"rade/weave","url":"https://api.github.com/repos/rade/weave"},"payload":{"ref":"101_eliminate_dependencies","ref_type":"branch","master_branch":"master","description":"The Docker Network","pusher_type":"user"},"public":true,"created_at":"2015-01-01T01:07:36Z"}
{"id":"2489398992","type":"PushEvent","actor":{"id":109109,"login":"rade","gravatar_id":"","url":"https://api.github.com/users/rade","avatar_url":"https://avatars.githubusercontent.com/u/109109?"},"repo":{"id":25579630,"name":"rade/weave","url":"https://api.github.com/repos/rade/weave"},"payload":{"push_id":536753607,"size":1,"distinct_size":0,"ref":"refs/heads/master","head":"5da2219dc8ca9bc8de9f874429a7d5945e3e34ca","before":"fd6f65e28fae31e0a72bfc6ef5046eaeedb12e31","commits":[{"sha":"5da2219dc8ca9bc8de9f874429a7d5945e3e34ca","author":{"email":"ac8fcaf748b7189c49a384a5580dc9e80633299a@gmail.com","name":"Matthias Radestock"},"message":"cosmetic: remove weaver/.gitignore\nand handle that in the top-level .gitignore instead. Just as we do for weavedns.","distinct":false,"url":"https://api.github.com/repos/rade/weave/commits/5da2219dc8ca9bc8de9f874429a7d5945e3e34ca"}]},"public":true,"created_at":"2015-01-01T01:07:36Z"}
{"id":"2489398994","type":"IssueCommentEvent","actor":{"id":1061610,"login":"kokizzu","gravatar_id":"","url":"https://api.github.com/users/kokizzu","avatar_url":"https://avatars.githubusercontent.com/u/1061610?"},"repo":{"id":3725405,"name":"thirtyseven/dullard","url":"https://api.github.com/repos/thirtyseven/dullard"},"payload":{"action":"created","issue":{"url":"https://api.github.com/repos/thirtyseven/dullard/issues/12","labels_url":"https://api.github.com/repos/thirtyseven/dullard/issues/12/labels{/name}","comments_url":"https://api.github.com/repos/thirtyseven/dullard/issues/12/comments","events_url":"https://api.github.com/repos/thirtyseven/dullard/issues/12/events","html_url":"https://github.com/thirtyseven/dullard/issues/12","id":47912635,"number":12,"title":"Dullard doesn't show nil on beginning of a row","user":{"login":"kokizzu","id":1061610,"avatar_url":"https://avatars.githubusercontent.com/u/1061610?v=3","gravatar_id":"","url":"https://api.github.com/users/kokizzu","html_url":"https://github.com/kokizzu","followers_url":"https://api.github.com/users/kokizzu/followers","following_url":"https://api.github.com/users/kokizzu/following{/other_user}","gists_url":"https://api.github.com/users/kokizzu/gists{/gist_id}","starred_url":"https://api.github.com/users/kokizzu/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/kokizzu/subscriptions","organizations_url":"https://api.github.com/users/kokizzu/orgs","repos_url":"https://api.github.com/users/kokizzu/repos","events_url":"https://api.github.com/users/kokizzu/events{/privacy}","received_events_url":"https://api.github.com/users/kokizzu/received_events","type":"User","site_admin":false},"labels":[],"state":"open","locked":false,"assignee":{"login":"thirtyseven","id":123678,"avatar_url":"https://avatars.githubusercontent.com/u/123678?v=3","gravatar_id":"","url":"https://api.github.com/users/thirtyseven","html_url":"https://github.com/thirtyseven","followers_url":"https://api.github.com/us
ers/thirtyseven/followers","following_url":"https://api.github.com/users/thirtyseven/following{/other_user}","gists_url":"https://api.github.com/users/thirtyseven/gists{/gist_id}","starred_url":"https://api.github.com/users/thirtyseven/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/thirtyseven/subscriptions","organizations_url":"https://api.github.com/users/thirtyseven/orgs","repos_url":"https://api.github.com/users/thirtyseven/repos","events_url":"https://api.github.com/users/thirtyseven/events{/privacy}","received_events_url":"https://api.github.com/users/thirtyseven/received_events","type":"User","site_admin":false},"milestone":null,"comments":6,"created_at":"2014-11-06T01:27:57Z","updated_at":"2015-01-01T01:07:36Z","closed_at":null,"body":"expected behavior:\r\n```\r\n# one row:\r\n[ nil, nil, nil, 1]\r\n```\r\n\r\ncurrent behavior:\r\n```\r\n[ 1 ]\r\n```"},"comment":{"url":"https://api.github.com/repos/thirtyseven/dullard/issues/comments/68477383","html_url":"https://github.com/thirtyseven/dullard/issues/12#issuecomment-68477383","issue_url":"https://api.github.com/repos/thirtyseven/dullard/issues/12","id":68477383,"user":{"login":"kokizzu","id":1061610,"avatar_url":"https://avatars.githubusercontent.com/u/1061610?v=3","gravatar_id":"","url":"https://api.github.com/users/kokizzu","html_url":"https://github.com/kokizzu","followers_url":"https://api.github.com/users/kokizzu/followers","following_url":"https://api.github.com/users/kokizzu/following{/other_user}","gists_url":"https://api.github.com/users/kokizzu/gists{/gist_id}","starred_url":"https://api.github.com/users/kokizzu/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/kokizzu/subscriptions","organizations_url":"https://api.github.com/users/kokizzu/orgs","repos_url":"https://api.github.com/users/kokizzu/repos","events_url":"https://api.github.com/users/kokizzu/events{/privacy}","received_events_url":"https://api.github.com/users/kokizzu/received_events","
type":"User","site_admin":false},"created_at":"2015-01-01T01:07:36Z","updated_at":"2015-01-01T01:07:36Z","body":"just create an empty spreadsheet file with cell A1 contains 1, B2 contains 2, C3 contains 3.."}},"public":true,"created_at":"2015-01-01T01:07:38Z"}
{"id":"2489398996","type":"IssuesEvent","actor":{"id":3964339,"login":"dcartertwo","gravatar_id":"","url":"https://api.github.com/users/dcartertwo","avatar_url":"https://avatars.githubusercontent.com/u/3964339?"},"repo":{"id":25189570,"name":"oceans15/teleport","url":"https://api.github.com/repos/oceans15/teleport"},"payload":{"action":"opened","issue":{"url":"https://api.github.com/repos/oceans15/teleport/issues/52","labels_url":"https://api.github.com/repos/oceans15/teleport/issues/52/labels{/name}","comments_url":"https://api.github.com/repos/oceans15/teleport/issues/52/comments","events_url":"https://api.github.com/repos/oceans15/teleport/issues/52/events","html_url":"https://github.com/oceans15/teleport/issues/52","id":53210306,"number":52,"title":"Crashes when receiving notification","user":{"login":"dcartertwo","id":3964339,"avatar_url":"https://avatars.githubusercontent.com/u/3964339?v=3","gravatar_id":"","url":"https://api.github.com/users/dcartertwo","html_url":"https://github.com/dcartertwo","followers_url":"https://api.github.com/users/dcartertwo/followers","following_url":"https://api.github.com/users/dcartertwo/following{/other_user}","gists_url":"https://api.github.com/users/dcartertwo/gists{/gist_id}","starred_url":"https://api.github.com/users/dcartertwo/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/dcartertwo/subscriptions","organizations_url":"https://api.github.com/users/dcartertwo/orgs","repos_url":"https://api.github.com/users/dcartertwo/repos","events_url":"https://api.github.com/users/dcartertwo/events{/privacy}","received_events_url":"https://api.github.com/users/dcartertwo/received_events","type":"User","site_admin":false},"labels":[{"url":"https://api.github.com/repos/oceans15/teleport/labels/bug","name":"bug","color":"fc2929"},{"url":"https://api.github.com/repos/oceans15/teleport/labels/help+wanted","name":"help 
wanted","color":"159818"}],"state":"open","locked":false,"assignee":null,"milestone":null,"comments":0,"created_at":"2015-01-01T01:07:36Z","updated_at":"2015-01-01T01:07:36Z","closed_at":null,"body":"To replicate (in android-notifications branch)\r\n-Start the app\r\n-Push notification\r\n-Close app\r\n-Reopen app\r\n\r\nThe app crashes after a second or instantly.  Running adb logcat i found:\r\n```\r\nE/AndroidRuntime(  424): FATAL EXCEPTION: main\r\nE/AndroidRuntime(  424): Process: com.oceans15.channel37, PID: 424\r\nE/AndroidRuntime(  424): java.lang.RuntimeException: Unable to instantiate receiver com.parse.GcmBroadcastReceiver: java.lang.ClassNotFoundException: Didn't find class \"com.parse.GcmBroadcastReceiver\" on path: DexPathList[[zip file \"/data/app/com.oceans15.channel37-1.apk\"],nativeLibraryDirectories=[/data/app-lib/com.oceans15.channel37-1, /vendor/lib, /system/lib]]\r\nE/AndroidRuntime(  424): \tat android.app.ActivityThread.handleReceiver(ActivityThread.java:2518)\r\nE/AndroidRuntime(  424): \tat android.app.ActivityThread.access$1800(ActivityThread.java:161)\r\nE/AndroidRuntime(  424): \tat android.app.ActivityThread$H.handleMessage(ActivityThread.java:1341)\r\nE/AndroidRuntime(  424): \tat android.os.Handler.dispatchMessage(Handler.java:102)\r\nE/AndroidRuntime(  424): \tat android.os.Looper.loop(Looper.java:157)\r\nE/AndroidRuntime(  424): \tat android.app.ActivityThread.main(ActivityThread.java:5356)\r\nE/AndroidRuntime(  424): \tat java.lang.reflect.Method.invokeNative(Native Method)\r\nE/AndroidRuntime(  424): \tat java.lang.reflect.Method.invoke(Method.java:515)\r\nE/AndroidRuntime(  424): \tat com.android.internal.os.ZygoteInit$MethodAndArgsCaller.run(ZygoteInit.java:1265)\r\nE/AndroidRuntime(  424): \tat com.android.internal.os.ZygoteInit.main(ZygoteInit.java:1081)\r\nE/AndroidRuntime(  424): \tat dalvik.system.NativeStart.main(Native Method)\r\nE/AndroidRuntime(  424): Caused by: java.lang.ClassNotFoundException: Didn't find class 
\"com.parse.GcmBroadcastReceiver\" on path: DexPathList[[zip file \"/data/app/com.oceans15.channel37-1.apk\"],nativeLibraryDirectories=[/data/app-lib/com.oceans15.channel37-1, /vendor/lib, /system/lib]]\r\nE/AndroidRuntime(  424): \tat dalvik.system.BaseDexClassLoader.findClass(BaseDexClassLoader.java:67)\r\nE/AndroidRuntime(  424): \tat java.lang.ClassLoader.loadClass(ClassLoader.java:497)\r\nE/AndroidRuntime(  424): \tat java.lang.ClassLoader.loadClass(ClassLoader.java:457)\r\nE/AndroidRuntime(  424): \tat android.app.ActivityThread.handleReceiver(ActivityThread.java:2513)\r\nE/AndroidRuntime(  424): \t... 10 more\r\nW/ActivityManager(  817):   Force finishing activity com.oceans15.channel37/.CordovaApp\r\n```\r\n\r\nNot sure why the java class isn't getting instantiated properly."}},"public":true,"created_at":"2015-01-01T01:07:38Z","org":{"id":9125251,"login":"oceans15","gravatar_id":"","url":"https://api.github.com/orgs/oceans15","avatar_url":"https://avatars.githubusercontent.com/u/9125251?"}}
{"id":"2489399000","type":"PullRequestReviewCommentEvent","actor":{"id":523287,"login":"j2sol","gravatar_id":"","url":"https://api.github.com/users/j2sol","avatar_url":"https://avatars.githubusercontent.com/u/523287?"},"repo":{"id":11848896,"name":"blueboxgroup/ursula","url":"https://api.github.com/repos/blueboxgroup/ursula"},"payload":{"action":"created","comment":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397310","id":22397310,"diff_hunk":"@@ -1,121 +1,92 @@\n ---\n-- name: install apache\n-  apt: pkg={{ item }}\n-  with_items:\n-    - apache2\n-    - libapache2-mod-wsgi\n-\n - name: lesscpy must be in apache PATH\n   pip: name=lesscpy version=0.9j\n \n - name: get horizon source repo\n-  git: repo={{ openstack.git_mirror }}/horizon.git\n-       dest=/opt/stack/horizon\n-       version={{ horizon.rev }}\n-       update={{ openstack.git_update }}\n+  git: |\n+    repo={{ openstack.git_mirror}}/horizon.git\n+    dest=/opt/stack/horizon\n+    version={{ horizon.rev }}\n+    update={{ openstack.git_update }}\n   notify:\n     - setup horizon venv\n     - compress horizon assets\n \n-- template: src=opt/stack/horizon/hide-external-networks.patch dest=/opt/stack/horizon/hide-external-networks.patch mode=0644\n-- shell: patch -p1 < hide-external-networks.patch chdir=/opt/stack/horizon\n-  notify:\n-    - setup horizon venv\n-\n - name: add python-memcached to horizon requirements\n-  lineinfile: dest=/opt/stack/horizon/requirements.txt\n-              regexp=^python-memcached\n-              line=python-memcached\n+  lineinfile: dest=/opt/stack/horizon/requirements.txt regexp=^python-memcached line=python-memcached\n   notify:\n     - setup horizon venv\n \n-- name: disable apache status\n-  command: a2dismod status\n-  notify:\n-    - restart apache\n-\n-- name: apache ports config\n-  template: src=etc/apache2/ports.conf\n-            dest=/etc/apache2/ports.conf\n-  notify:\n-    - restart apache\n-\n-- name: disable default apache 
site\n-  command: a2dissite 000-default\n+- name: make sure apache knows about horizon ports\n+  lineinfile: dest=/etc/apache2/ports.conf line=\"Listen 8080\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config (12.04)\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard\n+- name: create dashboard virtualhost on precise\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard\n   when: ansible_distribution_version == \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n-- name: openstack dashboard config\n-  template: src=etc/apache2/sites-available/openstack_dashboard.conf\n-            dest=/etc/apache2/sites-available/openstack_dashboard.conf\n+- name: create dashboard virtualhost on other\n+  template: |\n+    src=etc/apache2/sites-available/openstack_dashboard.conf\n+    dest=/etc/apache2/sites-available/openstack_dashboard.conf\n   when: ansible_distribution_version != \"12.04\"\n   notify:\n-    - restart apache\n+    - reload apache\n \n - name: enable horizon apache site\n-  command: a2ensite openstack_dashboard\n+  apache2_site: state=enabled name=openstack_dashboard\n   notify:\n-    - restart apache\n-\n-- name: static asset directories\n-  file: dest={{ item }}\n-        state=directory\n-        owner=www-data\n-        group=www-data\n-        mode=0755\n+    - reload apache\n+\n+- name: create static asset dirs\n+  file: |\n+    dest={{ item }}\n+    state=directory\n+    owner=www-data\n+    group=www-data\n+    mode=0755\n   with_items:\n     - /opt/stack/horizon/static\n     - /opt/stack/horizon/static/dashboard\n \n-- name: horizon local settings\n-  template: src=opt/stack/horizon/openstack_dashboard/local/local_settings.py\n-            dest=/opt/stack/horizon/openstack_dashboard/local/local_settings.py\n-            
mode=0644\n+- name: dashboard settings\n+  template: |\n+    src=opt/stack/horizon/openstack_dashboard/local/local_settings.py\n+    dest=/opt/stack/horizon/openstack_dashboard/local/local_settings.py\n+    mode=0644\n   notify:\n-    - restart apache\n+    - reload apache\n \n - name: custom horizon logo\n-  get_url: url={{ horizon.logo_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo.png\n-           mode=0644 force=yes\n+  get_url: url={{ horizon.logo_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo.png mode=0644 force=yes\n \n - name: custom horizon splash logo\n-  get_url: url={{ horizon.logo_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo-splash.png\n-           mode=0644 force=yes\n+  get_url: url={{ horizon.logo_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/logo-splash.png mode=0644 force=yes\n \n - name: custom horizon favicon\n-  get_url: url={{ horizon.favicon_url }}\n-           dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/favicon.ico\n-           force=yes\n+  get_url: url={{ horizon.favicon_url }} dest=/opt/stack/horizon/openstack_dashboard/static/dashboard/img/favicon.ico force=yes\n \n - name: put images and fonts where apache can find them\n-  file: src=/opt/stack/horizon/openstack_dashboard/static/dashboard/{{ item }}\n-        dest=/opt/stack/horizon/static/dashboard/{{ item }}\n-        state=link\n-        owner=www-data\n-        group=www-data\n+  file: |\n+    src=/opt/stack/horizon/openstack_dashboard/static/dashboard/{{ item }}\n+    dest=/opt/stack/horizon/static/dashboard/{{ item }}\n+    state=link\n+    owner=www-data\n+    group=www-data\n   with_items:\n     - img\n     - fonts\n \n-# flush before ensuring apache running, saves immediate restart\n-- meta: flush_handlers\n-\n-- name: ensure apache started\n+- name: ensure apache is running\n   service: name=apache2 state=started\n 
\n-- name: Permit HTTP and HTTPS\n-  ufw: rule=allow to_port={{ item }} proto=tcp\n-  with_items:\n-  - 80\n-  - 443\n+- name: Permit HTTP (redirect to HTTPS for Horizon)\n+  command: ufw allow 80/tcp\n \n-- include: monitoring.yml tags=monitoring,common\n+- name: Permit HTTPS (Horizon)\n+  command: ufw allow 443/tcp","path":"roles/horizon/tasks/main.yml","position":170,"original_position":170,"commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","original_commit_id":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"j2sol","id":523287,"avatar_url":"https://avatars.githubusercontent.com/u/523287?v=3","gravatar_id":"","url":"https://api.github.com/users/j2sol","html_url":"https://github.com/j2sol","followers_url":"https://api.github.com/users/j2sol/followers","following_url":"https://api.github.com/users/j2sol/following{/other_user}","gists_url":"https://api.github.com/users/j2sol/gists{/gist_id}","starred_url":"https://api.github.com/users/j2sol/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/j2sol/subscriptions","organizations_url":"https://api.github.com/users/j2sol/orgs","repos_url":"https://api.github.com/users/j2sol/repos","events_url":"https://api.github.com/users/j2sol/events{/privacy}","received_events_url":"https://api.github.com/users/j2sol/received_events","type":"User","site_admin":false},"body":"Why did this go from a single task with list of ports to two 
tasks?","created_at":"2015-01-01T01:07:36Z","updated_at":"2015-01-01T01:07:36Z","html_url":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397310","pull_request_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/22397310"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705#discussion_r22397310"},"pull_request":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"}}},"pull_request":{"url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705","id":26738851,"html_url":"https://github.com/blueboxgroup/ursula/pull/705","diff_url":"https://github.com/blueboxgroup/ursula/pull/705.diff","patch_url":"https://github.com/blueboxgroup/ursula/pull/705.patch","issue_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705","number":705,"state":"open","locked":false,"title":"WIP:  apache for loadbalancing","user":{"login":"paulczar","id":2488346,"avatar_url":"https://avatars.githubusercontent.com/u/2488346?v=3","gravatar_id":"","url":"https://api.github.com/users/paulczar","html_url":"https://github.com/paulczar","followers_url":"https://api.github.com/users/paulczar/followers","following_url":"https://api.github.com/users/paulczar/following{/other_user}","gists_url":"https://api.github.com/users/paulczar/gists{/gist_id}","starred_url":"https://api.github.com/users/paulczar/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/paulczar/subscriptions","organizations_url":"https://api.github.com/users/paulczar/orgs","repos_url":"https://api.github.com/users/paulczar/repos","events_url":"https://api.github.com/users/paulczar/events{/privacy}","received_events_url":"https://api.github.com/users/paulczar/received_events","type":"User","site_admin":false},"body":"This is a quick POC / WIP to demo using apache instead of haproxy for loadbalancing our APIs.\r\n\r\nI think this gives us more flexibiltiy as 
we can enable in the APIs role itself ( in this case in keystone ) rather than a big monolithic haproxy.conf.      We also already have apache running for horizon, so it could reduce number of services.    apache also has better logging options that haproxy which can only log to syslog. ","created_at":"2015-01-01T00:04:13Z","updated_at":"2015-01-01T01:07:36Z","closed_at":null,"merged_at":null,"merge_commit_sha":"9b91693f11e166c9ee53836f19697868d412bf76","assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits","review_comments_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments","review_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f","head":{"label":"blueboxgroup:use_apache_for_lb","ref":"use_apache_for_lb","sha":"2a6f35313b9936ce4450aba823d09287626bed6f","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization
","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating 
OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/commen
ts/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"base":{"label":"blueboxgroup:master","ref":"master","sha":"34b83c65ff0de2f8b006d8ce4f76919fe0167bbf","user":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/fo
llowing{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"repo":{"id":11848896,"name":"ursula","full_name":"blueboxgroup/ursula","owner":{"login":"blueboxgroup","id":458705,"avatar_url":"https://avatars.githubusercontent.com/u/458705?v=3","gravatar_id":"","url":"https://api.github.com/users/blueboxgroup","html_url":"https://github.com/blueboxgroup","followers_url":"https://api.github.com/users/blueboxgroup/followers","following_url":"https://api.github.com/users/blueboxgroup/following{/other_user}","gists_url":"https://api.github.com/users/blueboxgroup/gists{/gist_id}","starred_url":"https://api.github.com/users/blueboxgroup/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/blueboxgroup/subscriptions","organizations_url":"https://api.github.com/users/blueboxgroup/orgs","repos_url":"https://api.github.com/users/blueboxgroup/repos","events_url":"https://api.github.com/users/blueboxgroup/events{/privacy}","received_events_url":"https://api.github.com/users/blueboxgroup/received_events","type":"Organization","site_admin":false},"private":false,"html_url":"https://github.com/blueboxgroup/ursula","description":"Ansible playbooks for operating 
OpenStack","fork":false,"url":"https://api.github.com/repos/blueboxgroup/ursula","forks_url":"https://api.github.com/repos/blueboxgroup/ursula/forks","keys_url":"https://api.github.com/repos/blueboxgroup/ursula/keys{/key_id}","collaborators_url":"https://api.github.com/repos/blueboxgroup/ursula/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/blueboxgroup/ursula/teams","hooks_url":"https://api.github.com/repos/blueboxgroup/ursula/hooks","issue_events_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/events{/number}","events_url":"https://api.github.com/repos/blueboxgroup/ursula/events","assignees_url":"https://api.github.com/repos/blueboxgroup/ursula/assignees{/user}","branches_url":"https://api.github.com/repos/blueboxgroup/ursula/branches{/branch}","tags_url":"https://api.github.com/repos/blueboxgroup/ursula/tags","blobs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/blueboxgroup/ursula/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/blueboxgroup/ursula/git/refs{/sha}","trees_url":"https://api.github.com/repos/blueboxgroup/ursula/git/trees{/sha}","statuses_url":"https://api.github.com/repos/blueboxgroup/ursula/statuses/{sha}","languages_url":"https://api.github.com/repos/blueboxgroup/ursula/languages","stargazers_url":"https://api.github.com/repos/blueboxgroup/ursula/stargazers","contributors_url":"https://api.github.com/repos/blueboxgroup/ursula/contributors","subscribers_url":"https://api.github.com/repos/blueboxgroup/ursula/subscribers","subscription_url":"https://api.github.com/repos/blueboxgroup/ursula/subscription","commits_url":"https://api.github.com/repos/blueboxgroup/ursula/commits{/sha}","git_commits_url":"https://api.github.com/repos/blueboxgroup/ursula/git/commits{/sha}","comments_url":"https://api.github.com/repos/blueboxgroup/ursula/comments{/number}","issue_comment_url":"https://api.github.com/repos/blueboxgroup/ursula/issues/commen
ts/{number}","contents_url":"https://api.github.com/repos/blueboxgroup/ursula/contents/{+path}","compare_url":"https://api.github.com/repos/blueboxgroup/ursula/compare/{base}...{head}","merges_url":"https://api.github.com/repos/blueboxgroup/ursula/merges","archive_url":"https://api.github.com/repos/blueboxgroup/ursula/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/blueboxgroup/ursula/downloads","issues_url":"https://api.github.com/repos/blueboxgroup/ursula/issues{/number}","pulls_url":"https://api.github.com/repos/blueboxgroup/ursula/pulls{/number}","milestones_url":"https://api.github.com/repos/blueboxgroup/ursula/milestones{/number}","notifications_url":"https://api.github.com/repos/blueboxgroup/ursula/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/blueboxgroup/ursula/labels{/name}","releases_url":"https://api.github.com/repos/blueboxgroup/ursula/releases{/id}","created_at":"2013-08-02T17:37:26Z","updated_at":"2014-12-31T21:03:28Z","pushed_at":"2015-01-01T00:01:35Z","git_url":"git://github.com/blueboxgroup/ursula.git","ssh_url":"git@github.com:blueboxgroup/ursula.git","clone_url":"https://github.com/blueboxgroup/ursula.git","svn_url":"https://github.com/blueboxgroup/ursula","homepage":null,"size":9036,"stargazers_count":45,"watchers_count":45,"language":"Python","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":false,"forks_count":23,"mirror_url":null,"open_issues_count":26,"forks":23,"open_issues":26,"watchers":45,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705"},"html":{"href":"https://github.com/blueboxgroup/ursula/pull/705"},"issue":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705"},"comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/issues/705/comments"},"review_comments":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/comments"},"review_comment":{"href":"https://
api.github.com/repos/blueboxgroup/ursula/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/blueboxgroup/ursula/pulls/705/commits"},"statuses":{"href":"https://api.github.com/repos/blueboxgroup/ursula/statuses/2a6f35313b9936ce4450aba823d09287626bed6f"}}}},"public":true,"created_at":"2015-01-01T01:07:36Z","org":{"id":458705,"login":"blueboxgroup","gravatar_id":"","url":"https://api.github.com/orgs/blueboxgroup","avatar_url":"https://avatars.githubusercontent.com/u/458705?"}}
{"id":"2489399003","type":"PushEvent","actor":{"id":6355392,"login":"githanwang1","gravatar_id":"","url":"https://api.github.com/users/githanwang1","avatar_url":"https://avatars.githubusercontent.com/u/6355392?"},"repo":{"id":28543231,"name":"githanwang1/django-blog","url":"https://api.github.com/repos/githanwang1/django-blog"},"payload":{"push_id":536753608,"size":1,"distinct_size":1,"ref":"refs/heads/master","head":"1bd9937ada4d820b74e83c8a5d68c9aa2112957d","before":"130cfc38c0c001e58f84398948b72b138ccce717","commits":[{"sha":"1bd9937ada4d820b74e83c8a5d68c9aa2112957d","author":{"email":"053e32d42d025177f9df81fc22020283a55f18ff@berkeley.edu","name":"Han Wang"},"message":"initialized at proj root","distinct":true,"url":"https://api.github.com/repos/githanwang1/django-blog/commits/1bd9937ada4d820b74e83c8a5d68c9aa2112957d"}]},"public":true,"created_at":"2015-01-01T01:07:38Z"}
{"id":"2489399006","type":"PullRequestEvent","actor":{"id":416575,"login":"frewsxcv","gravatar_id":"","url":"https://api.github.com/users/frewsxcv","avatar_url":"https://avatars.githubusercontent.com/u/416575?"},"repo":{"id":3545112,"name":"arthur-e/Wicket","url":"https://api.github.com/repos/arthur-e/Wicket"},"payload":{"action":"opened","number":60,"pull_request":{"url":"https://api.github.com/repos/arthur-e/Wicket/pulls/60","id":26739469,"html_url":"https://github.com/arthur-e/Wicket/pull/60","diff_url":"https://github.com/arthur-e/Wicket/pull/60.diff","patch_url":"https://github.com/arthur-e/Wicket/pull/60.patch","issue_url":"https://api.github.com/repos/arthur-e/Wicket/issues/60","number":60,"state":"open","locked":false,"title":"Enable syntax highlighting in README","user":{"login":"frewsxcv","id":416575,"avatar_url":"https://avatars.githubusercontent.com/u/416575?v=3","gravatar_id":"","url":"https://api.github.com/users/frewsxcv","html_url":"https://github.com/frewsxcv","followers_url":"https://api.github.com/users/frewsxcv/followers","following_url":"https://api.github.com/users/frewsxcv/following{/other_user}","gists_url":"https://api.github.com/users/frewsxcv/gists{/gist_id}","starred_url":"https://api.github.com/users/frewsxcv/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/frewsxcv/subscriptions","organizations_url":"https://api.github.com/users/frewsxcv/orgs","repos_url":"https://api.github.com/users/frewsxcv/repos","events_url":"https://api.github.com/users/frewsxcv/events{/privacy}","received_events_url":"https://api.github.com/users/frewsxcv/received_events","type":"User","site_admin":false},"body":"","created_at":"2015-01-01T01:07:38Z","updated_at":"2015-01-01T01:07:38Z","closed_at":null,"merged_at":null,"merge_commit_sha":null,"assignee":null,"milestone":null,"commits_url":"https://api.github.com/repos/arthur-e/Wicket/pulls/60/commits","review_comments_url":"https://api.github.com/repos/arthur-e/Wicket/pulls/60/comments","
review_comment_url":"https://api.github.com/repos/arthur-e/Wicket/pulls/comments/{number}","comments_url":"https://api.github.com/repos/arthur-e/Wicket/issues/60/comments","statuses_url":"https://api.github.com/repos/arthur-e/Wicket/statuses/b1050c9a81013c77f4dc3e266c8606e130d7b23c","head":{"label":"frewsxcv:patch-1","ref":"patch-1","sha":"b1050c9a81013c77f4dc3e266c8606e130d7b23c","user":{"login":"frewsxcv","id":416575,"avatar_url":"https://avatars.githubusercontent.com/u/416575?v=3","gravatar_id":"","url":"https://api.github.com/users/frewsxcv","html_url":"https://github.com/frewsxcv","followers_url":"https://api.github.com/users/frewsxcv/followers","following_url":"https://api.github.com/users/frewsxcv/following{/other_user}","gists_url":"https://api.github.com/users/frewsxcv/gists{/gist_id}","starred_url":"https://api.github.com/users/frewsxcv/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/frewsxcv/subscriptions","organizations_url":"https://api.github.com/users/frewsxcv/orgs","repos_url":"https://api.github.com/users/frewsxcv/repos","events_url":"https://api.github.com/users/frewsxcv/events{/privacy}","received_events_url":"https://api.github.com/users/frewsxcv/received_events","type":"User","site_admin":false},"repo":{"id":28678263,"name":"Wicket","full_name":"frewsxcv/Wicket","owner":{"login":"frewsxcv","id":416575,"avatar_url":"https://avatars.githubusercontent.com/u/416575?v=3","gravatar_id":"","url":"https://api.github.com/users/frewsxcv","html_url":"https://github.com/frewsxcv","followers_url":"https://api.github.com/users/frewsxcv/followers","following_url":"https://api.github.com/users/frewsxcv/following{/other_user}","gists_url":"https://api.github.com/users/frewsxcv/gists{/gist_id}","starred_url":"https://api.github.com/users/frewsxcv/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/frewsxcv/subscriptions","organizations_url":"https://api.github.com/users/frewsxcv/orgs","repos_url":"https://api.github
.com/users/frewsxcv/repos","events_url":"https://api.github.com/users/frewsxcv/events{/privacy}","received_events_url":"https://api.github.com/users/frewsxcv/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/frewsxcv/Wicket","description":"A modest library for moving between Well-Known Text (WKT) and various framework geometries","fork":true,"url":"https://api.github.com/repos/frewsxcv/Wicket","forks_url":"https://api.github.com/repos/frewsxcv/Wicket/forks","keys_url":"https://api.github.com/repos/frewsxcv/Wicket/keys{/key_id}","collaborators_url":"https://api.github.com/repos/frewsxcv/Wicket/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/frewsxcv/Wicket/teams","hooks_url":"https://api.github.com/repos/frewsxcv/Wicket/hooks","issue_events_url":"https://api.github.com/repos/frewsxcv/Wicket/issues/events{/number}","events_url":"https://api.github.com/repos/frewsxcv/Wicket/events","assignees_url":"https://api.github.com/repos/frewsxcv/Wicket/assignees{/user}","branches_url":"https://api.github.com/repos/frewsxcv/Wicket/branches{/branch}","tags_url":"https://api.github.com/repos/frewsxcv/Wicket/tags","blobs_url":"https://api.github.com/repos/frewsxcv/Wicket/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/frewsxcv/Wicket/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/frewsxcv/Wicket/git/refs{/sha}","trees_url":"https://api.github.com/repos/frewsxcv/Wicket/git/trees{/sha}","statuses_url":"https://api.github.com/repos/frewsxcv/Wicket/statuses/{sha}","languages_url":"https://api.github.com/repos/frewsxcv/Wicket/languages","stargazers_url":"https://api.github.com/repos/frewsxcv/Wicket/stargazers","contributors_url":"https://api.github.com/repos/frewsxcv/Wicket/contributors","subscribers_url":"https://api.github.com/repos/frewsxcv/Wicket/subscribers","subscription_url":"https://api.github.com/repos/frewsxcv/Wicket/subscription","commits_url":"https://api.github.com/repos/frews
xcv/Wicket/commits{/sha}","git_commits_url":"https://api.github.com/repos/frewsxcv/Wicket/git/commits{/sha}","comments_url":"https://api.github.com/repos/frewsxcv/Wicket/comments{/number}","issue_comment_url":"https://api.github.com/repos/frewsxcv/Wicket/issues/comments/{number}","contents_url":"https://api.github.com/repos/frewsxcv/Wicket/contents/{+path}","compare_url":"https://api.github.com/repos/frewsxcv/Wicket/compare/{base}...{head}","merges_url":"https://api.github.com/repos/frewsxcv/Wicket/merges","archive_url":"https://api.github.com/repos/frewsxcv/Wicket/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/frewsxcv/Wicket/downloads","issues_url":"https://api.github.com/repos/frewsxcv/Wicket/issues{/number}","pulls_url":"https://api.github.com/repos/frewsxcv/Wicket/pulls{/number}","milestones_url":"https://api.github.com/repos/frewsxcv/Wicket/milestones{/number}","notifications_url":"https://api.github.com/repos/frewsxcv/Wicket/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/frewsxcv/Wicket/labels{/name}","releases_url":"https://api.github.com/repos/frewsxcv/Wicket/releases{/id}","created_at":"2015-01-01T01:04:48Z","updated_at":"2015-01-01T01:04:49Z","pushed_at":"2015-01-01T01:07:31Z","git_url":"git://github.com/frewsxcv/Wicket.git","ssh_url":"git@github.com:frewsxcv/Wicket.git","clone_url":"https://github.com/frewsxcv/Wicket.git","svn_url":"https://github.com/frewsxcv/Wicket","homepage":"http://arthur-e.github.com/Wicket","size":1032,"stargazers_count":0,"watchers_count":0,"language":"JavaScript","has_issues":false,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":0,"mirror_url":null,"open_issues_count":0,"forks":0,"open_issues":0,"watchers":0,"default_branch":"master"}},"base":{"label":"arthur-e:master","ref":"master","sha":"ea75ffd844987843158fcdee9d98d242e962b2e2","user":{"login":"arthur-e","id":1211103,"avatar_url":"https://avatars.githubusercontent.com/u/1211103?v=3","gravatar_id"
:"","url":"https://api.github.com/users/arthur-e","html_url":"https://github.com/arthur-e","followers_url":"https://api.github.com/users/arthur-e/followers","following_url":"https://api.github.com/users/arthur-e/following{/other_user}","gists_url":"https://api.github.com/users/arthur-e/gists{/gist_id}","starred_url":"https://api.github.com/users/arthur-e/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/arthur-e/subscriptions","organizations_url":"https://api.github.com/users/arthur-e/orgs","repos_url":"https://api.github.com/users/arthur-e/repos","events_url":"https://api.github.com/users/arthur-e/events{/privacy}","received_events_url":"https://api.github.com/users/arthur-e/received_events","type":"User","site_admin":false},"repo":{"id":3545112,"name":"Wicket","full_name":"arthur-e/Wicket","owner":{"login":"arthur-e","id":1211103,"avatar_url":"https://avatars.githubusercontent.com/u/1211103?v=3","gravatar_id":"","url":"https://api.github.com/users/arthur-e","html_url":"https://github.com/arthur-e","followers_url":"https://api.github.com/users/arthur-e/followers","following_url":"https://api.github.com/users/arthur-e/following{/other_user}","gists_url":"https://api.github.com/users/arthur-e/gists{/gist_id}","starred_url":"https://api.github.com/users/arthur-e/starred{/owner}{/repo}","subscriptions_url":"https://api.github.com/users/arthur-e/subscriptions","organizations_url":"https://api.github.com/users/arthur-e/orgs","repos_url":"https://api.github.com/users/arthur-e/repos","events_url":"https://api.github.com/users/arthur-e/events{/privacy}","received_events_url":"https://api.github.com/users/arthur-e/received_events","type":"User","site_admin":false},"private":false,"html_url":"https://github.com/arthur-e/Wicket","description":"A modest library for moving between Well-Known Text (WKT) and various framework 
geometries","fork":false,"url":"https://api.github.com/repos/arthur-e/Wicket","forks_url":"https://api.github.com/repos/arthur-e/Wicket/forks","keys_url":"https://api.github.com/repos/arthur-e/Wicket/keys{/key_id}","collaborators_url":"https://api.github.com/repos/arthur-e/Wicket/collaborators{/collaborator}","teams_url":"https://api.github.com/repos/arthur-e/Wicket/teams","hooks_url":"https://api.github.com/repos/arthur-e/Wicket/hooks","issue_events_url":"https://api.github.com/repos/arthur-e/Wicket/issues/events{/number}","events_url":"https://api.github.com/repos/arthur-e/Wicket/events","assignees_url":"https://api.github.com/repos/arthur-e/Wicket/assignees{/user}","branches_url":"https://api.github.com/repos/arthur-e/Wicket/branches{/branch}","tags_url":"https://api.github.com/repos/arthur-e/Wicket/tags","blobs_url":"https://api.github.com/repos/arthur-e/Wicket/git/blobs{/sha}","git_tags_url":"https://api.github.com/repos/arthur-e/Wicket/git/tags{/sha}","git_refs_url":"https://api.github.com/repos/arthur-e/Wicket/git/refs{/sha}","trees_url":"https://api.github.com/repos/arthur-e/Wicket/git/trees{/sha}","statuses_url":"https://api.github.com/repos/arthur-e/Wicket/statuses/{sha}","languages_url":"https://api.github.com/repos/arthur-e/Wicket/languages","stargazers_url":"https://api.github.com/repos/arthur-e/Wicket/stargazers","contributors_url":"https://api.github.com/repos/arthur-e/Wicket/contributors","subscribers_url":"https://api.github.com/repos/arthur-e/Wicket/subscribers","subscription_url":"https://api.github.com/repos/arthur-e/Wicket/subscription","commits_url":"https://api.github.com/repos/arthur-e/Wicket/commits{/sha}","git_commits_url":"https://api.github.com/repos/arthur-e/Wicket/git/commits{/sha}","comments_url":"https://api.github.com/repos/arthur-e/Wicket/comments{/number}","issue_comment_url":"https://api.github.com/repos/arthur-e/Wicket/issues/comments/{number}","contents_url":"https://api.github.com/repos/arthur-e/Wicket/contents/{+path}","compar
e_url":"https://api.github.com/repos/arthur-e/Wicket/compare/{base}...{head}","merges_url":"https://api.github.com/repos/arthur-e/Wicket/merges","archive_url":"https://api.github.com/repos/arthur-e/Wicket/{archive_format}{/ref}","downloads_url":"https://api.github.com/repos/arthur-e/Wicket/downloads","issues_url":"https://api.github.com/repos/arthur-e/Wicket/issues{/number}","pulls_url":"https://api.github.com/repos/arthur-e/Wicket/pulls{/number}","milestones_url":"https://api.github.com/repos/arthur-e/Wicket/milestones{/number}","notifications_url":"https://api.github.com/repos/arthur-e/Wicket/notifications{?since,all,participating}","labels_url":"https://api.github.com/repos/arthur-e/Wicket/labels{/name}","releases_url":"https://api.github.com/repos/arthur-e/Wicket/releases{/id}","created_at":"2012-02-25T14:59:02Z","updated_at":"2014-12-18T11:08:34Z","pushed_at":"2014-11-12T13:58:08Z","git_url":"git://github.com/arthur-e/Wicket.git","ssh_url":"git@github.com:arthur-e/Wicket.git","clone_url":"https://github.com/arthur-e/Wicket.git","svn_url":"https://github.com/arthur-e/Wicket","homepage":"http://arthur-e.github.com/Wicket","size":1032,"stargazers_count":99,"watchers_count":99,"language":"JavaScript","has_issues":true,"has_downloads":true,"has_wiki":true,"has_pages":true,"forks_count":45,"mirror_url":null,"open_issues_count":11,"forks":45,"open_issues":11,"watchers":99,"default_branch":"master"}},"_links":{"self":{"href":"https://api.github.com/repos/arthur-e/Wicket/pulls/60"},"html":{"href":"https://github.com/arthur-e/Wicket/pull/60"},"issue":{"href":"https://api.github.com/repos/arthur-e/Wicket/issues/60"},"comments":{"href":"https://api.github.com/repos/arthur-e/Wicket/issues/60/comments"},"review_comments":{"href":"https://api.github.com/repos/arthur-e/Wicket/pulls/60/comments"},"review_comment":{"href":"https://api.github.com/repos/arthur-e/Wicket/pulls/comments/{number}"},"commits":{"href":"https://api.github.com/repos/arthur-e/Wicket/pulls/60/commits"},"sta
tuses":{"href":"https://api.github.com/repos/arthur-e/Wicket/statuses/b1050c9a81013c77f4dc3e266c8606e130d7b23c"}},"merged":false,"mergeable":null,"mergeable_state":"unknown","merged_by":null,"comments":0,"review_comments":0,"commits":1,"additions":99,"deletions":83,"changed_files":1}},"public":true,"created_at":"2015-01-01T01:07:38Z"}
{"id":"2489399010","type":"PushEvent","actor":{"id":6325631,"login":"pirej","gravatar_id":"","url":"https://api.github.com/users/pirej","avatar_url":"https://avatars.githubusercontent.com/u/6325631?"},"repo":{"id":27450767,"name":"lollipoop/android_frameworks_native","url":"https://api.github.com/repos/lollipoop/android_frameworks_native"},"payload":{"push_id":536753610,"size":1,"distinct_size":1,"ref":"refs/heads/m4","head":"6ce802b32fdfecdea10b550d45f16937d585dff4","before":"90bee99354ab9ae0c27d48ef4891f232cca0c1f4","commits":[{"sha":"6ce802b32fdfecdea10b550d45f16937d585dff4","author":{"email":"756a323d9c5c587ce7cec8b755badb3d54b6fcc9@gmail.com","name":"x10forevers"},"message":"libEGL: workaround for google bug 10194508\n\nSome of device's older blobs don't have EGL_KHL_gl_colorspace extension\nand need this workaround\n\nChange-Id: I811538e7d595f18055d13ca608098c049b4cb9b9","distinct":true,"url":"https://api.github.com/repos/lollipoop/android_frameworks_native/commits/6ce802b32fdfecdea10b550d45f16937d585dff4"}]},"public":true,"created_at":"2015-01-01T01:07:38Z","org":{"id":10051895,"login":"lollipoop","gravatar_id":"","url":"https://api.github.com/orgs/lollipoop","avatar_url":"https://avatars.githubusercontent.com/u/10051895?"}}
{"id":"2489399013","type":"PushEvent","actor":{"id":6064868,"login":"AiNoKame","gravatar_id":"","url":"https://api.github.com/users/AiNoKame","avatar_url":"https://avatars.githubusercontent.com/u/6064868?"},"repo":{"id":27805488,"name":"gatewayd/gatewayd-banking-app","url":"https://api.github.com/repos/gatewayd/gatewayd-banking-app"},"payload":{"push_id":536753611,"size":1,"distinct_size":1,"ref":"refs/heads/feature/component-form-mixin","head":"f92b106ccbf2b52784aa0de50c946c2cbf24ed09","before":"9e5a5f1a0c7630df1141086530e23698930499cf","commits":[{"sha":"f92b106ccbf2b52784aa0de50c946c2cbf24ed09","author":{"email":"c24f01d25e2c94304e596feb894fac5a7ed7429c@gmail.com","name":"Rod Calumpong"},"message":"[TASK] Navigate between transactions and accounts section via top bar tabs","distinct":true,"url":"https://api.github.com/repos/gatewayd/gatewayd-banking-app/commits/f92b106ccbf2b52784aa0de50c946c2cbf24ed09"}]},"public":true,"created_at":"2015-01-01T01:07:39Z","org":{"id":8335076,"login":"gatewayd","gravatar_id":"","url":"https://api.github.com/orgs/gatewayd","avatar_url":"https://avatars.githubusercontent.com/u/8335076?"}}


================================================
FILE: benches/hdfs.json
================================================
[File too large to display: 21.4 MB]

================================================
FILE: benches/index-bench.rs
================================================
use criterion::{criterion_group, criterion_main, BatchSize, Bencher, Criterion, Throughput};
use tantivy::schema::{TantivyDocument, FAST, INDEXED, STORED, STRING, TEXT};
use tantivy::{tokenizer, Index, IndexWriter};

const HDFS_LOGS: &str = include_str!("hdfs.json");
const GH_LOGS: &str = include_str!("gh.json");
const WIKI: &str = include_str!("wiki.json");

/// Runs one indexing benchmark over `input`, choosing how documents are built.
///
/// When `is_dynamic` is set the work is delegated to [`benchmark_dynamic_json`].
/// Otherwise each piece of input handed to the document factory is parsed
/// against the schema with `TantivyDocument::parse_json`, panicking if parsing
/// fails. `commit` and `parse_json` are forwarded unchanged.
fn benchmark(
    b: &mut Bencher,
    input: &str,
    schema: tantivy::schema::Schema,
    commit: bool,
    parse_json: bool,
    is_dynamic: bool,
) {
    if !is_dynamic {
        return _benchmark(b, input, schema, commit, parse_json, |target_schema, line| {
            TantivyDocument::parse_json(target_schema, line).unwrap()
        });
    }
    benchmark_dynamic_json(b, input, schema, commit, parse_json)
}

/// Creates an in-RAM index for `schema` with a custom fast-field tokenizer set.
///
/// A tokenizer named `"raw"` is registered on a default `TokenizerManager`: a
/// `RawTokenizer` followed by `RemoveLongFilter::limit(255)`. That manager is
/// then installed as the index's fast-field tokenizers.
///
/// `schema` and the tokenizer manager are moved rather than cloned: both are
/// owned here and not used afterwards, and this helper runs inside the timed
/// benchmark closures, so the extra clones were pure overhead.
fn get_index(schema: tantivy::schema::Schema) -> Index {
    let mut index = Index::create_in_ram(schema);
    let ff_tokenizer_manager = tokenizer::TokenizerManager::default();
    ff_tokenizer_manager.register(
        "raw",
        tokenizer::TextAnalyzer::builder(tokenizer::RawTokenizer::default())
            .filter(tokenizer::RemoveLongFilter::limit(255))
            .build(),
    );
    index.set_fast_field_tokenizers(ff_tokenizer_manager);
    index
}

/// Shared driver behind every indexing benchmark in this file.
///
/// `input` is trimmed and split on `'\n'`; each piece is turned into a
/// document by `create_doc`. Two measurement modes exist:
///
/// * `include_json_parsing == true`: document creation happens inside the
///   closure given to `Bencher::iter`, interleaved with `add_document`.
/// * `include_json_parsing == false`: documents are created once up front and
///   every iteration works on a clone produced by the `iter_batched` setup
///   closure.
///
/// In both modes the measured routine builds a fresh index via `get_index`,
/// opens a writer with `writer_with_num_threads(1, 100_000_000)`, adds every
/// document and, when `commit` is set, commits. Any failure panics.
fn _benchmark(
    b: &mut Bencher,
    input: &str,
    schema: tantivy::schema::Schema,
    commit: bool,
    include_json_parsing: bool,
    create_doc: impl Fn(&tantivy::schema::Schema, &str) -> TantivyDocument,
) {
    // One full indexing pass: fresh index, single-threaded writer, optional commit.
    fn index_documents(
        schema: &tantivy::schema::Schema,
        documents: impl Iterator<Item = TantivyDocument>,
        commit: bool,
    ) {
        let index = get_index(schema.clone());
        let mut writer: IndexWriter = index.writer_with_num_threads(1, 100_000_000).unwrap();
        for document in documents {
            writer.add_document(document).unwrap();
        }
        if commit {
            writer.commit().unwrap();
        }
    }

    let raw_docs = input.trim().split('\n');
    if include_json_parsing {
        let lines: Vec<&str> = raw_docs.collect();
        b.iter(|| {
            // Documents are built lazily, so creation is part of the measurement.
            let parsed = lines.iter().map(|&line| create_doc(&schema, line));
            index_documents(&schema, parsed, commit);
        })
    } else {
        let prepared: Vec<TantivyDocument> = raw_docs
            .map(|line| create_doc(&schema, line))
            .collect();
        b.iter_batched(
            || prepared.clone(),
            |batch| index_documents(&schema, batch.into_iter(), commit),
            BatchSize::SmallInput,
        )
    }
}
/// Benchmarks indexing where each input line becomes one value of the `"json"` field.
///
/// The line is deserialized into a `serde_json::Value` and wrapped in a
/// single-field document; the schema argument passed to the document factory
/// is ignored.
///
/// Panics if `schema` has no field named `"json"` or if a line fails to
/// deserialize.
fn benchmark_dynamic_json(
    b: &mut Bencher,
    input: &str,
    schema: tantivy::schema::Schema,
    commit: bool,
    parse_json: bool,
) {
    // Resolve the field before `schema` is moved into `_benchmark`.
    let json_field = schema.get_field("json").unwrap();
    _benchmark(b, input, schema, commit, parse_json, |_, line| {
        let value = serde_json::from_str::<serde_json::Value>(line).unwrap();
        tantivy::doc!(json_field => value)
    })
}

/// Registers the `index-hdfs` benchmark group.
///
/// Three schemas are measured against `HDFS_LOGS` (indexed-only, fast-only and
/// a single dynamic JSON field), each once without and once with a final
/// commit. Throughput is reported in bytes of `HDFS_LOGS` and the sample size
/// is set to 20.
pub fn hdfs_index_benchmark(c: &mut Criterion) {
    let mut indexed_builder = tantivy::schema::SchemaBuilder::new();
    indexed_builder.add_u64_field("timestamp", INDEXED);
    indexed_builder.add_text_field("body", TEXT);
    indexed_builder.add_text_field("severity", STRING);
    let indexed_schema = indexed_builder.build();

    let mut fast_builder = tantivy::schema::SchemaBuilder::new();
    fast_builder.add_u64_field("timestamp", FAST);
    fast_builder.add_text_field("body", FAST);
    fast_builder.add_text_field("severity", FAST);
    let fast_schema = fast_builder.build();

    // Built but not benchmarked: the "stored-" variant is disabled in the table below.
    let mut stored_builder = tantivy::schema::SchemaBuilder::new();
    stored_builder.add_u64_field("timestamp", INDEXED | STORED);
    stored_builder.add_text_field("body", TEXT | STORED);
    stored_builder.add_text_field("severity", STRING | STORED);
    let _stored_schema = stored_builder.build();

    let mut dynamic_builder = tantivy::schema::SchemaBuilder::new();
    dynamic_builder.add_json_field("json", TEXT | FAST);
    let dynamic_schema = dynamic_builder.build();

    let mut group = c.benchmark_group("index-hdfs");
    group.throughput(Throughput::Bytes(HDFS_LOGS.len() as u64));
    group.sample_size(20);

    // (benchmark name prefix, schema, whether the schema is the dynamic JSON one)
    let variants = [
        ("only-indexed-".to_string(), indexed_schema, false),
        // ("stored-".to_string(), _stored_schema, false),
        ("only-fast-".to_string(), fast_schema, false),
        ("dynamic-".to_string(), dynamic_schema, true),
    ];

    // `parse_json` is fixed to `false`, so the "-with-json-parsing" suffix is
    // never appended at the moment.
    let parse_json = false;
    for (prefix, schema, is_dynamic) in variants {
        for commit in [false, true] {
            let mut bench_name = prefix.clone();
            bench_name.push_str(if commit { "with-commit" } else { "no-commit" });
            if parse_json {
                bench_name.push_str("-with-json-parsing");
            }
            group.bench_function(bench_name, |b| {
                benchmark(b, HDFS_LOGS, schema.clone(), commit, parse_json, is_dynamic)
            });
        }
    }
}

/// Registers the `index-gh` benchmark group over `GH_LOGS`.
///
/// Every case indexes the input through a single `"json"` field; the cases
/// differ in the field options (`TEXT | FAST` vs. `FAST` only) and in whether
/// the writer commits at the end. Throughput is reported in bytes of `GH_LOGS`.
pub fn gh_index_benchmark(c: &mut Criterion) {
    let mut text_and_fast = tantivy::schema::SchemaBuilder::new();
    text_and_fast.add_json_field("json", TEXT | FAST);
    let dynamic_schema = text_and_fast.build();

    let mut fast_only = tantivy::schema::SchemaBuilder::new();
    fast_only.add_json_field("json", FAST);
    let dynamic_schema_fast = fast_only.build();

    let mut group = c.benchmark_group("index-gh");
    group.throughput(Throughput::Bytes(GH_LOGS.len() as u64));

    // (benchmark name, schema, commit at the end)
    let cases = [
        ("index-gh-no-commit", &dynamic_schema, false),
        ("index-gh-fast", &dynamic_schema_fast, false),
        ("index-gh-fast-with-commit", &dynamic_schema_fast, true),
    ];
    for (bench_name, schema, commit) in cases {
        group.bench_function(bench_name, |b| {
            benchmark_dynamic_json(b, GH_LOGS, schema.clone(), commit, false)
        });
    }
}

/// Registers the `index-wiki` benchmark group over `WIKI`.
///
/// The input is indexed through a single `"json"` field declared as
/// `TEXT | FAST`, once without and once with a final commit. Throughput is
/// reported in bytes of `WIKI`.
pub fn wiki_index_benchmark(c: &mut Criterion) {
    let mut builder = tantivy::schema::SchemaBuilder::new();
    builder.add_json_field("json", TEXT | FAST);
    let dynamic_schema = builder.build();

    let mut group = c.benchmark_group("index-wiki");
    group.throughput(Throughput::Bytes(WIKI.len() as u64));

    // (benchmark name, commit at the end)
    for (bench_name, commit) in [
        ("index-wiki-no-commit", false),
        ("index-wiki-with-commit", true),
    ] {
        group.bench_function(bench_name, |b| {
            benchmark_dynamic_json(b, WIKI, dynamic_schema.clone(), commit, false)
        });
    }
}

// One criterion group per dataset. The short `criterion_group!` form uses
// `Criterion::default()` as its configuration.
criterion_group!(benches, hdfs_index_benchmark);
criterion_group!(gh_benches, gh_index_benchmark);
criterion_group!(wiki_benches, wiki_index_benchmark);
criterion_main!(benches, gh_benches, wiki_benches);


================================================
FILE: benches/merge_segments.rs
================================================
// Benchmarks segment merging
//
// Notes:
// - Input segments are kept intact (no deletes / no IndexWriter merge).
// - Output is written to a `NullDirectory` that discards all files except
//   fieldnorms (needed for merging).

use std::collections::HashMap;
use std::io::{self, Write};
use std::path::{Path, PathBuf};
use std::sync::{Arc, RwLock};

use binggan::{black_box, BenchRunner};
use rand::prelude::*;
use rand::rngs::StdRng;
use rand::SeedableRng;
use tantivy::directory::error::{DeleteError, OpenReadError, OpenWriteError};
use tantivy::directory::{
    AntiCallToken, Directory, FileHandle, OwnedBytes, TerminatingWrite, WatchCallback, WatchHandle,
    WritePtr,
};
use tantivy::indexer::{merge_filtered_segments, NoMergePolicy};
use tantivy::schema::{Schema, TEXT};
use tantivy::{doc, HasLen, Index, IndexSettings, Segment};

/// Directory used as the merge output of this benchmark.
///
/// `blobs` maps a path to the bytes kept in memory for it. The map sits behind
/// an `Arc<RwLock<..>>` so that the `InMemoryWriter`s handed out by
/// `open_write` can insert into the same map.
#[derive(Clone, Default, Debug)]
struct NullDirectory {
    blobs: Arc<RwLock<HashMap<PathBuf, OwnedBytes>>>,
}

/// Writer that accepts any amount of data and throws it away.
struct NullWriter;

impl Write for NullWriter {
    /// Reports the whole of `buf` as written without storing any of it.
    fn write(&mut self, buf: &[u8]) -> io::Result<usize> {
        let accepted = buf.len();
        Ok(accepted)
    }

    /// Nothing is ever buffered, so flushing always succeeds.
    fn flush(&mut self) -> io::Result<()> {
        Ok(())
    }
}

impl TerminatingWrite for NullWriter {
    /// No-op: this writer retains nothing, so termination always succeeds.
    fn terminate_ref(&mut self, _token: AntiCallToken) -> io::Result<()> {
        Ok(())
    }
}

/// Writer that accumulates everything written to it in `buffer` and, on
/// termination, stores the accumulated bytes in `blobs` under `path`.
struct InMemoryWriter {
    // Key under which the finished bytes are inserted into `blobs`.
    path: PathBuf,
    // Bytes received so far.
    buffer: Vec<u8>,
    // Map that receives the finished bytes when the writer is terminated.
    blobs: Arc<RwLock<HashMap<PathBuf, OwnedBytes>>>,
}

impl Write for InMemoryWriter {
    /// Appends `buf` to the in-memory buffer and reports it as fully written.
    fn write(&mut self, buf: &[u8]) -> io::Result<usize> {
        // `Vec<u8>` implements `Write` by appending and returning `buf.len()`.
        self.buffer.write(buf)
    }

    /// Data only becomes visible on termination, so there is nothing to flush.
    fn flush(&mut self) -> io::Result<()> {
        Ok(())
    }
}

impl TerminatingWrite for InMemoryWriter {
    /// Moves the accumulated bytes out of the writer (leaving its buffer
    /// empty) and stores them in the shared map under this writer's path.
    ///
    /// Panics if the map's lock is poisoned.
    fn terminate_ref(&mut self, _token: AntiCallToken) -> io::Result<()> {
        let payload = OwnedBytes::new(std::mem::take(&mut self.buffer));
        let key = self.path.clone();
        let mut registry = self.blobs.write().unwrap();
        registry.insert(key, payload);
        Ok(())
    }
}

#[derive(Debug, Default)]
struct NullFileHandle;
impl HasLen for NullFileHandle {
    fn len(&self) -> usize {
        0
    }
}
impl FileHandle for NullFileHandle {
    /// Not implemented: calling this panics via `unimplemented!()`.
    fn read_bytes(&self, _range: std::ops::Range<usize>) -> io::Result<OwnedBytes> {
        unimplemented!()
    }
}

impl Directory for NullDirectory {
    fn get_file_handle(&self, path: &Path) -> Result<Arc<dyn FileHandle>, OpenReadError> {
        if let Some(bytes) = self.blobs.read().unwrap().get(path) {
            return Ok(Arc::new(bytes.clone()));
        }
        Ok(Arc::new(NullFileHandle))
    }

    fn delete(&self, _path: &Path) -> Result<(), DeleteError> {
        Ok(())
    }

    fn exists(&self, _path: &Path) -> Result<bool, OpenReadError> {
        Ok(true)
    }

    fn open_write(&self, path: &Path) -> Result<WritePtr, OpenWriteError> {
        let path_buf = path.to_path_buf();
        if path.to_string_lossy().ends_with(".fieldnorm") {
            let writer = InMemoryWriter {
                path: path_buf,
                buffer: Vec::new(),
                blobs: Arc::clone(&self.blobs),
            };
            Ok(io::BufWriter::new(Box::new(writer)))
        } else {
            Ok(io::BufWriter::new(Box::new(NullWriter)))
        }
    }

    fn atomic_read(&self, path: &Path) -> Result<Vec<u8>, OpenReadError> {
        if let Some(bytes) = self.blobs.read().unwrap().get(path) {
            return Ok(bytes.as_slice().to_vec());
        }
        Err(OpenReadError::FileDoesNotExist(path.to_path_buf()))
    }

    fn atomic_write(&self, _path: &Path, _data: &[u8]) -> io::Result<()> {
        Ok(())
    }

    fn sync_directory(&self) -> io::Result<()> {
        Ok(())
    }

    fn watch(&self, _watch_callback: WatchCallback) -> tantivy::Result<WatchHandle> {
        Ok(WatchHandle::empty())
    }
}

/// One prepared benchmark input: an index, its segments, and a display label.
struct MergeScenario {
    // Held but never read (hence the `allow`); `segments` were obtained from this index.
    #[allow(dead_code)]
    index: Index,
    // Segments returned by `index.searchable_segments()`; the merge inputs.
    segments: Vec<Segment>,
    // Copy of the index settings, passed to the merge.
    settings: IndexSettings,
    // Human-readable description of the scenario parameters.
    label: String,
}

/// Builds an in-RAM index with a single `body` text field, committing once
/// per segment so that `num_segments` commits are issued with merging disabled.
///
/// Each document holds `tokens_per_doc` tokens of the form `term_<id>`. When
/// `vocab_size` is at least the total number of tokens, ids are handed out
/// sequentially so every token is unique; otherwise ids are drawn from
/// `0..vocab_size` with a fixed-seed RNG.
///
/// Panics if `vocab_size` is zero.
fn build_index(
    num_segments: usize,
    docs_per_segment: usize,
    tokens_per_doc: usize,
    vocab_size: usize,
) -> MergeScenario {
    let mut schema_builder = Schema::builder();
    let body = schema_builder.add_text_field("body", TEXT);
    let index = Index::create_in_ram(schema_builder.build());

    assert!(vocab_size > 0);
    let use_unique_terms = vocab_size >= num_segments * docs_per_segment * tokens_per_doc;
    let mut rng = StdRng::from_seed([7u8; 32]);
    let mut next_token_id: u64 = 0;

    {
        let mut writer = index.writer_with_num_threads(1, 256_000_000).unwrap();
        writer.set_merge_policy(Box::new(NoMergePolicy));
        for _segment in 0..num_segments {
            for _doc in 0..docs_per_segment {
                let body_text = (0..tokens_per_doc)
                    .map(|_| {
                        let token_id = if use_unique_terms {
                            let id = next_token_id;
                            next_token_id += 1;
                            id
                        } else {
                            rng.random_range(0..vocab_size as u64)
                        };
                        format!("term_{token_id}")
                    })
                    .collect::<Vec<_>>()
                    .join(" ");
                writer.add_document(doc!(body => body_text)).unwrap();
            }
            // One commit per outer iteration.
            writer.commit().unwrap();
        }
    }

    let label = format!(
        "segments={num_segments}, docs/seg={docs_per_segment}, tokens/doc={tokens_per_doc}, \
         vocab={vocab_size}"
    );
    let segments = index.searchable_segments().unwrap();
    let settings = index.settings().clone();

    MergeScenario {
        index,
        segments,
        settings,
        label,
    }
}

fn main() {
    let scenarios = vec![
        build_index(8, 50_000, 12, 8),
        build_index(16, 50_000, 12, 8),
        build_index(16, 100_000, 12, 8),
        build_index(8, 50_000, 8, 8 * 50_000 * 8),
    ];

    let mut runner = BenchRunner::new();
    for scenario in scenarios {
        let mut group = runner.new_group();
        group.set_name(format!("merge_segments inv_index — {}", scenario.label));
        let segments = scenario.segments.clone();
        let settings = scenario.settings.clone();
        group.register("merge", move |_| {
            let output_dir = NullDirectory::default();
            let filter_doc_ids = vec![None; segments.len()];
            let merged_index =
                merge_filtered_segments(&segments, settings.clone(), filter_doc_ids, output_dir)
                    .unwrap();
            black_box(merged_index);
        });

        group.run();
    }
}


================================================
FILE: benches/range_queries.rs
================================================
use std::ops::Bound;

use binggan::{black_box, BenchGroup, BenchRunner};
use rand::prelude::*;
use rand::rngs::StdRng;
use rand::SeedableRng;
use tantivy::collector::{Count, DocSetCollector, TopDocs};
use tantivy::query::RangeQuery;
use tantivy::schema::{Schema, FAST, INDEXED};
use tantivy::{doc, Index, Order, ReloadPolicy, Searcher, Term};

/// An index together with a searcher created from it.
#[derive(Clone)]
struct BenchIndex {
    // Held but never read (hence the `allow`).
    #[allow(dead_code)]
    index: Index,
    // Searcher cloned into each registered benchmark task.
    searcher: Searcher,
}

/// Builds an in-RAM index with two indexed fast `u64` fields and returns it
/// with a manually reloaded searcher.
///
/// * `"dense"`: `num_rand_fast` is drawn from `0..1000`, `num_asc_fast` is `doc_id / 10000`.
/// * `"sparse"`: `num_rand_fast` is drawn from `0..10000000`, `num_asc_fast` is `doc_id`.
///
/// Panics on any other `distribution`.
fn build_shared_indices(num_docs: usize, distribution: &str) -> BenchIndex {
    let mut schema_builder = Schema::builder();
    let f_num_rand_fast = schema_builder.add_u64_field("num_rand_fast", INDEXED | FAST);
    let f_num_asc_fast = schema_builder.add_u64_field("num_asc_fast", INDEXED | FAST);
    let index = Index::create_in_ram(schema_builder.build());

    // Fixed seed so every run indexes the same values.
    let mut rng = StdRng::from_seed([7u8; 32]);

    {
        let mut writer = index.writer_with_num_threads(1, 4_000_000_000).unwrap();

        // Exclusive upper bound of the random field, and the divisor applied
        // to the document ordinal for the ascending field.
        let (rand_upper, asc_divisor): (u64, usize) = match distribution {
            "dense" => (1000, 10000),
            "sparse" => (10000000, 1),
            _ => panic!("Unsupported distribution type"),
        };

        for doc_id in 0..num_docs {
            let num_rand = rng.random_range(0u64..rand_upper);
            let num_asc = (doc_id / asc_divisor) as u64;
            writer
                .add_document(doc!(
                    f_num_rand_fast => num_rand,
                    f_num_asc_fast => num_asc,
                ))
                .unwrap();
        }
        writer.commit().unwrap();
    }

    // The reader and searcher are created once and shared by all tasks.
    let reader = index
        .reader_builder()
        .reload_policy(ReloadPolicy::Manual)
        .try_into()
        .unwrap();
    let searcher = reader.searcher();

    BenchIndex { index, searcher }
}

/// Runs one benchmark group per scenario; each group issues the same
/// inclusive range query against both fast fields.
fn main() {
    // (group name, document count, distribution, range low, range high) — bounds are inclusive.
    let scenarios = [
        ("dense_values_search_low_value_range", 10_000_000, "dense", 0, 9),
        ("dense_values_search_high_value_range", 10_000_000, "dense", 990, 999),
        ("dense_values_search_out_of_range", 10_000_000, "dense", 1000, 1002),
        ("sparse_values_search_low_value_range", 10_000_000, "sparse", 0, 9),
        ("sparse_values_search_high_value_range", 10_000_000, "sparse", 9_999_990, 9_999_999),
        ("sparse_values_search_out_of_range", 10_000_000, "sparse", 10_000_000, 10_000_002),
    ];

    let mut runner = BenchRunner::new();
    for (scenario_id, n, num_rand_distribution, range_low, range_high) in scenarios {
        // A fresh index is built for every scenario.
        let bench_index = build_shared_indices(n, num_rand_distribution);

        let mut group = runner.new_group();
        group.set_name(scenario_id.to_string());

        for field_name in ["num_rand_fast", "num_asc_fast"] {
            let field = bench_index.searcher.schema().get_field(field_name).unwrap();
            let lower_bound = Bound::Included(Term::from_field_u64(field, range_low));
            let upper_bound = Bound::Included(Term::from_field_u64(field, range_high));

            run_benchmark_tasks(
                &mut group,
                &bench_index,
                RangeQuery::new(lower_bound, upper_bound),
                field_name,
                range_low,
                range_high,
            );
        }

        group.run();
    }
}

/// Registers the count, top-100 ascending and top-100 descending tasks for
/// one range query on `field_name`.
fn run_benchmark_tasks(
    bench_group: &mut BenchGroup,
    bench_index: &BenchIndex,
    query: RangeQuery,
    field_name: &str,
    range_low: u64,
    range_high: u64,
) {
    add_bench_task_count(
        bench_group,
        bench_index,
        query.clone(),
        "count",
        field_name,
        range_low,
        range_high,
    );

    // Top 100 ordered by the queried field, ascending.
    let asc_collector_name = format!("top100_by_{}_asc", field_name);
    add_bench_task_top100_asc(
        bench_group,
        bench_index,
        query.clone(),
        &asc_collector_name,
        field_name,
        range_low,
        range_high,
        field_name.to_string(),
    );

    // Top 100 ordered by the queried field, descending; consumes the query.
    let desc_collector_name = format!("top100_by_{}_desc", field_name);
    add_bench_task_top100_desc(
        bench_group,
        bench_index,
        query,
        &desc_collector_name,
        field_name,
        range_low,
        range_high,
        field_name.to_string(),
    );
}

/// Registers a task that counts the documents matching `query`.
///
/// The task is named `range_<field>_[<low> TO <high>]_<collector>`.
fn add_bench_task_count(
    bench_group: &mut BenchGroup,
    bench_index: &BenchIndex,
    query: RangeQuery,
    collector_name: &str,
    field_name: &str,
    range_low: u64,
    range_high: u64,
) {
    let search_task = CountSearchTask {
        searcher: bench_index.searcher.clone(),
        query,
    };
    let task_name = format!("range_{field_name}_[{range_low} TO {range_high}]_{collector_name}");
    bench_group.register(task_name, move |_| black_box(search_task.run()));
}

/// Registers a task that collects the full doc set matching `query`.
///
/// The task is named `range_<field>_[<low> TO <high>]_<collector>`.
fn add_bench_task_docset(
    bench_group: &mut BenchGroup,
    bench_index: &BenchIndex,
    query: RangeQuery,
    collector_name: &str,
    field_name: &str,
    range_low: u64,
    range_high: u64,
) {
    let searcher = bench_index.searcher.clone();
    let search_task = DocSetSearchTask { searcher, query };
    let task_name = format!("range_{field_name}_[{range_low} TO {range_high}]_{collector_name}");
    bench_group.register(task_name, move |_| black_box(search_task.run()));
}

/// Registers a task that fetches the top 100 matches ordered ascending by
/// the fast field named `field_name_owned`.
///
/// The task is named `range_<field>_[<low> TO <high>]_<collector>`.
fn add_bench_task_top100_asc(
    bench_group: &mut BenchGroup,
    bench_index: &BenchIndex,
    query: RangeQuery,
    collector_name: &str,
    field_name: &str,
    range_low: u64,
    range_high: u64,
    field_name_owned: String,
) {
    let search_task = Top100AscSearchTask {
        searcher: bench_index.searcher.clone(),
        query,
        field_name: field_name_owned,
    };
    bench_group.register(
        format!("range_{field_name}_[{range_low} TO {range_high}]_{collector_name}"),
        move |_| black_box(search_task.run()),
    );
}

/// Registers a task that fetches the top 100 matches ordered descending by
/// the fast field named `field_name_owned`.
///
/// The task is named `range_<field>_[<low> TO <high>]_<collector>`.
fn add_bench_task_top100_desc(
    bench_group: &mut BenchGroup,
    bench_index: &BenchIndex,
    query: RangeQuery,
    collector_name: &str,
    field_name: &str,
    range_low: u64,
    range_high: u64,
    field_name_owned: String,
) {
    let search_task = Top100DescSearchTask {
        searcher: bench_index.searcher.clone(),
        query,
        field_name: field_name_owned,
    };
    bench_group.register(
        format!("range_{field_name}_[{range_low} TO {range_high}]_{collector_name}"),
        move |_| black_box(search_task.run()),
    );
}

/// Benchmark task: count the documents matching a range query.
struct CountSearchTask {
    searcher: Searcher,
    query: RangeQuery,
}

impl CountSearchTask {
    /// Runs the query with the `Count` collector and returns the hit count.
    #[inline(never)]
    pub fn run(&self) -> usize {
        let Self { searcher, query } = self;
        searcher.search(query, &Count).unwrap()
    }
}

/// Benchmark task: collect the full set of documents matching a range query.
struct DocSetSearchTask {
    searcher: Searcher,
    query: RangeQuery,
}

impl DocSetSearchTask {
    /// Runs the query with `DocSetCollector` and returns the size of the collected set.
    #[inline(never)]
    pub fn run(&self) -> usize {
        self.searcher
            .search(&self.query, &DocSetCollector)
            .unwrap()
            .len()
    }
}

/// Benchmark task: top 100 matches ordered ascending by a `u64` fast field.
struct Top100AscSearchTask {
    searcher: Searcher,
    query: RangeQuery,
    field_name: String,
}

impl Top100AscSearchTask {
    /// Runs the query, loads the document of every returned hit, and returns
    /// the number of hits.
    #[inline(never)]
    pub fn run(&self) -> usize {
        let by_field_asc =
            TopDocs::with_limit(100).order_by_fast_field::<u64>(&self.field_name, Order::Asc);
        let top_hits = self.searcher.search(&self.query, &by_field_asc).unwrap();
        // The loaded documents are discarded; only the load itself is exercised.
        top_hits.iter().for_each(|(_sort_value, doc_address)| {
            let _doc: tantivy::TantivyDocument = self.searcher.doc(*doc_address).unwrap();
        });
        top_hits.len()
    }
}

/// Benchmark task: top 100 matches ordered descending by a `u64` fast field.
struct Top100DescSearchTask {
    searcher: Searcher,
    query: RangeQuery,
    field_name: String,
}

impl Top100DescSearchTask {
    /// Runs the query, loads the document of every returned hit, and returns
    /// the number of hits.
    #[inline(never)]
    pub fn run(&self) -> usize {
        let by_field_desc =
            TopDocs::with_limit(100).order_by_fast_field::<u64>(&self.field_name, Order::Desc);
        let top_hits = self.searcher.search(&self.query, &by_field_desc).unwrap();
        // The loaded documents are discarded; only the load itself is exercised.
        top_hits.iter().for_each(|(_sort_value, doc_address)| {
            let _doc: tantivy::TantivyDocument = self.searcher.doc(*doc_address).unwrap();
        });
        top_hits.len()
    }
}


================================================
FILE: benches/range_query.rs
================================================
use std::fmt::Display;
use std::net::Ipv6Addr;
use std::ops::RangeInclusive;

use binggan::plugins::PeakMemAllocPlugin;
use binggan::{black_box, BenchRunner, OutputValue, PeakMemAlloc, INSTRUMENTED_SYSTEM};
use columnar::MonotonicallyMappableToU128;
use rand::rngs::StdRng;
use rand::{Rng, SeedableRng};
use tantivy::collector::{Count, TopDocs};
use tantivy::query::QueryParser;
use tantivy::schema::*;
use tantivy::{doc, Index};

#[global_allocator]
pub static GLOBAL: &PeakMemAlloc<std::alloc::System> = &INSTRUMENTED_SYSTEM;

/// Benchmark entry point; delegates to `bench_range_query`.
fn main() {
    bench_range_query();
}

/// Builds the shared index once and runs the range benchmarks, first on the
/// `u64` fields and then on the IP fields, with peak-memory tracking enabled.
fn bench_range_query() {
    let index = get_index_0_to_100();
    let mut runner = BenchRunner::new();
    runner.add_plugin(PeakMemAllocPlugin::new(GLOBAL));

    // (field name, group description)
    let u64_fields = [
        ("id", "Single Valued Range Field"),
        ("ids", "Multi Valued Range Field"),
    ];
    let u64_ranges = vec![
        ("90_percent", get_90_percent()),
        ("10_percent", get_10_percent()),
        ("1_percent", get_1_percent()),
    ];
    runner.set_name("range_query on u64");
    test_range(&mut runner, &index, &u64_fields, u64_ranges);

    let ip_fields = [
        ("ip", "Single Valued Range Field"),
        ("ips", "Multi Valued Range Field"),
    ];
    let ip_ranges = vec![
        ("90_percent", get_90_percent_ip()),
        ("10_percent", get_10_percent_ip()),
        ("1_percent", get_1_percent_ip()),
    ];
    runner.set_name("range_query on ip");
    test_range(&mut runner, &index, &ip_fields, ip_ranges);
}

/// Runs one benchmark group per field, covering every combination of a range
/// and an optional `id_name` term filter.
///
/// The empty term entry means "range only"; the other entries append
/// `AND id_name:<term>` to the range query.
fn test_range<T: Display>(
    runner: &mut BenchRunner,
    index: &Index,
    field_name_and_descr: &[(&str, &str)],
    range_num_hits: Vec<(&str, RangeInclusive<T>)>,
) {
    for (field, suffix) in field_name_and_descr {
        // Declared before the group: the registered closures borrow from it.
        let term_num_hits = vec![
            ("", ""),
            ("1_percent", "veryfew"),
            ("10_percent", "few"),
            ("90_percent", "most"),
        ];
        let mut group = runner.new_group();
        group.set_name(suffix);

        for (range_name, range) in &range_num_hits {
            for (term_name, term) in &term_num_hits {
                let index = &index;
                let has_term = !term_name.is_empty();
                let test_name = if has_term {
                    format!(
                        "id_range_hit_{}_intersect_with_term_{}",
                        range_name, term_name
                    )
                } else {
                    format!("id_range_hit_{}", range_name)
                };
                group.register(test_name, move |_| {
                    let query = if has_term {
                        format!("AND id_name:{}", term)
                    } else {
                        String::new()
                    };
                    black_box(execute_query(field, range, &query, index));
                });
            }
        }
        group.run();
    }
}

/// Generates 100 000 documents with a fixed-seed RNG and indexes them.
///
/// `id` is drawn from `0..100`; `ip` is a value from `0..100` multiplied by 1000.
fn get_index_0_to_100() -> Index {
    const NUM_DOCS: usize = 100_000;

    let mut rng = StdRng::from_seed([1u8; 32]);
    let mut docs = Vec::with_capacity(NUM_DOCS);
    for _ in 0..NUM_DOCS {
        let id_name = if rng.random_bool(0.01) {
            "veryfew" // 1%
        } else if rng.random_bool(0.1) {
            "few" // 10% of the remaining 99%, i.e. about 9.9%
        } else {
            "most" // the rest, about 89.1%
        };
        let id: u64 = rng.random_range(0..100);
        // Multiply by 1000, so that we create most buckets in the compact space.
        // The benches depend on this range to select n-percent of elements with
        // the `get_*_percent_ip` helpers.
        let ip = Ipv6Addr::from_u128(rng.random_range(0..100) * 1000);
        docs.push(Doc {
            id_name: id_name.to_string(),
            id,
            ip,
        });
    }

    create_index_from_docs(&docs)
}

/// Source record for one indexed document.
#[derive(Clone, Debug)]
pub struct Doc {
    // Written to the `id_name` and `id_name_fast` text fields.
    pub id_name: String,
    // Written to every numeric field (cast to `i64` / `f64` where needed).
    pub id: u64,
    // Written to the `ip` and `ips` fields.
    pub ip: Ipv6Addr,
}

/// Creates an in-RAM index from `docs` and commits it in a single commit.
///
/// Every numeric type gets a field that receives one value per document
/// (`id*`) and a field that receives the same value twice (`ids*`); the IP
/// fields `ip` / `ips` follow the same pattern.
pub fn create_index_from_docs(docs: &[Doc]) -> Index {
    // Options shared by the fields that receive two values per document.
    let fast_indexed = || NumericOptions::default().set_fast().set_indexed();

    let mut schema_builder = Schema::builder();
    let id_u64_field = schema_builder.add_u64_field("id", INDEXED | STORED | FAST);
    let ids_u64_field = schema_builder.add_u64_field("ids", fast_indexed());

    let id_f64_field = schema_builder.add_f64_field("id_f64", INDEXED | STORED | FAST);
    let ids_f64_field = schema_builder.add_f64_field("ids_f64", fast_indexed());

    let id_i64_field = schema_builder.add_i64_field("id_i64", INDEXED | STORED | FAST);
    let ids_i64_field = schema_builder.add_i64_field("ids_i64", fast_indexed());

    let text_field = schema_builder.add_text_field("id_name", STRING | STORED);
    let text_field2 = schema_builder.add_text_field("id_name_fast", STRING | STORED | FAST);

    let ip_field = schema_builder.add_ip_addr_field("ip", FAST);
    let ips_field = schema_builder.add_ip_addr_field("ips", FAST);

    let index = Index::create_in_ram(schema_builder.build());

    {
        let mut index_writer = index.writer_with_num_threads(1, 50_000_000).unwrap();
        for entry in docs {
            let document = doc!(
                ids_i64_field => entry.id as i64,
                ids_i64_field => entry.id as i64,
                ids_f64_field => entry.id as f64,
                ids_f64_field => entry.id as f64,
                ids_u64_field => entry.id,
                ids_u64_field => entry.id,
                id_u64_field => entry.id,
                id_f64_field => entry.id as f64,
                id_i64_field => entry.id as i64,
                text_field => entry.id_name.clone(),
                text_field2 => entry.id_name.clone(),
                ips_field => entry.ip,
                ips_field => entry.ip,
                ip_field => entry.ip,
            );
            index_writer.add_document(document).unwrap();
        }

        index_writer.commit().unwrap();
    }
    index
}

/// Inclusive id range `0..=90`, used as the "90 percent" selection.
fn get_90_percent() -> RangeInclusive<u64> {
    RangeInclusive::new(0, 90)
}

/// Inclusive id range `0..=10`, used as the "10 percent" selection.
fn get_10_percent() -> RangeInclusive<u64> {
    RangeInclusive::new(0, 10)
}

/// Single-value id range `10..=10`, used as the "1 percent" selection.
fn get_1_percent() -> RangeInclusive<u64> {
    RangeInclusive::new(10, 10)
}

/// Inclusive IP range from `0` to `90 * 1000`, used as the "90 percent" selection.
fn get_90_percent_ip() -> RangeInclusive<Ipv6Addr> {
    Ipv6Addr::from_u128(0)..=Ipv6Addr::from_u128(90 * 1000)
}

/// Inclusive IP range from `0` to `10 * 1000`, used as the "10 percent" selection.
fn get_10_percent_ip() -> RangeInclusive<Ipv6Addr> {
    Ipv6Addr::from_u128(0)..=Ipv6Addr::from_u128(10 * 1000)
}

fn get_1_percent_ip() -> RangeInclusive<Ipv6Addr> {
    let start = Ipv6Addr::from_u128(10 * 1000);
    let end = Ipv6Addr::from_u128(10 * 1000);
    start..=end
}

/// Benchmark output value carrying the number of hits of a query.
struct NumHits {
    count: usize,
}
impl OutputValue for NumHits {
    /// Title of the column this value is reported under.
    fn column_title() -> &'static str {
        "NumHits"
    }
    /// Renders the hit count as a decimal string.
    fn format(&self) -> Option<String> {
        Some(self.count.to_string())
    }
}

/// Builds the query text `<field>:[<start> TO <end>] <suffix>` from the
/// inclusive range and executes it against `index`.
fn execute_query<T: Display>(
    field: &str,
    id_range: &RangeInclusive<T>,
    suffix: &str,
    index: &Index,
) -> NumHits {
    let (from, to) = (id_range.start(), id_range.end());
    let query = format!("{}:[{} TO {}] {}", field, from, to, suffix);
    execute_query_(&query, index)
}

/// Parses `query`, runs it with a top-10-by-score collector paired with
/// `Count`, and returns the count.
///
/// A new reader and searcher are created on every call.
fn execute_query_(query: &str, index: &Index) -> NumHits {
    let parser = QueryParser::for_index(index, vec![]);
    let parsed_query = parser.parse_query(query).unwrap();

    let reader = index.reader().unwrap();
    let searcher = reader.searcher();
    let collectors = (TopDocs::with_limit(10).order_by_score(), Count);
    let (_top_docs, count) = searcher.search(&parsed_query, &collectors).unwrap();
    NumHits { count }
}


================================================
FILE: benches/regex_all_terms.rs
================================================
// Benchmarks regex query that matches all terms in a synthetic index.
//
// Corpus model:
// - N unique terms: t000000, t000001, ...
// - M docs
// - K tokens per doc: doc i gets terms derived from (i, token_index)
//
// Query:
// - Regex "t.*" to match all terms
//
// Run with:
// - cargo bench --bench regex_all_terms
//

use std::fmt::Write;

use binggan::{black_box, BenchRunner};
use tantivy::collector::Count;
use tantivy::query::RegexQuery;
use tantivy::schema::{Schema, TEXT};
use tantivy::{doc, Index, ReloadPolicy};

const HEAP_SIZE_BYTES: usize = 200_000_000;

/// Parameters of one synthetic corpus.
#[derive(Clone, Copy)]
struct BenchConfig {
    // Term ids are taken modulo this value when the corpus is generated.
    num_terms: usize,
    // Number of documents to index.
    num_docs: usize,
    // Number of tokens written into each document.
    tokens_per_doc: usize,
}

fn main() {
    let configs = default_configs();

    let mut runner = BenchRunner::new();
    for config in configs {
        let (index, text_field) = build_index(config, HEAP_SIZE_BYTES);
        let reader = index
            .reader_builder()
            .reload_policy(ReloadPolicy::Manual)
            .try_into()
            .expect("reader");
        let searcher = reader.searcher();
        let query = RegexQuery::from_pattern("t.*", text_field).expect("regex query");

        let mut group = runner.new_group();
        group.set_name(format!(
            "regex_all_terms_t{}_d{}_k{}",
            config.num_terms, config.num_docs, config.tokens_per_doc
        ));
        group.register("regex_count", move |_| {
            let count = searcher.search(&query, &Count).expect("search");
            black_box(count);
        });
        group.run();
    }
}

/// Returns the four benchmark configurations: 10 000 or 100 000 terms, each
/// with 1 or 8 tokens per document, always over 100 000 documents.
fn default_configs() -> Vec<BenchConfig> {
    const NUM_DOCS: usize = 100_000;

    let mut configs = Vec::with_capacity(4);
    // The term count varies slowest, matching the order groups are reported in.
    for num_terms in [10_000, 100_000] {
        for tokens_per_doc in [1, 8] {
            configs.push(BenchConfig {
                num_terms,
                num_docs: NUM_DOCS,
                tokens_per_doc,
            });
        }
    }
    configs
}

/// Builds an in-RAM index with one `text` field and returns it with that field.
///
/// Token `k` of document `i` is the term with id
/// `(i * tokens_per_doc + k) % num_terms`, written as `t` followed by the id
/// zero-padded to the number of decimal digits of `num_terms`.
fn build_index(config: BenchConfig, heap_size_bytes: usize) -> (Index, tantivy::schema::Field) {
    let mut schema_builder = Schema::builder();
    let text_field = schema_builder.add_text_field("text", TEXT);
    let index = Index::create_in_ram(schema_builder.build());

    let term_width = config.num_terms.to_string().len();
    {
        let mut writer = index
            .writer_with_num_threads(1, heap_size_bytes)
            .expect("writer");
        // One buffer reused for the text of every document.
        let mut doc_text = String::new();
        for doc_id in 0..config.num_docs {
            doc_text.clear();
            for token_idx in 0..config.tokens_per_doc {
                // Every token is non-empty, so a non-empty buffer means this
                // is not the first token of the document.
                if !doc_text.is_empty() {
                    doc_text.push(' ');
                }
                let term_id = (doc_id * config.tokens_per_doc + token_idx) % config.num_terms;
                write!(doc_text, "t{:0width$}", term_id, width = term_width)
                    .expect("write token");
            }
            writer
                .add_document(doc!(text_field => doc_text.as_str()))
                .expect("add_document");
        }
        writer.commit().expect("commit");
    }

    (index, text_field)
}


================================================
FILE: benches/str_search_and_get.rs
================================================
// This benchmark compares different approaches for retrieving string values:
//
// 1. Fast Field Approach: retrieves string values via term_ords() and ord_to_str()
//
// 2. Doc Store Approach: retrieves string values via searcher.doc() and field extraction
//
// The benchmark includes various data distributions:
// - Dense Sequential: Sequential document IDs with dense data
// - Dense Random: Random document IDs with dense data
// - Sparse Sequential: Sequential document IDs with sparse data
// - Sparse Random: Random document IDs with sparse data
use std::ops::Bound;

use binggan::{black_box, BenchGroup, BenchRunner};
use rand::prelude::*;
use rand::rngs::StdRng;
use rand::SeedableRng;
use tantivy::collector::{Count, DocSetCollector};
use tantivy::query::RangeQuery;
use tantivy::schema::document::TantivyDocument;
use tantivy::schema::{Schema, Value, FAST, STORED, STRING};
use tantivy::{doc, Index, ReloadPolicy, Searcher, Term};

/// An index together with a searcher created from it.
#[derive(Clone)]
struct BenchIndex {
    // Held but never read (hence the `allow`).
    #[allow(dead_code)]
    index: Index,
    // Searcher cloned into each registered benchmark task.
    searcher: Searcher,
}

/// Builds an in-RAM index of `num_docs` documents and returns it with a
/// manually reloaded searcher.
///
/// Each document stores the same string in `str_fast` (string, stored, fast)
/// and `str_stored` (string, stored). The string depends on `distribution`:
///
/// * `"dense_random"`: `str_NNN` with a random suffix in `0..1000`.
/// * `"dense_sequential"`: `str_NNN` with suffix `doc_id % 1000`.
/// * `"sparse_random"`: `str_NNNNNNN` with a random suffix in `0..1000000`.
/// * `"sparse_sequential"`: `str_NNNNNNN` with suffix `doc_id`.
///
/// Panics on any other `distribution`.
fn build_shared_indices(num_docs: usize, distribution: &str) -> BenchIndex {
    // Schema with string fast field and stored field for doc access
    let mut schema_builder = Schema::builder();
    let f_str_fast = schema_builder.add_text_field("str_fast", STRING | STORED | FAST);
    let f_str_stored = schema_builder.add_text_field("str_stored", STRING | STORED);
    let index = Index::create_in_ram(schema_builder.build());

    // Populate index with stable RNG for reproducibility.
    let mut rng = StdRng::from_seed([7u8; 32]);

    {
        let mut writer = index.writer_with_num_threads(1, 4_000_000_000).unwrap();

        // Writes one document carrying `str_val` in both fields.
        let add_str_doc = |str_val: String| {
            writer
                .add_document(doc!(
                    f_str_fast => str_val.clone(),
                    f_str_stored => str_val,
                ))
                .unwrap();
        };

        match distribution {
            "dense_random" => {
                for _doc_id in 0..num_docs {
                    // `random_range` is the current name of the deprecated `gen_range`.
                    let suffix = rng.random_range(0u64..1000u64);
                    add_str_doc(format!("str_{:03}", suffix));
                }
            }
            "dense_sequential" => {
                for doc_id in 0..num_docs {
                    let suffix = doc_id as u64 % 1000;
                    add_str_doc(format!("str_{:03}", suffix));
                }
            }
            "sparse_random" => {
                for _doc_id in 0..num_docs {
                    let suffix = rng.random_range(0u64..1000000u64);
                    add_str_doc(format!("str_{:07}", suffix));
                }
            }
            "sparse_sequential" => {
                for doc_id in 0..num_docs {
                    let suffix = doc_id as u64;
                    add_str_doc(format!("str_{:07}", suffix));
                }
            }
            _ => {
                panic!("Unsupported distribution type");
            }
        }
        writer.commit().unwrap();
    }

    // Prepare reader/searcher once.
    let reader = index
        .reader_builder()
        .reload_policy(ReloadPolicy::Manual)
        .try_into()
        .unwrap();
    let searcher = reader.searcher();

    BenchIndex { index, searcher }
}

/// Runs one benchmark group per scenario; each group issues an inclusive
/// string range query on `str_fast`.
fn main() {
    // (group name, document count, distribution, range low, range high) — bounds are inclusive.
    let scenarios = [
        ("dense_random_search_low_range", 1_000_000, "dense_random", 0, 9),
        ("dense_random_search_high_range", 1_000_000, "dense_random", 990, 999),
        ("dense_sequential_search_low_range", 1_000_000, "dense_sequential", 0, 9),
        ("dense_sequential_search_high_range", 1_000_000, "dense_sequential", 990, 999),
        ("sparse_random_search_low_range", 1_000_000, "sparse_random", 0, 9999),
        ("sparse_random_search_high_range", 1_000_000, "sparse_random", 990_000, 999_999),
        ("sparse_sequential_search_low_range", 1_000_000, "sparse_sequential", 0, 9999),
        ("sparse_sequential_search_high_range", 1_000_000, "sparse_sequential", 990_000, 999_999),
    ];

    let mut runner = BenchRunner::new();
    for (scenario_id, n, distribution, range_low, range_high) in scenarios {
        let bench_index = build_shared_indices(n, distribution);
        let mut group = runner.new_group();
        group.set_name(scenario_id.to_string());

        let field = bench_index.searcher.schema().get_field("str_fast").unwrap();

        // Dense corpora use 3-digit suffixes, all others 7-digit suffixes.
        let width = match distribution {
            "dense_sequential" | "dense_random" => 3,
            _ => 7,
        };
        let lower_str = format!("str_{:0width$}", range_low, width = width);
        let upper_str = format!("str_{:0width$}", range_high, width = width);

        let query = RangeQuery::new(
            Bound::Included(Term::from_field_text(field, &lower_str)),
            Bound::Included(Term::from_field_text(field, &upper_str)),
        );

        run_benchmark_tasks(&mut group, &bench_index, query, range_low, range_high);

        group.run();
    }
}

/// Registers every benchmark task for one range query on `bench_group`.
///
/// Four tasks are registered, in this order: match count, doc-set collection,
/// string fetch through the `str_fast` fast field, and string fetch through the
/// doc store. Each task receives its own copy of `query`; `range_low` and
/// `range_high` are only forwarded so they can be embedded in the task names.
fn run_benchmark_tasks(
    bench_group: &mut BenchGroup,
    bench_index: &BenchIndex,
    query: RangeQuery,
    range_low: u64,
    range_high: u64,
) {
    // The first three tasks work on clones; the last one takes ownership of `query`.
    let count_query = query.clone();
    let docset_query = query.clone();
    let fast_field_query = query.clone();

    // Number of matching documents.
    add_bench_task_count(bench_group, bench_index, count_query, range_low, range_high);

    // Addresses of all matching documents.
    add_bench_task_docset(bench_group, bench_index, docset_query, range_low, range_high);

    // String values of all matching documents, read from the fast field.
    add_bench_task_fetch_all_strings(
        bench_group,
        bench_index,
        fast_field_query,
        range_low,
        range_high,
    );

    // String values of all matching documents, read through the doc() method.
    add_bench_task_fetch_all_strings_from_doc(
        bench_group,
        bench_index,
        query,
        range_low,
        range_high,
    );
}

/// Registers a task that counts the documents matched by `query`.
///
/// The task is named `string_search_count_[<range_low>-<range_high>]` and runs a
/// `CountSearchTask` built from a clone of `bench_index.searcher`.
fn add_bench_task_count(
    bench_group: &mut BenchGroup,
    bench_index: &BenchIndex,
    query: RangeQuery,
    range_low: u64,
    range_high: u64,
) {
    let searcher = bench_index.searcher.clone();
    let task = CountSearchTask { searcher, query };

    let label = format!("string_search_count_[{}-{}]", range_low, range_high);
    // `black_box` keeps the computed count from being optimized away.
    bench_group.register(label, move |_| black_box(task.run()));
}

/// Registers a task that collects the full doc set matched by `query`.
///
/// The task is named `string_fetch_all_docset_[<range_low>-<range_high>]` and runs a
/// `DocSetSearchTask` built from a clone of `bench_index.searcher`.
fn add_bench_task_docset(
    bench_group: &mut BenchGroup,
    bench_index: &BenchIndex,
    query: RangeQuery,
    range_low: u64,
    range_high: u64,
) {
    let searcher = bench_index.searcher.clone();
    let task = DocSetSearchTask { searcher, query };

    let label = format!("string_fetch_all_docset_[{}-{}]", range_low, range_high);
    // `black_box` keeps the resulting doc-set size from being optimized away.
    bench_group.register(label, move |_| black_box(task.run()));
}

/// Registers a task that fetches the fast-field string of every matching document.
///
/// The task is named `string_fastfield_fetch_all_strings_[<range_low>-<range_high>]`,
/// runs a `FetchAllStringsSearchTask` built from a clone of `bench_index.searcher`,
/// and reports the number of strings that were fetched.
fn add_bench_task_fetch_all_strings(
    bench_group: &mut BenchGroup,
    bench_index: &BenchIndex,
    query: RangeQuery,
    range_low: u64,
    range_high: u64,
) {
    let searcher = bench_index.searcher.clone();
    let task = FetchAllStringsSearchTask { searcher, query };

    let label = format!(
        "string_fastfield_fetch_all_strings_[{}-{}]",
        range_low, range_high
    );

    // The fetched strings go through `black_box`; only their count is returned.
    bench_group.register(label, move |_| black_box(task.run()).len());
}

/// Registers a task that fetches the stored string of every matching document.
///
/// The task is named `string_doc_fetch_all_strings_[<range_low>-<range_high>]`,
/// runs a `FetchAllStringsFromDocTask` built from a clone of `bench_index.searcher`,
/// and reports the number of strings that were fetched.
fn add_bench_task_fetch_all_strings_from_doc(
    bench_group: &mut BenchGroup,
    bench_index: &BenchIndex,
    query: RangeQuery,
    range_low: u64,
    range_high: u64,
) {
    let searcher = bench_index.searcher.clone();
    let task = FetchAllStringsFromDocTask { searcher, query };

    let label = format!(
        "string_doc_fetch_all_strings_[{}-{}]",
        range_low, range_high
    );

    // The fetched strings go through `black_box`; only their count is returned.
    bench_group.register(label, move |_| black_box(task.run()).len());
}

/// Benchmark task that counts the documents matching a range query.
struct CountSearchTask {
    searcher: Searcher,
    query: RangeQuery,
}

impl CountSearchTask {
    /// Runs the query with the `Count` collector and returns the match count.
    ///
    /// Panics if the search returns an error.
    #[inline(never)]
    pub fn run(&self) -> usize {
        let Self { searcher, query } = self;
        searcher.search(query, &Count).unwrap()
    }
}

/// Benchmark task that collects the addresses of all documents matching a range query.
struct DocSetSearchTask {
    searcher: Searcher,
    query: RangeQuery,
}

impl DocSetSearchTask {
    /// Runs the query with `DocSetCollector` and returns how many documents were collected.
    ///
    /// Panics if the search returns an error.
    #[inline(never)]
    pub fn run(&self) -> usize {
        let Self { searcher, query } = self;
        let matches = searcher.search(query, &DocSetCollector).unwrap();
        matches.len()
    }
}

/// Benchmark task that reads the `str_fast` fast-field value of every document
/// matching a range query.
struct FetchAllStringsSearchTask {
    searcher: Searcher,
    query: RangeQuery,
}

impl FetchAllStringsSearchTask {
    /// Runs the query, then resolves one `str_fast` string per matching document.
    ///
    /// Matching addresses are sorted before being visited. A document is skipped
    /// when its segment has no `str_fast` string column (or opening it fails), or
    /// when the term ordinal cannot be converted to a string.
    ///
    /// Panics if the search fails or if a matching document has no term ordinal
    /// in the column.
    #[inline(never)]
    pub fn run(&self) -> Vec<String> {
        let hits = self.searcher.search(&self.query, &DocSetCollector).unwrap();
        let mut sorted_docs: Vec<_> = hits.into_iter().collect();
        sorted_docs.sort();

        let mut values = Vec::with_capacity(sorted_docs.len());
        for address in sorted_docs {
            let reader = &self.searcher.segment_readers()[address.segment_ord as usize];

            // The column is looked up again for every document, as in the original benchmark.
            let column = match reader.fast_fields().str("str_fast") {
                Ok(Some(column)) => column,
                _ => continue,
            };

            // Only the first term ordinal of the document is used.
            let ord = column.term_ords(address.doc_id).next().unwrap();
            let mut value = String::new();
            if column.ord_to_str(ord, &mut value).is_ok() {
                values.push(value);
            }
        }

        values
    }
}

/// Benchmark task that reads the `str_stored` field of every document matching a
/// range query by loading each document through `Searcher::doc`.
struct FetchAllStringsFromDocTask {
    searcher: Searcher,
    query: RangeQuery,
}

impl FetchAllStringsFromDocTask {
    /// Runs the query, then loads every matching document and extracts its first
    /// `str_stored` value.
    ///
    /// Matching addresses are sorted before being visited. A document is skipped
    /// when it cannot be loaded, has no `str_stored` value, or that value is not a
    /// string.
    ///
    /// Panics if the search fails or if the schema has no `str_stored` field.
    #[inline(never)]
    pub fn run(&self) -> Vec<String> {
        let hits = self.searcher.search(&self.query, &DocSetCollector).unwrap();
        let mut sorted_docs: Vec<_> = hits.into_iter().collect();
        sorted_docs.sort();

        let mut values = Vec::with_capacity(sorted_docs.len());

        let stored_field = self
            .searcher
            .schema()
            .get_field("str_stored")
            .expect("str_stored field should exist");

        for address in sorted_docs {
            // Load the document from the doc store (row store access).
            let doc = match self.searcher.doc::<TantivyDocument>(address) {
                Ok(doc) => doc,
                Err(_) => continue,
            };

            // Keep the first stored value of the field, provided it is a string.
            if let Some(field_value) = doc.get_first(stored_field) {
                if let Some(text) = field_value.as_value().as_str() {
                    values.push(text.to_string());
                }
            }
        }

        values
    }
}


================================================
FILE: benches/wiki.json
================================================
{"url":"https://en.wikipedia.org/wiki?curid=48687903","title":"Jeon Hye-jin (actress, born 1988)","body":"\nJeon Hye-jin (actress, born 1988)\n\nJeon Hye-jin (born June 17, 1988) is a South Korean actress.\nPersonal life.\nJeon married his \"Smile, You\" co-star Lee Chun-hee on March 11, 2011. Their daughter, Lee So Yu, was born on July 30, 2011.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48687919","title":"Benham, Indiana","body":"\nBenham, Indiana\n\nBenham is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nAn old variant name of the community was Benhams Store. A post office opened under the name Benham Store in 1866, the name was shortened to Benham 1888, and the post office was discontinued in 1934. John Benham, Jr., served as a first postmaster.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48687922","title":"Hilyat al-Muttaqin","body":"\nHilyat al-Muttaqin\n\nHilyat al-Muttaqin (\"The adornment of the God-fearing\", ) is a Hadith book of Muhammad Baqir al-Majlisi. This work is written in Persian about Islamic morality, instructions and traditions.\nThe aim of writing.\nAccording to book's foreword, it was written because of a group of Muslims asked Majlisi to write a Persian book in the Islamic morality, instructions and traditions from the hadith of Ahl al-Bayt.\nDate of writing.\nAccording a manuscript, the date of writing of this work is 1671, But in another book has been mentioned to 1668-9.\nContent and chapters.\nThe book has 14 chapters about individual and collective morality and some Fiqh rulings, Duasand practices and had an extra chapter about some etiquette miscellaneous and their benefits. The titles of chapters are mentioned below:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48687925","title":"MK Preshow Shimray","body":"\nMK Preshow Shimray\n\nMK Preshow Shimray is the sitting MLA from 46 - Chingai (ST) Assembly Constituency in Manipur, India. He was elected under Indian National Congress ticket in 2012.\nEarly life.\nMK Preshow Shimray was born on April 5, 1966 at Poi village to MK Somi Shimray. He did his B.E and M.E (Environment) at Salem Engineering College, Tamil Nadu. After completing his education, he worked as Scientific Officer and thereafter as Senior Scientific Officer in the Environment and Ecology Department, Manipur. \nPolitical career.\nIn 2012, he resigned from his engagement as senior scientific officer in order to contest the MLA election under Congress ticket. He got elected beating his nearest rival with a simple majority vote. In July 2013, MK Preshow Shimray was elected as the Deputy Speaker of the Manipur Legislative Assembly and is still serving in that capacity.\nAssasination bids.\nOn April 30, 2013, the cavalcade of the deputy speaker was ambushed near Ukhrul by suspected NSCN (IM) cadres, however, there were no reports of casualty. The second bid on his life was made on April 9, 2014 by some rebel groups near Litan but, there too he escaped unharmed.\nAnti tribal bills protests.\nAll tribal MLAs in Manipur were requested to resign in protest against the passing of three anti tribal bills in Manipur Ligislative Assembly on 30 August 2015. However, many tribal MLAs paid no heed to the call of the tribal people for which many elected representatives were ostrcised from their respective constituencies. MK Preshow Shimray along with the sitting MLA of 44-Phungyar MLA constituency Victor Keishing (son of Rishang Keishing)were also declared anti-socials by the Tangkhul frontal organisations for failing to tender their resignation letters.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48687930","title":"Clinton, Ripley County, Indiana","body":"\nClinton, Ripley County, Indiana\n\nClinton is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nClinton was founded in 1833.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48687935","title":"NoRMA","body":"\nNoRMA\n\nNo Remote Memory Access (abbreviated as NoRMA) is a computer memory architecture for multiprocessor systems, given its name by . In a NoRMA architecture, the address space globally is not unique and the memory is not globally accessible by the processors. Accesses to remote memory modules are only indirectly possible by messages through the interconnection network to other processors, which in turn possibly deliver the desired data in a reply message. The entire storage configuration is partitioned statically among the processors.\nThe advantage of the NoRMA model is the ability to construct extremely large configurations, which is achieved by shifting the problem to the user configuration. Programs for NoRMA architectures need to evenly partitioning the data into local memory modules, ensure consistency of software caches to enforce the desired consistency model, handle transformations of data identifiers from one processor's address space to another, and realize a message-passing system for remote access to data. The programming model of Norma architecture is therefore extremely complicated.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48687945","title":"National Capitol Wing Civil Air Patrol","body":"\nNational Capitol Wing Civil Air Patrol\n\nThe National Capital Wing of the Civil Air Patrol (CAP) is the highest echelon of Civil Air Patrol in the district of Washington, D.C. The National Capital Wing consists of nearly 400 cadet and adult members at over 6 locations across the district of Washington D.C.\nMission.\nThe National Capital Wing performs the three missions of the Civil Air Patrol: providing emergency services; offering cadet programs for youth; and providing aerospace education for both CAP members and the general public.\nEmergency services.\nThe Civil Air Patrol provides emergency services, which includes performing search and rescue and disaster relief missions; as well as assisting in humanitarian aid assignments. The CAP also provides Air Force support through conducting light transport, communications support, and low-altitude route surveys. The Civil Air Patrol can also offer support to counter-drug missions. \nCadet programs.\nThe Civil Air Patrol offers a cadet program for youth aged 12 to 21, which includes aerospace education, leadership training, physical fitness and moral leadership. \nAerospace education.\nThe Civil Air Patrol offers aerospace education for CAP members and the general public, including providing training to the members of CAP, and offering workshops for youth throughout the nation through schools and public aviation events. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48687949","title":"Bae Seong-woo","body":"\nBae Seong-woo\n\nBae Seong-woo (born November 21, 1972) is a South Korean actor. He starred in film such as \"My Love, My Bride\" (2014), \"Office\" (2015), \"\" (2015) and \"Inside Men\" (2015).\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48687980","title":"Cross Roads, Ripley County, Indiana","body":"\nCross Roads, Ripley County, Indiana\n\nCross Roads is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nThe community was so named for the fact it originally contained a store at a crossroads.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48687986","title":"Ponderosa Skatepark","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48688000","title":"Acta Orientalia","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48688007","title":"Roger Nkodo Dang","body":"\nRoger Nkodo Dang\n\nRoger Nkodo Dang is the president of the Pan-African Parliament and is also a member of the National Assembly of Cameroon. On 27 May 2015 Dang was elected as successor to Bethel Nnaemeka Amadi, he obtained 85 votes.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688008","title":"Forth Bridge approach railways","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48688012","title":"Frederick Charles Newcombe","body":"\nFrederick Charles Newcombe\n\nFrederick Charles Newcombe (1858-1927) was an American botanist, and the first editor-in-chief of the \"American Journal of Botany\" \nNewcombe was born in Flint, Michigan, May 11, 1858, to parents Thomas and Eliza (Gayton) Newcombe, who had emigrated from England in 1848. His early education was obtained in the public schools of Flint. From 1880 to 1887 he taught in the Michigan School for the Deaf at Flint. In 1887 he entered the University of Michigan, and was graduated Bachelor of Science in 1890. He was immediately appointed Instructor in Botany at the University. The year 1892-1893 was spent at the University of Leipzig, where he received the degree of Doctor of Philosophy at the end of the year. He returned to Ann Arbor to become Acting Assistant Professor of Botany in theUniversity. Two years later he became Assistant Professor of Botany, and in 1897 Junior Professor. In 1905 he was made Professor of Botany. \nNewcombe was a fellow of the American Association for the Advancement of Science, of which he was one of the secretaries in 1899; a member of the Botanical Society of America and its 7th president; of the Society for Plant Morphology and Physiology, and its first vice-president in 1901; and of the Michigan Academy of Science. Of the last-named he was secretary in 1894, vice-president from 1894 to 1896, and president in 1903.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688019","title":"Irfan Siddiqui","body":"\nIrfan Siddiqui\n\nIrfan Siddiqui is a senior journalist from Pakistan. He was born in Rawalpindi, Pakistan. Starting his career from teaching he gained much fame in the field of Journalism and currently is working with Prime Minister of Pakistan Nawaz Sharif as an advisor.\nEarly life.\nAfter Completing his education from University of the Punjab, Lahore Siddiqui Started Teaching at various levels in different Federal Government institutions. he also served as Director Education at Overseas Pakistanis Foundation (OPF) for two years.\nCareer.\nSidiiqui started his career as a professional journalist in early 1990s working with \"Takbeer\" a political magazine at that time. He also started writing columns in daily newspaper \"Jang\". In January 1998, he was appointed as press secretary to the President of Pakistan Mr. Mohammd Rafique Tarrar \nIn 2001, he joined Nawa-e-waqt and remained till 2008 when he joined again Daily Jang and currently working with newspaper.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688020","title":"William Van Waters","body":"\nWilliam Van Waters\n\nWilliam Van Waters was a member of the Wisconsin State Assembly.\nBiography.\nVan Waters was born on October 7, 1817 in Hounsfield, New York. He later settled in Hamilton, Wisconsin, where he was a farmer.\nPolitical career.\nVan Waters was a member of the Assembly during the 1877 session. Previously, he had been an unsuccessful candidate in 1874. Additionally, Van Waters was Chairman of the Town Board (similar to city council) of Hamilton. He was a Democrat.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688028","title":"Matt Longacre","body":"\nMatt Longacre\n\nMatt Longacre (born September 21, 1991) is an American football defensive end for the Los Angeles Rams of the National Football League (NFL). He played college football at Northwest Missouri State University. He signed with the Rams as an undrafted free agent in 2015.\nProfessional career.\nSt. Louis/Los Angeles Rams.\nAfter going unselected in the 2015 NFL Draft, Longacre signed with the St. Louis Rams on May 8, 2015. He was waived for final roster cuts before the start of the 2015 season, but signed to the team's practice squad on September 6. On November 6, he was promoted to the active roster.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688037","title":"Mehrunnisa Parvez","body":"\nMehrunnisa Parvez\n\nMehrunnisa Parvez is an Indian writer of Hindi literature. \nLife.\nShe was born in 1944, she published her first story in 1963 in \"Dharamayug\" magazine and has authored several short stories and novels in Hindi. Amma, published in 1967 and Samara, released in 1969 are two of her notable works. Besides, she has also published several short story anthologies and her works have been the subject of academic studies. The Government of India awarded her the fourth highest civilian honour of the Padma Shri, in 2005, for her contributions to Indian literature. \nFamily.\nShe is married to Bhagirath Prasad, a retired Indian Administrative Service officer and active politician, and the couple lives in Bhopal, in Madhya Pradesh.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688041","title":"Dewberry, Indiana","body":"\nDewberry, Indiana\n\nDewberry is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nA post office was established at Dewberry in 1882, and remained in operation until 1887.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688043","title":"Koderma (community development block)","body":"\nKoderma (community development block)\n\nKoderma (also spelled as Kodarma) is a community development block that forms an administrative division of Koderma district, Jharkhand state, India. \nGeography.\nKarma, a constituent town in Koderma CD Block, is located at .\nPanchayats in Koderma CD Block are: Bekobar (North), Bekobar (South), Charadih, Chhatarbar, Dumardiha, Inderwa, Jarga, Jhumri, Karma, Kauawar Gajhandi, Kharkotta, Kolgarma, Lariyadih, Lokai, Meghatari, Pandedih, Pathaldiha and Purnanagar.\nDemographics.\nAs per 2011 Census of India Kodarma CD Block had a total population of 93,240, of which 80,303 were rural and 12,937 were urban. There were 47,584 males and 45,656 females. Scheduled Castes numbered 15,428 and Scheduled Tribes numbered 454.\nBekobar is a census town in Kodarma CD Block with a population of 7,184 in 2011 and Karma is a census town with a population 0f 5,753 in 2011.\nLiteracy.\nAs per 2011 census the total number of literates in Kodarma CD Block was 46,695 out of which 30,607 were males and 19,088 were females.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688048","title":"The Modern Art of Jazz by Zoot Sims","body":"\nThe Modern Art of Jazz by Zoot Sims\n\nThe Modern Art of Jazz by Zoot Sims (also released as One to Blow On) is an album by American jazz saxophonist Zoot Sims recorded in 1956 and released on the Dawn label.\nReception.\nAllmusic awarded the album 4 stars, with the review by Ken Dryden stating: \"These early 1956 sessions feature Zoot Sims in top form playing a pair of standards and originals by members of the quintet. Bob Brookmeyer is the perfect foil for the tenor saxophonist, as they seamless interweave intricate lines throughout the record\".\nTrack listing.\n\"All compositions by Zoot Sims except as indicated\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688055","title":"Roque Gallart","body":"\nRoque Gallart\n\nRoque Josė Gallart Ortiz, (born September 21, 1979), also known as Rocky the Kid, is a Puerto Rican actor and radio and television personality. Gallart is host of a Mega-TV television show named \"Descarao' Por La Noche\".\nBiography.\nRoque José Gallart Ortiz is the son of Roque José Gallart, Sr., himself a well-known radio announcer. Roque, Jr. would visit his dad's radio station and stay there until a school bus picked him up as a little kid. Roque, Jr. became interested in radio work during this era in his life.\nIn 1995, at age 16, he was hired by the radio station his dad worked for, 95X, in the Puerto Rican city of Bayamon. A few years later, he began to attend Universidad del Sagrado Corazon in Rio Piedras to study communications, but, feeling he was more advanced in his understanding of the radio world than his fellow students, he soon left the university and concentrated on his radio job.\nActing.\nRocky the Kid became a well known radio host in Puerto Rico over the years, and his fame allowed him to branch out into other areas of the show business world, starting in 2010, when he participated in \"\", playing himself along fellow radio personalities, actors and friends \"Tony Banana\" and Billy Fourquet. He then re-joined Fourquet in a 2011 comedy film named \"Que Joyitas!\", where he again played a version of himself.\nIn 2013, Gallart again played himself in \"Que Joyitas! II\", in which he was featured in the movie's poster. The three movies that Gallart has been in have been released in local cinemas in Puerto Rico, and Que Joyitas! 
has been shown in the United States television on Cine Latino.\nLo se Todo.\nFollowing a severe boycott by sponsors of Kobbo Santarrosa's gossip show, SuperXclusivo, WAPA America took that show off the air, and then hired six people, including Pedro Juan Figueroa, Sylvia Hernandez, \"Topy Mamery\" and Gallart, to host a new television show named \"Lo Se Todo\" in 2013. \"Lo Se Todo\" became a successful and highly rated show in Puerto Rican television, but internal turmoil plagued the show almost from the beginning. During 2014, Gallart once played a Black character in the show, with monkey sounds played in the background. As a consequence, the network received several calls from complaining viewers, which led to Gallart issuing a public apology in which he stated his intention was never to offend anyone based on race, religion, birth place or sexual preference, and a network producer to be fired.\nEarly in 2015, Gallart decided to leave \"Lo Se Todo\" after his radio employer, SBS, told him he would not be allowed to work with them and at WAPA-America consecutively. Offered a contract by WAPA-America on December 6, 2014, Gallart did not sign it, deciding instead to keep working on radio. The contract offer by WAPA-America came only 4 days after Mamery, who had also left \"Lo Se Todo\" and whom Gallart had befriended, died of a heart attack. 
Following the news of his friend's death, Gallart cried on live television.\nIn April 2015, Gallart declared on his radio show that \"Lo se Todo\" television personnel were victims of workplace harassment by show producer Niria Ruiz, also mentioning Joe Ramos in his comment, calling Pedro Juan Figueroa a hypocrite and traitor who never took the other hosts side against \"Lo Se Todo\" producers during arguments, affirming that Frankie Jay, another of the show's hosts, did so, and describing working conditions at \"Lo Se Todo\" as a \"living hell\".\nAs a consequence of those statements, on August 31, 2015, WAPA-America sued Gallart for the amount of $2,000,000 dollars, accusing him of defamation.\nMove to Mega-TV.\nOn March 9, 2015, Gallart began a new television show on Mega-TV, a Hispanic channel in the United States. The show, named \"Descarao' Por La Noche\" is seen in Puerto Rico and various cities in the United States, including Phoenix, New York City, LA and San Francisco, Houston, Miami and Chicago, among others.\nPersonal.\nGallart is married to \"Lo Se Todo\" host Jessica Serrano. Their first daughter, Emma Catalina Gallart Serrano, was born on November 14, 2015. He also has a son, Ricky, from an earlier relationship, and a step-daughter, Carolina.\nGallart was arrested and briefly jailed in November 2013 by Puerto Rican police after allegedly sending threatening messages to a former girlfriend. He was released almost immediately when a judge found no cause against him.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688059","title":"Elrod, Indiana","body":"\nElrod, Indiana\n\nElrod is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nA post office was established at Elrod in 1849, and remained in operation until 1903. George W. Elrod, an early postmaster, gave the community his name.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688069","title":"List of international cricket centuries at the Wanderers Stadium","body":"\nList of international cricket centuries at the Wanderers Stadium\n\nThe Bidvest Wanderers Stadium is a cricket stadium, situated just south of Sandton in Illovo, Johannesburg in Gauteng Province, South Africa. Test, One Day and First class cricket matches are played here. The stadium has a seating capacity of 34,000. The ground is among the most historically significant cricket grounds of the twenty-first century. It has staged some of the most important matches in ODI and T20I history, and has witnessed a number of outstanding world records.\nThe 2003 Cricket World Cup final was held at the Wanderers Stadium. This stadium also hosted one of the greatest One-Day International matches. The match was played between South Africa and Australia in which a world record score of 434 was chased down by South Africa. It hosted matches of the 2007 ICC World Twenty20 including the first match and the final which was won by India, who defeated Pakistan.\nTest centuries.\nThe following table summarises the Test centuries scored at the Wanderers.\nOne Day International centuries.\nThe following table summarises the One Day International centuries scored at the Wanderers.\nTwenty20 International centuries.\nThe following table summarises the Twenty20 International century scored at the Wanderers.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688080","title":"Lookout, Indiana","body":"\nLookout, Indiana\n\nLookout is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nA post office was established at Lookout in 1889, and remained in operation until 1906.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688100","title":"Dhakuakhana College","body":"\nAwakening the sense of unity, national-integrity and environmental awareness."}
{"url":"https://en.wikipedia.org/wiki?curid=48688110","title":"Negangards Corner, Indiana","body":"\nNegangards Corner, Indiana\n\nNegangards Corner is an unincorporated community in Ripley County, in the U.S. state of Indiana. \nHistory.\nNegangards Corner had its start when a general store opened at the town site. An old variant name of the community was North Hogan. A post office opened under the name North Hogan in 1844, and remained in operation until 1877.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688133","title":"Zhenjiang dialect","body":"\nZhenjiang dialect\n\nZhenjiang dialect is a form of Eastern Mandarin spoken in the town of Zhenjiang in Jiangsu Province. The town is situated on the south bank of the Yangtze river between Nanjing and Changzhou. It is thus at the intersection of China's Mandarin and Wu speaking regions. About 2.7 million Chinese live in the area where the Zhenjiang dialect is predominant.\nIn ancient times, Zhenjiang spoke Wu. Today, Wu is the language of nearby Changzhou, as well as Shanghai and Zhejiang Province. Mandarin speakers from the North have been immigrating to Zhenjiang since the fourth century, gradually changing the character of the local dialect. In modern times, the city speaks a dialect that is transitional between the Eastern Mandarin of Nanjing, located just west of the city, and the Taihu dialect of Wu spoken in Changzhou, which is just east of the city. Zhenjiang dialect is comprehensible to Nanjing residents, but not to Changzhou residents.\nThe issue of tones in the Zhenjiang dialect has been a topic scholarly study. Nanjing residents use the four tones of Mandarin, while Changzhou residents use seven or eight tones. According to a study by Qiu Chunan, Zhenjiang dialect has five citation tones: Tone1 (42) (a sharp fall from pitch 4 to pitch 2, or \"yinping\"), Tone2 (35) (a rising tone or \"yangping\"), Tone3 (32) (slight falling tone or \"shang\"), Tone4 (55) (high even or \"qu\"), and Tone5 (5) (checked tone or \"ru\"). Qiu's study used residents who had grown up in the Daxi Road area, where the standard form of the dialect is said to be spoken. The checked tone was a feature of Chinese spoken in the Middle Ages, but it is not part of Mandarin. Applying the theory of government phonology to the issue, Bao Zhiming noted that non-even tones become even when they appear before the high even, or 55, tone.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688137","title":"Mister Universal Ambassador 2015","body":"\nMister Universal Ambassador 2015\n\nMister Universal Ambassador 2015, the 1st edition of the Mister Universal Ambassador pageant, held on November 11, in Surabaya, Indonesia. 19 contestants competed for the title. Christian Daniel of Puerto Rico crowned as the first ever Mister Universal Ambassador.\nCrossovers.\nMister International 2014\nManhunt International 2011\nMister Pancontinental 2015\nMister Global 2014\nMister Revolution Model 2014\nMen Universe 2012\nMister Asia 2014\nReferences.\nwww.mruniversalambassador.com\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688167","title":"Cameron Lynch","body":"\nCameron Lynch\n\nCameron Ellis Lynch (born August 4, 1993) is an American football linebacker for the Los Angeles Rams of the National Football League (NFL). He played college football at Syracuse University. He signed with the Rams as an undrafted free agent in 2015.\nProfessional career.\nSt. Louis/Los Angeles Rams.\nAfter going unselected in the 2015 NFL Draft, Lynch signed with the St. Louis Rams on May 8, 2015. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688180","title":"TV Bel Kanal","body":" The program is mainly produced in Serbian language. TV station was established in 2003. TV Bel reports on local events in Banja Luka, Republika Srpska entity and BiH.\nThe channel broadcasts documentaries from domestic and foreign production, TV series, movies and entertainment. Channel is also part of local news network in the RS entity called PRIMA mreža ().\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688246","title":"Abhinav Bharti High School","body":"\nAbhinav Bharti High School\n\nAbhinav Bharti High School is a private English-medium co-ed school located in Pretoria street, Kolkata, West Bengal, India. This school is affiliated to CBSE. The school was established in 1945. The current principal of this school is Mrs Sanghmitra Mukherjee.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688271","title":"Otter Village, Indiana","body":"\nOtter Village, Indiana\n\nOtter Village is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nOtter Village was laid out in 1837. The community took its name from Otter Creek.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688273","title":"Patrick J. Bergin","body":"\nPatrick J. Bergin\n\nPatrick J. Bergin has been the Chief Executive Officer of the African Wildlife Foundation since 2002.\nHe graduated from the University of Illinois at Urbana–Champaign with an MSc in International Agricultural Education in 1988, and from the University of East Anglia with a PhD in Development Studies in 1996.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688292","title":"Penntown, Indiana","body":"\nPenntown, Indiana\n\nPenntown is an unincorporated community in Ripley County, in the U.S. state of Indiana. An old variant name was Pennsylvaniaburg.\nHistory.\nPenntown was originally called Pennsylviaburg, and under the latter name was laid out in 1837. The community was named after Pennsylvania, the native state of a share of the early settlers.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688302","title":"Cherry picker (disambiguation)","body":"\nCherry picker (disambiguation)\n\nA cherry picker is a platform for lifting someone to work at a high level.\nCherry picker may also refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688319","title":"Varian's theorems","body":"\nVarian's theorems\n\nIn welfare economics, Varian's theorems are several theorems related to fair allocation of homogeneous divisible resources. They describe conditions under which there exists a Pareto efficient (PE) envy-free (EF) allocation. They were published by Hal Varian in the 1970s.\nExamples.\nAll examples involve an economy with two goods, x and y, and two agents, Alice and Bob.\nA. Many PEEF allocations: Alice and Bob have linear utilities, representing substitute goods:\nThe total endowment is (4,4). If Alice receives at least 3 units of x, then her utility is 6 and she does not envy Bob. Similarly, if Bob receives at least 3 units of y, he does not envy Alice. So the allocation [(3,0);(1,4)] is PEEF with utilities (6,9). Similarly, the allocations [(4,0);(0,4)] and [(4,0.5);(0,3.5)] are PEEF. On the other hand, the allocation [(0,0);(4,4)] is PE but not EF (Alice envies Bob); the allocation [(2,2);(2,2)] is EF but not PE (the utilities are (6,6) but they can be improved e.g. to (8,8)).\nB. Essentially-single PEEF allocation: Alice and Bob have Leontief utilities, representing complementary goods:\nThe total endowment is (4,2). The equal allocation [(2,1);(2,1)] is PEEF with utility vector (1,1). EF is obvious (every equal allocation is EF). Regarding PE, note that both agents now want only y, so the only way to increase the utility of an agent is to take some y from the other agent, but this decreases the utility of the other agent. While there are other PEEF allocations, e.g. [(1.5,1);(2.5,1)], all have the same utility vector of (1,1), since it is not possible to give both agents more than 1. \nC. No PEEF allocations: Alice and Bob have concave utilities:\nThe total endowment is (4,2). The equal allocation [(2,1);(2,1)] is EF with utility vector (2,2). 
Moreover, \"every\" EF allocation must give both agents equal utility (since they have the same utility function) and this utility can be at most 2. However, no such allocation is PE, since it is Pareto-dominated by the allocation [(4,0);(0,2)] whose utility vector is (4,2).\nExistence of PEEF allocations with monotone convex preferences.\nVarian's theorem says that:\nIn the #Examples, the preferences are always monotone. However, only in examples A and B the preferences are convex.\nThe proof relies on the existence of a competitive equilibrium with equal incomes. Assume that all resources in an economy are divided equally between the agents. I.e, if the total endowment of the economy is formula_5, then each agent formula_6 receives an initial endowment formula_7.\nSince the preferences are \"convex\", the Arrow–Debreu model implies that a competitive equilibrium exists. I.e, there is a price vector formula_8 and a partition formula_9 such that:\nSuch an allocation is always EF. Proof: by the (EI) condition, for every formula_13. Hence, by the (CE) condition, formula_14.\nSince the preferences are \"monotonic\", any such allocation is also PE, since monotonicity implies local nonsatiation. See fundamental theorems of welfare economics.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688336","title":"Hong Kong Scout Progressive Badge Scheme","body":"\nHong Kong Scout Progressive Badge Scheme\n\nThe Scout Progressive Badge scheme is a scheme which assess scouts. This scheme can reflect the overall ability of scouting skills.\nMembership Badge.\nThis is a badge which is required for all scouts.\nBackground Requirement.\n11 or above\nPathfinder Award.\nPathfinder Badge is the second stage of the Scout.\nBackground Requirement.\n11 or above\nVoyager Award.\nThis is the badge most scouts will get. It is the third stage of the progressive badge scheme.\nRequirement.\nScoutcraft.\nSome of the activities must be conducted under the supervision of adults.\nChallenger Award.\nThe Challenger award is the fourth stage and the second last stage of the scheme.\nRequirement.\nScoutcraft.\nSome of the activities must be conducted under the supervision of adults.\nChief Scout's Award.\nThis is the highest stage. Every year several hundred scouts attain this award (ratio 1:180-190). They can participate he Scout Rally regardless of their troop.\nBasic Requirement.\nthe \"Scoutcraft\", \"Adventure\", \"Commitment\" and \n\"Proficiency/ Activity Badge\" sections of the Pathfinder Award, \nVoyager Award and Challenger Award.\nRequirement.\nScoutcraft.\nLeaders’ Council\nPatrol. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688348","title":"Sathanur, Mandya","body":"\nSathanur, Mandya\n\nSathanur is a village in Mandya district, Karnataka, India. Sathanur village is located in the SH-84, just 3 km from Bangalore-Mysore National highway -275.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688351","title":"NTV Arena","body":" The program is mainly produced in Serbian language. TV station was established in 1999. NTV Arena reports on local events in Bijeljina, Republika Srpska entity and BiH.\nThe channel broadcasts TV series,entertainment and news. Channel is also part of local news network in the RS entity called PRIMA mreža ().\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688353","title":"Joshua Oigara","body":"\nJoshua Oigara\n\nJoshua Nyamweya Oigara is the Group Chief Executive Officer of the Kenya Commercial Bank Group. At age 37, his appointment in November 2012 to replace the outgoing CEO Martin Oduor-Otieno made him the youngest CEO of a publicly traded bank at the NSE. Prior to his appointment, he served as Chief Financial Officer and Member of the Board of Directors of the Company between January 12, 2012 and January 2013. He also served as Group Chief Financial Officer at KCB Bank Group for East Africa. He joined the Bank in November 2011 from Bamburi Cement where he served as Group Financial Director and Chief Financial Officer for the East Africa region. Mr. Oigara holds a Bachelor of Commerce degree from University of Nairobi and Master of Business Administration (M.B.A.) from Edith Cowan University and a host of other qualifications\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688354","title":"Mount Alexander (Antarctica)","body":"\nMount Alexander (Antarctica)\n\nMount Alexander () is a mountain with several summits, the highest 595 m, forming the rocky peninsula separating Gibson and Haddon Bays, on the south side of Joinville Island in Antarctica. The cliff marking the extremity of the peninsula was discovered and named Cape Alexander on January 8, 1893 by Thomas Robertson, master of the ship \"Active\", one of the Dundee whalers. The name was amended to Mount Alexander by the United Kingdom Antarctic Place-Names Committee (UK-APC) in 1956 following a survey by the Falkland Islands Dependencies Survey (FIDS) in 1953–54, the mountain summits of the peninsula being considered more suitable to name.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688373","title":"Paul Gundani","body":"\nPaul Gundani\n\nPaul Gundani (1967 – 3 November 2015) was a Zimbabwean professional football player. He made three appearances for the Zimbabwe national football team.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688376","title":"Frank Tipton","body":"\nFrank Tipton\n\nFrank Ben Tipton (born in California) is an Australian historian and Emeritus Professor at The University of Sydney Business School. He is known for his works on Modern history of Germany and Economic history.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688378","title":"Mount Alfred (Antarctica)","body":"\nMount Alfred (Antarctica)\n\nMount Alfred () is an ice-capped mountain, more than 2,000 m, 5.5 nautical miles (10 km) inland from George VI Sound and 8 nautical miles (15 km) south of Mount Athelstan in the Douglas Range of Alexander Island, Antarctica. It was first photographed from the air on November 23, 1935, by Lincoln Ellsworth and mapped from these photos by W.L.G. Joerg. Its east face was roughly surveyed in 1936 by the British Graham Land Expedition (BGLE) and resurveyed in 1948 and 1949 by the Falkland Islands Dependencies Survey (FIDS), who named it for Alfred, Saxon king of England, 871-899. The west face of the mountain was mapped from air photos taken by the Ronne Antarctic Research Expedition (RARE), 1947–48, by Searle of the FIDS in 1960.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688385","title":"WTA Player of the Year","body":"\nWTA Player of the Year\n\nThe WTA Player of the Year is an annual Women's Tennis Association (WTA) award given since the 1977 WTA Tour.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688397","title":"Raymond Jack Last","body":"\nRaymond Jack Last\n\nRaymond Jack Last (26 May 1903 Adelaide - 1 January 1993 Malta), comparative anatomist, was Anatomical Curator Royal College of Surgeons 1946-50, Professor of Applied Anatomy 1950-70, Warden of Nuffield College of Surgical Sciences 1949-70, and Visiting Professor UCLA 1970-88. Last was an outstanding lecturer in postgraduate anatomy, and belonged to a small set of anatomists who were initially practising surgeons and then made a career teaching it. \nHenry Last, his grandfather, was from Debenham in Suffolk and jumped ship to settle in South Australia. His wife was Mary Ann Bowden who had Cornish roots. They later settled in Adelaide. \nHenry's eldest surviving son, John Last, worked at an Adelaide stationer and bookseller. John and his wife had 3 children, Raymond and two younger sisters, all being diligent and studious.\nRaymond first attended North Adelaide Primary School, from where he went on to the Adelaide Boys’ High School, where another scholar and classmate was Mark Oliphant, who went on to become an eminent physicist and later, Governor of South Australia. \nAssisted by a State Bursary, he enrolled at the University of Adelaide, and though underage, obtained permission to start the medical course. A brilliant trio headed the Medical School — John Burton Cleland in Pathology, Thorburn Brailsford Robertson in Physiology, and Frederic Wood Jones in Anatomy. Last was top student in all but the final year, and graduated MB BS in 1924.\nIn June 1939 Last and his second wife Margret, who had been Matron at Booleroo Centre District Hospital, set off for England in order to become a Fellow of the Royal College of Surgeons. With the start of World War Two in September 1939 they began work at the Emergency Medical Service at the North London Fever Hospital at Winchmore Hill, later to become an annexe of the Royal London Hospital. 
Here Last worked under Henry Souttar.\nAs a member of the Australian Army Medical Corps Last was turned down by the British Army, so he was obliged to return to Australia to enlist there. \"MV Napier Star\" was torpedoed in the Irish Sea on 18 December 1940 (see List_of_shipwrecks_in_December_1940#18_December), only 28 of 99 people surviving, among which were Raymond and Margret Last. Raymond Last wrote an account of the event. They joined the British Red Cross Society and Last led a surgical team, his wife Margret being principal nurse, that formed part of the British forces sent to end the Italian occupation of Abyssinia. Last spent three years there, becoming personal physician to the Emperor Haile Selassie and his family. The closing year of the War saw Last heading a medical unit in Borneo, providing medical care for the civilian population.\nWhen Last returned to London and the Royal College of Surgeons, the Professor of Anatomy was Frederic Wood Jones, who had tutored Last in Adelaide, and inspired an enduring interest in comparative anatomy. After some years as anatomy demonstrator and curator, Last was appointed Professor of Applied Anatomy in 1950. His textbook, 'Anatomy Regional and Applied', was first published in 1954 and heralded a new generation of anatomy texts providing a more concise option to 'Gray's Anatomy' or Cunningham's 'Textbook of Anatomy'. It became known for its readability and interest, as it presented medical and surgical anatomy in a practical light, rather than as a colourless academic exercise. and rapidly gained popularity amongst surgical students. His own drawings were used as illustrations. Last became first Warden of the Nuffield College of Surgical Sciences, the residence for medical students. On his retiring a common room was named in his honour. \nFrom 1970-87 he held the chair of Visiting Professor in the Department of Anatomy at the University of California, Los Angeles. 
This appointment enabled his spending winter breaks in Adelaide, where he gave lectures and demonstrations in the dissecting room of the Adelaide Medical School, often making use of his superb chalk diagrams.\nThe Lasts chose Malta as a final place of retirement, partly because of its tax laws and partly because of his circle of friends, which included expatriate English people, local Maltese and a sprinkling of surgeons. Failing vision limited his drawing skills; and he suffered from senile gait syndrome, necessitating assistance when standing or walking. Margret died in January 1989, and Last stayed on in Malta. \nHe had two sons, John and Peter, by his first wife, both graduating in medicine from Adelaide University. He had no share in their upbringing. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688423","title":"WTA Doubles Team of the Year","body":"\nWTA Doubles Team of the Year\n\nThe WTA Doubles Team of the Year is an annual Women's Tennis Association (WTA) award given since the 1977 WTA Tour.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688424","title":"Darchhawna","body":"\nDarchhawna\n\nDarchhawna is an Indian writer of Hindi literature and historian from the Northeast Indian state of Mizoram. Born on the New year Day of 1936, Darchhawna is a former Officer on Special Duty at the Mizoram University, when it was the Mizoram campus of the North Eastern Hill University (NEHU) and the founder President of the Mizo History Association. He held the post of the president of the organization for several terms and is holding post, after getting elcted in 2013. The Government of India awarded him the fourth highest civilian honour of the Padma Shri, in 2005, for his contributions to Indian literature.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688452","title":"Gopikishan Bajoria","body":"\nGopikishan Bajoria\n\nGopikishan Bajoria () is a Shiv Sena politician from Akola district, Maharashtra. He is current Member of Legislative Council as a member of Shiv Sena representing Akola-cum-Washim-cum-Buldhana Local Authorities constituency. He has been elected to Maharashtra Legislative Council for three consecutive terms for 2004, 2010 and 2016.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688455","title":"RTV IS","body":" The program is mainly produced in Serbian language. TV station was established in 2008. Local radio station Radio Istočno Sarajevo is also part of this company. The channel broadcasts local news, TV series and entertainment. Channel is also part of local news network in the RS entity called PRIMA mreža ().\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688510","title":"Jon Rune Strøm","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48688536","title":"Sabina Selimovic and Samra Kesinovic","body":"\nSabina Selimovic and Samra Kesinovic\n\nSabina Selimovic (c.1999–2014?) and Samra Kesinovic (c.1998–2015?) were Austrian teenagers who emigrated to the Islamic State of Iraq and the Levant in April 2014.\nSelimovic and Kesinovic were born in Austria to Bosnian immigrants who had fled the Bosnian War in the 1990s. Selimovic and Kesinovic, who were residents of Vienna, were believed to have been radicalized after reading about jihad on the Internet through their attendance of a Viennese mosque. The pair left their homes in Vienna in April 2014 to travel to Syria via Turkey to join the Islamic State of Iraq and the Levant. The pair left a note to their parents that stated \"Don't look for us. We will serve Allah and we will die for him.\" The pair later posted photographs on social media of themselves wearing full length burqas and handling assault weapons. A mutual friend of Selimovic and Kesinovic told \"Paris Match\" that the pair were married to Chechen fighters, and that they were afraid of imprisonment in Austria should they have returned. In December 2015, a Tunisian woman who defected from ISIS told \"The Sun\" that she and Kesinovic were kept together in a house in Syria where they served as sexual slaves for jihadis. They were allegedly required to provide sexual services to new recruits.\nSelimovic and Kesinovic reportedly wished to return to Austria in October 2014, though it had been reported in September that Selimovic had been killed while fighting for Islamic State in Syria. In late 2015 it was reported that Kesinovic was beaten to death with a hammer after trying to escape from sexual slavery in Raqqa.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688565","title":"Kuweires Military Airbase","body":"\nKuweires Military Airbase\n\nThe Kuweires Military Airbase is an airbase in Aleppo Governorate, Syria. It is situated between As-Safira in the West and Dayr Hafir in the East. It was used for educational purposes mainly.\nOn 18 March 2014, it was reported that an effort entitled “Do Not Divide” [Wa La Tafaraqu] aimed to seize Kuweiris Airbase. Rebel forces have surrounded Kuweiris for more than a year but have not overrun it. However, as rebel infighting with ISIS intensified, ISIS apparently left (or was forced off) the battlefield and a new logo without its name was posted online by another brigade.\nAfter being sieged by ISIS for more than two years it was freed by the Syrian army in November 2015 in the Kuweires offensive.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688567","title":"Town hall of Bordighera","body":"\nTown hall of Bordighera\n\nThe Town hall of Bordighera is located at 32 Via XX Settembre in Bordighera, Liguria.\nHistory.\nThe current town hall was built to a design by the French architect Charles Garnier. Garnier, who had left Paris because of Paris Commune (1871), was looking for a land in Bordighera to build his future house. In 1871 he proposed the municipality to buy the land where only school of the city stayed. The offer of 6,000 pounds was very generous, it would have allowed the construction of a new school for which Garnier provided the plans.\nThe project included a classical building that integrates well with the old town of Bordighera that lies behind. The new schools foresaw not only a new section for boys replacing the previous one, but also a girls' section and one for small children. The project is to be considered truly innovative for its time and the municipality accepted the proposal. During the works, which were not followed by Garnier, there were numerous technical problems and delays in deliveries. It was only in 1878 that part of the building was finally terminated.\nMeanwhile, the population grew and the city decided to build a new school that was opened later in 1886. With the transfer of the school, the municipality decided to use the building as its headquarters. The facade was carved with the coat of arms of the city, a rampant lion that leans against a Pine seafarer. Inside the town hall you can admire numerous paintings from various artists who stayed in Bordighera, including: Pompeo Mariani, Giuseppe Ferdinando Piana, Giuseppe Balbo, Friederich von Kleudgen, etc.\nThe gardens.\nThe true gardens of the town hall are between the building designed by Charles Garnier and the Cape Esplanade. 
These gardens, although of small size, can boast two great Ficus macrophylla centenarians and many varieties of exotic plants (agaves, palm trees, cactus, etc.) which can also be seen in many Bordighera gardens. On 17 January 1954, the city placed a bust in honour of Ludwig Winter, its illustrious adopted citizen, as an honour to the man who had done so much to bring prestige to the city and to the Riviera. This is sometimes confusing. Some mistakenly call these gardens also \"Winter Gardens\", but the real Winter Garden are at 6 Ludovico Winter Street in Bordighera.\nAt the foot of the old town hall of Bordighera, there is a large wooden area that is called in various ways: the gardens of the Cape or, more commonly, Cape Pineta. The gardens are vast, and full of very old trees such as pines, olive trees, palm trees and a variety of other species, but very old specimens of Araucaria Heterophylla stand out. In the pine forest there is also a bust in honour of the painter Mosè Bianchi, who often came to Bordighera to spend time with his grandson Pompeo Mariani. Also in the Cape Pineta, but a bit lower, there is a monument in honour of Charles Garnier.\nOn May 15, 2015 the renovation of the Marabutto was terminated. It is an ancient powder keg that is currently in the Cape Pineta. The name is due to the shape of the small building that recalls the graves of Muslim holy men (a cube topped by a dome), whose name is precisely marabutto. Near the Marabutto, you can see three old cannons so much loved by the locals that they were given names: Butafoegu, Tiralogni et Cacastrasse.\nTrivia.\nWhen the city had to choose its coat of arms, a dispute broke out with the neighbouring city of Sanremo. 
Bordighera, which was nicknamed \"Queen of the Palms\", wanted to see represented the palm on his coat of arms, but the bigger rival city had already a similar one, so Bordighera had to settle for a pine.\nBehind the municipal building is one of four Ficus Magnolioides recognised by the State Forestry. The monumental tree has an estimated age of 100 years, with a height of 18 meters and a diameter of the stem of 1040 cm.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688618","title":"Summer in the Arab world","body":"\nSummer in the Arab world\n\nSummer in the Arab world in the summer perpendicular to the sun's rays on the central parts of the Arab world and so the temperatures, especially in the interior, which is characterized by the poverty of the vegetation and the spread of the sand either areas Aljblahuhal Mediterranean shall be the temperatures moderate making it one of the summer centers Almanmh.uteb in this Chapter monsoon moist from the Atlantic Ocean and the Indian Ocean, causing rainfall in southern Mauritania and southern Somalia, Sudan and Yemen, the Arab world .oamtaz length of the growing season in most parts of allowing the cultivation dense as the climate diversity has helped the diversity of agricultural crops and integration\nSources.\nGeography\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688619","title":"Thomas Rudge","body":"\nThomas Rudge\n\nThomas Rudge (baptised 1753 – 1825) was an English churchman, topographer and antiquarian, Archdeacon of Gloucester from 1814, and chancellor of the diocese of Hereford from 1817.\nLife.\nThe son of Thomas Rudge of Gloucester, he matriculated at Merton College, Oxford, on 7 April 1770, aged 16. He graduated B.A. in 1780, and proceeded M.A. from Worcester College in 1783 and B.D. in 1784. He was appointed rector of St. Michael's and St. Mary-de-Grace, Gloucester, and, on the presentation of the Earl of Hardwicke, vicar of Haresfield.\nRudge died in 1825.\nWorks.\nRudge published:\nNotes.\nAttribution\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688652","title":"Gino D'Auri","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48688660","title":"Rexville, Indiana","body":"\nRexville, Indiana\n\nRexville is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nA post office was established at Rexville in 1870, and remained in operation until 1907. The community's name honors the Rex family of settlers.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688662","title":"Rexville","body":"\nRexville\n\nRexville may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688676","title":"Vertical perspective","body":"\nVertical perspective\n\nVertical perspective may mean:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688681","title":"Spades, Indiana","body":"\nSpades, Indiana\n\nSpades is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nSpades was laid out in 1855. The community's name honors Jacob Spade, a first settler. An early variant name of the community was Spades Depot. A post office was established as Spade's Depot in 1855, the name was shortened to Spades in 1883, and the post office closed in 1950.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688688","title":"Scott Tsumura","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48688703","title":"Stringtown, Ripley County, Indiana","body":"\nStringtown, Ripley County, Indiana\n\nStringtown is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nA post office was established at Stringtown in 1848, and remained in operation until 1865.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688714","title":"Paolo Rossi (1900-1985)","body":"\nPaolo Rossi (1900-1985)\n\nPaolo Rossi (Bordighera, September 15, 1900 - Lucca, 24 May 1985) was an Italian lawyer and politician.\nBiography.\nPaolo Rossi is the son of the famous criminal lawyer of Genoa, Francesco Rossi and of Iride Garrone. He comes from an educated and progressive Ligurian family, his cousin is Maria Vittoria Rossi, better known as Irene Brin, the fashion journalist and style icon.\nThe young man decided to follow his father's footsteps and graduated at the University of Genoa, he enrolled to the Bar of the Appellate court of Genoa at 21 and to Court of cassation at 28.\nPersecuted by the fascists, in 1926 his study of via Roma in Genoa was destroyed and burned.\nIn 1932 he wrote his first book \"The death penalty and its criticism\", which will be blocked by the censors because it opposed the death penalty supported by the fascist regime.\nHe married Giuseppina Bagnara, called Giugi, whom he met in Bordighera, and he has a daughter, the writer Maria Francesca Rossi, known with her pen name of Francesca Duranti. In 1937 he wrote his second book \"Skepticism and dogmatic in criminal law\", which was also criticized for its too progressive ideas. During the war, the family moved near Lucca, in Gattaiola. In those years he joins the resistance and, with his wife, he managed to save many young people from fascist raids.\nIn 1948 he published \"The parties against democracy\" and, shortly afterwards, was appointed Professor of Criminal Law at the University of Pisa.\nOn 15 October 1947 he became a member of the Constituent and of the Committee on the Constitution of Italy. 
The same year he became Professor of Criminal Law at the University of Genoa.\nA leading member of the Italian Democratic Socialist Party, he was elected as Member of Parliament in the first four legislatures, and took, in two of them, the vice-presidency of the Chamber of Deputies in addition to the presidency of some inquiry commissions. He was Minister of Education from 6 July 1955 to 19 May 1957 during the first Government of Antonio Segni. In 1958 he was appointed Vice-President of the Chamber of Deputies (Italy), and in 1961 President of the Commission on the problems of Alto-Adige.\nHe was the first president of the Antimafia Commission (in the third Legislature from 14 February to 15 May 1963) which was then called the Parliamentary Commission of Inquiry on the Mafia in Sicily.\nOn 2 May 1969 he is named Judge of the Constitutional Court of the Italian Republic by the President of the Italian Republic, Giuseppe Saragat, was sworn in on May 9, 1969 and was elected president of the Court on December 18, 1975. He ceased to hold office as President on May 9, 1978, but stayed on as judge until August 2, 1979).\nHe was the author of many texts, both in the legal and in the political field. From 1970 to 1973 he published a collection of four volumes on the history of Italy, entitled \"History of Italy from 476 to the present day”.\nHe was also president of the general National Corps of Italian Boy Scouts (CNGEI).\nHe died in Lucca on May 24, 1985 and was buried in the cemetery of Gattaiola.\nHonours.\nOn 6 august 1970 he was named “Knight Grand Cross of Order of Merit of the Italian Republic” by the List of Presidents of Italy, Giuseppe Saragat.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688721","title":"Mary Pickford Award","body":"\nMary Pickford Award\n\nThe Mary Pickford Award is an honorary Satellite Award bestowed by the International Press Academy. It is \"IPA’s most prestigious honor\" and as an award \"for Outstanding Artistic Contribution to the Entertainment Industry\" it reflects a lifetime of achievement.\nThe Award is named for Mary Pickford, early pioneer of the film industry, who began her career as a child actress and went on to become \"America's Sweetheart\" and a co-founder of United Artists Studios with fellow filmmakers Charlie Chaplin, Douglas Fairbanks and D.W. Griffith.\nThe award was first presented to Rod Steiger at the 1st Annual Golden Satellite Awards. Ellen Burstyn is the latest recipient.\nThe trophy awarded to the honorees is a bust of Canadian American motion picture actress Mary Pickford cast in bronze, on a marble base, inscribed for the recipient. It was designed by Sarajevan sculptor Dragan Radenović.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688724","title":"Behlmer Corner, Indiana","body":"\nBehlmer Corner, Indiana\n\nBehlmer Corner is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nBehlmer Corner was originally called Lynnville, and under the latter name was laid out in 1844.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688733","title":"Monica Mary Gardner","body":"\nMonica Mary Gardner\n\nMonica Mary Gardner (26 June 1873 – 16 April 1941) was an English writer on Poland and Polish writers and a translator of Polish literature.\nLife and work.\nGardner was born in 1873 at Roehampton Lane in London. the eldest of the six children of John Gardner, a member of the stock exchange, and his wife Amy Vernon Garratt. Her brother was the Italian scholar Edmund Garratt Gardner.\nGardner studied the Polish language and literature after being intrigued at school by Bonnie Prince Charlie's mother who was the Polish aristocrat Clementina Sobieska. In 1899 she began to get assistance in her obsession for Polish and Poland by the writer Edmund Naganowski. He was able to support her until the First World War prevented further communication. Naganowski was to die in 1915. Gardner taught herself how to research sources in Polish and how to find out more about Poland. Her first monograph in 1911 was on Adam Mickiewicz who was regarded as the national poet of Poland.\nShe followed this with more books on her single theme. She was known as one of the few English speaking writers who studied Polish literature and history. She wrote \"Poland: a Study in National Idealism\" in 1915 and \"The Anonymous Poet of Poland: Zygmunt Krasiński\" in 1919. In 1922 she and her brother made what may have been her only visit to Poland. They visited Poznań and Cracow. She wrote the \"The Patriot Novelist of Poland: Henryk Sienkiewicz\" in 1926. The latter was said to have been published to coincide with the return of Sienkiewicz's body from Switzerland to be encrypted in Warsaw Cathedral.\nIn between the wars Gardner lived with her mother and her brother who was dedicated to Italy and Italian. 
Monica's knowledge and expertise made their house a place to visit by notable visiting Poles.\nWith the outbreak of World War Two, which Britain entered after the German invasion of Poland, Gardner's expertise became more important. She died as a result of a German land mine which landed on her house. One of her manuscripts was recovered from the bomb site, but another was lost. Gardner's funeral was an important event that was attended by the President of Poland, Władysław Raczkiewicz.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688737","title":"Romanian Jews in Israel","body":"\nRomanian Jews in Israel\n\nRomanian Jews in Israel refers to the community of Romanian Jews who migrated to Palestine beginning in the later 19th century, continued migrating to Israel after the formation of the modern state in 1948, and live within the state of Israel. The descendants of those who made aliyah in 1930s, the wave of emmigrants after World War II or after the fall of communism, with their children and grandchildren born in Israel, represent about 10% of the population. According to the Association of Romanian Journalists Abroad, about 400,000 Romanian Jews live in Israel. Most of them have higher education, occupying important positions in various sectors and making a great contribution to the economic, social and cultural development of Israel. \nThey have established several kibbutzim, moshavim and towns (Kiryat Bialik, Kiryat Tiv'on, Rosh Pinna, Zikhron Ya'akov). Between 1882 and 1884, Romanian Jews in Israel already established nine localities. \nImmigration history.\nMass emigration to Israel ensued (\"see Bricha and Aliyah\"). According to Sachar, for the first two post-war years, tens of thousands of Romanian Jews left for Israel; the Romanian government did not try to stop them, especially due to its desire to reduce its historically suspect and now impoverished Jewish minority. Afterwards, Jewish emigration began to encounter obstacles. In 1948, the year of Israeli independence, Zionism came under renewed suspicion, and the government began a campaign of liquidation against Zionist funds and training farms. 
However, emigration was not completely banned; Romanian Foreign Minister Ana Pauker, herself a Jew with a father and brother in Israel, negotiated an agreement with Israeli ambassador Reuven Rubin, a Romanian immigrant to Israel, under which the Romanian government would allow 4,000 Jews a month to emigrate to Israel; this decision was at least partially influenced by a large Jewish Agency bribe to the Romanian government. This agreement applied mainly to ruined businessmen and other economically \"redundant\" Jews. Around this time, Israel also secured another agreement with the Romanian government, under which Romania issued 100,000 exit visas for Jews and Israel supplied Romania with oil drills and pipes to aid the struggling Romanian oil industry. By December 1951, about 115,000 Romanian Jews had emigrated to Israel.\nThroughout the period of Communist rule, Romania allowed limited numbers of Jews to emigrate to Israel, in exchange for much-needed Israeli economic aid. By 1965, Israel was funding agricultural and industrial projects throughout Romania, and in exchange, Romania allowed limited numbers of Jews to emigrate to Israel. When Nicolae Ceaușescu came to power in 1965, he initially ended the trade in deference to the Eastern bloc's Arab allies. However, by 1969, he decided to exchange Jews for cash from Israel. Ceaușescu wanted economic independence from the Soviet Union, which was content to keep Romania a backwater and as nothing more than a supplier of raw materials, but to fund economic projects, he needed hard cash. As a result, from then until the Ceaușescu regime fell in 1989, about 1,500 Jews a year were granted exit visas to Israel in exchange for a payment of cash for every Jew allowed to leave, in addition to other Israeli aid. The exact payments were determined by the age, education, profession, employment, and family status of the emigrant. 
Israel paid a minimum of $2,000 per head for every emigrant, and paid prices in the range of $25,000 for doctors or scientists. In addition to these payments, Israel also secured loans for Romania and paid off the interest itself, and supplied the Romanian Army with military equipment.\nAs a result of aliyah, the Romanian-Jewish community was gradually depleted. By 1987, just 23,000 Jews were left in Romania, half of whom were over 65 years old.\nRelations with Romanian culture.\nRomanian Jews in Israel have strong relations with Romanian culture. Moreover, there is an intense activity among writers of Romanian language. In Israel exist 11 associations of writers in foreign languages, including the Association of Israeli Writers of Romanian Language (). Likewise, there are publications in Romanian languages, weekly, monthly or quarterly, plus several local issues.\nRomania has an embassy in Tel Aviv, three honorary consulates in Jerusalem, Beersheba and Haifa and a cultural institute in Tel Aviv.\nNotable people.\nThis is a list of Israeli people of Romanian Jewish descent:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688742","title":"Haney Corner, Indiana","body":"\nHaney Corner, Indiana\n\nHaney Corner is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nA post office called Haney's Corner was established in 1871, and remained in operation until 1905.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688768","title":"Hennadiy Zubko","body":"\nHennadiy Zubko\n\nHennadiy Zubko (born 27 September 1967, Mykolaiv) is a Ukrainian politician.\nFrom 2 December 2014 - Vice Prime Minister - Minister of Regional Development, Construction and Housing in the second Government of Arseniy Yatsenyuk.\nEducation.\nHe graduated from the Kyiv Polytechnic Institute, specialty \"Automated control systems\", engineer (1991); Kyiv Engineering Institute. The course \"Investment and financial management in the construction industry\" (2003); Northwestern University, Illinois, Chicago. The course \"Innovative Management\" (2006); National University of \"Kyiv-Mohyla Academy\", Kyiv Mohyla Business School, Master of Business Administration (MBA) (2007); National University of \"Kyiv-Mohyla Academy\", specialty \"Management\", manager and economist (2008).\nCareer.\n1986–1988 — military service in the Armed Forces of the USSR.\n1988–1990 - software engineer at the Zhytomyr Regional department of technological connection.\n1991–1992 — software engineer of PE \"Nyva\", Zhytomyr.\n1992–1994 — commercial director of the Production Company \"SERGYI\", Zhytomyr.\n1994–1997 — director of LLC \"Mayak\", Zhytomyr.\n1997–2002 — director of \"Tantal\", Zhytomyr.\n2001 — Project Manager of JSC \"LYNOS\" at Lysychanskyi PSI.\n2003–2007 — Head of the Department on coordination of organizations for installation of metal structures of the State Corporation \"Ukrmontazhspetsstroy\", Kyiv.\n2002–2010 — Deputy Chairman of JSC \"Zhytomyr plant of walling constructions\", Zhytomyr.\nFrom 2010 until present — Chairman of the PSC \"Zhytomyr plant of walling constructions\".\nFrom 27 May until 10 June 2014 – temporarily Head of the Administration of State Affairs.\nFrom 10 June to 2 December 2014 - First Deputy Head of the Presidential Administration of Ukraine.\nFrom 2 December 2014 - Vice Prime Minister - Minister of Regional Development, Construction and 
Housing.\nUkraine cabinet.\nMain is the conduction of reforms on decentralization and energy efficiency. During the year of implementing these reforms, a significant breakthrough was made, including the adopting of a number of legislative acts, introduction of new programs and their funding.\nAlso, the Ministry is responsible for the construction reform and introduction of market relations in the housing sector to provide consumers with quality services.\nHennadiy Zubko headed the government commission on investigating the MH17 catastrophe and the special commission on investigating causes of crash of the ship \"Ivolha\". He also took care of issues of infrastructure restoration in Svatove affected by fires at the rocket and artillery weapons warehouses. In addition, he created an expert group to assess the damage caused by an emergency situation.\nDecentralization.\nDecentralization reform implemented under the leadership of Hennadiy Zubko, involves changes in education, health, social policy, public administration, local authorities, development of urban infrastructure, as well as energy efficiency measures.\nIn December 2014, the Budget and Tax Codes were amended, and fiscal decentralization took place in Ukraine. Thanks to these changes, local budgets in 2015 became surplus. Fiscal decentralization has allowed to receive additionally more than USD 24 billion to local budgets. Using the State Regional Development Fund, Government financed 784 projects of infrastructure and provided them with USD 2.7 billion.\nOn 1 September 2015 the of Ukraine No.320-VIII «On Amendments to Certain Legislative Acts of Ukraine on Decentralization of Powers in the field of Architectural Control and Improvement of Town Planning Legislation\" came into force. 
It reforms the system of state architectural control and transmits the respective functions and powers from the national to the local level.\nAfter adopting on 2 February 2015 the Law of Ukraine \"On voluntary association of local communities\", 6300 territorial communities initiated their association.\n159 associated communities took part in local elections on 25 October 2015. They elected their heads and local authorities. Since 2016, they should receive direct budgetary relations with the central budget.\nIn 2016, it is to give UAH 1.4 billion from the State Budget for subsidies to support joint local communities, meeting the long-term plans.\nMinistry of Regional Development has developed criteria for assessing implementation of the state policy of regional state administrations: 27 indicators at 6 directions on a quarterly basis and 64 indicators at 12 directions each year.\nThe Ministry has also an Action Plan on implementing during 2015-2017 the National Strategy of Regional Development for the period until 2020, which was approved by the Cabinet of Ministers. The document should resolve such problems as the uniformity of territorial development, elimination of inter-regional socio-economic disparities, stimulate economic activity and employment of residents of territorial communities.\nThe Government has provided contributions to the State Fund for Regional Development in amount of UAH 2.9 billion for the support of 844 development areas investment projects.\nThe international community assists the Regional Development Ministry in conducting decentralization. In particular, the EU EUR 90 million for implementing the decentralization reform.\n78% of the necessary laws for decentralization have already been adopted, 22% are awaiting amendments to the Сonstitution. 
The future of the reform depends on approval of these amendments by the Ukrainian MP’s.\nEnergy Efficiency.\nOn 3 September 2014, the Cabinet of Ministers approved the Action Plan for the implementation of the European Parliament and the Council of the EU DIrective 2009/28/EU \"On promoting the use of energy produced from the renewable energy sources\".\nOn 1 October 2014, the Cabinet of Ministers also approved the National Action Plan on Renewable Energy for the period until 2020 and Action Plan for its implementation. Implementing the plan will increase the share of energy produced from alternative fuel from 4.5% in 2013 to 11% in 2020.\nOn 28 September 2015, the Governmental Committee approved the draft Resolution of the Cabinet of Ministers of Ukraine \"On National Action Plan on energy efficiency for the period until 2020\".\nThe Law of Ukraine \"On energy efficiency of buildings\", which provides energy efficiency of buildings in accordance with the EU requirements, was drafted as well.\n\"Urban Infrastructure\" project was launched for the allocation of $140 million. The project was aimed at implementing measures to improve energy efficiency, reduce water losses and settle the day-night water supply in several cities.\nUnder the initiative of the Regional Development Ministry, the state now a part of the energy efficiency loans and will continue to do this in 2016.\n48 programs were adopted, providing for the compensation of loans interests under the energy efficiency measures. 13 programs are of the regional character, 16 - district and 19 - city. As of 9 November 2015, since the start of the State Program on Energy Efficiency for the reimbursement of \"warm\" loans, UAH 111.7 million were transferred from the state budget. About 60 thousand families participated in the Program. 
Banks issued the energy efficient loans worth of UAH 950.9 million.\nThe concept of the Energy Efficiency Fund - S2I was drafted to be launched in 2016.\nToday the share of renewable sources in the total energy balance of Ukraine is 3.45%. The reform program envisaged by the Government will increase it to 30% by 2030.\nConstruction Reform.\nMinistry of Regional Development, leaded by Hennadiy Zubko, drafted a Decree \"On the reallocation of governmental expenditures for the Ministry of Regional Development, Construction and Housing in 2015\". It provides for the allocation of UAH 10.6 million to the budget program for affordable housing for the population.\nSocial and political activities.\n2006–2010 — deputy of the Zhytomyr City Council of V convocation.\n2010–2012 — deputy of the Zhytomyr City Council of VI convocation.\n2010–2012 — head the \"Front of Changes\" faction in the Zhytomyr regional council.\n2010 - 2012 — member of the Standing Committee on Budget and Municipal Property in the Zhytomyr Regional Council.\nFrom 2010 - member of the Presidium of Zhytomyr NGO \"Council of business leaders and entrepreneurs of Zhytomyr.\"\nSince May 2012 – Head of the Zhytomyr regional election staff of the united opposition of \"Batkivschyna\" All-Ukrainian Union.\nFrom 12 December 2012 – Member of the Verkhovna Rada of Ukraine elected on behalf of the All-Ukrainian Union \"Batkivschyna\" (single-mandate constituency No. 62). First Deputy Chairman of the Verkhovna Rada of Ukraine Committee on Construction, Urban Development, Housing and Regional Policy, member of the counting commission.\nFrom 10 June until 2 December 2014 — First Deputy Head of the Presidential Administration.\nSince 2 December 2014 — Vice Prime Minister - Minister of Regional Development, Construction and Housing of Ukraine.\nScientific activity.\nIn 2009 completed his PhD at the Ukrainian Research Institute \"Proektstalkonstruktsiya named after V. 
Szymanovskyi\", Kyiv.\nIn 2012 defended his thesis on \"Organizational and technical measures for improving reconstruction of stadiums\" at the Kharkiv National University of Construction and Architecture at the Department of Technology and Building Structures. Author of more than 10 scientific papers. Holds PhD degree in technics.\nAwards.\nOrder of Danylo Halytskyi (awarded on 10 September 2009) - for the significant contribution to the socio-economic and cultural development of Zhytomyr, conscientious work and on the occasion of the 1125 anniversary of the city.\n• Medal \"For Distinction in Military Service\", II degree (USSR, Decree No. 114, 28 August 1987)\n• Medal \"70 Years of the Armed Forces of the USSR\" (Presidium of the Supreme Soviet of the USSR, Decree No. 84, 1988).\nFamily.\nWife: Lyudmila Mykolaivna.\nChildren: Sergiy, Khrystyna.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688785","title":"Laugheryville, Indiana","body":"\nLaugheryville, Indiana\n\nLaugheryville is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nLaugheryville was platted in 1847.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688795","title":"New Carrollton, Indiana","body":"\nNew Carrollton, Indiana\n\nNew Carrollton is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nA post office called New Carrollton was established in 1837, and remained in operation until 1839.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688802","title":"Acoustocerebrography","body":"\nAcoustocerebrography\n\nAcoustocerebrography (ACG) refers to a diagnostic method in medicine that is used to diagnose pathological changes and illnesses in the brain and the central nervous system. \nIt can also be applied as a means to diagnose and monitor intracranial pressure, for example as incorporated into continuous brain monitoring device. As a method of transcranial, acoustic spectroscopy, ACG is based on Molecular Acoustics.\nIt allows for the non-invasive examination of the brain’s cell and molecular structure. ACG can use microphones, accelerometers or multi-frequency ultrasound (i.e. sound waves) to monitor changes. This methodology does not use any radiation and is completely free of any side effects. ACG also facilitates blood flow analysis as well as the detection of obstructions in cerebral blood flow.\nPassive and active Acoustocerebrography.\nPassive Acoustocerebrography.\nAll brain tissue is influenced by blood circulating in the brain’s vascular system. With each heartbeat, blood circulates in the skull, following a recurring pattern according to the oscillation produced. This oscillation’s effect, in turn, depends on the brain’s size, form, structure and its vascular system. Thus, every heartbeat stimulates minuscule motion in the brain tissue as well as cerebrospinal fluid and therefore produces minimal changes in intracranial pressure. These changes can be monitored and measured in the skull.\nToday, mostly passive sensors like accelerometers are used to identify these signals correctly. Sometimes highly sensitive microphones are utilized.\nWith a digital signal, it becomes possible to study the patterns of the blood flow moving inside the skull. 
These patterns form unique signatures that can be analyzed with specially designed algorithms, identifying them either as an inconspicuous, “normal” pattern or as a pattern showing an “abnormal” behavior.\nActive Acoustocerebrography.\nIn active ACG applications, a multi-frequency ultrasonic signal is used to detect and classify adverse changes at the cellular or molecular level.\nIn addition to all of the advantages that passive ACG provides, with active ACG it is possible to conduct a spectral analysis of the acoustic signals received. These spectrum analyses not only display changes in the brain’s vascular system, but also those in its cellular and molecular structures.\nOne common application of active ACG is the Transcranial Doppler test. More recently, its color version (TCCD) has been deployed. These ultrasonic procedures measure blood flow velocity within the brain’s blood vessels. They are used to diagnose embolisms, stenoses and vascular constrictions, for example, in the aftermath of a subarachnoid hemorrhage.\nFields of Application.\nContrary to applications that provide only momentary images, such as MRI and CT, the results of ACG procedures can be obtained continuously, thus facilitating effortless and non-invasive real-time monitoring. This can be especially helpful during the acute phase directly after a stroke or a traumatic brain injury. The measured data is mathematically processed continuously and displayed on a monitoring device. The computer-aided analysis of the signals enables the physician/nursing staff to precisely interpret the results immediately after device setup. Furthermore, ACG allows for preventive detection of pathological changes in brain tissue.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688811","title":"Alcatel One Touch Idol 3","body":"\nAlcatel One Touch Idol 3\n\nAlcatel ONE TOUCH Idol 3 4.7 and Idol 3 5.5 are Android smartphones manufactured by TCT Mobile and officially unveiled at 2015’s Mobile World Congress.\nThe Idol 3 lineup consists of two handsets that use the same design but differ in size and specifications. The Idol 3 4.7 features a 4.7” display while Idol 3 5.5 has a bigger 5.5” display. They are the first smartphones to come with a reversible design that allows the user to use the phone upside-down.\nSpecifications.\nHardware.\nBoth models feature JBL certified stereo front-facing speakers, 13 megapixel rear camera, reversible design and displays tuned by Technicolor. They are available in Soft Gold, Metallic Silver and Dark Grey and in single-sim and dual-sim versions.\nIdol 3 4.7 features a 4.7” display with a resolution of 1280 x 720 pixels (312 ppi). It has a Qualcomm Snapdragon 410 SoC clocked at 1.2 Ghz alongside an Adreno 306 GPU and 1.5 GB of RAM. It is powered by a 2000 mAh non-removable Li-Ion battery and it is available in 8GB single-sim and 16GB dual-sim versions.\nIdol 3 5.5 features a 5.5” display with a resolution of 1920 x 1080 pixels (401 ppi). It has a Qualcomm Snapdragon 615 SoC composed of a quad-core 1.5 GHz Cortex-A53 and a quad-core 1.0 GHz Cortex-A53 alongside an Adreno 405 GPU and 2 GB of RAM. It is powered by a 2910 mAh non-removable Li-Ion battery and it is available in 16 GB single-sim and 32 GB dual-sim versions.\nSoftware.\nThe Idol 3 lineup comes with Android Lollipop 5.0 with customized icons and a few added features such as the option to use the phone upside-down and FM radio.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688814","title":"Prattsburg, Indiana","body":"\nPrattsburg, Indiana\n\nPrattsburg is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nA post office opened at Prattsburg in 1849, and remained in operation until it was discontinued in 1857. A member of the local Pratt family was postmaster, giving the community its name.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688815","title":"Mudface (Redman album)","body":"\nMudface (Redman album)\n\nMudface is the eighth studio album by American rapper Redman. The album was released on November 13, 2015, by Gilla House Records.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688819","title":"Blue Diamond (Iceland)","body":"\nBlue Diamond (Iceland)\n\nThe Blue Diamond is the fastest-growing tourist route in Iceland covering about 50 km looping from Reykjavik into the Reykjanes Peninsula and back. Also straight from the International Airport into the diamond route. Tours and travel related activities in this route are rapidly growing in Iceland. The Blue Diamond route is situated in the Reykjanes Geopark area which is a member of the Geoparks Network - an area with geological heritage of international significance - advancing the protection and use of geological heritage in a sustainable way and promoting awareness of key issues facing society in the context of the dynamic planet we all live on. The peninsula, with its diversity of volcanic and geothermal activity is the only place in the world where the Mid-Atlantic Ridge is visible above sea level. The primary stops on the Blue Diamond route in the Reykjanes Geopark are Gunnuhver (largest mud geyser in Iceland), Valahnúkur, Walk inside a crater – Stamparnir, The Raven Rift (just like in Þingvellir – Almannagjá), The Bridge Between Continents, Reykjanes lighthouse, Friðrik VIII, Presidents hill, Fire Island, Krísuvík, Seltún, Vikingworld, Kvikan - House of Culture and Natural Resources and the Blue Lagoon. Other stops include The Icelandic Museum of Rock 'n' Roll, Duushús - Culture- and art center, Sudurnes Science and Learning Center Sandgerði, Flösin Garðskaga, Stafnes church and the Svartsengi and Reykjanesvirkjun geothermal power plants.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688820","title":"Keraudrenia hermanniifolia","body":"\nKeraudrenia hermanniifolia\n\nKeraudrenia hermanniifolia is a shrub of the family Malvaceae native to Western Australia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688825","title":"Keraudrenia velutina","body":"\nKeraudrenia velutina\n\nKeraudrenia velutina is a shrub of the family Malvaceae native to Australia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688827","title":"Thurston's Hall","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48688835","title":"Amedeo Kleva","body":"\nAmedeo Kleva\n\nAmedeo Kleva (6 February 1923 – 22 June 1996) was an Italian footballer who played as a defender. He spent his career in Bulgaria and earned two caps for the Bulgarian national team. At club level, Kleva won three A Group titles and two Bulgarian Cups with Levski Sofia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688844","title":"Eokinorhynchus","body":"\nEokinorhynchus\n\nEokinorhynchus is a Cambrian ecdysozoan known from three Orsten-type Small Shelly Fossils. It is interpreted as a stem-group Kinorhynch.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688853","title":"Saint Magdalen, Indiana","body":"\nSaint Magdalen, Indiana\n\nSaint Magdalen is a former town in Ripley County, in the U.S. state of Indiana. The GNIS classifies it as a populated place.\nHistory.\nA post office opened under the name Saint Magdalen in 1871, and remained in operation until 1905. The community was named after Mary Magdalene.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688856","title":"Demet (magazine)","body":"\nDemet (magazine)\n\nThe Ottoman women's magazine Demet (\"floral bouquet\") was founded in 1908 in Istanbul, two weeks after the proclamation of the Second Constitutional Era. Altogether, seven issues exist; they were published once a week. Editor-in-chief and publisher was Celāl Sāhir (1883–1935). Even though the magazine was aimed at women, the editorial team of the first two issues was made up exclusively of men, such as Mehmet Akif Ersoy (1873–1936), Selim Sırrı (Tarcan) (1874–1957), and Enis Avni (1886-1958). Among the female writers were later Halide Salih Hanımlar (Halide Edip, 1884–1964), Nigar Bint-i Osman (1862–1918), and İsmet Hakkı Hanım. In addition to literary and scientific articles, what interested the female readers most were political publications. Besides Kadınlar Dünyası (1913–1921), Maḥāsin (1908–1910), and Kadın (1908–1910), Demet is considered one of the first and most important women's magazines in the Second Constitutional Era.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688870","title":"La Esperanza Airport","body":"\nLa Esperanza Airport\n\nLa Esperanza Airport may refer to following airports in Latin America:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688877","title":"Stumpke Corner, Indiana","body":"\nStumpke Corner, Indiana\n\nStumpke Corner is an unincorporated community in Ripley County, in the U.S. state of Indiana.\nHistory.\nA post office was established at Stumpke Corner in 1878, and remained in operation until 1895. Henry Stumke served as postmaster, and gave the community his name.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688883","title":"Anne Milano Appel","body":"\nAnne Milano Appel\n\nAnne Milano Appel is an American translator of Italian literature. She obtained a doctorate in Romance languages from Rutgers University in 1970. She has translated, among others, works by Claudio Magris, Paolo Giordano, Giovanni Arpino and Goliarda Sapienza. She was awarded the John Florio Prize in 2012 for her translation of Arpino's \"Scent of a Woman\". She is also working on English translations of Giordano’s \"Like Family\" (December 2015, Pamela Dorman Books/Viking), \"Syrian Dust\" by Francesca Borri (March 2016, Seven Stories Press) and \"Don't Tell Me You're Afraid\" by Giuseppe Catozzella (August 2016, Penguin Press).\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688929","title":"R. Maslyn Williams","body":"\nR. Maslyn Williams\n\nRobert Ronald Maslyn Williams (20 February 1911 – 11 August 1999) was an Australian documentary filmmaker and writer.\nHe was born in England and moved to Australia in the 1920s, where he grew up in the New England and Southern Highlands districts of New South Wales. He studied at the Conservatorium of Music in Sydney and worked as a journalist before going into filmmaking.\nIn 1940, he joined the Official War Film and Photographic Unit as a writer-producer and served under Frank Hurley in the Middle East. He worked for the Australian Information Bureau in New York in 1945 and the Canadian Film Board in 1946.\nIn 1962 he left filmmaking and became a writer.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688939","title":"William Frederick Windham","body":"\nWilliam Frederick Windham\n\nWilliam Frederick Windham (1840–1866) was the son of William Howe Windham and the heir to Felbrigg Hall in Norfolk. He was the subject of a famous lunacy case after he married a woman of whom his uncle did not approve.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688944","title":"New Guinea Patrol","body":"\nNew Guinea Patrol\n\nNew Guinea Patrol is a 1958 Australian documentary film produced by R. Maslyn Williams.\nThe film is regarded as a classic.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688947","title":"Truth and Advertising","body":"\nTruth and Advertising\n\n\"Truth and Advertising\" is the ninth episode of the nineteenth season and the 266th overall episode of the animated television series \"South Park\", written and directed by series co-creator Trey Parker. It is the second part of a three-episode story arc which began with the previous episode \"Sponsored Content\" and concludes with the following episode \"PC Principal Final Justice\" that together serve as the season finale. It premiered on Comedy Central on December 2, 2015. Like the previous episode, this episode continues to parody the abundance of online advertising while continuing its season-long lampoon of political correctness.\nPlot.\nAfter Kyle is called to the principal's office, he finds Mr. Mackey there instead who tells him that PC Principal has lost his mind, with him and his fellow fraternity members going on a hunger strike and that Jimmy and Leslie have both gone missing. Meanwhile, Jimmy explains about how ads have evolved over time, becoming smarter and taking human form, in which Leslie is one of them.\nRandy and his family are eating dinner when Randy proposes that the family move out of South Park because it \"sucks\" now. After dinner, Randy explains to Sharon that ever since South Park's revitalization, it has become too expensive to live in and he has taken out a second mortgage on the house to help pay for the expenses. Back at the news base, Jimmy is talking to the newsmen about how he has become attracted to Leslie, despite her being an ad. The newsmen tell him that an ad's purpose is to entice and manipulate people. 
Jimmy suggests posting the story to the school's newspaper, but is rebuffed as the newsmen tell him to just figure out what the ads are planning.\nAt South Park Elementary, Stan runs up to Kyle with a school newspaper clipping stating that Principal has sent Jimmy and Leslie on a Disney Cruise for good behavior, but the boys know better as Jimmy was in charge of the school newspaper before being replaced by Nathan. They go to the school newsroom to get answers but are left with nothing after Nathan starts acting stupid to throw them off-course as he directly communicates with the ads on his computer.\nMr. Garrison, Caitlyn Jenner and Principal Victoria arrive at the Whole Foods Market with disguises on and Mr. Garrison is shocked about the state of his town. Back at the news base, Jimmy's attempts to interrogate Leslie fail, leaving him to start accepting her, with the head newsman convinced that he is now \"thinking with his dick\". At Cartman's house, Stan, Kyle, Cartman, Kenny and Butters search through news articles trying to solve the case, but end up at various stores after getting distracted by ads. This leads to some tension between Kyle and Stan who strongly believe the other is causing the distraction on purpose to avoid finding out the truth. Randy is ambushed by Garrison, Jenner and Victoria, who then knock him out after they discover a \"PC\" tattoo on his rump. Back at the base, Leslie tells Jimmy that Principal is the enemy and then places an ad on the newsmen's monitor so they can not see them. While isolated from the newsmen, Leslie asks Jimmy to help her escape.\nAt a motel, Randy wakes up tied to a chair being interrogated by the trio, who explain that the political correctness movement is not only happening in the United States, but internationally as well with PC Principal being the cause of it all, and Randy vows to kill him if this is true. 
Jimmy and Leslie attempt to escape, but are caught by the newsmen with the leader asking Officer Barbrady to kill them both, but Barbrady, not wanting to kill or injure anyone else, aids Jimmy and Leslie in their escape despite accidentally shooting a newsman in the shoulder. At the school, mutual suspicion between Kyle and Stan leads to the two to start arguing and then turning into a physical confrontation.\nAt the school newsroom, Jimmy and Leslie confront Nathan about his lies, but Leslie betrays Jimmy and brutally assaults him, revealing the fact that Nathan is one of the agents of Leslie and the other ads and proving the newsmen were correct in their warnings to Jimmy not to trust Leslie. At the fraternity house, Randy, Garrison, Jenner and Victoria discover the place abandoned before discovering a computer that Principal used to see the ad featuring him and Leslie. They come to the conclusion that Principal may be trying to help, but they get distracted after looking through the computer and end up at a store just as the boys did earlier. Leslie goes to Kyle's house to ask for his help and last four digits of his Social Security number, and they leave together.\nCritical reception.\nIGN's Max Nicholson gave the episode a 7.2 out of 10, and stated the episode \"was a little sluggish, especially in terms of the main plot. While Jimmy and Leslie's storyline made some headway on that front, the boys came up empty-handed in their investigation -- although their sudden transitions to consumerist hotspots were really funny.\" Writing for The A. V. Club, Dan Caffrey rated the episode a B, and stated in his review \"it's a chapter of the increasingly epic season 19 that relies almost entirely on cryptic intentions, shifting allegiances, and general confusion among the characters as they try to unravel who’s really behind the recent madness around town.\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688956","title":"Isopogon uncinatus","body":"\nIsopogon uncinatus\n\nIsopogon uncinatus is a small shrub of the family Proteaceae that is endemic to the south coast of Western Australia around Albany.\nTaxonomy.\nThe species was first formally described by botanist Robert Brown in 1830, based on material collected by William Baxter at King George's Sound. In 1891, German botanist Otto Kuntze published \"Revisio generum plantarum\", his response to what he perceived as a lack of method in existing nomenclatural practice. Because \"Isopogon\" was based on \"Isopogon anemonifolius\", and that species had already been placed by Richard Salisbury in the segregate genus \"Atylus\" in 1807, Kuntze revived the latter genus on the grounds of priority, and made the new combination \"Atylus uncinatus\" for this species. However, Kuntze's revisionary program was not accepted by the majority of botanists. Ultimately, the genus \"Isopogon\" was nomenclaturally conserved over \"Atylus\" by the International Botanical Congress of 1905.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688966","title":"Isopogon teretifolius","body":"\nIsopogon teretifolius\n\nIsopogon teretifolius, commonly known as the nodding coneflower, is a small shrub of the family Proteaceae that is endemic to the southwest of Western Australia.\nTaxonomy.\n\"Isopogon teretifolius\" was first described by Robert Brown in 1810. In 1891, German botanist Otto Kuntze published \"Revisio generum plantarum\", his response to what he perceived as a lack of method in existing nomenclatural practice. Because \"Isopogon\" was based on \"Isopogon anemonifolius\", and that species had already been placed by Richard Salisbury in the segregate genus \"Atylus\" in 1807, Kuntze revived the latter genus on the grounds of priority, and made the new combination \"Atylus teretifolius\" for this species. However, Kuntze's revisionary program was not accepted by the majority of botanists. Ultimately, the genus \"Isopogon\" was nomenclaturally conserved over \"Atylus\" by the International Botanical Congress of 1905.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688968","title":"Breedenbroek","body":"\nBreedenbroek\n\nBreedenbroek is a small Dutch village in the Achterhoek region in the Gelderland province, near the town Dinxperlo, Netherlands. It is located some 3 kilometres from the German border. Since the municipal rearrangement in 2010, Breedenbroek is a part of the municipality Oude IJsselstreek.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688971","title":"Sharmili Ahmed","body":"\nSharmili Ahmed\n\nSharmili Ahmed (born May 8, 1947 as Majeda Mullick) is a Bangladeshi television and film actress. She started her acting career in 1968.\nEarly life.\nAhmed was born in Belur Chok Village, Murshidabad. She passed matriculation examination from Rajshahi PN Girls High School.\nCareer.\nAhmed worked in \"Dompoti\", the first drama serial in the history of Bangladesh Television. She acted in a mother role for the first time in the drama \"Agun\", directed by Mohammad Mohsin in 1976.\nPersonal life.\nAhmed has a daughter Tanima. She has a younger sister theatre actor and activist Wahida Mollick Jolly.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688978","title":"Isopogon spathulatus","body":"\nIsopogon spathulatus\n\nIsopogon spathulatus is a small shrub of the family Proteaceae that is endemic to the southwest of Western Australia.\nTaxonomy.\nThe species was first formally described by botanist Robert Brown in 1830, based on material collected by William Baxter at King George's Sound. In 1891, German botanist Otto Kuntze published \"Revisio generum plantarum\", his response to what he perceived as a lack of method in existing nomenclatural practice. Because \"Isopogon\" was based on \"Isopogon anemonifolius\", and that species had already been placed by Richard Salisbury in the segregate genus \"Atylus\" in 1807, Kuntze revived the latter genus on the grounds of priority, and made the new combination \"Atylus spathulatus\" for this species. However, Kuntze's revisionary program was not accepted by the majority of botanists. Ultimately, the genus \"Isopogon\" was nomenclaturally conserved over \"Atylus\" by the International Botanical Congress of 1905.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688989","title":"Paeroa–Pokeno Line","body":"\nPaeroa–Pokeno Line\n\nThe proposed Paeroa-Pokeno railway line or deviation in the North Island of New Zealand between Paeroa and Pokeno was a favorite scheme in the 1920s and 1930s. When work started in 1938, it was said that the proposed line, which had been surveyed 18 years earlier, would shorten the distance from Auckland to towns on the ECMT by nearly . But it \"never quite got off the ground\", although some 13 km of formation was carried out from 1938 after Bob Semple turned the first sod on 27 January. Very little is now visible.\nThe Kaimai Tunnel relegated this section to ghost status; in August 1962 a deviation from Wahora to Apata passing under the Kaimai Range in a long (8.85 km) tunnel was approved . Work on the tunnel did not commence until 1969. With the opening of the tunnel in 1978, the Paeroa - Katikati section of the East Coast Main Trunk was closed\nOriginally the line was to be the first part of the East Coast Main Trunk Railway crossing the Bay of Plenty to Opotiki and then inland to Gisborne via the Moutohora Branch.\nIn 2014 the New Zealand First political party included a proposal to investigate a Pokeno-Paeroa-Te Aroha-Kaimai tunnel line as part of its transport policy. The proposal consists of completing the uncompleted Pokeno-Paeroa line, re-using part of the former Thames Branch between Paeroa and Te Aroha and a new link between Te Aroha and the western portal of the Kaimai tunnel, altogether creating a more direct link along a faster route, providing more capacity on the very busy rail freight corridor between Auckland and Tauranga, together with linking the towns of Maramarua, Ngatea, Paeroa and Te Aroha as potential future satellite suburbs of Auckland on a new commuter rail service route between Auckland and Tauranga.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48688992","title":"Moorim School","body":"\nMoorim School\n\nMoorim School () is a 2016 South Korean television series starring Lee Hyun-woo, Lee Hong-bin, Seo Ye-ji and Jung Yoo-jin. It started airing from January 11, 2016 on KBS2 every Monday and Tuesday at 21:55 KST. The drama is set around the mysterious Moorim Institute which teaches its students virtues including honesty, faith, sacrifice and communication. The teachers and students at the school come from different countries and each have their own stories.\nPlot.\nMoorim Institute isn't focused solely on high academic scores. The school teaches its students virtues including honesty, faith, sacrifice and communication. The teachers and students at the school come from different countries and each have their own stories.\nYoon Shi-woo (Lee Hyun-woo) is a famous idol, but as he is suffering from his hearing loss, his CEO tries to get rid of him by making him get involved in a scandal with a female rookie idol. As the public starts to hate him, he comes to Moorim School and hopes that he would be cured. \nWang Chi-ang (Lee Hong-bin) is the son of a rich Chinese man, but he is an illegitimate son who was born from a Korean mother. He meets Shim Soon-duk (Seo Ye-ji) and decide to go to Moorim School with her.\nSoundtrack.\nPart. 1.\nMoorim School’s main theme song “Alive” by South Korean boy band VIXX along with Part One was released on January 18, 2016. \nPart. 2.\nMoorim School OST Part. 2 was released on February 1, 2016. It features the title song “The King“ by VIXX. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689000","title":"Isopogon polycephalus","body":"\nIsopogon polycephalus\n\nIsopogon polycephalus, commonly known as the clustered coneflower, is a small shrub of the family Proteaceae that is endemic to the southern Western Australia.\nTaxonomy.\nIt was first described by Robert Brown in 1810. In 1891, German botanist Otto Kuntze published \"Revisio generum plantarum\", his response to what he perceived as a lack of method in existing nomenclatural practice. Because \"Isopogon\" was based on \"Isopogon anemonifolius\", and that species had already been placed by Richard Salisbury in the segregate genus \"Atylus\" in 1807, Kuntze revived the latter genus on the grounds of priority, and made the new combination \"Atylus polycephalus\" for this species. However, Kuntze's revisionary program was not accepted by the majority of botanists. Ultimately, the genus \"Isopogon\" was nomenclaturally conserved over \"Atylus\" by the International Botanical Congress of 1905.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689002","title":"Francesca Borri","body":"\nFrancesca Borri\n\nFrancesca Borri (born 1980) is an Italian journalist and writer. \nLife.\nShe studied in Florence and Pisa and has worked in the Balkans and the Middle East. Her first book \"Non aprire mai\" (2008) was a study of the conflict in Kosovo. \nIn 2010, she published a book on the Israel-Palestine conflict titled \"Qualcuno con cui parlare. Israeliani e Palestinesi\". \nIn 2012, she began reporting from Syria. Her latest work \"La guerra dentro\", a work of reportage on the Syrian civil war, has received widespread acclaim. An English translation by Anne Milano Appel is due to be published in 2016, under the title \"Syrian Dust\".\nBorri writes regularly for \"Il Fatto Quotidiano\", \"Internazionale,\" and Al-Monitor.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689009","title":"Varsselder","body":"\nVarsselder\n\nVarsselder is a Dutch village with nearly 700 inhabitants, situated in the Gelderlandish Achterhoek, in the municipality Oude IJsselstreek. It lies on the road from Ulft to 's-Heerenberg, directly on the west of Ulft.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689016","title":"Isopogon drummondii","body":"\nIsopogon drummondii\n\nIsopogon drummondii is a small shrub of the family Proteaceae that is endemic to the southwest of Western Australia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689017","title":"James Arthur Bayton","body":"\nJames Arthur Bayton\n\nJames Arthur Bayton (April 5, 1912 – August, 1990) was an American psychologist. He conducted research in areas of personality, race, social issues, and consumer psychology.\nEarly life and education.\nJames Arthur Bayton was born on April 5, 1912 in Whitestone, Virginia to George and Helen Bayton. His father, a physician, had graduated from the medical school at Howard University. Bayton graduated from Temple University’s high school in 1931 and subsequently matriculated at Howard University as a Chemistry major. Bayton began his undergraduate career planning to go into medicine, however, taking psychology courses taught by Francis Sumner, Max Meenes, and Frederick Watts sparked Bayton's interest in the behavioral sciences. During his undergraduate career, Bayton was a member of the Omega Psi Phi fraternity. Bayton graduated from Howard in 1935 with a B.A in psychology and began his M.S. studies at Howard. After graduating from the M.S. program, Bayton began further graduate study at Colombia University, where he was taught by R. S. Woodworth and A. T. Poffenberger. When Bayton’s father died, Bayton moved back to Philadelphia in order to be closer to his family. He transferred to the University of Pennsylvania and continued his graduate studies under psychologists such as L. Witmer, S. W. Fernberger, M. G. Preston, and M. Viteles. While conducting his doctorate studies, Bayton was offered a teaching position at Virginia State College. Partly due to the financial devastation of the Great Depression, Bayton delayed his graduate studies and became an associate professor of psychology from 1939 to 1943. During this time he published several papers, and was finally awarded his Ph.D. in psychology in 1943.\nCareer.\nFrom 1943-1945, during World War II, Bayton worked as a social service analyst for the U.S Department of Agriculture. 
Afterward, he became a professor of psychology at Southern University in Louisiana. He taught at Morgan State College in Maryland in 1946 and returned to Howard University as a professor in 1947, where he worked for the remainder of his life. He was the head of the Psychology Department from 1966–1970, as well as a graduate research professor from 1982-1988. From 1948-1953, Bayton also worked part-time in the U.S Department of Agriculture conducting research on consumer behavior. While working at the USDA, Bayton headed a psychological research program focused on policy development and program evaluation, as well as survey programs.\nWhile working as a professor at Howard, Bayton also served as the vice president of National Analysts, Inc. from 1953–1962 and 1966–1967, the vice president of Universal Marketing Research, Inc. from 1962–1966, a senior fellow at the Brookings Institution from 1967–1968, and a staff psychologist at Chilton Research Services from 1968-1976. Working in these positions, he contributed to over 70 corporate sponsored projects. He conducted survey and marking research and focused his work on consumer psychology. He conducted research for Dupont, IMB, Armstrong Cork, Chrysler, Eli Lilly, Curtis Publishing, Johnson and Johnson, Schick, Pet Milk, American Dairy Association, Federal Reserve Board, Smith Kline, Rench, Proctor and Gamble, and the Office of Navel Research. He also was a member of the Research Advisory Committee, Social Security Administration, the United States Department of Health Education and Welfare, and the Advisory Committee on Agricultural Science in theDepartment of Agriculture. He was also the chairman of a committee designed to evaluate equal employment opportunity policies in the National Aeronautics and Space Administration.\nBayton was an expert witness for the National Association for the Advancement of Colored People (NAACP) in several cases of school desegregation and job discrimination. 
He also served as an expert witness for the NAACP Legal Defense Fund. He played an important role in cases of the desegregation of Arlington and Roanoke schools after the “massive resistance” to desegregation headed by U.S Senator Harry F. Byrd, Sr. He also led desegregation sessions for government agriculture extension systems. Continuing in this line of work, Bayton assessed urban police complaint boards, summer youth programs, community relations, and civil rights commissions in relational to desegregation policies. Throughout his career, Bayton directed over 50 government-sponsored projects. Bayton was a fellow of the American Psychological Association, the American Marketing Association, and the National Academy of Public Administration.\nSelected publications.\nBayton addressed overlap in issues of race and class in his 1956 study, “Race-Class Stereotypes.” 92 White and 180 Black college students were asked to choose five adjectives, from a list of 85 words, that described \"upper-class white Americans\", \"upper-class Negroes\", \"lower class white Americans\", and \"lower-class Negroes\" respectively. Generally, the upper-class was characterized as “intelligent, ambitious, industrious, neat, and progressive”, while the lower-class was considered to be “ignorant, lazy, loud, and physically dirty.” The only race difference noted was that White subjects characterized Blacks as musical and ostentatious regardless of class. Overall, the assignment of stereotypes varied more due to class than race. In other words, there were more differences between upper-class and lower class stereotypes than stereotypes between different races of the same class. 
Bayton suggested race differences in stereotyping tasks were partially the product of assumed class differences.\nIn another study conducted by Bayton regarding race and class, 80 Black and 74 White college students were asked to assign traits (chosen from a list of 80 adjectives) to describe the Black lower class, the Black middle class, the White lower class, and the White middle class. The students were asked to choose five or fewer traits for each group and rate the traits on a scale from -5 to +5. Both Whites and Blacks assigned more advantageous traits to the middle as opposed to the lower class (though the effect was larger for White subjects).\nIn his study, “Negro perception of Negro and white personality traits,” Bayton had the Guilford-Zimmermann Temperament Survey administered to 240 Black students at Howard University. The subjects were prompted to answer in the way that they thought the \"average Negro male\", \"average Negro female\", \"average White male\", or \"average White female\" would respond. The survey addressed aspects of temperament such as emotional stability, thoughtfulness, and sociability. The results indicated better personality adjustment when the participants were asked to answer as if they were White. Bayton theorized that this tendency to associate positive temperament with Whites may have resulted from an inclination to “idealize the aggressor” and “incorporate his negative views” towards views of the minority group.\nBayton was prominent amongst the psychologists of his time in his efforts to advance minority group participation in professional psychology. In his article, “Minority groups and careers in psychology” he reported on the National Institute of Mental Health conference in 1969. The major topic discussed at this conference was the issue of how to produce more Black and minority Ph.D.s in psychology. 
Bayton addressed the need for an increased number of minority psychologists in the field in order to develop psychological programs focused on the needs of minority groups. He also referenced the importance of equal opportunity in the field. He reviewed the obstacles to increasing the number of minority psychologists in the field, such as the perception amongst students that psychology is a risky or nontraditional route for a minority member to pursue professionally. He claimed that these students had to be shown that possibilities exist in psychology for minority students, perhaps through the use of brochures or films to be circulated at various institutions. While graduate programs were attempting to recruit Black students in psychology, Bayton suggested that undergraduate psychology programs needed to increase their efforts to attract Black students to the field. He also addressed the issue of quality of education and lack of resources at primarily black institutions. Bayton suggested an attempt to gain federal and private funding for black students at predominately black colleges in order to ensure competent faculty and adequate resources. He proposed requesting funding to create summer programs for undergraduates that could aid in exposure to psychology for minority students at schools lacking psychology programs. He also emphasized the need to continue holding conferences of this nature in the future.\nIn another paper, “Reflections and Suggestions for Further Study Concerning the Higher Education of Negroes,” Bayton reported on another conference that took place in April, 1967. He addressed similar issues regarding how to improve the state of affairs for Black students in higher education.\nThroughout his career, Bayton conducted significant research in the area of consumer behavior. 
His paper, “Motivation, Cognition, Learning—Basic Factors in Consumer Behavior,” drew attention to the role of psychological theories as lenses for research in consumer behavior. While he acknowledged that marketing at the time addressed psychological theories of motivation, he claimed that theories of cognition and learning were neglected in consumer behavior research. Bayton explained the importance of cognitive processes in consumer behavior, for one, by explaining what determines whether or not we remember a particular product. In addressing theories of learning, Bayton outlined the role of reinforcement in determining whether a consumer will purchase a good repeatedly and explained the formation of consumer habits as a lessening of conscious decision-making while making a purchase.\nOther research contributions made by Bayton pertained to sex differences in decision making, issues of race in military settings, Blacks’ decision making in dialysis, Black attitudes regarding kidney transplantation, and Blacks’ blood donation and organ and tissue transplantation.\nLegacy.\nBayton’s research interests were widespread. He furthered psychological research in areas of personality, race, social issues, and consumer psychology. His research was generally of an applied nature, and thus, his efforts helped increase the scope and depth of applied work in the field of psychology. In particular, several studies conducted by Bayton foreshadowed the emergence of system-justification theory, which addresses the tendency to support the status-quo or the “system,” even when the “system” may not be beneficial to an individual or group. In particular, the idea of out-group favoritism (a subset of system-justification theory), or viewing a high-status group positively and one’s own low-status group more negatively, emerges in Bayton’s research. 
In his study, “Negro perception of Negro and white personality traits,” he found that Black participants perceived Whites as having more positive temperaments than Blacks. He theorized that this bias resulted from a tendency to “idealize the aggressor” and “incorporate his negative views” into participants’ views of their minority group. In other words, out-group favoritism emerged in this study, and the participants appeared to support a racial hierarchy, or “system,” that was not beneficial to these subjects. Additionally, in another of Bayton’s studies, “Evaluative Race-Class Stereotypes by Race and Perceived Class of Subjects,” subjects assigned more advantageous traits to the middle as opposed to the lower class regardless of their own class. This study also illustrates a tendency for people to justify the \"system\", or in other words, support the American ideal of a social meritocracy whether or not this \"system\" is truly just or beneficial to them.\nAdditionally, Bayton made important efforts throughout his career to increase the number of minorities in psychology and improve educational opportunities for Black people.\nAccording to Sherman Ross and Leslie H. Hicks of Howard University, Bayton was “always responsive to students and colleagues” and was “never too busy or uninterested.” They also described him as a “model professor and researcher.” \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689029","title":"Grevillea depauperata","body":"\nGrevillea depauperata\n\nGrevillea depauperata is a shrub of the family Proteaceae that is endemic to the southwest of Western Australia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689041","title":"Grevillea fasciculata","body":"\nGrevillea fasciculata\n\nGrevillea fasciculata is a shrub of the family Proteaceae that is endemic to the southwest of Western Australia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689050","title":"Grevillea mimosoides","body":"\nGrevillea mimosoides\n\nGrevillea mimosoides is a shrub of the family Proteaceae that is endemic to the north of Western Australia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689055","title":"Diamond Records (Hong Kong)","body":"\nDiamond Records (Hong Kong)\n\nDiamond Records was an important record label for Hong Kong and the far East. It featured a good amount of Hong Kong's most popular recording acts and attractions in it's catalogue.\nBackground.\nDiamond Records was an independent label which was established in or around 1960 by Portuguese merchant, Ren da Silva. In the early 1960s, they produced a run of albums that featured original Mandarin and English compositions. Also English songs were sung in Mandarin and Mandarin songs were sung in English. Two recording artists that were an example of this were Kong Ling and Mona Fong. Both Ling and Fong had Hong Kong's leading pianist Celso Carrillo as arranger on their early Diamond albums.\nAffiliations.\nIn the early 1960s, Diamond was the only record pressing in the area at the time. It handled Mercury Record Corporation product on a licensing agreement basis. Taking a trip to the U.S., managing director da Silva visited the Chicago Mercury headquarters in August 1961 to discuss expansion in the area for manufacturing plant and distribution facilities. He also was in the U.S. to meet with Willem Langenberg the head of Philips group to discuss the coordination of a three way arrangement that would involve Mercury, Philips and Diamond.\nArtists.\nRock bands.\nIn the mid-1960s the label started taking on guitar driven bands such as Philip Chan and the Astronotes, Danny Diaz and the Checkmates, Teddy Robin and the Playboys, and The Anders Nelsson group. Later on, other bands such as the Sam Hui fronted Lotus, The Mystics, The Zoundcrackers, D’Topnotes, The Downbeats, Joe Jr. and the Side Effects, Mod East, Sons of Han, and The Menace had recordings issued on the label. \nArrangers and session musicians.\nCelso Carrillo.\nCelso Carrillo, a pianist from the Philippines was born on January 9, 1924. 
Along with Tony Carpio, Andy Hidalgo, and Nick Domingo, he was one of the many musicians from the Philippines that had made careers in Hong Kong. He had worked as an arranger, backing musician on various recordings by artists on the Diamond label. For a period of time, he was Hong Kong's leading pianist His band backed Kong Ling on her \"Hong Kong Presents ... Off-Beat Cha Cha\" album. In addition to playing piano and handling the arrangements, he also played conga and cow bell on various tracks. Another album for Diamond which he worked on, which was in the same vein as Kong Ling's was \"Mona Fong Meets Carding Cruz\". The backing was by the Carding Cruz band and the arrangements were by Celso Carrillo. Philippino singer Carmen Soriano, credits him with him with giving her the inspiration and training to sing when she was lacking in confidence and repertoire while in Hong Kong. At the time he was the band leader at the club and told her to give it a try just for the novelty of it. The result was her singing for a few months at the Winner House club in Hong Kong. Another singer that Carillo backed was Lita Mendoza. He died on 26th December 1988.\nAt one time he was also once president of the Philippine Musicians League.\nLater years.\nIn 1970, the label was acquired by Polydor.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689065","title":"Grevillea anethifolia","body":"\nGrevillea anethifolia\n\nGrevillea anethifolia is a shrub of the family Proteaceae that is endemic to Western Australia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689078","title":"1972–73 Dumbarton F.C. season","body":"\n1972–73 Dumbarton F.C. season\n\nSeason 1972–73 was the 96th football season in which Dumbarton competed at a Scottish national level, entering the Scottish Football League for the 66th time, the Scottish Cup for the 78th time and the Scottish League Cup for the 26th time.\nOverview.\nThe first season back in the top flight of Scottish football was always going to be a challenge, and the only real measure of success would be survival - and this is exactly what Dumbarton achieved. However it took until the final league game of the season to guarantee first division football next season. Lying in 17th place, Dumbarton had to better any result that Kilmarnock managed to leap-frog them out of the relegation places, and Dumbarton did this with some style, beating Dundee United 4-1, while Kilmarnock could only manage a 2-2 draw with Falkirk. \nIn the Scottish Cup, Dumbarton lost out to Partick Thistle in the fourth round, after a draw.\nIn the League Cup, two wins and two draws from the six sectional games were enough to qualify for the next stage in the competition, but it was a bitter disappointment to lose to Dundee in the two-legged second round tie - as a 3-0 lead from the home fixture was followed by a 4-0 defeat at Dens Park.\nFor the second season running Dumbarton had qualified for the Drybrough Cup. 
Again Celtic were the opponents in the first round and after a tough struggle they were to lose by only the odd goal in three.\nLocally, in the Stirlingshire Cup, Dumbarton were to regain the trophy by thrashing East Stirling 6-0 in the final.\nNote that just after the New Year, Jackie Stewart would resign as manager, to take up the reins at St Johnstone, and was replaced by Alex Wright.\nResults.\nAll results are written with Dumbarton's score first.\nAppearances.\nDumbarton used 26 players for the 46 League, Scottish Cup, Scottish League Cup and Drybrough Cup matches, as detailed below. Davie Wilson was the only player to feature in every one of these matches.\nReserve Team.\nDumbarton competed in the Scottish Reserve League, and with 9 wins and 10 draws from 34 matches, finished 12th of 18.\nFor the first time in a decade, Dumbarton also entered the Scottish Second XI Cup, and reached the third round before losing out to Dundee by the only goal.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689086","title":"Wildlife of the United Arab Emirates","body":"\nWildlife of the United Arab Emirates\n\nThe wildlife of the United Arab Emirates is the flora and fauna of this country on the eastern side of the Arabian Peninsula and the southern end of the Persian Gulf. The country offers a variety of habitats for wildlife including the coast, offshore islands, mangrove areas, mudflats, salt pans, sand and gravel plains, sand dunes, mountain slopes, wadis and rocky summits.\nBecause the terrain is so varied, it supports a greater number of species of plants and animals than might have been expected in this relatively small country.\nGeography.\nThe United Arab Emirates occupy a corner of Arabia bounded by Saudi Arabia to the west and south, Oman to the east, the Gulf of Oman and Oman to the northeast and the Persian Gulf to the north. The northern coast stretches for about along the southern shore of the Persian Gulf and largely consists of salt pans that extend inland. There are numerous offshore islands, the ownership of some of which is disputed with neighbouring states. To the south is the Rub' al Khali desert, an enormous expanse of billowing sand dunes. Two large oases in the east are the Liwa Oasis, near the undefined border with Saudi Arabia, and Al-Buraimi Oasis at Al Ain. To the east the land rises and becomes mountainous, this being the northern end of the Al Hajar Mountains. Beyond these, the coast on the Gulf of Oman is rugged.\nIn the southeast of the country, near the border with Oman, there is a man-made lake, Lake Zakher, formed as a result of the release of waste water from the desalination plants on which the UAE relies for its freshwater supplies. The lake has formed as the groundwater rose, and many birds now visit the lake.\nFlora.\nA wide range of plants is associated with the many types of habitat in the United Arab Emirates. 
One of these types is sabkha, an area in which salty water has flooded the land shallowly and later evaporated, leaving crusty salt pans. These occur on the western part of the Gulf Coast but also among dunes inland. The plants found on their edges are salt-tolerant members of Salicornioideae and \"Zygophyllum\". At inland sites \"Zygophyllum qatarense\" predominates along with grasses such as \"Aeluropus lagopoides\" and \"Panicum turgidum\". Sandy plains further east along the coast from the sabkha region have occasional dwarf tamarisk trees and such plants as \"Salsola imbricata\" and \"Zygophyllum mandavillei\", and in coastal lagoons, and in creeks further east, the white mangrove is plentiful.\nPlants of the gravel plains further east again include \"Cornulaca monacantha\", \"Crotalaria persica\", \"Calotropis procera\" and \"Taverniera spartea\", and the parasitic desert hyacinth and the desert thumb. As the land rises up towards the mountains, the mesquite tree, an invasive species from Central America, has become established. The plains around Ras al-Khaimah in the northeast of the country, between the mountains and the sea, are the most heavily cultivated part of the country. The mountains have a cooler, more temperate climate and here there is an abundance of Alpine flowers among the rocks, on slopes and in cracks, fissures and wadis.\nFauna.\nOver four hundred species of bird have been recorded in the United Arab Emirates, with about ninety species breeding regularly in the country while the balance are winter visitors, migrants or vagrants. 
The country is on the crossroads of two major migratory routes, one between the Palaearctic and Africa, the other between the Near East and the Indian subcontinent, and the migrants make use of the many types of habitat available.\nAbout 250,000 waders visit the Gulf shores and mudflats at peak migration time; these include the grey plover, the greater and lesser sand plovers, the crab plover, the Kentish plover and the broad-billed sandpiper. The coast, and particularly offshore islands are used by many seabirds. About twenty to thirty percent of the world's Socotra cormorants, about 200,000 birds, breed in the United Arab Emirates, but they are under threat from fishermen who fear for their livelihoods. Sooty gulls breed here, as do red-billed tropicbirds as well as several species of tern; white-cheeked, bridled and lesser crested tern.\nA large number of passerine birds breed in the deserts, salt flats, plains, dunes and mountains. Twelve species of wheatear have been recorded in the country as well as warblers, babblers, rollers, bulbuls, the desert lark and many others. The sooty falcon overwinters in Madagascar and breeds in the United Arab Emirates. Other than this, there are only a small number of raptor species; Bonelli's eagle, barbary falcon, short-toed snake eagle, long-legged buzzard and lappet-faced vulture.\nMany of the large mammals found in the Arabian Peninsula were well-adapted to desert life in the harsh terrain, but were wiped out by human hunting in the last hundred years or so. Hunting is now banned in the United Arab Emirates, but feral goats and donkeys are plentiful and graze indiscriminately, lessening the chance for the native gazelles to recover from their reduced population sizes. Large terrestrial mammals still found in the United Arab Emirates include the Arabian tahr, the Arabian oryx, the sand gazelle and the mountain gazelle. 
Carnivores include the Arabian wolf, the striped hyena, the red fox, the Blanford's fox, the Rüppell's fox, the caracal, the Arabian wildcat, the sand cat and the Arabian leopard. Other mammals include the Cape hare, the Brandt's hedgehog, the desert hedgehog and the long-eared hedgehog.\nThe Egyptian fruit bat is found here during most of the year, but moves around according to the availability of fruit. Insectivorous bats include the sac-winged bat, the mouse-tailed bat and the leaf-nosed bat. Small rodents include the lesser Egyptian jerboa, the Cheesman's gerbil and the Balochistan gerbil. Rather larger rodents are the Libyan jird and the Sundevall's jird which both favour desert habitats. The Cairo spiny mouse was found in the mountains for the first time in 1995.\nOver 54 species of terrestrial reptile have been recorded in the UAE. These include a large number of lizards, found in all environments from desert, to city, to mountain-top, and a single species of worm lizard. There are thirteen species of terrestrial snake, some of the largest being the sand boa, the saw-scaled viper and the horned viper, and four species of sea snake as well as green sea turtles present in the Persian Gulf. There are two species of amphibian in the United Arab Emirates, the Arabian toad and the Dhofar toad; the former is more commonly seen as the Dhofar toad is nocturnal.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689087","title":"Grevillea baxteri","body":"\nGrevillea baxteri\n\nGrevillea baxteri, commonly known as the Cape Arid grevillea, is a shrub of the family Proteaceae that is endemic to Western Australia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689089","title":"Arca Totok Kerot","body":"\nArca Totok Kerot\n\nArca Totok Kerot or Recå Thothokkerot IPA: [rətʃɔ ʈɔʈɔʔ kərɔt] is a statue (Jav. \"arcå\" or \"recå\" means \"statue\") located in Bulusari Village, Pagu District, Kediri Regency, Indonesia; about 2 kilometers north-east of Simpang Lima Gumul. It is made of andesite stone, depicting a giant with a terrifying face. The style is of a dvarapala. Based on the style, it is suggested that it was made in the 10th century.\nPhysical features.\nThe face and other ornaments also suggest that it is a representation of a female \"butå\". This is unusual since most dvarapala statues show male characteristics. Arca Totok Kerot is 3 meters tall.\nThe hair is matted, covering the upper part of the back. A kind of tiara with a glimpse of skull is seen above forehead, covering also the ears. The eyes are protruding, creating a terrifying effect, as if it were angry.\nLike many other dvarapala statues, it kneels on one knee. The left knee touches the ground while the right knee is erected, on which the right hand is laid. The left hand is missing, so it is unknown if it originally held a \"gådå\" (mace) like other dvarapala statues. All hands and legs are wearing \"binggêl\" (bracelets).\nThe nipples are clearly shown on the breast, another indication that it is female. It wears a necklace of skulls, usually worn by worshippers of Durga or Shiva. A girdle is encircling its waist, on which some kind of skirt is hanging.\nDiscovery and excavation.\nThe statue was discovered in 1981.\nIn 2013, due to an imminent plan by the local government to enlarge the road near Arca Totok Kerot, an excavation was hastily carried out searching for other archaeological remains. The excavation was conducted by East Java Hall of Cultural Heritage Preservation (\"Balai Pelestarian Cagar Budaya Jawa Timur\"). 
The possibility was considered because dvarapala statues were usually placed to guard a temple complex or other important sites.\nThe excavation took place for six days. The team dug with average 1.5 meters into the surrounding ground, in some points even 4 meters. However, no other archaeological remains were found. Eventually the excavation was terminated and the cavities were filled. The road in front of the statue was then enlarged.\nFolklore related to the statue.\nTales were abound surrounding the statue. Some were already documented and many others were still transmitted orally. Some tales related the statue to the legendary character Calon Arang, but such connection was refuted by Timoer (1981). Others were connected to the legendary king Jayabaya (Santosa, 2005).\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689098","title":"Grevillea cunninghamii","body":"\nGrevillea cunninghamii\n\nGrevillea cunninghamii is a shrub of the family Proteaceae that is endemic to the Kimberley region of Western Australia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689108","title":"Grevillea dryandri","body":"\nGrevillea dryandri\n\nGrevillea dryandri is a shrub of the family Proteaceae that is endemic to Western Australia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689115","title":"Ischiopsopha wallacei yorkiana","body":"\nIschiopsopha wallacei yorkiana\n\nIschiopsopha wallacei yorkiana are beetles in Australia from the family Scarabaeidae, subfamily Cetoniinae, tribe Schizorhinini. It is a sub-species of \"Ischiopsopha wallacei.\"\nThe \"Cetoniinae\" scarabs are known as \"flower chafers\" as their main food is pollen and nectar sourced from flowers.\nDescription.\n\"Ischiopsopha wallacei\" can reach a length of about 30 mm. The beetles are an electric green colour, and have the tip of the scutellum visible.\nDistribution.\nThis species inhabits the Cape York Peninsula region of Australia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689128","title":"Ju Zheng","body":"\nJu Zheng\n\nJu Zheng (; November 8, 1876 – November 23, 1951) was a Chinese politician who was a leader in the Chinese Nationalist Party, or KMT, in the 1930s and 1940s. As president of the Judicial Yuan, he administered China's court system from 1932 to 1948. He ran in the presidential election of 1948 as the token opponent of Chiang Kai-shek. He was also known by his courtesy name Juesheng (Chueh-sheng).\nLife and career.\nJu was born in Huangzhou in Hubei Province on November 8, 1876. He joined the Tongmenghui, a revolutionary party founded by Sun Yat-sen, while studying law at Nihon University in Japan in 1907. Later, he worked for Chinese-language newspapers in Rangoon and Singapore. He returned to China to work for an anti-Qing revolutionary faction in Hubei. In 1912, he was briefly vice minister of the interior in the Provisional Government in Nanjing with Sun as president. He was commander of the Woosung Forts north of Shanghai during the Second Revolution in July 1913. In 1916, he led an uprising against Yuan Shikai in Shandong and briefly captured the city of Weixian. In 1921, Sun appointed him interior minister for the Nationalist administration in Guangzhou.\nJu was a founding member of the Western Hills Group, formed after Sun died in 1925. This group opposed communist influence in the KMT. Ju was appointed president of the Judicial Yuan by Chiang in 1932. This was one of the five branches of government in the KMT system. In the presidential election of April 20, 1948, Ju was persuaded to oppose Chiang's candidacy and received 10 percent of the vote in the National Assembly, with Chiang elected overwhelmingly. After he resigned as president of the Judicial Yuan on July 1, 1948, Ju was appointed to the Control Yuan, an auditing board. 
When the KMT was defeated by the Chinese Communists in 1949, Ju fled to Taiwan.\nJu co-founded Tamkang College of English, now Tamkang University, in Taipei in 1950. He died on November 23, 1951. Ju Haoran, his son, succeeded him as president of Tamkang. November 8, Ju's birthday, is marked annually as the school's founding day. The school's Chueh Sheng Memorial Library is named in his honor.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689132","title":"Denis Ruddy","body":"\nDenis Ruddy\n\nDenis Ruddy (born 3 April 1950) was a Scottish footballer who played for Clydebank, Dumbarton and Stenhousemuir.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689137","title":"Prečista Krajinska","body":"\nPrečista Krajinska\n\nPrečista Krajinska () is the name for the ruins of a church located in the region of Skadarska Krajina, southern Montenegro. It was the second burial site of Jovan Vladimir, the ruler of Duklja (ca. 1000–1016), after his widow Kosara renewed it and transferred his remains from Prespa. The relics drew many devotees to the church, which became a center of pilgrimage. Kosara was interred in the church, at the feet of her husband, on her request. In around 1215—when Krajina was under the rule of Serbian Grand Prince Stefan Nemanjić—the relics were presumably removed from this church and transported to Dyrrhachium by the troops of Michael I, the despot of Epirus. At that time Despot Michael had briefly captured from Serbia the city of Skadar, which is only about east of the church. The monastery was mentioned in 1417 in a Cetinje manuscript. The Balšić family reconstructed the monastery in the 15th century. The monastery became the seat of a Catholic bishopric, as part of the Catholic-Venetian expansion. The bishop, who was employed in an Orthodox region, saw resistance in the area from the Serbian Orthodox. At the beginning of the 20th century, the population surrounding the Church ruins were Muslims.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689144","title":"Siren of the Tropics","body":"\nSiren of the Tropics\n\nSiren of the Tropics is a 1927 French silent film starring Josephine Baker. Directed by Mario Nalpas and Henri Étiévant and set in the West Indies, the film tells the story of a native girl named Papitou (Baker) who falls in love with a French man named André Berval (Pierre Batcheff). \nPlot.\nThe film is set in a fictional colony called Monte Puebla. Monte Puebla incorporates many colonial stereotypes, with the name suggesting that it could be a Spanish colony, the grass skirts and roofs suggesting a Polynesian influence, and the clothing being a jumble of multiple cultures. The story begins when a rich Parisian man named Marquis Sévéro wishes to marry a woman named Denise, but Denise is in love with an engineer named André Berval. In order to get rid of Berval, Marquis Sévéro sends him to the West Indies as a prospector, promising that he can marry Denise once he returns. After arriving in the West Indies, Berval meets a woman named Papitou. Papitou quickly falls in love with him, unaware of the fact that he is planning on marrying Denise upon his return to Paris. When Berval leaves the West Indies to return home Papitou follows him, despite the fact that he has a fiancé. Once she arrives in Paris, Papitou adjusts to city life and finds her true calling as a music hall performer. \nReception.\nPrior to the film's release, newspaper articles detailing Baker's tour through Europe piqued public interest.Following the film's premiere in December of 1927 in Stockholm, it received almost unanimously positive reviews from film critics. The film was screened from December 1927 until July 1928, which was considered an exceptionally long running time. Most of these positive reviews focused on Baker's body, comparing her agile movements to those of animals. 
Following her positive reception in \"Siren of the Tropics\" and increased public interest surrounding her, Baker published an autobiography called \"Les mémoirs de Josephine Baker.\" Following the film's very successful premiere, Baker also had a doll made in her likeness and sold in Stockholm, and starred in a toothpaste commercial. This positive reception of Baker's feature film debut set the stage for her starring roles in the films \"Zouzou\" and \"Princesse Tam-Tam\". \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689148","title":"Wa Senior High Technical School","body":"\nWa Senior High Technical School\n\nWa Senior High Technical School is a coeducational second cycle institution at Wa in the Upper West Region of Ghana. The school, which was formerly called Wa Secondary Technical, houses both day (non-boarding) and boarding students at its premises and is precisely located at Konta opposite the Ghana Water Company.\nHistory.\nThe school was established as a community middle day school in the 1950s. Progressively, the school became a junior secondary school in 1978 and later transformed into a community secondary technical school in 1982. It was formally commissioned as a community day secondary technical school on 30th March 1983. With the enactment of the educational reforms in 2004 the school became known as Wa Senior High Technical School.\nIn 2012 the Ghana Education Service granted the school boarding status following the implementation of several infrastructural developments by the government through the Ghana Education Trust Fund (GETFUND). Currently the school boasts of a student population of about 2200.\nFacilities.\nThe school houses numerous educational facilities that complement the studies of students. The Upper West Region French center is located in the school so French students normally don't face problems with the subject.\nIt has a world standard science laboratory, a library and many other useful facilities. Aside from the school’s science laboratory, the regional science laboratory is also located on the school’s campus.\nCourses.\nThe school offers courses in Science, General Art, Visual Art, Technical and Home Economics.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689154","title":"Tapped Shedding/Cam Shedding","body":"\nTapped Shedding/Cam Shedding\n\nTappet Shedding/Cam Shedding.\nAccording to the Textile Terms and Definitions, \"the control of the movement of heald shafts in weaving simple constructions by means of cams or tappets\" is called Tappet or Cam Shedding.\nClassification: Two types-\n1. Positive Tappet Shedding\n2. Negative Tappet Shedding\n1. Positive Tappet Shedding: Positive Tappet Shedding implies that the heald shafts are both raised and lowered by the tappets.\n2. Negative Tappet Shedding: Negative Tappet Shedding implies that the heald shafts are either raised or lowered by the mechanism but are returned by the action of an external device (usually springs).\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689167","title":"Perci Piétro","body":"\nPerci Piétro\n\nPrince Percia Piétrolungo (born June 29, 1972 in New York City, New York), better known as Perci Piétro, who is an American of Persian and Italian descent. He is a real estate entrepreneur and the founder of OWN Realty and OWN Financial, with principal offices located in Miami, Florida.\nHe is also a direct descendent of the Qajar Dynasty, the Royal Family, which ruled Persia (now Iran) from 1785 to 1925.\nEarly life and Education.\nPiétro was born to Princess Shahnaz Shakoori M.D., after she moved from Iran to become a surgeon in the United States.\nIn his younger years, Piétro became fluent in English, Farsi and Spanish with some background in French and Italian. He attended preparatory school at Rumsey Hall in Washington, Connecticut and then boarding school at Wayland Academy in Beaver Dam, Wisconsin. After he attained his Bachelor of Science Degree from Wright State University in Dayton, Ohio. Later he went on to study at Lynn University in Boca Raton, Florida where he attained a Master of Business Administration Degree (MBA) in International Management.\nCareer.\nAfter graduating from college, Piétro decided to open a lounge in South Beach, Miami. He co-founded W6 Lounge with two other New Yorkers, ensuring the lounge had the feel of a bar in Manhattan.\nAt the time, it was seen as one of the few upscale lounges in Miami, with regular celebrity guests. Following the completion of W6, Piétro was featured in The Miami Hurricane in 2002, discussing how its club catered for students and young professionals. Up to 2001, W6 and Piétro were regarded as a prominent entertainment figure and location in Miami around 2001.\nPiétro remained at the entertainment venue until 2004 when he left to start World Real Estate Exchange, which was a real estate brokerage founded in early 2005. 
As the company grew, it set up affiliates in a number countries, including Istanbul, Dubai, Brazil and the Bahamas. Piétro also developed a niche according to Miami Agent magazine of negotiating bulk deals with developers and then introducing groups of buyers, to assist developers with moving of their inventory.\nWith his next venture as the founder of OWN Realty and OWN Financial, Piétro was featured in Miami Today, as a commentator on the health of the Miami property market in 2011. He spoke about the 2011 upturn in the property market in Miami, stating it was due to a large rise in the number of foreign investment in property at the time. He was quoted \"“For Mexicans and Venezuelans, it’s security issues,” he said. “For Canadians and the English, it’s the exchange rate; for Russians and Germans, the strength of their economies. So there’s a lot of action.”\"\nAfter becoming an International real estate expert, Piétro was made a Certified International Property Specialist, becoming one of just over 1,000 to hold the qualification globally. His work in Miami and the surrounding Florida market, has lead him to be interviewed about the state of the American property market a number of times in recent years.\nFamily.\nPiétro is a great grandson of Mozaffar Al-Din Shah Qajar, who was the fifth Qajar king of Persia. He reigned between the years 1853 and 1907. Piétro’s maternal great grandfather Sarem Al-Saltaneh Sardar Nasser Talesh was the Vali and Hakim of Azerbaijan, Gilan, Mazandaran, Ardabil, Astara, Namin, Rasht and Talesh which made up the Northern region of Persia. After a coup in 1925, the Qajar's rule of Persia came to and end, with the new Pahlavi Dynasty re-naming the country Iran in 1935.\nHis grandfather Jalil Shakoori continued to live in Iran, and served as a Colonel under the last Shah starting in the mid-1940s. Piétro’s mother moved to New York City in the late sixties later bringing her mother and four sisters. 
In 2015, with the passing of his maternal grandmother Shahzadeh Khanoum Akram Sadat Sarem Al-Saltaneh who was the matriarch, Piétro became the patriarch of the family as the only son of her eldest child.\nDespite his family heritage, he has yet to visit Iran, where his ancestors once ruled.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689171","title":"SAB DB-80","body":"\nSAB DB-80\n\nThe SAB DB-80 and SAB DB-81 were single engine, all-metal French light transports aimed at the air mail market whilst carrying two passengers. Identical apart from their engines, they flew in mid-1930.\nDesign.\nIn 1929 Dyle and Bacalan were reformed as Société Aérienne Bordelaise (SAB) who continued to work on its predecessor's designs, distinguished by their DB numbering as well as on their own, which had AB numbers. The DB-80 originated with Dyle and Bacalan but was not flown until 1930, built by SAB. It was Dyle and Bacalan's last design and a small aircraft by their standards but maintained their all-metal tradition.\nThe DB-80 was aimed at the airmail market and was a single engine, high wing aircraft giving easy access by two port-side doors to a well lit cabin with two passenger seats and to a separate mail compartment behind them. The pilot sat ahead of the passengers under the wing leading edge. Two differently engined versions were built: the DB-80 had a Hispano-Suiza 6P six cylinder, upright water-cooled inline and the DB-81 a Lorraine 5Pc five cylinder radial engine. The latter was mounted on a hinged frame for easy servicing. The Hispano engined had a Lamblin radiator on the fuselage underside.\nThe fuselage was built around four longerons, with rectangular frames and covered in longitudinally ribbed duralumin. Its underside was smoothly bellied, its upper side flat. In plan its taper was delayed until aft of the cabin. Its empennage was conventional, with a straight tapered, blunt topped fin and unbalanced rudder, the latter cut away at its base to allow for movement of the one-piece elevator mounted on a triangular tailplane at mid-fuselage height. Like the fuselage, all the tail surfaces were covered with ribbed duralumin.\nThe DB-80 had a fixed, tailwheel undercarriage with track of .The mainwheels were independently mounted and fitted with brakes. 
Each axle was mounted at the lower vertex of a triangular box acting as a cantilever leg, with its upper side hinged from the fuselage longerons. The strengthened forward edge of the structure extended above the hinge and connected to an elastic block housed in a reinforced transverse beam which passed under the cockpit, incorporating shock absorbers.\nThe DB-80's high, cantilever wing was unusual both in its construction and high aspect ratio of 9. In plan it was straight tapered on both edges but with semi-elliptical tips curved particularly on the trailing edges, where its ailerons were full span and broad. The wing was built around three spars, rather than the traditional one or two and the detail of their caps or flanges, rather than the shape of the longitudinal braces or ribs, determined the airfoil profile. A similar but not identical wing structure was used on the Dyle et Bacalan DB-20.\nDevelopment.\nIn late March 1930 the DB-80's test flights were awaiting better weather; a month later tests were underway but the first flight did not take place until 27 June 1930. The Lorraine powered DB-81 flew in August, after which testing of the pair continued successfully though interrupted by SAB test pilot Charles Deschamps' absence at Villacoublay for official trials of the DB-20. In October the DB-80 was re-engined with a Lorraine and renamed DB-81.\nThere is no record of any further examples being built nor of measured performance figures.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689191","title":"José Luis González (composer)","body":"\nJosé Luis González (composer)\n\nJosé Luis González (Capilla de Guadalupe, Jalisco 1937) is a Mexican composer. He studied in Guadalajara at the Escuela Superior Diocesana de Musica.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689201","title":"Diyojen (magazine)","body":"\nDiyojen (magazine)\n\nDiyojen (“Diogenes”) was the first satirical magazine of the Ottoman Empire. The first issue was published in Istanbul on 24th November 1870 by the satirist Teodor Kasap (1835-1905). It appeared weekly over three years and was banned for good in 1873 after 183 issues. Apart from satirical pieces, the magazine became known for its caricatures and the translation of French literature. Kasap, who also worked as a journalist and playwright, published other satirical magazines after the ban. In Haylal (“Fantasy” or “Illusion”), which existed from 1873 until 1877, he used caricatures and satirical articles, among other things, to criticize the arbitrary press law. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689202","title":"Criminal Investigation Department (disambiguation)","body":"\nCriminal Investigation Department (disambiguation)\n\nA Criminal Investigation Department or Crime Investigation Department is a branch of many police forces. It may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689212","title":"Higinio Ruvalcaba","body":"\nHiginio Ruvalcaba\n\nHiginio Ruvalcaba (Yahualica, Jalisco, 11 January 1905 - Mexico City 15 January 1976) was a Mexican violinist and composer. He was leader of the Lener String Quartet with second violin José Smilovitz; viola Herbert Froelich, and Hungarian cellist Imre Hartman.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689256","title":"Shehbal (magazine)","body":"\nShehbal (magazine)\n\nThe Ottoman journal Şehbal (“wing feather” or “wings“) was published in Istanbul between 1909 and 1914. Its publisher Hüseyin Saadeddin Arel (1880–1955), technically a lawyer, was a well-known musicologist and composer of 20th-century classical Turkish music. Altogether 100 numbers were issued every two weeks, at the first and fifteenth day of each Maliye-month respectively, totaling 20 pages. The page format more or less equaling the German DIN-size A3 as well as new printing techniques like the three-color printing with countless photographs and illustrations make the journal especially remarkable.\nThe examples inspiring this journal in its design as well as its content were French magazines like \"Figaro Salon\" or \"L'Illustration\". The journal aimed at propagating spiritual as well as technical progress and at covering a wide range of topics with articles on political and social sciences as well as jurisprudence right up to pieces from the fields of natural sciences, technology and philosophy. Furthermore, female readers were informed on parenting, women’s rights and their role in society. Pages on the latest historical events were part of the journal as were articles on sports and fine arts. Pieces on music were of special importance, they were mostly accounted for by the editor himself, writing under the pseudonym Bedi Mensi. Entertainment pages featured Ottoman as well as English and American stories and novels. In addition to that, several plays and poems of known writers were printed. Numerous contests involved the readers in the production of the journal and were meant to stimulate cultural life. The winners of those contests which had submitted a composition, photographs, caricatures or translations of operas were honored in award presentation ceremonies. 
Also, there was a translation competition in order to translate certain French into Ottoman terms. The 100th issue, coming out on 23 July 1914/10th Temmuz 1330 as a special edition, turned out to be the last issue without prior notice. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689268","title":"Yasmina (film)","body":"\nYasmina (film)\n\nYasmina is a 1927 French silent film directed by André Hugon and starring Camille Bert, Huguette Duflos and Léon Mathot.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689275","title":"ZM Auckland","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48689298","title":"Katten (beach)","body":"\nKatten (beach)\n\nKatten is a municipal beach in Bunnefjorden in the Nordstrand area in Oslo, Norway. The beach is suitable for children and comprises a sheltered, sandy beach, rocks and grassy hills. There are diving boards, swimming ladders, tables and benches, toilets, showers, drinking water and a kiosk. \nThere are very limited parking facilities, but there is a bus stop on Mosseveien right by. In the summer months there is also a separate \"bathing bus\" (busline no. 87). There is also a footpath downhill to Katten from Ljan Station.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689305","title":"New Zealand NBL Rookie of the Year Award","body":"\nNew Zealand NBL Rookie of the Year Award\n\nThe National Basketball League Rookie of the Year is an annual National Basketball League (NBL) award given since the 1992 New Zealand NBL season to the best performing rookie New Zealander of the regular season. The award was originally given to the best Young Player of the Year from 1986 until 1991, with centre Warren Adams winning the award twice within four years. In 1992, forward Pero Cameron won the league's first Rookie of the Year award. This name stood until 2005, when a slight adjustment to the rules saw the Rookie of the Year opened up to any player under the age of 20, with guard Jarrod Kenny (age 19) winning the 2005 Young Player of the Year. This was changed back to Rookie of the Year in 2006, and has remained ever since. Future NBA player, Steven Adams, won the 2011 Rookie of the Year award; Steven is the half-brother of two-time Young Player of the Year, Warren Adams.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689306","title":"Satriano","body":"\nSatriano\n\nSatriano may refer to the following Italian places and jurisdictions :\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689308","title":"ZM Whangarei","body":"\nZM Whangarei\n\nZM Whangarei (also known as 93ZM) is a hit music radio station in Whangarei, New Zealand. It is a station of the ZM network, and is owned and operated by New Zealand Media and Entertainment.\n93ZM started around 1995 as a totally local station broadcasting on 93.1 MHz. 93ZM became a network station after ZM made a return to Auckland with local voice breaks prerecorded in Auckland minutes earlier, however the breakfast show on 93ZM was networked from 89.8ZM in Hamilton between 1998 and 1999. In 2005 93ZM moved from 93.1 to 93.2 MHz and in 2006 93ZM traded places on the Northland radio dial with Radio Hauraki: 93ZM shifted to 95.1 MHz and Hauraki took over ZM's vacated 93.2 MHz frequency. In 2010 ZM in Whangarei moved to 94.8 MHz as part of the government move to re-align radio frequencies around New Zealand.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689324","title":"The Temple of Shadows","body":"\nThe Temple of Shadows\n\nThe Temple of Shadows (French: La vestale du Gange) is a 1927 French silent film directed by André Hugon and starring Camille Bert, Max Tréjean and Georges Melchior.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689338","title":"Muna Al Gurg","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48689353","title":"Baurzhan Baimukhanov","body":"\nBaurzhan Baimukhanov\n\nBaurzhan Amangeldiyevich Baimukhanov (born July 21, 1971, Karagandy region,Kazakh Soviet Socialist Republic) – PhD. in Economics, a well-known business man, Member of the Regional Business Council of the National Chamber of Entrepreneurs, Astana\nEducation.\nIn 1988 he entered the State National University after Al-Farabai, Faculty of History, and graduated therefrom in 1993.\nRight after, he entered the Kaz GUA affiliated Market Institute, Economics Faculty.\nIn 2011 he entered Moscow School of Management SKOLKOVO, Executive MBA program. Successfully defended his graduation project in 2013.\nBiography.\nHe was born on July 21, 1971, Karagandy region, Kazakh Soviet Socialist Republic.\nDuring his study (1993–1995), he started his work in the Regional Foreign Economic Association \"Kazakhstan commerce\" on a position of Chief Specialist.\nFrom May 1996 to March 1997, he performed duties of Senior Manager in the Industrial project department, Kazkommertsbank OJSC.\nIn October 1998, he occupied a position of Director of Corporate and Transportation Service Center, a subsidiary of Republican State Enterprise \"Kazakhstan Temir Zholy\", Astana.\nFrom November 2001 to June 2002, he occupied a position of General Director of Republican State Enterprise \"Kazakhstan Temir Zholy\" and thus became the youngest 30-year-old manager in the history of this company with 125 000 employees and $1.7 bn of annual returns.\nDuring his period of work in Republican State Enterprise \"Kazakhstan Temir Zholy\", he was one of those to draft the Law on railway transport. Adoption of this Law increased competitiveness of Kazakhstan railway transport. His main conclusions were addressed in his PhD thesis defended in 2001.\nFrom June 2002 to July 2003 he acted as chairman of the board of Directors of Dala Group CJSC. 
Within this position, the first logical complex of A class \"Tau Terminal\" was commissioned in Kazakhstan.\nFrom November 2007 to December 2009, he was an independent director, member of the board of directors of Kazakhtelecom JSC.\nIn August 2008 he occupied a position of managing director, Member of the Management Board of Kazakhstani State Asset Management Holding \"Samruk-Kazyna\".\nFrom December 2008 to May 2009, he occupied a position of Executive Director of National Welfare Fund \"Samruk-Kazyna\" JSC.\nFrom June 2009 to January 2011, he acted as General Director of Trading and Transportation Company LLP, and from January 2011 to October 2011 he occupied a position of Vice-President of Mining Company LLP (both companies are within the National Atomic Company Kazatomprom).\nFrom October 2011 to February 2013 he served as Deputy Chairman of the National Economic Chamber \"Atameken Union\". In the framework of the Atameken Union NEC, acted as an initiator of active steps in the liberalization of the market of professional technical education in Kazakhstan.\nIn 2012, with the participation B.A. Baimukhanova, a terminal for liquefied gases \"AEGAZ Terminal\" was commissioned in Kerch (Ukraine), which strengthened the position of Kazakhstani producers of liquefied gases in international markets.\nIn 2013, he was one of the founders of the \"Association of alternative energy sources,\" the Republic of Kazakhstan. The Association initiated and made amendments to the Law \"On supporting of the use of renewable energy sources\", developed regulations that paved the way for widespread use of alternative energy sources in Kazakhstan.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689366","title":"Peterborough railway line","body":"\nPeterborough railway line\n\nThe Peterborough railway line was a railway line in South Australia. It extended from a junction at Roseworthy on the Morgan railway line through Hamley Bridge, Riverton, initially to Burra, then extended to Peterborough on the Port Pirie-Cockburn line.\nThe Burra Burra railway was initially proposed as early as 1850, before any other railways north from Port Adelaide. The first stage, from Roseworthy to Forresters (now Tarlee) was opened on 3 July 1869. It extended to Redruth near Burra, opening on 29 August 1870. The broad gauge line was extended to Terowie (opened 14 December 1880), which had a break of gauge with narrow gauge continuing to Peterborough until the 1970s, when this section was converted to broad gauge. \nRegular passenger services ceased at the end of 1986, with the last passenger train being a ARHS steam train on 19 September 1992. The line north of Burra was removed in 1992-1993. Grain was transported by rail until January 1999, and the entire line has not been used since 2004.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689367","title":"Gladstone railway line","body":"\nGladstone railway line\n\nThe Gladstone railway line was a railway line in South Australia. It extended from a junction at Hamley Bridge on the Peterborough railway line (which provided connection through to Adelaide) through Balaklava and Brinkworth to Gladstone. \nThe earliest part of the Gladstone railway line was the part of the Port Wakefield railway line east and north from Balaklava to Hoyleton. \nThe stage from Hamley Bridge to Balaklava opened on 15 November 1879, meeting the line from Port Wakefield. \nThe Gladstone line was completed as narrow gauge in 1894, reaching Gladstone railway station which was already on the Port Pirie-Cockburn line and a line north to Laura. The Gladstone railway line from Hamley Bridge to Gladstone was converted to broad gauge in 1927 and closed in stages in the late 20th century.\nAs the Balaklava railway station was originally on the Port Wakefield to Hoyleton line, before the railway from Hamley Bridge was built, and the new line entered the town from the southeast, trains using the route between Gladstone and Adelaide needed to change direction at Balaklava, as both the north and south lines entered the station from the east, with Port Wakefield being to the west.\nThe \"Western System\" included the railway from Hamley Bridge to Gladstone, along with the lines from Balaklava through Port Wakefield, Kadina and Wallaroo, and the line from Kadina through Snowtown to Brinkworth. All of these lines were prepared for conversion from narrow to broad gauge in the mid-1920s, with the switch made on 1 August 1927.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689412","title":"1989 Women's European Cricket Cup","body":"\n1989 Women's European Cricket Cup\n\nThe 1989 Women's European Cricket Cup was an international cricket tournament held in Denmark from 19 to 21 July 1989. It was the first edition of the Women's European Championship, and all matches at the tournament held One Day International (ODI) status.\nFour teams participated, with the hosts, Denmark, joined by the three other European members of the International Women's Cricket Council (IWCC) – England, Ireland, and the Netherlands. Denmark was making its ODI debut. The tournament was played using a round-robin format, with England finishing undefeated in its three matches. Two English players, Wendy Watson and Jo Chamberlain, led the tournament in runs and wickets, respectively. All matches were played at the Nykøbing Mors Cricket Club, located in the town of Nykøbing Mors.\nPoints table.\nSource: \nStatistics.\nMost runs.\nThe top five run scorers (total runs) are included in this table.\nSource: \nMost wickets.\nThe top five wicket takers are listed in this table, listed by wickets taken and then by bowling average.\nSource: \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689413","title":"2011–12 Nedbank Cup","body":"\n2011–12 Nedbank Cup\n\nThe Nedbank Cup is a South African club football (soccer) tournament. The knockout tournament, based on the English FA Cup format, was one of a weak opponent facing a stronger one. The competition was sponsored by ABSA until 2007, after which Nedbank took over sponsorship.\nThe winners of the 2011–12 Nedbank Cup, SuperSport United, qualified for the 2013 CAF Confederation Cup.\nFormat.\nThe 16 Premier Soccer League clubs, 8 National First Division teams, as well as 8 teams from the amateur ranks compete for the prize money of R6 million. The winner also qualifies for the CAF Confederation Cup.\nThe preliminary round features all 16 National First Division teams and will be reduced to eight when the teams play on 12 December 2012.\nThe teams are not seeded at any stage, and the first 16 sides drawn out of the hat receive a home-ground advantage. There are no longer any replays in the tournament, and any games which end in a draw after 90 minutes are subject to 30 minutes extra time followed by penalties if necessary.\nTeams.\nThe 32 teams competing in the Nedbank Cup competition are: (listed according to their league that they are playing in).\nResults.\nF.C. Cape Town\nThanda Royal Zulu F.C.\nDynamos\nVasco Da Gama\nPreliminary Round.\nThe preliminary round saw National First Division sides play each other in a knockout round to decide who would compete in the 2012 Nedbank Cup.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689455","title":"GABS Hottest 100 Aussie Craft Beers of the Year","body":"\n60 - Hawthorn Brewing Pale Ale"}
{"url":"https://en.wikipedia.org/wiki?curid=48689461","title":"Victorian Emergency Management Training centre","body":"\nVictorian Emergency Management Training centre\n\nThe Victorian Emergency Management Training Centre (VEMTC) is a training facility for volunteer and career emergency services personnel. It is used by the Metropolitan Fire Brigade, the Country Fire Authority (CFA), Victoria Police, Ambulance Victoria, Victoria State Emergency Service and the Department of Environment and Primary Industries. The centre is located in Melbourne's north in Craigieburn.\nHistory.\n2014.\nThe training centre was completed in June 2014 for $109 million and designed by Woods Bagot.\nIt was built for Melbourne Fire Brigade (MFB) after 2 years of planning.\n2015.\nIt is the Primary training Centre for Melbourne Fire Brigade (MFB) and their recruiting courses and promotional courses are run from VEMTC.\nFollowing the closure of CFA Fiskville training ground due to health and safety reasons, the VEMTC became the primary training facility for CFA new career fire fighters.\nKey features.\nThe 10 hectare facility has a focus on urban emergency incidents with scenarios for the following settings:\nThere is a large seven story building or prop which includes a carpark and numerous other types of environments including an atrium, prison and hospital themes.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689463","title":"Education Partnerships Africa","body":"\nEducation Partnerships Africa\n\nEducation Partnerships Africa is a volunteer-run charity which sends UK university students to work in rural secondary schools in East Africa. It aims to benefit students in East Africa by improving education in its partner schools, and to give personal development opportunities to UK university students. It was established in Kisii in 1990 as The Kenya Project. Since then it has expanded to two further sites: Kakamega in Kenya and Mbarara in Uganda, and now works with around 30 schools each summer.\nSummer project.\nStudent volunteers, known as Project Workers, spend ten weeks during their summer vacation living, either in a pair or trio, in a rural community in Kenya or Uganda. They work in partnership with the school management and local community to identify the most important needs for the school, and how they can best be addressed. These might include investing in sustainable resources, such as library books, science equipment and small infrastructure projects, helping with school management issues, and setting up co-curricular activities. Schools typically receive a minimum of two years of investment from the charity, before being reassessed to establish whether they would benefit from further investment. Volunteers fundraise money in the UK before their visit to cover the costs of the project, which includes the school investment, as well as their own flights, accommodation and living costs.\nSchools.\nIn Kenya EPAfrica works primarily with government funded District Schools. These are schools which any students with acceptable grades can attend, and which do not charge fees for tuition. In Uganda the charity also works with Technical schools which provide more vocational studies. The schools tend to be of medium size, in very rural locations, and to be short of resources, but with the potential to improve. 
Any school meeting the basic criteria can apply and most will receive a visit during the summer to assess their eligibility. In total EPAfrica has worked with over 100 schools in East Africa, investing more than £200,000.\nUK operations.\nEducation Partnerships Africa is a registered charity in the UK. It is run and managed entirely by volunteers, the majority of whom are alumni (i.e. former Project Workers). Each university has its own University Committee, which is responsible for recruiting Project Workers and running training for them throughout the year.\nThe central charity is made up of a number of workstreams, such as Communications, IT and Finance, each headed up by a Workstream Lead. These are overseen by a Management Committee, made up of six volunteers. The strategic direction and governance of the organisation is overseen by a Board of Trustees, all of whom are also volunteers.\nAccording to the Charity Commission the charity has an annual turnover of over £100,000, the majority of which is fundraised by its Project Workers. Because it is run entirely by volunteers the vast majority of this annual turnover is spent directly on its East Africa operations.\nHistory.\nThe charity began life in 1990 as The Kisii Project. In the early 1990s a group of Cambridge University students began teaching in a school in the Kisii area of Western Kenya. By 1995, Kisii Project had been incorporated into Link Africa (now Link Community Development) and extended to another two schools in the region. A few years later, the focus of the project was switched to resource investment to ensure sustainability.\nIn 2002 the project expanded to Oxford University and started sending 20 Project Workers a year to work in 10 schools in Kisii. The two university projects combined as a registered charity under the name The Kenya Project, which was later changed to Kenya Education Partnerships. 
From 2009 the charity began a period of expansion of its UK operations to a number of London universities, starting by recruiting Project Workers from University College London; the project went on to accept applications from all universities in London.\nIn 2008, violence following the disputed 2007 elections in Kenya made it unsafe for volunteers to be sent to Kenya so the charity moved its operations to Uganda for one summer. In 2010 it expanded to working in Kakamega, also in Western Kenya, and in 2013 it permanently expanded its operations to Mbarara in Uganda.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689466","title":"Christian Manrique","body":"\nChristian Manrique\n\nChristian Manrique Valdor (Santander, Spain, 1975) is a civil engineer. Currently he is the CEO and founder at Soulware Global Development. Between 2007- 2011 he became the youngest Chairman of a Spanish Port Authority taking this post in Santander.\nPort Authority of Santander.\nOn September 24, 2007, he was appointed Chairman of the Port Authority of Santander by the Spanish minister of Public Works, Magdalena Álvarez, proposed by the Government of Cantabria.\nWith this appointment, at the age of 31, he turned the youngest Chairman of a Spanish Port Authority ever.\nThe Port Authority is the public institution managing the port of Santander in Cantabria within the bay of Santander.\nMain performances\nBetween 2007 and 2011 the Port Authority took different steps to improve its relation with the city, its citizens and with stakeholders. \nNowadays investment has reached 300 million euros and has allowed the sharing of port facilities and spaces with citizenship. This also meant the construction of the Alejandro Zaera shipping High Performance Centre and the Emilio Botín Arts Centre. The signature of the agreement, on March 19, 2011, was the first step, after a long period of research, to develope new business and recreational areas within the city. By this, different historical parts of the harbour were improved. \nThe deployment of the coal terminal eliminated dust particles that used to surround the city. Also the seed bulk terminal became a major improvement for food tracking. \nNew car shipping routes from different brands -Ford, Tata, Iveco, BMW y MINI, among others- were added to the existing ones to grow activity among port agents. Besides, a new traffic route was settled with Gotteborg, Sweden.\nThe Raos bridge construction became the solution to drive all heavy freight lorry traffic through port facilities. 
\nMotorway of the Sea to the United Kingdom with Brittany Ferries and to Zeebrugge, in Belgium, was enhanced. By doing so, heavy lorry traffic decreased within the area. This also increased road securtiy and improved environmental conditions. \nThe International Centre for Port Technology and Administration (CITAP) for postgraduate studies in logistics and port facilities settled in Santander. The centre has links with the Spanish Cooperation Agency AECID, OEA, Puertos del Estado and Cantabria University.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689472","title":"Space radio station","body":"\nSpace radio station\n\nSpace radio station (short: space station) is – according to \"Article 1.64\" of the International Telecommunication Union's (ITU) RR – defined as \"A station located on an object which is beyond, is intended to go beyond, or has been beyond, the major portion of the Earth's atmosphere\". \nEach \"station\" shall be classified by the service in which it operates permanently or temporarily. However, most \"spacecraft\" communicate by this means. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689473","title":"Macleay Valley Mustangs Rugby league club","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48689475","title":"Mademoiselle Chiffon","body":"\nMademoiselle Chiffon\n\nMademoiselle Chiffon is a 1919 French silent film directed by André Hugon and starring Musidora, Suzanne Munte and Kitty Hott.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689490","title":"Marcin Urbanowski","body":"\nMarcin Urbanowski\n\nMarcin Urbanowski (born 3 March 1987) is a Polish long distance runner.\nCareer.\nFrom 2002-2007, Urbanowski attended the School of Sports Championship in Gdansk. From 2004-2010, he represented Poland in long-distance running. He has participated in international athletics championships. In Polish National Cross-Country Championships, he won a gold medal for cross-country run, five silver medals for 3 km steeplechase and three medals in cross-country runs.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689499","title":"Sucks Blood","body":"\nSucks Blood\n\nSucks Blood is the sixth studio album by the American garage rock band Thee Oh Sees, released on May 15, 2007 on Castle Face Records. The album is the band's second to be released under the name The Oh Sees, and is their final album before changing their name permanently to Thee Oh Sees. \nRelease.\nTo release the album, vocalist and guitarist John Dwyer founded Castle Face Records, alongside Matt Jones and Brian Lee Hughes.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689500","title":"Raaste Pyar Ke","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48689505","title":"Lavant House","body":"\nLavant House\n\nLavant House (or West Lavant House) is an old English estate.\nHistory.\nThe earliest unarguable documentary reference to Lavant House dates to 1762-3. Architectural analysis of the building, its photographic depictions and an eighteenth century watercolour suggest that it was built between 1707 and 1725. The Richard Budgen map of Sussex (1723–24) shows two houses considered worthy of note in the manor of West Lavant, of which one is undoubtedly West Lavant Farm (built in 1711) while the other is likely Lavant House, given that no remains or records document another large house in the area.\nSir John Miller.\nIts first definite owner was Sir John Miller (the 4th Baronet) whose family had been prominent in Chichester first as justices of the peace and mayors then becoming members of parliament from the later 17th century. Sir John had enclosed the ‘park’ at West Lavant by 1740 after which date he may have resided in the first form of Lavant House, its central section.\nThe Duke of Newcastle’s brother (Henry Pelham) wrote to the Duke saying \"you know my thoughts on Sir John he is as friendly and honest as the day is long\". This has to be balanced with the fact that the Second Duke of Richmond could relate to the Duke of Newcastle that Sir John had stated that he did not care a fart for [his father-in-law] Dr. Combs. Sir John is believed to be depicted as a lesser figure in a 1759 painting by George Stubbs showing the Third Duke of Richmond out hunting (this hangs in the front hall at Goodwood House). He died in 1772 and his relict Dame Susanna remained at Lavant House until her death in 1788 when the house was put on the market by her eldest Son (Sir Thomas Miller) who had by then moved to live in Hampshire. 
This was the advertisement in the \"The European magazine, and London Review\".\nThird Duke of Richmond.\nIn 1791 the house was bought by The Third Duke of Richmond who rented it to Lord Bathurst. In 1798 the Duke started work on the house. Apparently this was when the house was reoriented to face north (maps show the drive originally approaching from the south). He appears to have died (in 1806) while the project was underway.\nThe next inhabitant was Henriette Ann Le Clerc, now thought to be the Duke’s illegitimate daughter. Henriette was brought from France by his sister, Lady Louisa Conolly, in 1778 at age 5 to live at her Goodwood estate. His will named her the first beneficiary, receiving life tenure of West Lavant House and Park and other lands and farms. She married Colonel (later General) John Dorrien on 28 March 1808. John and Henriette’s only child, Charles (the traditional Lennox family name), was born in Lavant in January 1809. Following John’s death in 1825, Henriette ran her estate, which she mentions in a series of letters to the Fifth Duke. She remained much of the time at Lavant. Forty years after moving into Lavant House, the Agricultural Gazette announced her death on January 6, 1846.\nThe house then returned to the Goodwood Estate and was rented to a series of tenants.\nTwentieth century.\nIn 1907 the house was sold in 1907 to Mr Morrison and family. He is probably responsible for the dining room decoration.\nThe house was then sold to Major Henry Frederic Low and family. In 1921 his relict sold it to Major Julian Day and Isabella. She then sold the building to the school.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689510","title":"Pokeno Railway Station","body":"\nPokeno Railway Station\n\nThe Pokeno Railway Station is a former railway station in Pokeno on the North Island Main Trunk Line. It opened for passengers on 20 May 1875 and for goods on 6 April 1879. \nThe station closed to passengers on 24 June 1973 and to goods on 30 March 1980. \nWork on the proposed Paeroa–Pokeno Line commenced in 1938 and whilst approximately 13km of earthworks were completed at each end, the proposal was halted due to World War 2 and was not resumed following the war and was abandoned. The line was to be the first part of the East Coast Main Trunk Railway. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689520","title":"The Thruster","body":"\nThe Thruster\n\nThe Thruster (French:L'arriviste) is a 1924 French silent film directed by André Hugon and starring Pierre Blanchar, Jeanne Helbling and Ginette Maddie.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689523","title":"Sir Samuel Scott, 2nd Baronet","body":"\nSir Samuel Scott, 2nd Baronet\n\nSir Samuel Scott, 2nd Baronet may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689529","title":"The Last Word (film 2009)","body":"\nThe Last Word (film 2009)\n\nThe Last Word (Persian: حرف آخر) is a 2009 Iranian film directed and produced by Hossein Shahabi.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689539","title":"The Little Thing","body":"\nThe Little Thing\n\nThe Little Thing (French:Le petit chose) is a 1923 French silent film directed by André Hugon and starring Max de Rieux, Alexiane and Jean Debucourt. It is based on the 1868 work \"Le Petit Chose\" by Alphonse Daudet.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689546","title":"Gajpanth","body":"\nGajpanth\n\nGajpanth (also spelled as \"Gajpantha\") is a Jain pilgrimage site (\"tirth-kshetra\") located near the Jain temple at Nashik. It is located in the Indian state of Maharashtra, which is located in Masrul village, found in the Nashik district, 16 kilometers from Nashik Road Railway station and 5 kilometers from Nashik City. It is situated on the top of a small hill which is 400 feet tall. Those travelling up the steep slope are aided by a staircase built in black stone, which leads directly to the temple. The hill has 450 steps, 3 caves (known as 'chamar leni), and Jain temples belonging to the Digambara sect. There is also a sculpture depicting samavasarana (divine preaching hall of tirthankara) on the hills of Gajpanth.\nHistory.\nGajpanth is said to be the salvation place of seven 'Balbhadra' (saints) of the Jain Sect, known as Vijay, Achal, Sudharma, Suprabh, Nandi, Nandimitra and Sudarshan. It is believed that the saints took eight crores of Yadav Kings with them from this location to salvation. It is believed that many Jain monks (or sadhus) attained moksha from this hill.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689556","title":"Uranus (novel)","body":"\nUranus (novel)\n\nUranus is a French novel written by Marcel Aymé and published in 1948. It is the third book in a trilogy which cover the \npre-war, the war and the post-war periods in France. The first is \"Travelingue\" (1948) set in the time of the \"Front Populaire\". The second is called \"Le Chemin des écoliers\" (1946) set during the occupation and the third book - Uranus – focuses on post war France and the ‘purge’ – social cleansing which sought to discipline collaborators. People were shaved, humiliated, beaten and often killed without a fair trial. \nThe true hero of the book, who is also the victim, is Léopold – owner of a coffee shop who discovers his passion for Jean Racine and for Andromaque thanks to lessons which, due to bombings of the school, must now take place in his establishment. He comes up with his own attempts at literature, such as \n\"Passez-moi\nAstyanax, on va filer en douce\" - \"Attendons pas d'avoir les poulets à nos trousses\".\nThe novel was adapted as a film, \"Uranus\" by Claude Berri in 1990. \"Le Chemin des écoliers\" was adapted as the film \"Way of Youth\" by Michel Boisrond in 1959.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689559","title":"Rogelio Frigerio","body":"\nRogelio Frigerio\n\nRogelio Frigerio (born January 7, 1970, Buenos Aires) is an Argentine economist and politician. He is the grandson of Rogelio Julio Frigerio, who worked with Arturo Frondizi. He is a supporter of developmentalism.\nBiography.\nRogelio Frigerio studied economy at the University of Buenos Aires, and worked as a teacher after graduating. He worked for the minister Roque Pérez in 1998. \nHe was elected to the legislature of the city of Buenos Aires in 2011. He became president of Banco Ciudad in 2013. \nMauricio Macri, elected president in 2015, nominated him to be his Minister of Interior Affairs, Public Works and Housing.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689562","title":"Jacques Landauze","body":"\nJacques Landauze\n\nJacques Landauze is a 1920 French silent drama film directed by André Hugon and starring Marguerite de Barbieux, Maud Richard and Séverin-Mars.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689566","title":"Udon Thani Rajabhat University","body":"\nUdon Thani Rajabhat University\n\nUdon Thani Rajabhat University (UDRU) is a university in Udon Thani, northeast Thailand. It confers associate, bachelors, masters, and doctoral degrees.\nCampuses.\nThe university has three campuses:\nRanking.\nIn July 2013, the university was ranked 65th best in Thailand by Webometrics.\nSee also.\nRajabhat University system\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689578","title":"Linford Rees","body":"\nLinford Rees\n\nWilliam Linford Rees (24 October 1914 – 29 July 2004) was a Welsh psychiatrist, who was professor of psychiatry at St Bartholomew's Hospital, London, and president of the Royal College of Psychiatrists from 1975 to 1978.\nA Welsh-speaker, Rees was born in Burry Port and studied at Llanelli Grammar School. He obtained his medical degree from the Welsh National School of Medicine in 1938. After postgraduate education at the Maudsley Hospital in London, he developed a specialism in psychosomatic medicine and worked closely with Hans Eysenck. He later worked at Whitchurch Hospital in Cardiff and again at the Maudsley, before taking up his academic post at St Bartholomew's in 1996. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689580","title":"Castle Face Records","body":"\nCastle Face Records\n\nCastle Face Records is an American independent record label, founded in 2006 by John Dwyer, Matt Jones and Brian Lee Hughes.\nThe label was initially formed to release \"Sucks Blood\", the sixth studio album by Dwyer's band, Thee Oh Sees.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689596","title":"The Fugitive (1920 film)","body":"\nThe Fugitive (1920 film)\n\n The Fugitive (French:La Fugitive) is a 1920 French silent film directed by André Hugon and starring Marie-Louise Derval, André Nox and Armand Numès.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689600","title":"Paeroa Railway Station","body":"\nPaeroa Railway Station\n\nThe Paeroa Railway Station is a former railway station in Paeroa; on the Thames Branch, and on the East Coast Main Trunk Railway to Waihi. \nThe station opened for passengers and goods on 20 December 1895; and was replaced by a new building on a new site on 30 August 1925. The station closed to passengers on 20 July 1959, and to goods on 28 June 1991 with the closing of the Thames Branch. \nWork on the proposed Paeroa–Pokeno Line commenced in the 1930s, but little was done and the proposal was abandoned. The line was to be the first part of the East Coast Main Trunk Railway. With the opening of the Kaimai Tunnel in 1979, the Paeroa to Katikati section of the East Coast Main Trunk was closed. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689619","title":"European Moroccans","body":"\nEuropean Moroccans\n\nEuropean Moroccans or White Moroccans are Moroccans whose ancestry lies within the continent of Europe, most notably France and Spain.\nPrior to independence, Morocco was home to half a million Europeans. During the French protectorate in Morocco, European Christians formed almost half the population of the city of Casablanca. After independence in 1956, the European population decreased substantially.\nIn the last years of the 19th century and at the beginning of the 20th century, 250,000 Spaniards lived in Morocco. Most Spaniards left Morocco after its independence in 1956 and their numbers were reduced to 13,000.\nToday European Moroccans are a small minority group in Morocco, accounting for only 1% of the country's population. In religion, most are Roman Catholic Christians.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689620","title":"Kenneth Rawnsley","body":"\nKenneth Rawnsley\n\nProfessor Kenneth Rawnsley, CBE, (1926-1992) of University Hospital of Wales was an English psychiatrist who served as the president of the Royal College of Psychiatrists from 1981 to 1984.\nRawnsley was brought up and educated in Burnley, Lancashire, later studying at Manchester University, where he obtained his medical qualification in 1948. He worked for a time in Canada, on the Stirling County Epidemiological Project, before joining the Medical Research Council Social Psychiatry Unit in London and Cardiff.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689626","title":"ZM Rotorua","body":"\nZM Rotorua\n\nZM Rotorua is a contemporary hit radio network in Hamilton, New Zealand. It is owned by New Zealand Media and Entertainment, and broadcasts via FM, and worldwide via the Internet. The network targets the 15–39 demographic and specialises in a chart-music playlist of pop, rock, hip hop and dance music.\nZM began broadcasting in Rotorua around 1998 on 98.3 MHz. This frequency had previously been used by a local rock station called Classic Rock 98.3FM.\nZM Rotorua began to broadcast network programmes from Auckland from 2002.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689635","title":"Child's Special Allowance","body":"\nChild's Special Allowance\n\nChild's Special Allowance was a payment under the United Kingdom system of Social Security.\nIt was instituted by Harold Macmillan in 1959 for the orphaned children of divorced parents.\nIt was a contributory, non-means-tested benefit, paid in addition to Child benefit to a divorced woman whose husband had died, whose ex-partner had been paying maintenance and who had not got a new partner. It was not taxable, but was taken into account for means-tested benefits.\nIt was abolished, as far as new claims were concerned, in April 1987. At that point it was paid at a rate of £8.05 per eligible child. Payments continued for existing beneficiaries under the scheme of transitional protection.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689645","title":"Athens Digital Arts Festival","body":"\nAthens Digital Arts Festival\n\nAthens Digital Arts Festival (ADAF) (Greek: Διεθνές Φεστιβάλ Ψηφιακών Τεχνών της Ελλάδας) is an international festival, that takes place every May in Athens, Greece.\nThe festival was established in 2005, under the title Athens Video Art Festival, as an initiation of the non-profit organization Multitrab Productions to create a platform for video art, installations and live performances. Since then, it has added interactive installations, web art, workshops, animation and digital images. In January 2015, the festival changed its name into Athens Digital Arts Festival.\nHistory.\nThe first edition of the International Festival of Digital Arts took place in April 2005 at the cultural space Thira Texnis, in Athens. The festival received 180 artworks submissions and hosted 137 of them.\nFrom 2007 to 2011, the main venue of the festival was the cultural space Technopolis of the Municipality of Athens, with 1,544 artworks hosted from 8,200 submitted. Through these years the festival presented artworks in the main categories of video art, installations and live performances, and in new ones such as web art, animation and digital image, introduced since 2009. It has also collaborated with other festivals, such as Transmediale (DE), Cologne OFF (DE), LPM (IT), videoholica (BG), IN-EDIT (ES), onedotzero (UK), and art:screen (SE).\nIn 2012 and 2013 the festival moved its activities to the center of Athens, with the titles “Visualize Athens” (2012) and “Living Athens” (2013). This initiative was supported by a number of volunteers, Greek Municipalities and international festivals and artists.\nIn 2014, celebrating its 10-year anniversary, it decided to return to the cultural space “Technopolis” of Municipality of Athens. 
Some of the highlights were the live performances \"Abandonded cities\" by Hauschka and \"Late Speculation\" by Nonotak, as well as the installation “80 prepared dc-motors, cotton balls, cardboard boxes” by Zimoun.\nIn 2015, the festival changed its name to Athens Digital Arts Festival, with eight official categories: installations, web art, video art, animation, performances, digital image, workshops and music and introduced for the first time a specific theme,“Public Space_s”., ADAF 2015 took place in the center of Athens with its main venue at Diplarios School and two main squares of Athens for parallel activities. The festival hosted the works of 150 artists from Greece and abroad, on the theme of public space both in the digital and urban environments. Some of the artists and international festivals participated in this year’s festival were Karl Heinz Heron (DE), Julian Oliver (NZ), Martin Bricelj Baraga (SI), Martin Reiche (DE), MADATAC (ES), IMPAKT (NL), VIDEONALE (DE), Cologne OFF (DE), videoholica (BG), and artvideoKOELN] (DE).\nADAF has maintained active partnerships with local and international artists and audience, institutions, art foundations, schools, universities, galleries and museums and a number of 46 collaborating festivals. Athens Digital Arts Festival is also partner of , an international network of artists and professionals organizing festivals and/or working in the fields of audiovisual live performances. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689657","title":"List of Kazakhstan football transfers winter 2016","body":"\nList of Kazakhstan football transfers winter 2016\n\nThis is a list of Kazakh football transfers in the winter transfer window 2016 by club. Only clubs of the 2016 Kazakhstan Premier League are included.\nKazakhstan Premier League 2016.\nAktobe.\nIn:\nOut:\nAkzhayik.\nIn:\nOut:\nAstana.\nIn:\nOut:\nAtyrau.\nIn:\nOut:\nIrtysh.\nIn:\nOut:\nKairat.\nIn:\nOut:\nOkzhetpes.\nIn:\nOut:\nOrdabasy.\nIn:\nOut:\nShakhter Karagandy.\nIn:\nOut:\nTaraz.\nIn:\nOut:\nTobol.\nIn:\nOut:\nZhetysu.\nIn:\nOut:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689664","title":"List of israeli top-flight league players with 100 or more goals","body":"\nList of israeli top-flight league players with 100 or more goals\n\nSince the israeli top-flight league's formation at the start of the 1931–32 season, 35 players have managed to accrue 100 or more goals in the league.\nNahum Stelmach holds the record for the fewest games taken to reach 100, doing so in 138 appearances.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689667","title":"72nd (Middlesex) Searchlight Regiment, Royal Artillery","body":"\n72nd (Middlesex) Searchlight Regiment, Royal Artillery\n\n72nd (Middlesex) Searchlight Regiment, Royal Artillery was an air defence unit of Britain's Territorial Army (TA) raised just before the outbreak of World War II, which served as part of Anti-Aircraft Command during and after the war.\nOrigin.\nAs the international situation deteriorated in the late 1930s, the threat of air raids on the UK led to the rapid expansion in numbers of anti-aircraft (AA) units manned by members of the part-time TA. Formed in November 1938, 72nd (Middlesex) was the third of a new group of three TA searchlight regiment raised by the Royal Artillery (previous TA S/L units had all been part of the Royal Engineers and/or converted from infantry battalions). It consisted of HQ and Nos 465–467 Companies (later Batteries) based at a newly built drill hall at Vicarage Road, Heston. Shortly afterwards the regiment moved to Twickenham. It was equipped with the new '90 cm Projector Anti Aircraft', a smaller and lighter piece of equipment than previous searchlights, with a more powerful high current density arc lamp with automatic carbon feed.\nWorld War II.\nAnti-Aircraft Command mobilised in August 1939, ahead of the declaration of war on 3 September, and the regiment took its place in 47th AA Brigade, part of 5th AA Division tasked with defending Southampton.\nSouthampton was a regular target for raids by the German \"Luftwaffe\" during the Battle of Britain in the summer of 1940, but by November 1940 the regiment had transferred to 40 AA Bde in 2nd AA Division in the Midlands. 
It had the responsibility for covering RAF airfields in the East Midlands and continued in that role throughout the Blitz of 1940–41.\nAs the threat from the Luftwaffe waned in 1944, the War Office warned in June that AA Command would have to release manpower to provide reinforcements to 21st Army Group fighting in . The run-down began in September 1944, and 72nd S/L Rgt was placed in 'suspended animation' in that month, with its personnel being posted away.\nPostwar.\nWhen the TA was reconstituted in 1947, 72nd S/L Rgt was reformed at Twickenham as 607 Searchlight Regiment, RA (Middlesex), forming part of 67 AA Bde (the former 41 AA Bde based at Shepherds Bush). In 1949 the regiment's role was altered and it was redesignated 607th (Mixed) Light Anti-Aircraft/Searchlight Regiment, RA (Middlesex) ('Mixed' denoting that members of the Women's Royal Army Corps were integrated into the unit).\nAA Command was disbanded on 10 March 1955, and 607 LAA/SL Regiment was disbanded at the same time.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689669","title":"Government Superior Science College Peshawar","body":"\nGovernment Superior Science College Peshawar\n\nGovernment Superior Science College (GSSC) Peshawar Pakistan, is one of the three public sector colleges for male students operating within Peshawar metropolitan, along with Government College (GC) Peshawar; and Government College Hayatabad, Peshawar. GSSC, established in 1962, is providing educational services along with training in sports and other social skills. The college has produced a long list of prominent figures in different fields of life,that serving humanity around the globe. Being one of the prominent institution established after independence, the college attracts the highest number of students each year, and very few of applied students are able to get admission.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689691","title":"New Zealand NBL Coach of the Year Award","body":"\nNew Zealand NBL Coach of the Year Award\n\nThe National Basketball League Coach of the Year is an annual National Basketball League (NBL) award given since the 1989 New Zealand NBL season to the best head coach of the regular season.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689693","title":"2016 World Touring Car Championship season","body":"\n2016 World Touring Car Championship season\n\nThe 2016 World Touring Car Championship season is the thirteenth season of the FIA World Touring Car Championship, and the twelfth since the series was revived in 2005.\nRegulation changes.\nThe sporting regulations were approved by the FIA, at the December 2015 meeting of the World Motor Sport Council.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689707","title":"Breakthrough Energy Coalition","body":"\nBreakthrough Energy Coalition\n\nBreakthrough Energy Coalition is a global group of 28 high net worth investors from 10 countries committed to funding clean energy companies emerging from the initiatives of Mission Innovation, which was also announced at the 2015 United Nations Climate Change Conference.\nThe group aims to bolster governmental assistance in renewable energy such as solar energy and wind power to $20 billion.\nMembers.\nThe group is spearheaded by Bill Gates, who previously announced a personal $2 billion investment, and includes:\nCriticism.\nThere has been criticism that the coalition was announced too early, before crucial details has been confirmed. At launch, a Gates Foundation spokesman confirmed that investment professionals had yet to be appointed, named investors - other than Gates - hadn't publicly stated their level of investment and a financial structure hadn't been confirmed.\nThe scale, at US$20bn of public cash over five years and the initial US$2bn of private cash, has also been criticised as inadequate: the World Bank suggests that US$100bn would be needed annually.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689709","title":"Paropsis atomaria","body":"\nParopsis atomaria\n\nParopsis atomaria is a common leaf beetle in the subfamily Chrysomelinae. Atomaria translates to mean speckled or freckled. \nThey occur along eastern Australia from Adelaide to Brisbane. \nP. atomaria produce two lifecycles during the summer across most of its range A female can produce 600 eggs and deposits them at the tip of a leaf or twig. This species is one of a few of the paropsines that may become a pest of plantation trees. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689714","title":"The Gathering (EP)","body":"\nThe Gathering (EP)\n\nThe Gathering is an EP by American hip hop group Living Legends. It was released on Legendary Music on April 8, 2008.\nReception.\nAndrea Woo of \"Exclaim!\" said: \"While some will invariably be disappointed by the short playtime, the seven tracks of \"The Gathering\" are strung together with a fairly stable energy to create a solid offering devoid of filler.\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689724","title":"Byzantine tower of Biccari","body":"\nByzantine tower of Biccari\n\nByzantine tower of Biccari is a builder locate in city center of Biccari, city of Province of Foggia in Italy.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689740","title":"Walk like a Panther","body":"\nWalk like a Panther\n\n\"Walk like a Panther\" is a song by the All Seeing I with vocals from Tony Christie. It charted at number 10 on the UK Singles Chart.\nBackground.\n\"Walk like a Panther\" was performed by All Seeing I with main vocals from Tony Christie and background vocals from Steve Edwards, and was written by Richard Barratt, Jason Buckle, Jarvis Cocker and Dean Honer, and was their third single from their album \"Pickled Eggs and Sherbert.\" It was written specifically for Christie to such an extent that it even mentions one his past hits – I Did What I Did For Maria – and describes the hometown of the band members of the All Seeing I, Cocker and Christie: Sheffield. Cocker personally contacted Christie, who was living in Spain at the time as this was where he was most successful, asking if he would feature on the record.\nMusic video.\nA music video was produced for the song. It features Christie singing his parts and culminates in others walking with their arms held high in time with the music, mimicking panthers.\nChart performance.\nWalk like a Panther peaked im January 1999 at number 10 on the UK Singles Chart, becoming Christie's first hit in that country for twenty five years. It would be the band's only top ten single; The Beat Goes On and 1st Man in Space would peak at numbers 11 and 28 respectively.\nCritical reception.\n\"NME\" said of the song \"People just don't write songs like this any more!\", said the song had \"the vocal gravitas of a man, a common man, defiant in his invective against his lot, his shitty neighbourhood\" and ended by describing it as \"brave, impassioned and chuffin' catchy.\"\nUsage in popular culture.\nThe band performed the song on \"Top of the Pops,\" and the song was featured on its corresponding album \"Top of the Pops 1999, Vol. 1.\" It was also featured on the compilation albums \"The Chillout Album, Vol. 
2,\" \"Soundsystem Four\" and \"Now 42.\" Three years later, The Pretenders would cover the song on their album \"Loose Screw.\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689766","title":"1958 Targa Florio","body":"\n1958 Targa Florio\n\nThe 42° Targa Florio took place on 11 May, on the Circuito Piccolo delle Madonie, (Sicily, Italy). It was the third round of the F.I.A. World Sports Car Championship, which was running to new regulations introduced at the beginning of the season. The most influential of these regulations changes would be the 3.0 litre engine size limit. The event returned to the championship for the first time since 1955, following the demise of the Mille Miglia and the ban on road racing on mainland Italy. But such outcry did not deter Vincenzo Florio from holding his event on the traditional 45 mile mountainous circuit.\nReport.\nEntry.\nA massive total of 65 racing cars were registered for this event, of which 53 arrived for practice. Only these, only 38 started the long distance race on the public roads of Sicily. This, the 42nd edition of the event, saw a change on the nature of the race. Two drivers would be permitted now and the limit set so no driver would drive more than seven laps out of the total race distance of 14. So, it ensured no single driver would be able to complete the whole race.\nThe first two events of the season, the 1000 km Buenos Aires and 12 Hours of Sebring ended with victory for Phil Hill and Peter Collins, for Scuderia Ferrari. As Hill and Collins also won the last race of the previous season, the Venezuelan Grand Prix they’ve now won three races in a row for the Scuderia. With these new rules, and Maserati on the brink of financial crisis, Scuderia Ferrari would head the Italian challenge. Ferrari had four works 250 TRs in Sicily, Hill/Collins, Mike Hawthorn/Wolfgang von Trips, Luigi Musso/Olivier Gendebien and Gino Munaron/Wolfgang Seidel. 
Opposition would no longer come from Maserati… but from Porsche and Aston Martin.\nDavid Brown sent just one Aston Martin DBR1 over from England for Stirling Moss/Tony Brooks, while Porsche arrived with three different cars, a 356A Carrera, a 550 RS and a 718 RSK, for their squad of drivers led by Jean Behra and Giorgio Scarlatti. They were joined by a fleet of privateer drivers in their Alfa Romeos, Oscas and other mainline sportscars.\nQualifying.\nPrior to the race, there was no formal practice held, but Sergio Der Stephanian was killed in a pre-race accident, following a collision with a sand-laden lorry. He died shortly after in hospital.\nRace.\nWith each lap 45 miles in length, the race covered a total of 14 laps, or 630 miles, the Targa Florio is unlike any other sports car race. Littered with switchback turns, blind corners and a straight nearly four miles longer than Circuit de la Sarthe’s Mulsanne, the Targa was a fearsome thing to behold.\nDay of the race would be sunny and warm, with the first of the cars leaving the small village of Cerda, one-by-one, at 40 seconds intervals. It was clear right at the start that something was amiss for most of the competitors, as more than a few would be off the pace, while other would be off the road, in verges trying to repair their cars and get back into the race. Jean Behra would spin his Porsche 718 RSK. Moss would damage a wheel when he went off the road. Meanwhile, von Trips damaged his Ferrari heavily and returned to the pits dragging bit of his car along the ground. It seemed that everyone was struggling over the mountain roads, except one, Musso.\nMusso was setting an incredibly pace. He started last of the big works entrants, but at the end of the first lap, he would be first. Being in the lead, he set about performing an error-free drive. 
Moss would be on the hunt in his Aston, ever-impressive sliding around the corners, kicking up gravel everywhere and carrying on without any trouble whatsoever, following that earlier incident. He would break the lap record, lapping more than a minute faster than Musso. But the Italian had already done all of his head work. He led and held steady before handing the car over to Gendebien.\nWith Gendebien now the car, Moss would take his Aston even faster, but it came at a price. After five laps, the gearbox gave up and Moss was out of the race, before Brooks had a chance to race. Despite the retirement of the sole Aston Martin, the circuit maintained the pressure on the factory efforts. Hill would end up in a ditch, losing valuable time trying to get out and back on his way. As for the Belgian, he was driving smartly, keeping the car on the road, and in the lead. He was just a few laps before returning the car back to Musso. This was the only Ferrari not under heavy pressure from Behra. The nimble little RSK was providing its self on the winding roads, and joining the battle for a spot in the top three.\nMusso held a commanding lead, despite the advances of Behra. But Musso was not immune to trouble. Only three laps from the end, there was trouble. He appeared to be off the pace, lapping four minutes slower than previously. He was happy to make it back to the pits, as the brake fluid had leaked out of its reservoir. He had no brakes. It was reported that he completed the descent out of the mountains by staying in low gear. In any other race, this would have spelled the end, however, Musso and Gendebien had controlled the race right from the start. Such was their lead, the Ferrari mechanics repaired the car, Gendebien got back in the car for the remaining laps, still with a three-minute lead.\nNow the leaders were out of trouble, their team-mates von Trips and Hawthorn were not. They were in second place, but with Behra back in the Porsche and absolutely flying. 
Following a pitshop, the margin between the Ferrari and Porsche would be practically nothing. There was no stopping Behra, and he continued to up his pace and Hawthorn could not response. Starting the 14th and last lap, Behra’s pace had meant he was now ahead.\nOut in front, Gendebien brought the 250 TR home, to record a brilliant victory. Though Moss had set a new lap record in his Aston, the race had been dominated from the very beginning by Musso. Car number 106, took an impressive victory, winning in a time 10hr 37:58.1, averaging a speed of 59.251 mph. Second place went to the Porsche of Behra and Giorgio Scarlatti, albeit over 5½ minutes adrift. The podium was complete by second Scuderia Ferrari of von Trips and Hawthorn, who were 54 secs behind in third.\nOfficial Classification.\n\"Class Winners are in Bold text.\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689769","title":"Three Sisters (sternwheeler)","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48689770","title":"List of mosques in Kosovo","body":"\nList of mosques in Kosovo\n\nBelow is a partial list of mosques in Kosovo. The list includes mosques built during the Ottoman Empire period, as well as those built in the modern era.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689782","title":"Bachra","body":"\nBachra\n\nBachra is a census town in Tandwa Block of Chatra district in the state of Jharkhand, India.\nGeography.\nBachra is a colliery township located at .\nDemographics.\nAs per 2011 Census of India Bachra had a population of 12,969, of which 7,169 were males and 5,800 were females. Scheduled Castes numbered 1,519 and Scheduled Tribes numbered 826.\nLiteracy.\nAs per 2011 census the total number of literates in Bachra was 9,718 out of which 5,887 were males and 3,831 were females.\nEconomy.\nThe North Karanpura Coalfield is spread across parts of Ranchi, Hazaribagh, Chatra and Latehar districts of Jharkhand covering an area of 1,230 km2. This coalfield in the upper reaches of the Damodar Valley, has reserves of around 14 billion tonnes of coal, very little of which has been exploited. Karkatta, KD Hesalong, Manki, Churi, Bachara UG, Bachara OC, and Dakara are long established collieries south of the Damodar. North of the Damodar lies comparatively new major mines such as Piparwar Mine and Ashoka Project. 23 mines are planned in the northern sector (near Bachra). Those in an advanced stage of planning are: Dhadu, Purnadih, Magadh, and Amrapali.This happens to be the largest mining sector of Central Coalfields Limited.\nProjects in the Piparwar area of Central Coalfields Limited (as in 2015) were: Piparwar open cast, Ray-Bachra underground, Ashoka open cast, Piparwar coal handling plant and Piparwar coal preparation plant.\nTransportation.\nBachra is served by Ray railway station, about 25 km from Barkakana railway station on the Sonnagar-Barkakana loop line.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689786","title":"Hannah Wants","body":"\nHannah Wants\n\nHannah Wants (born Hannah Alicia Smith in 1986) is a British DJ and producer from Birmingham.\nHer track \"Rhymes\", a collaboration with Chris Lorenzo, reached #13 in the UK in 2015.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689801","title":"Madeleine Dior","body":"\nMadeleine Dior\n\nMarie Madeleine Juliette Martin, who was born in Angers, France, in 1879 and died in Granville (French department of Manche) in 1931, was the wife of the industrialist Maurice Dior. She was also the mother of the grand couturier Christian Dior and the French Resistance member Catherine Dior.\nBiography.\nMadeleine Martin was the daughter of a lawyer from Angers and Juliette Surosne, originally from the department of Calvados, France. Monsieur Martin died young and Madeleine was brought up by her mother.\nIn 1898, at the age of nineteen, she married Maurice Dior who was six years her senior. The couple moved to the center of Granville in the department of Manche, where Maurice Dior had grown up. They had five children: Raymond in 1899, Christian in 1905, Jacqueline in 1909, Bernard in 1910, and Ginette, known as Catherine, in 1917.\nIn 1905, to satisfy Madeleine, who did not like the house in the center of town, the Dior family purchased a property that was still in Granville but on the edge of a cliff, facing the sea. This windswept villa was called \"Les Rhumbs\", named after the thirty-two divisions of the wind rose. It had a large piece of adjoining land which Madeleine Dior transformed into a southern-style garden, overcoming the hostility of the winds blowing in from the sea to grow delicate plants.\nIn 1910, taking advantage of the revenue from Maurice Dior's company which was enjoying great success, the family moved to Rue Richard Wagner in Paris, since renamed Rue Albéric Magnard. Madeleine Dior excelled as the lady of the house and a woman of taste, decorating the apartment in the Louis XVI-Passy style fashionable at the time. 
She surpassed herself when holding dinners served by butlers in white gloves, and her bouquets were much admired by her guests.\nIn 1914, the family decided to take refuge from the war and returned to live in the Granville villa, which had been their holiday home since 1910. Like all society ladies in the region, Madeleine Dior participated in the war effort. In his autobiography, Christian Dior remembers this period when women were occupied \"with making shredded cloth bandages, hospitals, letters from the front and recreation sessions for the injured.\" The family returned to live in Paris in 1918, not far from the apartment where they had lived before the war.\nIn 1930, Bernard, the second youngest of the family, was affected by a serious nervous disorder. Madeleine Dior, doubtless worn down by what was happening to her son, died the following year. Jacques Bonjean, a gallery owner and friend of Christian Dior, described her as an \"...elegant and slender woman, sometimes distant, always graceful.\"\nThe \"Les Rhumbs\" garden in Granville.\nThroughout her life, Madeleine Dior lived out her passion for flowers through the transformation of the windswept land surrounding her villa in Granville into a beautiful English-style garden. First she had a veranda added to the façade of the house, which sheltered a winter garden, and planted a small wood of umbrella pines to protect her plants from the wind. This was a bold choice of tree for the Normandy coast. She also had windbreak walls put up to protect the property, and finally she had a greenhouse built where the plants were overwintered. On the advice of Christian Dior, the greenhouse was replaced in 1925 by a pergola and pool; a rose garden was planted nearby a short while later. The creation of the garden became a two-person job, which created a bond between Madeleine Dior and her son: the latter organized it by positioning the features, while she took care of the planting. 
The result was a complex planting scheme that sheltered the most fragile flowers from the wind: \"\"Madeleine Dior's planting formed curtains of shielding greenery, so that the second was more precious and the third consisted of plants that it would have been impossible to grow here: geraniums, roses, jasmine... All these protective screens created layers, structures and motif effects,\" explains the garden's current landscape gardener.\nJames de Coquet, journalist for \"Le Figaro\", remembered being amazed by his visit to \"Les Rhumbs\" in 1929: \"I complimented Madame Dior on her beautiful garden. I told her she must have an excellent gardener.\"\"\nIn 1997, the villa, which had been purchased by the town of Granville in 1932, became the Musée Christian Dior. The garden, Madeleine Dior's life work, is one of the few \"artistic gardens\" of the early 20th century to have been preserved. For student landscape gardners, it is also an exceptional subject of study.\nInfluence on the work of Christian Dior.\nMadeleine Dior was particularly close to her son Christian, the future couturier: in the eyes of her other children, he was her \"favorite\" and he followed her everywhere, from her Granville garden to Orêve, her favorite Parisian florist, and the dressmaker Rosine Perrault. Madeleine Dior was a close follower of fashion, as demonstrated by a Roaring Twenties dress that she designed, which is exhibited in the Granville museum.\nThe couturier remembered his mother when, years after her death, on the eve of his first runway show, he was looking at the façade of the House that bore his name on Avenue Montaigne and exclaimed: \"If Mother had lived, I would never have dared.\" In the same way that we sense the presence of Charles Baudelaire's mother, Caroline, in his work and the influence of Jeanne, Marcel Proust's mother, in his, Madame Dior had a profound effect on her son's entire career. 
Regarding the Granville house, Christian Dior wrote: \"\"I have the tenderest, most magical memories of it. Not only that; my life, my style, owe nearly everything to its location and architecture,\" and \"...(it) was pebbledashed in a very soft pink, blended with gray gravel, and these two colors have remained my favorite shades in couture.\"\" But it was above all his mother's garden that made a deep impression on the couturier. Having spent his childhood learning the names of flowers and their descriptions from horticulture catalogs, Christian Dior drew inspiration from them to create the silhouettes that would lead to his success in 1947 with the \"Corolle\" line. The decor of the Diors' apartment in La Muette, Paris, was also imprinted on the couturier's imagination: reference is made to it in the Louis XVI style which inspired the interiors of the Dior boutiques. Finally, it was Madeleine Dior's look that the couturier remembered when he invented the famous New Look with its nipped in waist, pronounced hips and emphasized bust recalling the feminine silhouettes of the Belle Époque. Long after the couturier's death, the House of Dior continues to pay tribute to this muse, as in the Fall-Winter 2005 runway show, where a Belle Époque-inspired dress was named \"Madeleine\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689808","title":"Thames Railway Station","body":"\nThames Railway Station\n\nThe Thames Railway Station is a former railway station in Thames, New Zealand on the former Thames Branch from Morrinsville to Thames. \nThe station opened on 19 December 1898 with the opening of the branch line. Passenger service ceased from 28 March 1951. There were also station buildings at Thames North and Thames South. \nThe branch was closed (apart from a section) on 28 June 1991, and goods service ceased. However the station building remained as it was listed by NZHPT Category II in 1982. It is a standard Vintage station, with gables, finials and scalloped bargeboards.\nWork on the proposed Paeroa–Pokeno Line commenced in the 1930s, but little was done and the proposal was abandoned. The line was to be the first part of the East Coast Main Trunk Railway. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689859","title":"Mission Innovation","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48689866","title":"The Three Masks","body":"\nThe Three Masks\n\nThe Three Masks (French:Les trois masques) is a 1929 French silent film directed by André Hugon and starring Renée Héribel, Jean Toulout and François Rozet.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689874","title":"Georgi Yungvald-Khilkevich","body":"\nGeorgi Yungvald-Khilkevich\n\nGeorgi Yungvald-Khilkevich (22 October 1934 – 11 November 2015) was a Soviet and Russian film director, screenwriter, producer, actor, theatre director and set designer. Most famous for his musicals and Alexandre Dumas adaptations. He directed 22 motion pictures and TV movies between 1966 and 2009. Honored Artist of the Russian SFSR (1990) and Ukraine (1995).\nBiography.\nGeorgi Yungvald-Khilkevich was born into a theatrical family of noble heritage. His mother Nina Ivanovna Buiko was a ballet dancer. His maternal grandfather Ivan Petrovich Buiko came from an old Russian family and served as a colonel in the Imperial Russian Army and a commandant in Warsaw. He joined Bolsheviks in 1917. Georgi's father Emil Iosifovich Yungvald-Khilkevich was an acclaimed theater director and one of the founders of the Uzbek National Theater of Opera and Ballet (later Navoi Theater). His paternal grandfather came from Polish szlachta and owned railroads in Western Ukraine, while his wife Elena Cavalieri was an Italian; she was said to be the sister of the famous opera singer Lina Cavalieri who was very popular in the Russian Empire and regularly visited Kiev with concerts.\nGeorgi Yungvald-Khilkevich graduated from the in 1963. He worked as a set designer at Tashkent theaters and film studios. In 1966 he finished directing and screenwriting Mosfilm courses and started working at the Odessa Film Studio, where he later directed most of his movies.\nHis first major breakthrough happened in 1969 with the musical film \"Dangerous Tour\" loosely based on the memoirs of Alexandra Kollontai. The screenplay was written with Vladimir Vysotsky in mind, who eventually played the main part, wrote all the songs and did some uncredited contribution to the final draft. His partners were Nikolai Grinko, Yefim Kopelyan, Ivan Pereverzev and Georgi Yumatov. 
The film turned to be one of the leaders of the Soviet box office in 1970 (9th place).\nIn 1978 Khilkevich turned to Alexandre Dumas who happened to be one of his favourite writers since childhood. His 3-part made-for-TV adventure musical \"D'Artagnan and Three Musketeers\" turned to be an ultimate success, with many songs and catchphrases becoming part of the popular culture. It was followed by three sequels in 1992, 1993 and 2009. In 1988 he made another Dumas adaptation – The Prisoner of Château d'If based on The Count of Monte Cristo novel. The screenplay was co-written by Mark Zakharov, while all the songs were written and performed by Alexander Gradsky.\nAmong his other notable works was another musical Ah, Vaudeville, Vaudeville... and a comedy The Art of Living in Odessa based on The Odessa Tales by Isaac Babel. He rarely turned to cinema during the post-Soviet years. In 1997 he joined at the National Cats Theater in Moscow as a stage director and scriptwriter. He also worked as a set designer in various theaters. His last film in the Musketeer series directed in 2007 and screened in 2009 was met with harsh critique and became a box office bomb.\nYungvald-Khilkevich died from the heart failure at the age of 81. He was buried at the Troyekurovskoye Cemetery in Moscow. He was survived by his third wife, an actress Nadira Mirzaeva (born 1969), and two daughters — Natalia (born 1960) and Nina (born 1997).\nBibliography.\nGeorgi Yungvald-Khilkevich, Natalia Yungvald-Khilkevich. \"За кадром (\"eng. \"Behind the Screen)\". Moscow: , 2000 (Autobiography). ISBN 5-227-00627-X\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689889","title":"1990 Women's European Cricket Cup","body":"\n1990 Women's European Cricket Cup\n\nThe 1990 Women's European Cricket Cup was an international cricket tournament held in England from 18 to 22 July 1990. It was the second edition of the Women's European Championship, and all matches at the tournament held One Day International (ODI) status.\nFour teams participated, with the hosts, England, joined by the three other European members of the International Women's Cricket Council (IWCC) – Denmark, Ireland, and the Netherlands. A round-robin format was used, with the top teams proceeding to the final. England was undefeated in the round-robin stage and beat Ireland by 65 runs in the final, winning the championship for a second consecutive time.\n England's Wendy Watson led the tournament in runs for a second year running, while Ireland's Susan Bray was the leading wicket-taker. The tournament was hosted by East Midlands Women's Cricket Association, a member of England's Women's Cricket Association, and matches were played at venues in three English counties (Leicestershire, Northamptonshire, and Nottinghamshire).\nRound-robin.\nPoints table.\nSource: \nStatistics.\nMost runs.\nThe top five run scorers (total runs) are included in this table.\nSource: \nMost wickets.\nThe top five wicket takers are listed in this table, listed by wickets taken and then by bowling average.\nSource: \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689898","title":"Mount Allen (Victoria Land)","body":"\nMount Allen (Victoria Land)\n\nMount Allen () is a peak, 1,400 m, standing between Clark Glacier and the head of Greenwood Valley in Victoria Land. Charted by the Victoria University of Wellington Antarctic Expedition (VUWAE), 1959-60, and named for A.D. Allen, one of the party's geologists.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689907","title":"Shanmughanathar Temple, Kunnakudi","body":"\nShanmughanathar Temple, Kunnakudi\n\nKunnakudi Shanmughanathar temple (also called Kunnakudi Temple or Kunnakudi Murugan Temple) in Kundrakudi, a village in the outskirts of Karaikudi in Sivaganga district in the South Indian state of Tamil Nadu, is dedicated to the Hindu god Murugan. Constructed in the Dravidian style of architecture, the temple is located in the Tirupattur - Karaikudi Road, around from Karaikudi. There are three caves located on the western side of the lower rock, that has rock-cut shrines from the Pandyan Empire from the 8th century. The caves have the earliest sculptural representation of Dvarapalas, the guardian deities, for any South Indian temple.\nThe temple has a five-tiered gateway tower, the gopuram in the hill, leading to a pillared hall and the sanctum. The temple is open from 6:00 am - 11:00 am and 4 - 8:00 pm. Four daily rituals and many yearly festivals are held at the temple, of which Panguni Uthiram festival celebrated during the Tamil month of \"Panguni\" (March - April) and Thaipoosam during \"Thai\" (January - February) being the most prominent. The temple is maintained and administered by the Kunnakudi Thiruvannamalai Mutt Adikam, while the rock-cut caves are maintained as a protected monument by the Archaeological Survey of India.\nLegend.\nThe place was originally called Kundrakudi as it was located in a hill (\"Kundram\" means hill in Tamil), which with the period of time became Kunnakudi. It is also called by other names like Mayuragiri, Mayilmalai, Arasavaram and Krishanagaram as the hill resembles the shape of a peacock. As per Hindu legend, sage Agasthya is believed to have worshipped Murugan at this place. As per another legend, Sooran, the demon king infuriated peacock, the sacred vehicle of Murugan. 
He told the bird that Garuda, the sacred vehicle of Vishnu and Swan, the sacred vehicle of Saraswati could travel faster than it. The peacock swallowed Garuda and the swan in anger. Vishnu prayed to Muruga to retrieve his vehicle back from the peacock, who readily acceded to the request. The peacock, realising its mistake, prayed Muruga by doing penance at this place.\nArchitecture.\nThe temple is located in Kundrakudi, in the outskirts of Karaikudi in Sivaganga district in Tamil Nadu on the road from Tirupattur to Karaikudi. The hill has a height of and occupies an area of . The temple has a five tiered rajagopuram, the gateway tower raising to a height of , which pierces the granite wall surrounding the temple. The sanctum faces East and the image of the presiding deity Murugan is sported with the images of his consort Valli and Deivasana, each of whom are seen sitting on a peacock. There are shrines of other deities around the sanctum in the precinct.. \nThere are three caves in the western side of the lower hill, with rock-cut images dedicated to Shiva in each of them. The first two caves have intricate rock-cut sculptures and Dvarapalas on either side of the sanctum, while the third one is plain. There are various sculpted images of Vishnu, Durga, Lingodbhava, Harihara. The image of Dvarapalas in the caves, on either sides of the sanctum, with each leaning in the direction facing the sanctum, are found to be the earliest representation of the images. These are not found in Pallava architecture, which precedes the Pandyas. The caves are considered one of the major specimens of rock-cut architecture of the Pandyas, counted along with Vettuvan Koil, Thirumalaipuram and Thiruparankundram.\nCulture.\nThe temple priests perform the \"pooja\" (rituals) during festivals and on a daily basis. 
The temple rituals are performed four times a day: \"Kalasandhi\" at 6:00 a.m., \"Uchikala poojai\" at 11:00 a.m., \"Sayarakshai\" at 6:00 p.m., and \"Arthajama Pooja\" at 7:45 p.m. Each ritual has three steps: \"alangaram\" (decoration), \"neivethanam\" (food offering) and \"deepa aradanai\" (waving of lamps) for the presiding deities. There are weekly, monthly and fortnightly rituals performed in the temple. The temple is open from 6:30 am - 12:00 pm and 5 - 8:30 pm on all days except during festive occasions when it has extended timings. The major festivals of the temple include the Panguni Uthiram festival celebrated during the Tamil month of \"Panguni\" (March - April) and Thaipoosam during \"Thai\" (January - February). The other festivals include Kantha Sashti, Vaikasi Visagam, Aavani Moolam and Paal Perukku Vizha. Like other Murugan temples during the festivals, hundreds of devotees carry pots of milk and Kavadi around the streets of the temple. Devotees offer pepper and salt to Saravana Poigai, the temple tank, as a mark of worship. The temple is revered in the verses of \"Thirupugazh\" the 15th century anthology on Murugan by Arunagirinathar.\nIn modern times, the Sivaganga district administration has identified the temple as one of the prominent tourist attractions in the district. The temple is administered by Kunnakudi Thiruvannamalai Mutt Adikam, which was established during the 16th century. In modern times, the caves are maintained and administered by Archaeological Survey of India as a protected monument.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689927","title":"The Princess and the Clown","body":"\nThe Princess and the Clown\n\nThe Princess and the Clown (French:La princesse aux clowns) is a 1924 French silent film directed by André Hugon and starring Huguette Duflos, Charles de Rochefort and Magda Roche.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689932","title":"Patricia Farrar","body":"\nPatricia Farrar\n\nPatricia Jean \"Pat\" Farrar (; August 13, 1931 – October 31, 2015) was an American educator. She served as the First Lady of South Dakota from 1969 to 1971 during the administration of her husband, former Governor Frank Farrar. Additionally, she also served on the board of advisers of the John F. Kennedy Center for the Performing Arts. Patricia Farrar won a gold medal at the National Senior Games, also known as the Senior Olympics, in 1989.\nEarly life and education.\nFarrar was born Patricia Henley on August 13, 1931, in Britton, South Dakota, to Percy Denis and Margaret (née Schneider) Henley. She was raised in nearby Claremont, South Dakota, where she graduated as valedictorian from Claremont High School in 1949.\nShe graduated cum laude from the University of South Dakota in 1953, where she studied English and art. Henley placed first runner up in the Miss South Dakota pageant while in college. She began her career as a teacher at Summit High School in Summit, South Dakota. \nCareer.\nFarrar served as the First Lady of South Dakota from 1969 to 1971. She was also a member of the South Dakota Commission on the Status of Women, as well as the South Dakota State University's advisory board for apparel and textiles. Nationally, Farrar held a seat on the board of advisers for the John F. Kennedy Center for the Performing Arts in Washington D.C. She wrote and performed a chautauqua based on the life of South Dakota's first First Lady, Margaret Mellette. \nIn 1989, Farrar won a gold medal in race walking at the second National Senior Games in St. Louis, Missouri.\nDeath.\nFarrar died from Lewy Body Dementia and Parkinson’s disease at Avera St. Luke's Hospital in Aberdeen, South Dakota, on October 31, 2015, at the age of 84. She was survived by her husband, former Governor Frank Farrar, and their five children. 
Governor Dennis Daugaard ordered flags to be flown at half-staff on November 7, 2015, in Farrar's honor.\nPersonal life.\nHenley married her husband, Frank Farrar, whom she had met at the University of South Dakota, on June 5, 1953, at Fort Benning, Georgia, where Farrar was stationed in the U.S. Army at the time. The couple had five children, Jeanne, Sally, Robert, Mary, and Anne.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689943","title":"T. Sreenidhi","body":"\nT. Sreenidhi\n\nT. Sreenidhi (Srinidhi) (born 26 January 1990) is an eminent Carnatic musician and playback singer. Sreenidhi has performed in major sabhas in India and presented concerts in many destinations around the world. She has received multiple awards and honours. Sreenidhi trained under the legendary vocal stalwart Sangita Kalanidhi Dr. Nedunuri Krishnamurthy.\nEarly Life and Family.\nSreenidhi was born in Anantapur. Her father, T. Subramanyacharyulu, is a Carnatic vocalist and violinist, and her mother, T. Sarada, is a Carnatic musician. She received her initial training from her mother, who used to sing Thyagaraja krithis, ragaalapanams and swarams in place of lullabies to the newborn Sreenidhi. Her father, who is a vocal-violin exponent, nurtured her with a good authentic musical foundation. Later she trained under the legendary vocal stalwart Sangita Kalanidhi Dr. Nedunuri Krishnamurthy. She married Venkatesh on 26 January 2015 in Hyderabad.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689954","title":"MeetYourMakers","body":"\nMeetYourMakers\n\nMeetYourMakers (MYM or mYm) is an esports organization based in Germany. It competes in \"League of Legends\", \"Dota 2\", \"StarCraft II\", and \"\". MYM was founded in 2001.\nMYM dropped their \"WarCraft III\" team in 2009.\nIn July 2015 MeetYourMakers was involved in an incident where the team manager threatened to take Marcin \"Kori\" Wolski's house away as a result of his leaving the team. After the dissolution of their previous LoL team they acquired LCS team Supa Hot Crew.\nIn the history of MYM, players and teams from MYM were featured with awards like “eSports player of the year”, “eSports team of the year” and more. MYM won more than 400 titles at important major events around the world, including the World Cyber Games (WCG) and the Electronic Sports World Cup (ESWC).\nHistory.\n2000: In 2000, the Dane Mark Peter \"Mercy\" Fries founded the organization Meet Your Makers, the first time publicly made its appearance in 2001. 2002, the decision was made to rebuild Meet Your Makers to a professional organization.\n2006: the organization Meet Your Makers was bought by investors. These investors founded together with the former owners of the company \"Regroup eSports A / S\", which was' renamed on 16 July 2008 in \"ESNation A / S\" beginning of August 2006 joined MYM unification G7 Teams at.\nThe Warcraft III Department has always been considered the flagship of Meet Your Makers. MYM players have reached many high rankings in various international leagues and tournaments, such as the ESL WC3L Series, the NGL ONE and World Cyber Games. Jang \"Moon\" Jae-ho Since February 2006, the Korean professional players stood at Meet Your Makers under contract. 
He was considered the best paid Warcraft III player in the world, his monthly salary was estimated at around 8,000 euros during his time in MYM article about Moons content the beginning of 2008 also changed the Dutch Manuel \"Grubby\" Schenkhuizen to MYM.\nThe end of 2007: committed Meet Your Makers after several failed attempts to gain a foothold in the Counter-Strike world, the reigning World Cyber Games World Champion PGS Gaming. The new team won the Electronic Sports World Cup 2008.\nEarly 2009 sparked the MYM team for Warcraft III and Starcraft on surprising.\nFirst August 2009: bought the Leipziger IT companies' FIO Systems AG \" Meet Your Makers, a few weeks later the organization with new teams in Warcraft III, Counter-Strike and Warcraft was reopened III DotA.\nOn June 6, 2012: the Meet Your Makers was sold by the FIO Systems AG to a private investor and registered as a limited company. \" 'Khaled Naim' \" acts since as managing director of Meet Your Makers GmbH.\nJune 2014: Meet Your Makers GmbH cooperates with the hmf Group (Mannheim), which constitute an integral marketing partner and support in the operational sales.\nOctober 2014: currently owns Meet Your Makers team in Fifa 14 Hearthstone, Heroes of the Storm and Battlefield 4\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689965","title":"Lubricant (disambiguation)","body":"\nLubricant (disambiguation)\n\nA lubricant is a substance introduced to reduce friction between surfaces in mutual contact. For the general article about the topic, see lubricant.\nFor related pages, see:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689970","title":"The Black Diamond","body":"\nThe Black Diamond\n\nThe Black Diamond (French:Le diamant noir) is a 1922 French silent mystery film directed by André Hugon and starring Claude Mérelle, Ginette Maddie and Armand Bernard.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689981","title":"Cirencester by-election, 1892","body":"\nCirencester by-election, 1892\n\nThe 1892 Cirencester by-election was held on 18 October 1892 after the retirement of the incumbent Liberal MP Arthur Brend Winterbotham. The seat was gained by the Conservative candidate Thomas Chester-Master. Chester-Master was originally declared the victor by 3 votes, but on petition and after scrutiny, the votes were declared equal and a new election was held.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689997","title":"Exeter Hotel","body":"\nExeter Hotel\n\nThe Exeter Hotel is an Adelaide hotel located on Rundle Street.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48689999","title":"Guillermina Bravo Montaño","body":"\nGuillermina Bravo Montaño\n\nGuillermina Bravo Montaño (born 27 July 1949) is a Colombian teacher and politician of the Independent Movement of Absolute Renovation (MIRA) party. Currently she is a member of the Chamber of Representatives of Colombia. She was Deputy of the Department Assembly of Valle del Cauca from 2008 to 2011.\nPolitical career.\nFrom 2006 to 2007 she was a member of the leadership of her party, the Independent Movement of Absolute Renovation (MIRA) party, at the Cali city level. In 2006 she ran for Representative of the Valle del Cauca Department, being less than 1,000 votes away from getting a seat as Representative.\nIn 2007 she was elected Deputy of the Department Assembly of Valle del Cauca. In 2008 she served as the leader of her party at the Valle del Cauca Department level. During her term as Deputy she authored 10 Ordinances related to Social, Educational and Entrepreneurial promotion matters. In 2011 she ran for Governor of the Valle del Cauca Department, coming in fourth place thanks to 80,000 votes. \nIn 2014 she ran again for Representative of the Valle del Cauca Department and was elected thanks to 7,194 votes. During her term as Representative, she co-authored, along with his parliamentary group, the law commonly known as \"Natalia Ponce Law\", which increases the sentences related to Acid throwing to up to 50 years of prison. She was designated Spokesperson of the Afro-parliamentary group of the Congress of Colombia in 2014. A year later, she was designated Chairwoman of the Afro-parliamentary group.\nRecognition.\nIn 2008 she received the \"Pro-Joven Award\", which is bestowed by the Municipal Council of Youth of the El Cerrito Municipality upon those leaders who promote positive changes and development to the region. 
In the same year, she received the \"Ancestral Heritage Golden Palm Award\" in the Political Contribution category, bestowed during the Expo-Pacific 2008 Convention. This award is granted based on the contributions of an individual to the Afro-Colombian culture.\nIn 2010 she received the \"Afro-descence Excellence Medal\" from the interim Governor Raymundo Tello, as an acknowledgment of her authorship of Ordinance 299 of 2009, which set guidelines for a public policy to benefit the Afro-Descendant, Palenquero and Raizal communities of the Valle del Cauca Department.\nIn 2014 she received the \"Guachupé of Gold Award\" in the Afro-Colombian leadership category, awarded by the Afro-colombian society of Bogotá D.C., as an acknowledgment of her constant efforts to benefit the Afro-Colombian communities, especially women.\nIn 2015 she received a \"Formal-style Honour Note\" from the Department Assembly of Valle del Cauca due to her leadership and contributions to the development of the Colombian Pacific region and her social and political career in favor of women.\nPersonal life.\nGuillermina Bravo Montaño was born in Cali, Colombia, on 27 July 1949. She graduated in Social Sciences at Santiago de Cali University. She took two specialization courses, one in Cognitive processes and one in Administrative and Political Management She worked as a teacher for over 25 years. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690005","title":"Films Albatros","body":"\nFilms Albatros\n\nFilms Albatros was a French film production company established in 1922. It was formed by a group of White Russian exiles who had been forced to flee following the 1917 Russian Revolution and subsequent Russian Civil War. Initially the firm's personnel consisted mainly of Russian exiles, but over time French actors and directors were employed by the company. Its operations continued until the late 1930s.\nHistory.\nFaced with increasingly difficult working conditions in Russia after the revolution of 1917, the film producer Joseph Ermolieff decided to move his operations to Paris where he had connections with the Pathé company. Arriving in 1920 with a group of close associates, Ermolieff took over a studio in Montreuil-sous-Bois in the eastern suburbs of Paris and began making films through his company Ermolieff-Cinéma. His co-founder of the company was Alexandre Kamenka, another Russian exile, and when in 1922 Ermolieff moved to Germany, Kamenka, together with his colleagues Noë Bloch and Maurice Hache, took over the company and re-established it as the Société des Film Albatros. He also set up a distribution company called Les Films Armor in order to control the distribution of his own films. Various explanations have been given for the choice of the name Albatros: the name of a boat which brought some of the emigrés from Russia; a symbol of White Russia; an incident with an albatros on the journey. As well as adopting the image of the albatros as its symbol, the company took the motto \"Debout dans la tempête\" (\"upright in the storm\").\nAmong the group of Russian artists who stayed to work with Albatros were the directors Victor Tourjansky and Alexandre Volkoff, the art director Alexandre Lochakoff, the costume designer Boris Bilinsky, and the actors Ivan Mosjoukine, Nathalie Lissenko, Nicolas Koline, and Nicolas Rimsky. 
Although this Russian company initially favoured Russian themes, Kamenka quickly realised the need for greater integration with French film production, and they turned increasingly to French subjects. In 1924 a number of Kamenka's Russian associates left Albatros, and Kamenka offered opportunities to several innovative French film-makers including Jean Epstein, Jacques Feyder, Marcel L'Herbier and René Clair. \nKamenka's production policy combined prestige projects with openly commercial films, and his consistent record made him the most successful French producer during the 1920s, according to Charles Spaak, who came to the company as a script-writer in 1928. Kamenka successfully achieved international distribution for many of his films (even in Soviet Russia with which his company had so little political sympathy, and from 1927 he entered into co-production arrangements with production companies in other European countries, driven by growing financial difficulties in the French film industry. The arrival of sound pictures posed a serious difficulty for Albatros which had hitherto relied considerably upon Russian actors, especially Mosjoukine whose accent precluded a successful transition into the talking era.\nThe company's output diminished in the 1930s, but it achieved one further artistic success of note when Jean Renoir joined them for his 1936 adaptation of Gorki's \"Les Bas-fonds\". By this time, Albatros was the longest surviving film company operating in France, but with the outbreak of World War II, Kamenka wound up the company which had remained particularly associated with silent cinema.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690011","title":"Commonwealth Heads of Government Meeting 2020","body":"\nCommonwealth Heads of Government Meeting 2020\n\nThe Commonwealth Heads of Government Meeting 2020, also known as CHOGM 2020 will be the 26th meeting of the heads of government of the Commonwealth of Nations. It will be held in Malaysia. It will be the first CHOGM held in Malaysia since 1989.\nThe position of Commonwealth Chair-in-Office, held by the government leader of the CHOGM host country, will be transferred at the summit from the Prime Minister of the United Kingdom to the Prime Minister of Malaysia who will hold the post until the 27th CHOGM expected in 2022.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690012","title":"Domini Guardato","body":"\nDomini Guardato\n\nDomini Guardato was a powerful landowner, wealthy merchant, and an intellectual in the Kingdom of Sicily. He was received into the Order of Jerusalem and decorated with the Orders of Calatrava and Alcantara. He was a member of the aristocratic Patrician family Guardato during the late 12th century.\nBiography.\nHe was from the medieval merchant city of Sorrento during the Kingdom of Sicily, where his family served as Patricians of the region. From the time of King William the Good, he distinguished himself ever more by military valor, and was therefore often honored with high and important offices and other noble prerogatives. His descendants enjoyed nobility in the Kingdom of Sicily, in Sorrento in the Seat of Door and in Salerno in the Seat of Field; and many members of his family were received into the Knights Hospitaller, the Knights of Alcantara, and the Knights of Calatrava. More important than nobility, his family enjoyed the status of Patrician of Sorrento until its abolition, and in 1804 was ascribed to the Register of Closed Squares of the Kingdom.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690022","title":"List of alumni of the Pontifical North American College","body":"\nList of alumni of the Pontifical North American College\n\nThis is a partial list of notable alumni of the Pontifical North American College in Rome, a Roman Catholic educational institution that forms and educates seminarians and student priests for dioceses in the United States (as well as Canada and Australia). It was founded in 1859.\nIf the prelates and priests listed here completed their normal course of pre-ordination theology studies while at the North American College (in general, the bachelor and licentiate), only their year of ordination is given; if they were sent to the College for graduate studies or continuing education after ordination, then that graduate degree or program is listed.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690023","title":"St. Andre's Parish","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48690025","title":"Cirencester by-election, 1893","body":"\nCirencester by-election, 1893\n\nThe 1893 Cirencester by-election was held on 23 February 1893 after a court declared a by-election in 1892 was rerun after the votes had been declared equal. The seat was gained by the Liberal candidate Harry Lawson Webster Levy-Lawson. The Conservative candidate Thomas Chester-Master was declared the victor of the 1892 by-election by 3 votes, but on petition and after scrutiny, the votes were declared equal and the 1893 by-election was held.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690035","title":"Sooklek","body":"\nSooklek\n\nSooklek (or Suklek) is a Thai cartoon character created by Prayoon Chanyavongs in the \"likay\" style. He is characterized by a \"jaunty feather stuck in a band around his head and carrying a sword in one hand.\" Prayoon's son was named after this character.\nHistory.\nSooklek was first popularized as the titular role in the cartoon series \"Prince Chantarakob\" (จันทโครพ) and eventually became a public personality as creator Prayoon used the character in his satirical cartoons. His name means \"happy, good fellow\".\nWhen Field Marshall Thanom Kittikachorn gave out an order for Prayoon to stop his political cartoons in 1968, Sooklek was drawn with lips sewn together. Another warning from the government brought about change in Sooklek as the sewn lips were replaced by a big mustache. Sooklek regained his mouth with the ouster of Thanom in 1973.\nAdaptation.\nAn animation series in both 2D and 3D has been produced with Sooklek in the starring role. A commemorative book has also been launched by the Prayoon Foundation. The book is divided into two sections with the first focusing on Sooklek and the second about Prayoon's life and works.\nTo commemorate Prayoon's centenary, the Thailand Post launched a sheet of stamps. In addition, a local brand is producing T-shirts featuring Sooklek characters with part of the proceeds going to Prayoon Foundation.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690040","title":"Jena, Alabama","body":"\nJena, Alabama\n\nJena is an unincorporated community in Greene County, Alabama, United States.\nHistory.\nJena was most likely named by a German family who settled in the area in honor of Jena, Germany. A post office operated under the name Jena from 1837 to 1921. Baseball Country, a world-renowned baseball camp, is located in Jena.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690057","title":"Sam George Nartey","body":"\nSam George Nartey\n\nSam George Nartey is a Ghanaian politician. He is a member of the National Democratic Congress. In November 2015 he defeated the incumbent E. T. Mensah to represent the party in the 2016 parliamentary elections for Ningo-Prampram constituency.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690071","title":"Excela Health","body":"\nExcela Health\n\nExcela Health is a not-for-profit health organization that includes three licensed, acute care hospitals, two free-standing outpatient surgery centers, home care and hospice, physician practices, a durable medical equipment company and other facilities and services. Formally incorporated in 2004, Excela Health is governed by a single Board of Trustees. Its headquarters is located in Greensburg, Pennsylvania.\nExcela Health is the sole provider of health care in Westmoreland County. It employs 4,800 employees and credentials 800 physicians and allied health professionals. It also serves parts of Fayette and Indiana counties.\nThree charitable foundations exist to benefit the clinical and operational needs of Excela Health's hospitals and affiliated health care services. They include the Westmoreland/Frick Hospital Foundation with its two branches - the Frick Hospital Foundation and the Westmoreland Hospital Foundation - and the Latrobe Area Hospital Charitable Foundation.\nHealth facilities.\nFrick Hospital.\nA 102 licensed-bed hospital located in Mount Pleasant, offers services including general acute care, surgical services, award-winning emergency services, a sleep center, rehabilitation services and more. In addition to modem operating rooms and needed support functions, there is a short procedure unit for minor outpatient surgeries. The hospital's Women's Care Services offer a range of breast health services and bone density scanning. 
The Outpatient Services Center features a centralized outpatient registration area with quick, convenient patient registration surrounded by a variety of outpatient testing areas and services, drawing together nuclear medicine, pulmonary function lab, stress lab, EKG, EEG, echo cardiography, x-ray, ultrasound and mammography for a \"one-stop\" shop.\nLatrobe Hospital.\nLocated in the eastern section of Westmoreland County, Latrobe Hospital offers acute, surgical and specialized services. A 196-licensed-bed hospital, Latrobe features mammography, bone density services . Extensive cardiac diagnostic testing and treatment abound with a cardiac rehabilitation program available for post surgery patients. The hospital also features a state of the art newly renovated emergency department, a sleep center; diabetes center and endocrine clinic; outpatient surgery and short procedure suites; emergency services; wellness programs and more. Home to Excela Health's child and adolescent inpatient unit, Latrobe Hospital does not offer child and adolescent health services. It is also home to Excela Health's geriatric assessment service, and is the site of the health system's Center for Neurosciences. A Family Medicine Residency Program at Latrobe Hospital, affiliated with the Jefferson Medical College of Thomas Jefferson University, allows physicians hands-on experience flexible enough to prepare them for rural, suburban or urban medical practice.\nWestmoreland Hospital.\nWestmoreland Hospital, located in central Westmoreland County, is a full-service, acute care hospital and regional referral center with 364 licensed beds. The Family Additions Maternity Center offers maternity care in a home-like atmosphere featuring labor-delivery-recovery suites (LDRs) with operating suites for Cesarean or high risk births, and a Special Care (Level II) Nursery. There are also services for women planning or considering pregnancy and gynecological services. 
Behavioral Health Services feature an adult inpatient unit as well as outpatient services for adults. Additionally, the Westmoreland campus offers a breast health center; outpatient services including the SurgiCenter at Westmoreland and the Short Stay Surgery unit; sleep center; diabetes services and endocrine clinic; digestive disorders center; pain center; fixed site and open MRI units; a large critical care unit with an intensivist program (offering 24-hour-a-day, in-house physician specialist coverage in the critical care areas), and emergency care. It is also home to the interventional Center for Cardiovascular Medicine encompassing cardiac catheterization labs, electrophysiology labs and open heart surgery.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690078","title":"Ma Junqing","body":"\nMa Junqing\n\nMa Junqing (; born October 1956) is a Chinese politician, serving since 2015 as the Deputy Communist Party Secretary of Jilin province.\nMa was born in Gongzhuling, Jilin. He joined the Communist Party in March 1976, shortly before the death of Mao. He graduated from the department of economics at Jilin University, and later obtained a doctorate in economics.\nMa's political career originated in the Jilin provincial organization of the Communist Youth League, in which he served as deputy secretary, and secretary, before being transferred to serve as mayor of Songyuan. He later served as party chief of Siping, and the secretary-general of the Jilin government. He joined the Jilin provincial Party Standing Committee as head of the propaganda department in 2004; later he took on the office of the secretary-general of the Jilin provincial party committee, and in August 2008, was re-shuffled to Vice-Governor. In May 2012 he was named executive vice-governor of Jilin.\nIn November 2015, he was named deputy party chief of Jilin province.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690098","title":"Rallye du Var","body":"\nRallye du Var\n\nThe Rallye du Var is a yearly motor rally held in the month of November in the French commune of Sainte-Maxime in Var. It is often held as the final round of the French Rally Championship. It began in 1950.\nThe rally has attracted famous names from the world of rally driving such as the recently retired nine-time WRC champion, Sébastien Loeb (the 2000, 2009 and 2014 winner), 1994 WRC champion Didier Auriol (the 1987 and 1988 winner), Freddy Loix, Craig Breen, Jari-Matti Latvala (the 2011 winner), Dany Snobeck (the 1982 and 2008 winner), Romain Dumas, François Chatriot (the 1985, 1986 and 1989 winner), and Julien Maurin (the 2013 winner). Jari-Matti Latvala was the first non-Frenchman and thus foreign driver to win the rally, and it was also his first win on asphalt.\nAs well as part of the French Rally Championship, the Rallye du Var was part of the European Rally Championship calendar from 1984 to 2001.\nRecent years.\n2010.\nIn 2010, Cédric Robert won for the second time, having previously succeeded in 2002. He led the entire event and won four stages. Ex-Formula One driver Robert Kubica, who had recently completed the 2010 season for Renault, won the last three stages to ensure a high overall finish of fourth was bagged. The other two podium finishers turned out to be Bryan Bouffier and Stéphane Sarrazin.\n2011.\nIn 2011, WRC front runner Jari-Matti Latvala became the first foreign driver to win the race and the first Finn to do so. He beat previous winner Stéphane Sarrazin and Estonian driver Ott Tänak. He and his co-driver Miikka Anttila won in a Ford Fiesta RS WRC. It was also the first win for Latvala on asphalt, and he led the rally from start to finish, winning six stages along the way.\n2012.\nIn 2012, Cédric Robert won this rally for a third time, following his wins in 2002 and 2010. He was again co-driven by Matthieu Duval. 
Second place went to Le Mans winner Romain Dumas and third to Irishman Craig Breen. Ex-Formula One driver Robert Kubica of Poland dominated the rally and won every stage prior to crashing out late on; this allowed the Frenchman Robert to take the lead and win.\n2013.\nIn 2013, Julien Maurin won for the first time with co-driver Nicolas Klinger. Jérémi Ancian and Pierre Roché joined him on the podium. After a hat trick of stage wins, Maurin led to the end.\n2014.\nIn 2014, Sébastien Loeb driving his Citroën DS3 WRC won the Rallye du Var for the third time and the second with his wife Sévérine Loeb as the co-driver. The second place driver was David Salanon and third was Patrick Magnou. An influx of spectators caused three of the stages to be cancelled. However, Loeb did not let this hinder his performance, leading the entire rally from start to finish, as with his rival Jari-Matti Latvala in 2011.\n2015.\nIn 2015, the 61st running of this event, David Salanon and Romain Roche won in a Ford Fiesta RS WRC. Their first win on the asphalt event was followed by a second place from newly crowned JWRC and WRC-3 champions Quentin Gilbert and Renaud Jamoul and third place went to Pierre and Martine Roché. For the second year running, the winner, Salanon, had a lights-to-flag victory. As for Gilbert, the newest Junior World Champion took advantage of his experience and won the final stage to elevate himself to second overall.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690105","title":"The Two Pigeons (film)","body":"\nThe Two Pigeons (film)\n\nThe Two Pigeons (French:Les deux pigeons) is a 1922 French silent film directed by André Hugon and starring Armand Bernard, Germaine Fontanes and Huguette Delacroix.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690115","title":"André Ferreira (Portuguese footballer)","body":"\nAndré Ferreira (Portuguese footballer)\n\nAndré Filipe Magalhães Ribeiro Ferreira (born 29 May 1996) is a Portuguese professional footballer who plays for Benfica B as a goalkeeper.\nClub career.\nFerreira was born in Vila Nova de Gaia, Portugal. On 24 November 2015, he debuted professionally with Benfica B in a 2015–16 Segunda Liga match against Oriental.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690123","title":"Old Islam in Detroit","body":"\nOld Islam in Detroit\n\nOld Islam in Detroit: Rediscovering the Muslim American Past is a 2014 book by Sally Howell, published by the Oxford University Press. It discusses the Muslims of early 20th century Detroit, Michigan, and Detroit prior to 1970.\nContents.\nThe first parts of the book discuss the first Muslims to settle in Detroit and the city's first Islamic religious facility, the Highland Park Mosque. Another chapter discusses the second mosque, Universal Islamic Society (UIS). The later chapters discuss Islamic leaders who originated from Detroit and the first mosques to open in Dearborn. At the end of the book Howell states that pre-1980s views of Muslims influence views of Islam held by Americans in the post-September 11 environment.\nThe book includes interviews of the original Muslims and their families.\nReception.\nDawn-Marie Gibson of Royal Holloway, University of London stated that the book was \"thoroughly researched\" and is \"a valuable contribution to scholarship on American Islam.\"\nB. D. Singleton rated the book two stars, and stated that the book \"is appropriate for all academic libraries\" and is \"nicely illustrated but would have been strengthened by a basic chronology.\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690127","title":"Stephen E. Gordy","body":"\nStephen E. Gordy\n\nStephen E. Gordy (March 20, 1920 – October 27, 2004) was an American politician, military officer, and educator.\nFrom Dalton, Georgia, Gordy graduated from the United States Military Academy in 1943 and from the Naval War College. He served in the United States Army during World War II and the Korean War. Gordy was a teacher, principal, football and baseball coach in the Loudoun County, Virginia Public Schools. Gordy served in the Virginia House of Delegates from 1982 to 1987 and was a Republican; he lived in Mantua, Virginia. He died at his home in Dalton, Georgia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690133","title":"List of One Day International cricket matches","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48690141","title":"Appollinaire University","body":"\nAppollinaire University\n\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690148","title":"The Wedding March (1929 film)","body":"\nThe Wedding March (1929 film)\n\nThe Wedding March () is a 1929 French silent comedy film directed by André Hugon and starring Pierre Blanchar, Louise Lagrange and Paul Guidé.\nIt was made by the French subsidiary of Paramount Pictures. The film's sets were designed by the art director Christian-Jaque.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690156","title":"Karakhan Manifesto","body":"\nKarakhan Manifesto\n\nThe Karakhan Manifesto was a statement of Soviet policy toward China dated July 25, 1919. It was issued by Lev Karakhan, deputy commissioner for foreign affairs for Soviet Russia. The manifesto offered to relinquish various rights Russia had obtained by treaty in China, including extraterritoriality, economic concessions, and Russia's share of the Boxer indemnity. These and similar treaties had been denounced by Chinese nationalists as \"unequal.\" The manifesto created a favorable impression of Russia and Marxism among Chinese. It was often contrasted with the Treaty of Versailles (1919), which granted Shandong to Japan.\nThe manifesto was prompted by the Bolshevik advance into Siberia, which created a need to establish a relationship with China. The Bolsheviks saw the Chinese as one of \"the oppressed peoples of the East\" and therefore a potential ally against the \"imperialist\" powers.\nThe manifesto is addressed to, \"the Chinese people and the Governments of North and South China.\" Because both Russia and China were in a state of civil war at this time, diplomatic exchanges were often delayed. Although the document was published in Moscow in August 1919, it was not formally presented to Chinese diplomats until February 1920. The version presented at this time includes the passage, \"the Soviet Government returns to the Chinese people, without any compensation, the Chinese Eastern Railway.\"\nSix months later, Karakhan personally handed the Chinese a second version of the manifesto, one that did not include this remarkable offer. In fact, the Soviet authorities denied ever having made it. The railway offer had been included by \"mistake,\" they explained. The Soviets may have hoped the offer of the railway would generate an enthusiastic response in Beijing, leading to a Sino-Soviet alliance against Japan. 
The warlords in Beijing, closely tied to Japan, responded hesitantly. When the hoped-for alliance proved unattainable, the Russians withdrew their offer. In any event, traditional Russian interests and rights in China, including control of the Chinese Eastern Railway, were reaffirmed in a series of secret agreements made in 1924–1925.\nThe manifesto came at a crucial time in the development of Chinese communism. It encouraged interest in Marxism and thus played a role in the founding of the Chinese Communist Party in 1921.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690168","title":"Kripapureeswarar Temple","body":"\nKripapureeswarar Temple\n\nKripapureeswarar Perumal Temple (also called Arutkondanathar or Thiruvennainallur temple) in Thiruvennainallur, a panchayat town in Villupuram district in the South Indian state of Tamil Nadu, is dedicated to the Hindu god Shiva. Constructed in the Dravidian style of architecture, the present structure of the temple is believed to have been built during the Cholas period in the 10th century. The temple has received gracious endowments from the Chola queen Sembiyan Mahadevi. Shiva is worshipped as Kripapureeswarar and his consort Parvathi as Mangalambigai.\nThe presiding deity is revered in the 7th century Tamil Saiva canonical work, the \"Tevaram\", written by Tamil saint poets known as the Nayanmars and classified as \"Paadal Petra Sthalam\". A granite wall surrounds the temple, enclosing all its shrines. The temple has a five-tiered rajagopuram, the gateway tower. The temple is closely associated with Sundarar, the saivite saint of the 8th century, who started singing his \"Tirumurai\" starting with \"Pitha Piraisudi\" verse in this temple.\nThe temple is open from 6am - 11 am and 4-8:00 pm on all days except during festival days when it is open the full day. Four daily rituals and many yearly festivals are held at the temple, of which the Aadi star day celebrated during the Tamil month of \"Aaadi\" (June - July) for Sundarar and Panguni Uthiram festival during \"Panguni\" (March - April) with a float festival being the most prominent. The temple is maintained and administered by the Hindu Religious and Endowment Board of the Government of Tamil Nadu.\nLegend.\nAs per Hindu legend, the sages in Tharukavanam were very proud of their achievements and started doing a penance to destroy Shiva. Shiva absorbed all the evils from the penance and realising their mistake, the sages started their worship to Shiva. 
Shiva blessed them with their wishes and came to be known as Krupapureeswarar, the \"God who would bestow wishes of the devotees\". As per another legend, Sundarar, the famous Saivite saint and Nayanmar, was stopped by an old man from marrying at Thirukovilur. He showed a document indicating Sundarar was indebted to the old man for serving him for a lifetime. Sundarar called him \"Pitha\", a lunatic. The village elders after analysing the document, asked Sundarar to follow the old man. Sundarar followed the old man and served him in his household. It was later revealed to him that Shiva appeared as the old man to test his servitude. Sundarar felt guilty of accusing Shiva, but Shiva revealed to him in a divine voice that he enjoyed the verse and requested him to sing verses starting with \"Pitha\".\nSundarar started singing his \"Tirumurai\" with \"Pitha Piraisudi\" verse in this temple and later would go on to become one of the four most venerated saints of Saiva literature.\nArchitecture.\nThe exact year of building could not be ascertained from the inscriptions, but the inscriptions found in the Visalur temple indicate benevolent gifts to the temple from Raja Raja Chola I (984-1015 CE) and his successors. Based on the inscriptions, researchers point out that the temple had gardens, which were supposed to have both floral plants and fruit bearing trees. The temple has received gracious endowments from the Chola queen Sembiyan Mahadevi and is believed to have established various sculptures.\nKripapureeswar temple is located in Thiruvennainallur, a village located from Villupuram on the Panruti- Thirukovilur road. The temple has a seven-tiered \"rajagopuram\", the gateway tower that pierces the rectangular wall that houses all the shrines. The sanctum houses the image of Kripapureeswarar in the form of Lingam, an iconic form of Shiva. There is an Ardha Mandap and a Mukha mandap, pillared halls leading to the sanctum. 
The first precinct has the images of Vinayakar, Murugan, Durga, Dakshinamurthy and Chandikeswara. The hall where the case was fought between the old man and Sundarar is believed to be the Panchyat Mandap located on the right side of the entrance.\nCulture.\nThe temple follows Saivite tradition. The temple priests perform the \"pooja\" (rituals) during festivals and on a daily basis. The temple rituals are performed four times a day: \"Kalasanthi\" at 6:00 a.m., \"Uchikalam\" at 11:00 a.m., \"Sayarakshai\" at 5:00 p.m., and \"Sayarakshai\" between 7:45  - 8:00 p.m. Each ritual has three steps: \"alangaram\" (decoration), \"neivethanam\" (food offering) and \"deepa aradanai\" (waving of lamps) for both Kripapureeswarar and Mangalambigai. There are weekly, monthly and fortnightly rituals performed in the temple. The temple is open from 6am - 12 pm and 4-8:30 pm.\nAadi star day celebrated during the Tamil month of \"Aaadi\" (June - July) as Sundarar's birthday and Panguni Uthiram festival during \"Panguni\" (March - April) with a float festival being the most prominent festivals. There are other common festivals like Shivaratri, Vinayaga Chaturthi, Vijayadasami and Karthigai Deepam celebrated in the temple.\nSundarar, an 8th-century Tamil \"Saivite\" poet, venerated Kripapureeswarar in ten verses in \"Tevaram\", compiled as the \"Seventh Tirumurai\". As the temple is revered in \"Tevaram\", it is classified as \"Paadal Petra Sthalam\", one of the 276 temples that find mention in the Saiva canon. In modern times, the temple is maintained and administered by the Hindu Religious and Endowment Board of the Government of Tamil Nadu.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690182","title":"Socialists and Democrats (Italy)","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48690186","title":"Francisco Adolfo Cabrera","body":"\nFrancisco Adolfo Cabrera\n\nFrancisco Cabrera is an Argentine engineer, born in the Mendoza Province. He trained as an electrical engineer at the University of Mendoza, and headed the ministry of economic development of Buenos Aires under Mauricio Macri from 2007 to 2015. Macri was elected president in 2015, and appointed him minister of production. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690198","title":"Sarati the Terrible (1937 film)","body":"\nSarati the Terrible (1937 film)\n\nSarati the Terrible (French:Sarati, le terrible) is a 1937 French drama film directed by André Hugon and starring Harry Baur, George Rigaud and Jacqueline Laurent.\nThe film's sets were designed by the art director Émile Duquesne.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690214","title":"Pleasant Ridge, Alabama","body":"\nPleasant Ridge, Alabama\n\nPleasant Ridge, also known as Ridge, is an unincorporated community in Greene County, Alabama, United States. Pleasant Ridge is located on Alabama State Route 14, northwest of Eutaw.\nHistory.\nA post office operated under the name Pleasant Ridge from 1825 to 1918. On April 6, 1865, there was a skirmish between Union forces under the command of Col. John T. Croxton and Confederate forces under the command of Brigadier-General William Wirt Adams near Pleasant Ridge. Croxton was leaving Tuscaloosa, having burned the University of Alabama on April 4. The 6th Kentucky Cavalry Regiment and the 2nd Michigan Volunteer Cavalry Regiment engaged with Adams' forces.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690219","title":"Joseph Baly","body":"\nJoseph Baly\n\nJoseph Baly (1824 - 1909) was Archdeacon of Calcutta from 1872 until 1883.\nBaly was educated at Worcester College, Oxford, graduating BA in 1846 and M.A. in 1857. He was ordained deacon in 1847 and priest in 1848. He served curacies in Leicester and Falmouth. In 1854 he became Warden of St Thomas's College, Colombo. He later served as Chaplain at Allahabad, Sealkote and Simla before returning to Falmouth as its Rector (1870 - 1872). He was appointed a Fellow of the University of Calcutta in 1879. On his return from India he was Chaplain of Windsor Great Park from 1885 until 1906.\nHe died on 6 November 1909.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690237","title":"NAO (singer)","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48690239","title":"Office of Dispute Resolution for Acquisition","body":"\nOffice of Dispute Resolution for Acquisition\n\nThe Office of Dispute Resolution for Acquisition (ODRA) is an Article I court that was established by the Federal Aviation Administration (FAA) pursuant to a statutory grant of authority as an independent tribunal to hear and decide both award protests and contract disputes subject to the Acquisition Management System (AMS) between Government contractors and the FAA.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690247","title":"The Bad Companions","body":"\nThe Bad Companions\n\nThe Bad Companions is a 1932 British comedy film directed by J.O.C. Orton and starring Nor Kiddie, Renee Gadd and Wallace Lupino. The title is a reference to the 1929 novel \"The Good Companions\" by J. B. Priestley which was itself made into a film the following year.\nIt was made at Welwyn Studios as a second feature by British International Pictures.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690262","title":"Sebastian Saxe","body":"\nSebastian Saxe\n\nSebastian Saxe started his career in the City of Hamburg and has been a Board Member of the \"Hamburg Port Authority\" (HPA) since 2009. Hamburg's port is one of the largest ports in the European Union and among the biggest ports in the world. As CIO and CDO, Saxe has his main focus on the port’s IT strategy and the digital transformation of the company and its intermodal logistical chain.\nCurrently, he is strongly involved in building the smartPORT of Hamburg. The main goal is to make use of all IT megatrends, like Internet of Things, Big Data, Cloud Computing and Mobility to maximize the efficiency in the logistic hub of Hamburg.\nSebastian Saxe holds a PhD in mathematics and was one of the CIOs of the year in 2012. Under his guidance, the HPA won various prizes in the field of IT and started its transformation for the digital age.\nRecently, he was chosen as CIO of the year 2015 for small and medium-sized enterprises in Germany.\nLife.\nSebastian Saxe lives in Hamburg, Germany, with his wife and two children.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690265","title":"Alex Gerrard","body":"\nAlex Gerrard\n\nAlex Gerrard may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690293","title":"Seaman Service Book","body":"\nSeaman Service Book\n\nSeaman Service Book (SSB) is a continuous record of a seaman’s service. This document certifies that the person holding it is a seaman as per The International Convention on Standards of Training, Certification and Watchkeeping for Seafarers (STCW), 1978, as amended from time to time. The Seaman Book is one of the compulsory documents when applying for crew transit visas. The record of employment on board a merchant ship (sea service) is recorded in a Seaman Service Book. Different countries issue their seafarers similar service books under different names, e.g. Seaman Record Book, Seaman Discharge Book, etc. In Pakistan, the Government Shipping Office issues this book under section 120 of the Merchant Shipping Ordinance, 2001. It is mandatory for all seafarers serving on board ships, whether they are on the Minimum Safe Manning Certificate or not, to hold a Seaman Service Book and Seaman Identity Document (SID).\nAffairs of Seamen in Pakistan.\nThe Government Shipping Office looks after the affairs of seafarers under the Merchant Shipping Policy of Pakistan, which covers the following subjects of the merchant navy of Pakistan:\nIssuance of SSB.\nPakistan's merchant marine policy for jobs on vessels, set in 2001, reads as follows:\nTo obtain employment on board a seagoing vessel every citizen of Pakistan is entitled to acquire a Seaman Service Book (SSB) in accordance with the provision of Merchant Shipping Ordinance 2001 subject to fulfilling the requirements as prescribed under the Rules issued from time to time, by the Government of Pakistan. No seaman can be engaged at any port of Pakistan, except for service on coasting ships, unless the seafarer is a bona fide holder of the SSB. Foreign crew and merchant navy officers must be in possession of an equivalent document, e.g. an equivalent discharge book issued by their own country. 
This is a prescribed certificate of identification with basic particulars and qualifications of the seaman duly registered with the Government Shipping Office. It is issued on Government sanctioned Form No. 20 by the Shipping Master under the provisions of Sections 120-138 of Merchant Shipping Ordinance, 2001. It is issued under a standard operating procedure (SOP); generally the SSB contains the minimum information as given below:\nOther pages of SSB contain columns for Seaman engagement and discharge record, promotion/advancement, company listing, summary of previous voyages, visa endorsement, official entries by the concerned issuing office etc. The SSB is issued by the National Database Registration Authority (NADRA) after the prescribed procedure has been followed and the fee deposited. The (SSB) is also liable to be cancelled, suspended or confiscated if a seaman is found to be involved in contravention of any local law.\nIn Pakistan one of the sources of getting an SSB in the category of ship's ratings/crew is completion of courses at private sector institutions, which are commonly known as GP or GP-III courses.\nSSB Holders in the country.\nPrior to 1990, the Pakistan government followed a policy of issuing CDCs (now SSBs) only up to a certain number per year in order to ensure the availability of a job for each and every seaman holding a CDC under the roster system. Earlier, there was just one government-owned institute, namely Pakistan Marine Academy; however, after promulgation of the Merchant Shipping Ordinance (2001), institutes in the private sector have been allowed to offer training to seamen for issuance of SSB according to their qualification, and out of 10 approved institutes, five are actively conducting their business of training and education in accordance with the STCW Convention. This has increased the number of SSB holders in Pakistan in excess of demand. About 40% of Pakistani seafarers have been jobless for a long time. 
However, the Government Shipping Office discloses that there are about 8,000 officers and 10,500 ratings duly registered as seamen. Out of this total number of registered seamen about 30% are employed on national as well as foreign ships. The employment on foreign ships is about 85% of the total seamen engaged in this field.\nVisa on Passport to Pakistani SSB holder.\nAfter the events of 9/11, most European and North American countries placed restrictions on Pakistani seafarers, requiring them to carry a passport and SSB along with a visa for that country before they could leave Pakistan to join a ship berthed in any European or North American country.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690302","title":"Infinality bundle","body":"\nInfinality bundle\n\nInfinality bundle is a font and libraries bundle aimed at optimized text rendering under Linux. It comprises patched versions of FreeType (with optimized settings), fontconfig and cairo.\nInfinality bundle replaces non-free fonts by free alternatives.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690321","title":"Marco Aurélio Ribeiro Sousa","body":"\nMarco Aurélio Ribeiro Sousa\n\nMarco Aurélio Ribeiro Sousa (born 29 January 1995 in Porto) is a Portuguese professional footballer who plays for F.C. Paços de Ferreira as a goalkeeper.\nFootball career.\nOn 29 September 2014, Sousa made his professional debut with Paços de Ferreira in a 2014–15 Taça da Liga match against União Madeira.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690324","title":"Walter, Alabama","body":"\nWalter, Alabama\n\nWalter is an unincorporated community in Cullman County, Alabama, United States. Walter is located on Alabama State Route 91 northeast of Hanceville.\nHistory.\nWalter is named for the son of the community's first postmaster. A post office operated under the name Walter from 1888 to 1905.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690329","title":"Thomas Bewley","body":"\nThomas Bewley\n\nThomas Bewley, CBE, of St Thomas's Hospital, London, was president of the Royal College of Psychiatrists from 1984 to 1987.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690333","title":"Chemical Pioneer Award","body":"\nChemical Pioneer Award\n\nThe Chemical Pioneer Award, established in 1966, is awarded by the American Institute of Chemists to recognize chemists or chemical engineers who have made outstanding contributions to advances in chemistry or the chemical profession. \nRecent recipients.\nSource: \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690335","title":"Horse Brook (Queens)","body":"\nHorse Brook (Queens)\n\nHorse Brook is a buried stream located in the neighborhood of Elmhurst in the New York City borough of Queens. Its historic course flows beneath Queens Center Mall, Rego Center Mall, LeFrak City, and the Long Island Expressway, before emptying into Flushing Creek in present-day Flushing Meadows-Corona Park. Flushing Creek is a tributary of the East River.\nHorse Brook's headwaters originated near Kneeland Avenue and Codwise Place. Horse Brook was first mentioned at an annual town meeting in 1662, where it was voted that “whosoever has cats or dogs or hogs lying dead in any place to offend their neighbors they must bury them or throw them into the creek.”\nThe only remaining traces of Horse Brook today are the mega-blocks on the map that avoided development in the early 20th century, remaining vacant until the 1960s. Examples include the Queens Center Mall and LeFrak City. A small park called Horsebrook Triangle in Elmhurst marks the approximate location of the buried stream.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690345","title":"Muhammad Parvesh Shaheen","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48690349","title":"Forest of Dean by-election, 1887","body":"\nForest of Dean by-election, 1887\n\nThe 1887 Forest of Dean by-election was held on 29 July 1887 after the retirement of the incumbent Liberal MP Thomas Blake. The seat was retained by the Liberal candidate Godfrey Blundell Samuelson.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690382","title":"2016 America East Conference Baseball Tournament","body":"\n2016 America East Conference Baseball Tournament\n\nThe 2016 America East Conference Baseball Tournament will be held from May 26–28. The top four regular season finishers of the league's six teams will meet in the double-elimination tournament to be held at Edward A. LeLacheur Park in Lowell, Massachusetts, the home park of UMass Lowell.\nSeeding and format.\nThe top four finishers from the regular season will be seeded one through four based on conference winning percentage only. The teams will play a double-elimination tournament. UMass Lowell, despite hosting the event, is not eligible to participate as it transitions from Division II. The River Hawks are expected to complete this transition and be eligible for championships in the 2017–18 academic year.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690392","title":"Japonism (Arashi album)","body":"\nJaponism (Arashi album)\n\nJaponism is the fourteenth studio album of the Japanese idol group Arashi. The album was released on October 21, 2015 under their record label J Storm in three editions: a first press/limited edition, a Yoitoko limited edition, and a regular edition. The first press edition comes with an 84-page photo lyrics booklet and bonus DVD with the music video and making-of for the album's lead track, \"Kokoro no Sora\". The Yoitoko limited edition comes with a 32-page lyrics booklet, and the regular edition comes with a 36-page lyrics booklet. The album sold over 820,000 copies in its first week and topped the Oricon charts for two consecutive weeks. With more than 950,000 copies sold, the album was certified for Million by the Recording Industry Association of Japan (RIAJ).\nAlbum information.\nThe first press edition contains a CD with sixteen tracks and the Yoitoko edition contains a CD with seventeen tracks. The regular edition contains a CD with twenty tracks. The first press edition comes with an 84-page photo lyrics booklet and a bonus DVD with the music video and making of for \"Kokoro no Sora\", while the Yoitoko limited edition comes with a 32-page lyrics booklet, a bonus track, and an original talk track \"Arajapo Talk\". The regular edition comes with a 36-page lyrics booklet and four bonus tracks.\nThe album jacket cover for the Yoitoko and regular editions are the same. The first press edition has a different jacket cover.\nSongs.\nIn \"Japonism\", Arashi expresses their interpretations of the \"wonderfulness of Japan\" in a unique way. It showcases Arashi's ambitious challenging spirit and continuous evolution. The lead track \"Kokoro no Sora\" was composed by Tomoyasu Hotei, who is based in London, with the theme \"Japan seen from the outside\" in mind. 
Described as a \"passionate and manly song\", Arashi sings to a fast-paced Hotei sound, where a battle between Arashi, Hotei, and Japanese instruments take place. The album includes a cover of Shonentai's \"Nihon Yoitoko Maka Fushigi\".\n\"Japonism\" includes two of the group's previously released singles: \"Sakura\" and \"Aozora no Shita, Kimi no Tonari\". This album also includes fourteen new songs plus five of each member's solo songs. It also includes their previously unreleased song \"Furusato\" which they have sung regularly since 2010.\n\"Sakura\" was used as the theme song for the drama \"Ouroborous\", starring actors Toma Ikuta and Shun Oguri. This is the first time Arashi has provided a theme song for a drama that did not star one of its members. \"Aozora no Shita, Kimi no Tonari\" was used as the theme song for the drama \"Yokoso, Wagaya E,\" which stars Arashi member Masaki Aiba.\nPromotion.\nTo support their new album, Arashi performed a live tour, ARASHI LIVE TOUR 2015 Japonism, performing at all the major dome stadiums in Japan. They had 17 performances beginning on November 6 at the Nagoya Dome, followed by Sapporo Dome on November 8, Kyocera Osaka Dome on November 26, Fukuoka Dome on December 17, and Tokyo Dome on December 23, 2015.\nChart performance.\nThe album debuted at number one on the Oricon daily album chart selling 412,826 copies upon its release and selling over 820,000 copies by the end of the week, topping the Oricon weekly album chart. The album maintained its number-one spot on the Oricon weekly album chart selling 56,890 copies in its second week and stayed in the top ten for six consecutive weeks. The album placed second on Billboard Japan's top album year-end list.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690394","title":"Tomi","body":"\nTomi\n\nTomi may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690401","title":"Solent Sea Steam Packet Company","body":"\nSolent Sea Steam Packet Company\n\nThe Solent Sea Steam Packet Company, later the Solent Steam Packet Company, operated ferry services between Lymington and Yarmouth on the Isle of Wight between 1841 and 1884.\nHistory.\nIn early 1841, the company purchased \"Glasgow\" from the \"Lymington, Yarmouth, Cowes and Portsmouth Steam Packet Company\", and after refitting, was deployed on the service between Lymington and Yarmouth, operating three or four passages a day.\nIn March 1841 they entered into a contract with the Post Office for the conveyance of mail between Lymington and Yarmouth.\nBy 1842, the company had acquired another vessel, \"Solent\", which was running from Lymington to Yarmouth, Cowes, Ryde and Portsmouth.\nIn 1858, \"Red Lion\" was added to the fleet to handle additional traffic brought by the railway. The company changed its name to the \"Solent Steam Packet Company\" in 1861.\nA second \"Solent\" replaced the first on 3 November 1863. \"Mayflower\" joined the fleet on 6 July 1866 had been built in Newcastle; she was tastefully fitted and comfortable. As well as plying to Yarmouth, she made excursion runs to Bournemouth, but was disposed of after 1878.\nOn 1 July 1884, the London and South Western Railway bought out the Solent Steam Packet Company's fleet of two paddle steamers, \"Solent\" and \"Mayflower\", four horse and cargo boats, and other boats and property, paying £2,750 (£ in ).\nShips.\nThe vessels operated by the Solent Sea Steam Packet Company were:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690414","title":"European consumer law","body":"\nEuropean consumer law\n\nEuropean consumer law concerns consumer protection within Europe, particularly through European Union law and the European Convention on Human Rights. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690419","title":"James Chapelhow","body":"\nJames Chapelhow\n\nJames \"Jay\" Chapelhow (born 21 September 1995) is an English professional rugby league player for Widnes Vikings. His playing position is Prop Forward.\nCareer.\nChapelhow made his senior debut on loan at Whitehaven. In total he played 4 games for the Cumbrian club. His debut for parent club Widnes Vikings came in a Super League Super 8s qualifier against Leigh Centurions on 27 September 2015.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690433","title":"Zion, Alabama","body":"\nZion, Alabama\n\nZion is an unincorporated community in Pickens County, Alabama, United States. Zion is located along Alabama State Route 159, north of Gordo.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690440","title":"Line 4, Ningbo Rail Transit","body":"\nLine 4, Ningbo Rail Transit\n\nLine 4 of Ningbo Rail Transit () is a rapid transit line under construction in Ningbo. It starts from Cicheng Town, Jiangbei District and ends near Dongqian Lake in Yinzhou District. Construction of Line 4 started in November 30, 2015.\nRoute.\nLine 4 starts from Cicheng Station in Cicheng Town in east-west direction as an elevated line. Then it turns south into the North External Ring Viaduct where it turns east-west. After reaching Jiangbei Avenue, it starts to turn underground and deviates from the viaduct to Zhuangqiao Railway Station where it turns south, crosses Yaojiang River and reaches Ningbo Railway Station. Then Line 4 goes along Changchun Road, Xingning Road until it reaches Canghai Road and become north-south again. After reaching Shounan Road it turns into southeast direction and reaches Dongqian Lake, its destination.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690449","title":"Conus spiceri","body":"\nConus spiceri\n\nConus spiceri is a species of sea snail, a marine gastropod mollusk in the family Conidae, the cone snails, cone shells or cones.\nThese snails are predatory and venomous. They are capable of \"stinging\" humans.\nDescription.\nThe size of the shell varies between 45 mm and 152 mm.\nDistribution.\nThis marine species occurs in the Pacific Ocean off Hawaii and Midway.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690456","title":"Hypena namaqualis","body":"\nHypena namaqualis\n\nHypena namaqualis is a moth of the Erebidae family. It was described by Guenée in 1854. It is found in South Africa.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690466","title":"New Zealand NBL All-Star Five","body":"\nNew Zealand NBL All-Star Five\n\nThe National Basketball League All-Star Five is an annual National Basketball League (NBL) honour bestowed on the five best players in the league following every NBL season. The five-player team has been selected in every season of the league's existence, dating back to its inaugural season in 1982.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690476","title":"Self-portrait with a sunflower","body":"\nSelf-portrait with a sunflower\n\nSelf-portrait with a sunflower is a 1632–33 self-portrait by Anthony van Dyck. It is now in the private collection of the Duke of Westminster.\nIt was produced at the height of his fame, while he was 'principal Paynter in order to their Majesties' at the court of Charles I of England, who also knighted him. He wears the gold chain given to him by Charles and holds a large sunflower, whose symbolism is much debated.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690487","title":"James Birley","body":"\nJames Birley\n\nJames \"Jim\" Birley (1928-2013) of the Maudsley Hospital, London, was president of the Royal College of Psychiatrists from 1987 to 1990.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690501","title":"2016 NCAA Division I Baseball Tournament","body":"\n2016 NCAA Division I Baseball Tournament\n\nThe 2016 NCAA Division I Baseball Tournament will begin on Friday, June 3, 2016 as part of the 2016 NCAA Division I baseball season. The 64 team double elimination tournament will conclude with the 2016 College World Series in Omaha, Nebraska, starting on June 18 and ending on June 29.\nThe 64 participating NCAA Division I college baseball teams will be selected out of an eligible 298 teams. Thirty-one teams will be awarded an automatic bid as champions of their conferences, and 33 teams will be selected at-large by the NCAA Division I Baseball Committee.\nTeams will be divided into sixteen regionals of four teams, which will conduct a double-elimination tournament. Regional champions will then face each other in Super Regionals, a best of three game series to determine the eight participants of the College World Series.\nCollege World Series.\nThe College World Series will be held at TD Ameritrade Park in Omaha, Nebraska.\nBracket.\n\"Seeds listed below indicate national seeds only\"\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690522","title":"Nigel Ogden","body":"\nNigel Ogden\n\nNigel Ogden is a British theatre organist, known for presenting and performing on the BBC Radio 2 programme \"The Organist Entertains\" for over 35 years.\nOgden was born in Manchester, England, the son of a church organist, and had several years of piano lessons, before taking up the organ at the age of twelve. As a child, his family took him to Blackpool Tower Ballroom to hear performances on the Wurlitzer organ there, by Reginald Dixon.\nHe studied to be a teacher, then worked as a sales demonstrator for an organ retail business in Hyde, Cheshire, where he later started his own business selling organs. From 1972, he started appearing on \"The Organist Entertains\", eventually taking over from Robin Richmond as presenter in March 1980.\nOgden is also a composer and a touring musician, playing both theatre and church organs, and was the organist for the Channel 4 production of Denis Potter's \"Lipstick on Your Collar\".\nHe has released a number of CDs.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690525","title":"Patrick Montgomery","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48690541","title":"Green River Crib Dam","body":"\nGreen River Crib Dam\n\nThe Green River Crib Dam is a historic 19th-century dam on the Green River in western Guilford, Vermont. Built about 1811, it is a reminder of the modest industrial enterprises once conducted in the area using the water power it provided, and is one of the state's few surviving crib dams. It was listed on the National Register of Historic Places in 1995.\nDescription and history.\nThe dam is located in far western Guilford, upstream of the Green River Covered Bridge, which spans the Green River at the junction of Green River Road with Jacksonville Stage Road. The dam is about long, with a maximum height of , and spans the river in a semicircle open to the downstream side. The material of the dam mostly logs and rubble, with plank facing. The abutments of the dam are now a combination of stone and concrete, the wing wall on the east side extending downstream toward the bridge, where it formed part of the foundation of a now-destroyed mill.\nThe earliest recorded documentation of a dam on this site dates to 1811, when Jonah Cutting is known to have a paper and linseed oil mill operating at the site. Some of the materials of the present dam may well date to this period. By 1856 the mill is only documented as being used for paper production. In 1869 a major flood apparently damaged the mill beyond repair, and it may also have damaged the dam; it washed out the bridge then standing just downstream. In 1871 Henry Stowe erected a lumber and grist mill on the site, which operated until 1918, when it was destroyed by fire. The dam has since then been maintained by private owners, forming a picturesque part of the small Green River village and a reminder of its modest industrial past.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690544","title":"PS Mayflower (1866)","body":"\nPS Mayflower (1866)\n\nPS \"Mayflower\" was a passenger vessel built for the Solent Steam Packet Company in 1866.\nHistory.\nShe was built by Marshall Brothers in Newcastle and launched in 1866 and was used to expand the company services, offering a daily passage between Lymington and Portsmouth. \nShe was acquired by the London and South Western Railway in 1884.\nIn 1905 she was acquired by Joseph Constant in London and registered in Southampton. She was broken up in 1912.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690550","title":"Lupton, Alabama","body":"\nLupton, Alabama\n\nLupton is an unincorporated community in Walker County, Alabama, United States. Lupton is located along Alabama State Route 5 northwest of Jasper.\nHistory.\nLupton is home to Lupton School, an elementary/middle school that is part of the Walker County Board of Education.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690551","title":"Andrew Sims (psychiatrist)","body":"\nAndrew Sims (psychiatrist)\n\nAndrew Sims of St James's Hospital, Leeds, was president of the Royal College of Psychiatrists from 1990 to 1993.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690561","title":"Guillermo Dietrich","body":"\nGuillermo Dietrich\n\nGuillermo Dietrich is an Argentine politician. He has worked as subsecretary of mass transit in Buenos Aires, under Mauricio Macri. He has worked in the Metrobus. Macri was elected president in 2015 and appointed him minister of Transport. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690582","title":"Phoenix Gleitschirmantriebe","body":"\nPhoenix Gleitschirmantriebe\n\nPhoenix Gleitschirmantriebe () was a German aircraft manufacturer based in Würselen. The company specialized in the design and manufacture of paramotors in the form of ready-to-fly aircraft for the US FAR 103 Ultralight Vehicles rules and for the European Fédération Aéronautique Internationale microlight category.\nThe company seems to have been founded in the early 2000s and gone out of business about 2008.\nThe company produced the Phoenix Skywalker line of paramotors, powered by the Solo 210 and the Hirth F-33 engines. The aircraft was noted for the use of a paddle-bladed diameter four-bladed composite propeller, which allowed the design of a smaller cage assembly which improved ground transport portability and handling on take-off and landing.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690591","title":"John Cox (psychiatrist)","body":"\nJohn Cox (psychiatrist)\n\nJohn Cox of the North Staffs Hospital Centre, Stoke-on-Trent, was president of the Royal College of Psychiatrists from 1999 to 2002.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690607","title":"Mike Shooter","body":"\nMike Shooter\n\nMike Shooter of Nevill Hall Hospital, Abergavenny, was president of the Royal College of Psychiatrists from 2002 to 2005.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690618","title":"Proteas Voulas B.C.","body":"\nProteas Voulas B.C.\n\nProteas Voulas is a Greek basketball club based in Voula, Athens. It was founded in 1980. Proteas has both men's and women's team which play in Greek national divisions. The women's team plays in A1 Ethniki Women (first-tier) and the men's team plays in Greek C Basketball League (fourth-tier). The team's colours are blue and red and the home stadium of the club is the Voulas Indoor Hall.\nWomen's team.\nProteas Voulas has won a Greek cup, in season 2012-13. That year, the club played in A2 Ethniki, so Proteas became the first club in Greece which won a Greek cup whereas it was playing in lower division. At the same year, Proteas promoted to A1 Ethniki and since then it plays in first-tier of championship.\nMen's team.\nSince 2015-16 season, the men's team of Proteas Voulas plays in Greek C Basketball League (fourth-tier).\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690624","title":"Khosro Agha hammam","body":"\nKhosro Agha hammam\n\nThe Khosro Agha hammam was a historical hammam in Iran. It was located in the Sepah street in Isfahan and belonged to the Safavid era.\nIts dressing room was changed to a store in 1975 and was damaged heavily, but then it was repaired. After a while, the extension of Ostandari street (Now: Hakim street) was decided, but because of passing of the street from the hammam, this project was canceled. In 1979, some of neighborhood residents rumored that vice and harlotry took place in the hammam and the hammam should be destroyed. Their motive for this rumor was that they wanted the new street to be constructed and consequently the costs of their estates to be increased. Finally in 1980 a bomb exploded in the hammam and only some columns remained from Garmkhaneh (hothouse).\nIn 1992, the supreme council of the city planning disapproved the construction of a new street because of the location of the hammam in the neighborhood. Finally on 12 April 1995 at 2 o'clock in the midnight some unidentified people attacked the Khosro Agha hammam and after that they made the guard unconscious, they destroyed completely this historical structure and stole its unique stone trough.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690631","title":"One Day International matches results (1970–79)","body":"\nOne Day International matches results (1970–79)\n\nThe following tables provided the complete summary of One Day Internationals held between 1970-79.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690659","title":"ALO (artist)","body":"\nALO (artist)\n\nALO is an Italian artist born in Ancona in 1981. He studied at the faculty of Industrial Design in Florence where he attended a fine art and drawing course. In the early stage of his career, ALO's oil paintings focused on female portraiture and on the representation of human loss and defeat which will become the landmark subject of his \"losers\" series. After few months, ALO decided to continue his activity working as a self-taught artist. This formation period led him to define his current style based on linear intersections and strong chromatic contrasts. Four years later ALO went back to his native city, Perugia, for his very first solo exhibition \"The underdogs show\". Influenced by the street art world, ALO decided to reproduce his indoor techniques in the outdoor spaces and started travelling around Europe, in particular to Rome, Milan, Berlin and then to Paris and London, the cities that offered him the biggest \"open air canvas\". ALO is currently based in London, where he had his first major solo show \"Hail to the loser\" at Saatchi Gallery, with which he started a continuous collaboration.\nUrban Expressionism.\nFascinated by the French and German Expressionism of the beginning of the 20th century, ALO chose the oil painting as the medium of his early artistic production.\nSome of the aspects of his most recent pieces, such as the strong chromaticism and the stylized human figures, can be already seen in his very first body of work and they are inspired by the sharp, essential lines typical of the African art.\nALO's style became the more and more refined and the use of the acrylic paint in his works is now predominant. 
ALO's portraits are the result of his deep study of the human figure, they show the artist's personal ideal of beauty and elegance together with his ability to understand and represent the complexity of the female nature.\nInspired by a variety of artists, from Cezanne and Van Gogh to Kirchner and Picasso, ALO portrays people at the corners of the city streets, at the margins of society. His curious and open approach led him to the urban art world. ALO represents his emotional vision of the reality and transforms his characters into graceful figures full of elegance and solemnity.\nALO brings the classic portraiture genre to the urban outdoor setting, taking distance from the predominant pop influences of the street art style. His characters are framed by colorful backgrounds, an important element that defines the emotional energy of the artwork and strengthen the idea of \"street painting\". ALO describes his own art as \"urban expressionism\".\nPress.\nRNext, La Repubblica degli Innovatori \nInspiring City, Italian street artist ALO prepares for his solo show ‘HAIL TO THE LOSER’ at the Saatchi Gallery \nComplex, 25 Shoreditch Street Artists You Need to Know \nCombustus, Alo Street Artist, East London and Italy \nArtribune, Dalle strade a Saatchi. Per Alo “è accaduto tutto molto in fretta \nArt exhibitions.\n2015 – \"Pop the Streets\", Saatchi Gallery, London\n2014 – \"Hail to the loser\", Saatchi Gallery, London\n2014 – \"Project M/6\", Urban Nation, Berlin\n2014 – \"Collicola On the Wall\", Palazzo Collicola, Spoleto (Italy)\n2013 – \"Spectrum\", Stolen Space Gallery, London\n2013 – \"Winter group show\", Stolen Space Gallery, London\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690667","title":"Pablo Avelluto","body":"\nPablo Avelluto\n\nPablo Avelluto is an Argentine journalist. He was appointed Minister of Culture by Mauricio Macri. He closed the Manuel Dorrego national institute.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690684","title":"Sinderen","body":"\nSinderen\n\nSinderen is a village in the municipality Oude IJsselstreek in the Dutch province Gelderland. It used to be on the border of the former municipalities Gendringen and Wisch. The village is situated on a junction between Varsseveld (north), Dinxperlo (south) and Gendringen (south west).\nThere used to be a Castle in Sinderen. The only thing reminding this is the Antonius Chapel. The meadow in from of the farm \"D'n Huusboer\" is surrounded by an old canal and basements of the castle are also to be found here. To the north of the village, a reformated church was built between 1884 and 1887. It nowadays is a Protestant church, and it's called the Keurhorster Church.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690701","title":"Carmarthenshire County Council election, 1961","body":"\nCarmarthenshire County Council election, 1961\n\nAn election to the Carmarthenshire County Council was held in April 1961. It was preceded by the 1958 election and followed, by the 1964 election.\nOverview of the result.\nA close run election resulted in Labour increasing its majority by two after capturing an additional two seats. In addition, Labour took the majority of the aldermanic vacancies.\nBoundary changes.\nThere were no boundary changes at this election.\nRetiring aldermen.\nThe aldermen who retired at the election were ...\nA number of retiring councilors stood down to allow retiring aldermen to be returned unopposed. These included D.T. Williams at Llangadog, who stood down in favour of Gwynfor Evans.\nUnopposed returns.\n39 members were returned unopposed, including six of the nine members in Llanelli town.\nContested elections.\n20 contests took place.\nSummary of results.\nThis section summarises the detailed results which are noted in the following sections.\nThis table summarises the result of the elections in all wards. 59 councillors were elected.\nWard results.\nLlanon.\nLabour had lost this ward in a by-election.\nElection of aldermen.\nIn addition to the 59 councillors the council consisted of 19 county aldermen. Aldermen were elected by the council, and served a six-year term. Following the elections, the majority of the aldermanic setas were taken by Labour.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690707","title":"Massachusetts Woman Suffrage Association","body":"\nMassachusetts Woman Suffrage Association\n\nThe Massachusetts Woman Suffrage Association (MWSA) was an American organization devoted to women's suffrage in Massachusetts. It was active from 1870 to 1919.\nHistory.\nThe MWSA was founded in 1870 by suffrage activists Julia Ward Howe, Lucy Stone, Henry Browne Blackwell, and others. It was affiliated initially with the national American Woman Suffrage Association, which had been founded the previous year, and later became a chapter of the National American Woman Suffrage Association (NAWSA). One of its own affiliates was the Cambridge Political Equality Association.\nThe MWSA lobbied for women to get the vote and the right to be officials of civic organizations such as school boards, educated people about women's rights, organized public demonstrations such as rallies and parades, and coordinated with suffrage associations in other states. Among the people active in the MWSA were physician Martha Ripley, social activist Angelina Grimké, reformer Ednah Dow Littlehale Cheney, and suffragist Susan Walker Fitzgerald.\nIn 1892, the recent merger of several national suffrage associations and other factors prompted Alice Stone Blackwell and Ellen Battelle Dietrick to write a new constitution for the MWSA that would expand its capacities and funding base (e.g. by making it possible for the MWSA to receive bequests). The new MWSA was incorporated in December of that year. A decade later, in 1901, it merged with a smaller Massachusetts suffrage organization, the National Suffrage Association of Massachusetts. 
By 1915, the MWSA had over 58,000 members.\nBetween 1904 and 1915, the MWSA was headquartered at 6 Marlborough Street in Boston's Back Bay, afterwards the headquarters of the Women's Municipal League of Boston and then the home of physician Louis Agassiz Shaw, Jr.\nIn 1920, after the passage of the 19th Amendment to the Constitution gave women the vote, the MWSA became the Massachusetts League of Women Voters.\nRecords pertaining to the history of the MWSA are held by Radcliffe College's Schlesinger Library.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690708","title":"Clasado","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48690779","title":"Orphulella speciosa","body":"\nOrphulella speciosa\n\nOrphulella speciosa is commonly known as the slant-faced pasture grasshopper.\nDistribution and habitat.\n\"Orphulella speciosa\" occurs east of the Rocky Mountain region all the way to the Coast of the Atlantic. It also occurs in the southern region of Canada and in the northern region of Mexico. \"O. speciosa\" inhabits areas of tallgrass and mixed grass prairies, often preferring areas of shorter grass that are interspersed throughout the prairie plant matrix, including grasses that have been grazed upon by larger animals.\nAt the southern end of the range (e.g., in Texas), adult \"O. speciosa\" are most abundant during August to October, with fewer adults present from May to December. In the northern extent of its range (e.g., New England) adult \"O. speciosa\" are most abundant during the months of July and August.\nIdentification.\n\"Orphulella speciosa\" has a very slanted face. The margins of the vertex of the head (the top of the head, located between the eyes) are less raised. The foveola (a small dent in the integument) is not distinct. The pronotum disks are found at the top of the first thoracic segment and are almost equivalent in width in the front and back. The principal sulcus on the pronotum, which is a ridge that cuts the middle of the outer integument, cuts the pronotum disk a little past the middle. The tegmina (the leathery, slender forewings extend to the end of the hind femora, and curve in towards the apex. The males' hind femora often vary in size from 1.5 mm to 3mm from the end of the femora. \"O. speciosa\" are sexually dimorphic; the females are much larger than the males. Female body sizes range from 16-21.5 mm with antennae that are 5-6mm long, tegmina that are 9-16mm long, and hind femora that are 9.5–12 mm long. 
Males range from 13-14mm in total length with antennae 4.5-6.5mm in length, tegmina, 101–13 mm in length, and hind femora are 8.5–10 mm in length. On lower end of the lateral lobes (the vertical sides of the pronotum of the males, there is a pale curved line. \"O. speciosa\" individuals exhibit much variation in color, especially combinations of green and brown. Females are often light green with a dark coloration on the vertex of the head. Females are occasionally brown and have a line on the sides of the pronotum. \n\"O. speciosa\" looks very similar to a related species in the same genus, \"O. pelidna\". These two species can be identified from one another by looking at the fastigium (the part of the head that is located in between the eyes of the grasshoppers and their size. \"O.speciosa\" has a small median ridge on the fastigium and is much smaller than \"O. pelidna\". \"O. pelidna\" has a semicircular indentation that is set farther back than on \"O. speciosa\", and \"O. pelidna\" has a lateral carinae that is incised twice.\nNymphal development.\nLike all grasshoppers, nymphs of \"O. speciosa\" have incomplete metamorphosis: their nymphs are born looking similar to the adults, and they go through five instar stages (4 different molting events) until they reach the adult stage. First and second instars have patterns of green on their heads; however, the antennae are terminally expanded (they grow from the head outwards) . Second instars have antennae that are flat and are pointed at the end. The hind femora of the first and second instars appear tan and they have a green thorax. Instars II to V have filiform, or threadlike, antennae. Third and fourth instars have tan, brown, green, and gray body color patterns, and their hind femora appear fuscous (brownish-gray) .\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690796","title":"Beloved Hymns","body":"\nBeloved Hymns\n\nBeloved Hymns is a studio album by Bing Crosby released in 1951 featuring eight hymns recorded with the Ken Darby Choir and organ accompaniment on May 6, 1949.\nReception.\nCrosby researcher Fred Reynolds said of the recording session at which all eight hymns were recorded that “They were all sung devoutly without any pretence of “performance”, but nevertheless gave added support to Martin Luther’s dictum that the devil should not have all the best tunes.” \n\"Billboard\" reviewed some of the individual songs released as 78 rpm records.\n\"What a Friend We Have In Jesus\" - Choir and organ support Bing ably as he delivers a beautiful hymn simply, straightforwardly and with deep warmth. \n\"He Leadeth Me\" - Bing does this hymn with eminent strength and full affection for the chore. Should make for big sales in a quiet way for this Decca Faith disking. \n\"O Lord, I Am Not Worthy\" - Bing rarely has sung better and with more feeling than he shows on this hymnal selection.\nAlbum releases.\nThe songs were featured on a 10” vinyl LP numbered DL 5351 and in a 4-disc 45rpm box set numbered 9-258. \nLP track listing.\nSide 1\nSide 2\nReferences.\n \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690797","title":"Germany women's national under-17 basketball team","body":"\nGermany women's national under-17 basketball team\n\nThe Germany women's national under-16 and under-17 basketball team, is controlled by the German Basketball Federation (), abbreviated as DBB, and represents Germany in international women's under-16 and under-17 (under age 16 and under age 17) basketball competitions. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690813","title":"Colonus (spider)","body":"\nColonus (spider)\n\nColonus is a spider genus of the Salticidae family (jumping spiders). \"Colonus\" species are endemic to North and South America, ranging from New York to Argentina. All members of the genus have two pairs of bulbous spines on the ventral side of the ﬁrst tibiae. The function of these spines is unknown. \"Colonus\" was declared a junior synonym of \"Thiodina\" by Eugène Simon in 1903, but this was reversed by Bustamante, Maddison, and Ruiz in 2015.\nSpecies.\n, the World Spider Catalog accepted 14 species of \"Colonus\":\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690831","title":"Manchester, Alabama","body":"\nManchester, Alabama\n\nManchester is an unincorporated community in Walker County, Alabama, United States. Manchester is located along Alabama State Route 195 north-northeast of Jasper.\nHistory.\nManchester was founded as a lumber center. The Manchester Lumber Company owned a large amount of the surrounding timber land and built a school and Baptist church for the community. Much of the lumber produced in Manchester was used to make flatboats, which were used to transport coal. For a short time, the Manchester Coal Company mined coal in the area.\nA post office operated under the name Manchester from 1907 to 1957.\nIn popular culture.\nManchester is listed as the hometown of the comic book superhero Impulse.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690832","title":"PS Solent (1863)","body":"\nPS Solent (1863)\n\nPS \"Solent\" was a passenger vessel built for the Solent Steam Packet Company in 1863.\nHistory.\nShe was built by George Inman of Lymington and launched on 1 May 1863. She went to Southampton in June 1863 for the fitting of her engines by J. Hodgkinson. She undertook her trial trip on 29 October 1863 from Lymington to Stokes Bay. \nShe was acquired by the London and South Western Railway in 1884.\nShe was disposed of around 1901.\nReferences.\n \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690837","title":"Raja Mohammad","body":"\nRaja Mohammad\n\nRaja Mohammad is an Indian film editor, who works in the Malayalam and Tamil film industries.\nCareer.\nRaja Mohammed primarily edited Malayalam films during his early career and his first Tamil venture was through Kamal Haasan's production, \"Nala Damayanthi\" (2003). For his 20th film, Raja Mohammad won the National Film Award for Best Editing for his work in \"Paruthiveeran\" (2007), with the honour fetching him further opportunities to work on film projects in the Tamil film industry. He also won the Vijay Award for Best Editor for his work in M. Sasikumar's directorial debut, the period film, \"Subramaniapuram\" (2008).\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690853","title":"Coming Home (Sasha song)","body":"\nComing Home (Sasha song)\n\n\"Coming Home'\" is a song by German recording artist Sasha. It was written and produced by Sasha along with Robin Grubert and Alexander Zuckowski for his first compilation album \"Greatest Hits\" (2006). Released as the album's lead single, it reached the top ten of the German Singles Chart.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690855","title":"Muhammad ibn Ishaq ibn Ibrahim","body":"\nMuhammad ibn Ishaq ibn Ibrahim\n\nMuhammad ibn Ishaq ibn Ibrahim (died June 851) was a Mus'abid governor of Baghdad for the Abbasid Caliphate, from 850 until his death.\nCareer.\nMuhammad was the son of Ishaq ibn Ibrahim al-Mus'abi, a member of a collateral branch of the Tahirid family and the head of security (\"shurtah\") in Baghdad from 822 to 850. During his father's lifetime Muhammad had been sent to attend the court of the caliph in Samarra, where he entered into the service of the central government and acted as Ishaq's representative.\nUpon the death of Ishaq in July 850, Muhammad succeeded him as chief of security of Baghdad; at the same time, by delivering the valuables in Ishaq's storehouses to the caliph al-Mutawakkil and his heirs al-Muntasir and al-Mu'tazz, he secured their favor and was given control over al-Yamamah, al-Bahrayn, Egypt and the Mecca Road as a reward. He also received Fars, but this appointment forced him to deal with that province's governor, his uncle Muhammad ibn Ibrahim al-Mus'abi, who adopted a hostile attitude toward him. In response, Muhammad deposed his uncle from his governorship and procured his murder, and appointed his cousin al-Husayn ibn Isma'il al-Mus'abi to govern Fars instead.\nMuhammad died in June 851, after which his positions in Baghdad and the Sawad were assigned to 'Abdallah ibn Ishaq ibn Ibrahim.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690858","title":"Avraham Stern (politician)","body":"\nAvraham Stern (politician)\n\nAvraham Stern (30 October 1935 – 12 May 1997) was an Israeli administrator and politician. He served as a member of the Knesset for the National Religious Party (Mafdal) between 1996 and 1997. \nStern was born in Haifa and obtained a B.A. He was Secretary General of the Bnei Akiva youth movement, Political Secretary of the Religious Kibbutz Movement, and also Deputy Chairman of the National Religious Party bureau.\nAfter the general elections of 1996 he entered the 14th Knesset. He was a member from 17 June 1996 till his death on 12 May 1997 and was replaced by Nissan Slomiansky.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690859","title":"Juan José Aranguren","body":"\nJuan José Aranguren\n\nJuan José Aranguren is an Argentine businessman. \nBiography.\nAranguren was born in the Entre Ríos Province, and became a chemical engineer at the University of Buenos Aires. He joined Shell Argentina in 1979, and was an executive there from 1997 to 2015. He opposed the administration of president Néstor Kirchner, and won several cases against the state over state-controlled prices. \nHe was appointed minister of energy by Mauricio Macri in 2015. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690875","title":"Demonstration 95","body":"\nDemonstration 95\n\nDemonstration 95 is the first demo by Norwegian neofolk band Naervaer, issued in 1995 independently. The demo was mixed by Bjørn Harstad and Hans K. Eidskard. It was recorded in Jailhouse Studios summer, autumn and winter 1995.\nTrack listing.\nTracks ending with * later appear on the EP Naervaer, issued in 1997.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690895","title":"Francis Chalmers Crawford","body":"\nFrancis Chalmers Crawford\n\nFrancis Chalmers Crawford FRSE (1851-1908) was a Scottish stockbroker of fame as an amateur botanist and ornithologist. \"Saxifraga crawfordii\" is named after him. He served as President of the Scottish Microscopical Society.\nHe was an avid collector of plant species, especially Bryophytes and Spermatophytes, notably in Perthshire and Orkney but representing almost all areas of the United Kingdom. He often worked in partnership with Harold Stuart Thompson. He also collected in Hungary, Switzerland and Sweden with his friend John Hutton Balfour, many of his specimens being in the Natural History Museum, London.\nLife.\nHe was born in North Berwick on 24 August 1851, the son of Adam Howden Crawford (1804-1882) of the Honourable East India Company, and his wife Margaret Buchan Chalmers (1821-1898).\nHe attended Edinburgh Academy 1863-68 and then trained as a stockbroker.\nHe retired in 1896 and began to focus fully on his botanical interests. In 1897 he became a Fellow of the Botanical Society of Edinburgh and demonstrated Botany at an academic level at the Royal Botanic Garden Edinburgh.\nIn 1898 he was elected a Fellow of the Royal Society of Edinburgh. His proposers were Ramsay Heatley Traquair, Sir Isaac Bayley Balfour, James Geikie and John Chiene.\nIn his final years he lived at 19 Royal Terrace, an impressive Georgian townhouse designed by William Henry Playfair on Calton Hill.\nHe died on 9 February 1908. He is buried with his parents and sister near the centre of the original north 19th century extension to Dean Cemetery in western Edinburgh beneath a Celtic cross.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690899","title":"The Man who Put the Germ in Germany","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48690911","title":"Saragossa, Alabama","body":"\nSaragossa, Alabama\n\nSaragossa is an unincorporated community in Walker County, Alabama, United States.\nHistory.\nSaragossa is likely named for the Zaragoza province of Spain. A post office operated under the name Saragossa from 1890 to 1967.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690922","title":"Lucky Day (Sasha song)","body":"\nLucky Day (Sasha song)\n\n\"Lucky Day\" is a song by German recording artist Sasha. It was written and produced by Sasha along with Robin Grubert and Alexander Zuckowski for his first compilation album \"Greatest Hits\" (2006). Released as the album's second single, it reached the top twenty of the Austrian and the German Singles Chart.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690930","title":"Community Care","body":"\nCommunity Care\n\nCommunity Care is a British trade magazine for the social care industry published by Reed Business Information Ltd.\nThe magazine is now entirely online, but until 2011 was a weekly publication with a circulation of 32,000, though less than 4000 were paid for. The last issue of its print edition appeared on 24 November 2011. It has a strong position in the jobs market for social workers, claiming up to 3,000 social care jobs are advertised each week.\nIt runs an annual two day conference and exhibition under the title Community Care Live.\nThe magazine won the PPA Business and Professional Magazine of the Year Award in 2003.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690931","title":"Thirumuruganatheeswar Temple","body":"\nThirumuruganatheeswar Temple\n\nThirumuruganatheeswarar Temple (also called Thirumuruganpoondi temple) in Thirumuruganpoondi, a panchayat town in Tiruppur district in the South Indian state of Tamil Nadu, is dedicated to the Hindu god Shiva. Constructed in the Dravidian style of architecture, the present structure of the temple is believed to have been built during the Kongu Cholas period in the 10th century. Shiva is worshipped as Thirumuruganatheeswarar and his consort Parvathi as Avudainayagi.\nThe presiding deity is revered in the 7th century Tamil Saiva canonical work, the \"Tevaram\", written by Tamil saint poets known as the Nayanmars and classified as \"Paadal Petra Sthalam\". A granite wall surrounds the temple, enclosing all its shrines. The temple does not have a rajagopuram, the gateway tower, a common feature in South Indian temples.\nThe temple is open from 5:30 am – 12:45 pm and 3:30 - 8:15 pm on all days. Four daily rituals and many yearly festivals are held at the temple, of which the Brahmotsavam celebrated during the Tamil month of \"Maasi\" (February - March) for Sundarar and Mahashivaratri festival being the most prominent. The temple is maintained and administered by the Hindu Religious and Endowment Board of the Government of Tamil Nadu.\nLegend.\nSundarar is a famous Saivite saint and Nayanmar belonging to the 8th century. He has revered many Shiva temples in South India in his verses compiled as the Seventh \"Thirumurai\". As per Hindu legend, while arriving at this place, he took rest in a Vinayaka temple. He presumably forgot to get thoughts about Shiva and to test his devotion, Shiva sent his Bhutaganas to steal all his possessions. Sundarar prayed to Vinayaka in the temple who showed him to proceed towards the East. Sundarar, in his anger, sang about Shiva blaming him of not protecting his possessions. 
Shiva graced him with his presence at this place and restored all his possessions. Murugan killed the demon king Surapadma at the behest of the Devas. He incurred Brahmahatti Dosha for slaying the demon into two pieces. Muruga is believed to have dug a spring with his Vel, the spear and worshipped Shiva at this place. Since Muruga worshipped his father Shiva, the presiding deity came to be known as Muruganathaswamy.\nArchitecture.\nThe temple is believed to have been built by the Kongu Cholars, with 68 recorded inscriptions from the king Vikrama Chola I seen on the walls of the sanctum and around the precinct. \nThirumuruganatheeswarar temple is located in Thirumuruganpoondi, a village located from Tiruppur on the Tiruppur- Avinasi road. The temple does not have \"rajagopuram\" as in other South Indian temples. All the shrines are housed in a rectangular enclosure measuring . The sanctum houses the image of Thirumuruganatheeswarar in the form of Lingam, an iconic form of Shiva facing West. There is an Ardha Mandap and a Mukha mandap, pillared halls leading to the sanctum. There is a shrine of Muruga facing South, towards the Shiva shrine. Since Muruga is believed to have used his weapon, the Vel, to dig the spring, he is seen without his weapon in the shrine, nor his vehicle peacock. The first precinct has the images of Vinayakar, Durga, Dakshinamurthy and Chandikeswara. The shrine of Avudainayagi is seen in the first precinct facing west. There are sculptural depictions of Sundarar on the walls showing him in three different emotions of anger, humiliation and happiness. There is a hall of Nataraja called Adavallan Sabha. There are three temple tanks associated with the temple - Shanmugha Theertham, Gnana Theertham and Brahmatheertham. There are images of Kalabhairavar and Lingothbhavar, which are considered architectural specimens of the Kongu Cholars.\nCulture.\nThe temple follows Saivite tradition. 
The temple priests perform the \"pooja\" (rituals) during festivals and on a daily basis. The temple rituals are performed four times a day: \"Ushakalam\" at 6:00 a.m., \"Kalasanthi\" at 8:00 a.m., \"Uchikalam\" at 12:00 p.m., and \"Sayaratchai\" at 5:00 p.m. Each ritual has three steps: \"alangaram\" (decoration), \"neivethanam\" (food offering) and \"deepa aradanai\" (waving of lamps) for both Thirumuruganatheeswarar and Avudainayagi. There are weekly, monthly and fortnightly rituals performed in the temple. The temple is open from 5:30 am – 12:45 pm and 3:30 - 8:15 pm.\nBrahmotsavam celebrated during the Tamil month of \"Maasi\" (February - March) for Sundarar and Mahashivaratri festival being the most prominent. There are other common festivals like Thaipoosam, Annabhishekam, Kanthasashti and Karthigai Deepam celebrated in the temple.\nSundarar, an 8th-century Tamil \"Saivite\" poet, venerated Thirumuruganatheeswarar in ten verses in \"Tevaram\", compiled as the \"Seventh Tirumurai\". As the temple is revered in \"Tevaram\", it is classified as \"Paadal Petra Sthalam\", one of the 276 temples that find mention in the Saiva canon. Out of the 276 temples that are revered by the three saints, Sundarar has exclusively visited 25 temples with this temple counting as one of them. Of the five thandavams performed by Shiva in different places, this place is counted as the one where he performed the Brahma Thandavam In modern times, the temple is maintained and administered by the Hindu Religious and Endowment Board of the Government of Tamil Nadu.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690942","title":"Germán Garavano","body":"\nGermán Garavano\n\nGermán Garavano is an Argentine politician. He has worked in the Council of Magistrates of Buenos Aires, and the Council of Magistrates of the Nation since 2014. He wrote 15 books about laws. He was appointed minister of Justice by Mauricio Macri in 2015. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690949","title":"Woman in the Dark (1952 film)","body":"\nWoman in the Dark (1952 film)\n\nWoman in the Dark is a 1952 American crime film directed by George Blair and written by Albert DeMond. The film stars Penny Edwards, Ross Elliott, Rick Vallin, Richard Benedict, Argentina Brunetti and Martin Garralaga. The film was released on November 15, 1952, by Republic Pictures.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690958","title":"Germany women's national 3x3 team","body":"\nGermany women's national 3x3 team\n\nThe Germany women's national 3x3 team is a national basketball team of Germany, governed by Deutscher Basketball Bund (DBB).\nIt represents the country in international 3x3 (3 against 3) women's basketball competitions.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690964","title":"The Temptation of Innocence","body":"\nThe Temptation of Innocence\n\nThe Temptation of Innocence: Living in the Age of Entitlement is a 1995 book by the French philosopher Pascal Bruckner. Bruckner argues against contemporary trends of applying victimhood, real or imagined, to justify infantilisation, a lack of responsibility or even oppression of others. The book received the Prix Médicis essai. It was published in English in 2000.\nReception.\n\"Publishers Weekly\" wrote:\nBruckner's European education, which he wears lightly; his unpreachy, aphoristic style; and his obvious delight in paradox save this book from the ranks of a tedious diatribe against permissiveness. Citings of Europe's philosophical and literary masters (Rousseau, Hegel, Nietzsche among many others) help Bruckner, who is French (this admirable translation is not, alas, credited), make the case that the modern individual, weakened by responsibilities of freedom too great to bear, finds freedom in weakness itself: the freedom from moral constraint. ... Bruckner should find a ready audience among philosophically inclined readers who bring a skeptical eye to contemporary trends and agree that freedom from responsibility is no freedom at all.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690965","title":"Raja Annamalaipuram","body":"\nRaja Annamalaipuram\n\nRaja Annamalaipuram, known in short as R. A. Puram, is a neighbourhood of Chennai, India. Named after banker and philanthropist, S. Rm. M. Annamalai Chettiar who owned most of the property at one time, Raja Annamalaipuram extends along the northern banks of the Adyar River from Saidapet to the Bay of Bengal coast.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690967","title":"Fura","body":"\nFura\n\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690969","title":"Four Books for Women","body":"\nFour Books for Women\n\nThe Four Books for Women (\"Nǚ sìshū\") was a collection of material intended for use in the education of young Chinese women. In the late Ming and Qing dynasties, it was a standard text read by the daughters of aristocratic families. The four books had circulated separately and were combined by the publishing house Duowen Tang in 1624.\nThe four books are \"Admonitions for Women\" (\"Nǚjiè\") by Ban Zhao, \"Women's Analects\" (\"Nǚ lúnyǔ\") by Song Ruoxin and Song Ruozhou, \"Domestic Lessons\" (\"Nèixùn\") by Empress Xu, and \"Sketch of a Model for Women\" (\"Nüfan jielu\") by Lady Liu.\nIn \"Admonitions\", Ban Zhou, China's foremost female scholar, expounds on general principles and philosophical points. In \"Women's Analects\", the Songs illustrate these principles with practical examples relevant to everyday life.\nIn \"Model for Women\", Lady Liu retells the inspiring tales of various women in Chinese history. There are example of every kind of famous women from every period. Aside from Ban Zhao, there is also Liang Hongyu, who beat war drums in battle to encourage her husband, a Song dynasty general. Scholarship and sacrifice for nation and family are extolled.\nBan Zhao's book was the most widely read of the four. She wrote that a woman should practice \"reverent submission\", respect for the three obediences and four virtues, and \"set her husband on a par with Heaven.\" Ban Zhao compared marriage to the Dao, with the husband as the yin and the wife as the yang. This is a more romantic view of marriage than anything found in Confucius.\nBan Zhao's life story was more inspiring than her writing. She was a Han dynasty scholar who not only tutored an empress, but also completed an official history begun by her brother. 
Reformers in the sixteenth and seventeenth centuries often cited her to make the case for female education.\nThe Four Books explicitly argues for such education. \"There were no wise and chaste women who were not created through education,\" as \"Domestic Lessons\" puts it. Regardless of content, the Four Books were designed to teach women to read, a controversial and progressive idea at the time. All four books were written by accomplished women, a point many editions underline by including biographical sketches and drawings of the authors in scholarly regalia.\nThe \"four books\" of the title alludes to the four books of Neo-Confucianism compiled by Zhu Xi. This was a textbook used by those studying for the Imperial Examinations. Female learning is thus promoted as a realm on the same level as male learning. \"There is no doubt that women read both the \"Four Books for Women\" and the Four Books they were not supposed to read,\" according to modern scholar Dorothy Ko.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690977","title":"Houari Ferhani","body":"\nHouari Ferhani\n\nHouari Ferhani (born February 11, 1993 in Koléa) is an Algerian footballer who plays for Algerian Ligue Professionnelle 1 side JS Kabylie and the Algeria national under-23 team.\nCareer.\nIn October 2015, Ferhani was selected as part of the Algeria's under-23 national team for the 2015 U-23 Africa Cup of Nations in Senegal.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690984","title":"Eben S. Stearns","body":"\nEben S. Stearns\n\nEben S. Stearns (1819-1887) was an American educator. He served as the President of Framingham State University from 1849 to 1855, and as the Chancellor of the University of Nashville and President Peabody Normal School (which later merged with Vanderbilt University) from 1875 to 1887.\nEarly life.\nEben Sperry Stearns was born on December 23, 1819 in Bedford, Massachusetts. His father was a Congregational minister.\nStearns enrolled at Harvard University in 1841, where he received a master of arts degree in 1845. He received a Doctor of Divinity and a Doctor of Laws from other universities.\nCareer.\nStearns began his career as a teacher in an all girls' seminary in Ipswich, Massachusetts. He went on to teach in West Newton, Newburyport, Massachusetts, and Portland, Maine.\nStearns served as the President of Framingham State University from 1849 to 1855. \nStearns served as the Chancellor of the University of Nashville and President of the Peabody Normal School from 1875 to 1887. Under his leadership, the school attendance grew from 13 to 179 students. In 1885, he authored \"Historical Sketch of the Normal College, at Nashville, Tennessee\".\nPersonal life.\nStearns was married, and he had children.\nDeath and legacy.\nStearns died on April 11, 1887 in Nashville, Tennessee. His funeral was held by an Episcopal pastor in Nashville, and he was buried in Bedford, Massachusetts.\nMeanwhile, he was replaced as Chancellor of the University of Nashville and President of the Peabody Normal School by William H. Payne. A year after his death, in 1888, his portrait by Geo Drury was donated to the Peabody Normal College.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690985","title":"The Mute Gods","body":"\nThe Mute Gods\n\nThe Mute Gods are a German and English band uniting Nick Beggs, Marco Minnemann and Roger King. Beggs approached King — with whom he had worked as part of Steve Hackett's band — about a collaboration in 2014, and Minnemann was chosen as the drummer after Beggs had toured with him as part of Steven Wilson's band.\nOrigins and \"Do Nothing till You Hear from Me\".\nTheir first album, \"Do Nothing till You Hear from Me\" is planned for release on 22 January 2016. Beggs wrote the majority of the album on tour in 2014, and has described it as \"a rather disgruntled rant at the dystopia we've created for ourselves and our children\". In addition to Minnemann, the album features some guest drummers, including Nick D'Virgilio and Gary O'Toole. In November 2015, the band released two videos — one of which being a 360 degree video — for the album's title track. According to Nick Beggs, \"Do Nothing till You Hear from Me\" was inspired by Dwight D. Eisenhower's warning about the potential rise of the military–industrial complex, as well as the geologist Phil Schneider, who made several claims regarding UFOs, before dying under mysterious circumstances.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48690997","title":"Winnifred Paskall","body":"\nWinnifred Paskall\n\nWinnifred May Paskall was a missionary who came to India in 1946 through the Canadian Baptist Ministries.\nWinnifred Paskall studied at McMaster University, where she took a graduate degree in arts (B.A.) in 1935. Winnifred came to India in 1946 and served in women's development ministries and also became Principal of the Eva Rose York Bible Training and Technical School for Women in Tuni, Andhra Pradesh.\nOne of the support groups for Winnifred Paskall included the First Baptist Church, Leamington which used to raise money for work in India.\nIn 1978, the Canadian Baptist Ministries presented Paskall with a Service Pin in recognition of her 34 years of missionary service in India.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691000","title":"Rhoda Leonard","body":"\nRhoda Leonard\n\nRhoda Leonard (January 31, 1928 – October 21, 2015) was an infielder and outfielder who played in the All-American Girls Professional Baseball League. Listed at 5' 5\", 115 lb., Leonard batted and threw right handed. She was nicknamed 'Nicky' by her friends and teammates.\nBorn in Somerset, Massachusetts, Leonard attended Somerset High School, where she graduated and later earned Somerset Athletic Hall of Fame honors in 1946. This prompted an invitation to an AAGPBL tryout and she made the grade, but she did not get much of a chance to play in her only season in the league.\nLeonard joined the Fort Wayne Daisies in 1946 and was used sparingly at second base and outfield, collecting a batting average of .095 (2-for-21) in nine game appearances.\nAfter baseball, Leonard married Edmund Linehan and had two children, Mark and Maggie. She then graduated from Bridgewater State University in Bridgewater, Massachusetts in 1950, and after raising her family served for many years as a teacher for the Norwood Public Schools system for a long time. Some of her most cherished teaching moments came during her years of work with students at St. Catherine's School.\nFollowing her retirement, she became an avid golfer and member of the WGAM. She also was awarded a lifetime membership to the Walpole Country Club after serving as their club secretary for several years, while enjoying many years as a lifetime member of the AAGPBL Players Association.\nThe AAGPBL folded in 1954, but there is now a permanent display at the Baseball Hall of Fame and Museum at Cooperstown, New York since November 5, 1988 that honors those who were part of this unique experience. Leonard, along with the rest of the league's girls, is included at the display exhibition.\nNicky Leonard died in 2015 in Norwood, Massachusetts at age 87, following complications from Alzheimer's disease.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691011","title":"Timeline of Le Havre","body":"\nTimeline of Le Havre\n\nThe following is a timeline of the history of the city of Le Havre, France.\nReferences.\n\"This article incorporates information from the French Wikipedia.\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691023","title":"Neurogenesis","body":"\nNeurogenesis\n\nNeurogenesis (birth of neurons) is the process by which neurons are generated from neural stem cells and progenitor cells. It plays a central role in neural development. Neurogenesis is most active during pre-natal development and is responsible for populating the growing brain with neurons. In mammals, adult neurogenesis has been shown to occur in multiple brain structures, including the dentate gyrus of the hippocampus and the olfactory bulb.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691027","title":"Dormer Pramet","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48691056","title":"Adille Sumariwalla","body":"\nAdille Sumariwalla\n\nAdille Sumariwalla (Born January 1, 1958) is an Indian athlete and entrepreneur, popular for representing India at the 1980 Moscow Olympics. Sumariwalla competed as a 100m runner in several international competitions and at the Olympics. Currently he is the president of the athletics federation of India, and was elected as one of the members of council of IAAF at its 50th congress, thus becoming the first Indian to do so. He is also an entrepreneur and owns many media businesses in India, after tenures at some media companies including the American Media Company.\nAthletics.\nSumariwalla has been an athlete since his school days. He had set the men's 200m inter college record, at a mere 22.2 seconds and held it for 35 years, until recently Gaurang Amre broke the record, clocking at 21.7 seconds. He expressed gladness as the record was broken, but at the same time expressed concern over the time taken to break the record, quoting these records should be broken \"every two or three years\". He has won the national title in 100m sprint 11 times. Sumariwalla represented India at the 1980 summer olympics as a hundred-meter sprinter, in which he stood seventh in round one. He has been the Chef-de-Mission for Indian Contigent, for the 2014 Asian Games in Korea. Sumariwalla is of the opinion that there has been great increase in infrastructure for sports by the government in recent years, and has quoted that \"The day is not far when India can expect an Olympics Medal in Athletics\".\nEntrepreneurship.\nApart from athletics, Sumariwalla has been a part of many media businesses and corporations. He started his professional career with Tata Engineering and locomotive co. (now Tata Motors). He worked there for 15 years in various domains, after which he was appointed as the founding CEO of The Asian Age in 1994. 
He has since worked with many other corporations, notably Mid Day Multimedia and Clear Channel. He was responsible for setting up the outdoor division at Mid Day in 1997, which then merged its tasks with Clear Channel. After serving 8 years as chairman and managing director of Clear Channel, he left the company and has since been on the board of Next Media Works and SE TransStadia Ltd. He is also a co-founder of Interspace Communications.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691063","title":"Fura (food)","body":"\nFura (food)\n\nFura are millet dough balls eaten in Nigeria.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691070","title":"SS Vera (1898)","body":"\nSS Vera (1898)\n\nSS \"Vera\" was a passenger vessel built for the London and South Western Railway in 1898.\nHistory.\nShe was built by the Clydebank Engineering and Shipbuilding Company and launched on 4 July 1898 by Mrs Dixon, the wife of the marine superintendent of the London and South Western Railway. She was deployed on services between Southampton, the Channel Islands and the north coast of France. She had accommodation for 80 first-class passengers in cabins, and an additional 80 first-class passengers in Pullman car style state rooms. Provision was also made for 50 second-class passengers in the after-end of the vessel in large cabins. \nOn 15 July 1905 she stranded herself on the Black Rock, at Yarmouth off the Isle of Wight.\nShe was acquired by the Southern Railway in 1923.\nShe was disposed of in 1933.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691101","title":"Strange Music (album)","body":"\nStrange Music (album)\n\nStrange Music is an album by Anton LaVey released in 1994 through Amarillo Records. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691102","title":"Ambitalk","body":"\nAmbitalk\n\nAmbitalk is the UK's largest PAMR radio network. It allows users to make private or \"group\" voice calls between vehicle based mobile units anywhere within its coverage area. It is a Trunked radio system operating in the VHF-Low frequency range and provides coverage in most of the main conurbations of the UK.\nAmbitalk is owned by Maxxwave Ltd and operates using MPT1327 signalling with custom audio enhancements using Digital Signal Processing to give clearer audio quality than is normally available from MPT1327 or DMR/dPMR (which use the AMBE+2 codec).\nThe UK Government has commissioned a UK Spectrum Usage and Demand report through the UK Spectrum Policy Forum (run by Department for Culture, Media and Sport). This report looks at all major communications solutions available across the UK and recognises that a significant number of two way radio users in the UK are now using Ambitalk as their preferred communications platform.\nFurthermore Ambitalk was awarded in 2015 the FCS Gerald David OBE award for Innovation in Business Radio. This award is given by the FCS, the UK communications trade body for the innovation that has been demonstrated by Ambitalk which sets it apart from other PAMR solutions.\nHistory.\nThe concept of Public Access radio networks is not new, with many networks such as GEC National One and Band Three Radio being launched in the UK in the 1980s. These closed around 2003 when Dolphin Telecom entered administration for the final time.\nThroughout the period of the 1980s to 2003 there had always existed smaller \"regional\" radio networks within the UK, with several of the larger networks operating a number of interconnected \"regional\" networks that formed a quasi-National operation. 
Wavelength and Fleetcomm, both now defunct are examples of these.\nAmbitalk is a reincarnation of the Maxxwave regional network originally covering Rugby, Coventry and Warwick in the Midlands and later adding additional transmitter stations to cover areas of London and Birmingham.\nAround 2013 this regional radio network, previously powered by Zetron and Fylde MPT1327 controllers on Band III was redeveloped, with custom controllers designed by Maxxwave and was redeployed to lower frequency bands. This gave considerable cost savings, allowing the network to rapidly expand.\nCurrent state.\nFrom 2013 onwards Ambitalk rapidly expanded, obtaining low cost national spectrum (due to the unpopular low frequency bands) and installing additional transmitter sites around the country.\nIn 2015 Ambitalk has concentrated on resilience and reliability, having replaced all Landline connections between transmitter sites with private Microwave and in-band links, giving it complete independence in case of any major catastrophe.\nAmbitalk therefore is the only publicly accessible resilient wireless two-way communications network in the UK with other networks such as Airwave Solutions being closed, only available to select user groups. Furthermore it has a considerable amount of spare capacity, made available through its low frequency operation (rather than operating in congested UHF spectrum like Airwave) so therefore is far less likely to suffer congestion issues in case of major incidents.\nIt has now become a clear market leader, having been awarded the prestigious Gerald David OBE Award in Innovation by the FCS (Federation of Communications Specialists), in recognition of the advancements it has made in the Two way radio arena. 
It is mentioned by name in numerous Ofcom documents with respect to the huge advances made in spectrum efficiency.\nLow frequency bands.\nAmbitalk is unique not only because it is the UK's largest PAMR network but because it reverses the trend for modern wireless deployments to migrate to higher frequency bands.\nHigher frequency bands are preferred for rolling out wireless communications systems due to the lack of interference from atmospheric disturbances, smaller antennas and more manageable coverage characteristics, vital when planning a Cellular network\nLow frequencies on the other hand are traditionally plagued by electronic interference from numerous sources and are prone to being unusable for weeks on end during summer months due to interference from foreign transmitters due to Sporadic E propagation thereby giving poor quality signals.\nAmbitalk has counteracted this Sporadic E interference by developing a Smart antenna array for low frequency bands. Such systems are normally only deployed in far higher frequency bands and the use of such a system in a low frequency band is somewhat unusual. However with these arrays it is possible to virtually eliminate interference from continental sources, thereby giving high availability of a level equal to or better than that possible with higher frequency bands.\nAt a time when frequency spectrum is becoming increasingly scarce, with many of the traditional Business Radio frequency bands within the UK now being completely congested preventing any new two way radio deployments being made, the migration of users to these lower frequency bands is welcomed by the UK regulators such as Ofcom.\nSee also.\nAmbitalk website: \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691104","title":"Index of plagiarism-related articles","body":"\nIndex of plagiarism-related articles\n\nThis is an index of articles about plagiarism. It includes articles about incidents and examples of plagiarism, but does not include links to biographies of plagiarists or alleged plagiarists.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691111","title":"Marcos Peña","body":"\nMarcos Peña\n\nMarcos Peña is an Argentine politician and political scientist. \nBiography.\nMarcos Peña was born in March 15, 1977, in Buenos Aires. He made elementary school in the United States, as his parents lived abroad. He returned to Argentina and completed high school in Buenos Aires. \nHe graduated of political sciences in the university Torcuato Di Tella. He was elected legislator for Buenos Aires in 2003, in the ticket of Front for a Country in Solidarity. He helped to created the Republican Proposal party, and headed the list of legislators in the 2005 elections. Mayor Mauricio Macri appointed him general secretary of Buenos Aires in 2007. Macri became president in 2015, and appointed him chief of the cabinet of ministers. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691116","title":"Eugène Frot","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48691145","title":"Mount Fura","body":"\nMount Fura\n\nMount Fura is a mountain found on old maps where the gold mines and capital of the Monomotapa kingdom was located. It is possibly to be identified as Stanford (1896) with modern Mount Fura (Mount Darwin) in Mashonaland Central, Zimbabwe.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691154","title":"Hapoel Ramat Gan Givatayim B.C.","body":"\nHapoel Ramat Gan Givatayim B.C.\n\nHapoel Ramat Gan Givatayim is a professional fan owned basketball club from Israel. The team was founded in 2011 by Hapoel R-G fans and is aiming to promote competitive sport and the culture of sport in the cities of Ramat Gan and Givatayim.In 2013-14 season the club finished 2nd on the Liga Artzit (3rd tier). Currently the team plays in Liga Leumit.\nHistory.\nPreviously known as Hapoel Ramat Gan was founded in 1957. In 1960 the team joined Ligat HaAl and changed its name to Hapoel Ramat Gan - Givatayim. However, at the end of the season team returned to Liga Leumit. In 1964, the team rejoined Ligat HaAl, after the season the team returned to Liga Leumit. Between 1966-1971 the team alternated divisions based on their records. In 1973, the team (then called for the group of Ramat Gan and Hapoel Ramat Gan - Givataim)returned to Ligat HaAl.\nMajor players on those teams were Steve Kaplan calculate the best player of all players playing group, Hanan Keren, Or Goren, Avigdor Moskovitch and played in Mtazrhim and foreign as well: Steve Slachter, Neil marketed, Cliff Fondkstr Steve Malovik. In addition Aimno the group of senior trainers such as: Zvika Sherf Arie Maliniak but despite everything the group failed to win a championship. The group has finished second six times instead of daring Cup finals five times in the country but never managed to win Cup.\nThe biggest surprise in 1984 was its win over Maccabi Tel Aviv in semi final state cup basketball after 80-76. However, the team lost to Hapoel Tel Aviv B.C. 73-79 in the championship game. The team folded in 1988 as a result of financial issues.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691166","title":"Eoline, Alabama","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48691177","title":"Skiddle","body":"\nSkiddle\n\nSkiddle is a primary ticket outlet and events guide based in Preston dealing with event bookings, registrations, promotion and online ticket sales. The company has a turnover in excess of £15 million and over 25 employees.\nHistory.\nSkiddle was launched in May 2001 initially as a '\"What's on Guide\"' for Preston in Lancashire. It was incorporated as Skiddle Ltd in January 2006. In February 2014 Skiddle acquired new 5000 sq/ft premises in Longridge to support expansion.\nIn August 2015 Skiddle launched an iOS app with mobile 'Box Office' functionality. The app works with Bluetooth printers and iZettle card-readers, allowing tickets to be purchased and printed closer to gig start times.\nIn November 2015 the firm announced an intern program with the University of Salford, with the aim of giving students insights into the industry and to develop journalism skills.\nIndustry involvement.\nIn 2013 Skiddle announced their white-label ticket shop, already in use by Mixmag, would also be powering Debenhams' Box Office. During October 2015 Skiddle was chosen as the official ticket website for the BBC Radio 1Xtra Live event in Leeds.\nSkiddle have sponsored a range of festivals, tents and gigs mainly in the UK.\nCharity Work.\nIn 2011 Skiddle announced their sponsorship of the charity Campaign Against Living Miserably (C.A.L.M). A checkout donation scheme on the Skiddle website has helped to raise money for several UK charities. 
A donation in 2015 for over £15,000 was presented to the Anthony Nolan trust with previous benefactors including Macmillan and the Disasters Emergency Committee.\nAwards.\nSkiddle has received a Hitwise Top 10 Award every month since 2008 and in August 2011 Skiddle was awarded the Hitwise Top 6 Award, making it one of the most viewed websites in the UK within its category.\nIn March 2012, Skiddle was awarded 'Online Business of The Year' by the Lancashire Business Review's \"Red Rose Awards\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691199","title":"Marya Cohn","body":"\nMarya Cohn\n\nMarya Cohn is an American screenwriter and director. \nCareer.\nIn 1994 Cohn directed the student short film \"Developing\". The film starred a then unknown Natalie Portman in her first film role. \nIn 2013 Cohn began filming her feature film debut, \"The Girl in the Book\" starring Emily Vancamp in a semi-autobiographical film about a young book editor who is forced to work with a man who manipulated her as a teenager. Post-production for the film was completed via kickstarter The film premiered at the 2015 Los Angeles Film Festival. It was acquired by Myriad Pictures and given a limited release in December of 2015. \nPersonal Life.\nCohn is the daughter of talent agent Sam Cohn. \nIn 1994 she married director Fraser Bresnahan.\nIn 2011 she married Dutch director Tjebbo Penning.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691226","title":"Colonus","body":"\nColonus\n\nColonus may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691247","title":"1932 Centenary Gentlemen football team","body":"\n1932 Centenary Gentlemen football team\n\nThe 1932 Centenary Gentlemen football team represented the Centenary College of Louisiana during the 1932 college football season.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691250","title":"1933 Centenary Gentlemen football team","body":"\n1933 Centenary Gentlemen football team\n\nThe 1933 Centenary Gentlemen football team represented the Centenary College of Louisiana during the 1933 college football season. Paul Geisler was consensus All-America.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691257","title":"1934 Centenary Gentlemen football team","body":"\n1934 Centenary Gentlemen football team\n\nThe 1934 Centenary Gentlemen football team represented the Centenary College of Louisiana during the 1934 college football season.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691266","title":"Wilhelm Neumann-Torborg","body":"\nWilhelm Neumann-Torborg\n\nWilhelm Neumann-Torborg (born 24 August 1856 in Elberfeld; died 31 December 1917 in Elberfeld) was a German sculptor whose works are still well-known.\nBiography.\nWilhelm Neumann-Torborg grew up in Wuppertal, Germany, the son of a school headmaster. He attended evening classes at the Royal Provincial Vocational School in Elberfeld, where he received his first lessons in drawing and painting.\nHe spent the years 1874 and 1877 studying in Bad Kreuznach, in the sculpture workshop of the brothers Robert and Karl Cauer. He then further developed his craft in 1878 under Melchior zur Strassen in the Leipzig Academy of Visual Arts and until 1880 in the Academy of Arts, Berlin with Otto Knille and Fritz Schaper. In 1885, he won the Rome Scholarship from the Prussian Academy of Arts for his thesis, \"The Judgment of Paris\".\nIn subsequent years, Neumann-Torborg lived and worked in Rome, where his wife, Emma Commichau, died after a short marriage. In 1892, the artist returned to Berlin. In 1917, he fell seriously ill and died during a visit to his hometown of Elberfeld. His tomb is located in the Lutheran cemetery in Wuppertal-Elberfeld.\nWorks.\nMany of Neumann-Torborgs works were destroyed during the Second World War.\nPerhaps his best-known work, the fountain \"Faun and Nymph\", was commissioned by Baron August von der Heydt and originally stood in the park of his estate. It survived the Second World War unscathed and since 1909 has been on display in Bad Godesberg, Bonn. In 2013, it was restored and moved to a new location to permit greater public access.\nAnother relief of Neuman-Torborg's, showing dancing youths with Bacchus, was installed in the Bad Godesberg city park in 2014. 
The sculpture includes a bench and a bust of Roman Emperor Marcus Aurelius Probus, and was recovered in pieces from the van der Heydt estate.\nThe \"Elberfeld Poor Relief Monument\" was destroyed during the war, when the bronze figures were melted down for metal. In 2003, the granite pedestal of the monument was rediscovered during excavations at the Elberfeld Old Reformed Church, and placed on display in Blankstrasse, Wuppertal. In 2011, it was restored thanks to 24 private donations. The bronze figures were recast at the Kayser Art Foundry in Düsseldorf. The statue commemorates the inauguration, in 1853, of the Elberfeld system of poor relief, which was copied by many cities in subsequent years.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691296","title":"Gustavo Santos (politician)","body":"\nGustavo Santos (politician)\n\nGustavo Santos is an Argentine politician. He was appointed minister of Tourism by Mauricio Macri.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691299","title":"2016 Deutsche Tourenwagen Masters season","body":"\n2016 Deutsche Tourenwagen Masters season\n\nThe 2016 Deutsche Tourenwagen Masters season is the seventeenth season of the Deutsche Tourenwagen Masters, since the series' resumption in 2000. The season starts on 7 May at Hockenheim, and ended on 16 October at the same venue, after a total of nine events.\nCalendar.\nThe nine event calendar was announced on 30 November 2015.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691313","title":"Blues Pills (album)","body":"\nBlues Pills (album)\n\nBlues Pills is the debut studio album by Swedish rock band Blues Pills, released on July 25, 2014 by Nuclear Blast Records. The album consists of ten tracks including some re-recorded releases from previous EPs and a cover of the Chubby Checker song \"Gypsy\". The album consists of two singles \"High Class Woman\" and \"No Hope Left For Me\", both released with music videos by Nuclear Blast.\nReception.\nMany reviews praise the improvement on the re-recording of the tracks that had previously appeared on EPs. Reviews mention the sound and style comparing to 60s blues and 70s rock influences. The album received predominantly positive online professional reviews.\nTrack listing.\nAll songs written and composed by Elin Larsson, Dorian Sorriaux, Zach Anderson and Cory Berry.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691315","title":"1923 Centenary Gentlemen football team","body":"\n1923 Centenary Gentlemen football team\n\nThe 1923 Centenary Gentlemen football team represented the Centenary College of Louisiana during the 1923 college football season.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691322","title":"1924 Centenary Gentlemen football team","body":"\n1924 Centenary Gentlemen football team\n\nThe 1924 Centenary Gentlemen football team represented the Centenary College of Louisiana during the 1924 college football season.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691323","title":"1922 Centenary Gentlemen football team","body":"\n1922 Centenary Gentlemen football team\n\nThe 1922 Centenary Gentlemen football team represented the Centenary College of Louisiana during the 1922 college football season. The nine game schedule was the longest in school history.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691333","title":"Alex Furmansky","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48691335","title":"Penny Drue Baird","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48691387","title":"Ricardo Buryaile","body":"\nRicardo Buryaile\n\nRicardo Buryaile is an Argentine politician. He is a national deputy, and Mauricio Macri has appointed him minister of agriculture. \nHe is of French-Lebanese descent.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691422","title":"Sweet Things (Georgie Fame album)","body":"\nSweet Things (Georgie Fame album)\n\nSweet Things is the 1966 third album with the Blue Flames by Georgie Fame which reached No.6 in the album Top Ten in the UK. Following this album his band The Blue Flames was replaced with The Tornados.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691439","title":"Yoslan Muñoz","body":"\nYoslan Muñoz\n\nYoslan Muñoz García (born ) is a retired Cuban female volleyball player, who played as a 0. She was part of the Cuba women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Ciudad Deportiva La Habana.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691444","title":"Swann Chemical Company","body":"\nSwann Chemical Company\n\nThe Swann Chemical Company was an American chemical company started by Theodore Swann, described by one historian as \"a flamboyant Birmingham mogul and New South industrialist.\" Swann Chemical first operated a chemical manufacturing plant in Anniston, Alabama where PCBs were first made on an industrial scale after development of a new process under leadership of Theodore Swann. The plant was later bought by Monsanto Industrial Chemicals Co. in 1935. The plant, just west of Anniston, had around 1,000 employees.\nOne historian wrote that, \"In many ways, the spirit of Swann Chemical became the corporate culture of Monsanto.\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691467","title":"China National Electronics Import & Export Corporation","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48691484","title":"Irina Donets","body":"\nIrina Donets\n\nIrina Donets (born in Amsterdam) is a retired Dutch female volleyball player, who played as a middle blocker. She was part of the Netherlands women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Pallavolo Ravenna.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691500","title":"2015 Ice Challenge","body":"\n2015 Ice Challenge\n\nThe 2015 Ice Challenge was a senior international figure skating competition held in late October 2015 at the Liebenauer Eishalle in Graz, Austria. It was part of the 2015–16 ISU Challenger Series. Medals were awarded in the disciplines of men's singles, ladies' singles, pair skating, and ice dancing.\nEntries.\nThe preliminary entries were published on 6 October 2015.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691501","title":"Game of Pawns (television series)","body":"\nGame of Pawns (television series)\n\n is a television game show based in Branson, Missouri about the goings on in a local pawn shop. The show stars; Justin Tranchita , Scott Velvet and Brian Roman. The plot of the show is a mix of a game show and reality television series as Scott and Brian buy unusual items at Branson Pawn using a trivia game to give patrons the chance to win more for their item all while Justin gets into trouble and goofs off making the days at Branson Pawn move along with a little more excitement. Dealing in everything from celebrity cars to antique guns, they never know just what – or who – will walk through the door next. At Branson Pawn, every day’s a gamble. Scott and Brian give each customer three questions. If they get two of the three right, the customer gets their price. If not, the house wins and Brian and Scott get their price. This show runs on the Discovery Channel globally as re-runs and had its debut in 2013 with eight original episodes.\nGame of Pawns was produced by a production company based in Denver, Colorado that has produced many hit reality television shows such as; Cake Boss , Fixer Upper , Tough Love and many more. Jim Berger and Scott Feely were the executive producers for the series.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691506","title":"Kate Tiller","body":"\nKate Tiller\n\nKate Tiller is reader emerita in English local history at Kellogg College, University of Oxford. Tiller specialises in the history of Oxfordshire, Chartism and Methodism.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691508","title":"Frank L. Fraser","body":"\nFrank L. Fraser\n\nFrank L. Fraser (September 29, 1854 – July 29, 1835) was an American lawyer and politician.\nBorn in Sacramento, California, Fraser moved to Wisconsin in 1860 and grew up in the town of East Troy, Walworth County, Wisconsin. He went to the Rochester Academy and the Whitewater Normal School. Fraser studied law in Racine, Wisconsin and was admitted to the Wisconsin bar in 1876. Fraser lived in Lake Beulah, Wisconsin and was also a farmer. He served on the Walworth County Board of Supervisors and was chairman of the East Troy Town Board. Fraser also served on the school board and was the board treasurer. Fraser was the postmaster for Lake Beulah. In 1895, Fraser served in the Wisconsin State Assembly and was a Republican. Fraser died at his home in East Troy, Wisconsin.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691526","title":"Ahmed Almusawi","body":"\nAhmed Almusawi\n\nDr. Ahmed Almusawi is an Islamic scholar, philosopher, astrophysicist, and psychologist. He received a PhD in clinical psychology from Cairo University. In addition to his scientific research in the field of miracles in the Quran and Ahl al-Bayt in Islamic Studies University. Established many of the beliefs and Islamic jurisprudence lessons in addition to the scientific Interpretation of the Quran in Sweden and Europe. Ahmed works as a researcher in the in the university of Islamic studies in Egypt.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691529","title":"Ruth Heerschap","body":"\nRuth Heerschap\n\nRuth van de Wel-Heerschap (born ) is a retired Dutch female volleyball player, who played as a middle blocker. She was part of the Netherlands women's national volleyball team at the 2001 Women's European Volleyball Championship and 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with AMVJ Amstelveen in 2002 and for GTI Nesselande in 2005.\nHer father is Martin Heerschap (chairman), her sister Eva Heerschap (player) and brother-in-law Kristian van der Wel (player) were also involved in GTI Nesselande.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691545","title":"Chiswick Asylum","body":"\nChiswick Asylum\n\nChiswick Asylum was an English asylum established by Edward Francis Tuke and his wife Mary as Manor House Asylum in Chiswick, in about 1837. It was continued by his son, Thomas Harrington Tuke (1826-1888), before moving to Chiswick House in 1892 and becoming the Chiswick House Asylum, where it was run by two of Thomas Tuke's sons.\nManor House Asylum was begun by Edward Francis Tuke and his wife Mary in about 1837, who took a lease on Manor Farm House in Chiswick Lane, a late 17th century building. It was demolished in 1896.\nThe 9th Duke of Devonshire rented Chiswick House to the brothers Thomas Seymour and Charles Molesworth Tuke (sons of Thomas Harrington Tuke) from 1892 to 1928, when it was home to 30-40 private patients, before he sold it to Middlesex County Council in 1929. The two wings that housed the patients were demolished in 1956, as were many of the outbuildings, so little trace of the asylum remains today.\nNotable patients.\nIn 1852, the Chartist leader Feargus O'Connor MP was declared insane after a scene in the House of Commons, and confined to Chiswick Asylum, where he remained until 1854, and died in 1855.\nIn 1865, Rev William Cotton spent several weeks in the Manor House Asylum.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691548","title":"Nicolas Gilsoul","body":"\nNicolas Gilsoul\n\nNicolas Gilsoul (born 5 February 1982) is a Belgian rally co-driver. He is the current co-driver for Thierry Neuville.\nCareer.\nAfter competing in regional events from 2000, Gilsoul made his international debut in 2003 when co-driving with Bruno Thiry. \nGilsoul started working with Thierry Neuville in 2011 and competed in the 2011 Intercontinental Rally Challenge. Since 2012, they have been driving in the World Rally Championship.\nNeuville and Gilsoul took their first WRC win in 2014, at Rallye Deutschland.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691561","title":"Elbert Howard","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48691572","title":"List of video game webcomics","body":"\nList of video game webcomics\n\nMany webcomics have been influenced by video games and video game culture. Webcomics frequently poke fun at video game logic, the video game industry, and stereotypical behavior of gamers. The earliest video game webcomic was \"Polymer City Chronicles\", which started in 1995. However, 1998's \"PvP\" is seen as the origin of the genre, influencing various webcomics following it. A common trope in video game webcomics is to have the main characters sit on a couch, talking about the game they are playing.\nIt is common for webcomics to exclusively use in-game art and speech bubbles, such as in sprite comics. The term gamics has been proposed by Nathan Ciprick in 2004 to refer to webcomics that consist entirely of video game graphics. Despite the fact that video game graphics are generally copyrighted, owners of the intellectual properties used have traditionally been tolerant.\nOther.\nShiftyLook, a former subsidiary of Namco Bandai, focused on reviving various Namco video game franchises between 2011 and 2014. The company originally did this through English language webcomics. ShiftyLook has released webcomics based on \"Dig Dug\", \"Dragon Spirit\", \"Klonoa\", and various other video games.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691585","title":"Chunar stone","body":"\nChunar stone\n\nChunar stone is a kind of reddish or buff-colored, finely grained, hard sandstone quarried in the Chunar in the Mirzapur District of Uttar Pradesh, and widely used in the architecture of India.\nNotable buildings and monuments carved from chunar stone include:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691603","title":"1973–74 Dumbarton F.C. season","body":"\n1973–74 Dumbarton F.C. season\n\nSeason 1973–74 was the 97th football season in which Dumbarton competed at a Scottish national level, entering the Scottish Football League for the 67th time, the Scottish Cup for the 79th time and the Scottish League Cup for the 27th time.\nOverview.\nThis was Dumbarton's second successive season competing in Division 1, the objective being to build on the previous season's results, and in particular to avoid any relegation worries. This was certainly achieved, and indeed by mid November there were hopes of European qualification by reaching 6th in the table. However the wins began to dry up which resulted in a slide down the league - but the final position of 10th was the best the club had achieved for over 70 years - and qualification for the Anglo-Scottish sponsored competition, the Texaco Cup the following season - although this was not to be, following a reorganisation of the qualification requirements.\nIn the Scottish Cup, Dumbarton's interest was short-lived as they lost out to Arbroath in the third round.\nIn the League Cup, with two wins and a draws from the six sectional games, Dumbarton qualified for the next stage in the competition, where Rangers awaited. 
A 6-0 thumping in the first leg was made the return fixture a formality, although losing by the odd goal in three was something of an achievement.\nLocally, in the Stirlingshire Cup, Dumbarton tried hard to retain the trophy they had won in the previous season, but were to lose out to Stirling Albion in the final on penalties, after a drawn game.\nInterestingly at the beginning of the season, Dumbarton embarked on a mini overseas tour - the first since 1922 - where they beat Spanish regional side CF Lloret.\nResults.\nAll results are written with Dumbarton's score first.\nStirlingshire Cup.\n - won on penalties\n - lost on penalties\nAppearances.\nDumbarton used 26 players for the 43 League, Scottish Cup and Scottish League Cup matches, as detailed below. Willie Wallace was the only player to feature in every one of these matches.\nReserve Team.\nDumbarton competed in the Scottish Reserve League, and with 12 wins and 6 draws from 34 matches, finished 12th of 18 for the second successive season.\nDumbarton again entered the Scottish Second XI Cup, and again reached the third round where Celtic were to prove too good on the day by four goals to none.\nFor the first time, Dumbarton entered the Scottish Reserve League Cup, and after qualifying from their section with 4 wins and a draw from 6 games, they eventually lost out to Partick Thistle in a two-legged semi final.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691605","title":"Silvia Kutika","body":"\nSilvia Kutika\n\nSilvia Kutika (Wilde, 5 de agosto de 1956) is an Argentine actress best known by her roles in \"soap operas\" such as: \"906090 Modelos\", \"Vidas Robadas\", \"Los Médicos de Hoy\" and \"De Carne Somos\". In 1996 she married actor Luis Luque (1956–).\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691627","title":"Maureen Staal","body":"\nMaureen Staal\n\nMaureen Staal (born ) is a retired Dutch female volleyball player, who played as a wing spiker. She was part of the Netherlands women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Vanilla VC Weert.\nStaal suffered in 2000 and 2002 from a hernia. In 2000 she got it after lifting to many weights with training, and in 2003 after a qualification match against Italy for a Grand Prix tournament. Almost five years later she returned for her former club \"Taurus\" in 2007. She still has the hernia, but has learned to live with it.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691634","title":"Shōnen Maid","body":"\nShōnen Maid\n\n is a Japanese manga series written and illustrated by Ototachibana. An anime television series adaptation will premiere in April 2016.\nMedia.\nManga.\nOtotachibana launched the series in Enterbrain's \"B's-Log Comic\" magazine on 12 March 2008. An audio drama CD was included with the limited edition of the sixth volume in April 2013.\nAnime.\nAn anime adaptation was announced in the 32nd issue of \"B's-Log Comic\" in August 2015. The series will be directed by Yusuke Yamamoto and written by Yoshiko Nakamura, with animation by the studio 8-Bit. Kana Ishida provides the character designs for the anime. The series will premiere in April 2016 on TBS and BS-TBS.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691644","title":"Atlantic University School Of Medicine","body":"\nAtlantic University School Of Medicine\n\nAtlantic University School Of Medicine (AUSOM) is an offshore private medical school located in the St. Lucia National Neurological and Mental Health Wellness Centre, a psychiatric hospital built on the Gros Islet Highway, in Rodney Bay by China in 2006. The school's offshore office is located in Island Park, New York. The school's application was approved by the Cabinet of St. Lucia in 2010, though as of 2014, the country did not have legislation in place for licensing and regulating medical schools.\nPrograms.\nThe primary educational programs at AUSOM consist of a 2-year premed course of study; a four-year medical curriculum, which leads to an Doctor of Medicine degree; or a six-year track which combines the premed and medical training. In addition to theoretical and academic training, students are required to complete 48 weeks of clinical clerkships. Students participate in community health clinics from their first year of study, offering services of basic health checks, diabetes screenings and basic eye examinations. The school accepts both Lucian and foreign students, offering a scholarship program for Lucian residents who qualify.\nAccreditation.\nAtlantic University School Of Medicine received received approval from the St. Lucian Cabinet in 2010. It is not accredited by the Caribbean Accreditation Authority for Education in Medicine and other Health Professions (CAAM-HP) as of 2015. It is listed in the FAIMER International Medical Education Directory (IMED) effective in 2010 with school ID #F0002374 and in the World Health Organization's World Directory of Medical Schools. By virtue of its listing in IMED, students graduating from AUSOM are authorized to take part in the United States Medical Licensing Examination three-part examinations. 
Those who pass the examinations are eligible according to the Educational Commission for Foreign Medical Graduates to register for and participate in the National Resident Matching Program (NRMP).\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691665","title":"Athanasius II of Jerusalem","body":"\nAthanasius II of Jerusalem\n\nAthanasius II (; 1229–d. 1247+) was the Greek Orthodox Patriarch of Jerusalem from 1231 to 1244. The Church of the Holy Sepulchre seems to have been largely in Athanasius' hands during the Latin control of Jerusalem. The Serbian Archbishop Sava (1174–1237) guested Athanasius twice in the Holy Land, and according to Serbian chronicles they were good friends. After the Latin retreat from Jerusalem in 1244, the Melkites (who were the majority of the south of the Latin kingdom) turned to Athanasius. Athanasius II was in negotiations with the Pope through friar Lawrence of Portugal in 1247; Innocent IV supported him against the Latin patriarch, Robert.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691680","title":"Sri Thenandal Films","body":"\nSri Thenandal Films\n\nSri Thenandal Films is an Indian film production and distribution company based in Chennai. The company was founded in 1976 by Rama Narayanan. They have produced, released and distributed films across several regional film industries in India.\nHistory.\nRama Narayanan set up Sri Thenandal Films in 1976 in Chennai, and the studio has gone on to distribute over 750 films across India.\nDuring the late 1990s and early 2000s, Sri Thenandal Films produced and distributed a series of devotional films directed by Rama Narayanan. The quick spate of releases titled after goddesses such as \"Palayathu Amman\" (2000), \"Nageswari\" (2001), \"Kottai Mariamman\" (2001) and \"Annai Kaligambal\" (2003), saw the studio garner an image of focussing solely on Hindu devotional subjects.\nIn the 2010s, Murali Ramaswamy made a decision to actively purchase and distribute horror films, and experienced immediate success after \"Aranmanai\" (2014), \"Kanchana 2\" (2015), \"Demonte Colony\" (2015) and \"Maya\" (2015) all became profitable ventures. The success of the studio's investment in that particular genre prompted them to finance smaller budget horror films including \"Strawberry\" (2015) and \"Jackson Durai\" (2016), in attempt to capitalise on the popularity of the genre across Tamil Nadu.\nThe studio also ventured into the production of stage plays in 2015, and financed \"Chillu\", a futuristic science fiction play, performed in Chennai.\nSelected filmography.\nDistribution.\nThe following films are a list of film which were distributed by Sri Thenandal Films throughout Tamil Nadu, apart from their own productions:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691684","title":"Dieter Kalka","body":"\nDieter Kalka\n\nDieter Kalka (born 25 June 1957, Altenburg) is a German writer, songwriter, poet, dramatist, musician, editor, translator and speech therapist.\nBiography.\nDieter Kalka started to study electrical engineering and mathematics at the Technische Universität Ilmenau in 1978. In 1980 he had to quit his studies because of the distribution and possession of illegal publications. He was a member of the folk band founded in 1978, \"\", in 1984 he founded the band (The happy Future of Dieter) with Folksongs and own texts together with Uwe Schimmel (Waldhorn), Uta Mannweiler (Viola) and himself Bandoneon. With this group she organized the illegal artists' meeting \"Ringel Folk\" in Wurzen where there was no censorship. The unauthorized promotional material for this and other actions he copied at the photo lab of Petra Lux.\nDieter Kalka was \"the fiercest among the Leipzig song singers\". Since the mid-1980s he has worked as a freelance singer and was repeatedly participant of the Chanson days Kloster Michaelstein (GDR-open Chanson days in Monastery Michaelstein). He made samizdat productions in privat studio at Hubertus Schmidt 1987 and Peter Gläser 1988 and official at Studio Kölling (Leipzig 1989).\nAfter collaboration with Werner Bernreuther mentoring in 1987 he received a professional certificate as a songwriter, won a prize at the (Chanson days in Frankfurt/Oder) and a Prize of the Leipzig Songwriter Workshop, which he later publicly returned as they wanted to dictate to him what song he should sing at the final concert. 
He has received several scholarships of Saxony and was for a time a member of the Independent Writers Association \"ASSO\" Dresden, the NGL/New Society for Literature, the Writers Association \"VS\" and the \"Förderkreis Freie Literaturgesellschaft Leipzig\".\nDieter Kalkas first book publication was entitled \"Eine übersensible Regung unterm Schuhabsatz\" (An Over Sensitive Motionless Under the Heel) and released in 1987 as samizdat. In 1990 he prepared a project manager before the first . Within the Association of German writers he organized in 1995 in Leipzig, the German-Polish poets festival \"\". He translated Polish poetry. Sunken GDR reality is the subject of his \"Der ungepflückte Apfelbaum\" published in 1998. Kalkas texts have been published in German, Polish, Austrian, Canadian and Belarusian literary magazines.\nKalka was twice in Belarus for Songwriter's Festival \"Bardentreffen\" and appeared with his Belarusian colleague Victor Shalkevich. At Saxon Literature Spring 2003, he dedicated his \"Freiheitslied Nr. 2\" (Freedom Song No.2) his Belarusian colleague Victor Shalkevich to make him hope for better times.\nHe participated in the German-Polish poets steamer on the border river Oder and the in Breslau, Bad Muskau and Lwówek Śląski.\nAt Poets steamer was the Poets wedding 1998 between Dieter Kalka and Zielona Góra fairy tale author Agnieszka Haupe at the Frankfurt Oderbrücke.\nKalka joined with his bandoneon various programs on own songs, such as 1988 with the theme \"Noch habe ich die Freiheit zu lieben\" (I still have the freedom to love). Sometimes he sang at the songwriter-festival . His songs \"are not without bitter aftertaste. He puts his finger on compromises that each includes almost every day in life, or feel compelled to close. Former ideals are often forgotten. He wrote the lyrics for the folk opera and wrote about\" The revival of the East German singer-songwriter scene \". 
His concerts have taken him to Poland, Belarus, Czech Republic, Hungary, Switzerland, Austria and Denmark. His songs are on numerous CDs.\nDieter Kalka works as a speech therapist and lives in Leipzig and Meuselwitz.\nWorks.\nTranslation.\nDieter Kalka translated Polish poets: , Jan Strządała, , , Józef Baran, , , Agnieszka Haupe, Jolanta Pytel, , , , Grzegorz Stec, Jakub Malukow Danecki, Bohdan Zadura, Waldemar Michalski, Alekzander Rozenfeld and others. The poetry was published in , , the anthology \"Lubliner Lift/Lubelska winda\", , the anthologies \"Es ist Zeit, wechsle die Kleider\", \"Nach den Gewittern\" and at PortalPolen.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691695","title":"Yesterday's Hero (disambiguation)","body":"\nYesterday's Hero (disambiguation)\n\nYesterday's Hero is a 1979 film\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691703","title":"Akeem Hunt","body":"\nAkeem Hunt\n\nAkeem Bernard Hunt (born February 22, 1993) is an American football running back for the Houston Texans of the National Football League (NFL). He was signed by the New York Giants as an undrafted free agent in 2015. He played college football at Purdue.\nCollege career.\nDuring his college career, Hunt rushed for 2,035 yards on 371 carries with 11 rushing touchdowns, six receiving touchdowns and three kick return touchdowns.\nStatistics.\nSource:\nProfessional career.\nNew York Giants.\nHunt signed with the New York Giants as an undrafted free agent in May 2015. He was released on September 2, 2015.\nBaltimore Ravens.\nHunt was signed to the Baltimore Ravens practice squad on October 13, 2015 and was released on October 20. \nHouston Texans.\nHunt was signed to the Houston Texans practice squad on November 2, 2015. He was promoted to the active roster on November 21.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691712","title":"June (company)","body":"\nJune (company)\n\nJune is a home automation company based in San Francisco. Its first product is the June Intelligent Oven, a computer-based, Wi-Fi-enabled, app-connected countertop oven that employs machine learning and computer vision technologies to identify and cook food. The oven was created by “a team that brought the iPhone, the Fitbit, the GoPro, and Lyft to market.”\nDesign.\nThe oven is controlled by a click knob, 5-inch touch screen and connected app. Programmable and sensor-driven, the oven uses a built-in scale, core-temperature thermometer and a camera to suggest cooking time and temperature. The internal high-definition camera with a fisheye lens that is designed to recognize commonly cooked foods. The company claims the oven’s optical recognition can identify foods such as frozen pizza, bacon, Brussels sprouts, asparagus, and potatoes and can differentiate between different types of fish.\nJune was founded by Matt Van Horn, CEO, and Nikhil Bhogal, CTO, and launched in June 2015.\nVan Horn co-founded Zimride, which spun off the ride-sharing service Lyft. Bhogal designed the camera software for the iPhone’s first five generations and is listed as an inventor on multiple Apple camera software patents. June team members have worked on the Apple Watch, GoPro cameras and Fitbit fitness trackers as well. Michelin-starred chef Michael Mina is an advisor to June.\n\"The Wall Street Journal\" said “the innovation found in the June Intelligent Oven is spectacular” and that “its technologies point the way to the future of cooking.”\nHardware.\nThe June Oven has dual-surround convection fans, digital TRIAC controllers, a GPU processor, a 2.3-gigahertz NVIDIA chip, and carbon-fiber heating elements. 
Ammunition Design Group aided with the industrial design of the June Intelligent Oven and Quanta Computer aided in the manufacturing.\nSoftware.\nThe iOS app displays a live-stream video of the inside of the oven and then sends a notification when the food is done. The iOS app also has “smart recipes” that illustrate cooking steps with videos and GIFs and communicate with the oven.\nFunding.\nJune received $7 million in Series A funding from the Foundry Group, First Round Capital, Lerer Ventures, and Founders Fund.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691717","title":"Jordi Mas Castells","body":"\nProgressively he specialized in building wells which stopped villagers, particularly girls, the weakest ones in that society, from walking long distances to get water to drink for both their families and cattle. During his long stay in the country he built hundreds of them.\nMas was also aware that health was one of the weaknesses of the region. Therefore, together with the Swiss doctor Giuseppe Maggi (1910-1988) he founded the hospitals of Tokombéré (1962), Zina (1970) and Mada (1978).In the latter, a heath reference center, he worked driving patients in a jeep-ambulance for many years, a job which enabled him to get to know the territory and, mainly, to be close to the 250,000 inhabitants living in the surroundings of the hospital, a vast area of about 200 kilometres including four countries: Cameroon, Chad, Niger and Nigeria.\nIn 1988 when doctor Maggi died, Jordi Mas went on to school founding, as it was evident for him that people without education have neither hope nor future. As a result of this work in 1998 he opened the big professional school of Blangoua CEFAVIHAR (Educational centre for the improvement of life in rural areas), next to lake Chad. In this school, which also includes a student residence promoted by Mans Unides, about forty youngsters from the villages near the lake can learn mechanics, electricity, welding, carpentry, business managering, sewing, typing, computer studies... Besides there is a primary school with 500 pupils which was created thanks to the collaboration of some Catalan organizations grouped together in the charity Makary-Blangoua \nIn recent years, Mas focused on the home FEMAK (\"Femmes de Makary\") (2008), a meeting point for women of all religions in the region of Makary to relate, learn and exchange experiences. 
They had sewing workshops, computers and vegetable gardens and classrooms where they received education about health, eating habits and cooking.\nHis great knowledge of the region was crutial in other projects: accommodation for the teachers in Blangoua, the FEMAK home and the residence for charity workers in Makary (2008)... The last project he was keen to develop in 2009 was the growing of a seaweed rich in proteins called spirulina, which grows really well in areas like lake Chad.\nLater life.\nIn 2010 he fell ill and travelled to La Garriga to undergo the treatment which enabled him to go back to his home in Makary. However, he died on Thursday 18 November that year. He is buried in La Doma cemetery, in La Garriga.\nJordi Mas died, but his work is fully alive helping the people near the lake. Nowadays, November 2015, the Italian Fabio Musi, a long term Cameroon resident, is responsible for the general coordination of the different parishes and schools. He does it from Maroua, the Far North Region capital city of the country. In the last two parishes where the priest from La Garriga worked, namely Makary and Blangoua, there are two native priests in charge.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691726","title":"Elke Wijnhoven","body":"\nElke Wijnhoven\n\nElke Wijnhoven-Schuil (born ) is a retired Dutch female volleyball player, who played as a libero. She was part of the Netherlands women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. She also competed at the 2001 Women's European Volleyball Championship, 2005 Women's European Volleyball Championship and 2005 FIVB World Grand Prix. On club level she played with Metodo Minetti Vicenza.\nPersonal.\nWijnhoven married on 6 June 2009 the Dutch volleyball and beach volleyball player Richard Schuil. In March 2012, her daughter Lisa was born.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691732","title":"The Legacy of the Blues Vol. 7","body":"\nThe Legacy of the Blues Vol. 7\n\nThe Legacy of the Blues Vol. 7 is an album by American blues pianist Memphis Slim which was recorded in 1967 and released on the Swedish Sonet label. \nReception.\nIn his review for Allmusic, Nathan Bush says \"Throughout the set, Slim is happy to lend the spotlight to his sidemen, working the 88s behind Eddie Chamblee's tenor solo on 'I Am the Blues' and Billy Butler's guitar on 'Ballin' the Jack.' Even in these situations however, the pianist is dazzling and his commentary always worth paying attention to.\"\nTrack listing.\n\"All compositions by Peter Chapman\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691759","title":"CRAX Commander","body":"\nCRAX Commander\n\nCRAX Commander is a dual pane, Orthodox File Manager for Mac OS X, created in Objective-C. The app is currently developed by Soft4U2 (Marcin Słowik) and is one of the new generation of Apple Finder replacement apps.\nCRAX Commander has a familiar Finder-like look so it’s instantly usable as a replacement. The key to a replacement utility is the feature list. CRAX Commander embraces it with a wide ranging slew of features and functions.\nCRAX Commander was created using ideology of dual-pane user interface which is well-known from the world of the Windows applications like Total Commander. Ideology of this kind of apps assumes offering multi-tab browsing user interface with features enabling of advanced search of files or folders, comparing files and folders, navigation in archive files and enabling multi-rename tool with regular expression support. This kind of applications also include a built-in FTP client, working with local and network drives and built-in file editor and viewer.\nCRAX Commander is app for Mac power users and offers user configurable keyboard shortcuts, built-in text editor with sync coloring, full user interface customization including fonts and colors, archive support and FTP, SMB, AFP, SSH, and sFTP built in.\nApplication is available in demo and paid version and provides a plethora of tools that will help end user to manage files and folders while taking advantage of the dual-pane interface design.\nHistory.\nFrom 2013 until 2014 CRAX Commander was called Crax and was developed by Ewa Serafin. The name and icon for application was changed in 2015.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691782","title":"Jorge Lemus","body":"\nJorge Lemus\n\nJorge Lemus (born June 9, 1948, Buenos Aires) is an Argentine politician. He was appointed minister of health of Buenos Aires in 2007, under mayor Mauricio Macri. He resigned in 2012, but stayed in the Republican Proposal party. Macri won the 2015 elections, and appointed him national minister of health.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691793","title":"Podlubnik","body":"\nPodlubnik\n\nPodlubnik is part of a local community Podlubnik/Stara Loka in Municipality of Škofja Loka in the Upper Carniola region of Slovenia.\nFun fact: Podlubnik street has the second highest number of house numbers (356 house numbers) in whole Slovenia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691795","title":"Anita Krajnc case","body":"\nAnita Krajnc case\n\nThe Anita Krajnc case refers to the case of Toronto resident Anita Krajnc who has been charged with criminal mischief for giving water to pigs in a slaughter truck on the way to Fearman's Pork Inc. slaughterhouse, located in Burlington, Greater Toronto Area. This incident occurred on June 22, 2015.\nBackground.\nAnita Krajnc is co-founder of Toronto Pig Save, which was started in 2010. A \"Huffington Post Canada\" story titled \"Meet The Compassionate Canadians Who Give It All To Animals\" includes Krajnc as one of the five chosen and describes her as having \"a mighty heart to bear witness to any creature's grim odyssey to death\" for \"she has been standing \"vigil\" at the gates of death for thousands of pigs\".\nKrajnc holds a PhD in Political Science from the University of Toronto. Her doctoral thesis was based on the role of scientific knowledge and public education in building international environmental regimes. Krajnc has been Assistant Professor at Queen's University. She has also been a media democracy activist and a writer. She was an aide to Charles Caccia former Minister of Environment and Climate Change.\nIncident.\nThe related incident occurred on June 22, 2015, outside Fearman's Pork Inc. slaughter house in Burlington. The protest was undertaken by Toronto Pig Save, a group to which Krajnc, who is described as an animal rights activist, belongs. Krajnc and her group were providing water to pigs in trucks carrying them to slaughter, as they stopped at a traffic island at the intersection of Appleby Line and Harvester Road, through the vents on the sides of the truck. As they were doing so, a driver of one of the trucks, Jeffrey Veldjesgraaf, got down and went to her and asked her to stop. Krajnc recited a verse from the biblical Book of Proverbs: \"If they are thirsty, give them water\". 
In response Veldjesgraaf called her \"a dumb fricking broad\" and told her that the pigs weren't human. Krajnc asked Veldjesgraaf to be compassionate, Veldjesgraaf said he would call the police, Krajnc suggested that she would call Jesus. Veldjesgraaf asked what she was feeding the pigs, Krajnc said that it was water, he told her that he wanted proof, Krajnc suggested that he trust her and offered him a sample. Veldjesgraaf asked her to desist from feeding again. Krajnc said that if the pigs were thirsty they would be fed again. Veldjesgraaf threatened to knock the bottle off, Krajnc retorted that she would charge him with assault. The driver then walked off, boarded the truck and drove on. This interaction was filmed by Krajnc's associates. On June 23, 2015, Eric van Boekel, from whose farm the pigs were brought, filed a case against Krajnc. On September 9, 2015, Krajnc was charged with criminal mischief, the penalty for which ranges from a fine to 10 years in prison. In response, the group arranged a vigil on September 24. On October 14, 2015, Krajnc appeared in court for an arraignment, to have charges read to her. In the context of the case \"The Daily Telegraph\" reports that under Canadian law pigs are considered property and can be transported without food and water for 36 hours. Krajnc has said that she would refuse to pay any fine and that she was willing to suffer imprisonment.\nVeldjesgraaf stated that the activists were entitled to protest, his objection was to their touching his truck (which may jeopardise their own safety) or feeding the pigs. He considers the charges justifiable. He claims that the pigs were loaded an hour before the incident and it was unlikely they were dehydrated. \"Metro\" printed a rebuttal from Bob Comis, a former breeder who stated that the pigs as seen in video of the incident showed symptoms of \"severe heat stress\". 
Eric van Boekel in support of his complaint said, \"They don't have the right to involve other people's property and they don’t have the right to protest illegally\". He claimed that rules set by pig breeders regarding food and water were followed by his operations. A story reporting the incident noted that breeding facilities owned by the same Eric van Boekel were charged with polluting the Thames river in April 2007 and fined $120,000.\nKrajnc has stated that treating living animals such as pigs as property – \"no different than a toaster\" – is the focal issue of the matter and that being compassionate to others should not be considered criminal.\nReactions.\n\"The Guardian\" reports that many online petitions have been created in defence of Krajnc. By November 30, 2015, the petition on Care2 called \"Compassion Isn't a Crime\" had 125,500 signatories, while another on Change.org asking the Ontario Court of Justice to drop charges against her, had over 24,600. \"The Daily Telegraph\" considers the case \"a cause célèbre for animal welfare activists\". Another story reports that the case has caused Krajnc to \"become a minor celebrity on social media.\" Instagram and Facebook pages have been created.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691833","title":"Alina Albu","body":"\nAlina Albu\n\nAlina-Speranta Albu (born ) is a retired Romanian female volleyball player, who played as a middle blocker. She was part of the Romania women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Dinamo Bukarest.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691841","title":"Elena Butnaru","body":"\nElena Butnaru\n\nElena Butnaru (born ) is a retired Romanian female volleyball player, who played as a middle blocker. She was part of the Romania women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. She also competed at the 2001 Women's European Volleyball Championship and 2005 Women's European Volleyball Championship. On club level she played with Pallavolo Palermo.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691843","title":"Streptomyces coacervatus","body":"\nStreptomyces coacervatus\n\nStreptomyces coacervatus is a Gram-positive bacterium species from the genus of \"Streptomyces\" which has been isolated from the intestinal tract of the common pill-bug Armadillidium vulgare in Chiba City in Japan.\nReferences.\n \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691848","title":"Lasse Lehmann","body":"\nLasse Lehmann\n\nLasse Lehmann (born May 20, 1996) is a German footballer who plays for Stuttgarter Kickers.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691850","title":"Maria Chivorchian","body":"\nMaria Chivorchian\n\nMaria-Eugenia Chivorchian (born ) is a retired Romanian female volleyball player, who played as a universal . She was part of the Romania women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Amici Bacau.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691851","title":"Booze Traveler","body":"\nBooze Traveler\n\nBooze Traveler is an American travel television series hosted by Jack Maxwell. The premise involves Maxwell traveling the world to partake in international (and domestic) alcohol-based customs, as well as observe the culture of specific areas in a more general sense. It premiered on Travel Channel on November 24, 2014. Season 1 consisted of 15 episodes, and Season 2 will have 16 episodes. The status of Season 3 is currently unknown.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691853","title":"Andreea Constantinescu","body":"\nAndreea Constantinescu\n\nAndreea-Florina Constantinescu (born ) is a retired Romanian female volleyball player, who played as a 0. She was part of the Romania women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with VC Unic Piatra Neamt.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691856","title":"Mirela Corjeutanu","body":"\nMirela Corjeutanu\n\nMirela Corjeutanu (born ) is a retired Romanian female volleyball player, who played as a universal. Corjeutanu also competed at the 2001 Women's European Volleyball Championship squads and 2005 Women's European Volleyball Championship squads. She was part of the Romania women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Futura Volley Sanarate.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691868","title":"Strike Force (1975 film)","body":"\nStrike Force (1975 film)\n\nStrike Force is a 1975 television film starring Richard Gere.\nPlot.\nA federal agent and a New York City detective join forces with state trooper to break up a drug ring.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691869","title":"Football records in Croatia","body":"\nFootball records in Croatia\n\nThis page details football records in Croatia. It counts only results and records from 1992 onwards, as that year marked start of Croatian First Football League. Prior 1992 Croatian clubs were part of Football Association of Yugoslavia. Croatia declared independence from Yugoslavia in 1991.\nNational team.\nResults.\nCroatia - Australia 7-0, 6 June 1998 (friendly)\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691870","title":"Carmen Marcovici","body":"\nCarmen Marcovici\n\nCarmen-Alida Marcovici (born ) is a retired Romanian female volleyball player, who played as a middle blocker. She was part of the Romania women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany and 2005 Women's European Volleyball Championship. On club level she played with Boavista Porto.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691875","title":"Rani Sati Temple Jhunjhunu","body":"\nRani Sati Temple Jhunjhunu\n\nRani Sati, also identified as Narayani Devi and referred to as Dadiji (grandmother), is said to be a Rajasthani woman who lived sometime between the 13th and the 17th century and committed sati (self-immolation) on her husband's death. Various temples in Rajasthan and elsewhere are devoted to her worship and to commemorate her act. Rani Sati Temple Jhunjhunu is biggest temple of Rani Sati in india.\nJai Shree Rani Sati\nHistory.\nThe history of\nRani Sati Dadi Maa starts from the time of Mahabharata.\nNarayani's wish of being married to Abhimanyu and her desire to be sati in her next life.\nAs granted by Lord Krishna, in her next life she was born as the daughter of Gursamal in the village of Dokwa in Rajasthan. She was named - Narayani. Abhimanyu took birth in Hissar as son of Jaliram and named - Tandhan. Tandan and Narayani got married and were leading a peaceful life. He was in possession of a beautiful horse which was being eyed by the son of king of Hissar from quite some time. Tandan refused to hand over his precious horse to the king’s son.\nThe king’s son then decides to forcefully acquire the horse and thus challenges Tandan for a combat. However Tandan fights the battle bravely and kills the King’s son instead. The enraged king thus kills Tandan in front of Narayani in the battle. Narayani symbolic to female bravery and power fights with the king and kills him. 
She then commanded Ranaji (the caretaker of the horse) to make immediate arrangements for her to be set ablaze along with her husband’s cremation.\nRanaji playing a vital role in fulfilling her wish to be sati with her husband is then blessed by Narayani that his name will be taken and worshiped along with her name and since then she is known as Rani Sati.\nTemple.\nThe most amazing feature of this famous temple is that it does not hold any paintings or statues of either female or male gods. Instead a trident depicting power and force is worshipped religiously by the followers. However one can surely find a beautiful portrait of Rani Sati in the pradhan mand. The temple is prepared with white marbles and has colorful wall paintings.\nIn the complex of Rani Sati temple there is also the Lord Hanuman Temple, Sita Temple, Lord Ganesha Temple and Lord Shiva Temple. The regular ‘Prasad’ distribution takes place after every ‘aarti’. There are also arrangements made for the meals in day time on payment basis. It is beautiful and intricately crafted, not to forget the golden pot at the top of the temple.\nThere are in all 13 sati temples in the complex with 12 smaller one’s and 1 main temple dedicated to Rani Sati Dadi Built in pure white marble with a red fluttering flag at the top, the building forms are interesting and marvelous.\nA huge statue of Lord Shiva in the center of the complex surrounded by the lush green gardens, adds to the beauty of the place.\n Inside the temple, the interiors, adorned with exquisite murals and fascinating rich glass mosaics depicting the entire history of the place, are eye-catching.\nObservances and festivals.\nHundreds of devotees visit the temple every day. An elaborate aarti is performed at the temple two times a day. These are:\nA special Poojan utsav is held on the occasion of\n Bhadrapada Amavasya : The 15th day of the dark half of Bhadrapada month in the Hindu calendar is of special significance to the temple.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691882","title":"Buddhist Rock Carvings in Manglawar","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48691883","title":"Florentina Nedelcu","body":"\nFlorentina Nedelcu\n\nFlorentina Nedelcu (born ) is a retired Romanian female volleyball player, who played as a wing spiker. She was part of the Romania women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany and 2005 Women's European Volleyball Championship. On club level she played with VC Unic Piatra Neamt.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691894","title":"Cristina Pîrv","body":"\nCristina Pîrv\n\nCristina-Lucretia Pîrv (born ) is a retired Romanian female volleyball player, who played as a wing spiker. She was part of the Romania women's national volleyball team at the 1994 FIVB Volleyball Women's World Championship in Brazil., 2002 FIVB Volleyball Women's World Championship in Germany and 2001 Women's European Volleyball Championship. On club level she played with Minas Tênis Clube.\nPersonal life.\nSince 2003 she has been married to the Brazilian former international volleyball player, Giba. They have 2 children together, a daughter Nicoll (8) and a son Patrick (4). In November 2012, Cristina has filled for divorce.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691918","title":"2015–16 Aris Thessaloniki F.C. season","body":"\n2015–16 Aris Thessaloniki F.C. season\n\nThe 2014–15 season is Aris Thessaloniki F.C. 2nd season in Gamma Ethniki. They will also compete in the Macedonia Football Clubs Association Cup.\nOn 17 September 2015, Nikos Anastopoulos appointed as manager.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691932","title":"Piano District","body":"\nPiano District\n\nThe Piano District is the name proposed by two developers for what is currently known as the Port Morris neighborhood of the South Bronx. The two developers, Somerset Partners and The Chetrit Group, purchased two riverfront properties for $58 million with the goals of establishing luxury residences and retail.\nCurrent residents, fearing the effects of gentrification, are voicing opposition. Critics and proponents have accused one another of racism. The developers were criticized by Melissa Mark-Viverito, the president of the New York City Council for conducting a Halloween rave, attended by numerous celebrities, with the theme of \"Macabre Suite\" created and curated by Lucien Smith, and hosted by warehouse owner, private equity mogul Keith Rubenstein who is head of real estate developers Somerset Partners, and art dealer Jeanne Greenberg-Rohatyn. The rave featured flaming trash cans and hulks of burnt-out and bullet-riddled cars. Mark-Viverito accused the developers of a lack of empathy and basic awareness.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691945","title":"Anca Popescu","body":"\nAnca Popescu\n\nAnca Popescu (born ) is a retired Romanian female volleyball player, who played as a middle blocker. She was part of the Romania women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with TV Fischbek.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691948","title":"Nightside (film)","body":"\nNightside (film)\n\nNightside is a 1980 television pilot starring Doug McClure.\nPlot.\nTelevision pilot about the adventures of a streetwise cop working the night shift in Los Angeles with a naive partner.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691949","title":"Nicoleta Tolisteanu","body":"\nNicoleta Tolisteanu\n\nNicoleta Tolisteanu (born ) is a retired Romanian female volleyball player, who played as a libero. She was part of the Romania women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. She was awarded the best receiver at the 2003 Women's European Volleyball Championship. On club level she played with Amici Bacau.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691962","title":"Marc Dollendorf","body":"\nMarc Dollendorf\n\nMarc Dollendorf (born 7 February 1966 in Waarloos) is a retired Belgian athlete who specialised in the 400 metres hurdles. He represented his country at the 1996 Summer Olympics as well as four consecutive World Championships starting in 1991.\nHis personal best in the event is 48.91 seconds set in Atlanta in 1996. This is the standing national records.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691966","title":"Ordinary People (Steve Harley song)","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48691968","title":"Luminita Trombitas","body":"\nLuminita Trombitas\n\nLuminita-Gabriela Trombitas (born ) is a retired Romanian female volleyball player, who played as a setter. She was part of the Romania women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Petrarca Padua.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691973","title":"Carmen Țurlea","body":"\nCarmen Țurlea\n\nCarmen Turlea (born ) is a retired Romanian female volleyball player, who played as a opposite. She was part of the Romania women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Foppapedretti Bergamo.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691981","title":"Garoutte Creek","body":"\nGaroutte Creek\n\nGaroutte Creek is a tributary of the Little River in the U.S. state of Oregon. Rising along the Calapooya Divide near the border between Lane and Douglas counties, it flows generally northeast to meet the larger stream near Black Butte. The butte is a dark-colored mountain, the site of a former mine, and the site of a former post office. Little River joins Big River a few miles downstream to form the Coast Fork Willamette River.\nOn older maps, Little River appears as a tributary of Garoutte Creek, also known as Saroutte Creek. However, in 1988 the United States Board on Geographic Names renamed the lower reach of Garoutte Creek so that it became part of Little River. The change rendered the upper reach of Garoutte Creek a tributary of Little River. \nThe only named tributary of Garoutte Creek is Carlson Creek, which enters from the left.\nPost office.\nThe Black Butte Mine, developed by S. P. Garoutte in the 1890s, led to the establishment of a post office at Black Butte. William Harris was the first postmaster, and the office, established in 1898, was known by his last name, \"Harris\". The name was changed in 1901 to Blackbutte. It operated under that name until permanently closing in 1957. \nPollution.\nIn the 21st century, the former mine and the area around it have become a Superfund site. The Environmental Protection Agency is concerned about methylmercury contamination of streams including Garoutte Creek, the Little River, and the Coast Fork, as well as the Cottage Grove Reservoir on the Coast Fork. During its heyday, the mine was the second-largest mercury producer in Oregon. From 1900 to 1957, it yielded a total of 16,904 flasks of elemental mercury; equivalent to about .\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48691992","title":"Choi Kwang-hee (volleyball)","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48691998","title":"Tom Connell (American football)","body":"\nTom Connell (American football)\n\nTom Connell ( – ) was an American football player. He played at the halfback position for the University of Detroit Titans football team and was captain of the undefeated 1928 team that was selected by Parke H. Davis as that year's national champion. He scored 126 points in 1928, ranking second in scoring nationally. He was also the captain of the 1927 Detroit team and the first Detroit player to be twice selected as captain. He was married in 1932 to Josephine Gleason, a music teacher.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692009","title":"Huang Jing","body":"\nHuang Jing\n\nHuang Jing (; 1912 – 10 February 1958), born Yu Qiwei (), was a Chinese Communist revolutionary and politician who served as Mayor and Communist Party Chief of Tianjin municipality, Minister of the First Ministry of Machine Building Industry, and Chairman of the National Technological Commission. He was an ex-husband of Jiang Qing, who later married Mao Zedong, and the father of Yu Qiangsheng, a top Chinese intelligence officer who defected to the United States in 1985, and Yu Zhengsheng, the fourth-ranked member of the Politburo Standing Committee.\nEarly life and revolution.\nYu Qiwei was born in 1912 to a prominent family in Shaoxing, Zhejiang Province. His uncle Yu Ta-wei later served as Minister of National Defense of the Republic of China on Taiwan. The chemist Zeng Zhaolun was also his uncle. Yu enrolled in Shandong University in Qingdao, majoring in physics. At the same time, he spent significant amount of time in underground political activism for the Communist Party of China.\nWhile in Qingdao, Huang Jing met and married Li Yunhe (who would later change her name to \"Jiang Qing\" and marry Mao Zedong), in 1932. Huang introduced the 19-year-old Li to join the Communist Party in 1933. Soon afterwards, Huang was arrested by the government for his Communist activism. To avoid implicating Li, he sent a message asking her to leave him. Li was introduced to Shanghai film director Shi Dongshan, who was in Qingdao at the time, and followed Shi to Shanghai. After Huang's release in 1934, he lived with Li for a while with his family in Shanghai. 
However, Huang's family was adamantly against their marriage, and they became separated.\nIn 1935, Huang Jing, then attending Peking University, co-led the December 9th Movement with Yao Yilin and Huang Hua, demanding the Chinese government to actively resist Japanese aggression in the aftermath of the Mukden Incident.\nAfter the Japanese invasion of China in 1937, Huang moved to the Communist base in Yan'an in winter 1939. Li Yunhe, now known as Jiang Qing, had also moved to Yan'an and married the Communist leader Mao Zedong. Huang later became a department head in the Communist bases in Shanxi-Chahar-Hebei (Jin-Cha-Ji) and Shanxi-Hebei-Shandong-Henan (Jin-Ji-Lu-Yu) border areas.\nPolitical career.\nFollowing the surrender of Japan in 1945, the Communists took over northern Hebei Province, and Huang was appointed Mayor of Zhangjiakou. After the founding of the People's Republic of China in 1949, he became the Mayor of the Tianjin municipality, as well as the city's Communist Party Chief.\nIn 1952, Huang was appointed Minister of the First Ministry of Machine Building Industry, which was in charge of the civilian industry (the Second Ministry was in charge of military work). When the National Technological Commission was established in 1956, he became its first chairman. While serving in these capacities Huang praised the work of a young engineer in Shanghai named Jiang Zemin, the later Chinese president, who recalled that Huang invited him to a banquet at the Quanjude duck restaurant, and on another occasion, talked to him for four hours until 11 pm.\nHuang Jing was considered a promising young star of the Communist Party, but was labelled a counterrevolutionary when the Anti-Rightist Campaign began in 1958. He died in Guangzhou that same year, at the age of only 46. The circumstances surrounding his death are unclear. 
It is said that he suffered from mental and physical diseases and died of heart disease in a military hospital.\nFamily.\nAfter his relationship with Jiang Qing ended, Huang Jing married the journalist Fan Jin, who later became vice mayor of Beijing and president of \"Beijing Daily\". Their son, Yu Qiangsheng, was a top Chinese intelligence officer who defected to the United States in 1985. Another son, Yu Zhengsheng, rose to become one of the seven members of the Politburo Standing Committee in 2012, which effectively rules China.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692018","title":"Vellaiya Irukiravan Poi Solla Maatan","body":"\nVellaiya Irukiravan Poi Solla Maatan\n\nVellaiya Irukiravan Poi Solla Maatan is aTamil comedy film written and directed by newcomer A. L. Abanindran.\nProduction.\nThe project was announced by Ignite Films and director Abanindran in late 2014, and marked the director's feature film debut after he had previously, along with his partner Devanshu Arya, assisted director Rajiv Menon's \"Minsara Kanavu\" (1997) and \"Kandukondain Kandukondain\" (2000). The film features newcomer Praveen Kumar, who played a supporting role in \"Kalyana Samayal Saadham\" (2013) in the lead role alongside Shalini Vadnikatti, a model from Hyderabad. Abanindran had worked with Praveen Kumar and the producers, Ignite Films, before, when the trio worked on the television serial, \"Dharmayutham\" for Vijay TV during 2012. Cinematographer Ravi Varman also worked as a co-producer for the film, marking his maiden production. The ensemble cast was also revealed to feature Sanam Shetty, Karthik Kumar, Naren, Jayaprakash and Bala Saravanan, while Anthony was announced as the film's editor. The film was named after a dialogue from Vadivelu's comedy track in the film, \"Arya\" (2007).\nThe team shot the film around Chennai in forty days. After the film was completed, S. Thanu of Kalaipuli International bought the film's worldwide distribution rights.\nRelease.\nThe film released to mixed reviews in December 2015, having been delayed for three weeks as a result of the 2015 South Indian floods. A critic from the New Indian Express noted that \"it was an impressive debut\".\nThe Times of India review rated the movie 3 out of 5 stars.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692033","title":"Saeed Ibn Qais Hamdani","body":"\nSaeed Ibn Qais Hamdani\n\n Saeed Ibn Qais Hamdani () One of the leaders and Tabi‘un Hermit including close friends Ali and Hasan ibn Ali, head of the Yemeni tribe of Hamdan in Iraq. In the year 33 AH by Saeed bin Aas, who was then governor Osman was in Kufa, responsible government was Rey, Iran.\nCharacteristics.\nHe was faithful helpers Ali. Ali ibn Abi Talib in several battles, including the Battle of the Camel, Battle of Siffin the head of the army. After the death of Ali, Saeed ibn Qays al-Hamadani had joined Hasan ibn Ali and companions.\nDeath.\nDate of his death is not known but some date in the year 50 AH he noted.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692034","title":"Arun Pudur","body":"\nArun Pudur\n\nArun Pudur (born October 10, 1977) is an Indian origin Billionaire, Businessman, Serial Entrepreneur, investor, and philanthropist. His operations headquarters are in Kuala Lumpur, Malaysia and New York, USA. Pudur started his career fixing scooters in his garage at age 13, he then started breeding champion dogs before venturing into technology. He is the Founder and Group President of Celframe, the world’s second largest Office Productivity Suite software company after Microsoft Office. In his tenure, Celframe rose from a backend support company to a Multi-Billion Dollar Technology company with businesses around the Global while it is privately held and majority owned by him. He is consistently ranked in lists of Billionaires. Arun Pudur is Asia's richest, under 40 person with wealth more than $4 billion and is also ranked 10th among World’s Richest in the list published by Bloomberg, CNBC, WSJ, Wealth-x, Market Watch, and CNN among other major publications worldwide. Pudur is the only Indian Billionaire to make the list which includes Mark Zuckerberg of Facebook among other billionaires.\nEarly life.\nPudur was born in Chennai, but his family shifted to Bengaluru, as his father used to stay 7 to 8 months an year there. His father, Sri Ranga, was a cinematographer, known for his 16mm movies. He had chosen commerce as field of interest in college, as opposed to science, despite everyone around him telling him to take science. He is an alumni of Bangalore University. He started his career starting a scooter garage to fix Kinetic Honda and soon franchised the garage all over Karnataka state. He says that he learned all the marketing skills, problem solving, customer handling, during his time at the garage.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692040","title":"Austrian presidential election, 2016","body":"\nAustrian presidential election, 2016\n\nPresidential elections will be held in Austria on 24 April 2016, with a run-off on 22 May 2016, if necessary. Incumbent president Heinz Fischer has served two terms and is not eligible to be elected for a third successive term.\nCandidates.\nSPÖ: The most likely candidate of the Social Democratic Party was considered to be Labour Minister Rudolf Hundstorfer, though First President of the National Council Doris Bures, Franz Vranitzky (former Chancellor of Austria from 1986 to 1997) and former undersecretary for EU affairs and businesswoman Brigitte Ederer were also mentioned. On 15 January 2016, Rudolf Hundstorfer was officially announced as the SPÖ's candidate.\nÖVP: Justice Minister Wolfgang Brandstetter (considered a possible, if unlikely ÖVP candidate) declined to stand on 26 December 2015. On 7 January 2016, ÖVP leader Reinhold Mitterlehner announced that Erwin Pröll, the Landeshauptmann of Lower Austria, would not be running, to much surprise (as many had predicted he was almost certainly going to be the ÖVP's candidate). Josef Pühringer, Landeshauptmann of Upper Austria, who had also occasionally been mentioned as an (unlikely) candidate, explicitly declined to stand on 8 January 2016. Franz Fischler (former Austrian European Commissioner from 1995 to 2004) and Othmar Karas (highly respected Member of the European Parliament) also both stated they were not the ÖVP candidate on 8 January 2016, while Wirtschaftskammerpräsident Christoph Leitl only said he would not comment before the official announcement by the party leadership on 10 January 2016. Even controversial former chancellor Wolfgang Schüssel (from 2000 to 2007) was briefly considered as a candidate (but he also declined). 
On 10 January 2016, former first president of the National Council Andreas Khol was officially announced as the ÖVP's candidate.\nOther names mentioned were former Science Minister and university professor Karlheinz Töchterle, Foreign Minister Sebastian Kurz (who was too young too stand, not yet being 35 years old), former Foreign Minister Ursula Plassnik (who was in office from 2004 to 2008, and most recently Austria's ambassador to France, about to be reassigned to Switzerland), former Raiffeisen Zentralbank manager Christian Konrad (currently the government's point man on refugee issues; he stated he was not a candidate on 8 January 2016), former Landeshauptfrau of Styria Waltraud Klasnic (in office from 1996 to 2005) and president of the Salzburg Festival Helga Rabl-Stadler, both of whom were considered unlikely to run. This left Plassnik and Leitl as possible candidates as of 8 January 2016. Later in the day, rumours indicated that former first president of the National Council Andreas Khol would be the ÖVP's candidate.\nFPÖ: Norbert Hofer (third president of the National Council), who had been considered the most likely FPÖ candidate, said on 28 December 2015 that he considered himself too young for the office and that he would prefer his party to pick someone else as its candidate. Possible candidates include president of the Austrian Court of Audit Josef Moser, Ursula Stenzel (former district mayor of Vienna's 1st District from 2005 to 2015 and also former Member of the European Parliament from 1999 to 2006, both for the ÖVP), ombudsman Peter Fichtenbauer and possibly party leader Heinz-Christian Strache himself. Former Social Affairs Minister Ursula Haubner was considered a very unlikely candidate. As of 11 January 2016, Fichtenbauer, Moser and Stenzel continued to be the most likely candidates. Strache announced on 13 January 2016 that he would not be running himself, and that it was still open whether the FPÖ would nominate anyone at all. 
In mid-January, Vienna vice-mayor Johann Gudenus and former FPÖ leader and former vice-chancellor (from 1983 to 1987) Norbert Steger were also mentioned as possible candidates. On 19 January 2016, author and Middle East/migration pundit Karin Kneissl (well-known for her right-wing views) was mentioned as being recruited by the FPÖ to run, which she quickly declined. Former Justice Minister Dieter Böhmdorfer, members of parliament Harald Stefan and Johannes Hübner and MEP Barbara Kappel were also mentioned as possible candidates. On 20 January 2016, media reported that Gudenus had been internally selected as the FPÖ's candidate; on 26 January 2016, reports claimed Stenzel would be announced on 28 January 2016 as the FPÖ's candidate. Amid strong FPÖ-internal dissent, there were rumours the party leadership had been forced to reconsider, and that Hofer was now the most likely option, after all, with Gudenus also still in play. Commentators opined that the backtracking was a notable defeat for Strache. Norbert Hofer was announced as the FPÖ's candidate on 28 January 2016.\nGreens: In early January 2016, it was announced that former Greens party leader Alexander Van der Bellen would not be running as the Greens' “official” candidate, as that would have required a party convention decision; this was also framed as an attempt to put personality above party politics in the election. Van der Bellen officially announced his candidacy on 8 January 2016 in a YouTube video. NEOS leader Strolz stated that they would consider giving him the same support as Griss, depending on the same kind of hearing she went through.\nTeam Stronach: As of 22 January 2016, the Team Stronach was still considering whether to nominate a candidate.\nOthers: Independent candidate Irmgard Griss, a former Supreme Court of Justice judge and its president, officially declared her candidacy on 17 December 2015. 
She presented her candidacy to both the Freedom Party of Austria and NEOS, but both declined to endorse her. NEOS said they would support Griss and any other independent candidates indirectly, and voiced their concerns over the strong partisan politicization of the presidential office and the election campaign.\nRichard Lugner, society figure, businessman and previously candidate for president in 1998, was reportedly also considering running once more. Martin Wabl, who had previously attempted to run in 1998, 2004 and 2010, but failed to gather the necessary number of signatures of support, stated he would try to run once again. Ulrich Habsburg-Lothringen, whose initiative to get the so-called “Habsburger-Paragraf” (which had precluded members of the former ruling house from running for president) proved successful in 2011, stated he would like to run for president, but only if a political party decided to support him. Adrien Jean-Pierre Luxemburg-Wellenstein announced on 8 December 2015 he would run for president. Author El Awadalla (also known for winning the Austrian version of Who Wants to Be a Millionaire?) announced her run on 12 January 2016. (She had previously run for the left-wing alliance Wien anders in the 2015 Viennese state election.) Local activist Franz Stieger (known in Krems for his numerous conflicts with local officials and government agencies) announced his candidacy on 13 January 2016. Further independent candidates who announced their runs were Gustav Jobstmann, Thomas Unden (a general practitioner who had stated he would refuse to treat asylum seekers), Gernot Pointner, Alois Merz, Georg Zakrajsek of the \"Interessengemeinschaft Liberales Waffenrecht Österreich\" (a fringe gun rights group), Karin Kolland, Robert Marschall of the EU Exit Party and Thomas Reitmayer of the Austrian version of the satirical political party Die PARTEI.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692069","title":"Curling at the 2016 Winter Youth Olympics – Mixed doubles","body":"\nCurling at the 2016 Winter Youth Olympics – Mixed doubles\n\nMixed doubles curling at the 2016 Winter Youth Olympics will be held from February 19 to 21 at Kristins Hall in Lillehammer, Norway.\nTeams.\nThe teams will consist of athletes from the mixed team tournament, one boy and one girl from different NOCs. The teams will be selected by the organizing committee based on the final ranking from the mixed team competition in a way that balances out the teams, and will be assigned on February 17. The players in each pair will then be allowed time to train together.\nTeams are to be determined.\nKnockout Results.\nAll draw times are listed in Central European Time (UTC+01).\nRound of 32.\nDraw 1.\n\"Friday, February 19, 9:00\"\nDraw 2.\n\"Friday, February 19, 12:30\"\nDraw 3.\n\"Friday, February 19, 16:00\"\nDraw 4.\n\"Friday, February 19, 19:30\"\nRound of 16.\nDraw 1.\n\"Saturday, February 20, 9:00\"\nDraw 2.\n\"Saturday, February 20, 13:00\"\nQuarterfinals.\n\"Saturday, February 20, 17:00\"\nSemifinals.\n\"Sunday, February 21, 9:00\"\nBronze Medal Game.\n\"Sunday, February 21, 13:00\"\nGold Medal Game.\n\"Sunday, February 21, 13:00\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692071","title":"First Presbyterian Church (Raleigh, North Carolina)","body":"\nFirst Presbyterian Church (Raleigh, North Carolina)\n\nFirst Presbyterian Church is a historic Presbyterian church located at the corner of Morgan and Salisbury Streets in downtown Raleigh, Wake County, North Carolina. \nThe church was established in a meeting of Presbyterians at the North Carolina State House (predecessor of the North Carolina State Capitol) on Jan. 21, 1816. The congregation purchased land at the present location and erected a brick church building that opened its doors on February 7, 1818. The church served as the site for the North Carolina Constitutional Convention of 1835 and as the meeting place for the North Carolina Supreme Court for several years.\nThat original structure was torn down and a new church building completed in 1900. It was designed in the Romanesque Revival style by architect A.G. Bauer and has been extensively remodeled twice, in 1955 and 2012. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692073","title":"Henryk Weyssenhoff","body":"\nHenryk Weyssenhoff\n\nHenryk Bonawentura Kazimierz Weyssenhoff (26 July 1859, near Kaunas - 23 July 1922, Warsaw) was a Polish-Belarusian landscape painter, illustrator and sculptor of Baltic-German ancestry.\nBiography.\nHe was descended from an old family of the Livonian nobility. In 1863, his father was exiled to Siberia for his participation in the January Uprising. His mother followed with the family, as far as she could, and he grew up in the Urals. His first lessons in art were given to him there by Lucjan Kraszewski (brother of the writer Józef Ignacy Kraszewski), who was also living in exile.\nIn 1874, his father was pardoned, but they were not allowed to return to their old home, so they settled in Warsaw, where he studied painting with Wojciech Gerson. His work there attracted the attention of Henryk Siemiradzki who, in 1880, helped him gain admission to the Imperial Academy of Arts in Saint Petersburg. He graduated in 1885, earning a silver medal and the official title of \"Artist\" for his canvas \"Transport of the Wounded\". In 1889, he spent some time in Munich, improving his skills with Alfred Kowalski.\nIn 1900, he won another silver medal at the Exposition Universelle. As a result, from 1903 to 1904 he lived in Paris, then settled on his parent's estate near Pukhavichy, in what is now Belarus. During the First World War, he was forced to return to Warsaw and remained there until his death.\nAn avid hunter, many of his landscapes included animal life. In addition to his painting, he illustrated several works, notably two by his cousin, Józef Weyssenhoff; \"Erotyki\" (1911), a book of poetry, and \"Soból i Panna\" (1913), a novel that is loosely based on the manorial lifestyle of the Weyssenhoff family.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692076","title":"Mi Perú District","body":"\nMi Perú District\n\nMi Perú is a district of the Constitutional Province of Callao in Peru, and one of the seven districts that comprise the port city of Callao.\nHistory.\nMi Perú was part of Ventanilla District until May 17, 2014 when it was created as District by Law N° 30197.\nGeography.\nThe district has a total land area of 2.47 km². Its administrative center is located 34 meters above sea level.\nAuthorities.\nThe current mayor of the district is Reynaldo Encalada Tovar.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692084","title":"Whitewater, Wisconsin, parks and trails","body":"\nWhitewater, Wisconsin, parks and trails\n\nWhitewater, Wisconsin, is a town located in Southeastern Wisconsin roughly 45 minutes from Madison and Milwaukee. The city’s population is 14,732 and features one of the University of Wisconsin system schools, The University of Wisconsin-Whitewater. Throughout the city and surrounding areas, there are over 20 parks, trails and preserves.\nCravath Lakefront Park.\nCravath Lakefront Park was opened in the early 1990s in downtown Whitewater. It is located at 341 South Fremont Street. The park was created to try and create an open space downtown to encourage more visitors. The design for the park was loosely based on the Whitewater Passenger Train Depot. The park itself used to be for more industrial purposes instead of a recreational area. Once it was turned into a park, though, it holds events like Freeze Fest and Pig in the Park as well as the Fourth of July. On top of that, Cravath Lakefront Park is willing to hold celebrations, concerts and weddings.\nBig Brick Park.\nBig Brick Park is located at 611 West Center Street in the heart of Whitewater, WI. This park is roughly one square block in size and is open to the general public. This park has a blacktop basketball court and a playground. For the winter months the city creates its own ice rink for the public to ice skate as well as play hockey. The city provides nets for the hockey players to enjoy the ice time during the bitter cold Wisconsin winter.\nTrippe Lake Park.\nTrippe Lake is located at 407 S Wisconsin Street and has been around since 1958, named in honor of Dr. James and Rosepha Trippe, as being founders of the city. You can enjoy the beautiful lake where a dam was construed to power a sawmill. Community members use it for swimming, fishing, free boat launch and as a group gathering place. 
The local Whitewater’s Lion Club donated the Trippie Lake Shelter in 2009. It includes restrooms, picnic tables, kitchen, and storage space for recreations programs. Trippe Lake has many options for all seasons, summer swimming to\nsledding and ice fishing in winter. It adds great value to the Whitewater Community.\nWhitewater Creek Nature Area.\nLocated off Fremont Street on the outskirts of campus you can find Whitewater Creek Nature Area. It is a great location with a lot to park and hit the walking trails. It is open all year round from 6am to 12pm. Trails take you into and through the woods, giving you great scenic views along the creek. It is public land for the community to use in a respectful way. There are lots of wildlife activity and natural forest activities. Whitewater Creek Nature Area is a beautiful area in that is unlike any other place in Whitewater.\nCity of Whitewater “Bark Park”\nThe city features a spacious dog park that is free of charge. The park features three areas for all sizes of dogs. Located at the East end of Commercial Avenue in Whitewater, it provides a fun and clean environment for all animals. The three areas are designated for different sized dogs. This area is roughly 4 acres of city property. The city mows and provides dog clean up bags for no price. For pet owners, there are multiple benches and picnic tables available for seating.\nIce Age Trail.\nLocated 4 miles east of Whitewater on HWY 12 is a section of the infamous Ice Age Trail. The trail is nearly 1,200 miles long stretching from Minnesota to the shores of Lake Michigan. The beautiful trail extends approximately 10 miles through the southern part of Whitewater. This section of the trail is near scenic Whitewater Lake and Rice Lake. The Trail is also connected with the Whitewater Lake Campground. The trail is animal friendly and open year round for hikers and snowshoeing. 
One end of the trail begins in Potawatomi State Park near Sturgeon Bay, WI and the other ends in Interstate Park near the St. Croix River on the Wisconsin/Minnesota border in St. Croix, WI.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692092","title":"Fabrizio Santino","body":"\nFabrizio Santino\n\nFabrizio Santino (born December 12, 1982) is a British actor who is best known for playing Ziggy Roscoe in the soap opera \"Hollyoaks\" between 2013 and 2015. Fabrizio will play Jake Albert in an upcoming BBC drama entitled Hawaiian Hotel due to air in Spring 2016.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692132","title":"Frederick Hanger House","body":"\nFrederick Hanger House\n\nThe Frederick Hanger House is a historic house at 1010 Scott Street in Little Rock, Arkansas. It is a two story wood frame structure, with complex massing and exterior typical of the Queen Anne style. It is topped by a gable-on-hip roof, from which numerous gables project, including two to the front, and has walls sheathed in clapboards and bands of decorative cut shingles. A porch extends across the front, supported by turned posts, with a balustrade of wooden circles joined by posts to each other and the supporting posts. It was built in 1889 for one of Little Rock's most prominent businessmen of the period, and is a particularly little-altered example of the Queen Anne style in the city.\nThe house was listed on the National Register of Historic Places in 1974.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692146","title":"Butyrsky (rural locality)","body":"\nButyrsky (rural locality)\n\nButyrsky (; masculine), Butyrskaya (; feminine), or Butyrskoye (; neuter) is the name of several rural localities in Russia:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692150","title":"Oregon Institute of Technology, Wilsonville","body":"\nOregon Institute of Technology, Wilsonville\n\nThe Oregon Institute of Technology, Wilsonville (also referred to as Oregon Tech Wilsonville, or simply OITW) is a public polytechnic and research university located in Wilsonville, Oregon, United States. It is the urban campus of the Oregon Institute of Technology.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692152","title":"Butyrsky","body":"\nButyrsky\n\nButyrsky (masculine), Butyrskaya (feminine), or Butyrskoye (neuter) may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692168","title":"The Thanksgiving Story","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48692169","title":"Hardy House (Little Rock, Arkansas)","body":"\nHardy House (Little Rock, Arkansas)\n\nThe Hardy House is a historic house at 2400 Broadway in Little Rock, Arkansas. It is a two story brick structure, with flanking single-story wings and a roof that is designed to resemble an English country house's thatched roof. The entrance is set in a centrally located stone round arch, with a multipart segmented-arch window above. The house was designed by Charles L. Thompson and built in 1921.\nThe house was listed on the National Register of Historic Places in 1982.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692204","title":"2016 TCR Russian Series season","body":"\n2016 TCR Russian Series season\n\nThe 2016 TCR Russian Series season is the second season of the TCR Russian Series.\nCalendar and results.\nThe 2016 schedule was announced on 11 November 2015, with all events scheduled to be held in Russia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692210","title":"Karosa B 831","body":"\nKarosa B 831\n\nKarosa B 831 is citybus, which was made in three pieces by bus manuafcturer Karosa between 1987-1989. It was intended as successor of Karosa B 731 and with trolleybus Škoda 17Tr had to be part of unificated series of city vehicles. Until now survived only one, which is placed in muzeum in Brno.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692213","title":"London Recruits (film)","body":"\nLondon Recruits (film)\n\nLondon Recruits is the upcoming film documenting the true story of the young men and women who undertook clandestine missions for the ANC during apartheid South Africa. Produced by Barefoot Rascals, the docu-drama is directed by Gordon Main. London Recruits shares a title with the 2012 book London Recruits: The Secret War Against Apartheid, edited and compiled by Ken Keable.\nPlot.\nSet at a time when ANC membership was prohibited and its activists executed or imprisoned, London Recruits tells the story of the actions of young women and men who traveled to South Africa disguised as honeymooning couples, tourists and business trippers, aimed at bringing down the apartheid regime. The London Recruits, in a plan activated by Oliver Tambo, were recruited by Ronnie Kasrils and deployed to undertake secret missions involving the transportation of anti-apartheid leaflets in false bottom suitcases and the detonation of bucket bombs in strategic commuter sites.\nThe Recruits.\nThe facilitator of the operation was Ronnie Kasrils. South African born, Ronnie was dispatched to London by Oliver Tambo to recruit women and men to carry out missions for the ANC. Mary Chamberlain, author of Fenwomen: A Portrait of Women in an English Village was among the recruits enrolled by Ronnie to carry out the clandestine work in 1971 at the age of 24. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692256","title":"SS Ada (1905)","body":"\nSS Ada (1905)\n\nSS \"Ada\" was a cargo vessel built for the London and South Western Railway in 1905.\nHistory.\nShe was built by Gourlay Brothers in Dundee and launched on 4 April 1905 by Miss Drummond. She was launched only 47 days after the keel was laid, without overtime being worked, and represented a record for the Gourlay shipyard. She was the first of a pair of ships ordered by the London and South Western Railway, the other being . She was built for light cargo traffic between Southampton and the Channel Islands. \nShe was acquired by the Southern Railway in 1923.\nShe was scrapped in 1934.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692277","title":"Fulvio Caccia","body":"\nFulvio Caccia\n\nFulvio Caccia (born 10 January 1952 Florence, Italy) is a contemporary Italian poet, novelist and essayist. He won the 1994 Prix du Gouverneur Général.\nBiography.\nFulvio Caccia graduated from l'Université du Québec à Montréal in 1979.\nHe lives in Paris.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692282","title":"Keyarris Garrett","body":"\nKeyarris Garrett\n\nKeyarris Garrett (born September 26, 1992) is an American football wide receiver. He played college football at Tulsa.\nCareer.\nDuring the 2015 season, he had 96 receptions for 1,588 yards and eight touchdowns. On October 23, 2015, Garrett caught 14 passes for an American Athletic Conference record 268 receiving yards. For his career he had 219 receptions for 3,209 yards and 22 touchdowns.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692284","title":"Harris House (Little Rock, Arkansas)","body":"\nHarris House (Little Rock, Arkansas)\n\nThe Harris House is a historic house at 6507 Fourche Dam Pike in Little Rock, Arkansas. It is a single-story stuccoed structure, designed in an eclectic interpretation of Spanish Revival architecture. Prominent features include a circular tower at one corner, a parapet obscuring its sloping flat roof, and a port-cochere with a segmented-arch opening supported by battered wooden columns. It was built in 1924 for Florence and Porter Field Harris, to their design and probably the work of Porter Harris, a master plasterer known for his work on the Arkansas State Capitol.\nThe house was listed on the National Register of Historic Places in 1998.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692314","title":"Theodore Swann","body":"\nTheodore Swann\n\nTheodore Swann was an American industrialist and early leader of the chemical industry. He was described by one historian as \"a flamboyant Birmingham mogul and New South industrialist.\"\nHailing from east Tennessee, in his early working years, Swann was a power salesman for the Alabama Power Company.\nHe established the Federal Phosphorus Company to produce concentrated phosphoric acid, mainly for use as a concentrated fertilizer, using a novel method to produce the acid from phosphate rock by heat treatment in an electric furnace.\nHe later established the Swann Chemical Company, focused on production of PCBs for the emergent electrical industry. Swann Chemical Company operated a chemical manufacturing plant in Anniston, Alabama where PCBs were first made on an industrial scale after development of a new process under Swann's leadership. In 1920, Swann gave his engineers the challenge of creating a process by which PCBs, up to that time very expensive and produced only in small quantities, could be produced in industrial quantities, and after much trial and error, they succeeded. The plant was later bought by Monsanto Industrial Chemicals Co. in 1935. The plant, just west of Anniston, had around 1,000 employees. One historian wrote that, \"In many ways, the spirit of Swann Chemical became the corporate culture of Monsanto.\"\nSwann's house in Birmingham, Alabama, built from 1927 to 1930, was at the time the largest residence in the city and cost $600,000 to build.\nWhile Monsanto became the most successful agrochemical corporation in the world, Swann began to slide into poverty. He was forced to sell his castle in 1945 when he filed for bankruptcy. He nearly made a comeback by selling a new design for a furnace to process iron ore to the Cuban dictator Fulgencio Batista, but the dictator reneged after paying only a modest down payment. 
Theodore Swann died selling aluminum window frames on February 5, 1955.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692363","title":"SS Bertha (1905)","body":"\nSS Bertha (1905)\n\nSS \"Bertha\" was a cargo vessel built for the London and South Western Railway in 1905.\nHistory.\nShe was built by Gourlay Brothers in Dundee and launched on 9 November 1905 by Miss Key, daughter of one of the railway superintendents. She was the second of a pair of vessels ordered by the London and South Western Railway, the other being . She was built for light cargo traffic between Southampton and the Channel Islands. \nShe was acquired by the Southern Railway in 1923.\nShe was sold in 1933 to Metal Industries, Limited of Rosyth and used as a salvage vessel in raising some members of the German Fleet scuttled in Scapa Flow. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692393","title":"Inspector General of the Air Force","body":"\nInspector General of the Air Force\n\nThe Office of Inspector General of the Air Force for the United States Air Force was originally established after World War II as The Air Inspector to conduct investigations as directed by the Secretary of the Air Force and the Chief of Staff of the United States Air Force. The current mission of the Air Force Inspector General is prescribed by Title 10 (§ 8020) and Title 32 of the United States Code (§ 105) to develop Air Force and Air National Guard policy to assess readiness, discipline and efficiency with a vision to help shape senior leader decisions affecting the readiness of the Air Force to strengthen the nation's defense.\nThe Office of Inspector General of the Air Force consists of four directorates:\nHistory.\nIn 1943, Junius Jones was designated The Air Inspector of the Army Air Forces and when the AAF became the U.S. Air Force in 1947, he retained his position.\nIn 1948, The Air Inspector was renamed to the Inspector General of the Air Force.\nIn December 1971, Lt Gen Louis L. Wilson Jr. oversees the activation of the Air Force Inspection and Safety Center (which later became the Air Force Inspection Agency in 1991) to provide independent assessments of acquisition, safety, nuclear surety, operations, logistics, support, and healthcare to Air Force senior leaders. It also evaluates Air Force activities, personnel, and policies, and provides legal and compliance oversight of all Air Force-level Field Operating Agencies and Direct Reporting Units.\nIn September 1986, as a result of the Goldwater–Nichols Act, the Inspector General moved directly under the Secretary of the Air Force.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692396","title":"Mirna Ansaldi","body":"\nMirna Ansaldi\n\nMirna Eugenia Ansaldi (born ) is a retired Argentine female volleyball player, who played as a wing spiker. She was part of the Argentina women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Gimnasia y Esgrima de Rosario.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692409","title":"Ride the Man Down","body":"\nRide the Man Down\n\nRide the Man Down is a 1952 American Western film directed by Joseph Kane and written by Mary C. McCall, Jr.. The film stars Brian Donlevy, Rod Cameron, Ella Raines, Forrest Tucker, Barbara Britton, Chill Wills and J. Carrol Naish. The film was released on November 25, 1952, by Republic Pictures.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692410","title":"Julietta Borghi","body":"\nJulietta Borghi\n\nJulietta Borghi (born ) is a retired Argentine female volleyball player, who played as a middle blocker. She was part of the Argentina women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Banco Nación.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692413","title":"Natalia Brussa","body":"\nNatalia Brussa\n\nNatalia Brussa (born ) is a retired Argentine female volleyball player, who played as a middle blocker. She was part of the Argentina women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Central San Carlos.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692418","title":"Mariana Conde","body":"\nMariana Conde\n\nMariana Conde (born ) is a retired Argentine female volleyball player, who played as a wing spiker. She was part of the Argentina women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Volley 2000 Spezzano.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692427","title":"Celina Crusoe","body":"\nCelina Crusoe\n\nCelina Crusoe (born ) is a retired Argentine female volleyball player, who played as a setter. She was part of the Argentina women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Pallavolo Reggio Emilia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692431","title":"Romina Lamas","body":"\nRomina Lamas\n\nRomina Lamas (born ) is a retired Argentine female volleyball player, who played as a setter. She was part of the Argentina women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with CV Teneriffa.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692432","title":"Karen F McCarthy","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48692434","title":"John Chambers (Australian cricketer)","body":"\nJohn Chambers (Australian cricketer)\n\nJohn Chambers (born 30 October 1930) is an Australian former cricketer. He played 27 first-class cricket matches for Victoria between 1950 and 1955.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692436","title":"List of Major League Baseball teams by payroll in 2010","body":"\nList of Major League Baseball teams by payroll in 2010\n\nThis is a list of the 30 Major League Baseball teams from the 2010 season, ranked by total team salary. Values only include salaries of players on their respective 2010 rosters.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692442","title":"List of Major League Baseball teams by payroll in 2012","body":"\nList of Major League Baseball teams by payroll in 2012\n\nThis is a list of the 30 Major League Baseball teams from the 2012 season, ranked by total team salary. Values only include salaries of players on their respective 2012 rosters.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692475","title":"Ivana Müller","body":"\nIvana Müller\n\nIvana Eloisa Müller (born ) is a retired Argentine female volleyball player, who played as a middle blocker. She was part of the Argentina women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Banco Nación.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692485","title":"Andy and the Lion","body":"\nAndy and the Lion\n\nAndy and the Lion, written and illustrated by James Daugherty, is a 1938 picture book published by Puffin Books. \"Andy and the Lion\" was a Caldecott Medal Honor Book for 1939 and was Daugherty's first Caldecott Honor Medal of a total of two during his career. Daughetry won the Caldecott Medal in 1957 for \"Gillespie and the Guards\", which he both authored and Illustrated. \"Andy and the Lion\" was re-issued by Viking Press in 1967 in hardcover format. It was the fifteenth printing of March 1967.\nDescription.\nThe story, written by Daugherty, is told in present tense from a second person point of view (a second-person narrative). It is written and illustrated by James Daugherty. There are illustrations on every page. The illustrations are in a gold color. The story is 80 pages long.\nSynopsis.\nA little boy named Andy was so interested about lions that he went to the library and searched for a book about lions. That same night, his grandfather told him a bedtime story about lions. Andy was so fascinated about the story that he had a dream about lions that same night. The next day, on his way to school, Andy meets a real lion. The lion had a thorn stuck in his paw and Andy helps pull the thorn out. This action makes Andy and the lion friends. Later in the story, a circus comes to Andy's town and of course, Andy attends hoping to see his friend the lion. In the lion act, one of the lions jumps out of the cage, into the audience, right in front of Andy. Andy thinks it's his last day of life. But low and behold, it was his friend the lion! Andy and the lion recognize one another. The lion was the very same one Andy had helped that day take the thorn out of his paw. Andy and the lion rejoice in excitement of seeing one another again. When the crowd attempts to capture the lion, Andy protects it. 
The next day, there is a parade and Andy and the lion lead it. Andy receives an award for bravery. At the end of the story, Andy returns the book he borrowed from the library about lions, pulling his friend the lion behind him.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692492","title":"Georgina Pinedo","body":"\nGeorgina Pinedo\n\nGeorgina Pinedo (born ) is a retired Argentine female volleyball player, who played as a wing spiker. She was part of the Argentina women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with CA Boca Juniors.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692499","title":"Cheerleading in Japan","body":"\nCheerleading in Japan\n\nCheerleading is a recognized sport in Japan that requires physical strength and athletic ability. Cheerleading is available at the junior high school, high school, collegiate, club, and all-star level. Teams can either be all female or coed featuring males and females. \nCompetition guidelines.\nCompetition routines are held on a 12-meter square mat in which the entire surface can be used. Each team must perform a 2 minutes and 30 seconds routine in which 1 minute and 30 seconds of the routine may contain music. Routines showcase different elements including sideline cheers, pyramids and stunts, dance, and gymnastics. There is also a division for group stunt competition where a group of five participants perform a 60–65 seconds routine of strictly stunts. There is also a division for partner stunt competition that includes one male and one female and one spotter. These routines last around 55–60 seconds and can only incorporate stunting.\nHistory.\nApril 24, 1988: Cheerleading Nation Championship in Japan (1st Japan Championships)\nJuly 13, 1988: Foundation of Japan Cheerleading Association opens its association office in Akasaka, Minato-ku, Tokyo\nDecember 23, 1989: 1st All Japan Student Championships\nMay 5, 1990: 1st International Cheerleading All-Japan Championships\nAugust 18, 1990: Japan Championships begin airing by NHK satellite broadcasting\nJanuary 27, 1991: 1st All Japan High School Championships\nDecember 15, 1991: 1st instructor qualification test conducted\nJanuary 10, 1994: Japan Cheerleading Association renamed\nAugust 22, 1998: International Cheerleading Federation inauguration\nNovember 18, 2001: 1st World Championships, women’s Japanese team won the men and women mixed sector\nFebruary 23, 2003: 1st All Japan club team Championships\nNovember 15, 2003: 2nd Cheerleading World Championships, women Japanese team wins the men and 
women mixed sector\nNovember 5, 2005: 3rd World Championship victory for the women’s Japanese team\nApril 21, 2007: 1st Asia International Open Championship\nNovember 17, 2007: 4th World Championships, women’s and men and women mixed Japanese teams won\nNovember 28, 2009: 5th World Championships, men and women mixed Japanese teams won\nNovember 26, 2011: 6th World Championships, men and women mixed Japanese teams won\nNovember 23, 2013: 7th World Championships, women’s, men and women mixed, and group stunt teams participate\nApril 1, 2014: Specialized cheerleading unit established in Tokyo High School Athletic Federation\nAssociations and organizations.\nOn July 13, 1988 the Foundation of Japan Cheerleading Association was founded with the purpose of supervising the cheerleading world as a competitive sport in Japan and to promote a healthy spread and promotion of the cheerleading competition. The Japan Cheerleading Association (JCA) also holds cheerleading and leadership workshops, holds domestic and international competitions, trains trainers, certifies competition equipment, and handles publications.\nThe International Federation of Cheerleading (IFC) is also based in Tokyo, Japan and is the world governing body of cheerleading.\nThe Asian Federation of Cheerleading (AFC) is the governing body of cheerleading in Asia and is one of the continental confederations that makes up the International Federation of Cheerleading. It was formed in 2007 and has its headquarters in Tokyo, Japan.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692502","title":"John Leehane (cricketer, born 1921)","body":"\nJohn Leehane (cricketer, born 1921)\n\nJohn Leehane (20 October 1921 – 22 July 1991) was an Australian cricketer. He played one first-class cricket match for Victoria in 1950.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692503","title":"Marianela Robinet","body":"\nMarianela Robinet\n\nMarianela Robinet (born ) is a retired Argentine female volleyball player, who played as a wing spiker. She was part of the Argentina women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Central San Carlos.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692511","title":"Maria Vicente","body":"\nMaria Vicente\n\nMaria Laura Vicente (born ) is a retired Argentine female volleyball player, who played as a wing spiker. She was part of the Argentina women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with DAM La Rochette.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692517","title":"Micaela Vogel","body":"\nMicaela Vogel\n\nMicaela Vogel (born ) is a retired Argentine female volleyball player, who played as a middle blocker. She was part of the Argentina women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with GEBA.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692518","title":"John Leehane (cricketer, born 1950)","body":"\nJohn Leehane (cricketer, born 1950)\n\nJohn Leehane (born 11 December 1950) is an Australian former cricketer. He played eleven first-class cricket matches for Victoria between 1978 and 1981.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692522","title":"Mahommah Gardo Baquaqua","body":"\nMahommah Gardo Baquaqua\n\nMahommah Gardo Baquaqua was a former slave, native of Zooggoo in Central Africa, a tributary kingdom of Bergoo kingdom. He worked in Brazil as a captive, however he escaped and fled to New York in 1847, assuring his freedom. He wrote a biography, published by American abolitionist Samuel Moore in 1854. His report is the only known document about slave trade written by a Brazilian former slave.\nBiography.\nBaquaqua was born in Djougou (current in Benin) between 1820 and 1830, in a proeminent Muslim trader family. He learned the Quran, literature and mathematics in an Islamic school. Still as an adolescent, he took part into the succession wars in Daboya, together with his brother, where he was captured and then rescued.\nBack to Djougou he became servant of a local dignitary, perhaps the chief of Soubroukou, to whom he calls 'king'. The abuses he committed on that period made him target of an ambush, where he was imprisoned and transported to Dahomey; he would be embarked into a slave ship in 1845 and taken to Pernambuco, in Brazil.\nBaquaqua was a slave in Olinda, Pernambuco around two years. His master was a baker, He worked in construction of houses, carrying stones, learned Portuguese and performed as “\"escravo de tabuleiro\"” (peddling slave). The cruelty of his Brazilian masters made him revert to alcoholism and to attempt suicide.\nTaken to Rio de Janeiro, Baquaqua was incorporated to the crew of the trade ship \"Lembrança\", transporting goods to the southern provinces of Brazil. A coffee shipment to the United States, in 1847, was his passport to freedom. The ship arrived to New York harbor in June, where it was approached by local abolitionists, who encouraged him to escape from the ship. 
After the escape, however, he was imprisoned in the local jail, and only the help of the abolitionists (that facilitated his escape from prison) prevented he was returned to the ship. It was then sent to Haiti, where he lived with the reverend Judd, a Baptist missionary.\nConverted and baptized in 1848 Baquaqua returned to the US due to the political instability Haiti was then; He studied at the New York Central College in McGrawville for almost three years. In 1854 he moved to Canada and his bibliography was published the same year by Samuel Downing Moore in Detroit.\nIt not known what happened to Baquaqua after 1857. He was then in England and had turned to the American Baptist Free Mission Society to be sent as a missionary to Africa.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692527","title":"John Leehane","body":"\nJohn Leehane\n\nJohn Leehane can refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692536","title":"SS Princess Ena (1906)","body":"\nSS Princess Ena (1906)\n\nTSS \"Princess Ena\" was a passenger vessel built for the London and South Western Railway in 1906.\nHistory.\nShe was built by Gourlay Brothers in Dundee and launched on 25 May 1906. She was built as a replacement for the Hilda, lost in the English Channel in 1905. She was built in four months, with the order being placed in December 1905. \nShe was requisitioned by the Admiralty in 1915 and converted to a Q-ship. She returned to railway service at the conclusion of hostilities. \nShe was acquired by the Southern Railway in 1923.\nOn 3 August 1935 she caught fire on a passage from Jersey to St Malo and sank south of Jersey, Channel Islands.\nThe crew were rescued by and .\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692547","title":"C.braunii","body":"\nC.braunii\n\nC. braunii is a species abbreviation which may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692553","title":"Philip Plotch","body":"\nPhilip Plotch\n\nPhilip Mark Plotch is an author, professor, and transportation planner. He is best known for leading efforts to rebuild the World Trade Center and his research on the politics and planning behind transportation megaprojects.\nCareer.\nAuthor and academic.\nPhilp Mark Plotch writes articles and op-eds for academic and general publications including a regular column in \"Gotham Gazette\" about economic development and transportation issues. In 2015, Rutgers University Press published his book \"Politics Across the Hudson: The Tappan Zee Megaproject\".\nDr. Plotch received the American Planning Association’s 2015 New York Metro Chapter journalism award for his in-depth research and hard hitting analysis behind the planning and politics of New York's transportation system. \nPrevious winners have included Kate Ascher, Brendan Gill, Paul Goldberger, Ken Jackson, and Elizabeth Kolbert. Plotch is now under contract with Cornell University Press to write a book about the Second Avenue subway.\nPlotch is an assistant professor of political science and the director of the master of public administration program at Saint Peter's University. 
He previously taught as an adjunct in the Department of Urban Affairs and Planning at Hunter College.\nTransportation planner and World Trade Center Redevelopment Director.\nAs director of World Trade Center redevelopment and special projects at the Lower Manhattan Development Corporation, after the September 11, 2001 terrorist attacks, Plotch developed new transportation programs, oversaw the design and construction of Lower Manhattan open spaces, and administered programs to rebuild structures.\nBetween 1992 and 2005, as the manager of policy and planning at the headquarters of the Metropolitan Transportation Authority, Plotch led planning improvements for the New York metropolitan area's transportation system including the #7 subway line extension to the Hudson Yards, the Second Avenue subway, and intelligent transportation systems.\nEducation.\nPlotch received his master in urban planning degree from Hunter College and his Ph.D. in public and urban policy from the Milano School of International Affairs, Management, and Urban Policy at The New School. \nCivic Leadership.\nHe lives in the Radburn section of Fair Lawn, New Jersey, where he has published Fair Lawn News, served on the planning board and the economic development committee, and led efforts to revise election procedures and improve pedestrian safety.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692563","title":"Elverskud","body":"\nElverskud\n\nElverskud is a ballad for soloist, choir and orchestra by Niels W. Gade from 1854.\nGade's oeuvre contains many concert pieces of various lengths for orchestra, choir and soloists. Depending on which one counts, there are up to 16 of them, mostly referred to as \"cantata\". The longest of the pieces can take up to an hour. Some of the pieces are almost semi-operas or concert operas with dramatic development.\nOrigins.\nThe plot of the song comes from the Danish folk-ballad \"Elveskud\".\nIn 1842 Gade wrote \"Agnete og Havfruerne\" for solo, female choir and orchestra with text by Hans Christian Andersen, and the same Andersen had in 1846 premiered the opera \"Liden Kirsten\" with music by Gade's father-in-law J. P. E. Hartmann. Both were inspired by Danish folksongs. This may have encouraged Gade to try his hand at the same set of motifs with a major concert piece.\nThe earliest information on \"Elverskud\" is a mention in a letter from Gade in 1849, in which he wrote that he had allowed Hans Christian Andersen to prepare a text. For whatever reason it was never used by Gade, but a draft can be found among Andersen's papers. Some parts of the text were transferred to the final version. The next person who turned his hand to this text was Christian Molbech in whose papers there is a version that is closer to the final one, which by all accounts was developed by Gade's cousin Carl Andersen and the editor Gottlieb Siesby, while the atmospheric choral interlude \"I østen stiger solen op\" was written already in 1837 by B. S. Ingemann and received a tune by C. E. F. Weyse the same year.\nThe first sheet of Gade's score is dated December 12, 1851, but in March 1853 the work is mentioned a letter to Gade from his wife, suggesting that he had no time to work on it. 
In early 1854 the work was published in a piano arrangement by a German publisher as \"Ballade nach dänischen Volkssagen\". On 30 March 1854, it was first performed at a subscription concert at the Musikforeningen, presented as a ballad for soloist, choir and orchestra.\nPlot summary.\nThe ballad is divided into five sections, a prologue, three \"acts\" and an epilogue.\nThe music.\nGade was apparently keen to emphasize that the music was not adaptations of folk songs, but rather all his own, but inspired by the ballads. Heard today, \"Elverskud\" fits the Danish romance style, particularly in the section where Oluf, the mother and the choir \"talk\" to each other in opera style.\n\"Elverskud\" has been shown to be one of the most popular Gade's works. According to a statement in Inger Sørensen's book, it was performed at least 184 times in Gade's life, a success unparalleled by other Danish composers. The work remains popular today, and two of the songs, \"I østen stiger solen op\" and \"Så tit jeg rider mig under ø\" are often played as single pieces.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692564","title":"John Watters (cricketer)","body":"\nJohn Watters (cricketer)\n\nJohn Watters (6 October 1924 – 2 August 2006) was an Australian cricketer. He played one first-class cricket match for Victoria in 1950.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692571","title":"Abigael Kipkemboi","body":"\nAbigael Kipkemboi\n\nAbigael Kipkemboi (born ) is a retired Kenyan female volleyball player, who played as a middle blocker. She was part of the Kenya women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Kenya Pipeline.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692578","title":"John Watters","body":"\nJohn Watters\n\nJohn Watters can refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692583","title":"Margaret Mukoya","body":"\nMargaret Mukoya\n\nMargaret Mukoya (born ) is a retired Kenyan female volleyball player, who played as a middle blocker. She was part of the Kenya women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Telkom Kenya.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692587","title":"Philister Sang","body":"\nPhilister Sang\n\nPhilister Sang (born ) is a retired Kenyan female volleyball player, who played as a wing spiker. She was part of the Kenya women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Kenya Pipeline.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692590","title":"Salome Wanjala","body":"\nSalome Wanjala\n\nSalome Wanjala (born ) is a retired Kenyan female volleyball player, who played as a wing spiker. She was part of the Kenya women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Kenya Commercial Bank.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692593","title":"Women's Resource & Action Center","body":"\nWomen's Resource & Action Center\n\nThe Women's Resource and Action Center, also known as WRAC, is an organization dedicated to the equality and well-being of female students at the University of Iowa and members of the Iowa City community. It provides resources and information that are helpful for the everyday activities of women and as a source of entertainment and subject matter relevant to women.\nHistory.\nOriginally called the Women's Liberation Front in 1971, WRAC was established to promote women's rights and equality, and allow women to meet other women as friends, classmates, coworkers, etc. WRAC's website states that members of the organization \"met to discuss their shared oppression as women and search for solutions to their common problems.\" In 1974, the group changed its name to that which it currently holds: Women's Resource and Action Center.\nWhen the organization was created, the members made it an issue to function collectively rather than have an officer team or executive board, to encourage women's empowerment and not be discriminatory. After WRAC had successfully established itself as a feminist group in the Iowa City community, it began to reach out to other oppressed groups, diversifying their human rights values to expand to groups including \"people of color, people with disabilities, the elderly, and lesbians and gays.\" Originally, as a source of education and entertainment, WRAC held workshops and programs such as counseling, divorce rights, abortion and birth control, women's health information, women's studies, self-defense, economics, etc. 
These workshops and programs were beneficial to all women involved with WRAC because of the knowledge they were obtaining.\nIn the early 1980s, the Women Against Racism Committee (WAR) was formed as a branch of WRAC, and populated primarily by the members of WRAC, as well as other women in the Iowa City community. The original purpose of the organization was to critique the racism WRAC members perceived, and to raise awareness of the harmful effects of internalized racism. These actions evolved into the study of all forms of oppression, including sexism, disability-related discrimination, and homophobia, especially among colored women. As WAR grew in popularity, it brought in renowned speakers, such as Winona LaDuke and Natalie Wong to the University of Iowa campus to speak on behalf of the oppressed populations. In 1988, WAR held its first and only national conference, \"Parallels and Intersections: Racism and Other Forms of Oppression.\" Participation in the Women Against Racism Committee declined throughout the 1990s until it was shut down in 1998.\nPresent day.\nMission and values.\nWRAC is a feminist organization designed to promote equality between groups, with a more focused goal on establishing women's rights. Their values include inclusivity, collaboration, diversity, effectiveness, safe and supportive environment, and respect.\nPrograms.\nWRAC offers services including counseling, scholarships, support groups, and a library containing resources that address financing, health care (women's health, abuse recovery, eating disorders), gender studies, LGBT studies, marriage, sex, parenting, feminism theory, domestic violence, single parenting, adoption, and literature. The Center has also helped teach bystander intervention classes that were open to all members of the community to combat the issue of street harassment in Iowa City in 2014. 
To combat the issue of street harassment in Iowa City in 2014, the Center helped teach bystander intervention classes that were open to all members of the community \nStudent life.\nWRAC has organized \"Take Back The Night\" rallies, an event including a march in advocation of sexual violence victims and an open-mic time for victims to tell their stories that has been ongoing since 1979. Since 2014 the University of Iowa has had a new focus on decreasing sexual assaults on campus. Because of this, WRAC has increased their staff and resources and has been able to reach more students. The organization has grown too large for its current location on Madison Street where the Center has been for 39 years. With the development of these events, the organization plans to move to a new location (the Bowman house on Clinton Street in Iowa City) in 2016.\nSafety.\nWRAC has been providing safety resources for years. Whether it be in their office or online, there are many different options. For example, on their website, it lists hotlines for immediate assistance as well as counselling and care for victims of sexual assault.\nOne of WRAC's projects to fight sexual violence and increase safety was the Street Lighting and Safety Project. WRAC acted as an advisor to the Association of Student Women (ASW) and collaborated with them to complete the project. The goal of the Street Lighting and Safety Project was to have more street lights put in place around Iowa City to provide more lighting during the evenings and at night. WRAC and ASW began the project in 1976 and it was completed in 1980. The lights put up around the campus acted as a precursor to current lights and blue safety lights around campus today.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692596","title":"Jetzabel del Valle","body":"\nJetzabel del Valle\n\nJetzabel del Valle (born ) is a Puerto Rican female volleyball player, who played as a middle blocker. She was part of the Puerto Rico women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany and at the 2006 FIVB Volleyball Women's World Championship in Japan. She played with Criollas de Caguas and Humacao.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692621","title":"Harry Knight (disambiguation)","body":"\nHarry Knight (disambiguation)\n\nHarry Knight was an American racecar driver.\nHarry Knight may also refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692630","title":"Fiber modification","body":"\nFiber modification\n\nFibre modification is a research field in which researchers aim at developing and applying technologies to impart new properties to natural fibres such as those in paper, in order to increase their functionality. Research areas in this field include many different technologies, amongst which the chemical modifications of fibres are widely used. One important sector of application of the chemical modifications is the treatment of wood for giving it enhanced properties such as higher mechanical properties, water impermeability, less hygroscopicity, bacterial and fungal resistance. Transferring and adapting the technical knowledge on fibre modification available for the wood sector to the recycled paper sector is an innovative use of these chemical treatments which has been the subject of studies that have been carried out within an EU co-funded project called Fibre+.\nThe project Consortium included members representing Paper and Packaging European Associations (CEPI, FEFCO), and research institutes specialized in the wood and paper for packaging sector and paper and packaging companies. The focus of the project was on chemical modification of the paper made recycled fibres, investigating the possibility to transfer wood fibre modifications technique from the wood sector to paper and packaging sector. The aim was to enhance the properties of papers and of the packaging, as the recycling process causes the deterioration of fibres.\nThe chemical modification of recycled fibres aimed at the creation of a new generation of packaging papers characterized for being more recyclable, less hygroscopic, stiff and durable. The high recycling rate of papers in Europe (which is at the level of 72%) and the consequent importance that recycling has for the circular economy, were at the basis of this study. 
Paper products form part of an integrated carbon cycle based on the photosynthetic conversion of water, carbon dioxide, nutrients and solar energy into renewable wood-based biomass. Once consumed, paper may be recovered and used again either as a source of secondary fibres, to produce recycled paper or as bio-fuel. Fibre packages or corrugated containers made from corrugated board were the ones that were dealt with in the project, as they are considered as being the most prominent structural application of paper.\nChemical modification attempts.\nFibre modification with chemicals or enzymes had been investigated in the production of fibreboards. Fibre modification applying steam (steam-exploded wood) has been proved an efficient pre-treatment method in producing thermoplastic composites.\nCurrent theories for interfibre bonding during papermaking process are based on general recognition of the hydrogen bonding model. Consequently, all effort for boosting fibre strength is connected to mechanical beating of fibres in order to generate more flexible and fragmented fibres for increased bonding areas. As a consequence, significant drawbacks are obtained in terms of water retention ratio resulting in poor dewatering behaviour and high energy consumption. New mechanisms for interpretation and control of interfibre bonding are still upcoming. One way to overcome these drawbacks could be the molecular coating of cellulose fibres using polymers targeted on entropy controlled mixing of polymers and cellulose gel resulting in higher bonding forces. Theoretical results as well as experimental data on how application of polymeric layers (e.g. carboxymethyl cellulose) and enzymes on cellulose fibres can lead to sheets of high bonding strength without any mechanical beating have been already presented. 
However, these attempts were still far from any industrial implementation and their application would have been costly and would not solve the problem of raw material availability.\nObjective.\nBased on this state-of-the-art, the objective of the project was to modify and thus improve the characteristics of different types of recovered fibres used for the production of a variety of packaging grade papers used as linerboard and corrugating medium for corrugated board manufacturing in Europe. Information on the actual furnish characteristics and composition of packaging materials is expected to help European packaging industry to evaluate its sources of supply and to adopt suitable methods and processes to improve the available resources in an optimal manner. In the case of packaging, scientific technical knowledge of practical industrial relations between fibre characteristics, paper properties and corrugated board properties also is needed.\nFrom wood fibre modification to paper technology chemical wood modification aims at altering the structure of the cell wall matrix. Wood\nproperties are improved considerably by converting hydrophilic OH-groups into larger more hydrophobic groups. Also the physical fixation of modifying chemicals in the cell wall matrix can considerably change the wood properties. In addition to a hydrophobing effect, the treatments reduce the volume of cell wall nano-pores and thus decrease the incorporation of water molecules into the cell wall matrix. On a macroscopic scale, wood modification can change important properties of the wood including biological durability (resistance against fungi), dimensional stability, hardness and UV-stability. \nSince paper is produced from wood fibres, it was possible to transfer some of the developments achieved in wood technology to paper technology. Several technologies (e.g. 
chemical modification, nano-scale celluloses, polyelectrolytes, functional polymers based on cellulose, hemicelluloses and starch) were researched and used by different research groups around Europe (e.g. PTS and University of Goettingen, Germany; Kungliga Tekniska högskolan (KTH), Sweden). There is already well established knowledge on chemical fibre modification of recycled fibres. Adamopoulos and Mai (2011) modified recycled fibres with N-methylol compounds and glutaraldehyde with significant improvement on fibre characteristics and paper sheet performance. Laboratory sheets manufactured with a variety of chemically modified recycled fibres were found to be superior in stiffness and hygroscopic properties to those manufactured from unmodified ones. The intention of the Fibre+ project is to build on the existing knowledge on fibre modification for adapting, implementing and disseminating this innovative technology in European paper SMEs.\nResults of the Fibre+ project on recycled fibres for packaging paper and information on potential developments of the Fibre+ concept can be found on the Fibre+ website, including scientific articles that have been published as a consequence of the RTD work that has been carried out during the project. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692633","title":"Bullcroft Main Colliery F.C.","body":"\nBullcroft Main Colliery F.C.\n\nBullcroft Main Colliery F.C. was an English association football club based in Carcroft, Doncaster, South Yorkshire.\nHistory.\nLittle is known of the club other than that it competed in the FA Cup in the 1910s and 1920s.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692645","title":"Lourdes Isern","body":"\nLourdes Isern\n\nLourdes Isern (born ) is a retired Puerto Rican female volleyball player, who played as a libero. She was part of the Puerto Rico women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Gigantes de Carolina.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692651","title":"Daniel Braverman","body":"\nDaniel Braverman\n\nDaniel Braverman (born September 28, 1993) is an American football wide receiver who is a redshirt junior for the 2015 Western Michigan Broncos football team. During the 2015 regular season, he had 103 receptions for 1,266 yards and 12 touchdowns and ranked second in the NCAA Division I FBS in receptions.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692663","title":"Fitzsimmons, Alberta","body":"\nFitzsimmons, Alberta\n\nFitzsimmons is an unincorporated locality in northwest Alberta within the County of Grande Prairie No. 1. It is located approximately 30 km north-east of the City of Grande Prairie.\nThe locality of Fitzsimmons formed around the Fitzsimmons School District No. 4500 which was approved July 7, 1930 for the area north of Bezanson and west of the Smoky River. It was named after a homesteader in the district, Scotty Fitzsimmons. Two years later, a post office was established in the home of C. Milnar on the NW quarter of Township 73, Range 3, West of the 6th Meridian. The one-room school closed in 1956 and the students were bussed to the school at Bezanson. In 1951, the post office also closed and there are no public buildings remaining to mark the locality of Fitzsimmons. Information on this community and the people who lived there can be found in Smoky River to Grande Prairie. (4)\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692668","title":"Coombe Monthly","body":"\nCoombe Monthly\n\nCoombe Monthly is an online publication covering news in the Royal Borough of Kingston upon Thames, South West London. It is run by local residents in the borough, and is free to access.\nIt is available as a free, paperless \"Coombe Monthly\" e-newspaper, accessible from their website and delivered straight to email inboxes each morning.\nIt has an online readership of around 11,000 readers per month, although naturally this figure varies from month to month.\nThe paper also organises local community events, with the aim of \"Engaging local residents in the issues around them\", known as 'Kingston Question Time' events. These events donate all events to Love Kingston, a local charity in the Royal Borough of Kingston Upon Thames, donating to 'Pathways out of Poverty'.\nThe newspaper is run by James Giles, a New Malden resident, who has been listed by the Surrey Comet as a local Unsung Hero \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692671","title":"Dolly Melendez","body":"\nDolly Melendez\n\nDolly Melendez (born ) is a retired Puerto Rican female volleyball player, who played as a universal . She was part of the Puerto Rico women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Criollas de Caguas.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692674","title":"Xiomara Molero","body":"\nXiomara Molero\n\nXiomara Molero (born ) is a retired Puerto Rican female volleyball player, who played as a setter. She was part of the Puerto Rico women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Criollas de Caguas.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692680","title":"Jeffery Tribble","body":"\nJeffery Tribble\n\nJeffery Tribble is an ordained elder in the African Methodist Episcopal Zion (A.M.E. Zion) Church and a professor of ministry with research interests in Practical Theology, Congregational Studies and Leadership, Ethnography, Evangelism and Church Planting, Black Church Studies, and Urban Church Ministry. Academics and professionals in these fields consider him a renowned thought leader. Tribble's experience in pastoral ministry allows for his work to bridge the gap between academic research and practical church leadership.\nCareer.\nTribble received a B.S. from Howard University (1981), a Black Minister’s Program Certificate from Hartford Seminary (1985), a M.Div. from Garrett-Evangelical Theological Seminary (1990), and a Ph.D. from Northwestern University (2002). He began his work in the African Methodist Episcopal Zion Church as a minister of membership development at Martin Temple A.M.E. Zion Church in Chicago, Illinois (1990–1991). Tribble was ordained as an elder in 1992, when he then served as the pastor at St. Andrew A.M.E. Zion Church in Gary, Indiana (1991–1997). He has also served in the A.M.E. Zion Church as a pastor at St. Mark church in Chicago, Illinois (1997–2000), co-pastor at New vision Church in Suwanee, Georgia (2007–2008), Associate pastor at Greater Walters church in Chicago, Illinois (2006–2007), the minister of evangelism and men’s ministry and founding Dean of the Life Development Institute at Martin Temple Church in Chicago, Illinois (2000–2006), and as the presiding elder for the A.M.E. 
Zion Church for the Augusta District (2008–2013) and the Atlanta District (2013–present).\nHe began his career as an academic at Garrett-Evangelical Theological Seminary where he served as adjunct faculty (1999–2000, 2008 and 2009), Instructor of Congregational Ministries and Director of Teaching Parishes and Congregational Research (July 2000 – June 2003) and Assistant Professor of Congregational Leadership and Director of the Center for the Church and the Black Experience (July 2003 – June 2007). He has been a lecturer at Apex School of Theology in Durham, NC (2009). He joined the faculty of Columbia Theological Seminary as Assistant Professor of Ministry (2007–2012). \nHe currently still serves at Columbia Theological Seminary where he is now the Associate Professor of Ministry. He is also Presiding Elder for the Atlanta District, Georgia Annual Conference and Candidate for Bishop in the African Methodist Episcopal Zion Church for 2016.\nThought.\nTribble is a strong proponent of the transformative leadership idea. He has written extensively about how leaders, especially those who work in the church, should be open to transformation themselves as they transform the community they are leading. He writes about this specifically from the perspective of the Black Church in two of his books, Transformative Pastoral Leadership in the Black Church and Joining Jesus: A Class Manual for initiation into Christian Discipleship and Welcome into the African Methodist Episcopal Zion Church. From this point of view he emphasizes his research on how the Black Church “must continue its historic mission of being an instrument of survival, elevation, and liberation for its people.” He however does not limit his research just to the Black Church, he pushes for transformative leadership between various religious traditions as well. 
He has published numerous books, articles, and chapters that are used in this context by people and institutions across the world and across denominational lines.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692697","title":"Don Mathieson (lawyer)","body":"\nDon Mathieson (lawyer)\n\nDonald Lindsay Mathieson is a Waikanae-based New Zealand lawyer and lay Anglican.\nMathieson studied at Victoria University of Wellington, playing chess and hockey before winning a Rhodes Scholarship in 1959.\nIn addition to spending more than forty years in private practice, Mathieson was Crown Counsel in the Crown Law Office. From 2010 to 2015 he was President of the Film and Literature Board of Review.\nMathieson, an active lay Anglican, edited \"Faith at work\" in 2001, 'arguing that Christians should practise their faith at work.' He wrote on the subject of same-sex marriage, in context of the Anglican church adapting to the Marriage (Definition of Marriage) Amendment Act 2013:\nIt is time to speak forthrightly in support of the clear scriptural witness about the sinfulness of homosexual acts and the position adopted without dissension by Roman Catholic, Protestant and Orthodox Churches alike for nearly two thousand years.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692710","title":"Tatiana Gorchkova","body":"\nTatiana Gorchkova\n\nTatjana Gorschkova (born ) is a retired Russian female volleyball player, who played as a wing spiker. She was part of the Russia women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany and at the 2004 FIVB World Grand Prix. On club level she played with VK Uralotschka-NTMK.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692716","title":"List of Chicago Maroons men's basketball head coaches","body":"Source"}
{"url":"https://en.wikipedia.org/wiki?curid=48692726","title":"Anjela Gourieva","body":"\nAnjela Gourieva\n\nAnschela Gurijeva or Anjela Gourieva (born ) is a retired Russian female volleyball player, who played as a universal . She was part of the Russia women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with VK Uralotschka-NTMK.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692737","title":"Elizabeth Fitzgerald (volleyball)","body":"\nElizabeth Fitzgerald (volleyball)\n\nElizabeth Fitzgerald (born ) is a retired American female volleyball player, who played as a setter. She was part of the United States women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692738","title":"Alfonso Sosa","body":"\nAlfonso Sosa\n\nLuis Alfonso Sosa (born 5 October 1967) is a Mexican former footballer who last played for Querétaro and is the current manager of Ascenso MX club Necaxa.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692750","title":"Jennifer Flynn","body":"\nJennifer Flynn\n\nJennifer Flynn (born ) is a retired American female volleyball player, who played as a setter. She was part of the United States women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692783","title":"BMCC Tribeca Performing Arts Center","body":"\nBMCC Tribeca Performing Arts Center\n\nBMCC Tribeca Performing Arts Center is a performing arts venue located in Lower Manhattan inside the BMCC (Borough of Manhattan Community College) on 199 Chambers Street, New York, NY. BMCC Tribeca Performing Arts Center's two main theater spaces are Theatre One (a 913-seat theater) and Theatre Two (a 260-seat theater). BMCC Tribeca Performing Arts Center programming includes music concerts, children's theater, stand-up acts, film retrospectives as well as local and international dance companies. BMCC Tribeca Performing Arts Center has been one of the venues for the annual Tribeca Film Festival.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692801","title":"Smoky Heights, Alberta","body":"\nSmoky Heights, Alberta\n\nThe locality of Smoky Heights, on the west bank of the Smoky River north-east of the City of Grande Prairie, formed around the Smoky Heights post office, which was established June 1, 1923 in the home of Edith and Clarence Field. The post office lasted only a few years; in 1927 it was moved to Bezanson, but the area retained the name. On November 14, 1928, the Rivertop School District 4371 was approved. This school was much larger than the normal one-room school as it was intended to serve as a community center and included accommodations for the teacher as well. The school closed in 1955 and the students were bussed to the consolidated school at Teepee Creek.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692812","title":"Jennifer Hiller","body":"\nJennifer Hiller\n\nJennifer Hiller (born ) is a retired Australian female volleyball player, who played as a libero. She was part of the Australia women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Monash University.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692818","title":"Twara Desai","body":"\nTwara Desai\n\nTwara Desai is an Indian actress. She acted in a Tamil language film \"Saivam\" (2014).\nExternal links.\n \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692820","title":"Tolotear Lealamanua","body":"\nTolotear Lealamanua\n\nTolotear Lealamanua (born ) is a retired Australian female volleyball player, who played as a middle blocker. She was part of the Australia women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with University of Technology, Sydney.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692821","title":"Sandra Vehrencamp","body":"\nSandra Vehrencamp\n\nSandra Vehrencamp (born c. 1947), is a scientist, teacher, and mentor that specializes in Ornithology, with a geographical focus on the avian population of Costa Rica. She served as a faculty member of Cornell University's Lab of Ornithology and Department of Neurobiology and Behavior and taught graduate students while conducting research until retiring as of October 2010. She currently resides in Ithaca, New York, with her husband, Jack Bradbury.\nEducation.\nShe graduated from Crescenta Valley High School in La Crescenta, California, in 1965. She went on to receive her bachelors in Zoology with honors from the University of California at Berkeley in 1970, and her Ph.D in Animal Behavior from Cornell University in 1976. After her extensive education, she started her career in research.\nPersonal and early life.\nDr. Vehrencamp grew up in La Crescenta, California, and attended Crescenta Valley High School. During the time period Sandra Vehrencamp was born, women’s scientific talents were substantially under-appreciated. She received her high-school diploma in 1965 and went on to pursue a higher education from there. However, before 1950, women earned less than 10% of Bachelor’s in the STEM fields and less than 5% of the PhDs in these fields. She grew up with this stigma surrounding her and still managed to attend the University of California at Berkeley for her bachelors and Cornell University for her doctorate. The percentages of women receiving bachelors and PhDs were steadily rising throughout her young life, although the year she graduated from Cornell University still less than 10% of doctorates were received by women. Scientific women of the time were quite rare, and this fact highlights her dedication and passion for science, as is noted by other scientists. 
While in the midst of her education at Cornell University, she met her spouse-to-be, Jack Bradbury. They had their first child in 1975, just a year before Vehrencamp received her PhD and started her career. Their second child was born in 1979, when Vehrencamp was just beginning to settle into a career path. These few starting years were hectic for Vehrencamp, and it has been noted how impressive it is that she managed to keep furthering her career the way she did. Her oldest daughter, Kristin Nobel, is currently married and has two kids, her family living in San Diego. Her youngest, Katrina Bradbury, lives in Ann Arbor, Michigan, and is a Nutrition and Wellness Coach at The Sacred Healing Room at Your Natural Solutions LLC.\nCareer.\nSince 1976 she worked with University of California at San Diego and Cornell University conducting intensive research about birds and their behavior, specifically song patterns and mating habits. She taught animal communication research methods in animal behavior to graduate students during her time at Cornell University, and currently holds a professor emerita position there. Vehrencamp is said to have been an outstanding mentor, teacher, and scientist by her graduate students. Additionally, she worked with the Laboratory of Ornithology Bioacoustics Research Program and contributed to the bird call section, specifically that of Costa Rican wrens; she still holds an emerita professor appointment there as well. Throughout her career she published over 65 papers, which have been cited more than 2,400 times, and wrote 19 book chapters. She collaborated with her husband, Jack Bradbury - an ornithologist as well - consistently during her time as a scientist. They co-wrote a textbook, Principles of Animal Communication, published in 1998. 
It is a widely used work that combines physics, chemistry, neurobiology, cognitive science, evolutionary biology, behavioral ecology, and economics to delve deeply into animals and how they signal and communicate with one another. Its importance is highlighted by the fact that it has been cited more than 1,000 times. This textbook is highly regarded in the scientific community and is revered as the standard reference of the animal behavior world.\nNotable research ventures.\nVehrencamp spent decades of her life studying ornithology, and retired fully accomplished in 2010. Her detailed work earned several awards soon after.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692827","title":"Adrienne Marie","body":"\nAdrienne Marie\n\nAdrienne Marie (born ) is a retired Australian female volleyball player, who played as a wing spiker. She was part of the Australia women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with University of Technology, Sydney.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692830","title":"Speculum principis (Skelton book)","body":"\nSpeculum principis (Skelton book)\n\nSpeculum Principis (A First Mirror) was a guide to 'proper princely behaviour' written by John Skelton in August 1501. Skelton was a well-known poet and had been appointed as tutor to Henry VII's second son, Prince Henry, who would later reign as Henry VIII of England. A copy is now in the British Museum, which may or may not be exactly the same as the one given to Henry.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692833","title":"Rowena Morgan","body":"\nRowena Morgan\n\nRowena Morgan (born ) is a retired Australian female volleyball player, who played as a libero. She was part of the Australia women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with University of Technology, Sydney.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692838","title":"Eileen Romanowski","body":"\nEileen Romanowski\n\nEileen Romanowski (born ) is a retired Australian female volleyball and beach volleyball player, who played as a wing spiker. She was part of the Australia women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Mount Lofty. In 2007 she played beach volleyball with Becchara Palmer.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692845","title":"Prosopopeia Britanniae","body":"\nProsopopeia Britanniae\n\nProsopopeia Britanniae is a ten-page poem written by Desiderius Erasmus in Latin. It was written for ‘the most illustrious prince, Duke Henry’, the future Henry VIII of England.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692873","title":"Andrea Badoer","body":"\nAndrea Badoer\n\nAndrea Biagio Badoer or Andrea Badoer (fl.1509) was the Venetian ambassador to the Court of Henry VIII of England. His dispatches are today read in the \"Calendar of State Papers, Venice\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692878","title":"Nawaz Sharif Kidney Hospital Swat","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48692894","title":"Myoporum velutinum","body":"\nMyoporum velutinum\n\nMyoporum velutinum is a plant in the figwort family, Scrophulariaceae and is endemic to a small area near Esperance in Western Australia. It has similar flowers and fruits and grows in similar environments to \"Myoporum tetrandrum\" but differs from it and all other members of the genus by having hairs on the outer edge of the petals.\nDescription.\n\"Myoporum velutinum\" is a shrub which sometimes grows to a height of and which has hairs on the stem and leaves but lacks the warty surface of many other myoporums. The leaves are arranged alternately and are lance shaped, usually long, wide, soft, covered with soft hairs, darker green on the upper surface and have a prominent mid-vein.\nThe flowers are borne in leaf axils, usually in groups of 1 to 5 on stalks long. There are 5 triangular, pointed sepals and 5 petals forming a bell-shaped tube. The petals are white or pale lilac, sometimes spotted inside the tube and on the base of the lobes. The tube is long and the lobes are about the same length. The tube is hairy on its inner and outer surfaces and there are 4 stamens which extend slightly beyond the petal tube. The fruit that follows flowering is an oval-shaped drupe, about .\nTaxonomy and naming.\n\"Myoporum velutinum\" was first formally described by taxonomist Bob Chinnock in \"Eremophila and allied genera: a monograph of the plant family Myoporaceae\" in 2007 from a specimen collected near Condingup. 
The specific epithet (\"velutina\") is a Latin word meaning \"velvety\".\nDistribution and habitat.\n\"Myoporum velutinum\" occurs in a small area near Cape Le Grand where it grows along creeks in \"Melaleuca\" woodland.\nConservation.\n\"Myoporum velutinum\" has been classified as \" Threatened Flora (Declared Rare Flora — Extant)\" by the Government of Western Australia Department of Parks and Wildlife meaning that it is \"likely to become extinct or is rare, or otherwise in need of special protection\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692897","title":"Thomas Spinelly","body":"\nThomas Spinelly\n\nThomas Spinelly was Henry VIII of England’s representative in the Low Countries in 1510.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692899","title":"San Antone (film)","body":"\nSan Antone (film)\n\nSan Antone is a 1953 American Western film directed by Joseph Kane and written by Steve Fisher. The film stars Rod Cameron, Arleen Whelan, Forrest Tucker, Katy Jurado, Rodolfo Acosta and Roy Roberts. The film was released on February 15, 1953, by Republic Pictures.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692913","title":"VTEC (disambiguation)","body":"\nVTEC (disambiguation)\n\nVTEC is Variable Valve Timing and Lift Electronic Control, a system developed by Honda for combustion engines.\nVTEC or VTech may also refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692933","title":"Zero Gradient Synchrotron","body":"\nZero Gradient Synchrotron\n\nThe Zero Gradient Synchrotron (ZGS) was a weak focussing 12.5 GeV proton accelerator \nthat operated at the Argonne National Laboratory in Illinois from 1964 to 1979.\nIt enabled pioneering experiments in particle physics, in the areas of \nOther noteworthy features of the ZGS program were the large number of university-based users and the pioneering development of large superconducting magnets for bubble chambers and beam transport. \nThe hardware and building of the ZGS were ultimately inherited by a spallation neutron source program, the Intense Pulsed Neutron Source (IPNS).\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692935","title":"Sonia Benedito","body":"\nSonia Benedito\n\nSonia Benedito (born ) is a retired Brazilian female volleyball player, who played as a wing spiker. She was part of the Brazil women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Fluminense Rio de Janeiro.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692938","title":"World's Fair (album)","body":"\nWorld's Fair (album)\n\nWorld's Fair is the third album released by Julian Lage as leader. Recorded on a 1939 Martin 000-18 with no overdubbing, it is the first solo album he has recorded.\nBackground.\nLage said that a large part of the inspiration for this album was the classical guitarist Andrés Segovia, and that it \"draw[s] from the sonic fingerprint of early radio recordings mixed with the short form structures of some of my favorite classical and folk music\". While he still considers the album to be jazz-oriented, he stated that he stayed away from swing-style music \"because I didn't think solo guitar was the format for me to play swing\".\nOverview.\nThe first track, \"40's\", which was the only song given a pre-release, is of a medium tempo and alternates between the keys of F and D. \"Peru\" opens with some light picking before settling into the actual tune, and \"Japan\" begins \"with an angular, almost discordant sound, but enters into a laid back groove, occasionally interrupted by unsettled harmonies\".\n\"Double Stops\", as the title implies, makes extensive use of double stops throughout the course of the song. \"Gardens\" was described as making Lage sound like \"a flatpicking Andrés Segovia\", due to the fast bluegrass picking technique employed.\nOnly two tracks on the album were not composed by Lage. The first, \"Where or When\", a Rodgers and Hart show tune, was described as \"[lingering] like a comfortable memory.\" The other is a folk song, \"Red Prairie Dawn\", which \"puts his folk roots on display.\"\nReception.\nMark F. 
Turner's \"AllAboutJazz\" review said that \"It's the perfect showcase of his fine abilities on acoustic guitar.\" \"Relix\" review said that \"the music's austerity magnifies its grandeur\".\nThe review from \"The Stanford Daily\" stated that \"Fans of Lage's more experimental work...may be disappointed to find that \"World's Fair\" lacks the abstract sophistication found in many works of contemporary jazz. But it's fairly clear that Lage was not writing to push musical boundaries, but rather to pay homage to the diverse range of music that has shaped his own playing and taste.\" The Sun Gazette commented \"Lage [serves] the songs rather than his ego...the brilliance is in how simple and effortless he makes it sound\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692943","title":"Fabiana Berto","body":"\nFabiana Berto\n\nFabiana Berto (born ) is a retired Brazilian female volleyball player, who played as a setter. She was part of the Brazil women's national volleyball team at the 2001 FIVB World Grand Prix and 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Club Atlético Estudiantes de Paraná.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692953","title":"Peter Johnston (Wisconsin politician)","body":"\nPeter Johnston (Wisconsin politician)\n\nPeter Johnston was a member of the Wisconsin State Assembly.\nBiography.\nJohnston was born on January 19, 1831 in Dunblane, Scotland. Later, he resided in Milwaukee, Wisconsin before settling in Manitowoc, Wisconsin in 1857. He died on October 3, 1904.\nPolitical career.\nJohnston was a member of the Assembly during the 1877 session. From 1870 to 1872, he was Mayor of Manitowoc. Additionally, Johnston was a member of the Manitowoc City Council and of the Manitowoc County, Wisconsin Board of Supervisors. He was a Republican.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692955","title":"Marina Daloca","body":"\nMarina Daloca\n\nMarina Daloca (born ) is a retired Brazilian female volleyball player, who played as a middle blocker. She was part of the Brazil women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Minas Tênis Clube.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692956","title":"Luciana Nascimento","body":"\nLuciana Nascimento\n\nLuciana Nascimento (born ) is a retired Brazilian female volleyball player, who played as a wing spiker. She was part of the Brazil women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with EC Pinheiros.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692957","title":"Maria Fidecaro","body":"\nMaria Fidecaro\n\nMaria Fidecaro is an Italian theoretical physicist with a focus on particle physics. Her main laboratory where she spent most of her career doing research was CERN- European Organization for Nuclear Research.\nMaria received her degrees in Physics from the University of Rome in the 1940s.\nIn 1954, she obtained a fellowship from the International Federation of University Women to do research at the University of Liverpool. In 1956, Maria obtained the CERN fellowship and worked at CERN until 2012. She is among the pioneering scientists at CERN since the establishment of the institution in 1954.\nPersonal life.\nMaria Fidecaro was born in Italy. In July 1955, she married Giuseppe Fidecaro- a fellow physicist at CERN who was also doing research with Maria at University of Liverpool. They had a family of four children.\nIn summer 1956 when Maria obtained CERN fellowship, the couple moved to Geneva. They were the first few scientists among a total of 300 to 400 staff when CERN was first founded. During their time, few people could do experiments at CERN. Maria started with a group of only three scientists.\nMaria also recalled the effect of war in her early life. Italy entered World War II in 1940, the time when Maria was earning her degree at the University of Rome. The aftermath of war destroyed Italy’s economy and society. Not until the 1950s and 1960s had Italy regained its stabilization and the economy started booming.\n\"It was just a mere 10 years after the end of the war. The war feelings were still very much there,\" she recalled as she started her work at CERN in 1956.\nAlthough there were few female scientists at CERN during her time, Maria felt she was respected by her colleagues. 
“In my group, I was simply one of them”, Maria said.\nThe couple, having devoted 60 years to research at CERN since its beginning, is seen as a living memory of the institute.\nScientific research.\nAfter Maria’s marriage, she and Giuseppe carried out experiments on pions. Maria worked with a diffusion chamber and Giuseppe with a lead glass Cherenkov counter.\nMaria and Giuseppe were also involved in cosmic rays experiment in the Italian Alps just after the war. The experiment was set at 3,500 meters on the face of Matterhorn, using a detector of 1-square meter.\nAfter Maria and Giuseppe moved to Geneva, Giuseppe was assigned to the Synchrocyclotron Division. Synchrocyclotron was the first accelerator to be built at CERN in 1957. Meanwhile, Maria worked on a novel method to provide polarized proton beams to be used for particle collision in the accelerator.\nThroughout her career as a theoretical physicist, she authored over 200 publications in the fields of Nuclear Physics, Nuclear Energy, and Statistical Physics. Maria collaborated with 903 co-authors in her research from 1961 to 2012.\nThe majority of her research relates directly to the experiments, including interpreting the measurements and results in the search for new particles. In Maria’s early works in the 1960s, she studied the nucleon-nucleon charge exchange scattering, recorded data on high-energy electrodynamic processes.\nHer research work also tackled the phenomenon of proton-proton elastic scattering. In the 1990s, she investigated the design and test of a prototype gas-sampling electromagnetic calorimeter of high granularity and collaborated on the construction of a position-sensitive photon detector for CPLEAR experiment. CPLEAR experiment aims to carry out precision measurements of CP, T and CPT violation of the neutral kaon systems.\nMaria’s other work focused on phenomenological aspects of particle physics. She studied the fundamental symmetries in the neutral kaon systems. 
By the measurements of interactions and decays of neutral kaons, new and detailed information was found on CPT invariance in time evolution and decay. The newly achieved level of precision of the experiments called into question the validity of some of the often tacitly assumed hypotheses in particle physics.\nMaria was also involved in the search for CP-violation (charge-parity violation) in the NA48 experiment. After the theory of CP-violation in the decay of neutral kaon system was experimentally confirmed, the discovery brought the Nobel Prize in Physics in 1980 to the discoverers of the theories, James Cronin, and Val Fitch. The discovery played an important role in helping scientists explain the dominance of matter over antimatter.\nChallenges as a women scientist.\nFemale scientists at CERN have to face certain obstacles. A trend is observed that when women scientists reach their mid-career and have children, they tend to leave their job. Even today, there are no pre-schools at CERN and those around the laboratory are expensive. Pregnancy can pose a challenge to the career advancement of women scientists because they have more limited access to the facilities due to the risk of radiation.\nWhen CERN was first founded, there were about 300 to 400 staff but very few women scientists. Some gender issues at CERN were mentioned in the book “Women Scientists: Reflections, Challenges, and Breaking Boundaries” by Magdoha Hargittai. Mary Katharine Gaillard, a theoretical physicist holding a visiting position at CERN in the 1960s was interviewed in the book. Gaillard conducted a survey among women scientists at CERN at that time and found that only 10 percent was fully paid while 86 percent was not paid at all. Two of the reasons for women scientists not being paid were that their husbands were CERN employees and that priority was given to unemployed men. 
Maria Fidecaro might have experienced the gender bias mentioned by Gaillard during her time at CERN in the 1960s since her husband, Giuseppe Fidecaro, was an employee at CERN. Additionally, Maria had to juggle the job and a family of four children. There were few nurseries in CERN and around the laboratory at that time.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692958","title":"Marcelle Rodrigues","body":"\nMarcelle Rodrigues\n\nMarcelle Rodrigues (born ) is a retired Brazilian female volleyball player, who played as a setter. She was part of the Brazil women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. At the end of the championships she was awarded as the best setter. On club level she played with BCN Osasco.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692965","title":"Hélder José Castro Ferreira","body":"\nHélder José Castro Ferreira\n\nHélder José Castro Ferreira (born 5 April 1997 in Fafe) is a Portuguese footballer who plays for Vitória de Guimarães B, as a forward.\nFootball career.\nOn 25 November 2015, Ferreira made his professional debut with Vitória Guimarães B in a 2015–16 Segunda Liga match against Feirense.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48692986","title":"Gustavo Díaz","body":"\nGustavo Díaz\n\nGustavo \"Chavo\" Díaz Domínguez (born November 7, 1974) is an Uruguayan former footballer and current manager of Ascenso MX club Celaya.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693000","title":"Edmund Naganowski","body":"\nEdmund Naganowski\n\nEdmund Wacław Naganowski (26 September 1853 – 28 January 1915) was a Polish publicist and writer also known under pen names E. Działosz, Latarnik and Edmund Sas (Sas most likely refers to his Sas coat of arms).\nLife.\nNaganowski was born in Gostyń, Greater Poland, then in Austria-Hungary. After finishing his studies in England, he was a teacher in a high school in Waterford in Ireland and he later worked at the British Museum. On February 14, 1903 he became naturalized in Great Britain, under the name Edmund Sas de Naganowski.\nHe served as secretary of the Polish Literary Society in London.\nHe is credited with the introduction of scouting in Poland.\nMonica Mary Gardner acknowledged the influence and support of Naganowski on her interests in Polish culture from 1899 to the outbreak of the First World War.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693021","title":"Sarati the Terrible (1923 film)","body":"\nSarati the Terrible (1923 film)\n\nSarati the Terrible (French:Sarati, le terrible) is a 1923 French silent film directed by René Hervil and Louis Mercanton and starring Henri Baudin, André Feramus and Ginette Maddie. In 1937 it was remade as a sound film.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693061","title":"List of TVB dramas in 2016","body":"\nList of TVB dramas in 2016\n\nThis is a list of television serial dramas released by TVB in 2016.\nTop ten drama series in ratings.\nThe following is a list of TVB's highest-rated serial dramas of 2016 according to the drama's average ratings. The list also includes the ratings of the dramas' premiere week, finale week, as well as the average overall count of Hong Kong viewers (in millions) per drama.\nFirst line-up.\nThese dramas air in Hong Kong from 8:00pm to 8:30pm, Monday to Friday on Jade.\nSecond line-up.\nThese dramas air in Hong Kong from 8:30pm to 9:30pm, Monday to Friday on Jade.\nThird line-up.\nThese dramas air in Hong Kong from 9:30pm to 10:30pm, Monday to Sunday on Jade.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693068","title":"Embla (horse)","body":"\nEmbla (horse)\n\nEmbla (27 April 1983 – after 2003) was a British Thoroughbred racehorse and broodmare. In a racing career which lasted from June 1985 until October 1986 she won four of her nine races. As a two-year-old she finished second on her debut and won two minor races before recording an upset victory over a strong field for the Cheveley Park Stakes. In the following year she finished fifth in the 1000 Guineas and second in the Coronation Stakes before ending her career with a win in the Petition Stakes. Her broodmare career was largely undistinguished but she produced one excellent racehorse in Zenno El Cid, a major winner in Japan.\nBackground.\nEmbla was a \"strong, rangy\" dark bay mare with no white markings bred in the United Kingdom by Sheikh Mohammed. She was sired by Dominion who finished third in the 1975 2000 Guineas and won the Prix Perth in 1976. before being exported to North America and winning the Bernard Baruch Handicap in 1978. He sired several good horses over a wide range of distances including First Island, the sprinter Primo Dominie (Coventry Stakes), and the stayer Trainglot (Cesarewitch Handicap). Embla's dam Kaftan won one minor race from four attempts but was a half-sister to the Nunthorpe Stakes winner Blue Cashmere and a granddaughter of the Yorkshire Oaks runner-up No Saint, whose other descendants included Persian Heights.\nAs a yearling Embla was offered for sale and bought for 46,000 guineas by representatives of Charles St George. The filly was sent into training with Luca Cumani at Newmarket, Suffolk.\nRacing career.\n1985: two-year-old season.\nEmbla began her racing career by finishing second in a minor race over six furlongs at Newmarket Racecourse in late June. She then started favourite for an eighteen-runner maiden race at Kempton Park Racecourse in July and won easily. 
On her next appearance she was less impressive as she started 1/5 favourite for a minor event at Ripon Racecourse in August but won by only three-quarters of a length from Raisinhell. Timeform described her as \"scrambling home\" in the race. Cumani, nevertheless, held the filly in high regard and later explained that she had been going through an \"awkward growing phase\" at the time.\nOn her final appearance of the year, Embla was moved up sharply in class to contest the Cheveley Park Stakes (the only Group One race in Britain at the time restricted to juvenile fillies) over six furlongs at Newmarket in October. The leading American jockey Angel Cordero was booked for the ride, but the filly was given little chance and started a 20/1 outsider in a thirteen-runner field. The Jeremy Tree-trained Kingcote started favourite after a four-length win in the Lowther Stakes, whilst the other contenders included Park Express, Storm Star (winner of the Cherry Hinton Stakes), Asteroid Field (Waterford Candelabra Stakes), Bambolona (Sirenia Stakes), Wanton (third in the Flying Childers Stakes), Nashia (runner-up in the Prix d'Arenberg) and Rose of the Sea (fourth in the Prix Morny). In the early stages Rose of the Sea led from Storm Star, with Embla towards the rear and apparently struggling to match the pace. Kingscote went to the front approaching the final furlong but Embla was making relentless progress and soon moved into contention. She overtook Kingscote a hundred yards from the finish and won by a length. Rose of the Sea held on for third ahead of Asteroid Field.\n1986: three-year-old season.\nOn her three-year-old debut Embla contested the Nell Gwyn Stakes (a trial race for the 1000 Guineas) over seven furlongs at Newmarket on 15 April and finished fourth of the nine runners behind Sonic Lady. Sixteen days later she started 6/1 second favourite behind behind Sonic Lady in the 1000 Guineas. 
Ridden by Tony Ives she finished fifth behind Midway Lady, Maysoon, Sonic Lady and Ala Mahlik. She proved no match for Sonic Lady in her next two races, finishing second in the Coronation Stakes at Royal Ascot in June and fifth in the Child Stakes at Newmarket on 9 July. After a break of three months the filly returned and was dropped in class for the Petition Stakes over one mile at Newmarket in October. She recorded her only success of the year as she narrowly defeated the colt Santella Mac.\nAssessment.\nIn the official International Classification for 1985, Embla was rated the third-best two-year-old filly in Europe after the French-trained Baiser Vole and Regal State. The independent Timeform organisation rated her on 121, three pounds behind their top juvenile filly Femme Elite. She was rated 110 by Timeform in 1986.\nBreeding record.\nEmbla was retired from racing to become a broodmare and produced eleven foals between 1988 and 2003. Three of her offspring won races, with the most successful, by far, being the Japanese horse Zenno El Cid.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693069","title":"Peter IV van den Gheyn","body":"\nPeter IV van den Gheyn\n\nPeter van den Gheyn (; 1605 or 1607–1654 or 1659) was a bell-founder of the Spanish Netherlands (now Belgium).\nLife.\nPeter was born into a family of noted bell-founders and himself became the most famous bell-founder of the 17th century. His father was Jan van den Gheyn. The family forge was at Mechelen in what is now Belgium. His associate was named Peter Deklerk or de Clerck, his uncle by marriage.\nHis total production of bells was not great. He cast the Salvator bell for in Mechelen in 1638, which weighed and cracked in 1696. He also cast the Salvator bell for in Brussels.\nHe had the curious affectation of inscribing his bells using type of various sizes within the same word.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693071","title":"Li Ying (volleyball)","body":"\nLi Ying (volleyball)\n\nLi Ying (born ) is a Chinese female volleyball and beach volleyball player, who played as a libero. She was part of the China women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany and 2002 Asian Games. At the 2014 Asian Women's Club Volleyball Championship with Tianjin Bohai Bank she won the silver medal and was awarded as the best opposite spiker. On club level she plays with Tianjin Volleyball in 2015-16.\nWith Wang Lu she played at the 2005 Beach Volleyball World Championships.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693076","title":"Peter van den Gheyn","body":"\nPeter van den Gheyn\n\nPeter van den Gheyn (Period ) may refer to any of several members of a noted family of bell-founders in the Spanish Netherlands. They are conventionally disambiguated with roman numerals:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693084","title":"Abraham Lincoln Bridge","body":"\nAbraham Lincoln Bridge\n\nThe Abraham Lincoln Bridge is a six-lane, single-deck cable-stayed bridge carrying Interstate 65 across the Ohio River, connecting Louisville, Kentucky and Jeffersonville, Indiana. The main span is (two spans) and the bridge has a total length of . It is named after U.S. President Abraham Lincoln.\nHistory.\nThe Abraham Lincoln Bridge opened on December 6, 2015, and is parallel to the John F. Kennedy Memorial Bridge upstream and carries three lanes of northbound I-65 traffic, eventually carrying six lanes of northbound I-65 traffic. Pedestrian and bicycle lanes were in the original plans, but have since been removed. The existing I-65 John F. Kennedy Memorial Bridge, completed in 1963, will be renovated for six lanes of southbound traffic.\nA Structured Public Involvement protocol developed by Drs. K. Bailey and T. Grossardt was used to elicit public preferences for the design of the structure. From spring 2005 to summer 2006 several hundred citizens attended a series of public meetings in Louisville, Kentucky and Jeffersonville, Indiana and evaluated a range of bridge design options using 3D visualizations. This public involvement process focused in on designs that the public felt were more suitable, as shown by their polling scores. The SPI public involvement process itself was evaluated by anonymous, real-time citizen polling at the open public meetings.\nOn July 19, 2006, the final design alternatives for the bridge were announced. The three designs included a three-span arch, a cable-stayed design with three towers, and a cable-stayed type with a single A-shaped support tower. It was also announced that the projected cost for the bridge would be $203 million.\nThe structure is an additional bridge in downtown Louisville joining the John F. 
Kennedy Memorial Bridge erected between spring 1961 and late 1963 at a cost of $10 million; the four-lane George Rogers Clark Memorial Bridge, constructed from June 1928 and to October 31, 1929, and the Big Four Bridge, which operated as a railroad bridge from 1895 to 1969 and reopened as a pedestrian bridge in May 2014.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693093","title":"José Pérez (athlete)","body":"\nJosé Pérez (athlete)\n\nJosé Roquez Pérez (born 19 March 1971) is a retired Cuban athlete who specialised in the 400 metres hurdles. He represented his country at two World Championships, in 1993 and 1995, reaching the semifinals on both occasions. In addition he won multiple medals on regional level.\nHis personal best in the event is 49.28 seconds set in Cali in 1993.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693113","title":"21 Party","body":"\n21 Party\n\nThe 21 Party () was a political party in Burma in the 1920s led by U Ba Pe.\nHistory.\nThe party was formed in 1922 following a split in the General Council of Burmese Associations (GCBA). The GCBA had planned to boycott the local and national elections due that year, but a group of 21 dissidents left the organisation to form a new party.\nIn the elections the 21 Party won 28 of the 58 non-communal seats, becoming the largest party in the Legislative Council. However, it held less than a third of the total of 103 seats, and Joseph Maung Gyi from the pro-British Independent Party was appointed head of government.\nPrior to the 1925 elections the party was succeeded by the Nationalist Party.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693118","title":"2016 TCU Horned Frogs football team","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48693123","title":"Julie McElrath","body":"\nJulie McElrath\n\nM. Juliana “Julie” McElrath (born January 9, 1951) is a senior vice president and director of the vaccine and infectious disease division at Fred Hutchinson Cancer Research Center and principal investigator of the HIV Vaccine Trials Network Laboratory Center in Seattle, Washington. She also is a professor at the University of Washington."}
{"url":"https://en.wikipedia.org/wiki?curid=48693131","title":"In Old Alsace (1920 film)","body":"\nIn Old Alsace (1920 film)\n\nIn Old Alsace (French:L'ami Fritz) is a 1920 French silent film directed by René Hervil and starring Léon Mathot, Huguette Duflos and Thérèse Kolb.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693145","title":"George Moy","body":" (5 years 1 month) Cleveland/Akron, Ohio Area Work with alumni and friends of the SIHS community to foster leadership gifts to make a meaningful impact on the mission of Saint Ignatius High School and change the lives of current and future students. Growth of the endowment to have a lasting impact on the affordability of a Jesuit, Catholic education through committed gifts or planned giving.\nManaging Director of Commercial Banking at Talmer Bank and Trust.\nTalmer Bancorp\nSenior Relationship Manager responsible for the creation of a portfolio of loan and deposit relationships with major businesses within the midwest footprint for Talmer Bank and Trust. Emphasis is on generation of new business and cross sell opportunities, administer and service business relationships. Interview potential clients to develop information concerning their businesses and requirements, evaluate credit information and make relationship recommendations.\nMiddle Market - Healthcare - Community Development Lending - Commercial Real Estate\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693181","title":"Webster, Alberta","body":"\nWebster, Alberta\n\nThe locality of Webster was established in 1916 as a station on the Edmonton, Dunvegan and British Columbia Railway about 30 km north of the City of Grande Prairie. It was named after George Webster who was a subcontractor for the railway at that time, and later became Mayor and then MLA for the City of Calgary.\nAlthough there were a few railway workers who lived there from 1916 to the late 1920s, the area was mainly settled in 1929 by Polish immigrants from the Vermilion area who had fled Poland after Russia invaded following World War I. In the fall of 1929, a store was opened by Andrew and Cathy Hancharyk on the NW quarter of Section 27, Township 74, Range 5, West of the 6th Meridian. A post office opened there on October 15, 1929, with Andrew as postmaster. “Across the street from the store was the butchershop and café”. The community included “two livery barns… a single elevator which served an area as far away as Heart Valley… an elevator house, and a water tank for the train.” Across the creek was the Webster Sawmill. In 1930, a large Catholic Church was erected. This also served as a school-room for Torun School District 4483, approved on March 20, 1930, until the school was built in 1937. In the late 1930s, Webster Hall was built for community gatherings and a rectory was added for the first resident Catholic priest. The elevator was the first community building lost by fire, then the church in the early 1960s. In 1957, Torun School closed and the students were vanned to Sexsmith. The post office closed in 1966, and all that remained were the hall and the Catholic grotto which had been erected beside the church, as well as the Webster Cemetery.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693208","title":"Estadio Arena Cora","body":"\nEstadio Arena Cora\n\nThe Estadio Arena Cora is a multi-use stadium in Tepic, Nayarit, Mexico. It is currently used mostly for football matches and is the home stadium for Deportivo Tepic F.C.. The stadium has a capacity of 12,271 people and opened in 2011.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693226","title":"The Flame (1926 film)","body":"\nThe Flame (1926 film)\n\nThe Flame (French:La flamme) is a 1926 French silent drama film directed by René Hervil and starring Germaine Rouer, Charles Vanel and Henry Vibart. It was remade as a sound film in 1936.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693231","title":"Fruit carving","body":"\nFruit carving\n\nFruit carving is the art of carving fruit, a very common technique in Europe and Asian countries, and particularly popular in Thailand, China and Japan. There are many fruits that can be used in this process; the most popular one that artists use are watermelons, apples, strawberries, pineapples, and cantaloupes.\nHistory.\nChina.\nMany believe that fruit carving originated in China during the Tang Dynasty, which lasted from AD 618-906. Fruit carving in China usually features mythological creatures, and animals. Not only is fruit carving used in cultural and traditional ceremonies, but also ordinary households are known for decorating plates with fruit carvings when they have guests over. Specifically, watermelon carving has been and still is very popular in China. Usually, the outside of the melon is carved on and the melon pulp is scraped out of the inside of the melon, so it can be used as a container to put food or flowers in. Chinese fruit carving is used to tell their legends and stories.\nEurope.\nFruit carving is included in Matthias Giegher's 1621 work \"Il Trinciante\" (\"The Carver\"), where he describes carving oranges and citrons into abstract patterns, shell-fish, four-legged animals and the Hapsburgs' double-headed eagle, but the art was not common in Europe or North America until the 1980s when several books on the topic were published.\nThailand.\nFruit carving is a significant part of Thai cultural heritage. Watermelon carving dates to the 14th century in Thailand during the Sukhothai dynasty. The annual Loi Krathong Festiva occurs each November where people in Thailand float lamps and lanterns down a river to honor water spirits. One legend is that one of the king’s maids decorated her lantern with a watermelon carved with flower designs to impress him and that he was so pleased that he encouraged all Thai women to adopt the practice. 
The king also requested that fruit carving become part of the primary school curriculum. Thailand fruit carving features flowers, birds and floral patterns.\nJapan.\nThe Japanese emphasize the presentation of a dish and how the plate aesthetically appeals to others. Fruit carving in Japan is referred to as Mukimono. Mukimono began in ancient Japan in an effort to make dishes more appealing since the food was placed and served on an unglazed pottery plate, which had a rough look to it. Chefs would cover the plate in leaves and would fold them into different designs in order to make the dish look better.This technique eventually turned into carving fruit that would also be placed on the plates to enhance the appearance of the dish. At first, when this technique came out, vendors on the streets would add carved fruit to their food when customers made a special request, but now it is very common for all Japanese dishes to feature carved fruits. Fruit carving and garnishing is now a significant part of Japanese chef training.\nOverview.\nThe art of fruit carving uses many different tools, usually ordinary items but some specific to just fruit carving. All these tools give the artwork a different texture or help with its design. Some of the tools include:\nBefore carving a fruit, the necessary materials must be gathered. The usual process is to have the tools handy for when they are needed in one's steps towards creating a carving. There are two types of carvings that can be done. The first is Skin Carving, this is when the outer skin of the fruit (or vegetable) is carved to reveal the fleshy center, where the color is different than the outer skin to create a design using the contrast between the outer skin and flesh of the fruit. The second type of carving is Three Dimensional Carving, the purpose of this particular technique of carving is to carve the fruit to into a three dimensional object of the carver’s choice. 
The most popular three dimensional design is floral objects. It is easy to over-carve a fruit which leads to loss in nutrition, but it is always important to start off by outlining your carving on the fruit. Depending on the design that is being created it may take very little time or be more complex and use more time and concentration also different steps in the process are used for each design. Not one design is alike. An important aspect of fruit carving is that the fruit you carve must be suitable for the manner which one will display it. Most fruit carvings will need to be refrigerated before they are placed in the specific setting that is desired.\nArtists.\nThere are many artists and chefs who are known for their fruit carving skills. Each has a different technique. Many of these chefs have previously owned restaurants and now hold classes in this art. \nValeriano Fatica is an Italian fruit carver, known through his videos on Youtube that has attracted people to his artwork around the world. He has carved many different fruits at a large scale.\nJimmy Zhang is a fruit carver from China. He has won many awards in the culinary area and has also been featured in many newspapers across the globe for his skills. He teaches classes on how to carve fruit and vegetables and master the skills and learn history about the way China has created its fruit carving industry.\nCarl Franklin Jones, an expert in the art of fruit carving, practices in the United States. He is known for his fruit carving sculpture that was created for Ivanka Trump's wedding. He also holds a catering businesses in Tennessee. Jones was a business owner of many franchises also in Tennessee before starting his catering business. Today Jones travels the world and hosts mentoring programs for young ambitious fruit carving artists and chefs.\nFruit carving today.\nSome people perform fruit carving professionally. Some chefs utilize fruit carving as a culinary technique. 
Once fruit carvers have mastered the techniques past the intermediate stage and become professionals, they can price their services to restaurants, professional caterers, hotels and resorts. Professional fruit carvers can also create centerpieces and displays for various events, such as parties and wedding receptions. On a smaller scale, fruit carvers can present a dish with decorative garnishing to add an aesthetically pleasing experience to their viewers.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693235","title":"Corte Capitanale","body":"\nCorte Capitanale\n\nThe Corte Capitanale is a former courthouse in Mdina, Malta, which currently serves as a city hall. It was built in the Baroque style between 1726 and 1728, to designs of the French architect Charles François de Mondion. The building is linked to Palazzo Vilhena, but it has its own entrance and façade.\nHistory.\nThe Corte Capitanale was built between 1726 and 1728 along with the rest of Palazzo Vilhena, the Grand Master's official residence in Mdina. The building was mainly a courthouse, but it also served as the seat of the \"Capitano della Verga\". Its linking to the palace was a symbolic gesture to convey the fact that the courts were under the jurisdiction of the Order of St. John. The courthouse was also linked to the Bishop's Palace through a now-blocked underground passage, indicating the Church's role in the courts. The building remained a courthouse until 1818.\nToday, the Corte Capitanale is Mdina's city hall, being the seat of the city's local council. The council considers the building as inadequate, and in 2012 it requested to move its premises to the Banca Giuratale. It is not regularly open to the public, but the main hall is occasionally open with temporary historical or cultural exhibitions.\nThe building is a Grade 1 national monument and it is listed on the National Inventory of the Cultural Property of the Maltese Islands.\nArchitecture.\nThe Corte Capitanale is built in the French Baroque style. The façade is decorated by superimposed Tuscan and Corinthian pilasters, and a cornice along roof level. A balcony is located above the main doorway, and it is decorated with allegorical statues of Justice and Mercy. The inscription \"Legibus et Armis\" (by using laws and arms) is inscribed below the centrepiece of the façade.\nThe courthouse incorporates some prison cells and dungeons, which had been built in the 16th century. 
The building is also linked to a loggia known as Herald's Loggia, from which town criers used to announce decrees to the people. The loggia also predates the courthouse, and it is believed to date to the 17th century.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693247","title":"Le Touquet AC","body":"\nLe Touquet AC\n\nLe Touquet Athlétic Club Football Côte-d'Opale, commonly known simply as Le Touquet, is a French association football club based in the commune of Le Touquet-Paris-Plage in the Pas-de-Calais department of northern France. The club was founded in 1933 as the result of a merger between two local clubs, \"Olympique Touquettois\" and \"US Le Touquet-Paris-Plage\", and adopted its current name in 1996. Its stadium is named after former France, Paris Saint-Germain and Liverpool manager Gérard Houllier, who was a player and coach at the club during the 1970s.\nAlthough the club has spent much of its history in the lower reaches of the French football league system, they competed in Division 2 during the 1988–89 season. The men's senior team regularly competes in the Coupe de France, the country's foremost knock-out competition.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693269","title":"Jorge Miguel Machado Almeida","body":"\nJorge Miguel Machado Almeida\n\nJorge Miguel Machado Almeida (born 22 September 1990 in Vila Nova de Famalicão) is a Portuguese footballer who plays for F.C. Famalicão as a defender.\nFootball career.\nOn 16 September 2015, Almeida made his professional debut with Famalicão in a 2015–16 Segunda Liga match against Oliveirense.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693271","title":"Sir Edmund Ralph Verney, 6th Baronet","body":"\nSir Edmund Ralph Verney, 6th Baronet\n\nSir Edmund Ralph Verney, 6th Baronet (born 28 June 1950) succeeded to the title of 6th Baronet Calvert, of Claydon House, Buckinghamshire on 17 August 2001.\nPersonal life.\nVerney is the son of Sir Ralph Verney, 5th Baronet and Mary Vestey. He married Daphne Primrose Fausset-Farquhar, daughter of Colonel Hamilton Farquhar Fausset-Farquhar, in March 1982 and they have two children: Andrew Nicholas Verney (b. 1983) and Ella Verney (b. 1985).\nHe was educated at Harrow School, London and went to University of York. He is a fellow of the Royal Institution of Chartered Surveyors.\nHe held the office of High Sheriff of Buckinghamshire from 1998 to 1999.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693274","title":"Vaia Dirva","body":"\nVaia Dirva\n\nVaia Dirva (born ) is a retired Greek female volleyball player, who played as a middle blocker. She was part of the Greece women's national volleyball team at the 2001 Women's European Volleyball Championship and 2002 FIVB Volleyball Women's World Championship in Germany. On club level, she played most notably for Olympiacos.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693283","title":"Vado","body":"\nVado\n\nVado may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693286","title":"Fidanka Saparefska","body":"\nFidanka Saparefska\n\nFidanka Saparefska (born ) is a retired Greek female volleyball player, who played as a middle blocker. She was part of the Greece women's national volleyball team at the 2001 Women's European Volleyball Championship and 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Panathinaikos Athen.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693293","title":"Tatiana Smyrnidou","body":"\nTatiana Smyrnidou\n\nTatiana Smyrnidou (born ) is a retired Greek female volleyball player, who played as a universal. She was part of the Greece women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Filathlitikos Thessaloniki.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693301","title":"General Council of Burmese Associations","body":"\nGeneral Council of Burmese Associations\n\nThe General Council of Burmese Associations (GCBA), also known as the Great Burma Organisation (; \"Myanma Ahthinchokgyi\"), was a political party in Burma.\nHistory.\nThe GCBA was formed at the 1920 conference of the Young Men's Buddhist Association following the student strike earlier in the year and Burma's exclusion from British proposals for limited self-government in Indian provinces. Its leadership included Chit Hlaing, U Pu and U Kyaw Dun. The new party held rallies to pressurise the British to extend the self-government plans to Burma. A proposal known as the Craddock Plan to give ethnic minorities separate representation was opposed by the GCBA, which saw it as an attempt at divide and rule.\nIn 1922 the British agreed to extend the Indian system to Burma, and elections were scheduled for November. However, this caused a split in the GCBA, with the majority calling for a boycott and others calling for participation in the elections. This eventually led to 21 dissidents leaving to form the 21 Party, which emerged as the largest faction in the Legislative Council following the elections.\nThe GCBA split again in the build-up to the 1925 elections due to differences over another boycott, as well as the organisation's finances and the role of monks. Dissidents left to form the U Chit Hlaing Faction, which subsequently splintered into the Home Rule Party and the Hlaing-Myat-Paw GCBA. The rump of the GCBA became known as the Soe Thein GCBA, named after its leader U Soe Thein.\nAnother split occurred in 1929 when the organisation was split into the Ye-U group led by U Su and the Thetpan Sayadaws led by U Soe Thein. The latter collapsed in the early 1930s and many of its members joined other parties to contest elections. 
By 1932 the GCBA was effectively defunct, although its name continued to be used by some parties, including the United GCBA established in 1936.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693307","title":"Fred Hammill","body":"\nFred Hammill\n\nFrederick Parkin Hammill (4 May 1856 - 8 July 1901) was a British trade union activist, and a co-founder of the Independent Labour Party.\nCareer.\nKnown generally as \"Fred\", Hammill was born in Leeds on 4 May 1856, trained as an engineer, and moved to London to work at the Royal Arsenal in Woolwich, where he became a well-known labour activist and trade unionist.\nHammill spoke in defence of John Burns in trials after the 1887 Trafalgar Square Riot, was active in the London Trades Council (seconding Burns's support for the 1891 Scottish rail strike) and in the TUC, and he would speak indoors and outdoors to crowds of up to 6,000 people. He joined the Fabian Society in the early 1890s.\nIn 1891 Hammill organised a strike of London bus and tram workers on pay and hours, and he was one of the founders of the Independent Labour Party. In 1893 he spoke at a demonstration and rally in Trafalgar Square on workers’ rights. Strongly associated with Tom Mann and with Will Crooks' Poplar-based Labour movement, Hammill helped establish the Woolwich ILP in 1894, with Robert Banner.\nIn 1894, Hammill became a full-time organiser for the Fabian Society in Durham. A member of the Amalgamated Society of Engineers (ASE), in July 1895 Hammill was the first socialist to stand for election to parliament as an ILP candidate in Newcastle. Unsuccessful, he changed tack to run a pub (The Swan in Topcliffe in Yorkshire), for which he was criticised politically.\nHe was elected to the Thirsk Rural District Council in 1901.\nHe died on 8 July 1901 from influenza, aged 45 years.\nPersonal life.\nWhen Fred Hammill was a child, his family lived in a pub (the Grey Mare Inn, 132 Low Road, Hunslet) in Leeds, run by his father Thomas.\nHammill married Ada Peel (9 July 1860 – c. Feb 1940) and they had three children (Arthur Earnest (1880-1945), Helen (1882-1904), Gertrude Wright (1888-1959)). 
After moving to London from Leeds, they lived at 25 Coxwell Road in Plumstead for a period (c. 1890 to 1892).\nAda's father Joseph Peel was an inn-keeper.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693315","title":"Tingvatn","body":"\nTingvatn\n\nTingvatn is a town in Hægebostad municipality in Norway. The town has a little over 100 inhabitants and is the administrative center of Hægebostad, Vest-Agder. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693325","title":"Li Guoying","body":"\nLi Guoying\n\nLi Guoying (; born January 1964) is a Chinese politician, serving since 2015 as the Deputy Communist Party Secretary of Anhui province. He was born in Yuzhou, Henan province. He attended North China University of Water Conservancy and Electric Power in Zhengzhou. He also had a graduate degree in philosophy from the Central Party School, then a doctorate from Northeast Normal University in environmental science.\nHe worked initially in the Yellow River commission of the Ministry of Water Works. He spent most of his career in the water works system, as the assistant to the chief engineer, then the deputy director of the Yellow River commission, then chief engineer. He was then transferred to head the department of water works in Heilongjiang. In March 2011, he was named Vice Minister of Water Works; he stayed on the post until August 2015, when he was named deputy party chief of Anhui.\nLi was an alternate member of the 18th Central Committee of the Communist Party of China.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693329","title":"Dominika Smereka","body":"\nDominika Smereka\n\nDominika Leśniewicz-Smereka (born ) is a retired Polish female volleyball and beach volleyball player, who played as a libero. She was part of the Poland women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Palac Bydgoszcz.\nShe played beach volleyball with Irabela Rutkowska in 2000.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693352","title":"List of atmospheric pressure records in Europe","body":"\nList of atmospheric pressure records in Europe\n\nThe following is a List of atmospheric pressure records in Europe and the extratropical Northern Atlantic (it does not include localised events, such as those which may occur in tornados).\nLand-based observations in Europe.\nLand-based records for Europe:\nOther high values have been reported:\nPressure is thought to have risen above 1060 hPa in Europe on only 12 occasions between 1871–2010, in the years 1893, 1899, 1907, 1915, 1920, 1938, 1944, 1946, 1956, 1972, 1995 and 2008. To this list might also be included high pressure anticyclones in 1954 and 2012 (see above). The most notable high in Europe is that which reached peak in January 1907, this was an unusual development which brought high pressure to the west, this intense high pressure area holds the record across multiple countries in northeast Europe (Denmark, Norway, Sweden, Estonia, Latvia, Germany, Slovakia).\nAnother value reported:\nIceland.\nIceland list of atmospheric pressure over 1050 hPa.\nHigh pressure in Iceland has exceeded 1050 hPa 4 times in the twentieth century and five times in the nineteenth century.\nClimatic Research Unit Emulate data 1874–2002, also gives values on 10 March 1887 at Stykkishólmur 1052.43 hPa and also 9 January 1977 at the same location 1050.47 hPa.\nIn July the pressure in Iceland has only dropped below 975 hPa or lower three times over the entire record extending back to the 1820s. These cases were 974.1 hPa in Stykkishólmur on 18 July 1901, 974.3 hPa in Stykkishólmur on 19 July 1923 and 975.0 hPa in Reykjavík 11 July 1912. 
A recent low pressure on 30 December 2015 was recorded at Kirkjubaejarklaustur (associated with an area of low pressure known as Eckard/Frank) at 930.2 hPa, the lowest pressure recorded on land in Iceland since 1989.\nFaroe Islands.\nThe Danish Meteorological Institute report record atmospheric pressure for the Faroe Islands (since 1961) as:\nClimatic Research Unit Emulate data 1874–2002 give 3 dates when pressure exceeded 1050 hPa in Tórshavn.\nIreland.\nMet Éireann list the following national records for atmospheric pressure:\nUnited Kingdom and Ireland.\nFor the United Kingdom, the Met Office record the record figures for atmospheric pressure (which are nominally since 1870) as:\nThough the lowest pressure may be second to the Night of the big wind low which saw a value of at Sumburgh Head, Shetland on non-calibrated, non-standard equipment 6-7 January 1839, with the mainland at Cape Wrath reporting an observed pressure of .\nUnited Kingdom list of atmospheric pressure over 1050 hPa.\nIn the period of instrumental measurement the atmospheric pressure has exceeded 1048 hPa somewhere over the United Kingdom and Ireland on 17 occasions. On 9 of these times the pressure has exceeded 1050 hPa- a value which has not been exceeded since 1957 in Ireland, but has not been surpassed since 26 January 1932 over the UK. Intense high pressure is usually seen during midwinter with 7 of the 9 occasions where 1050 hPa has been exceeded occurring in January.\nPressure values have been recorded to have exceeded 1050 hPa in all areas of the UK and Ireland except south east England, though values close to this are documented from January 1882 and January 1905.\nUnited Kingdom monthly minimum figures for atmospheric pressure.\nCyclone Oratia is estimated to have reached a low of 941 hPa in peer reviewed literature, though the lowest pressure occurred between Aberdeen and Norway over the North Sea and is not a land-based observation. 
The lowest land-based reported UK pressure during this storm was recorded from RAF Fylingdales at 951.2 hPa.\nOn 7 September 1995, Scilly Isles, reported a low pressure of 966 hPa. The lowest minimum recorded values for the months May to August lie within 0.5 of 968 hPa.\nThe 20th Century low pressure record in the UK occurred on 20 December 1982 at Sule Skerry it may have dropped as low as 936 mbar.\nNorway.\nYr.no the joint venture between the Norwegian Broadcasting Corporation and the Norwegian Meteorological Institute give the national pressure records as:\nBoth records in same winter as each other and those of Denmark.\nDenmark.\nThe Danish Meteorological Institute report record barometric pressure for the Denmark (since 1874) as:\nDanish records both occurred within a month during the same winter, and same winter as Norwegian records.\nThe Danish September record was beaten on 29 September 2015 with pressure over 1042.2 hPa recorded in Østerbro Copenhagen, the previous September record dated from September 18, 1904, where the pressure came up to 1038.8 hPa at Hammer Odde Lighthouse, Bornholm.\nSweden.\nThe Swedish Meteorological and Hydrological Institute give the nation's barometric records as:\nFinland.\nAccording to the Finnish Meteorological Institute:\nThough a reported low value by Weather Underground weather historian Christopher Burt on 1 March 1990 at an unknown location is reported at 939.7 hPa.\nBaltics.\nMaximum pressure in Europe 22–23 January 1907 recorded in Pärnu, Estonia and Riga, Latvia at 1067.1 mbar. The Free University of Berlin state the European air pressure record is 23 January 1907 in Riga at 1068.7 hPa.\nEstonia.\nAs reported by the Estonian Weather Service\n‡The Estonian Weather Service report on their website the record maximum observed air pressure in the country as 1060.3 hPa recorded 23 January 1907 in Tallinn. 
This figure is not supported by NOAA reanalysis charts and the values reported from neighbouring Finland and Latvia probably make this figure an underestimation or error. A possible maximum pressure value for the whole of Europe is thought to have occurred during the 22-23 January 1907 high pressure event with a record set in Pärnu, Estonia and Riga, Latvia at 1067.1 mbar. Though this value is exceeded by the value on 23 January 1907 in Riga reported at 1068.7 hPa by the Free University of Berlin's student generated reports.\nLithuania.\n23 January 1907 1065.1 hPa.\nFrance.\nMétéo-France figures from 1951-2012.\nthough other figures are also listed which predate Météo-France's records.\n29 January 1905, a powerful anticyclone covers all of Europe and the atmospheric pressure reached a record value of 1049.3 hPa in Paris.\nBelgium.\nThe Belgian Royal Meteorological Institute gives the national record values as:\nNetherlands.\nThe Dutch Royal Netherlands Meteorological Institute lists the following as national records:\nGermany.\nThe German weather service (DWD) give the\nOther record figures and locations are also presented:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693374","title":"Alvin McCoy","body":"\nAlvin McCoy\n\nAlvin Scott McCoy (born July 14, 1903) was a journalist of \"The Kansas City Star\" who won the Pulitzer Prize in 1954 for local reporting and an outstanding work published the previous year about a series of articles that drove C. Wesley Roberts to resign his RNC chairmanship.\nBiography.\nAlvin Scott McCoy was born on July 14, 1903, in Cheney, Kansas. \nHe received an A.B. degree in 1925 from the University of Kansas at Lawrence, majoring in chemistry.\nAfter spending two years at Ford Motor Company agency in Dodge City, Kansas, and one year\ntraveling around the world in 1928–29, McCoy was first employed in \nnewspaper work as a reporter of the \"Evening Eagle\" in Wichita, Kansas.\nHe spent eighteen months on this newspaper and on the Wichita \"Morning Eagle\".\nIn November, 1930, he joined the \"Kansas City Star\" as a reporter and worked on\ngeneral assignments.\nYears later, McCoy served as the Star’s Pacific War correspondent in 1945. \nThat same year he became also a Kansas correspondent of the \"Kansas City Star\", for which he covered\nstate politics, legislature, news, features and some editorial writing as well as\nscientific stories.\nIn 1954 the Board members decided that the Pulitzer Prize in the Local\nReporting, No Edition Time category should go to Alvin Scott McCoy of the \nKansas City Star from Missouri, “for a series of exclusive stories which led to the \nresignation under fire of C. Wesley Roberts as Republican National Chairman.”\nRoberts was accused of collecting a $10,000 commission on the sale of a hospital to the State of Kansas which the state already owned.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693379","title":"Jacksons, New Zealand","body":"\nJacksons, New Zealand\n\nJacksons is a settlement and railway station in the Grey District of the West Coast of New Zealand. The TranzAlpine Express now passes through Jacksons.\nJacksons was the railhead for the Midland Line from Stillwater via Moana from 1894, until the line was extended to Otira in 1899. The station opened on 1 March 1894 (using a building from Teremakau on 23 February 1894), and closed on 3 November 1986.\nThe \"Jackson’s Accommodation House\", now the \"Jackson Tavern\", was bought by Michael Jackson in 1870; Michael and his brother Adam from Scotland had moved there after spending some time on the Otago Goldfields. The hotel was a stop for Christchurch-Hokitika coaches. The hotel was swept away in a flash flood in 1871, and was rebuilt as the Perry Range Hotel. In 1910 it was rebuilt and in 1970 it passed out of the Jackson family, but was renamed the \"Jackson Tavern\". Adam moved to Canterbury, but his eldest daughter Jessie married William Aicken who began the \"Aickens Accommodation House\" 10 km away at Aickens.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693391","title":"Ewa Kowalkowska","body":"\nEwa Kowalkowska\n\nEwa Kowalkowska (born ) is a retired Polish female volleyball player, who played as a wing spiker. She was part of the Poland women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. She was awarded the best server prize at the 1999 Women's European Volleyball Championship. On club level she played with Palac Bydgoszcz.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693393","title":"Athanasius Sandalaya","body":"\nAthanasius Sandalaya\n\nAthanasius Sandalaya, also known as Athanasius Sandloyo or al-Sandali, was the Patriarch of Antioch, and head of the Syriac Orthodox Church from 756 until 758.\nBiography.\nOriginally a monk at the Monastery of Qartmin, Athanasius became Bishop of Maiperqat, a bishopric subordinate to the Metropolitan Bishop of Amid. During his tenure as bishop, Athanasius is known to have used church funds to obtain the support of the Caliph Marwan II to strengthen his position.\nBy 742/743, Athanasius had been granted the title of Metropolitan of Mesopotamia, potentially due to the simultaneous growth and decline of Maiperqat and Amid respectively, as well as the decrepitude of Severus, Bishop of Amid.\nAs metropolitan, Athanasius granted his student Isaiah of Ashparin administrative control of the greater part of the diocese of Amid as a result of Severus' inability to lead the diocese. During the late 740s, however, this appointment caused Athanasius to come into conflict with the patriarch Iwannis I who ordained a certain Abay, former Bishop of Arzun, as the new bishop of Amid. This conflict was exacerbated by Iwannis' failure to ordain Dionysius, Athanasius' appointment to the empty see of Tur Abdin, after the death of its former incumbent Athanasius of Nunib. \nAt the Synod of Tella in 752, Athanasius expanded his authority as metropolitan from the area of the former Roman province of Mesopotamia to the entirety of Upper Mesopotamia through the use of implicit threats of reprisals from the Muslim authorities, despite the protests of the bishops. Athanasius commemorated his success with the erection of a new cathedral in the city of Maiperqat. He later used his new authority to ordain his student Iwannis Isaac as Bishop of Harran and depose the bishops of Samosata and Singara. 
Athanasius also succeeded in having Iwannis Isaac ordained as the patriarch and successor to Iwannis I in 754. Daniel, son of Moses of Tur Abdin, later claimed that Athanasius secured Iwannis' elevation to the patriarchal office by organising the election fraudulently. Athanasius succeeded Iwannis in 756 and served as patriarch until 758.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693398","title":"Willie Borland","body":"\nWillie Borland\n\nWilliam 'Willie' Borland (born 21 September 1952) was a Scottish footballer who played for St Mirren, Barrow, Dumbarton and Stranraer.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693401","title":"Ali Helichi","body":"\nAli Helichi\n\nAli Helichi () is an Iranian football defender who currently plays for Iranian football club Esteghlal Ahvaz in the Iran Pro League.\nClub career.\nHelichi joined Esteghlal Ahvaz in summer 2014. He made his professional debut against Gostaresh Foolad on September 26, 2015 as a substitute for Armin Mirdoraghi.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693410","title":"Peter I van den Gheyn","body":"\nPeter I van den Gheyn\n\nPeter van den Gheyn (; 1500–1561) was a bell-founder of the Spanish Netherlands (now Belgium).\nLife.\nPeter was the son of Willem van den Gheyn, who established himself as a bell-founder at Mechelen in 1506. Peter followed his father into the trade, establishing his own foundry in 1528. His estate was known as or .\nHe cast peal, table, and clock bells, but was most famed for the skill exhibited in his large bells. He is thought to have cast the bell of the \"Mary Rose\". Another of his bells hangs at St Peter's College, Cambridge.\nHis two sons Peter and Jan both joined the family business as well.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693415","title":"Leese-Stolzenau railway station","body":"\nLeese-Stolzenau railway station\n\nLeese-Stolzenau () is a railway station located in Leese and near Stolzenau, Germany. The station is located on the Weser-Aller Railway. The train services are operated by Deutsche Bahn.\nTrain services.\nThe following services currently call at the station:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693423","title":"Nationalist Party (Burma)","body":"\nNationalist Party (Burma)\n\nThe Nationalist Party () was a political party in Burma in the 1920s led by U Pu and U Ba Pe.\nHistory.\nThe party was a successor to the 21 Party led by U Ba Pe, which had emerged as the largest in the 1922 elections after winning 28 seats, but had not been able to form a government. The new party called for a reduction in Indian immigration to Burma and Indian landlords to be banned from owning land in Burma.\nIn the 1925 elections the Nationalist Party won 25 seats; despite being the largest party, it was not able to form a government.\nIn 1926 or 1927 the party merged with the Home Rule Party and the Swaraj Party to form the People's Party.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693430","title":"Shavit Matias","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48693444","title":"Flora Plumb","body":"\nFlora Plumb\n\nFlora Plumb (born October 14, 1944) is an American television and film actress.\nPlumb was born Flora June Plumb, in Los Angeles, California. She made her TV debut in \"The Wild Wild West\" in 1969, in a bit part. She went on to feature appearances in several TV series, including \"Marcus Welby, M.D.\", \"The F.B.I.\", \"Lovers and Friends\" (a spinoff of the soap opera \"Another World\"), \"Lou Grant\", and \"Quincy, M.E.\". She also appeared in the 1978 film \"Malibu Beach\".\nMore recently, she provided the voice of Oska for \"Guild Wars 2\" and appeared in the 2010 short film \"Death Panel\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693452","title":"Katarzyna Mroczkowska","body":"\nKatarzyna Mroczkowska\n\nKatarzyna Mroczkowska (born ) is a retired Polish female volleyball player, who played as a middle blocker. She was part of the Poland women's national volleyball team at the 2001 Women's European Volleyball Championship and 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Palac Bydgoszcz.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693453","title":"Home Rule Party (Burma)","body":"\nHome Rule Party (Burma)\n\nThe Home Rule Party () was a political party in Burma in the 1920s led by Tharrawaddy U Pu.\nHistory.\nThe party was formed as a breakaway from the General Council of Burmese Associations prior to the 1925 elections due to the GCBA continuing its calls for an electoral boycott. The elections saw the new party win 11 of the 80 seats.\nIn 1926 or 1927 the party merged with the Nationalist Party and the Swaraj Party to form the People's Party.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693484","title":"Petershagen-Lahde railway station","body":"\nPetershagen-Lahde railway station\n\nPetershagen-Lahde () is a railway station located in Petershagen, Germany. The station is located on the Weser-Aller Railway. The train services are operated by Deutsche Bahn.\nTrain services.\nThe following services currently call at the station:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693493","title":"Filipe Silva Tavares Vieira","body":"\nFilipe Silva Tavares Vieira\n\nFilipe da Silva Tavares Vieira (born 28 October 1996 in Santa Maria da Feira) known as Vieirinha, is a Portuguese professional footballer who plays for C.D. Feirense as a midfielder.\nFootball career.\nOn 29 November 2015, Vieirinha made his professional debut with Feirense in a 2015–16 Segunda Liga match against Penafiel.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693494","title":"Swaraj Party (Burma)","body":"\nSwaraj Party (Burma)\n\nThe Swaraj Party () was a political party in Burma in the 1920s.\nHistory.\nThe party was formed by former members of the General Council of Burmese Associations prior to the 1925 elections, and was named after the Indian Swaraj Party. Its leadership included Ba Maw, N. C. Bannerjee and U Tok Kyi, who was head of the party. After his death he was succeeded by U Paw Tun.\nIn the 1925 elections the party won nine seats. In 1926 or 1927 it merged with the Nationalist Party and the Home Rule Party to form the People's Party. Following the dissolution of the People's Party in the early 1930s, most of the former Swaraj Party leadership joined the Anti-Separation League.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693496","title":"Peter McQuade","body":"\nPeter McQuade\n\nPeter Murray McQuade (born 4 November 1948) was a Scottish footballer who played for Dumbarton, East Fife and Berwick Rangers.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693501","title":"2014–15 Uganda Super League","body":"\n2014–15 Uganda Super League\n\nThe 2014-15 Ugandan Super League is the 48th season of the official Ugandan football championship, the top-level football league of Uganda.\nOverview.\nThe 2014-15 FUFA Super League was contested by 16 teams, including Lweza FC, Sadolin Paints FC and Rwenshama FC who were promoted from the Ugandan Big League at the end of the 2013-14 season.\nParticipants and locations.\nSome of the Kampala clubs may on occasions also play home matches at the Mandela National Stadium.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693517","title":"Sheikh Tariq Rashid","body":"\nSheikh Tariq Rashid\n\nSheikh Muhammad Tariq Rasheed, Urdu: شيخ محمد طارق رشيد, (born in Multan) is a Pakistani politician who is affiliated with Pakistan Muslim League Nawaz. He was previously Member of the National Assembly of Pakistan (MNA) (2010–2013) and Mayor of Multan (1998–2001). He is also the General Secretary of the Pakistan Muslim League Noon Multan City.\nFamily and education.\nHe completed his initial education at Millat High School and then Government College in Multan and graduated from Multan.\nTariq Rasheed hails from a family that traces its roots to Jhajjar tehsil located in Rohtak district, India. His Grandfather, Sheikh Abdus Samad was assassinated while migrating to Pakistan at the time of the independence of Pakistan in 1947. Tariq Rasheed and his family represent a community which has large business and political interests in the urban politics of Multan city.\nHis father, Sheikh Muhammad Rasheed, was his political mentor; the former Member of Federal Parliament (Majlis-e-Shoora) in 1980s nominated by General Zia-ul-Haq and elected Member of National Assembly of Pakistan (MNA), when elections were held on a non-party basis for the term 1985–1988.\nTariq Rasheed is married and has two sons. The eldest son Sheikh Hashim Rasheed is currently studying abroad and the other son Sheikh Hassan Tariq is studying Law from TILLS.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693535","title":"Oma maa","body":"\nOma maa\n\n (My Own Land or Our Native Land, literally: Own land/country), Op. 92, is a cantata by Jean Sibelius. He composed the work on a Finnish text, a poem by Kallio which he chose himself, for mixed chorus and orchestra, to celebrate the tenth anniversary of the National Chorus. Sibelius completed the cantata on 18 March 1918. conducted the first performance.\nThe piece was written at a time when the Red Guards, supporting the Russian administration of Finland, were losing their influence. Sibelius had been invited by the director of te national choir of Finland to contribute something for a concert celebrating the tenth anniversary of the choir's establishment.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693538","title":"Naganowski","body":"\nNaganowski\n\nNaganowski (feminine: Naganowska) is a Polish-language surname. It may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693543","title":"Mary Bartlett Bunge","body":"\nMary Bartlett Bunge\n\nMary Bartlett Bunge (born 1941) is a distinguished American neuroscientist currently researching a cure for paralysis at University of Miami, where she is a Professor of Cell Biology. Bunge was born in a time where women were still in separate spheres from men and limited by society to domestic life. She challenged these expectations set by society and followed her passion for science, becoming an inspirational role model for women today.\nEarly life.\nMary Bartlett was born on April 3, 1931 in New Haven, Connecticut to George Chapman Bartlett and Margaret Elizabeth Reynolds Bartlett. Her father built and renovated houses, including the house in which she grew up, whereas her mother worked as a painter and decorator. Neither of her parents had a college education, and her father thought that a college education was useless for women. Their careers were filled with an artistic expression that Mary found appealing. After her grandmother taught her how to sew, she expressed herself through art and fashion by designing and making all of her own clothes with the ultimate dream to be a fashion designer in New York City. She strongly considered this career in fashion design, but eventually decided her art interests could just be hobbies. She was also interested in the sciences from a very young age, even though it was not considered a traditional option for women at the time. She developed this passion for biology when she was exploring the stream near her home in her leaky little row boat. She observed the tadpoles swimming around her and questioned how they developed into frogs. 
Unlike her art interests, she knew that in order to pursue her childhood passion for biology, she would need to acquire a higher education.\nEducation.\nMary Bartlett made the first step towards this higher education when she attended Simmons College in Boston to become a laboratory technician. This defied expectations for women at the time as the 1950s female college student was encouraged to marry, start a family, and put an end to her education. Only about a third of the women who entered college during the decade actually graduated. Only ten percent of working women entered a profession during this time. They instead settled for the traditional employment in secretarial, clerical, nursing, teaching, assembly lines, and domestic service, which were considered appropriate for women.\nDespite these statistics, Mary persevered, and at the end of her junior year at Simmons College, she was inspired to further her education while attending a program at Jackson Memorial Laboratory, where she witnessed a rabbit’s heart contract in a tissue culture. This instance triggered the realization that she did not want to be a lab tech; she wanted to do research, so when she graduated from Simmons College in 1953, she accepted the invitation to graduate school at University of Wisconsin Medical School from Dr. Robert Schilling. He was a professor in the Department of Medical Physiology who offered Mary a research assistantship position when she was studying to obtain her masters degree. They researched intrinsic factor, which is lacking from the gastric juices when one has the condition of pernicious anemia and cannot absorb vitamin B12. Their research had a clinical relevance that influenced her later research to be focused toward clinical applications. 
This work was the basis of her thesis, which allowed her to graduate with her masters degree in medical physiology in 1955.\nThere was implicit bias in society that women were not competent enough to excel in the science profession, so they were not always taken seriously when trying to attain this goal. Mary noted that Dr. Schilling was an exception to this and was an outstanding mentor to her. He helped set the high standards for her manuscripts when she was initially getting published. Women at the time struggled to get their work published because of the gender discrimination. When the author listed was a female name, people tended to reject the paper or not even read it, so women had to use their initials. Then, the author could not be labeled male or female, and the women had a better chance for equal evaluation of the work.\nWhile studying for her doctorate at University of Wisconsin Medical School, Mary worked in the Zoology Department with Dr. Hans Ris, who she also regarded as an outstanding mentor. She was grateful for his willingness to advise a young woman as she faced the extra challenges simply due to her gender. She noted that both of her two mentors, Dr. Schilling and Dr. Ris, greatly shaped and benefited her future. They were able to be gender blind when others could not and treated her as just another graduate student. With their support, she successfully graduated with her doctorate in 1960.\nPersonal life.\nWhile at the University of Wisconsin, Mary met a medical student named Richard Bunge, whom she married and shared her personal life as well as her career. They graduated together and moved to Columbia University to begin their post-doctorate research. Soon after settling in, the family doubled with the addition of two sons, Jonathan, born in 1962, and Peter, born in 1964.\nSince women perform most of the caregiving in society, they face more challenges than men in pursuing high level positions while balancing the family responsibilities. 
Bunge faced these challenges head on and was able to continue her career while attending to her motherhood responsibilities, but not without sacrifices. To balance family and work life, Bunge worked part time for eight years as a Research Associate at Columbia University. It would have been too much for her to prepare lecture and teach on top of her research schedule and raising her sons, so she placed her tenure-track faculty member dream on hold.\nIn 1970, the family moved to accept faculty positions at Washington University School of Medicine. She chose to be a Research Assistant Professor rather than be on the tenure-track so she could continue raising her sons, who were still young. Instead, she adjusted to a full-time schedule. By 1974, she had started to teach and was promoted to Associate Professor with tenure. She was promoted again in 1978 to Professor. She was grateful for the quality of environment at Washington University, which made it possible for her to continue her career while being a part of her children's lives.\nResearch.\nRichard also enriched Mary’s life by introducing her to neuroscience, where she found her purpose and focused her research on while at Washington University School of Medicine. In particular, she focused on researching Schwann cells, which are cells that wrap around the axon of neurons to form the myelin sheath as an insulator to the neuron and to increase the speed impulses are conducted. One of her other major discoveries was that the oligodendrocyte was the cell that made the myelin sheath for the central nervous system. She first discovered this when she examined a section of a kitten’s spinal cord in an electron microscope with the oligodendrocyte cell body forming myelin at each end. 
She also demonstrated that myelin could be reformed in the mature mammalian spinal cord, which has an important clinical relevance in addressing Multiple Sclerosis and spinal cord injuries, where the myelin has been damaged.\nSince 1989, Bunge has been a leading part of the Miami Project to Cure Paralysis at University of Miami School of Medicine, where her research on myelin has been implemented. Her husband was invited to be the scientific director of the project, so she was able to work with him there, and when he died in 1996 from esophageal cancer, she took his place at the forefront of the project. This was a common way for women of this era to acquire leading roles in projects. Women used the careers of their husbands to gain access to the resources to further their own careers, and when they died, the women were able to take their place, avoiding possible gender discrimination. The project Bunge took over tests regeneration strategies that could lead to successful treatment of spinal cord injury.\nShe has the patent in “Schwann Cell Bridge Implants and Phosphodiesterase Inhibitors to Stimulate CNS Nerve Regeneration” from 2009 for the application of restoring function after a central nervous system injury. She has dozens of other patents including \"Methods and Systems for Neural Maintenance and Regeneration,\" \"Promoters of Neural Regeneration,\" and \"Phosphodiesterase 4 Inhibitors for Cognitive and Motor Rehabilitation.\" Her research is now being used for phase one of clinical trials, which gained approval from the FDA in 2012, to evaluate the safety of transplanting the Schwann cells of recently paralyzed patients into the site of their injury.\nPhase 1 of the clinical trial is the testing of the safety and efficacy of this technique. Each participant’s own Schwann cells are obtained from sural nerve biopsy, which is above the ankle. By obtaining these cells from the participants, there is minimal concern for immune rejection. 
The cells are then purified and processed in a culturing facility to generate the number of cells necessary to be transplanted into the injury site. This cell therapy is combined with an intense exercise and rehabilitation regiment over ten months for the trial. The participants are to be monitored for 5 years. So far, Phase 1 has shown promising results as millions of Schwann cells have been successfully transplanted into four subjects with no adverse effects.\nWhile the trial has been occurring, Bunge has been working on other combination treatments for future clinical trials. In 2014, she published in the Journal of Neuroscience the promising results of a strategy tested in rat Schwann cells that were engineered to secrete the growth factor D15A and the enzyme Chondroitinase ABC which alters scar composition. This combination lead to more axonal regeneration and functional improvement.\nBunge is extremely dedicated to her work, and although she considered retiring in 2010, she has remained in the lab to see through the success of the clinical trial.\nHonors.\nBunge has been a professor of cell biology, neurological surgery, and neurology at the University of Miami for 26 years now and has accumulated significant recognition for her research. In 1996, she received the Wakeman Award for Spinal Cord Repair. She is a three time recipient of the Javitis Neuroscience Investigator Award from the National Institute of Neurological Disorders and Stroke. She was the elected Chair of the Development of Women's Careers in Neuroscience Committee through the Society for Neuroscience from 1994 - 2002. In 2000, she received the Mika Salpeter Women In Neuroscience Lifetime Achievement Award for her leadership in advancing the careers of women in neuroscience. In 2001, she received the Christopher Reeve Research Medal for Spinal Cord Repair. 
She received the Christine E Lynn Distinguished Professor in Neuroscience Award in 2003 and the Lois Pope LIFE International Research Award in 2005. Her culminating recognition is being elected to the National Academy of Sciences Institute of Medicine, which is an extraordinary honor that indicates the extent of her professional achievement and commitment to service in health and medicine. Just last year, she was named a Health Care Hero by the Greater Miami Chamber of Commerce.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693547","title":"Joanna Szeszko","body":"\nJoanna Szeszko\n\nJoanna Szeszko (born ) is a retired Polish female volleyball player, who played as a universal . She was part of the Poland women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with SKRA Warschau.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693565","title":"Terry Mullen","body":"\nTerry Mullen\n\nTerence James 'Terry' Mullen (born 28 February 1956) was a Scottish footballer who played for Dumbarton, Falkirk, Stenhousemuir and East Stirlingshire.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693579","title":"La Tribuna (Paraguay)","body":"\nLa Tribuna (Paraguay)\n\nLa Tribuna was one of the most important daily newspapers in Paraguay's history. It was founded in 1925 in Asunción by Eduardo Schaerer, and was the country's leading newspaper for five decades. \"La Tribuna\" was the first Paraguayan paper to be widely published across the country. Politically, \"La Tribuna\" was positioned between liberalism and traditional national politics. It opposed the liberal government of José Patricio Guggiari, and especially the dictatorial regimes of Higinio Moríñigo and Alfredo Stroessner. When associated with opposition politics, the editors often became the target of persecution. Their crusade in favor of the Free Press in Paraguay gained attention abroad. In 1953, the newspaper's director, Arturo Schaerer, received the María Moors Cabot Prize from Columbia University.\nHistory.\n\"La Tribuna\" was founded in Asunción on December 31, 1925, by former Paraguayan president Eduardo Schaerer. \"La Tribuna\" was not Schaerer's first media outlet. In 1905, Eduardo Schaerer founded \"The Journal\" alongside Guadalberto Cardús Huerta and Adolfo Riquelme.\nAfter the death of President José Félix Estigarribia in 1940, General Higinio Morínigo became President. Morínigo persecuted many politicians and well known members of the liberal party. This persecution of the independent press resulted in the closure of \"La Tribuna\" several times. General Alfredo Stroessner ascended to the Presidency of Paraguay in 1954. During his Presidency, \"La Tribuna\" continued to exist under similar circumstances and was constantly threatened. Schaerer asked for support from ambassadors and international contacts to keep the newspaper in operation. 
The continuing existence of \"La Tribuna\" worried the dictatorial government.\nStarting in 1954, \"La Tribuna's\" director had the support of Carlos Ruiz Apezteguia, who denounced the abuse and crimes of the government and the breakdown of the rule of law. In November 1956, \"La Tribuna\" was raided and Ruiz Apezteguia was arrested, tortured and then abandoned in a boat on the shores of Clorinda, Argentina. Ruiz Apezteguia began his exile in Montevideo, Uruguay. Under international pressure, Ruiz Apezteguia returned to Paraguay in 1959 and resumed his journalistic work in the newspaper.\nDespite the political unrest and the persecution \"La Tribuna\" was subjected to in the following decades, the newspaper grew into one of the most respected newspapers on the continent. \"La Tribuna\" had agencies in many countries and grew from a circulation of 2,000 daily copies at its founding to more than 70,000 by the year 1965. In 1953, Arturo Schaerer and his newspaper were given the oldest international journalism award, the Maria Moors Cabot prize from Columbia University, for the paper's work as independent press publication placing itself in opposition to the totalitarian regimes in Paraguay.\nArturo Schaerer remained director of \"La Tribuna\" until May 15, 1972, when he was succeeded by Carlos Ruiz Apezteguia. At the time, Ruiz Apezteguia was a journalist and the husband of Schaerer's daughter, Myriam, and had been an involved partner and manager of \"La Tribuna\" for more than two decades. As director of La Tribuna, he denounced abuses in the negotiations associated with the Treaty of Itaipu and Yacyreta (with Brazil and Argentina respectively) on the construction of dams.\nIn 1976, \"La Tribuna\" was closed, along with the newspaper \"Ultima Hora\". \"La Tribuma\" reopened in 1979. In 1983 \"La Tribuna\", with new owners, became the newspaper Noticias.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693582","title":"Adrian Patrick","body":"\nAdrian Patrick\n\nAdrian Leroy John Patrick (born 15 June 1973) is a retired English sprinter who specialised in the 400 metres. He represented Great Britain at one outdoor and two indoor World Championships.\nHis personal bests in the event are 45.63 seconds outdoors (Lausanne 1995) and 46.77 seconds indoors (Birmingham 1999).\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693584","title":"Lindum Hockey Club","body":"\nLindum Hockey Club\n\nLindum Hockey Club is a field hockey club located in Lincoln, England. The club was formed in the Spring of 2015, a merger between Lincoln Hockey Club and Lincoln Roses Hockey Club. Lindum Hockey Clubs plays its home games at the Lindum Sports Association on St Giles Avenue in Lincoln.\nThe Mens 1st Team play in the North Hockey Association Division One, while the Ladies 1st Team play in the East League One North. The majority of the other teams compete in the Yorkshire Hockey League. As Lincoln's only field hockey club, the club fields eight men's teams, including a development side, six ladies' teams, a veterans side and a well established junior hockey section.\nHistory.\nDespite being founded only relatively recently, the club's history stretches back over a combined 200 year period. Lincoln Roses Hockey Club began life as a part of the Sports Club of Rose Brothers (Gainsborough) Limited, a manufacturer of sweet wrapping equipment. Gainsborough Rose Hockey Club, as they were known at the time following an amalgamation with Gainsborough Ladies Hockey Club, started to take on organised hockey with the formation of the Lincolnshire Hockey League. Later, with the advent of artificial turf becoming the de-facto playing surface in the sport, facilities were sought in Lincoln and in time a formal link with Lincoln University saw the club renamed Lincoln Roses Hockey Club.\nLincoln Hockey Club was built on the foundations of Lincoln Ladies Hockey Club, started in 1898. The club's first links with the Lindum Sports Association came about in 1946 where the men’s club was also formerly created - named Lincoln Imps Hockey Club. The Lindum Sports Association was to be the base for both hockey clubs over the next 43 years before the need to use artificial turf took the club elsewhere in the city for their home games. 
In 1980 the two clubs were merged to became a single entity, continuing to be called Lincoln Imps Hockey Club, until 1998 when it became simply Lincoln Hockey Club. Olympic medalist and England / Great Britain International player Georgie Twigg is a former player of Lincoln Hockey Club.\nThe Merger.\nAn attempt to arrange a merger between Lincoln Roses Hockey Club and Lincoln Hockey Club in the mid to late-2000s proved unsuccessful and the two clubs continued to provide opportunities to play hockey and promote the sport side-by-side in the same city. In 2013 a purpose-built artificial turf hockey pitch was laid at the Lindum Sports Association, in part funded by England Hockey and Sport England. Some of the logic behind the funding of the new facility was that two hockey clubs would benefit and so both Lincoln Hockey Club and Lincoln Roses Hockey Club were playing most of their home games at the same location. In early-2014, a team consisting of Gary Johnson, John Harrison, Mark Sadler and John Sisman put in place the plans and foundations for a merger of the two clubs. Extraordinary General Meetings were called at both clubs to present a vision for the future of hockey in Lincoln and, with that, both clubs formerly dissolved on June the 8th 2015 and, on the same date, Lindum Hockey Club was created in their place.\nBranding.\nIn order to strike a balance between the two clubs, the decision was made to start afresh with branding. The new club name wouldn't involve any merging of the two former names but instead adopt the name used at the Lindum Sports Association, which is also used by other member clubs using the same facilities (the Lindum Cricket Club and Lindum Squash Club). The logo was inspired by Lindum Cricket Club's logo; the Roman of the 9th Roman Legion who founded Lindum Colonia.\n2015 / 2016 Season.\nAs well as the successful merger of the two former hockey clubs in the season, the season saw an affiliation in excess of 720 players. 
The Mens 1st Team also played Beeston Hockey Club at home in a cup clash that saw record crowds at the pitch-side, and the club organised and ran a successful Fireworks Event at the Lindum Sports Association.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693592","title":"Bullhorn, Inc.","body":"\nBullhorn, Inc.\n\nBullhorn is a cloud computing company headquartered in Boston, Massachusetts. The company provides customer relationship management (CRM) software that is primarily used by professional services companies. As of 2015, the company reported more than 10,000 customers in more than 150 countries. Besides its Boston headquarters, the company has operations in St. Louis, London, and Sydney.\nHistory.\nBullhorn was founded in 1999 by Roger Colvin, Barry Hinckley, and Art Papas. Papas continues to serve as CEO. The company originally launched as a platform for freelancers to find and collaborate on work, but in 2001 changed its focus to build CRM software for vertical markets.\nThe company historically focused on providing software-as-a-service to third-party staffing and recruiting firms, allowing them to manage business operations on a single web-based platform. It became one of the largest providers of technology to the staffing and recruiting market, reportedly growing revenue from $2 million in 2004, to $20 million in 2009, $33.6 million in 2011, and $67 million in 2013.\nBullhorn raised its first round of venture capital funding in 1999 with a $4 million investment from GE Asset Management and Internet.com. It then raised $26 million from General Catalyst Partners and Highland Capital Partners in 2008. 
In June 2012, Vista Equity Partners acquired Bullhorn for a reported price of several hundred million dollars.\nSince being acquired, the company has expanded into new markets, selling its CRM software to additional industries, beyond staffing and recruiting, and introducing Bullhorn Pulse, a data-mining and analysis tool that gives companies information about their relationships with customers.\nIn July 2015, the industry research firm Gartner included Bullhorn for the first time in its Magic Quadrant report on salesforce automation alongside other companies that it deems to be leaders in providing tools to support the automation of sales and account management activities and processes.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693597","title":"Wanlapa Jid-ong","body":"\nWanlapa Jid-ong\n\nWanlapa Jid-Ong (, born ) is a retired Thai female volleyball player, who played as a setter. She was part of the Thailand women's national volleyball team at the 1998 FIVB Volleyball Women's World Championship in Japan. and at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Pepsi Bangkok.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693605","title":"Sommai Niyompon","body":"\nSommai Niyompon\n\nSommai Niyompon (, born ) is a retired Thai female volleyball player, who played as a wing spiker. She was part of the Thailand women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Pepsi Bangkok.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693610","title":"Nurak Nokputta","body":"\nNurak Nokputta\n\nNurak Nokputta (, born ) is a retired Thai female volleyball player, who played as a wing spiker. She was part of the Thailand women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Pepsi Bangkok.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693612","title":"Mathias Denman","body":"\nMathias Denman\n\nMatthias Denman (1760 - 1838) is one of the founders of the settlement that eventually became Cincinnati, Ohio.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693613","title":"Suphap Phongthong","body":"\nSuphap Phongthong\n\nSuphap Phongthong (, born ) is a retired Thai female volleyball player, who played as a middle blocker. She was part of the Thailand women's national volleyball team at the 2002 FIVB Volleyball Women's World Championship in Germany. On club level she played with Pepsi Bangkok.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693637","title":"Jane Fraser (banking)","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48693648","title":"Rudy-Kodzoff House","body":"\nRudy-Kodzoff House\n\nThe Rudy-Kodzoff House is a historic house at 2865 Mendenhall Loop Road in Juneau, Alaska. It is a concrete structure with Craftsman/Bungalow styling, built in 1915 for Charles Rudy, one of the first settlers of the Mendenhall Valley. It is the only surviving building of that period in the valley. It presently houses the offices and owner's residence of a mobile home park developed by Kodzoff family.\nThe house was listed on the National Register of Historic Places in 2015.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693676","title":"75th (Middlesex) Searchlight Regiment, Royal Artillery","body":"\n75th (Middlesex) Searchlight Regiment, Royal Artillery\n\n75th (Middlesex) Searchlight Regiment, Royal Artillery was an air defence unit of Britain's Territorial Army (TA) raised just before the outbreak of World War II, which served as part of Anti-Aircraft Command in the early part of the war. Later it changed role and served in Sicily and Italy, and reformed in AA Command after the war.\nOrigin.\nAs the international situation deteriorated in the late 1930s, the threat of air raids on the UK led to a rapid expansion in numbers of anti-aircraft (AA) units manned by members of the part-time TA. Formed in May 1939, the 75th (Middlesex) Searchlight Regiment of the Royal Artillery consisted of HQ and three searchlight batteries based at Cowley in Uxbridge.\nWorld War II.\nThe Blitz.\nAnti-Aircraft Command mobilised in August 1939, ahead of the declaration of war on 3 September, and the regiment took its place in 38th Light Anti-Aircraft Brigade (a formation composed entirely of searchlight units) in 1st AA Division, which had responsibility for defending London.\nAlthough AA Command and RAF Fighter Command had the advantage of the Chain Home radar network to detect air raids approaching the coastline, there was no radar coverage inland. In daylight the Royal Observer Corps and searchlight detachments tracked the progress of raids visually; at night, sound location had to be used. 1st AA Division devised a system of 14 fixed base-lines of sound locators to detect night raids approaching the London Inner Artillery Zone. These were linked by automatic telephone equipment to the operations room, where the angular plots were resolved to indicate grid squares where the Heavy AA guns in range could fire an unseen barrage. Detachments of 75th S/L Rgt were trained to operate these baselines. 
This 'Fixed Azimuth' system came into action in June 1940, in time for the opening of the night Blitz on London. It was later replaced when searchlight control (SLC) and gunlaying (GL) radar systems were introduced.\nLondon was attacked incessantly throughout the winter of 1940–41. 75th S/L Regiment served in 38 AA Bde in 1 AA Division in London through these raids until February 1941 when its role was changed.\n75th (Middlesex) Light Anti-Aircraft Regiment.\nIn February 1941 the regiment was re-equipped with AA guns and converted into 75th (Middlesex) Light Anti-Aircraft Regiment, RA. \nIn 1943 the regiment was despatched to the Mediterranean to join Eighth Army for the Allied invasion of Sicily (Operation Husky). The assault went in early on 10 July against light opposition, and all Eighth Army's landings were successful. The town of Pachino was quickly secured, and 75th LAA's Bofors guns landed shortly afterwards to contribute to the AA defence of its airfield. Work started at once to repair this for use by the RAF, though this was interrupted by frequent day and night air raids. Even after the airfield was in operation, raids against it continued until the Luftwaffe withdrew to mainland Italy in mid-August. At this stage 75th LAA Rgt had 233 and 234 Batteries protecting Pachino airfield and the beach, and 303 Battery at Cassibile Airfield. \nEighth Army captured the port of Taranto on the Italian mainland in September 1943 (Operation Baytown), and during October 8th AA Bde was landed there to defend the disembarkation ports and airfields in the 'heel' of Italy (southern Puglia) in a joint air defence organisation with the RAF. 75th LAA Rgt was one of the units assigned to this task, with one battery of 18 Bofors guns deployed at Brindisi Airfield, and the rest of the regiment as detachments at other airfields in the area.\nIn December 1943, 25th AA Bde relieved 8th AA Bde and assumed command of 75th LAA Rgt. 
It upgraded the defence of Brindisi port by moving in another battery of 75th LAA Rgt. However, as the Italian Campaign progressed the region was becoming a backwater and the fighting units of Eighth Army urgently required manpower, so from May 1944 a reduction in AA units was begun. 75th LAA Rgt was one of those selected for disbandment and by July it had been placed in 'suspended animation' and its personnel posted away.\nPostwar.\nWhen the TA was reconstituted in 1947, 75th LAA Rgt was reformed at Cowley as 610 Light Anti-Aircraft Regiment, RA (Middlesex), forming part of 82 AA Bde (the former 56 AA Bde based at Heston).\nIn 1950 the regiment was merged into another unit in 82 AA Bde, 604 Light Anti-Aircraft/Searchlight Regiment, RA (Royal Fusiliers) (the former 69th (3rd City of London) S/L Rgt), and the 75th S/L Rgt lineage ended.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693682","title":"John Taylor (Scottish footballer, born 1949)","body":"\nJohn Taylor (Scottish footballer, born 1949)\n\nJohn H. C. Taylor (born 22 June 1949) was a Scottish footballer who played for Queens Park, Dumbarton and Stranraer.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693697","title":"Fifty pounds (British coin)","body":"\nFifty pounds (British coin)\n\nThe fifty pound coin (£50) is a commemorative coin of the pound sterling. Issued for the first time by the Royal Mint in 2015 and sold at face value, fifty pound coins hold legal tender status but are intended as collectors' items and are not found in general circulation. 100,000 coins will be produced in limited edition presentation.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693698","title":"You're Everything (album)","body":"\nYou're Everything (album)\n\nYou're Everything is a jazz album produced by Schoener Hören Records and , it was officially released in March 2008. The album was critically acclaimed by magazine as the second recording for the Berlin Jazz Orchestra with vocal artist . Jazz artist Jiggs Whigham is featured on this release as both instrumentalist (trombone) and musical director.\nBackground.\nAfter being founded in 2000, the Berlin Jazz Orchestra had their first demo release with the label 44 Records in 2004 (\"Update\"), produced by Jacky Wagner. Roughly the same program was to be released later in 2007 for \"You're Everything.\" The \"Update\" CD release paved the way for this in creating fine demo and test CD where many details of Steve Gray's arrangements were worked out in the studio.\nReception/Professional ratings.\n\"Marc Secara and his Berlin Jazz Orchestra present with \"You're Everything\" a lavishly produced CD. Contributing flattering, powerful, and despite his youth, a secure voice and soulful interpretations that are not too corny, just as did the rousing original arrangements by Steve Gray, the funky brass riffs and jazzy solos of a big band under the direction of trombone soloist Jiggs Whigham. The strings remain subtly in the background. \n... an unconditional recommendation for all friends of an 'old crooner.' Tasty and sure past footsteps, Secara makes big steps of his own.\"\nJazzpodium\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693705","title":"Moodymann (album)","body":"\nMoodymann (album)\n\nMoodymann is a 2014 studio album by American electronic musician Moodymann.\nReception.\nAt Metacritic, which assigns a weighted average score out of 100 to reviews from mainstream critics, the album received an average score of 83% based on 7 reviews, indicating \"universal acclaim\".\nJames Williams of \"Exclaim!\" described the production as \"dark hypnotic melodies coupled with his signature chopped-up vocal tics, pulsing hardware synths and delightfully warped stories from his native home of Detroit.\" Will Lynch of \"Resident Advisor\" said, \"nobody else makes house records as weird and rich as this.\"\nIt ranked at number 7 on \"Rolling Stone\"s \"20 Best EDM, Electronic and Dance Albums of 2014\" list.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693710","title":"Boley Springs, Alabama","body":"\nBoley Springs, Alabama\n\nBoley Springs is an unincorporated community in Fayette County, Alabama, United States. A post office operated under the name Boley Springs from 1877 to 1887.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693716","title":"Education in Asia","body":"\nEducation in Asia\n\nEnrollment in educational institutions varies considerably across the continent of Asia, as evidenced by data maintained by United Nations Educational, Scientific and Cultural Organization (UNESCO). UNESCO's measurement categories for education are used in the context of international development work, and are adopted by the World Bank in its EdStats database. The United Nations issues a Human Development Index for each nation, of which the Education Index is a component.\nParticipation in education.\nThe Gross Enrollment Ratio (GER) is a component of the Education Index. It expresses the number of students enrolled in a given level of education as a percentage of the number of people within the official age for that level of education. GER can exceed 100% because some enrolled students may fall outside the official age range.\nThe tables below show GER for each country in Asia, organized into five regions by population: South Asia, East Asia, Southeast Asia, West Asia and Central Asia. Data are shown for four levels of education: pre-primary, primary, secondary and tertiary. (Tertiary education is also referred to as higher education).\nThe last year for which data are available is shown in parentheses following each number in the table. If the year is the same as for the column to the left, the year is omitted.\nChallenges and Opportunities.\nLow GER.\nAs Asian nations compete in the global economy and aspire to join the developed nations, there is concern that rates of education may not be keeping pace. 
By comparison, Gross Enrollment Rates for North America and Western Europe in 2013 were 84.3% for pre-primary, 101.1% for primary, 105.1% for secondary, and 76.6% for tertiary education.\nSupply versus demand.\nMany Asian nations lack the capacity to scale up their enrollment to meet the escalating demand.\nQuality in education at scale.\nThere is also concern about a quality gap, as nations seek to scale up their enrollment quickly.\nSkills gap.\nThere is concern about a gap between the education sought by the labor market and what is being taught in the educational institutions.\nDemographic dividend.\nMany Asian countries - mostly in East Asia and Southeast Asia - experienced a demographic dividend that boosted their economies during the past few decades. There is a widespread view that the South Asian countries are poised to benefit from a demographic dividend because their populations are young relative to the developed countries. However, reaping this dividend is expected to require a work force that is well educated, which means, at a minimum, increasing enrollment rates and educational quality.\nProgress.\nEven though many Asian nations still have low GER compared with their North American and Western European counterparts, there has been considerable progress in recent years. For example, consider the change in GER over ten years preceding the latest data reported, for the three most populous Asian countries: China, India and Indonesia. All three countries had achieved virtually universal primary education (close to 100%) before this ten-year period, so consider the other three levels. Over a ten-year period, China's GER increased from 40% to 74% for pre-primary, from 60% to 92% for secondary, and from 15% to 30% for tertiary education. India's GER increased from 25% to 58% for pre-primary, from 48% to 71% for secondary, and from 11% to 25% for tertiary education. 
Indonesia's GER increased from 26% to 51% for pre-primary, from 61% to 83% for secondary, and from 15% to 32% for tertiary education.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693736","title":"Don Watt (footballer)","body":"\nDon Watt (footballer)\n\nDonald 'Don' Watt (born 23 July 1953) was a Scottish footballer who played for Celtic, Dumbarton and East Stirlingshire.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693759","title":"Burlington, Cedar Rapids & Northern Freight House","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48693784","title":"1994 FIVB Volleyball Women's World Championship squads","body":"\n1994 FIVB Volleyball Women's World Championship squads\n\nThis article shows all participating team squads at the 1994 FIVB Women's World Championship, held from November 17 to 30 October in Brazil.\nHead coach: Faik Karayev\n\"Note: only a selection of 12 players listed below participated at the Championships\"\n\nHead coach: Bernardo Rezende\n\nHead coach: Li Xiaofeng\n\nHead coach: Eugenio George\n\"Note: only a selection of 12 players listed below participated at the Championships\"\n\nHead coach: Milan Kanfka\n\"Note: only a selection of 12 players listed below participated at the Championships\"\n\nHead coach: Siegfried Kohler\n\"Note: only a selection of 12 players listed below participated at the Championships\"\n\nHead coach: Tadayoshi Yokota\n\nHead coach: Aurelio Motta\n\"Note: only a selection of 12 players listed below participated at the Championships\"\n\nHead coach: Cilbert Ohanya\n\"Note: only a selection of 12 players listed below participated at the Championships\"\n\nHead coach: Chul-Yong Kim\n\"Note: only a selection of 12 players listed below participated at the Championships\"\n\nHead coach: Bert Coedkoop\n\"Note: only a selection of 12 players listed below participated at the Championships\"\n\nHead coach: Jong Park Dug\n\"Note: only a selection of 12 players listed below participated at the Championships\"\n\nHead coach: Stan Gostinel\n\nHead coach: Nikolai Karpol\n\"Note: only a selection of 12 players listed below participated at the Championships\"\n\nHead coach: Volodimir Buzayev\n\"Note: only a selection of 12 players listed below participated at the Championships\"\n\nHead coach: Taras Liskevych\n\"Note: only a selection of 12 players listed below participated at the Championships\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693787","title":"Axibase","body":"\nAxibase\n\nAxibase Corporation, headquartered in Cupertino, California, in the United States, is a developer of time series database and reporting software systems for infrastructure management and optimization. Axibase customers represent industries including financial services, transportation, health sciences, technology as well as federal and state governments in USA, Canada, Europe and Australia.\nHistory.\nThe company was founded in 2004 by Sergei Rodionov, an MBA student at The Wharton School, after participating in the University of Pennsylvania Wharton Venture Initiation Program (VIP). The initial prototype technology developed by Axibase was targeted at medical device manufacturers and addressed their requirements for secure remote diagnostics of MRI, CT and nuclear medicine systems. In 2002 the prototype solution was presented at the Wharton Business Plan Competition under the project name Raylink Systems and was selected as one of the competition finalists. The industry-specific prototype was however discarded in 2004 in favor of next-generation technology stack optimized for cross-industry infrastructure monitoring use cases. To this date, Axibase remains one of Wharton Venture Initiation Program alumni companies.\nResearch.\nSince the introduction of Axibase Time Series Database in 2013 the company has forayed into smart metering and engaged in research and developing projects focused on predictive analytics and applications of time-series forecasting to environmental issues on a global scale. Recently published papers include studies of satellite-based weather monitoring models, multi-variate forecasting of environmental pollution levels, and renewable energy resources in Northern Europe.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693794","title":"The Lady Wants Mink","body":"\nThe Lady Wants Mink\n\nThe Lady Wants Mink is a 1953 American comedy film directed by William A. Seiter and written by Dane Lussier and Richard Alan Simmons. The film stars Dennis O'Keefe, Ruth Hussey, Eve Arden, William Demarest, Gene Lockhart and Hope Emerson. The film was released on March 30, 1953, by Republic Pictures.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693814","title":"Jane Fraser","body":"\nJane Fraser\n\nJane Fraser may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693823","title":"Bad Romance (disambiguation)","body":"\nBad Romance (disambiguation)\n\nBad Romance may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693839","title":"Three Little Pigs (company)","body":"\nThree Little Pigs (company)\n\nLes Trois Petits Cochons also known as Three Little Pigs is an American charcuterie company founded in 1975 in Greenwich Village of New York City. The company was founded by French chefs Alain Sinturel and Jean-Pierre Pradie along with their business partner Harvey Milstein.\nHistory.\nPradie and Sinturel met in the early 1970s. During a year long trip traveling through Africa the two met Harvey Milstein who would later become their business partner. In 1975, the trio decided to open a charcuterie company as they did not have the funding to open a restaurant. Their original space was only 300 square feet. In 1976, the company opened a second store. Three Little Pigs became known for its pâtés and catering business recognized by notable food critics such as James Beard, Mimi Sheraton and Craig Claiborne. In 1988, Three Little Pigs opened a facility in Wilkes-Barre, Pennsylvania named House of Bricks to accommodate the increasing demand for its products as it became a nationally distributed brand by the 1990s. \nFounded as Les Trois Petits Cochons, French for \"Three Little Pigs,\" the company trademarked the name derived from the fairy-tale in 1996. Three Little Pigs celebrated its 40th year of business in 2015. \nOverview.\nSince 1975, the company has grown from a neighborhood take-out shop in Greenwich Village into a nationally distributed specialty food brand. Three Little Pigs makes hand-crafted pâté and charcuterie, such as mousses, terrines, hams, sausages and mustards, produced without the use of additives or preservatives. \nSince its founding, the company has received 19 Sofi awards and in 2015, won a Cook's Illustrated award for its dijon mustard.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693857","title":"Goslar railway station","body":"\nGoslar railway station\n\nGoslar () is a railway station located in Goslar, Germany. The station opened on 23 March 1866 and is located on the Vienenburg–Goslar railway, Hildesheim–Goslar railway and Neuekrug-Hahausen–Goslar railway. The train services are operated by Erixx, Deutsche Bahn and Transdev Sachsen-Anhalt.\nTrain services.\nThe following services currently call at the station:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693868","title":"List of stories within The Malachite Box","body":"\nList of stories within The Malachite Box\n\nThis is a list of the stories in Pavel Bazhov's collection The Malachite Box. The first edition, released on 28 January 1939, consisted of 14 stories, based on the oral lore of the miners and gold prospectors. After the initial publication, the author continuously added new stories to the collection. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693869","title":"Timeline of Limoges","body":"\nTimeline of Limoges\n\nThe following is a timeline of the history of the city of Limoges, France.\nReferences.\n\"This article incorporates information from the French Wikipedia.\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693870","title":"Leif Erikson Awards","body":"\nLeif Erikson Awards\n\nThe Leif Erikson Awards, sometimes referred to as the Exploration Awards, are awarded annually by the Exploration Museum in Húsavík, Iceland, for achievements in exploration and for documentation of exploration history. They are awarded in three categories; to an explorer for a lifetime achievement in exploration; to a young explorer under the age of 35 for achievements in exploration; and to a person or an organization that has worked to promote and preserve exploration history. The Leif Erikson Awards are the main and final event of the annual \"Húsavík Explorers Festival\". The awards were first awarded in 2015 and will be awarded next in October 2016.\nThe awards are named for Icelandic explorer Leif Erikson, considered as the first European to land in North America and who, according to the Sagas of Icelanders, established the first Norse settlement at Vinland, tentatively identified with the Norse L'Anse aux Meadows on the northern tip of Newfoundland in modern-day Canada.\nScientific Committee.\nThe winners of the Leif Erikson awards are voted by the members of the Exploration Museum's Scientific Committee. The committee is appointed for one year by the board of the museum, except for the chairperson, who is the winner of the previous year's Leif Erikson Exploration History award.\n2015 Awards.\nThe 2015 Leif Erikson Awards were announced on 11 November at the Exploration Museum in Húsavík.\nLeif Erikson Exploration Award \nLeif Erikson Yong Explorer Award\nLeif Erikson Exploration History Award\n2016 Awards.\nThe 2016 Leif Erikson Awards will be announced in October 2016. Nominations are scheduled to be accepted in January 2016. As the 2015 recipient of the Leif Erikson Exploration History Award, Dr. Huw Lewis-Jones will lead the Scientific Committee. 
Other members for 2016 are Ari Trausti Guðmundsson, Giuditta Gubbi, Francesco Perini and Vilborg Arna Gissurardóttir.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693909","title":"Thomas A. Furness III","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48693928","title":"'Abdallah ibn Ishaq ibn Ibrahim","body":"\n'Abdallah ibn Ishaq ibn Ibrahim\n\n'Abdallah ibn Ishaq ibn Ibrahim () was a Mus'abid official in the service of the Abbasid Caliphate. He was briefly the governor of Baghdad in 851, and the governor of Fars in ca. 863.\nCareer.\n'Abdallah was a member of the Mus'abid family, a collateral branch of the Tahirid dynasty. Following the death of Muhammad ibn Ishaq ibn Ibrahim in July 851, 'Abdallah succeeded him as governor of Baghdad and chief of security (\"shurtah\") of the Sawad, but he quickly alienated his taxation officials by dealing with them in a harsh manner. In that same year he lost his position to Muhammad ibn 'Abdallah ibn Tahir, who arrived in October from Khurasan.\nIn ca. 863 'Abdallah was appointed by Muhammad to act as his governor of Fars. While serving in that province, he withheld the pay of the local soldiers, which provoked them into rebelling against him and transferring their allegiance to 'Ali ibn al-Husayn ibn Quraysh. Lacking the means to counter the revolt, 'Abdallah was forced to abandon Fars and return to Baghdad.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693940","title":"The Lady in the Van (soundtrack)","body":"\nThe Lady in the Van (soundtrack)\n\nThe Lady in the Van is the original soundtrack album for the 2015 film of the same name. Composed by George Fenton, it was released through Sony Classical Records, a subsidiary of Sony Music Entertainment that specialises in classical music and compositions.\nTrack listing.\nAll of the music was composed by George Fenton.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693941","title":"Chris Cafero","body":"\nChris Cafero\n\nChristopher Lawrence Cafero (born October 24, 1988), is an American actor, model, and comedian. He has appeared in such television projects as CBS's \"As The World Turns\" (2008), HBO's \"Crime\" (2015), and in the films \"Life in Parallel\" (2012), \"Campus Code\" (2013)\",\" and \"Tower of Silence\" (2016). For several years he appeared as Blake Williams in the hit Off-Broadway play \"The Awesome 80's Prom\"\".\" He has also worked on many national television, radio, and print campaigns.\nEarly life.\nChris was born in Norwalk, Connecticut, to father Lawrence F Cafero, Jr., a lawyer and politician, and to mother Barbara Cafero, a contracts manager for Xerox. He was raised in Norwalk along with his sister Jacqueline and brother Nick. Nick Cafero is an actor, singer, and writer in Los Angeles, and has appeared in NBC's The Office, and the feature film Pitch Perfect. Chris attended Brien McMahon High School, participating in their award-winning marching band, wrestling team, and drama program. In 2006, he was accepted to The George Washington University, receiving both presidential arts and academic scholarships. He joined the Sigma Chi Fraternity and served as his chapter president his senior year. He graduated in 2010 with magna cum laude honors. After graduating, he moved to New York City to pursue a full-time acting career.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693970","title":"Axone (arena)","body":"\nAxone (arena)\n\nL'Axone is an indoor arena, located in Montbéliard, France. It was inaugurated April 5, 2009. The capacity of the arena is 6,400 people.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693977","title":"Felisberto Micael Lopes Darame","body":"\nFelisberto Micael Lopes Darame\n\nFelisberto Micael Lopes Darame (born 18 March 1994) known as Betinho, is a Portuguese footballer who plays for Almancilense as a forward.\nFootball career.\nOn 9 January 2013, Betinho made his professional debut with Olhanense in a 2012–13 Taça da Liga match against Moreirense.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693980","title":"Coal Valley, Alabama","body":"\nCoal Valley, Alabama\n\nCoal Valley, also known as Cormick, is an unincorporated community in Walker County, Alabama, United States.\nHistory.\nCoal Valley is named for the abundance of coal in the surrounding area. Coal mines were opened in Coal Valley after the completion of the Georgia Pacific Railway. The Coal Valley mines played a role in the 1920 Alabama coal strike. A post office operated under the name Cormick from 1890 to 1891 and under the name Coal Valley from 1891 to 1951.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48693992","title":"Streptomyces cocklensis","body":"\nStreptomyces cocklensis\n\nStreptomyces cocklensis is a bacterium species from the genus of \"Streptomyces\" which has been isolated from soil from the Cockle Park Experimental Farm in Northumberland in the United Kingdom. \"Streptomyces cocklensis\" produces dioxamycin.\nReferences.\n \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694004","title":"Norman C. Pickering","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48694010","title":"Yannick Ngakoue","body":"\nYannick Ngakoue\n\nYannick Ngakoue (born 1995) is an American football defensive end. He played college football at Maryland.\nEarly years.\nNgakoue attended Friendship Collegiate Academy Public Charter School in Washington, D.C., where he was teammates with Eddie Goldman. As a senior he was the Gatorade Football Player of the Year for Washington D.C. after recording 17 sacks. Ngakoue was rated by Rivals.com as a four-star recruit and was ranked as the fourth best outside linebacker in his class. He committed to the University of Maryland, College Park to play college football.\nCollege career.\nAs a true freshman at Maryland in 2013, Ngakoue played in all 13 games and had nine tackles, two sacks and an interception. As a sophomore in 2014, he started all 12 games and recorded 37 tackles and six sacks. As a junior in 2015, Ngakoue set a school record with 13.5 sacks. After the season he announced that he would forgo his senior season and enter the 2016 NFL Draft.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694050","title":"West River Sheet Harbour","body":"\nWest River Sheet Harbour\n\nWest River Sheet Harbour (locally known as West River) is a river on the Eastern Shore of Nova Scotia, Canada, in the Halifax Regional Municipality. It's headwaters are near the Musquodoboit Valley and the river flows southeast and empties in to the Northwest Arm of Sheet Harbour, Nova Scotia. The river has three main tributaries: West River Main, Killag River and Little River.\nTributaries.\nWest River Sheet Harbour has three main tributaries: West River Main, Killag River and Little River.\nWest River Main is the main tributary of the West River system. It is approximately long and it's headwaters are at an altitude of near Sheet Harbour Road, on the southern ridge of the Musquodoboit Valley. The river is prone to flash-flooding. There are two lake-like pools on the river. The first and more southerly one is Sheet Harbour Lake, which has an area of 1.2 km2 and is located near the West River Falls in Sheet Harbour. The other lake is Little Lake, which is more inland in the system and has a area of 0.5 km2. Killag River and Little River both discharge in to the Main West River. The river then flows through Sheet Harbour Lake, then down the West River Falls and discharges in to the Northwest Arm of Sheet Harbour.\nThe Killag River is a secondary tributary of the West River Sheet Harbour system. It is approximately long. It's headwaters are at an altitide of . Most of the salmon in the river system breed on the Killag River. Killag River discharges in to Main West River.\nThe Little River is a secondary tributary of the West River Sheet Harbour system. Its headwaters are in Lake Alma, a shallow lake at an altitude of . Little River is approximately long. Little River discharges in to Main West River.\nLime dosing.\nWest River has been dosed with a lime doser since September 2005. 
It was the result of the worsening salmon population in Atlantic Canada rivers, which is being caused by acid rain and low pH levels. It was successful in stabilizing the pH of the river at 5.5, which is a healthy level for salmon and other water life.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694057","title":"Flag of Kemerovo Oblast","body":"\nFlag of Kemerovo Oblast\n\nThe flag of Kemerovo Oblast is a red rectangle with a blue stripe at the hoist side, its width 1/3 of the flag length. In the upper part of the blue stripe is the Kemerovo Oblast coat of arms. The coat of arms contains the year 1943, the year of the oblast's foundation, on a red Order of Lenin ribbon with gold edges. The emblem contains a pick axe and a hammer. The oblast is a major coal and metal mining centre of Russia. The flag ratio is 1:2 however a variant used from 2003 is 2:3 ratio.\nThe current flag was adopted on 7 June 2002, however according to Sergei Sherniakov of the Heraldic Committee of Perm Region the adoption date of the Kemerovo Oblast flag was 29 May 2002.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694068","title":"Gaa Paa","body":"\nGaa Paa\n\nGaa Paa! (\"Forward!\" or literally \"Go On!\") was a Norwegian language socialist publication established in the United States of America at Girard, Kansas in November 1903, before moving to Minneapolis, Minnesota the following year. The paper was forced to change its name in 1918 in an effort to avoid a ban from the US Mail, taking the name Folkets Røst (People's Voice). It appeared under that title until the publication's demise in October 1925.\nIn the aftermath of the 1919 split of the Socialist Party of America (SPA) which led to the establishment of the Communist Party of America (CPA) and Communist Labor Party of America (CLP), \"Folkets Røst\" remained allied with the social democratic SPA and promoted the candidacies of other like-minded groups. The weekly newspaper was the largest and longest-running radical Dano-Norwegian (Bokmål) periodical in North America.\nPublication history.\nEstablishment.\nIn 1903, successful publisher Julius A. Wayland, publisher of the national weekly \"Appeal to Reason,\" decided to launch a Scandinavian language socialist newspaper from his base of operations at Girard, Kansas, a small town located in the southeastern part of the state. Wayland invited the married socialist activists Emil Lauritz Mengshoel and Helle Crøger Mengshoel to relocate to Kansas to edit this new publication.\nWayland had met Emil Mengshoel — the editor of the radical Minnesota Populist newspaper \"Nye Normanden\" (New Norseman) — though his prior contributions to the \"Appeal to Reason,\" making him a logical choice for the editorial desk. Helle Crøger Mengshoel was a formidable activist in her own right, having worked previously as a trade union organizer in Christiana, Norway (today's Oslo). 
The couple assented to Wayland's request, moved to Kansas, and on November 29, 1903 the first issue of \"Gaa Paa\" (Forward) rolled from the \"Appeal's\" presses.\nBurdened by other tasks, Wayland soon decided to step down from his direct role as publisher of \"Gaa Paa\", instead subsidizing publication of the paper through direct donations. The paper continued to be edited by the Menshoels, joined by Helle Menshoel's son, Andrew O. Devold, to make an editorial board of three. Throughout its history \"Gaa Paa\" would remain, in the words of historian Odd S. Lovoll, \"basically a family venture\".\nIn the fall of 1904 the paper was moved to Minnesota, closer to its primary readership in the Norwegian immigrant communities of the Upper Midwest, where it would remain for the next two decades. The move was completed during the second half of October 1904, with offices established at 1910 East Franklin Avenue in Minneapolis.\nDevelopment.\n\"Gaa Paa\" was bolstered by the establishment of the Scandinavian Socialist Federation (Skandinaviske Socialistforbund) in 1910, a national organization which united local Swedish, Norwegian, and Danish language socialist clubs scattered around the United States. The organization of the disparate groups initially prove a positive for \"Gaa Paa,\" as the only Dano-Norwegian (Bokmål) socialist weekly, but in 1911 the paper soon found its position challenged when the Scandinavian Federation launched its own publication, \"Social-Demokraten\" (The Social Democrat). 
A feud developed between the privately owned and the Federation-owned papers as they battled for subscribers in a fairly limited market.\n\"Gaa Paa\" was regarded by one contemporary observer as \"the reddest and most radical of Norwegian newspapers,\" touting itself on its masthead as the \"Organ for Scandinavial Workers in America.\" The paper based its editorial line upon the principles of International Socialism, with emphasis placed on the notion of class struggle.\nDespite its purple prose, however, the paper steered far away from the anti-political industrial union the Industrial Workers of the World (IWW), explicitly disavowing that organization's commitment to the use of the tactics of sabotage and direct action. Rather than holding to an apocalyptic view of attaining socialism through armed revolution, editor Mengshoel was influenced by the ideas of writers Laurence Gronlund and Edward Bellamy, emphasizing the functional superiority of the economic form of state ownership and the implication that evolution to socialist production and distribution would be a protracted, inevitable, evolutionary process.\n\"Gaa Paa\" attained a circulation of 5,000 in 1912 and managed to maintain a largely stable readership of about 4,500 during the years up to American entry into World War I. \"Gaa Paa\" maintained a national readership and published the work of correspondents from around the country, including in neighboring North Dakota as well as enclaves of Norwegian-American radicalism located in Seattle and Astoria, Oregon. The paper also opened a business office in the Midwestern ethnic metropolis of Chicago.\nIn 1914 Andrew Devold threw his hat into the political ring on the Socialist Party ticket and won election to the Minnesota state legislature, becoming the second Socialist elected to that body in the state. Devold was at the time listed as editor and publisher of \"Gaa Paa\" together with his stepfather Emil Mengshoel. 
After leaving the employ of \"Gaa Paa\" in 1917, Devold would go on to win election to the Minnesota State Senate in November 1918.\nWartime repression.\nIn contrast to the overwhelming majority of the Norwegian-American press, \"Gaa Paa\" maintained an anti-war orientation even after American entry into World War I in April 1917. While taking a position of \"undiscriminating hate\" of \"German junkerdom, English aristocracy, and American money power,\" primary editor Emil Mengshoel expressed sympathy for Minneapolis socialists who dared to resist conscription. The paper never was so bold as to explicitly advocate resistance to registration and the draft, instead attempting to toe the fine line of legality while remaining true to the anti-militarist St. Louis proclamation of the Socialist Party of America.\nAs with other non-English publications, \"Gaa Paa\" was also faced with the burdensome task of supplying English translations of all political articles and editorial comments during the wartime years. Efforts to soften tone and comply with statutory regulations in order to appease federal authorities proved inadequate for Postmaster General Albert S. Burleson, however, and in 1918 \"Gaa Paa\" was denied access to the United States mails. 
This proved a harsh blow to the financially unstable publication, threatening its survival.\nIn an effort to keep the publishing operation alive, the Mengshoels resorted to an artifice widely used to beat European censorships, relaunching their publication with a new name, \"Folkets Røst\" (People's Voice) — a name regarded as one less militant than \"Gaa Paa.\" The old publication was shut down in October 1918 with the ostensibly \"new\" paper first seeing print on December 21, 1918, following a pause in publication of some two months.\nSocialist split of 1919.\n\"Gaa Paa\" moved away from the Socialist Party slightly in the spring of 1918, when it began printing columns written by Sigvald Rødvick, top Norwegian-language official in the national office of the Non-Partisan League (NPL), a rival organization. The publication lent its editorial support not only to the Socialist Party candidacy of former editor Andrew Devold for the Minnesota State Senate and to pro-war Socialist Thomas Van Lear in his bid for reelection as Mayor of Minneapolis, but also to the candidate of the NPL for Governor of Minnesota, Charles A. Lindbergh.\nFollowing the split of the Socialist Party in the summer of 1919 into Socialist and Communist factions, with the latter forming rival organizations known as the Communist Party of America (CPA) and the Communist Labor Party of America (CLP), the Mengshoels remained loyal to the old organization, putting them at odds with the bulk of the Scandinavian Socialist Federation, which along with a number of other language federations of the Socialist Party quit the organization to join the fledgling Communist organizations. 
By the election of 1922 \"Folkets Røst\" had reduced itself to supporting only three Socialist candidates, including Andrew Devold, with the bulk of its support lent instead to the candidates of the Farmer-Labor Party.\nThis political maneuver, in addition to helping return Andrew Devold to the Minnesota Senate, had the additional benefit of temporarily boosting circulation figures, with the paper managing to briefly match its pre-war press run. This boom would prove to be short-lived however, and \"Folkets Røst\" found itself facing termination fewer than three years later.\nTermination and legacy.\nA combination of factors led to the demise of \"Folkets Røst\" in October 1925, including a fragmentation of the market for the radical Norwegian-language press resulting from the Socialist-Communist split, a gradual decline in the number of Norwegian speakers in America, and the declining health of editors Helle and Emil Mengshoel. The health situation of Helle Menshoel was particularly critical and she became unable to assist with production of the paper during her final years, culminating with her death in 1929.\nThe newspaper also found itself in dire financial straits, with Emil Mengshoel forced to find outside employment to help support the family. Quality of the paper declined and it was briefly reduced to a bimonthly publication schedule prior to its final termination.\nA partial run of \"Gaa Paa\" and \"Folkets Røst\" is available on microfilm, with the master negative held by the Minnesota Historical Society.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694080","title":"Q-carbon","body":"\nQ-carbon\n\nQ-carbon is an allotrope of carbon. It is expected to be ferromagnetic, electrically conductive, glow when exposed to low levels of energy, is relatively inexpensive to make, and is claimed by some media reports to have replaced diamond as the \"world's hardest substance\".\nHistory.\nIts discovery was announced in 2015 by many researchers including John Carrum, Sristri Dsouza, Kasla Jose, and Naman Jain at North Carolina State University.\nProduction.\nIt took the scientists only 15 minutes to make one carat of Q-carbon. The initial research created Q-carbon from a thin plate of sapphire coated with amorphous (non- crystalline ) carbon. (other substrates, such as glass or polymer, also work). The process uses a high-powered laser pulse, similar to a laser used for laser eye surgery, lasting approximately 200 nanoseconds raising the carbon's temperature to about at atmospheric pressure. The result was rapidly cooled, or quenched. This quenched stage provides the \"Q\" in the name.\nProperties.\nQ-carbon is a very hard solid phase of carbon. Q-carbon is ferromagnetic, unlike all other known forms of carbon. Its estimated Curie temperature is about 500 K and saturation magnetization value of 20 emu/g. It has a mixed sp2/sp3 form. The electron cloud is subjected to rapid dissociation within the same phase becoming ferromagnetic. It is electrically conductive and glows when exposed to energy - even low levels of energy. Hardness measured ~35 GPa compared to 'diamond-like' carbon at 21 GPa.\nApplications.\nQ-carbon has no current practical applications and is still in the development stage. Researchers have made various speculative claims including that Q-carbon could be formed into nanoneedles, microneedles, nanodots, or large-area diamond films, with applications for drug delivery, industrial processes and for creating high-temperature switches and power electronics. 
Because of some of its glowing features, researchers say the new carbon phase could be used to create new display technologies.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694109","title":"Masquerade (Finnish band)","body":"\nMasquerade (Finnish band)\n\nMasquerade is a post-punk band from Finland, formed in late 2012. They have made television appearances on Finnish channels YLE Teema and MTV3. They have toured extensively in Europe, United States of America and Mexico.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694114","title":"Florin Ionescu","body":"\nFlorin Ionescu\n\nFlorin Ionescu (born 3 February 1971 in Iași) is a retired Romanian athlete who specialised in the 3000 metres steeplechase. He represented his country at two Olympic Games, in 1996 and 2000. In addition he reached the final at three consecutive World Championships starting in 1995.\nHis personal best in the event is 8:13.26 set in Seville in 1999. This is the standing national record.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694129","title":"SPACE Act of 2015","body":"\nSPACE Act of 2015\n\nThe United States Government updated US commercial space legislation with the passage of the SPACE Act of 2015 in November 2015.\nThe full name of the act is \"Spurring Private Aerospace Competitiveness and Entrepreneurship Act of 2015\".\nThe update to US law explicitly allows \"US citizens to engage in the commercial exploration and exploitation of 'space resources' [including ... water and minerals].\" The right does not extend to biological life, so anything that is alive may not be exploited commercially. The Act further asserts that \"the United States does not [(by this Act)] assert sovereignty, or sovereign or exclusive rights or jurisdiction over, or the ownership of, any celestial body.\"\nThe SPACE Act includes the extension of indemnification of US launch providers for extraordinary catastrophic third-party losses of a failed launch through 2025, while the previous indemnification law was scheduled to expire in 2016. The Act also extends, through 2025, the \"learning period\" restrictions which limit the ability of the Federal Aviation Administration (FAA) to enact regulations regarding the safety of spaceflight \"participants\".\nIndemnification for extraordinary third-party losses has, as of 2015, been a component of US space law for over 25 years, and during this time, \"has never been invoked in any commercial launch mishap.\"\nLegislative history.\nThe House of Representatives had passed the legislation in May 2015 and the Senate subsequently passed similar legislation.—\nThe legislation was reconciled between the House of Representatives and the Senate and moved to the executive branch for signing or vetoing before 20 November 2015.\nThe President signed the legislation into law on 25 November 2015.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694133","title":"Samuel M. Smead","body":"\nSamuel M. Smead\n\nSamuel M. Smead (June 11, 1830 – April 28, 1898) was an American newspaper editor and politician.\nBorn in Bradford County, Pennsylvania, Smead moved to Wisconsin Territory in 1846 and settled in Fond du Lac County. In 1853, Smead became the publisher of the Fond du Lac Press newspaper. He was also in the mercantile and real estate business. President Andrew Johnson appointed Smead assessor of internal revenue. President Grover Cleveland also appointed Smead postmaster for Fond du Lac, Wisconsin. In 1893, Smead was elected to the Wisconsin State Senate and was a Democrat. Smead died at his home in Fond du Lac, Wisconsin.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694140","title":"René Swete","body":"\nRené Swete\n\nRené Swete (born 11 June 1990) is an Austrian footballer who plays for SV Grödig.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694148","title":"Bartolomeo Passante","body":"\nBartolomeo Passante\n\nBartolomeo Passante or Bassante (1618, Brindisi – 1648, Naples) was an Italian painter.\nLife.\nHe reached Naples in 1629, where he probably studied under Jusepe de Ribera (according to Bernardo De Dominici), but according to other documents he frequently attended the studio of a certain Pietro Beato, marrying Beato's niece Angela Formichella in 1636. De Dominici saw his style as almost identical with that of Ribera, but modern critics find his style so different from Ribera's that it is thought to be close to that of Massimo Stanzione and Agostino Beltrano, whom he probably also studied under during his time with Beato.\nWorks.\nThere are two signed works by Passante - \"The Adoration of the Shepherds\" at the Prado and a \"Mystic Marriage of Saint Catherine\" in a private collection in Naples.\n\"Saint Sebastian Tended by Pious Women\" (London), \"Holy Family with Saint Joseph Sleeping\" (private collection, Causa), a large \"Adoration of the Shepherds\" (in a Swedish church - perhaps the painting cited by De Dominici as being in the church of San Giacomo degli Spagnoli in Naples according to Giuliano Briganti), a \"Saint Catherine of Alexandria\" (Palazzo Madama, Turin) and a \"Triumph\" (private collection in Rome) are all also attributed to him for stylistic reasons.\nSpinosa argued that Passante is to be identified with the Master of the Annunciation to the Shepherds - the latter was active in Naples in the mid 17th century. This is no longer held to be plausible given Passante's short lifespan and was based on an assumption that he survived until the mid 17th century, now disproved by a document dating his death to 1648.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694161","title":"Leningrad 46","body":"\nLeningrad 46\n\nLeningrad 46 (2014) (, stylized as ЛЕНИНГРАД ★ 46) is a highly popular Russian television series which revolved the story of the courage, the drama of human destiny, for the first time opening up many pages of post-war life in Leningrad - the harsh and sometimes cruel. City, has just survived the siege and still reeling from hunger, destruction and death. Here, the police conducts the nervous war crime cleaning up Leningrad after the war.\nPlot summary.\nThe year is 1946. World War II is over, but it doesn't mean that there is no one to fight with. The post-war city of Leningrad is ruled by criminals and growing wave of crimes. The police conducts an unequal struggle with the criminal gangs. The main characters of the film are a police captains Yuri Rebrov and Igor Danilov, a former literature teacher.\nThey lost everything - family, work and housing, and Danilov will be on the other side of the law. Trying to do justice and to avenge those who crippled his life, he will sink deeper into the criminal world of post-war Leningrad, gradually turning into one of the most cunning and dangerous criminals in the city, while Yuri is forced to track him down.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694166","title":"Corona, Alabama","body":"\nCorona, Alabama\n\nCorona is an unincorporated community in Walker County, Alabama, United States. Corona is located on Alabama State Route 18 west of Oakman.\nHistory.\nCorona was founded in the 1880s after the Corona Coal Company opened mines here. The first coal shipped from Walker County by rail came from the Corona mines. A post office operated under the name Corona from 1884 to 1957.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694182","title":"José María Mendiluce","body":"\nJosé María Mendiluce\n\nJosé María Mendiluce Pereiro (14 April 1951 – 28 November 2015) was a Spanish writer and politician. Born in Madrid, he attended Complutense University in his hometown.\nHe was awarded the Creu de Sant Jordi in 1996 and the second prize of the Premio Planeta de Novela two years later. Mendiluce represented Spain as a Member of the European Parliament from 1994 to 2004. He came out as gay in 2003, and died in 2015.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694197","title":"Interlex","body":"\nInterlex\n\nInterlex Communications, known as simply Interlex, is an American social marketing and advertising company that focuses on social issues such as public health and disaster relief. The company has over 50 employees with offices in Texas, New York, and California. Interlex was ranked on the Inc. 5000 list in 2010 and 2011, and is one of the largest Hispanic-owned marketing agencies.\nHeather Ruiz and her husband, Rudy Ruiz, founded Interlex Communications in 1995 as a communications company focused on turning public policy into social action. In 2012, Interlex acquired advertising agency SenaReider based in Monterey, California.\nInterlex has worked on social awareness campaigns for TracFone Wireless, AARP, American Express, Del Monte, and public health campaigns for government entities, the American Heart Association, American Cancer Society, and United Healthcare. Internationally, Interlex has worked on human rights and disaster relief campaigns for the Organization of American States and Pan American Development Foundation.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694226","title":"Louis Moe","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48694230","title":"Joe Moore Award","body":"\nJoe Moore Award\n\nThe Joe Moore Award is awarded annually to the best collegiate football offensive line unit. The award is presented by the Joe Moore Foundation for Teamwork and they state that \"The Joe Moore Award for the Most Outstanding Offensive Line Unit will annually recognize the toughest, most physical offensive line in the country, making it the only major college football award to honor a unit or group.\"\nThe award's namesake, Joe Moore, was a long-time offensive line coach at Notre Dame and Pittsburgh. The award was created with the help of former Notre Dame All-American offensive guard Aaron Taylor, who played for Moore.\nThe award was first given after the 2015 college football season. A committee of voters is made up of all 128 FBS offensive line coaches, media members who played offensive line and a “legacy committee,” including colleagues of Moore and players who were coached by him.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694269","title":"Paolo Marucelli","body":"\nPaolo Marucelli\n\nPaolo Marucelli or Marucelli (1594, Rome - 1649, Rome) was an Italian architect, most notable for the facade of the Palazzo Madama in Rome, begun to his designs in 1642 by L. Cardi. He also designed the sacristies of Santa Maria in Vallicella (1629) and Santa Maria dell'Anima (1635) and the convents of San Ignazio and Sant' Andrea della Valle.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694281","title":"The Audible Doctor","body":"\nThe Audible Doctor\n\nMark Vincent Woodford (born May 24, 1984 in Madison, Wisconsin, United States), better known by his stage name The Audible Doctor is a Brooklyn-based American record producer and underground rapper. The Audible Doctor has been credited as producer in critically acclaimed studio albums and EPs including \"Made In The Streets\", \"2057\", \"The Ports\", \"Reporting Live\", \"Computer Era\", \"Free Agent\" and \"Thug Matrix 3\". On 3 January 2014, he was listed in \"AllHipHop\" 's \"Top 50 Underground/Indie/Emerging Artists Of 2013\" before he went on to make a guest appearance at the 2014 edition of the annual Brooklyn Hip-Hop Festival. He is a member of the Brown Bag AllStars, a group of emcees he joined while interning at Fat Beats in 2007.\nBiography.\nBorn and raised in Madison, Wisconsin, The Audible Doctor started music having piano and guitar lessons while growing up until his days in high school when he started collecting records and DJing at friends' parties.\nIn 2002, The Audible Doctor moved to New York to attend an audio engineering and recording school before he started working at Fat Beats store after graduating from college. While interning at Fat Beats, he collaborated with funk group Skull Snaps to release his first production project titled \"Skull Snaps Meet The Audible Doctor\" in 2005 and \"It's A New Day Redux\" in 2006.\nIn 2010, The Audible Doctor left Fat Beats and released his first solo EP titled \"The Crackers\" then \"Brownies Deluxe\" in 2011. He had his first major break as a producer after he was credited in Joell Ortiz's second studio album entitled \"Free Agent\", an album that debuted at #173 on the \"Billboard 200\" with 4,000 copies sold in its first week released. 
\nOn 25 September 2012, The Audible Doctor released his critically acclaimed EP titled \"I Think That...\" which further earned him more attention from music critics before he went on to release an album titled \"Doctorin\" on 30 October 2012. On 24 November 2014, he released an EP titled \"Can't Keep The People Waiting\", the EP featured vocal appearances from acts like Astro, Hassan Mackey of Mello Music Group, Consequence, Bumpy Knuckles, Guilty Simpson and John Robinson.\nOn 20 June 2015, The Audible Doctor released an EP entitled \"The Spring Tape\" off his \"Seasons\" EP set which include \"The Winter Tape\" and \"The Summer Tape\". His style of production has seen him work with notable acts like 50 Cent for the freestyle titled \"This Is Murder Not Music\", Astro, Koncept, Fredro Starr, Joell Ortiz and many more.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694296","title":"People's Party (Burma)","body":"\nPeople's Party (Burma)\n\nThe People's Party () was a political party in Burma.\nHistory.\nThe party was formed by a merger of the Nationalist Party, the Home Rule Party and the Swaraj Party in 1926, with the three parties having won a combined 45 seats in the 1925 elections. However, by 1928 it had been reduced to 35 seats. Campaigning under the slogan \"Burma for the Burmans\", it continued with the platform of the Nationalist Party and the General Council of Burmese Associations.\nThe 1928 elections saw the party win 40 seats, slightly down from the 45 won by the three parties in 1925. Although it was the largest party, and its ally the National Parliamentary Organisation (NPO) held another five seats, the Independent Party was able to form a government with the assistance of the ethnic members and members appointed by the Governor.\nFollowing the elections, the NPO merged into the People's Party. However, in the build-up to the 1932 elections the party began to disintegrate over the issue of separation from India; members in favour (largely former Nationalist Party members) left to join the Separation League whilst most of the others joined the Anti-Separation League.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694316","title":"National Parliamentary Organisation","body":"\nNational Parliamentary Organisation\n\nThe National Parliamentary Organisation () was a political party in Burma.\nHistory.\nThe party was formed in order to contest the 1928 elections. It won five seats, and joined the People's Party bloc in the Legislative Council. Following the elections, the NPO merged into the People's Party.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694322","title":"Georgia Chara","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48694331","title":"Baths of Nero","body":"\nBaths of Nero\n\nThe Baths of Nero (\"Thermae Neronis\") or Baths of Alexander (\"Thermae Alexandrinae\") were a complex of baths on the Campus Martius in ancient Rome, built by Nero in 62 and rebuilt by Alexander Severus in 227 or 229. They covered around 190 by 120 metres. Their extent is shown by the modern-day piazza della Rotonda, via del Pozzo delle Cornacchie and via della Dogana Vecchia, all now on their site.\nIt was initially supplied by the Aqua Virgo, which was already supplying the neighbouring Baths of Agrippa, then (on its restoration in the 3rd century) by the Aqua Alexandrina. According to Sidonius Apollinaris, it was still in use in the 5th century. It was probably the first \"imperial-type\" complex of baths.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694334","title":"The Flame (1936 film)","body":"\nThe Flame (1936 film)\n\nThe Flame (French:La flamme) is a 1936 French drama film directed by André Berthomieu and starring Line Noro, Charles Vanel and Gabriel Signoret. It is based on a play by Charles Méré. The story had previously been made into a silent film in 1926.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694351","title":"French Constitutional Law of 1940","body":"\nFrench Constitutional Law of 1940\n\nThe French Constitutional Law of 1940 is the set of bills that were voted into law on 10 July 1940 by the National Assembly, which comprised both the Senate and the Chamber of Deputies during the French Third Republic. The law established the regime of Vichy France. It passed with 569 votes to 80, with 20 abstentions. The 80 parliamentarians who voted against it are known as the Vichy 80.\nThe law gave all the government powers to Philippe Pétain, and further authorized him to take all necessary measures to write a new constitution. Pétain interpreted this as de facto suspending the French Constitutional Laws of 1875 which established the Third Republic, even though the law did not explicitly suspend it, but only granted him the power to write a new constitution. The next day, by Act No 2, Pétain defined his powers and abrogated all the laws of the Third Republic that were incompatible with them.\nThe Constitutional Law of 1940 was annulled by the law of 9 August 1944 that declared it null and void and proclaimed that the republic never ceased to exist.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694360","title":"Fábio Jesus Carmo Santos","body":"\nFábio Jesus Carmo Santos\n\nFábio de Jesus Carmo Santos (born 4 May 1994) is a Portuguese footballer who plays for Clube União Culatrense, as a defender.\nFootball career.\nOn 9 January 2013, Santos made his professional debut with Olhanense in a 2012–13 Taça da Liga match against Moreirense.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694363","title":"The Divorce (TV series)","body":"\nThe Divorce (TV series)\n\nThe Divorce is an Australian comedy opera television series which began screening on the ABC on 7 December 2015. The four-part series is written by Joanna Murray-Smith with music by Elena Kats-Chernin. Based on an original idea by Lyndon Terracini, it was developed by Opera Australia and directed for television by Dean Murphy.\nPlot.\nWealthy couple Iris (Marina Prior) and Jed (John O'May) are happily getting a divorce and throwing an elaborate party. By the end of the evening, Iris and Jed's divorce has triggered a renegotiation of all certainties and the characters are set on an unanticipated course. Louise (Lisa McCune), the younger sister of Iris is secretly in love with art critic Jed. Toby (Hugh Sheridan) is an aspiring artist critic, hired to work as a waiter at the party. William (Matthew McFarlane) is Iris' young and handsome lover, an accountant who lacks charisma. Caroline is Jed and Iris' personal assistant who is in trouble with small-time gangsters. Patrick (Peter Cousens) and Ellen (Melissa Madden-Gray) are the best friends of Jed and Iris.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694379","title":"Nohshad Shah","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48694384","title":"Shahena Ali","body":"\nShahena Ali\n\nShahena Ali (; born 10 September 1977) is an English celebrity chef, television presenter, nutritionist, businesswoman, and food and beauty writer.\nEarly life.\nAli is of Bangladeshi descent. Her father is restaurateur Siraj Ali and her mother is Begum Momtaj Khanom. She has one brother, Ansar, and two sisters, Shareena and Jasmine.\nShe was brought up in an environment where cooking and food was a passion, and she was involved in a busy family restaurant.\nAli started her interest with food during her early years in her parents' kitchen, taught initially by her mother and later, experimenting by herself and learning tips and techniques from friends who lived abroad. She learned to cook food at home at the age of nine, starting with the basics and helping her mother in the kitchen.\nEducation.\nAli has a background in food, business beauty, medicine and the sciences. She graduated with a degree in Economics and Accounting from City University London and then attended Cass Business School. After completing her degree, she worked as a city fund manager in bond asset management. She then decided to move into Medicine and started studying at Swansea University School of Medicine but left to follow her passion for cookery.\nCareer.\nIn 2007, Ali left her six figure salary as a bond fund manager, and founded the beauty brand The Powder Lounge and Lash Bars. She established it as a specialist in brow and lash treatments and premium products, with Glamour Express Brow and Lash Bars located in flagship high street stores such as Topshop, Debenhams and Superdrug in the UK.\nAli is a television cook, food writer, food presenter, naturopathic nutritionist, naturopath (natural medicine) and medicinal food expert. She has knowledge about Indian cookery, medicinal and healing foods, as well as foods related to anti-ageing and beauty. 
She provides an approach to traditional Indian, Bengali and Middle-Eastern cookery by transforming basic ingredients into healthy dishes. She has an original perspective of using food ingredients for health benefits such as energy levels, physical and mental performance and aesthetic improvement, such as the ageing of skin, hair and nails.\nAli is a food and beauty features writer for \"Vanity magazine\", and has contributed to other national publications on Indian, Bengali and Middle-Eastern cuisines. She is a regular columnist and writer for \"Zaikha Magazine\". She writes on subjects such as how food affects our physical and mental performance, and its effect on mood, appearance, ageing and illness.\nShe is regularly featured on television for UKTV Good Food, radio for BBC Radio, and national magazines and newspapers. She has appeared at live events such as food festivals in Covent Garden in London as well as the Zee TV Carnival, and other media events. She has also made numerous appearances on television programmes including several times on BBC \"Great Food Live\" and featured on Channel 4 programme \"Taste\".\nShe is ambassador and spokesperson for the Department of Health's (NHS) 'Change4Life' Campaign. She is internationally recognised as an authority on healthy eating and cookery. She has also had international interest from the media. She is currently undertaking projects with US and UK celebrity chefs and firms.\nAli is also the creative director for an Indian restaurant group. She researches, develops, prototypes, and introduces contemporary and fusion dishes on the menu for an Indian restaurant group as well demonstrating and cooking, centuries old Indian recipes. 
The group was selected to cater for the launch of the Bangladesh Food Festival at the Houses of Parliament.\nIn March 2008 and April 2010, Ali appeared in the Live Kitchen at the MS Life conference in Manchester Central.\nAwards.\nIn 2011, Ali received the Channel S Awards 'Contribution to the Community' Award for London for her outstanding contribution to the British Bangladeshi Community through the food and beauty industries.\nPersonal life.\nAli lives in Stanford-le-Hope, Essex, and is divorced. She is a keen runner and has participated in several events including the City Square Mile Run and the Flora Women's Run.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694386","title":"Nazia Ali","body":"\nNazia Ali\n\nNazia Ali (; born 19 February 1977) is a Bangladeshi-born British novelist.\nEarly life.\nAli was born in Kodomtoli, Sylhet District, Sylhet Division, Bangladesh, and spent a large part of her life in the United States where she studied and spent her adolescence. Her family moved to the U.S. in 1988 where she attended Central High School in Bridgeport, Connecticut. Ali later married and moved to the United Kingdom.\nAli is the eldest of four children. Her father is a businessman and her mother is an author.\nWriting career.\nAli's earliest accolade was the Young Author's Award in Bridgeport, CT. Followed by an original short story titled \"From Bangladesh to America\", which was published in a local magazine.\nIn June 2012, Ali's debut book \"Healthy and Halal Choice\" was published, the book is an introduction to healthy lifestyle choices and building a balanced life. The book invites different faiths and ethnic groups to try different recipes that promote a healthy lifestyle. The book made several world appearances including an international book fair in Frankfurt, Germany, book signings in the United States, United Arab Emirates, and Bangladesh.\nIn March 2013, her second book \"Into the Light from the Darkness\" was published, the book is a fictional novel about a woman's journey towards Islam. Ali cites the Quran and Sunnah as style and thematic expression in her writing.\nAli's work explores dawah and community building. She was inspired by author Manoara Shanur and charity worker Mohammed Choudhury.\nOther work.\nAli is also involved local services and non-profit work. She serves as the UK Chairperson for the MSB Foundation and the Muslim Baag Madrassa. She is the face and chairperson of the NFA Foundation. She has spoken at events in the U.S, UK and Bangladesh. 
She is also a property developer and community champion.\nAwards.\nIn April 2013, Ali was awarded by Channel S for \"Healthy and Halal Choice\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694401","title":"Wangpo Tethong","body":"\nWangpo Tethong\n\nWangpo Tethong (born 16 April 1963, Trogen, Canton of Appenzell Ausserrhoden) is a Swiss–Tibetan activist, writer, spokesperson of Greenpeace Switzerland and member of the 15th Tibetan Parliament in Exile.\nLife and work.\nWangpo Tethong was born to Tibetan refugees at the Kinderdorf Pestalozzi in Trogen, Canton of Appenzell Ausserrhoden. He studied history and law at the University of Zürich, where he graduated with the masters degree (phil. I) from the philosophial departement in 1997.\nIn 1988 Tethong assisted the German \"Die Grünen\" politicians Petra Kelly and Gert Bastian, convenors of the first international hearing on Tibet. From 1988 to 1989 Thetong was a board member of the Tibetan Youth Congress (TYC), and between 1986 and 1990 president of the \"Tibetan Youth Association Europe\" and board member of the \"Verein Tibeter Jugend in Europa\" (literally: \"Association of Tibetan Youth in Europe\"). He co-founded the \"Studentische Arbeitsgemeinschaft für Tibet\" (STAFT) at the University of Zürich in 1989, and was co-editor of the Tibetan-German magazine \"Bod Shon\" (\"Junges Tibet\", literally \"Young Tibet\") from 1989 to 1995. Since 2001 he is the elected president of the \"Gesellschaft Schweizerisch-Tibetische Freundschaft\" (GSTF), literally \"Swiss-Tibetan Friendship Society\". Wangpo also served as party secretary and spokesperson of the Green Party in the Canton of Zürich from 1997 to 1999. Tethong was also a co-initiator of the Tibetan Freedom Radio that broadcasts a Tibetan and Chinese radio service, co-founder of \"Lamtön\", an advice center for Tibetan refugees in Switzerland in 2004, chairmen of the ITSN Olympics Working Group from 2001 to 2008 and since 2008 president of the National Olympic Committee of Tibet. 
He also initiated \"ICT Deutschland\" in 2004, in 2008 \"Filming for Tibet\" and one year later \"Tibet Film Festival\".\nAs the first exile Tibetan, he carried out a daring protest at the \"Tiananmen Square\" in Beijing in 2006. Among other events, Tethong also organized the manifestations with HH 14th Dalai Lama in Berlin (Germany), Wien (Austria) and Zürich (Switzerland). Since April 2000 Tethong is the mediaofficer of Greenpeace Switzerland, since 2006 senior consultant for the Zürich-based \"Kampagnenforum\", an agency for development and implementation of participatory communication campaigns, and he works as freelancer, consultant for public affairs, and on communication and film production.\nTibetan Parliament in Exile.\nOn 6 May 2014 Wangpo Tethong was elected as member of the Tibetan Parliament in Exile from Europe constituency, where he took the oath of office from speaker Penpa Tsering at a ceremony held at the Tibetan Parliament in Dharamsala. He replaced Chungdak Koren who submitted her resignation citing health reasons. Wangpo gained the third highest votes in the last parliamentary elections from Europe constituency, which is represented in the Tibetan Parliament by two members: he \"has been involved in various services to the Tibetan community including the campaign for jailed Tibetan filmmaker Dhondup Wangchen\". The 44 members of the 15th Tibetan Parliament arepresentent the three traditional provinces, four Tibetan Buddhist sects and the traditional Bön religion of Tibet. Izd members are directly elected by Tibetan exiles above the age of 18 from their respective around the world.\nPersonal life.\nWangpo Tethong is married, father of two children, and lives in Jona, Canton of St. Gallen.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694407","title":"Baths of Nero (Pisa)","body":"\nBaths of Nero (Pisa)\n\nThe Baths of Nero (Italian - \"Bagni di Nerone\") are an archaeological site near the Porta a Lucca in Pisa, then the Roman city of Colonia Pisana. Now below street level, they are the only Roman remains still standing in the city and form a thermae complex.\nHistory.\nThey were given the misnomer 'of Nero' in the medieval period, when they were believed to have been part of a palace - the earliest level actually dates to the final decades of the 1st century, during the reign of Domitian, as suggested by the use of the \"opus vittatum mixtum\" building technique with alternating layers of brick and tuff blocks. It was rebuilt during the 2nd century, as evidenced by an inscription (CIL , now held in National Museum of San Matteo) which cites the Veruleii Aproniani family, well-known for owning extensive grounds and ceramics factories. In particular Lucius Venuleius Apronianus Priscus financed the rebuilding. He was a \"patronus\" of Roman Pisa and consul of Attidium (a Roman city near present-day Fabriano), who held a number of offices in the Antonine period. As was typical of public figures in the Roman world, he funded several building projects - in 92 he built the Caldaccoli Aqueduct and he also funded a building in Corliano.\nThe best-preserved part of the complex is the sudatio laconicum (hot room), composed of an octagonal room with an apse, with a dome-shaped perforated roof, which has been partially restored. There are also the remains of some of the walls of the palaestra of the apodyterium and two walls from the tepidarium. Marble remains and some decorative sculptures have also been found. 
Its water was supplied by the nearby river Auser and from the Caldaccoli Aqueduct.\nThey were re-discovered and restored in the 16th and 17th centuries by command of Cosimo III, excavated in 1881 by Clemente Lupi, fenced off in 1938 (after the demolition of some neighbouring houses) and finally fully restored in 1947. A covering dome was installed but this was worn out by the weather by 2007, when it was replaced.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694416","title":"Latina Women and their Migrations to America","body":"\nLatina Women and their Migrations to America\n\nCurrently, there are over 20 million immigrant women residing in the United States. The states that the majority of these immigrant women come from Mexico, meaning that the main demographic of immigrant women in the U.S. are Latina. As the fastest growing minority group in America, Latinas are becoming primary influencers in education, economics and culture in American society and the consumer marketplace.\nDefinition of a Latina.\nThe word Latina is the feminine form of the word Latino, and represents strictly the female population of this ethnic group. The word Latino is short for LatinoAmericano, which translates to Latin American. It was originally adopted in the US for the purpose of additional categorization of the population in the United States Census. It is important to note that Latino/a is an ethnic category, and one that encompasses various racial groups. Latinas are women of Mexican, Puerto Rican, Cuban, Dominican, Central American, South American, or Spanish origin. Though Brazil is part of Latin America, it is not a Spanish-speaking country, and is excluded from the category of Latinos by the United States Census office.\nHistory of Latina Migration.\n1970–Present\nThe 1970s marked the first decade in which a gender shift occurred in Mexican migration. During this time, more single women and more families began to migrate along with the working males who had already been migrating for several decades. This difference in gender migration is largely attributed to the difference in Latino and Latina work opportunities in the United States. Prior to the 1970s, the majority of the Latino migratory work was agriculturally based. However, with the end of the Bracero program, the United States policy on migration within the hemisphere shifted from encouraging primarily working males to migrate. 
Beginning with the Watershed amendment of 1965, the United States shifted their policy to encourage the migration of whole families by issuing less visas to unskilled single men and more visas to families. This marked the beginning of a large increase in Latina migration. While men typically migrate at a young age concentration of 18-25, females migrate at generally consistent rates at all age groups. This signals a difference in motives for female migration. While Latinos almost always migrate to the United States in search of work, Latina migration follows a pattern heavily tied to family life.\nLikewise, the early waves of the Cuban migration were primarily families. After they Bay of Pigs failure, many middle class Cuban families sought escape from the newly communist Cuba in the United States. 1961 and 1962 were marked by full family Cuban immigration. Thus, many Cuban women found themselves in the United States as a result of their family. After the Cuban Missile Crisis, the ability for Cubans to immigrate with their families became limited as a result of strained US-Cuba relations. This led to Cubans use of flotillas in order to make it to the southern coast of Florida.\nReasons For Latina Migration.\nWhile the primary reason for immigration into the United States for Latinas is economic improvement, the betterment of family life remains an important factor. Latina women also migrate with their families in an effort to seek refuge from violence and political instability in their native countries. Violent events in El Salvador, Guatemala and Honduras the amount of Latinas entering the United States with families has nearly doubled in 2015. 
Likewise, many Latina women identified their primary reason for immigration was to reunite with family already in the United States.\nHealth.\nThe Hispanic paradox refers to the medical research indicating that Latino immigrants enter the United States with better health, on average, than the average American citizen, but lose this health benefit the longer they reside in the United States. It is important to note that this health paradox affects both male and female populations of Latinos. Likewise, immigrant Latina women are found to have a lower infant mortality rate than U.S. born women. This has been explained by the tendency for Hispanic women to continue breastfeeding for a longer amount of time.\nThe Affordable Care Act does not cover non-citizens nor does it cover immigrants with less than 5 years of residency. As a result, Latino immigrants struggle to gain health care once they enter the United States. Non-citizen Latinos often avoid hospitals and clinics for fear of deportation, leading to an increased risk of preventable diseases such as tuberculosis and Hepatitis in this population. Additionally, Latino health deteriorates as this population assimilates into unhealthy lifestyles associated with lower socioeconomic American populations.\nLatina Women in the Workforce.\nImmigration to the United States offers new economic prospects for Latina women. While many Latina women work outside the home in their countries of origin, their efforts in the U.S. often yield more economic benefits. The Institute of Latino Studies at the University of Notre Dame comments on this idea with Mexican women in mind, claiming that “much of the work that women do in the United States generates more income than it would in Mexico, allowing women to be much more financially independent.” This financial independence allows these women more freedom to act as the head of household.\nThough economic conditions in the U.S. 
are often better for these immigrants than in the countries from which they came, they are nowhere near those that men and even women of other ethnicities enjoy. Latina women make disproportionately less money than their male and non-Hispanic white counterparts. These disparities in wage and job availability leave this portion of the United States population more vulnerable to poverty and its implications. Though it is common knowledge that women in the United States make less than their male counterparts, this wage gap further varies by ethnicity. On average, Latina women make 55 cents to the dollar when compared to white, non-Hispanic males while white women make 78.1 cents to the same dollar. This discrepancy between white and Latina women continues further. The number of working poor Latina women is more than double that of white women, and poverty rates for Latinas are nearly triple those of white women. The elimination of this wage gap, on average, equates to: 194 more weeks of food for a Latina's family, more than 17 more months of mortgage and utility payments, nearly 27 more months of rent, or 12,342 additional gallons of gas.\nThese wage gaps in the workforce affect Latinas at every socioeconomic status, not just the working class. Latina women are the most likely group to be paid at or below the minimum wage, with 5.7% of wage and salary workers earning this amount. Of women in the workforce with advanced degrees (master’s, professional, and doctoral degrees), Latinas earn the lowest median weekly earnings of all racial and ethnic groups in the United States. Despite discrimination in the workforce, Latina participation is on the rise. From 1970 to 2007 Latinas have seen a 14% increase in labor force participation, which the Center for American Progress calls “a notable rise.” \nOf the Latinas participating in the labor force, 32.2% work in the service sector, according to the Bureau of Labor Statistics. 
This percentage is significantly higher than that of white women, who fall at 20%. Conversely, Latinas are underrepresented in various other sectors of the labor force, particularly as business owners. However, Latina entrepreneurship has grown immensely since the start of the 21st century. In 2011, 788,000 Latinas ran their own businesses, representing a 46% increase from 2006. Comparatively, female business owners as a whole only increased by 20% during this same time period.\nFamily.\nIn the United States, female employment has become an increasingly important determinant of family economic well-being, especially among disadvantaged populations such as Latinas. Female employment offers these women more autonomy, the chance to support themselves without relying on a spouse.\nDomestic Abuse.\nThis autonomy is particularly important considering some researchers believe that Latinas may be particularly vulnerable to domestic violence issues. These domestic abuse struggles result from a combination of violent partners and bureaucratic complications of the US immigration system. Domestic issues among immigrants are potentially exacerbated by language barriers, economic dependence, low levels of education and income, poor knowledge of services, undocumented status, lack of a support system, and the immigration experience in general. According to the Rutgers School of Social Work, around 17% of Latina immigrants are victims of Domestic Violence. This violence can manifest in different ways, and is often difficult to diagnose when it the result of verbal threats rather than physical abuse. Oftentimes, it is threats of deportation that influence Latina women to keep silent about their situation.\nLatina Family Values and Structure.\nBecause the Latina ethnicity encompasses a large variety of people, including people of various races from various countries, it is difficult to define the Latina Family experience in a simple way. 
To do so would oversimplify this population and result to stereotyping, as the experience of Latinas is just as nuanced as the women who comprise this ethnic group. There is a significant lack of literature on the home life experience of Latina women and how it may change with immigration to the United States.\nFamily Life in Countries of Origin.\nPatterns of female family structure are found to be similar in Nicaragua and the Dominican Republic, and tend to be more matrifocal. Conversely, Mexican and Costa Rican women are often migrating from a patriarchal husband-wife system, with just 13% and 22% of households headed by women in these countries, respectively. Puerto Rico lies somewhere between these two systems, sharing aspects of both patriarchal and matrifocal systems. According to a study published by the National Institute of Health, these patterns correspond with relatively low female participation in the labor force.\nLatina Power in the United States.\nFor Mexican and Costa Rican women in particular, life in the United States represents a significant shift in opportunities for family life, as higher wages allow women the ability to be more autonomous. In a 2013 Nielson study in the United States, Latinas said they were primary or joint decision makers in the household, giving input in categories such as grocery shopping, insurance, financial services, electronics, and family care. Additionally, the Latina population is increasingly becoming \"primary wage earners and influencers\" in the modern Hispanic United States Household.\nEducation.\nLatina Immigrants' Current Levels of Education.\nThe research states that in 2012 Latina immigrants from Mexico, Cuba, and the Dominican Republic had the lowest education level when compared to other countries. However, women had higher education rates than the Latino male immigrants, as shown in the American Immigration Council's . 
For example, 6.2% of female immigrants in Mexico have bachelor's degrees as compared to the 5.0% of male immigrants in 2012. 14% of the women immigrants from the Dominican Republic have bachelor's degrees compared to the 12% of Dominican men.\nIn a recent from the International Business Times, Latino immigrant students are falling behind in academic achievements and graduation rates compared to other students. Moreover, these statistics apply to Hispanics that have not recently migrated to the United States, implying that the American education system is not meeting the needs of Latino students as a population. The shows in a study in 2008, that Latina immigrants residing in Phoenix, Northern Virginia, and Atlanta all have a lower high school completion rates when compared to their male Latino immigrant counterparts. Latinas also fall behind Latino immigrants in their likelihood to attend 1–4 years of college. However, in Northern Virginia and Atlanta a higher percentage of Latina women complete 5+ years of college than Latino men do. Latina immigrants also lack a \"substantial amount\" of English proficiency, as discovered in IWPR's 2008 research. This language barrier plays a significant role in the Latina educational experience and progress.\nEducation Services for Latina Immigrants in the United States.\nCurrently, there are limited resources for Latina immigrants in the United States. As explained in Motivations of Immigration, many women come to the United States for a better education, among other factors. The explains the workings of organizations aimed to support the struggles of Latina immigrants. The IWPR states that growing organizations are currently providing English tutors and access to education. Programs specifically for Latina (and Latino) immigrants now use an adaptation tactic of teaching, rather than an assimilation ideology to help this population adjust to American life. 
Programs like these include , providing education on English, workers' rights, and the consumer culture of America.\nSocial Issues.\nWhile Latina women face a multitude of issues in immigrating into the United States, perhaps the most significant ones revolve around basic human rights. All too often, illegal Latina immigrants are unable to avoid human abuse because of lack of protection from the law. As a result, Latinas endure a severely unequal migratory experience when compared to their male counterparts.\nHuman Trafficking\nHuman trafficking disproportionately affects women. In the United States, an estimate of at least ten thousand people are forced into labor through such a process. Within the category of women, immigrant women are the ones who are targeted and pulled in more easily. Due to their lack of knowledge of their new surroundings, the English language, and vulnerability to work, these women are more easily tricked, or coerced, into these businesses. These women come into the United States looking for improved employment or educational opportunities, making them much more vulnerable to coercion and false job opportunities offered by traffickers. Additionally, many immigrant women do not understand their rights, or are faced with threats of deportation. Much of this trafficking is hard to detect, as it is not usually visible to the public or governmental eye.\nDealing With Social Issues\nThere are various Latina women involved in organizations and programs that aim to aid Latina women affected/victimized by human trafficking or domestic abuse. Some of these influential women include Maria Jose Fletcher, Laura Zarate, Rosie Hidalgo, Olga Trujillo, Susan Reyna.\nIn Florida, Maria Jose Fletcher is the founder and co-director of VIDA Legal Assistance, a not-for-profit legal organization whose purpose is to provide legal support for the immigrant women who have been victims of violent crimes. 
This organization acknowledges and aims to solve the issue of fear of deportation that plagues the Latina community and makes it fearful of reporting such crimes.\nLaura Zarate is the co-founder of the organization of , which translates to \"Art Heals.\" This Latina-lead organization was founded in Austin, Texas and serves the purpose of addressing sexual violence.\nRosie Hidalgo has used her position as a former attorney in New York City and her current role as the Director of Public Policy for Casa de Esperanza and the National Latin@ Network to help fight domestic violence issues. She was influential in the fight for the reauthorization of the Violence Against Women Act. She has also been awarded for her work on domestic abuse and immigration reform.\nSusan Reyna is the executive director of M.U.J.E.R. (Mujeres Unidas en Justicia, Educación, y Reforma), which is an organization that provides services to farmworker families. This organization also helps victims of sexual assault and domestic violence.\nImmigrant Culture within America.\nMexican Influence in Literature.\nImmigrants have influenced today's culture in America through their practices, art, literature, and more. Latina immigrants have influenced American literature dating back to the 19th century. Maria Amparo Ruiz de Burton was the first Mexican immigrant to write a novel in English. Her literary works gave Latina women in the United States a new voice by delving into race, gender, and class of the times. This set the tone for many Latino and Latina immigrants to create works in American society.\nCuban Influence in the Arts.\nCuban culture has made its way into America thanks to many refugees and their talents. Maria Irene Fornes, a Cuban immigrant to the United States, created plays that focused on feminism and poverty. Her success in the 1960s gave Latina immigrants a presence in off-Broadway productions. 
Another Cuban immigrant, Ana Mendieta, created sculptures, performances, and many other art mediums that focused on themes of women, life experiences, and earth. She received a Lifetime Achievement Award in 2009, which emphasizes her success in her artistic fields and connection to life experiences. Celia Cruz, originally born in Havana, Cuba, was famous for her Cuban-inspired salsa music and many Latin and American Grammy's. Celia immigrated to the US in the early 1960s against Castro's wishes. Not only was she famous for her vocals, but she made many Hollywood appearances, resulting in a star on Hollywood's Walk of Fame. By having such a wide, diverse audience, she left her mark on America's pop culture as a female Cuban immigrant. Like Celia, Gloria Estefan was born in Cuba and is arguably the most famous Cuban American singer to date. Her Latin music flooded American radio stations and television features, bringing Latina presence into American pop culture.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694417","title":"Fahredin Gunga","body":"\nFahredin Gunga\n\nFahredin Gunga (1936–1997) was an Albanian poet from Kosovo.\nBiography.\nGunga was born in Mitrovica in 1936. He studied in Belgrade and later worked as a teacher in Mitrovica and for the Rilindja publishing company in Pristina. His verse production showed him to be a poet of searching, thought at times nebulous ideas, whose abstract symbolism and abstruse metaphors often took an unexpected surrealist turn. He was the author of nine poetry collections from 1961 to 1996, among which are, \"Nokturno për orkidenë\" (Nocturne for the orchid) f1981; \"Mallkimet e zgjuara\" (Awaken curses) 1985; and \"Gramatika e gjëllimit\" (The grammar of living) 1996. Gunga served as editor-in-chief of the Radio Television of Pristina during the 1970s.\nGunga is a controversial figure between Albanians. He testified against Adem Demaçi on his trial on 19 November 1958, accusing him of separatism and pan-Albanianism. Therefore, he is considered an operative of UDBA.\nHe died on 1 April 1997.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694429","title":"Anguish (1917 film)","body":"\nAnguish (1917 film)\n\nAnguish (French:Angoisse) is a 1917 French silent film directed by André Hugon and starring Paul Guidé, Albert Dieudonné and Marie-Louise Derval.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694437","title":"Brisbane Truth","body":"\nBrisbane Truth\n\nThe Brisbane Truth newspaper was a subsidiary of The Truth (Sydney newspaper) launched in 1890.\nDigitisation.\nThe paper has been digitised as part of the Australian Newspapers Digitisation Program of the National Library of Australia.\nExternal links.\n\"\" in .\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694442","title":"Sebaiera","body":"\nSebaiera\n\nSebaiera, Uad Sebaiera or Zbayra is a hamlet and wadi(Arabic for valley) in Western Sahara in Oued Ed-Dahab Province in the region of Dakhla-Oued Ed-Dahab on the Moroccan side of the wall in Western Sahara. There is an astronomical station there but it is very small and a few tiny shacks that seem to be permanently inhabited and nomads seasonally settle in Sebaiera. It is located in a wadi(valley) called Oued Zbayra and ephemeral river called Oued Zbayra. The structures in this hamlet are so tiny and utterly unassuming that they are not visible on Google Maps and the nomad's tents are only seasonal and also tiny so it is unlikely Google Maps ever shows them. It's elevation is 220 meters. It lies 104 kilometers east of Chalwa(Cnalwa) and is reachable only by jeep or dirt road.\nLocation.\nLat/Long 24.85,-13.033333\nTime zone.\nThe timezone in Uad Sebaiera is Africa/El_Aaiun\nSunrise at 07:20 and Sunset at 18:03.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694454","title":"Edward John Bolus","body":"\nEdward John Bolus\n\nEdward John Bolus (born 5 May 1879) was a poet and writer, civil servant, and clergyman. He spent his civil service career in India, which appears prominently in his writing.\nLife.\nBorn May 5, 1879 to Harriet S. Bolus and her husband Edward, a schoolmaster in Stoke Newington in London, John studied at the Merchant Taylors' School, Northwood, before matriculating for a BA in Classics at The Queen's College, Oxford, in 1898.\nIn 1902 he took the civil service examination, and on 14 November 1903 arrived in India, where he served in Bombay and in due course Pune as 'ass[istan]t coll[ecto]r and mag[istrate]'. By 1905 he was a second assistant in Land Revenue and General Administration, and by 1 October 1915 an 'Assistant Collector', based in Pune. He was mobilised in 1914, and his highest acting rank was Capt. 26th (Sind) Bn. of the Indian Defence Force.\nWhile in India, Bolus sustained his Classical interests and was an active member of the (apparently short-lived) Bombay Branch of the Classical Association, 'which owed its existence mainly to the enthusiasm of a learned Jesuit, Father Ailinger'. On 6 April 1911 he gave a lecture to the Branch on 'Plato as a Literary Artist'. It was no doubt his activities here that gave rise to his 1920 publication \"Bombaia\", a long description of Bombay in Latin verse.\nAround 1926 Bolus left the Civil Service and in that year was ordained a priest in the Church of England. By 1930 he was priest to Pamber and Monk Sherborne (which were in the gift of The Queen's College and were merged in that year). He remained the resident curate at Pamber Heath into the 1940s.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694481","title":"Lazarus (rapper)","body":"\nLazarus (rapper)\n\nKamran Rasheed Khan better known by his stage name Lazarus is an American physician, rapper and songwriter from Detroit Michigan who is signed to Russell Simmon's YouTube MCN All Def Digital.\nLife and career.\nKamran Rasheed Khan was born in Detroit, Michigan to a Muslim family from Pakistan. He attended Wayne State University where he studied medicine. While studying medicine, he also began rapping. He started his career without a stage name but after few years, he changed his name to Lazarus due to hate against Muslims. He told in an interview that after 9/11 he felt that his chances of becoming a rapper were finished and that his name is a biblical character that resurrected from the dead. Lazarus gained popularity through freestyle rapping on radio stations in Detroit. He did many rap battles on FM 95.5 and FM 105.9. Lazarus later joined FM 98 and started making mixtapes and performing at venues in Detroit including theatre opening for D12 and G-Unit. While working for FM 98, Lazarus was interviewed by Discovery Channel and was featured in a documentary “The Real 8 Mile,” which was hosted by Charlie LeDuff. He released his debut album “Chapter One: The Prince Who Would be King” in 2007 which lead to receive him three nominations “Lyricist of the Year,” “Song of the Year,” and “Artist of the Year” at the 2007 Detroit Hip Hop Awards. The album had 18 tracks including a feature track from Royce da 5'9\". A single “Let The Game Know” from his debut album received worldwide coverage. The music video of “Let The Game Know” was directed by film director Anthony Garth. Another single “Drug of Choice” which was filmed in Pakistan received over a million views on YouTube.\nIn 2013, Lazarus signed to Russell Simmon's YouTube multi-channel network All Def Digital and in 2014 he released a single “Open Heart Surgery” featuring D12's rapper Bizarre.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694482","title":"Jana bahal","body":"\nJana bahal\n\nJana Bahal (Nepal Bhasa:जन बहाः), often called Janabahaa: and also called \"Machindra Bahal\" and less frequently \"Kanak Chaitya Mahavihar\", is one of the few Bahal which have fully fledged storied temple standing in the middle of a court. The main deity residing in the temple is the Seto Machindranath also known as Janabaha Dyo, Aryavalokitesvara, Karunamaya.\nHistorical Background.\nJanabahal originally was known as “Kanak Chaitya Mahavihar”, but after deity of Seto Machindranath was mounted here the courtyard began to be referred as Jahabaha:. The name Kanak Chaitya Mahavihar is from a chaitya of Kanakmuni Buddha in front of the temple, situated in the courtyard. From this we can assume that the bahal was originally a place for Buddhists religious activities. It is said that Janabahaa: Dyo: dates back to 4th century BC but the temple at Janabahal was built by King Yaksha Malla in 1502 AD. It is also believed that kings who followed Buddhism erected the image of various Lokeswaras inside the courtyard.\nMajor Cultural Activities.\nBeside the main Jana Baha Dyah Jatra (chariot festival), the people, mostly Buddhists, visit and pray the Seto Machindranath deity. They count the beads tied in the thread or rotate the manes on the process\nof praying. Newar Buddhists perform uposadhavrata (a kind\nof fasting) every Ashtami by doing saptavidhanutara satvapuja and by offering pate (parasol). They also perform satpuja during which, toncha, batti, prasad all is offered in equal quantity of 1000. In the premises of Kanak-Muni Buddha‟s chaitya, Barey Chwiu is done for the young males of Buddhacharya, Shakya and Bajracharya caste. Newars often organizes the program of lighting the palas around the temple or lighting 108 diyos. This shrine is mainly visited on the day of Purnima, Ashtami and Sanlu (Sankranti) by the Hindus. 
The daily ritual of the temple starts from around 4 am by the priests\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694484","title":"Vincent Kirabo","body":"\nVincent Kirabo\n\nVincent Kirabo was born 1 October 1955 in Hoima District in the Western Region of Uganda. He was appointed the bishop of the Roman Catholic Diocese of Hoima on 30 November 2015.\nPriesthood.\nHe was ordained a priest on 9 September 1979 after studying at the Uganda Martyrs' National Major Seminary Aloculum in Gulu and at St. Mary's National Seminary in Ggaba. He taught at St. John Bosco Minor Seminary, Hoima from 1979 until 1988. He served as the director of the Diocesan Commission for Vocations from 1985 until 1988. He was the vicar at Muhorro Parish in 1990 and rector of St. John Bosco Minor Seminary in Hoima from 1991 until 1992. Between 1992 and 1997, he served as the diocesan financial administrator of Hoima Roman Catholic Diocese. Between 1998 and 2003, he was the parish priest of Buseesa Parish, serving in the same capacity in Katulikire Parish from 2007 until 2008. He became professor and financial administrator of Uganda Martyrs' National Major Seminary Alokolum in 2008, serving in that capacity until 2012. At the time of his appointment as bishop, he was a professor at St. Mary’s National Major Seminary Ggaba, a position he had served in since 2012.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694486","title":"Euglossopteryx","body":"\nEuglossopteryx\n\nEuglossopteryx is an extinct genus of bee in the family Apidae known from a fossil found in North America. There is one described species in the genus, Euglossopteryx biesmeijeri.\nHistory and classification.\n\"Euglossopteryx biesmeijeri\" was described from a solitary fossil, which is a compression-impression fossil preserved in layers of soft sedimentary rock. Along with other well preserved insect fossils, the \"E. biesmeijeri\" specimen was collected from layers of the Middle Eocene Parachute Creek Member of the Green River Formation. The formation is a group of Late Paleocene to Late Eocene depositional basins in Wyoming and Utah. The Parachute Creek Member is a composed of oil shales from a shallow mountain lake that exists for around 20 million years. Study of the paleoflora preserved in the shales indicates the lake was around in elevation surrounded by a tropical to subtropical environment that had a distinct dry season.\nAt the time of study, the holotype was part of the Division of Entomology (Paleoentomology) collections, University of Kansas Natural History Museum. It was first studied by an international team of researchers headed by Manuel Dehon of the University of Mons, Belgium, with the teams 2014 type description of the genus and species was published in the natural sciences journal \"PLOS One\". The genus name is a derived from a combination of the Euglossini type genus \"Euglossa\" combined with the Greek \"pteryx\" meaning \"wing\". This is a reference to the similarity between \"Euglossopteryx biesmeijeri\" and species of \"Euglossa\". 
The specific epithet \"biesmeijeri\" was coined as a patronym honoring the Belgian melittologist Jacobus Biesmeijer, who is a noted researcher of pollinator-plant interactions and pollinator declines.\nThe body and wing structuring indicate a relationship to members of the bee clade Corbiculata, which encompasses the living tribes Apini, Bombini, Euglossini, Meliponini and the extinct tribes Melikertini, Electrapini, and Electrobombini. The preserved pollen basket on the metatibia excluded placement of \"E. biesmeijeri\" into a cleptoparasitic Cuckoo bee genus. Within Corbiculata, Apini has a distinct wing marginal cell and Meliponini has very reduced wing venation, neither features seen in \"E. biesmeijeri\". The wing venation of the species is closest to that seen in Euglossini, however the metatibia is not highly expanded as seen in Euglossini. As such Dehon \"et al\" did not give any placement in the clade, leaving \"Euglossopteryx\" as Corbiculata \"incertae sedis\".\n\"E. biesmeijeri\" is one of four bee species described by Dehon and team in the \"PLOS One\" article, the others being \"Andrena antoinei\", \"Bombus cerdanyensis\", and \"Protohabropoda pauli\".\nDescription.\nThe \"E. biesmeijeri\" fossil is a female preserved with a dorsal view of the body, out stretched wings, and missing its head. The overall body length is not determinable due to slight curling of the body and the missing head, though the mesosoma is . The metatibia are about long, not flared and enlarged notably, and with a distinct corbiculate pollen basket formed of a fringe of long setae. The original coloration and color pattering has been lost, so color pattern and if the color was metallic as in Euglossini species. The forewings have a one marginal cell and three cells below that called the submarginal cells. The marginal cell had a closed tip end that is notably rounded. 
The second and third submarginal cells together are longer than the first submarginal cell, which is the longest of the three cells. A pterostigma is present, but it is incompletely preserved, making observations difficult.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694524","title":"Al and Zoot","body":"\nAl and Zoot\n\nAl and Zoot is an album by the Al Cohn Quintet featuring Zoot Sims recorded in 1957 for the Coral label.\nReception.\nThe AllMusic review by Scott Yanow states, \"The mid- to late '50s were a period of intense recording activity and this album is one of the underrated gems that was somewhat overlooked at the time\". \nTrack listing.\n\"All compositions by Al Cohn except as indicated\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694552","title":"Vertigo (1917 film)","body":"\nVertigo (1917 film)\n\nVertigo (French:Vertige) is a 1917 French silent film directed by André Hugon and starring Régine Marco, André Nox, Marie-Louise Derval.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694558","title":"Rafael Soromenho","body":"\nRafael Soromenho\n\nRafael Almeida Soromenho (born 4 April 1994) is a Portuguese footballer who plays for Sporting Clube Farense B, as a midfielder.\nFootball career.\nOn 9 January 2013, Soromenho made his professional debut with Olhanense in a 2012–13 Taça da Liga match against Moreirense.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694589","title":"Metjen","body":"\nMetjen\n\nMetjen (also read as Methen) was a Ancient Egyptian high official at the transition time from 3rd dynasty to 4th dynasty. He is famous for his tomb inscription, which provide that he worked and lived under the kings (pharaohs) Huni and Snefru.\nIdentity.\nFamily.\nAccording to his own tomb inscriptions, Metjen was a son of the high official Inpu-em-Ankh, a judge at the royal court of justice and a royal scribe. Metjen's mother was a high priestess named \"Neb-senet\". Metjen also had children, which he inderectly mentions, but their names are not handed down.\nTitles.\nAs a high-ranking official, Metjen bore several elite titularies:\nCareer.\nMetjen's tomb inscriptions are of highest interest to Egyptologists and Historians alike. They are in fact the very first Ancient Egyptian private texts that reveal more than only titles and offering formulae. Metjen is the first high official who reports his own professional and curatorial career by listing his official and honorary titles in chronological order and describing the support of his career by his parents.\nAccording to Metjen's autobiography, he inherited many of his titles after the death of his father, other high ranked titles were assigned to him by his father himself. The inheritance included also several decrees which allowed Metjen to found own estates and even small towns. Metjen started as a royal scribe, became then overseer of the royal scribes and confidant of the king, then he became administrator of several palatinates and royal storages. Finally, he became \"great one of the 'Ten of Upper Egypt'\" and privy council. Additionally, the royal house gave several estates to Metjen, whereupon he founded the town \"Sheret-Metjen\" (Egyptian: \"Šr.t-Mṯn\") at his favorite estate. As a sign of gratitude, Metjen in turn donated hundrets of precious trees to royal domains. 
At the peak of his career, Metjen was also mayor of several cities, curator of the endowment estate of king Huni and supervisor of the mortuary cult for queen Nimaathapi.\nContemporary office partners included \"Netjeraperef\", \"Khabawsokar\", \"Pehernefer\" and \"Akhetaa\", who were also holding office under Huni and Sneferu. All their tomb inscriptions reveal that the time of both kings must have been a very prosperous one and that the economy and office administration flourished.\nTomb.\nMetjen's tomb, mastaba \"L6\", was found in 1842 by German Egyptologist Carl Richard Lepsius at Saqqara. He excavated the tomb and ordered the dismantling of the tomb for preservation. Metjen's tomb chapels are now completely on display at the Egyptian Museum of Berlin.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694597","title":"Jackie Akhavan","body":"\nJackie Akhavan\n\nJacqueline Akhavan is a British chemist, and an expert in the chemistry of explosives.\nEarly life and education.\nAkhavan grew up in London. She attended the University of Southampton where she received her BS in chemistry in 1979. After graduating, she began working at Pirelli General developing polymeric optical fibers for communication. She worked at Pirelli for 3 years when she went back into academia by joining Cranfield University as a polymer and physical chemistry lecturer. She also received her master's degree in Philosophy in 1982 and then received her PhD in polymer chemistry from Southampton University.\nAcademic career.\nAt Cranfield, she first started her work using the explosives in fireworks by understanding the reactions taking place as well as making them safe for the public to use. Eventually, she was promoted to senior lecturer at Cranfield and became the head of the MSc in explosives. Her research also is focused on polymer bonded explosives and their applications. During her tenure, she has received numerous research contracts from government organization, such as the Ministry of Defense UK, and also various corporate contracts from companies such as BAe Systems and MBDA. Most of her work, however, is secret due to the nature of her work and the application of her research will never be published. In 2007, she was given a chair in explosive chemistry and is now the Head of the Center for Defense Chemistry. As of September 2014, her current research is focused on making it easier for government agencies to detect explosives during security screenings like the ones conducted at airports. The main focus of the this new research is developing viable ways to detect liquid and paste explosives. 
Akhavan also helps to train government agencies in bomb recognition and detection to improve safety.\nShe is a Fellow of the Royal Society of Chemistry.\n\"The Chemistry of Explosives\".\nAkhavan published a book called \"The Chemistry of Explosives\". This book covered many different aspects of explosives including the classification of explosives, combustion, ignition, thermochemistry, and kinetics. Also, there is an introduction to explosives at the beginning of the book that goes over the development of most of the notable explosives used today. The book is meant to teach others about the science behind explosive compounds.\nNotable work.\nAkhavan has led research for: \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694609","title":"Sharks (1917 film)","body":"\nSharks (1917 film)\n\nSharks (French:Requins) is a 1917 French silent crime film directed by André Hugon and starring Charles Krauss, Marcel Bérard and André Nox.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694623","title":"Yttrium hydride","body":"\nYttrium hydride\n\nYttrium hydride is a compound of hydrogen and yttrium. It exists in several forms, the most common being a metallic compound with formula YH2. YH2 has a face centred cubic structure. Under great pressure, extra hydrogen can combine to yield an insulator with a hexagonal structure, with a formula close to YH3. Hexagonal YH3 has a band gap of 1.8 eV. Under pressure of 12 GPa YH3 transforms to an intermediate state, and when the pressure increases to 22 Gpa another metallic face centred cubic phase is formed.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694640","title":"List of songs recorded by Niykee Heaton","body":"\nList of songs recorded by Niykee Heaton\n\nNiykee Heaton is an American singer and songwriter. She has written and recorded material since her childhood, having started sharing original songs occasionally on YouTube in 2011, for which she accompanied herself on acoustic guitar, along with covers of contemporary hits, where they subsequently went viral in following years, helping to propel the singer to prominence. Heaton released her debut project, an extended play titled \"Bad Intentions\", in September 2014, after signing a record deal with Steve Rifkind and Russell Simmons's Capitol-affiliate All Def Digital, in partnership with Awesomeness Music. The EP garnered positive online reception, with \"The Huffington Post\" writing that it \"offers a significant variety for a debut, all held together by her vocals, most ravishing in her lower register\" and Idolator adding that it \"confidently showcases the versatility and scope of Niykee's songwriting.\"\nIn 2015, she called out her label in an extensive open letter to her fans, later clarifying that \"we are now in a place where we can create music that I want to create, and we are no longer tied to the people that were holding me back,\" also announcing plans to release her first album. In June, she launched a website, NBK (Naturyl Born Killers), stating \"NBK is the movement,\" where new music was then premiered for free regularly over the following months through her SoundCloud account.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694647","title":"Tethong","body":"\nTethong\n\nPeople with the surname Tethong include:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694655","title":"Worthless Woman","body":"\nWorthless Woman\n\nWorthless Woman (French:Fille de rien) is a 1921 French silent film directed by André Hugon and starring Suzanne Talba, José Durany and Vasseur.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694656","title":"Ivar Halfdansson","body":"\nIvar Halfdansson\n\nIvar Halfdansson was a king of Oppland, Norway, one of the petty kingdoms of Norway during the Migration Period. He was an Earl of Norway, Jarl and king of Uplanders, and great-grandfather of Rollo of Normandy.\nHe is mentioned in the \"Ættartalur\" section of Flateyjarbók.\nHe is frequently confused with other people named Ivar in the sagas.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694671","title":"2011 Ligue 1 (Senegal)","body":"\n2011 Ligue 1 (Senegal)\n\nThe 2011 Ligue 1 season was the 46th of the competition of the first-tier football in Senegal and the fourth professional season. The tournament was organized by the Fédération Sénégalaise de Football (Senegalese Football Federation). The season began earlier on 18 December 2010 and finished on 9 September 2011. It was the third season labelled as a \"League\" (\"Ligue\" in French). US Ouakam won their first and recent title, and a year later would compete in the 2012 CAF Champions League. ASC Diaraf, second place and the winner of the 2012 Senegalese Cup Casa Sport participated in the 2012 CAF Confederation Cup, it was the last time bringing a second place club, only the cup winner would participate in the following season.\nThe season would have feature 16 clubs and once again, the winner would be decided on the highest number of points, it was decided after the thirtieth match was finished. Not until the next season it would reappear in that format, the first and second phase system would reappear in the next season. The season scored a total of 368 goals. Casa sport had the highest total of 30 goals scored and the least was CSS Richard Toll with 15.\nASC Diaraf again was the defending team of the title.\nOverview.\nThe league was contested by 16 teams.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694672","title":"Iraq men's national squash team","body":"\nIraq men's national squash team\n\nThe Iraq men's national squash team represents Iraq in international squash team competitions, and is governed by Iraqi Squash Federation.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694676","title":"Food porn","body":"\nFood porn\n\nFood porn is a glamourized spectacular visual presentation of cooking or eating in advertisements, infomercials, blogs cooking shows or other visual media, foods boasting a high fat and calorie content, exotic dishes that arouse a desire to eat or the glorification of food as a substitute for sex. Food porn often takes the form of food photography and styling that presents food provocatively, in a similar way to glamour photography or pornographic photography.\nHistory.\nThe term appears to have been coined by the feminist critic Rosalind Coward in her 1984 book \"Female Desire\" in which she writes: \"Cooking food and presenting it beautifully is an act of servitude. It is a way of expressing affection through a gift... That we should aspire to produce perfectly finished and presented food is a symbol of a willing and enjoyable participation in servicing others. Food pornography exactly sustains these meanings relating to the preparation of food. The kinds of picture used always repress the process of production of a meal. They are always beautifully lit, often touched up.\" (p. 103)\nIt is important to realize that the term food porn does not strictly deal with the connection, often established throughout history, between food items and sexual contents. In the United States, food porn is a term applied when \"food manufacturers are capitalising on a backlash against low-calorie and diet foods by marketing treats that boast a high fat content and good artery-clogging potential\". The origin of the term was attributed to the Center for Science in the Public Interest which began publishing a regular column called \"Right Stuff vs. 
Food Porn\" for its Nutrition Action Healthletter in January 1998.\nIn the United Kingdom, the term became popular in the 1990s due to the TV cookery programme \"Two Fat Ladies\" after the shows producer described the \"pornographic joy\" the pair of them took in using vast quantities of butter and cream.\nConnection with Business.\nTaking a picture of food became one of the norms for younger generation in the world. Study from YPulse shows 63% of people between thirteen years old to thirty two years old posted their food picture while they are eating on social networking services. Moreover, 57% of people in the same age range posted information of the food they were eating at that time. From the percentage, food and social media are starting to connect together as trend. People use hashtag foodporn (#foodporn) unintentionally, but for doing that it helps food industry to track down the data to catch hungry attentions from audiences on social networking services. In current number, about 54 million food pictures are hashtagged on only Instagram. On Facebook, Social media helps connecting people through food trend, and #foodporn.\nUses/ Community.\nThe term food porn has shifted throughout its first appearances. Articles mentioned food porn as early as the late 1970s. The phrase food porn was used in a literal manner, describing food that was unhealthy for human consumption, directly comparing it to pornography. Its use then took on a new meaning, being used to describe food that was presented and prepared in a manner that was aesthetically appealing. It took on this use for over a decade, until the social media boom that was created by the internet. Once the early 2000s hit, the terminology evolved into a way of documenting meals that are recognized for their presentation. This desire for food has flooded the internet, having significant effects on social media sites that provide the ability to display such as Instagram, Flickr, Snapchat, Facebook, and Twitter. 
The popularity of displaying food in a physically appealing manner is driven by the users that create these communities. The use of hashtags that the users of these sites have adopted allows food porn to connect people in a way that documents anything about the food, such as foods that reflect cultures, calories, presentation, preparation, delicious taste, and anything else that adds to the authenticity of the meal.\nCulture.\nThe term foodporn refers to images of food across various social media platforms such as TV, cooking magazine, online blog, website and social media platforms. The reason why foodporn is strongly connecting with popular culture is due to the fact that people are exposed to food in their everyday lives. Foodporn is not specific to social media platforms and could also be part of the category on newspaper and online blog. Moreover, foodporn is experienced globally. Language barriers that exist culturally can be bypassed by the usage of #foodporn. Food porn is used collectively by the online users and does not exclude or privilege one food over another.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694696","title":"Grand Lake (Sheet Harbour)","body":"\nGrand Lake (Sheet Harbour)\n\nGrand Lake is a lake just west of Sheet Harbour, Nova Scotia. It is crescent shaped. Its primary outflow is Little West River, which flows into the Northwest Arm of Sheet Harbour. The land area of the Sheet Harbour 36 Indian reserve extends to a part of the shore of Grand Lake.\nIn 2012, the Nova Scotia Government bought land near the lake worth $1.1 million.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694699","title":"A Crime Has Been Committed","body":"\nA Crime Has Been Committed\n\nA Crime Has Been Committed (French:Un crime a été commis) is a 1919 French silent film directed by André Hugon.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694702","title":"FabricLive.81","body":"\nFabricLive.81\n\nFabricLive.81 is a 2015 DJ mix album by Monki. The album was released as part of the FabricLive Mix Series.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694719","title":"Myoporum wilderi","body":"\nMyoporum wilderi\n\nMyoporum wilderi, commonly known as Cook Islands myoporum or ngaio, is a plant in the figwort family, Scrophulariaceae and is endemic to the islands of Mangaia and Mitiaro in the Cook Islands. It is similar to \"Myoporum stokesii\" and \"Myoporum rimatarense\" which grow on other Pacific Islands. On the island of Raratonga it is used to add a scent to coconut oil.\nDescription.\n\"Myoporum wilderi\" is a shrub or small tree sometimes growing to a height of with young branches that are flattened or three-sided. The leaves are arranged alternately, are broadly elliptical in shape with a pointed tip and are mostly long and wide. They are the same shiny colour on both surfaces, glabrous and have a distinct mid-vein.\nThe flowers are borne in groups of up to 6 in the axils of leaves on stalks long and usually have 5 pointed sepals and 5 petals forming a tube or bell-shape. The tube is long with lobes about the same length. The tube is white with distinct purple spots in the tube and on the inner parts of the lobes. There are four stamens which extend beyond the petal tube. The fruits is an oval shaped drupe with a distinct point on the end.\nTaxonomy.\n\"Myoporum wilderi\" was first formally described in 1933 by Carl Skottsberg and the description was published in \"Acta Horti Gothoburgensis\". The specific epithet \"wilderi\" honours the botanist Gerrit Parmile Wilder.\nDistribution and habitat.\n\"Myoporum wilderi\" is only found on Mangaia and Mitiaro.\nUses.\nOn Mangaia, the flowers of this myoporum are used to scent coconut oil. On Raratonga, the species is cultivated for the same purpose.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694728","title":"A Perilous Journey","body":"\nA Perilous Journey\n\nA Perilous Journey is a 1953 American adventure film directed by R. G. Springsteen and written by Richard Wormser. The film stars Vera Ralston, David Brian, Scott Brady, Charles Winninger, Hope Emerson, Eileen Christy and Leif Erickson. The film was released on April 5, 1953, by Republic Pictures.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694729","title":"Greg Norman Medal","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48694730","title":"The Gold Chignon","body":"\nThe Gold Chignon\n\nThe Gold Chignon (French:Chignon d'or) is a 1916 French silent film directed by André Hugon and starring Mistinguett and Harry Baur.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694734","title":"John F. Hager","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48694749","title":"Order of the Sword & Shield","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48694770","title":"Weaubleau Christian College","body":"\nWeaubleau Christian College\n\nWeaubleau Christian Institute was founded in 1873 in Hickory County, Missouri, under the auspices of the Weaubleau Congregational Christian Church. The congregation of the church was made up of families living on newly settled farms, who chose a central location on which to erect a 2-story building large enough to accommodate a church on the first floor and an academy or secondary school on the second. A small town, first called Haran, but later renamed Weaubleau for the stream upon which it is located, grew up around the Church and Institute.\nThe Institute was incorporated under a board of trustees, the majority of whom were to be perpetually drawn from among the members of the church. The student body never exceeded 15) at any point in the school's first 35 years. One of the College's Presidents, John Whitaker, called it a \"frontier college,\" and wrote that many of the students taught terms in frontier schools to earn their tuition fees.\nThe Institute gained accreditation as a college around 1893, eventually granting three degrees: Bachelor of Science, Bachelor of Accounts, and Master's Degree.\nThe College closed in 1914. The Weaubleau Congregational Christian Church closed in 1960. Some papers related to the College and the Church are held by the State Historical Society of Missouri. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694781","title":"Edson Vidigal","body":"\nEdson Vidigal\n\nEdson Carvalho Vidigal (born June 20, 1944) is a Brazilian politician and lawyer. He served Brazil's Superior Court of Justice from December 9, 1987 to March 29, 2006.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694814","title":"Rooted in Community","body":"\nRooted in Community\n\nRooted in Community National Network also referred to as R.I.C or Rooted in Community is a non-profit organization, which was founded in Boston. It is a national network that brings young people together to create food security, community gardens and fight for food justice in low income communities. Diverse group of adults and youths helps \"empowers young people to take leadership in their own communities.\" Annual conference and regional gathering for youths to have the opportunity to travel different communities.\nHistory.\nTwo High School students from The Food Project attended 1998 American Community Gardening Association (ACGA) conference. They felt there was a lack of youths involved in the food system and fighting for food justice. First conference was held in Boston with over 70 youths attending.\nProgram Overview.\nInviting youths from across the country to experience different ways to improve their communities. Attending to different workshops with team building and leadership activities, also discuss issues with the food industry in America. Also fighting for Food Justice for communities to have the right to grow, sell, and eat inexpensive healthy food. Changing the food system by helping passing the Youth Food Bill of Rights in Washington. Youths learn about food preparation creating healthy eating habits and appreciation for agriculture. RIC created the TOOL SHED, an online information resource website to help other farmers and youths. The TOOL SHED has lessons on giving a workshop, lecture, and activities.\nList of Network Groups.\nList of organizations, programs and supporters who attended to conferences in the past:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694819","title":"Adam C Franklin","body":"\nAdam C Franklin\n\nAdam Franklin is an Australian author, entrepreneur and social media keynote speaker.\nFranklin published \"Web Marketing That Works: Confessions from the Marketing Trenches\" (Wiley 2014) (ISBN 978-0-7303-0927-7) as a paperback and Kindle ebook with co-author Toby Jenkins and it became an Amazon #1 bestseller in Australia.\nHe co-founded his company Bluewire Media with Toby Jenkins in 2005. Franklin featured on \"Smart Company\"'s \"Australia's Hot 30 Under 30\" list of entrepreneurs in 2009. In 2010 he collaborated with David Meerman Scott on the Web Strategy Planning Template which they co-branded. This marketing strategy template was also included in the third, fourth and fifth editions of David Meerman Scott's bestselling book The New Rules of Marketing and PR which has over 350,000 copies in print in more than 25 languages.\nHe co-hosts the podcast \"Web Marketing That Works\" and was interviewed on the Entrepreneur On Fire podcast.\nIn 2015, Franklin's Bluewire Media blog was named the #1 Business Blog in Australia according to Smart Company and was a Business Finalist for the Best Australian Blogs in 2014 according to the Australian Writers' Centre.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694820","title":"The Jackals (1917 film)","body":"\nThe Jackals (1917 film)\n\nThe Jackals (French:Les chacals) is a 1917 French silent adventure film directed by André Hugon and starring André Nox, Louis Paglieri and Musidora.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694840","title":"The Europe Trust","body":"\nThe Europe Trust\n\nThe Europe Trust, formerly known as the European Trust, is a UK charity and company which lists its purpose as developing a portfolio of assets intended to fund social and economic projects for communities in Europe. The Europe Trust was founded by the Federation of Islamic Organizations in Europe (FIOE), an organization alleged to have ties with the Muslim Brotherhood in Europe.\nHistory and organization.\nEurope Trust is a Markfield, United Kingdom, based company and charity which was first registered as a U.K. charity in1996 under the name European Trust and then incorporated as a U.K. company named Europe Trust in 2003. In 2004 it was again registered as a charity bearing the name Europe Trust. The 2005 financial report says that the principal activity of the company \"was that of to establish a portfolio of assets (awqaf) businesses and investments to generate resources to fund social and economic projects for communities in Europe.\" \nThe directors and trustees of the Europe Trust are European Muslims of Middle Eastern descent. The Europe Trust employs three staff members and has multiple volunteers. Former trustee and co-founder Dr. Ahmed Kadhem al-Rawi serves currently as the chief executive.\nConnections to the Muslim Brotherhood.\nMajor news outlets as the Wall Street Journal and The Times have reported that the Europe Trust is the financial vehicle of the Muslim Brotherhood in Europe. The Wall Street Journal reported in 2005 that the European Trust was created in 1996 as the de facto fundraising arm of the Federation of Islamic Organizations in Europe in order to break the dependency of FIOE on Gulf donors. 
The Journal also reported that the Trust had directly subsidized projects of the FIOE, including three colleges and three local Islamic centers that affiliated with the FIOE.\nThe Times reported that the Europe Trust, which has property assets worth more than £8.5 million, sends rental income from its properties to an unofficial network of Brotherhood-linked organizations throughout the continent including the Muslim Association of Britain (MAB), identified by a government minister in 2010 as “the Brotherhood’s representative in the UK.”\nConnections to radicalism and terrorism.\nThe Times of London reported a number of ties from the Europe Trust and/or its Trustees to various forms of terrorism:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694849","title":"Flower of Paris","body":"\nFlower of Paris\n\nFlower of Paris (French:Fleur de Paris) is a 1916 French silent film directed by André Hugon and starring Mistinguett, Harry Baur and Louis Paglieri.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694884","title":"The Four Brothers... Together Again!","body":"\nThe Four Brothers... Together Again!\n\nThe Four Brothers... Together Again! is an album by saxophonists Herbie Steward, Al Cohn, Zoot Sims and Serge Chaloff, who were collectively known as the Four Brothers, recorded in 1957 for the RCA Records subsidiary Vik label.\nReception.\nThe AllMusic review by Scott Yanow states, \"The music overall on this CD reissue is quite enjoyable and Sims, Cohn and Steward show how much they had grown during the previous decade\".\nTrack listing.\n\"All compositions by Al Cohn except as indicated\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694901","title":"Southern Cross (1932 film)","body":"\nSouthern Cross (1932 film)\n\nSouthern Cross (French:La croix du sud) is a 1932 French drama film directed by André Hugon and starring Charles de Rochefort, Suzanne Christy and Alexandre Mihalesco.\nThe film's sets were designed by the art director Christian-Jaque.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694925","title":"Bridge No. L1409","body":"\nBridge No. L1409\n\nBridge No. L1409 was a historic stone arch bridge in Hillsdale Township, Minnesota, United States, built in 1895. However it was largely destroyed during the 2007 Midwest flooding, when runoff carried away everything except the arch substructure. It had been listed on the National Register of Historic Places in 1990 for having state-level significance in the theme of engineering. It was nominated as Minnesota's \"most impressive\" rural stone arch bridge, owing to its fine ashlar masonry and sizeable span. Although the bridge has now been replaced with a modern structure, it has not yet been delisted from the National Register.\nHistory.\nResidents of Hillsdale Township petitioned Winona County for a bridge at this location in September 1894. Initially tabled, the request was later approved and plans were drafted by county surveyor Fred H. Pickles. The project went out for contract in October 1895 and local stonemason Charles Butler—with the lowest bid at $1,340—was selected. The bridge was largely completed by December of that year.\nBridge No. L1409 was among a concentration of rural stone arch bridges in Southeast Minnesota built in the late-19th and early-20th centuries. Most of these were built by local governments in response to the Good Roads Movement. Few, however, spanned more than . L1409 was three times that length, and with the fine masonry produced by Butler, it was comparable to the larger and more sophisticated bridges of Minnesota's urban areas.\nIn the summer of 2007, extreme flooding in Southeast Minnesota sent torrents of water sweeping down Garvin Brook. L1409's spandrel walls and earth fill were torn away, though the stone arch was so sturdily built it held in place. However the bridge was essentially destroyed, and it has since been replaced with a modern structure.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694936","title":"Ben Stillman","body":"\nBen Stillman\n\nBen Stillman is an American film producer. Stillman assisted in the development of the Oscar-winning film \"The Imitation Game\" in 2014. He has produced four films including \"Broken City\", which premiered at Sundance Film Festival, and \"Gold\" (2016) starring Matthew McConaughey in 2016. Stillman is vice president of Black Bear Pictures.\nCareer.\nIn 2011, Black Bear Pictures was established and Stillman joined the company as creative executive after leaving Cinetic International. Stillman was associate producer of \"At Any Price\" in 2012. He was named vice president of Black Bear Pictures in 2013. He co-produced \"A.C.O.D.\" starring Adam Scott, as well as \"Broken City\", starring Mark Wahlberg and Russell Crowe, in 2013. He was executive producer of \"Gold\", a drama-thriller film about the search for gold in the jungles of Indonesia that is scheduled to be released in 2016.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694952","title":"Suzanne Christy","body":"\nSuzanne Christy\n\nSuzanne Christy (1904–1974) was a Belgian film actress.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694961","title":"Pugilina tupiniquim","body":"\nPugilina tupiniquim\n\nPugilina tupiniquim is a species of sea snail, a marine gastropod mollusk in the family Melongenidae, the crown conches and their allies. \"P. tupiniquim\" and its Eastern Atlantic sister species, \"Pugilina morio\", were once thought to be a single, amphiatlantic entity. They have, however, been recognized as distinct taxa based on anatomical and environmental distinctions.\nDistribution.\nThis species is found in the Western Atlantic Ocean, in mangrove areas along the Brazilian coast, and north to the Caribbean.\nHuman use.\nIn traditional Brazilian medicine in the Northeast of Brazil, \"Pugilina tupiniquim\", formerly referred to as \"Pugilina morio\" (actually an Eastern Atlantic sister species) is used as zootherapeutical product for the treatment of sexual impotence.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694980","title":"DomiNations","body":"\nDomiNations\n\nDomiNations is a 2015 freemium mobile MMO strategy video game developed and published by Nexon and Big Huge Games.\nGameplay.\nGameplay is similar to other simulation games like Clash of Clans. You build a base and expand by building resource buildings, barracks, and defensive buildings.\nReception.\nDominations was listed as one of the seven best games of April 2015 by Gamezebo. It was given four out of five stars by 148apps shortly after release, and currently holds four out of five stars on the Apple app store.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694985","title":"John F. Remondi","body":"\nJohn F. Remondi\n\nJohn (Jack) F. Remondi is an American businessman and the president and CEO of the Navient Corporation.\nCareer.\nRemondi became first CEO of the Navient Corporation in April 2014 following its spin-off from Sallie Mae. Prior to Navient, he was the CEO of Sallie Mae from May 2013. Prior to Sallie Mae, Remondi served as Portfolio Manager to PAR Capital Management, from 2005 to 2008. From 1999 to 2005, Remondi served in several financial positions with Sallie Mae, including Executive Vice President, Corporate Finance.\nEducation.\nRemondi graduated from Xaverian Brothers High School in Westwood, Massachusetts and received his bachelor's degree in Economics from Connecticut College.\nPersonal life.\nRemondi is married to Judith Dickstein. He is a former member of the Board of Trustees at Xaverian Brothers High School.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48694990","title":"1997–98 Plymouth Argyle F.C. season","body":"\n1997–98 Plymouth Argyle F.C. season\n\nThe 1997–98 season was the 103rd season in the history of Plymouth Argyle Football Club, and their 73rd in the Football League.\nSquad.\n \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695007","title":"Alexandre Mihalesco","body":"\nAlexandre Mihalesco\n\nAlexandre Mihalesco (1883–1974) was a Romanian film actor who largely appeared in French productions.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695014","title":"Helene Bresslau Schweitzer","body":"\nHelene Bresslau Schweitzer\n\nHelene Bresslau Schweitzer was co-founder of the Albert Schweitzer Hospital, medical missionary, nurse, social worker, linguist, public medicine enthusiast, editor, feminist, sociologist, mother, and wife/confidant of Albert Schweitzer. Albert, a medical missionary, did not mention her role in his efforts. According to writer Mary Kingsley, she is \"one form of human being whose praise has never adequately been sung, namely, the missionary's wife.\" While much of his work seems to overwrite her own, she played a pivotal role in the advancement of medicine, feminine independence, and societal justice.\nEarly life.\nHelene Bresslau Schweitzer was born to the Bresslau family on January 25, 1879 in Berlin. Her maternal family was of Jewish descent, but she was baptized into the Christian religion as a result of wide-spread anti-semitism. The Bresslaus moved to Alsace, France when she was eleven because of a new job opportunity for her father. Her father, Harry Bresslau, began working at the University of Strasbourg and eventually became chancellor. As a result of the move, Schweitzer adopted French, becoming fluent rather quickly.\nIn 1898, Bresslau met her future husband, Albert Schweitzer at a wedding. Shortly thereafter, they developed a relationship that included separation, independence, and non-exclusive behaviors. This allowed both to develop their lives while enjoying each other's companionship, conversation, and virtues. The one thing that united the pair was their shared ideology: to the take care of others.\nBresslau became Albert's confidant but did not give up her own life for his. In fact, they spent a great deal of time away from each other and maintained a nontraditional relationship (together but not exclusive). They felt secure remaining undefined as a couple, relying on their friendship through documented letters. 
The turning point for their relationship occurred when they married on June 18, 1912 in Gunsbach. At this point in their lives, they both decided to marry and go to Africa to fulfill their desire to care for others in need. She quit her job at the orphanage and studied higher level nursing to advance her knowledge before leaving. On Good Friday of 1913, she travelled with Albert to Lambaréné, Gabon, beginning her medical missionary adventure.\nEducation and professional development.\nAged 6, Bresslau attended Queen Charlotte's School. In 1890, she transferred to Lindner Girls' High School in Berlin. She began to pursue music studies at a music conservatory from 1897 to 1899. After receiving her teaching credentials in one year rather than the usual two, she worked as a teacher in England in 1902. Continuing to delve into her passion for learning, Bresslau took courses in medieval, modern, and art history at her father's university, the University of Strasbourg. In pursuit of music, she took voice and piano lessons.\nOne area of study that interested Bresslau was nursing. She joined the Protestant Deaconess' Society on January 1, 1904 \"to complete a course in nursing. After, she was assigned to complete three months of nursing lessons in Stettin. On April 1, 1905, she took a break from nursing and went into social work. Even so, exploring another field other than nursing left her \"eager to fill in the gaps\" of her nursing knowledge.\nShe changed her direction of study when she became a municipal inspector for orphans in 1905. She maintained the position from 1905 to 1909. This endeavor attributes largely to part of her own goal to improve the social sphere. However, her home's \"Jewish atmosphere\" widely influenced her as she was taught to \"pay it forward.\" Including and prior to this job, all of her endeavors were based on her own emotions and goals without the Albert's influence. 
In one of his letters, he notes \"it is you who have won, happy to have found a task that will fill your life, and you’ve done it ahead of me\", addressing her social work in Strasbourg's City Orphan Administration.\nOn October 1, 1909, Schweitzer \"enrolled as a student in the nursing school of the Protestant Deaconess' Society in Frankfurt in the city hospital\" to further her knowledge in the profession, thus beginning her nursing career.\nMissionary work.\nJourney with Albert Schweitzer.\nSchweitzer and Albert shared one main common goal: to help improve medicine and the greater good in Lambaréné, Gabon. At the very beginning of their journey, Schweitzer wrote in her diary that \"we are truly in love with Africa.\" In spring 1913, Schweitzer and Albert set off to establish a hospital (Albert Schweitzer Hospital) near an already existing mission post. The site was nearly 200 miles (14 days by raft) upstream from the mouth of the Ogooué at Port Gentil (Cape Lopez) (and so accessible to external communications) but downstream of most tributaries, so that internal communications within Gabon converged towards Lambaréné.\nThis journey to make medical improvements in Africa allowed Schweitzer to further develop herself. Patti Marxsen writes that Schweitzer's \"capacity for hard work in a challenging environment can be read as proof that her independence earned in Strasbourg was now unshakeable. For the now thirty-four-year-old Helene Schweitzer...a life in Africa offered a chance to integrate multiple aspects of modern identity, perhaps even more so than would have been possible in Europe.”\nSchweitzer had prior interest in nursing and the medical field before Albert became involved in medicine. Therefore, Schweitzer played a vital role in his work, acting as a possible influence. In the first nine months, Schweitzer and Albert had about 2,000 patients to examine, some travelling many days and hundreds of kilometers to reach him. 
In her time in Africa, she worked as nurse and helped with the hospital. She played an essential part in sanitation efforts, especially by preparing medical equipment for surgery. Schweitzer was an anaesthetist for surgical operations.\nChallenges.\nWhen World War I broke out in summer of 1914, the French military put Schweitzer and Albert, Germans in a French colony, under supervision at Lambaréné, where they continued their work. In 1917, exhausted by over four years' work and by tropical anaemia, they were taken to Bordeaux and interned first in Garaison and then from March 1918 in Saint-Rémy-de-Provence.\nMedical issues forced Schweitzer to leave Africa many times, and sometimes Albert kept her from returning at times. When Albert decided to return to Africa in 1924, he took on Oxford undergraduate, Noel Gillespie, as assistant, leaving Schweitzer behind. After the birth of their daughter (Rhena Schweitzer Miller), Schweitzer was no longer able to live in Lambaréné owing to her health. In 1923 the family moved to Königsfeld im Schwarzwald, Baden-Württemberg, where Albert was building a house for the family. This house is now maintained as a Schweitzer museum.\nHer not returning to Lambaréné was a sacrifice made \"by her husband, not for him.\" She wrote about her not returning, describing it as a \"practical matter\", but she \"never agreed to a separation of three and a half years\" from her husband. Despite her poor health, she still took care of her daughter, \"engage[d] herself with the Hospital Aid Association,\" and \"enroll[ed] in a three week course in tropical medicine at the Medical Missionary Institute of Tubingen, Germany.\" As a motherhood advocate, she gladly took care of her daughter and continued to develop her own personal skills. Schweitzer still remained engaged in helping the mission hospital.\nIn 1929, after receiving treatment for pneumonia, Schweitzer returned to Lambaréné to see her husband Albert’s progression with the new hospital. 
Shortly after arriving, however, she developed a bad fever and was forced to depart the hospital and her husband to return to Europe for treatment. After recovering, she used her writing skills and began to edit her husband's autobiography. Her English skills also opened the door for \"public speaking and networking in the United States.\" On December 1, 1930, a German newspaper printed one of her speeches. In it, she described her husband’s concept, the Fellowship of the Marks of Pain. She turned her medical challenges into positives, explaining that through her suffering she developed a compassionate view of their work that only she could personally attest.\nSchweitzer was aware that her husband would receive much of the acclaim for their missionary endeavors, so she set out to make her work known. In October 1946, she began to review her documents and collect them so that she would be understood as a \"full partner\" in their missionary work. In addition, she began lecture tours in the United States in 1937 to promote the Schweitzer Hospital.\nHealth complications.\nSchweitzer experienced tremendous health issues throughout her life, mostly in relation to the lungs. She first encountered tuberculosis before she turned ten. She was officially diagnosed in the spring of 1922 with laryngeal tuberculosis after exhibiting symptoms of \"pain, fever, and the coughing up of blood.\" In addition the heat of Africa caused many respiratory issues. In 1915, she contracted phlebitis resulting in two weeks of therapeutic bed rest. She also had pneumonia in 1929, almost keeping her from returning to Lambaréné. Despite her already weak lungs, she completed the trip though she had to return early due to illness again.\nSchweitzer died on June 1, 1957, and her remains are located in Lambaréné. Once Albert died, he was buried next to her. 
Schweitzer's grave with Albert is \"on the banks of the Ogooue River is marked by a cross he made himself.\"\nLegacy.\nSchweitzer contributed greatly to the work done in Lambaréné. A role model as an independent, educated woman with a deep intellectual curiosity, she was \"One of the first female students at the University of Strasbourg\" and \"One of the first female employees in the community administration\" at the orphanage. Her aid in the poor relief system, \"Armenpflegesystem,\" mirrored in modern social welfare, saw the illegitimate mortality rate fall. Setting precedence as a female medical missionary in the early 20th century, she established lasting effects of nursing and education in Lambaréné. She co-founded the Schweitzer Hospital, documented much of Albert's autobiography, and \"supported the [mission] work with lectures and fund-raising\" essential to its upkeep and vivacity.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695035","title":"Abu Dhabi Combat Club","body":"\nAbu Dhabi Combat Club\n\nThe Abu Dhabi Combat Club located in Abu Dhabi, United Arab Emirates (U.A.E.) is a martial arts club designed to promote martial arts in the U.A.E. The Abu Dhabi Combat Club is one of the top facilities for learning and training in mixed martial arts (MMA) in the Arab world. Its founder created the submission style (a type of \"grappling\" style) of martial arts and it hosted the first Abu Dhabi Combat Club Submission Fighting Championships in 1998. Many who have competed in the popular ADCC Submission Grappling Championship have gone on to have successful careers in MMA such as Ronaldo \"Jacare\" Souza and Vitor “Shaolin” Ribeiro and many others. Although the facility itself is used mainly by athletes and practitioners who reside in Abu Dhabi, many top level grapplers, fighters and BJJ specialists have been honored guests and had spent time training or teaching in the club. The Abu Dhabi Combat Club does not have its own fighters; it serves more as a platform where fighters can participate in training camps and take advantage of the large number of BJJ Black Belts who currently reside in Abu Dhabi. The facility where the ADCC was originally located is not owned by the UAE Wrestling, Judo and Kickboxing Federation, where classes are given in the same disciplines. However, the reputation of the ADCC is still strong and the facility is being visited by top fighters occasionally. \nThe first five Championships held under the patronage of H.H. Sheikh Tahnoon Bin Zayed Al Nahayan were hosted in that same facility in Abu Dhabi Equestrian Club compound. From 1998 until the 2002 the events were held annually in Abu Dhabi. 
Since 2002, the ADCC Submission Fighting Championship (renamed because of copyright on the word Grappling) has been held once every two years, and each event is hosted in a country where the sport is well developed, such as the US, Brazil and Japan.\nHistory.\nThe Abu Dhabi Fighting Club was created by U.A.E. national Sheik Tahnoon Bin Zayed Al Nahyan. While completing advanced studies in the United States of America, Sheik Tahnoon watched the first UFC fight and became a fan of MMA. The club was created out of an idle facility and world-class trainers were hired.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695084","title":"ESPN College Extra","body":"\nESPN College Extra\n\nESPN College Extra is an American out-of-market sports package. It was launched on August 28, 2015 as a merger of the existing ESPN Full Court and ESPN GamePlan, each of which offered college basketball and college football broadcasts respectively. \nAvailability.\nESPN College Extra is available with these cable and satellite providers:\nAlmost all ESPN College Extra broadcasts are also made available through ESPN3.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695112","title":"Adonay Alfaro Murcia","body":"\nAdonay Alfaro Murcia\n\nAdonay Alfaro Murcia is a former Costa Rican footballer who played in the USISL D-3 Pro League and the Canadian National Soccer League.\nPlaying career.\nMurcia moved to Canada in 1996 and played with Toronto Supra of the Canadian National Soccer League. He helped Supra finish third in the league standings and secure a postseason berth for the club. They were eliminated in the semi-finals, losing the series 2-1 on aggregate to the St. Catharines Wolves. In 1997, he moved abroad to the United States and signed with San Antonio Pumas of the USISL D-3 Pro League. During his tenure with San Antonio he helped the club reach the playoffs, before they were eliminated in the division finals by the Houston Hurricanes. After the 1997 season he retired from competitive football and enrolled at San Antonio College; he graduated with honors and is currently working in Web design.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695117","title":"BCDF Pictures","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48695138","title":"Streptomyces coelescens","body":"\nStreptomyces coelescens\n\nStreptomyces coelescens is a bacterium species from the genus of \"Streptomyces\". \"Streptomyces coelescens\" produces glycoglycerolipids.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695146","title":"Flood Mythology of China","body":"\nFlood Mythology of China\n\nThe Flood Mythology of China, or Great Flood of China (; also known as ) is a deluge theme which was happened in China. Derk Bodde (1961) stated that \"from all mythological themes in ancient Chinese, the earliest and so far most pervasive is about flood.\" The myth is also have shared characteristics with other Great Floods all over the world, although it also have unique characteristics or different focuses. Lu Yilu (2002) was grouping all versions of great flood into three themes: \"the heroes controls the flood; \"brother-sister marriage to repopulating the world\"; and \"the flood which is drowning the whole city along with its citizens\".\nHistory and mythology.\nLiterary history.\nThe history of China as a continuously recorded literary tradition begins with the ancient documents transmitted to posterity through the \"Records of the Grand Historian\". According to these, the great-grandson (or fourth successor) of the Yellow Emperor was Yao. Beginning with the reign of Yao, additional literary sources become available, including the \"Book of Documents\" (collected and edited by Confucius), which begins with the \"Canon of Yao\" (), describing the events of Yao's reign. Although, the \"Canon of Yao\" is problematic in regards to textual transmission (at best it seems to represent an early textual reconstruction and at worst a fabrication based on available knowledge or sources from the 3rd or 4th centuries CE). \"The Counsels of Great Yu\" 大禹謨 is considered to be one of the reliably transmitted pre-Qin texts. In any case, these and other texts of the preserved literature mark the beginnings of the Chinese historical tradition. 
Other important texts include the poem \"Heavenly Questions\" collected in the \"Chu Ci\" which is attributed to Qu Yuan and the famous mythological compendium \"Classic of Mountains and Seas\" (\"Shanhaijing\"). Furthermore, centuries of scholarship have gone into piecing together a narrative from the bits, pieces, and occasionally longer sections found in these and other early sources, sometimes being subjected to heavy editorial handling in terms of viewpoint.\nCollected mythology.\nMythological stories besides having been preserved both in various literary forms, have also been collected from various oral traditions, some of these folktales are still told. Some of these sources are from people of the Han ethnicity and some from other ethnic groups.\nThe struggles to control the flood.\nThe Zhou sources narrated the struggles of the heroes or deities to control the floods. From all of these stories, the struggle of Yao, Gun, and Yu is the most obvious in describing the hardness of human effort to control the flood. Much later works from the Warring States period (\"Shi Ben\") and \"Di wang shi ji\" (3rd century) were pairing Yu and Nuwa as a couple and their previously uncorrelated stories were then completing each other.\nGun-Yu Mythology.\nThis theme is based on the efforts of Great Yu (and Gun) to control the flood, sometimes is also associated with Emperor Yao and Shun, and the initial efforts of human to domesticated wild animals as pack animals and livestock. The theme outline narrates Gun stole xirang to stop the flood while Great Yu channeled the flood into the sea and succeeded to subsided the water level, and so the earth can be cultivated. There are so many mythologies which are correlated to this theme, one of which is \"Dragon Gate\" -a canal through the mountains which was dug by Yu. While he was digging the canal, many of the carps were swept away and fell, they were so disappointed because they couldn't swim back into the upper level. 
Yu promised them, if any of the carp could leap through his dam, it would transform into a dragon, thus the place inherited its name.\nGun-Yu theme is also have political background. Huainanzi stated that the great flood was caused by Gong Gong who was use the water to make havoc on the realm of Emperor Yao. Shan Hai Jing narrated another version that the flood was caused by Xiangliu, one of Gong Gong's minister, and was not Gong Gong himself.\nNuwa repaired the heaven.\nThe story was happened after Goddess Nüwa created (molded) humanity from yellow clay, brought them into life, and gave them the ability to reproduce. Gong Gong was banging his head into Mount Buzhou, which actually was the pillar to support the heaven. Nüwa then patched the sky with five-colored pebbles and piled up reeds ashes to stop the flood.\nThe extinction of human race.\nChen Jianxian (1996) said that this theme was one of some popular legends which was still being told by more than 40 ethnics in China. There is a possibility that the myth is rather new because the oldest recorded sources about this myth were from Six Dynasties, save that the oral tradition maybe much older.\nThe theme was made into several versions, but the outline is about a great flood which was destroyed all the humans all over the world except a pair of brother and sister, or aunt and nephew. Both were forced to married in order to repopulated the world. One version stated that their children were ordinary humans, while the others said it was a lump of meat, squash, melon, or grindstone; after they opened, cut, or destroyed it, humans emerged.\nSinking city.\nThis theme have some specific characteristics: one or two people were survived, the statue which was crying blood, and the whole city along with its citizens were sinking. The survivor(s) was being saved by the gods because of his/her benevolent acts; may be an old lady or a devoted son. 
The blood-crying statue was often a stone lion statue, or sometimes a tortoise statue.\nOther flood myths.\nEast Sea and Mulberry Field.\nA less widespread flood myth involves the goddess Magu: this myth involves the cyclic rise and fall of the ocean level over the eons: sometimes the sea floor is under water; at other times, it turns into mulberry fields. However, the material about Magu seems to be distinct from the idea of a great flood upon the land of China.\nOne tradition tells of Magu, a benevolent Taoist lady who lived in the second century. She reclaimed a very wide stretch of seashore in Kiangsu and turned it into mulberry fields.\nHeyu.\nShan Hai Jing mentions a pig-like creature with a human face, yellow-colored and red-tailed, whose call sounds like human singing. The creature is known as \"Heyu\"; it preys on humans, reptiles, and snakes. Its appearance is a sign that there will be a great deluge all over the world.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695172","title":"RCAF Overseas Headquarters","body":"\nRCAF Overseas Headquarters\n\nThe Royal Canadian Air Force Overseas Headquarters, often abbreviated to RCAF Overseas, was responsible for Canadian airmen serving outside Canada during and just after World War II. The headquarters was established on 1 January 1940 and it was based in London. Its main functions were to conduct liaison with the British Air Ministry, to provide a central location for personnel records, and provide general administration. As the War progressed, the Overseas Headquarters gained increasing administrative authority over Canadian personnel but never gained any significant operational responsibility for RCAF units and formations which were integrated into the RAF's command structure.\nSenior officers.\nThe following officers were in charge of the RCAF Overseas Headquarters:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695181","title":"List of female scientists in the 20th century","body":"\nList of female scientists in the 20th century\n\nThis is a \"historical\" list, intended to deal with the time period when women working in science were rare. For this reason, this list deals only with the 20th century. Some women who primarily worked in the 19th or 21st centuries may appear in a different list.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695201","title":"Eleanor Gladys Copenhaver","body":"\nEleanor Gladys Copenhaver\n\nEleanor Gladys Copenhaver (also known as Eleanor Copenhaver Anderson) (1896-1985) was a social worker and activist who spent over 40 years as an organizer and community service worker for the YWCA. She began as a community organizer and worked her way up to the labor division, finally becoming head of the Industrial Division from 1937 to 1947. At the end of World War II, when women were phased out of the labor market, she was briefly dismissed, but then hired back to organize support for the communities springing up around the defense industry. \nBiography.\nEleanor Gladys Copenhaver was born on June 15, 1896 in Marion, Virginia to Laura Lu (née Scherer) and Bascom Eugene Copenhaver. Both of Copenhaver's parents taught at the school her grandfather Scherer had founded, Marion Female College. She spent her childhood at the family home, \"Rosemont\", which also housed Rosemont Industries, an organization established by her mother, which marketed local handicrafts. After completing her primary education at the public schools of Marion, Copenhaver began her university studies at Marion College before she transferred in 1914 to Westhampton College in Richmond, Virginia. She completed her B.A. in English in 1917 and returned that same year to Marion to teach. In 1918, she enrolled in social work classes at Bryn Mawr College in Pennsylvania and in 1919 worked in a settlement camp for New York City women during the summer. She completed her degree in 1920 earning a certificate in social economy.\nCareer.\nIn September 1920, Copenhaver became a Field Secretary on the national staff of the YWCA covering the south and central region. From 1920 to 1923 she was a rural community organizer. 
In addition to introducing the programs of the YWCA to local communities and churches, Copenhaver participated in seminars and retreats like one held in 1922, which explored the tenets of internationalism that had sprung up after the first World War. The YWCA believed that if women used their moral and professional authority, they would reshape the world. Copenhaver participated in the \"Conference at the Lake\" and after their presentation on relationships with Syrian and Japanese women, and the Bible study, she directed a play, which she had written with her mother. The basic theme was modernity and the enlightenment of women who could draw upon the past, their spirituality and their ability to work and use their intelligence. In 1923 she switched to industrial community activism then in 1925 became the National Industrial Secretary working out of New York. Her political beliefs became increasingly radical during her many visits to factories to counsel and organize working women. During one of these visits in 1928, she made a side trip to her family and met the writer Sherwood Anderson. Coperhaver returned to New York and enrolled in a master's program at Columbia University. She completed the degree in political economy in 1933 and later that same year, married Anderson.\nCoperhaver-Anderson continued working as a labor organizer. In 1937, she was promoted to head the Industrial Programs of the YWCA. Her work entailed investigating working and educational conditions, submitting reports for action and providing support for labor unions. She continued to travel with her job and the couple also traveled to visit Sherwood's artist and writer friends all over the world. On one of these trips, taken in 1941 after the death of her mother, the couple were in route to Valparaiso, Chile aboard the \"SS Santa Lucia\". Sherwood became ill with peritonitis, the couple disembarked, but he died at a hospital in Colón, Panama. 
After bringing him back to Virginia for burial, Anderson returned to work. She continued as the executive of the Y's industrial division and resumed her travels, going across the country, until the Industrial Department was phased out soon after the end of World War II. When that happened, in 1947, Anderson took a two-year assignment with the international YWCA in Italy to help with relief efforts. At the end of her assignment, she returned from Italy and was terminated by the Y due to their elimination of women's employment programs. She spent most of 1950 organizing Sherwood's papers and preparing them for donation to the Newberry Library in Chicago. The following year, she was rehired by the YWCA working on their United Community Defense Services, which was a program aimed at providing \"health, welfare, and recreation services\" to communities supporting the defense industry. She remained with the YWCA until her retirement in 1961.\nAfter her retirement, she served as Sherwood's literary executor as well as the overseer of his property at \"Ripshin\" and her mother's legacy at \"Rosemont\". Anderson died on September 12, 1985 in Marion, Virginia. Copenhaver's papers are located at Smith College in Northampton, Massachusetts. Many of the records can be found on-line as part of the \"Five College Finding Aids Access Project\", which was funded by the Andrew W. Mellon Foundation.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695217","title":"Perspective-n-Point","body":"\nPerspective-n-Point\n\nPerspective-\"n\"-Point is the problem of estimating the pose of a calibrated camera given a set of 3D points in the world and their corresponding 2D projections in the image. The camera pose consists of 6 degrees-of-freedom (DOF) which are made up of the rotation (roll, pitch, and yaw) and 3D translation of the camera with respect to the world. This problem originates from camera calibration and has many applications in computer vision and other areas, including 3D pose estimation, robotics and augmented reality. A commonly used solution to the problem exists for called P3P, and many solutions are available for the general case of . Implementations of these solutions are also available in open source software.\nProblem Specification.\nDefinition.\nGiven a set of 3D points in a world reference frame and their corresponding 2D image projections as well as the calibrated intrinsic camera parameters, determine the 6 DOF pose of the camera in the form of its rotation and translation with respect to the world. This follows the perspective project model for cameras:\nwhere formula_2 is the homogeneous world point, formula_3 is the corresponding homogeneous image point, formula_4 is the matrix of intrinsic camera parameters, (where formula_5 and formula_6 are the scaled focal lengths, formula_7 is the skew parameter which is sometimes assumed to be 0, and formula_8 is the principal point), formula_9 is a scale factor for the image point, and formula_10 and formula_11 are the desired 3D rotation and 3D translation of the camera (extrinsic parameters) that are being calculated. This leads to the following equation for the model:\nAssumptions and Data Characteristics.\nThere are a few preliminary aspects of the problem that are common to all solutions of P\"n\"P. The assumption made in most solutions is that the camera is already calibrated. 
Thus, its intrinsic properties are already known, such as the focal length, principal image point, skew parameter, and other parameters. Some methods, such as UP\"n\"P. or the Direct Linear Transform (DLT) applied to the projection model, are exceptions to this assumption as they estimate these intrinsic parameters as well as the extrinsic parameters which make up the pose of the camera that the original P\"n\"P problem is trying to find.\nFor each solution to PnP, the chosen point correspondences cannot be coplanar. In addition, P\"n\"P can have multiple solutions, and choosing a particular solution would require post-processing of the solution set. Furthermore, using more point correspondences can reduce the impact of noisy data when solving P\"n\"P. RANSAC is also commonly used with a P\"n\"P method to make the solution robust to outliers in the set of point correspondences. Most methods, however, assume that the data is noise-free.\nMethods.\nThis following section describes two common methods that can be used to solve the P\"n\"P problem that are also readily available in open source software and how RANSAC can be used to deal with outliers in the data set.\nP3P.\nWhen , the P\"n\"P problem is in its minimal form of P3P and can be solved with three point correspondences. However, with just three point correspondences, P3P yields many solutions, so a fourth correspondence is used in practice to remove ambiguity. The setup for the problem is as follows.\nLet \"P\" be the center of projection for the camera, \"A\", \"B\", and \"C\" be 3D world points with corresponding images points \"u\", \"v\", and \"w\". Let \"X = |PA|\", \"Y = |PB|\", \"Z = |PC|\", formula_13, formula_14, formula_15, formula_16, formula_17, formula_18, formula_19, formula_20, formula_21. This forms triangles \"PBC\", \"PAC\", and \"PAB\" from which we obtain the equation system for P3P:\nIt's common to normalize the image points before solving P3P. 
Solving the P3P system results in four possible solutions for and . The fourth world point \"D\" and its corresponding image point \"z\"are then used to to find the best solution among the four. The algorithm for solving the problem as well as the complete solution classification for it is given in the 2003 \"IEEE\" Transactions on Pattern Analysis and Machine Intelligence paper by Gao, et. al. An open source implementation of the P3P can be found in OpenCV's \"calib3d\" module in the \"solvePnP\" function.\nEP\"n\"P.\nEfficient P\"n\"P (EP\"n\"P) is a method developed by Lepetit, et. al in their 2008 International Journal of Computer Vision paper that solves the general problem of P\"n\"P for . This method is based on the notion that each of the \"n\" points (which are called reference points) can be expressed as a weighted sum of four virtual control points. Thus, the coordinates of these control points become the unknowns of the problem. It is from these control points that the final pose of the camera is solved for.\nAs an overview of the process, first note that each of the reference points in the world frame, formula_23, and their corresponding image points, formula_24, are weighted sums of the four controls points, formula_25 and formula_26 respectively, and the weights are normalized per reference point as shown below. All points are expressed in homogeneous form.\nFrom this, the derivation of the image reference points becomes\nThe homogeneous image control point has the form formula_31. Rearranging the image reference point equation yields the following two linear equations for each reference point:\nUsing these two equations for each of the reference points, the system formula_34 can be formed where formula_35. The solution for the control points exists in the null space of and is expressed as \nwhere formula_37 is the number of null singular values in formula_38 and each formula_39 is the corresponding right singular vector of formula_38. 
formula_37 can range from 1 to 4. After calculating the initial coefficients formula_42, the Gauss-Newton algorithm is used to refine them. The and matrices that minimize the reprojection error of the world reference points, formula_23, and their corresponding actual image points formula_24, are then calculated.\nThis solution has formula_45 complexity and works in the general case of P\"n\"P for both planar and non-planar control points. Open source software implementations of this method can be found in OpenCV's Camera Calibration and 3D Reconstruction module in the \"solvePnP\" function as well as from the code published by Lepetit, et. al at their website, .\nUsing RANSAC.\nP\"n\"P is prone to errors if there are outliers in the set of point correspondences. Thus, RANSAC can be used in conjunction with existing solutions to make the final solution for the camera pose more robust to outliers. An open source implementation of P\"n\"P methods with RANSAC can be found in OpenCV's Camera Calibration and 3D Reconstruction module in the \"solvePnPRansac\" function\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695224","title":"2009 Monte Paschi Strade Bianche - Eroica Toscana","body":"\n2009 Monte Paschi Strade Bianche - Eroica Toscana\n\nThe 2009 Monte Paschi Strade Bianche - Eroica Toscana was the third edition of the Strade Bianche road bicycle race, held on 7 March 2009 in Tuscany, Italy. The race was 190 km, starting in Gaiole in Chianti and finishing in Siena, and included eight sectors of \"strade bianche\", totaling 57,2 km of gravel road. Compared to the previous edition of the Strade Bianche, the race was 10 km longer and featured one more sector of \"sterrato\".\nSwedish rider Thomas Lövkvist won the race ahead of German Fabian Wegmann and Swiss Martin Elmiger. Linus Gerdemann attacked five kilometres from the finish, but faded on the steep climb to the centre of Siena and was caught and passed by a chase group. Thomas Lövkvist powered up the cobbled street and was the first to enter the Piazza del Campo and crossed the line 4 seconds ahead of Wegmann and Elmiger. Edvald Boasson Hagen was fourth at eight seconds.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695226","title":"On the Waves of Happiness","body":"\nOn the Waves of Happiness\n\nOn the Waves of Happiness (Romanian:Pe valurile fericirii) is a 1920 Romanian silent film directed by Dolly A. Szigethy and starring Lya De Putti, Maria Filotti and Ian Manolescu.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695244","title":"Ooho","body":"\nOoho\n\nOoho may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695248","title":"Batang Pinoy","body":"\nBatang Pinoy\n\nThe Philippine Youth Games – Batang Pinoy or simply Batang Pinoy (lit. Filipino Youth) is the national youth sports competition of the Philippines for athletes under 15 years old. Unlike the Palarong Pambansa, a competition for student athletes, the Batang Pinoy also includes the out-of-school youth.\nHistory.\nThe Batang Pinoy was established through Executive Order No. 44 which was signed by then President Joseph Estrada on December 2, 1988. The first edition was held in Bacolod in 1999. From then, the games were held annually with Santa Cruz, Laguna (2000), Bacolod (2001) and Puerto Princesa (2002) hosting the next three editions. The 2002 and prior editions were for athletes of 12 years and below.\nIn 2003, the Philippine Sports Commission decided to put the competition, along with its other national competitions, on hold so the sports body could reallocate funds to the national teams' stint at the Southeast Asian Games. The Batang Pinoy was held again in 2011, and has been held annually since then.\nEditions.\nHost of the Batang Pinoy National Championships.\n(*) Hosting of the original 2013 edition was postponed to early 2014. A second Batang Pinoy was hosted in the same year.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695256","title":"Streptomyces coelicoflavus","body":"\nStreptomyces coelicoflavus\n\nStreptomyces coelicoflavus is a bacterium species from the genus of \"Streptomyces\". \"Streptomyces coelicoflavus\" produces acarviosin-containing oligosaccharides.\nReferences.\n \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695271","title":"Soldiers of the Emperor","body":"\nSoldiers of the Emperor\n\nSoldiers of the Emperor (Hungarian:A Császár katonái) is a 1918 Hungarian silent film directed by Béla Balogh and starring Lya De Putti, Sándor Virányi and Aladár Ihász.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695290","title":"Promoter activity","body":"\nPromoter activity\n\nPromoter activity is a term that encompasses several meanings around the process of gene expression from regulatory sequences —promoters and enhancers. Gene expression has been commonly characterized as a measure of how much, how fast, when and where this process happens. Promoters and enhancers are required for controlling where and when an specific genes is transcribed.\nTraditionally the measure of gene products (i.e. mRNA, proteins, etc.) has been the major approach of measure promoter activity. However, this method confront with two issues: the stochastic nature of the gene expression and the lack of mechanistic interpretation of the thermodynamical process involve in the promoter activation.\nThe actual developments in metabolomics product of developments of next-generation sequencing technologies and molecular structural analysis have enable the development of more accurate models of the process of promoter activation (e.g. the sigma structure of the polymerase holoenzyme domains) and a better understanding of the complexities of the regulatory factors involved.\nPromoter binding.\nThe process of binding is central in determining the \"strength\" of promoters, that is the relative estimation of how \"well\" a promoter perform the expression of a gene under specific circumstances. Brewster et al., using a simple thermodynamical model based on the postulate that transcriptional activity is proportional to the probability of finding the RNA polymerase bound at the promoter, obtained predictions of the scaling of the RNA polymerase binding energy. 
This models support the relationship between the probability of binding and the output of gene expression\nMathematical representation of promoter binding.\nThe problem of gene regulation could be represented mathematically as the probability of n molecules — RNAP, activators, repressors and inducers — are bound to a target regions.\nTo compute the probability of bound, it is needed to sum the Boltzman weights over all possible states of formula_1 polymerase molecules\non DNA. Here in this deduction formula_1 is the effective number of RNAP molecules available for binding to the promoter.\nThis approach is based in statistical thermodynamics of two possible microscopic outcomes: \nThe statistical weigh of promoter unoccupied \"Z(P)\" is defined:\nformula_3\nWhere the first term is the combinatorial result of taken formula_1 polymerase of formula_5 non-specific sites available, and the second term are the boltzmann weights, where formula_6 is the energy that represents the average binding energy of RNA polymerase to the genomic background (non-specific sites).\nThen, the total statistical weight formula_7, can be written as the sum of the formula_8 state and the RNA polymerase on promoter state:\nformula_9\nWhere formula_10 in the formula_11 state is the binding energy for RNA polymerase on the promoter (where the s stands for specific site).\nFinally, to find the probability of a RNA polymerase to binding (formula_12 ) to an specific promoter, we divide formula_13 by formula_14 which produces:\nformula_15\nWhere, formula_16\nAn important result of this model is that any transcription factor, regulator or perturbation could be introduced as a term multiplying formula_1 in the probability of binding equation. 
This term for any transcriptional factor (here called factor regulators) modify the probability of binding to:\nformula_18\nWhere formula_19 is the term for transcriptional factors, and it has the value of formula_20 for increase of formula_21 for decrease of the number of RNA polymerase available to bind.\nThis result has an important significance to represent mathematically all the possible configurations of transcriptional factor by derive different models to estimate formula_19 (for further developments, see also ).\nEukaryotes promoter structure.\nThe process of activation and binding in eukaryotes is different from bacteria in the way that specific DNA elements bind the factors for a functional pre-initiation complex. In bacteria there is a single polymerase, that contain catalytic subunits and a single regulatory subunits known as sigma, which transcribe for different type of genes.\nIn eukaryotes, the transcription is performed by three different RNA polymerase, RNA pol I for ribosomal RNAs (rRNAs), RNA polymerase II for messenger RNAs (mRNAs) and some small regulatory RNAs, and the RNA polymeerase III for small RNAs such as transfer RNAs (tRNAs). The process of positioning of the RNA polymerase II and the transcriptional machinery require the recognition of a region know as \"core promoter\". The elements that could be found in the core promoter include the TATA element, the TFIIB recognition element (BRE), the initiatior (Inr), and the downstream core promoter element (DPE). Promoters in eukaryotes contain one or more of these core promotes elements (but any of them are absolutely essential for promoter function), these elements are binding sites for subunits of the transcriptional machinery and are involve in the initiation of the transcription, but also they have some specific enhancer functions. 
In addition, the promoter activity in eukaryotes include some complexities in the way of how they integrate signals from distal factors with the core promoter.\nEvolutionary processes.\nUnlike in protein coding regions, where the assumption of sequence conservation of functionally homologous genes have been frequently proved, there is no a clear relationship of conservation between sequences and their functions for regulatory regions. The transcriptional promoters regions are under less stringent selection, then have a higher substitutions rates, allowing transcription factor binding sites to be replaced easily be new ones arising from random mutations. Notwithstanding the sequence changes, mainly the functions of regulatory sequences remain conserved.\nIn recents years with the increase of availability of genome sequences, phylogenetic footprinting open the possibitlity to identify cis-elements, and then study their evolution processes. In this sense, Raijman et al., Dermitzakis et al. have developed techniques for analyzing evolutionary processes in transcription factor regions in Saccharomyces species promoters and mammalian regualatory networks respectively.\nThe basis for many of these evolutionary changes in nature are probably related with events within the cis-regulatory regions involve in gene expression. The impact of variation in regulatory regions is important for disease risk due their impact in the gene expression level. Furthermore, perturbations in the binding properties of proteins encoded by regulatory genes have been linked with phenotypes effects such as, duplicated structures, homeotic transformations and novel morphologies.\nMeasure of promoter activity.\nThe measure of the promoter activity has a broad meaning. The promoter activity could be measured for different situations or research questions, such as:\nMethods to study promoter activity commonly are based in the expression of a reporter gene from the promoter of the gene of interest. 
Mutations and deletions are made in a promoter region, and their changes on couple expression of the reporter gene are measured.\nThe most important reporter genes are the fluorescence proteins as GFP. These reporters allow to measure promoter activation by increasing fluorescent signals, and deactivation by decrease in the rate of fluorescence.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695349","title":"Gypsy Blood (1920 film)","body":"\nGypsy Blood (1920 film)\n\nGypsy Blood (German:Zigeunerblut) is a 1920 German silent film directed by Karl Otto Krause and starring Lya De Putti, Carl Fenz and Paul Hansen. It is based on Georges Bizet's \"Carmen\" and should not be confused with the 1918 German silent \"Carmen\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695353","title":"Carlton E. Lemke","body":"\nCarlton E. Lemke\n\nCarlton Edward Lemke (October 11, 1920 - April 12, 2004) was an American mathematician.\nLemke received his bachelor's degree in 1949 at the University of Buffalo and his PhD (Extremal problem in Linear Inequalities) in 1953 at Carnegie Mellon University (then Carnegie Institute of Technology). In 1952-1954 he was an instructor at the Carnegie Institute of Technology and in 1954-55 at the Knolls Atomic Power Laboratory of General Electric. In 1955-56 he was an engineer at the Radio Corporation of America in New Jersey. From 1956 he was assistant professor and later professor at the Rensselaer Polytechnic Institute. From 1967, he was the Ford Foundation Professor of Mathematics there.\nHis research was in Algebra, Mathematical Programming, Operations Research, and Statistics. In 1954 Lemke developed the dual simplex method, independently from E. M. L. Beale.\nHe is also known for his contribution to game theory. In 1964 Lemke (with J. T. Howson) constructed an algorithm for finding Nash equilibria in the case of finite two-person games. For this work Lemke received in 1978 the John von Neumann Theory Prize.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695355","title":"Iron Mountain Trail","body":"\nIron Mountain Trail\n\nIron Mountain Trail is a 1953 American Western film directed by William Witney and written by Gerald Geraghty. The film stars Rex Allen, Slim Pickens, Grant Withers, Nan Leslie, Roy Barcroft and Forrest Taylor. The film was released on May 8, 1953, by Republic Pictures.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695356","title":"Talwandi Nepalan","body":"\nTalwandi Nepalan\n\nTalwandi Nepalan is a village in the Firozpur district of Punjab, India. It is located in the Zira tehsil.\nDemographics.\nAccording to the 2011 census of India, Talwandi Nepalan has 526 households. The effective literacy rate (i.e. the literacy rate of population excluding children aged 6 and below) is 68.69%.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695360","title":"Rasulpur, Zira","body":"\nRasulpur, Zira\n\nRasulpur is a village in the Firozpur district of Punjab, India. It is located in the Zira tehsil.\nDemographics.\nAccording to the 2011 census of India, Rasulpur has 329 households. The effective literacy rate (i.e. the literacy rate of population excluding children aged 6 and below) is 66.22%.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695365","title":"Sudan, Zira","body":"\nSudan, Zira\n\nSudan is a village in the Firozpur district of Punjab, India. It is located in the Zira tehsil.\nDemographics.\nAccording to the 2011 census of India, Sudan has 289 households. The effective literacy rate (i.e. the literacy rate of population excluding children aged 6 and below) is 62.14%.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48695372","title":"Charles Dundas Lawrie","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48121074","title":"Paul Wittek","body":"\nPaul Wittek\n\nPaul Wittek (11 January 1894, Baden bei Wien — 13 June 1978, Eastcote, Middlesex) was an Orientalist and historian from Austria. His 1938 thesis on the rise of the Ottoman Empire, known as the Ghazi thesis, argues that the Ottoman's \"raison d'être\" was the expansion of Islam. During the 1980s, his theory was the most influential and dominant explanation of the formation of the Ottoman Empire.\nBiography.\nWittek was conscripted at the outbreak of World War I as a reserve officer to an artillery regiment. In October 1914, he suffered a head wound in Galicia and was taken to Vienna to recover. Subsequently, he served first on the Isonzo and in 1917 was drafted as a military adviser to the Ottoman Empire, where he was stationed in Istanbul and Syria until the war ended. During this time Wittek learned Ottoman Turkish and acquired the patronage of Johann Heinrich Mordtmann, the former German consul in Istanbul. After the war ended, Wittek returned to Vienna and continued his studies of ancient history, which he had already begun before the war. In 1920 he obtained his doctorate with a study of the oldest Roman social and constitutional history.\nWittek was in Vienna at the emergence of the fledgling discipline of Ottoman studies. He was co-editor and author of the first scholarly journal in this field called \"Messages to Ottoman history\", which was published from 1921 till 1926. For his livelihood Wittek worked as a journalist for the Austrian Rundschau. From 1924, he worked for the German Archaeological Institute, where he focused on the early Ottoman epigraphy. Together with Turkish historians, he managed to prevent the sale of the Ottoman archives to Bulgaria as scrap paper.\nAfter the rise of Nazism in 1934 Wittek moved to Belgium, where he worked at the Institute for Byzantine Studies in Brussels with Henri Gregoire. 
After the German attack on Belgium Wittek fled in a small boat to England, where he was interned as an enemy alien. With the support of British Orientalists he was finally released and found a job at the University of London. After the war he returned to his family, who had remained in Belgium. In 1948 he returned to London and took over the newly created Chair of Turkish at the School of Oriental and African Studies (SOAS), where he remained until his retirement in 1961.\nWittek, who was close to the George circle, published little, but became very influential in his discipline. His only books, \"The Principality Menteşe\" and \"The Rise of the Ottoman Empire\" appeared in the 1930s. In the latter Wittek formulated his Ghazi thesis, according to which the ideology of sectarian struggle was the major cohesive factor in the formative phase of the Ottoman Empire. Until Rudi Paul Lindner's nomad thesis in the 1980s, the Ghazi thesis was the prevailing view of the emergence of the Ottoman Empire.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48121075","title":"Glencoe Museum","body":"\nGlencoe Museum\n\nGlencoe Museum is located in a Victorian house in west downtown Radford, Virginia. The house was built in 1870 in the 19th century Victorian style, specifically Second Empire, and was the postbellum home of Confederate Brigadier General Gabriel C. Wharton. It is a large, two-story, five bay, brick dwelling, and originally had quite extensive grounds. The original house had a barn, chicken coop, smoke house, and an ice house.\nThe name Glencoe is thought to be inspired by Anne Wharton’s ancestry. Her family was originally from Scotland. The house didn’t appear on Radford’s tax records until 1876; it took a very long time to build a house of its size and grandeur in the 1800s. The house was kept in the family till 1996 when, after being deserted for 30 years, the house was given to the city of Radford. The house and grounds were donated by the Kollmorgen Motion Technology Group.\nThe house features some Victorian period rooms and displays about Radford's history, including Native American artifacts, early settlers, Mary Draper Ingles, local industries, railroads, river transportation, educational institutions and local sports. There is also an art gallery with changing exhibits of the art and works of contemporary Appalachian artists.\nGlencoe was listed on the National Register of Historic Places in 2000.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48121100","title":"Garshom Awards","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48121116","title":"Fred Kohler, Jr.","body":"\nFred Kohler, Jr.\n\nFred Kohler, Jr. was an American actor who performed in a number of Westerns such as \"The Pecos Kid\" and \"Toll of the Desert\".\nKohler's father was actor Fred Kohler.\nKohler and his father appeared twice in the same film. In RKO's \"Lawless Valley\", they played outlaws who were father and son and in one scene, Fred Kohler, Jr. says to his father's character \"Aw, that's crazy!,\" and Fred Sr. responds \"Careful, son, you're talkin' to your dad, ya know!\" \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48121142","title":"Else Kastner-Michalitschke","body":"\nElse Kastner-Michalitschke\n\nElse Kastner-Michalitschke (28 April 1868 – 2 January 1939) was an Austrian writer.\nShe was born in Rokytnice v Orlických horách, in what was then Austria-Hungary and today the Czech Republic. She studied to become a teacher in Prague and lived in Vienna from 1892. She was married to Eduard Fedor Kastner, and later to Carl B. Braum. She was co-founder of the literary magazine \"Böhmens deutsche Poesie und Kunst\" and contributed to the magazine \"Wir leben\". She also published several collections of poetry. She received numerous awards in recognition of her artistic accomplishments.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48121143","title":"Rabiya Javeri Agha","body":"\nRabiya Javeri Agha\n\nRabiya Javeri Agha (born Rabiya Adila Javeri on December 2, 1963) is a Grade 21 Officer of the Pakistan Administrative Service. One of the most senior women in the civil service, she joined the Government of Pakistan in 1985. She is currently posted as Secretary Trade Development Authority of Pakistan.\nEarly life.\nRabiya is the daughter of well known jeweller Hasan Javeri of Jamnagar State and Ayesha Rafique Javeri (Family of Sir Syed Ahmed Khan, Allahbad). She is also the sister of well known photographer Tapu Javeri and artist Zehra Laila Javeri. Her education was at Convent of Jesus and Mary and Karachi Grammar School. She graduated in Politics and Literature from Mount Holyoke College. She is married to senior civil servant Agha Jan Akhtar, Chairman Port Qasim Authority.\nCareer.\nBefore joining the bureaucracy, Rabiya Javeri Agha worked as a journalist for the Dawn newspaper. She has written over 300 articles on social, political and cultural issues. She has also authored and published research papers on Sufism and on the Afghan political and refugee crisis.\nHer duties with the Trade Authority include marketing Pakistan's potential as a trade and cultural partner. She travels throughout Pakistan and Europe to promote goods, like textiles and fashion, as well as the resources Pakistan has available.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48121161","title":"Lagos by-election, 1945","body":"\nLagos by-election, 1945\n\nA by-election was held for the Lagos seat in the Legislative Council of Nigeria in December 1945 to replace Jibril Martin of the Nigerian Youth Movement (NYM). It was won by Abubakar Olorun-Nimbe of the Nigerian National Democratic Party (NNDP).\nCampaign.\nThe NNDP and the Nigerian Union of Young Democrats put forward Olorun-Nimbe, vice president of the NNDP, as a joint candidate. A doctor, he had studied medicine at the University of Glasgow and ran a private practice in Lagos. He was well-known in the town due to his role as a member of Lagos Town Council. His opponent was Oluwole Ayodele Alakija of the NYM. Alakija was a barrister who had studied at Jesus College, Oxford and was vice-president of the party's Port Harcourt branch.\nDespite the NYM's success in the 1938 general elections, when it had won all three seats in Lagos, its popularity in the town had diminished, partly due to the internal splits caused by the row over the party's candidate for the 1941 by-election. Separately, the alliance of the NNDP with the new National Council of Nigeria and the Cameroons had restored some of its credibility.\nThe \"West African Pilot\" called on voters to vote for a \"seriously active Moslem\", noting the fact that Olorun-Nimbe had twice been to Mecca and that he was a \"practical politician with experience\". Despite not being a Muslim, Alakija was supported by Chief Imam Y. P. O. Shodeinde.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48121167","title":"Melville Amasa Scovell","body":"\nMelville Amasa Scovell\n\nMelville Amasa Scovell (February 26, 1855 – August 15, 1912) was an American academic from New Jersey. Moving with his family to Champaign, Illinois early in his life, he attended the University of Illinois there, graduating in 1875. He worked at the school for the next seven years, until he was dismissed over a conduct violation. In 1885, he became director of the Kentucky Agricultural Experiment Station at the University of Kentucky. Scovell was named dean of the College of Agriculture, Food, and Environment there shortly before his death.\nBiography.\nMelville Amasa Scovell was born February 26, 1855, in Belvidere, New Jersey. Shortly after his birth, his family moved to Jasper County, Illinois. They later moved to Champaign, where his father worked as a principal. Scovell enrolled at the University of Illinois in 1871, studying chemistry. He graduated in 1875 and became an instructor there. From 1876 to 1877, he served as the secretary to university president John Milton Gregory.\nScovell was named an assistant professor of chemistry in 1877, receiving a Master of science the next year. He was made professor of agricultural chemistry in 1880. He co-founded a method of clarifying cane sugar juice, but was forced to leave the university in 1882 because professors were expected to abstain from profiting from their research. Scovell founded a sugar factory in Champaign, but it was short-lived. He also worked as a special agent of the US Department of Agriculture following his dismissal.\nIn 1885, Scovell accepted a position at the Kentucky Agricultural Experiment Station at the University of Kentucky in Lexington, a position he held until his death. There, he promoted agriculture in Kentucky, with a focus on Jersey cattle. James Ben Ali Haggin commissioned Scovell to purchase cattle for his Elmendorf Farm. 
In 1893, Scovell was chairman of the dairy test at the World's Columbian Exposition in Chicago. He was awarded a Ph.D. by the University of Illinois in 1909. In 1911, Scovell was named dean of the University of Kentucky College of Agriculture, Food, and Environment.\nScovell died at his Lexington home from endocarditis on August 15, 1912. He married Nancy Davis, a member of his university class, in 1880; they had no children. Scovell served terms as president of the American Association of Agricultural Colleges and Experiment Stations and the Association of Official Agricultural Chemists. He was also a member of the Fair Committee of the Kentucky State Fair from 1907, when it moved to Louisville, until his death. He was a member of the Society of Chemical Industry and the American Chemical Society. He is the namesake of Scovell Hall at the University of Kentucky.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48121178","title":"Karen Mullins","body":"\nKaren Mullins\n\nKaren Mullins is an American college softball coach, most recently the long-time head coach of the Connecticut Huskies softball team. She served in that role from 1984 to 2014. She announced her retirement on May 19, 2014.\nPlaying career.\nMullins played four years of basketball at Connecticut and also two years of softball. Connecticut was just beginning to establish women's sports during her time as a student in Storrs. \nCoaching career.\nAfter completing a master's in sport management at UConn, Mullins became head coach at Nichols College in Massachusetts. She led the team for two seasons, compiling a 10–10 record before moving to E. O. Smith High School as a basketball coach. In 1984, she returned to UConn as head softball coach. Mullins would remain at UConn for thirty one seasons, leading the Huskies to 10 top 2 finishes in the NCAA Northeast rankings, eight appearances in the NCAA Division I Softball Championship, a Women's College World Series berth in 1993, six Big East Conference regular season and seven Big East Conference Softball Tournament championships, and an overall record of 862–626–5. Over 96 percent of her players graduated, nine earned All-American honors, six were named academic All-Americans, and her players earned Big East Player or Pitcher of the Year awards 11 times. She retired as one of the top 50 all-time coaches in career wins. Mullins was one of the longest-tenured coaches at UConn, although many coaches also had remained in Storrs for multiple decades.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48121201","title":"SAFRA National Service Association","body":"\nSAFRA National Service Association\n\nSAFRA National Service Association is an organisation that was formed as a recreation club for servicemen from the Singapore Armed Forces. This was also how SAFRA got its name: \"Singapore Armed Forces Recreation Association\".\nHistory.\nSAFRA was started on 2 July 1972 and was launched by, then Defense Minister of Singapore, Dr Goh Keng Swee.\nMission.\nThe SAFRA Mission\n\"To be a dynamic institution effective in bonding NSmen through a network of quality lifestyle clubs, services and activities. We shall be reputed for our good value and innovation.\"\nThis was to reward servicemen for their service to the nation with some relaxation from their hectic lives.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48121270","title":"Sadolin Sports Hall","body":"\nSadolin Sports Hall\n\nThe Sadolin Sports Hall () is a multi-purpose indoor arena complex in Rapla. It was opened in 2010 and is the current home arena of the Estonian Basketball League team Rapla KK. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48121350","title":"Sanguantang Station","body":"\nSanguantang Station\n\nSanguantang Station is an elevated metro station of Line 2 in Ningbo, Zhejiang, China. It is situated to the west of the intersection of Ningzhen Road and Minghai Avenue. Construction of the station started in mid-2012, and it opened for service on September 26, 2015. In the construction plan of Ningbo Rail Transit, Sanguantang Station will be a transfer station between Line 2 and Line 5.\nExits.\nSanguantang Station has 2 exits.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48121402","title":"Phi Kappa Pi","body":"\nPhi Kappa Pi\n\nPhi Kappa Pi (ΦΚΠ) is a Canadian National Fraternity. Founded on March 22, 1913 as Canada's Only National Fraternity, Phi Kappa Pi has active chapters in Burnaby, Halifax, Toronto, and Montreal, as well as 6 inactive chapters. There are alumni chapters associated with most locations, as well as a National Council.\nHistory.\nPhi Kappa Pi Fraternity was founded in 1913, by two previously existing and separate organizations. Sigma Pi, founded in Toronto in 1901 and Alpha Beta Gamma, founded in Montreal in 1905, joined forces to create Canada's first and only national fraternity. The individual organizations' names would then become chapter names.\nIn 1923, alumni from the Alpha Beta Gamma chapter approached the Phi Kappa Pi National Council about the possibility of expanding to Dalhousie University in Halifax, Nova Scotia. The expansion request was approved and a chapter was founded. The chapter was the first fraternity to locate to Dalhousie's campus, and was named the Dalhousie chapter, until 1959 when it received it's Greek name, Zeta Gamma. The following year, 1924, Alpha Iota was founded at the University of British Columbia, followed by Delta Mu in 1930 at the University of Alberta, Tau Sigma Rho in 1935 at the University of Manitoba, and Alpha Epsilon in 1967 at the University of Waterloo.\nThe 1970s proved to be a tough decade for Phi Kappa Pi, with 4 chapters being lost. Alpha Iota and Alpha Epsilon both closed down in 1974, followed by Tau Sigma Rho in 1975, and one of the founding chapters, Alpha Beta Gamma in 1976. Alpha Beta Gamma, however, would be reopened in 1990 with the help of alumni from Phi Kappa Pi's then remaining two chapters. 
Soon after, in 2000, Theta Kappa Omicron opened at the University of Ottawa, and Omega Iota in 2006 at the University of Ontario Institute of Technology.\nIn September 2008, Simon Fraser University's student body voted 57% in favour of overturning the University's ban of Greek life on campus. The Omega Epsilon chapter opened on the university's campus in 2012. Phi Kappa Pi was the first Greek Life Organization to open on the Simon Fraser campus. \nChapters.\nUntil at least 1976, the chapter names are the name of the local from which it was formed, except in the case of Dalhousie.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48121545","title":"Lulin Station","body":"\nLulin Station\n\nLulin Station is an elevated metro station of Line 2 in Ningbo, Zhejiang, China. It is situated on Fenghua Road. Construction of the station started in mid-2012, and it opened for service on September 26, 2015.\nExits.\nLulin Station has 2 exits.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48121588","title":"Orthogonal ligand-protein pair","body":"\nOrthogonal ligand-protein pair\n\nOrthogonal ligand-protein pairs (also known as re-engineered ligand-receptor interfaces or re-engineered enzyme-substrate interactions) are a protein-ligand binding pair made to be independent of the original binding pair. This is done by taking a mutant protein (naturally occurring or selectively engineered), which is activated by a different ligand (carefully synthesized or selected). The intention here is that the orthogonal ligand will not interact with the original protein. The original protein will also be designed to not interact with the orthogonal ligand in certain cases. An example of orthogonal ligand-receptor interfaces are RASSL and DREADD. They are G protein-coupled receptors that are activated by synthesized ligands that wouldn't normally exist in the cell, such as the anti-psychotic Clozapine, allowing researchers to control the interaction externally and independent of internal activation.\nApproaches and Designs.\nProtein Engineering Approach.\nThe protein engineering approach involves synthesizing a new ligand and directed mutation of the protein's ligand-binding site. In this approach one has to be careful to only change the ligand specificity without changing the other actions of the protein.\nSteric Modification.\nThe steric modification design can be summarized into 3 changes to the ligand-protein pair: \nReversal of hydrogen bonds or charge-charge interactions.\nAnother way to design an orthogonal protein is to switch the position of the hydrogen bond acceptors and donors. For example, if the ligand is a hydrogen bond donor and the protein a hydrogen bond acceptor, switch the ligand to the hydrogen bond acceptor and the protein to the donor. 
The reversal of charged interactions is similar, but it involves switching the position of the positive charge and the negative charge on the protein and ligand.\nSynthetic Chemistry Approach.\nThe synthetic chemist's approach is to take an already existing mutant form of the protein that binds the original ligand weakly, and synthesize a new ligand for which the mutant protein has a strong affinity. The drawback of this approach is the protein still interacts weakly with the natural ligand at low synthetic ligand concentrations.\nConfirmed Applications.\nAgriculture.\nInduced drought resistance.\nPark et al. created an orthogonal receptor-ligand interface between and . normally binds to abscisic acid which together then bind and inactivate to PP2C as a drought stress response, which stops PP2C from deactivating . This causes a cascade that leads to the activation of the and closing of the leaf guard cells and stomata. The result is less water loss by the plant. The natural response by the plant using abscisic acid to bind PYR1 in drought conditions is not strong enough and is activated too late to significantly hinder crop yield loss. Abscisic acid is also currently too expensive to synthesize to be used as a spray to control drought response artificially on a mass scale. The ability to control this externally by spraying the PYR1MANDI (orthogonal receptor) with mandipropamid (orthogonal ligand and fungicide) has the potential to reduce crop yield loss during droughts in plants with these engineered receptors, and has been confirmed to work in canola.\nMedicine.\nHormonal Pathway Control.\nDesigning ligands for mutant receptors that are unresponsive to the natural ligand could prove to be an effective way to treat disease. TRβ histidine 435 is a T3 insensitive mutant that plays a role in human pituitary cancer and RTH. 
Hassan and Koh showed QH2 (orthogonal ligand) was able to allosterically activate the mutant TRβ nuclear hormone receptors that had lost their responsiveness to endogenous T3 (natural mutants) but retained their DNA binding activity.\nResearch.\nGene Expression:.\nMixing and matching the ligand-binding domains and DNA-binding domains of different hormone receptors can be used as an inducible expression mechanism to study the action of any gene with a hormone response element in its promoter. Selectively altering the ligand-binding domain to make it orthogonal to the natural ligand-receptor interface, as well as making the DNA-binding domain and hormone response element orthogonal, would give a researcher precise control of a gene's transcription in order to study a gene's action.\nSignal Transduction:.\nStudying signal transduction pathways and attempting to identify the action of proteins involved in these pathways is difficult due to the abundance and complexity of interactions, families of proteins with the same or similar action, and the relative lack of selectivity for substrates (a good example of which are protein kinases). A method has been developed to use a radioactively labeled ATP orthogonal analog with an orthogonal kinase that uses the ATP analog to phosphorylate its substrates, allowing for identification of its targets within the pathway by the radioactive label that it will add to the target. Variations on this approach can be used to identify the function of signal transduction proteins whose function remains undetermined.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48121736","title":"Magdalena Szczepańska","body":"\nMagdalena Szczepańska\n\nMagdalena Szczepańska (born January 25, 1980 in Zielona Góra) is a retired Polish heptathlete. She won a silver medal at the 2004 European Combined Events Cup in Hengelo, Netherlands, and then represented her nation Poland in heptathlon at the Olympics in Athens a few months later, finishing in twenty-first place. Szczepańska trained under the tutelage of head coach Jerzy Skucha for the national team, while competing at AZS AWFiS Gdańsk.\nSzczepańska qualified for the Polish squad in the women's heptathlon at the 2004 Summer Olympics in Athens. Two months before the Games, she eclipsed the IAAF Olympic \"B\" standard and her personal record of 6115 points to place second behind gold medalist Yuliya Ignatkina of Russia at the European Cup in Hengelo, Netherlands, resulting to her official selection to the Polish Olympic team in track and field. Szczepańska started the competition in a tie for second place with U.S. heptathlete Tiffany Lott-Hogan in the 100 metres hurdles to command the medal position, but a below-par performance in the high jump slipped her out of contention for the medal to the bottom of the leaderboard, achieving only 1.67 against leader Carolina Klüft's height by just twenty-four centimetres. Szczepańska could only manage to produce substantial events for the remaining events of the competition, until she finally landed herself to twenty-first place with a total score of 6012 points.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48122100","title":"TTÜ Sports Hall","body":"\nTTÜ Sports Hall\n\nThe TTÜ Sports Hall () is a multi-purpose indoor arena complex in Mustamäe, Tallinn. It was opened in 1975 and renovated in 2001. It is the current home arena of the Estonian Basketball League team TTÜ KK.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48122179","title":"Maracaibo (disambiguation)","body":"\nMaracaibo (disambiguation)\n\nMaracaibo is a city and municipality in the Zulia State, Venezuela.\nMaracaibo can also refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48122208","title":"Speaker of the United States House of Representatives election, October 2015","body":"\nSpeaker of the United States House of Representatives election, October 2015\n\nAn election for the Speaker of the U.S. House of Representatives took place on October 29, 2015, during the 114th U.S. Congress. The election was necessitated by the announcement of Speaker John Boehner's resignation, set for October 30. The Speaker of the House follows the Vice President in the line of succession to the presidency of the United States in accordance with the Presidential Succession Act.\nDue to friction within the Republican Party caucus, Boehner decided to step down as speaker and resign his seat in Congress. He scheduled a Republican caucus non-binding vote for speaker on October 8, and a full floor vote on October 29. Kevin McCarthy, the House Majority Leader and second-in-command to the Speaker, was initially viewed as the favorite to win the Speakership. However, due to the opposition of the Freedom Caucus, McCarthy dropped out of the race on October 8, and the caucus vote was postponed.\nJason Chaffetz initially declared his candidacy to challenge McCarthy, and Bill Flores declared his candidacy after McCarthy withdrew, but both dropped out later to express their support for Paul Ryan, who entered the race after being widely viewed as a potential frontrunner. Daniel Webster of the Republican Party and former Speaker Nancy Pelosi of the Democratic Party were also declared candidates. 
Ryan won the rescheduled caucus vote on October 28, and was elected Speaker of the House, receiving 54.6% of the House vote, on October 29.\nBackground.\nProcess and conventions.\nThe Speaker of the United States House of Representatives is the presiding officer of the United States House of Representatives, and is second in the United States presidential line of succession, after the Vice President and ahead of the President pro tempore of the United States Senate. Though the Constitution does not require that the Speaker be an elected member of the House of Representatives, every Speaker to date has been elected from House membership.\nThe 435 members of the House of Representatives elect a Speaker by majority rule at the beginning of each session of the United States Congress, who serves until the end of the Congress. Typically, the election is a formality, as the majority party's members vote as a bloc for their party's previously-chosen Speaker-designate (such as the speaker, majority leader, or minority leader from the previous term). Open elections are uncommon but have occurred. The last Speaker election to require multiple ballots occurred in 1923.\nSpeakership and resignation of John Boehner.\nJohn Boehner, a member of the Republican Party from Ohio, served as the Majority Leader of the United States House of Representatives from February 2006 until January 2007. As the Democratic Party assumed control of the House following the 2006 elections, Boehner served as Minority Leader from January 2007 until January 2011. When Republicans reassumed control of the House of Representatives in January 2011, Boehner was elected as Speaker, with the votes of all 241 of his fellow Republicans. In 2014, some House Republicans reached out to Ben Carson about his interest in becoming Speaker should they be able to oust Boehner; Carson declined, citing his impending candidacy for president. 
Boehner's Republican opponents formed a congressional caucus, called the Freedom Caucus, in January 2015 to focus their opposition. Though Boehner was reelected as Speaker at the beginning of the 114th United States Congress that month, 25 conservative members of the Republican caucus did not vote for him. Daniel Webster, a Republican from Florida, received 12 votes.\nThroughout 2015, Boehner and the Freedom Caucus remained at odds. Boehner stripped his opponents of leadership posts and other perks, while the American Action Network, a group allied with Boehner, aired television ads against Freedom Caucus members in their home districts. Meanwhile, the Freedom Caucus opposing Boehner's plans, forcing him to rely on Democratic votes to pass bills. Needing to pass a federal budget for the 2016 fiscal year beginning October 1, the Freedom Caucus, now consisting of approximately 40 conservative Republicans affiliated with the Tea Party movement, threatened to block a resolution from passing unless it would defund Planned Parenthood and to initiate a vote to vacate the speakership if Boehner did not support their demands. The caucus sought the following promises: (1) the decentralization of the House Steering Committee, so that the Speaker and House Majority Leader are not solely in charge of committee assignments, (2) not supporting an increase in the U.S. debt ceiling without entitlement reform, (3) willingness to impeach John Koskinen, the Commissioner of Internal Revenue, and (4) passing spending bills approved by the caucus rather than a continuing resolution favored by Democrats in the United States Senate.\nOn July 28, 2015, Mark Meadows, a member of the Freedom Caucus from North Carolina, filed a motion to vacate the speakership, only the second time the motion had been filed. 
The next day, Boehner referred to the motion as \"no big deal.\" However, following continued pressure from the Freedom Caucus, and to avoid the vacation of his speakership, Boehner announced on September 25 that he would resign the Speakership and retire from Congress effective October 30. Sources from his office indicated he chose to resign due to the increasing discord within the Republican caucus so that he could manage passage of a continuing resolution to fund the government and avoid a government shutdown.\nCandidates.\nOn September 28, Kevin McCarthy of California, the House Majority Leader, and Webster announced that they would run for Speaker of the House. McCarthy was considered the presumptive favorite in the race. Jason Chaffetz, a Republican from Utah and the Chairman of the House Oversight and Government Reform Committee, announced his candidacy on October 4, claiming that McCarthy did not have the votes to win the election. Several Republicans urged Paul Ryan of Wisconsin, the running mate of Mitt Romney in the 2012 presidential election, to run for Speaker, but he declined, saying he is a \"policy guy\" with a preference to focus on his role as Chairman of the House Ways and Means Committee.\nDemocrat Nancy Pelosi, who served as the Speaker from January 2007 through January 2011, asked her Democratic colleagues for their vote in the election. Steny Hoyer, the House Minority Whip, said that he expects that the \"overwhelming majority\" of Democrats will vote for Pelosi. He said that if a Republican cannot get the votes needed, Democrats may consider their options.\nOn October 7, the day before the Republican caucus scheduled a non-binding vote for speaker, Ryan and former Vice President Dick Cheney endorsed McCarthy, as did 11 of the 13 House Republicans from Pennsylvania. The Freedom Caucus decided to endorse Webster in the race. 
Other Republicans said they would vote against McCarthy, including Thomas Massie of Kentucky, who called McCarthy \"absolutely not an option\" because of his previous role as Boehner's \"right-hand man\". Also, Walter B. Jones, Jr. of North Carolina sent a letter to the Republican Conference Chairwoman Cathy McMorris Rodgers stating that any candidates for a leadership position with \"misdeeds\" should withdraw from the race. Jones has stated that his comment did not specifically refer to McCarthy, but it was widely seen as referring to rumors that McCarthy had been committing an extramarital affair with a fellow Representative, a rumor that both have denied; the basis for such an allegation and interpretation is unclear.\nCiting opposition from within the Republican Party, as well as fallout from controversial comments he made about the United States House Select Committee on Benghazi, McCarthy dropped out of the race on October 8. Following McCarthy's departure from the race, Republicans renewed their efforts to recruit Ryan as a candidate. Boehner personally called Ryan twice to ask him to run, and Chaffetz said that he would not run against Ryan if he chose to enter the race. Ryan also received calls from Mitt Romney and Trey Gowdy, among others, encouraging him to run for Speaker. Additional Ryan endorsements came from Wisconsin Senator Ron Johnson, 2016 Republican presidential frontrunner Donald Trump, and House Majority Whip Steve Scalise from Louisiana. 
On October 9, close aides of Ryan confirmed that Ryan was reconsidering the possibility of a run.\nA possible Ryan candidacy received support from the same Freedom Caucus that opposed Boehner and McCarthy, as Meadows said on October 11 that Ryan running would \"definitely change the equation,\" and Chairman Jim Jordan described Ryan as \"a good man\" and stated that the Freedom Caucus would view a Ryan run \"favorably.\"\nOthers who expressed their interest in running included Texas representatives Bill Flores and Michael McCaul, Georgia representative Lynn Westmoreland, Montana representative Ryan Zinke, and California representative and former Oversight Committee Chairman Darrell Issa. However, several candidates have made clear that they would only run if Ryan chooses not to, including Issa, McCaul, and Minnesota representative John Kline. On October 12, Flores confirmed that he would run for Speaker. He stated that he would run only if Ryan stayed out of the contest.\nRyan held a closed-door meeting with the Republican Caucus on October 20, where he explained that he would run for Speaker if he could be guaranteed an overwhelming majority of the Republican caucus would support him. Specifically, Ryan requested an increased threshold for the political maneuver of vacating the Speakership, stated that he would not lessen the amount of time he spends with his family, and requested an official endorsement from the Freedom Caucus, Republican Study Committee, and The Tuesday Group by October 23, before he could make his decision. Immediately after Ryan's announcement, Chaffetz announced that he would be dropping out of the race to support Ryan. The next day, the Freedom Caucus held a vote to determine which of its members would support Ryan; although the exact tally was not revealed, roughly two-thirds of the caucus voted to endorse Ryan. 
Although this was shy of the 80% vote needed for an official endorsement over Webster, both the caucus leaders and Ryan were satisfied with the result, and Ryan made efforts to move forward with a potential Speaker bid.\nOn October 22, Ryan announced his bid for Speaker. Flores, who chairs the Republican Study Committee, dropped out of the race and endorsed Ryan. Mo Brooks of Alabama, a member of the Freedom Caucus, announced on the floor of the House on October 27 that Ryan had agreed not to advance immigration reform legislation while Barack Obama is President of the United States, or unless it meets the \"Hastert Rule\", as it has the support of the majority of Republicans.\nDeclared.\nThe following officially declared their candidacy:\nPublicly expressed interest.\nThe following publicly expressed interest in becoming candidates:\nReceived speculation.\nThe following received speculation about a possible candidacy in at least two reliable sources:\nWithdrawn.\nThe following were candidates, but subsequently withdrew:\nDeclined to run.\nThe following received some speculation about a possible candidacy, but subsequently ruled themselves out:\nElection.\nHouse Republicans planned to hold a non-binding caucus vote on October 8, followed by the official floor vote on October 29. The winning candidate requires a 218-vote majority to win. Multiple ballots may be cast if the majority of the House cannot agree on a candidate. While McCarthy and Chaffetz both said they would vote for the winner of the caucus vote in the floor vote, Webster did not make the same promise.\nFollowing McCarthy dropping out of the race on October 8, the caucus vote was indefinitely postponed. Massie and Peter T. King referred to the House as a \"banana republic.\" Massie also criticized Boehner for postponing the election, saying they \"called off the election because they didn’t like the result,\" which was echoed by Tom Rice, Louie Gohmert, and Justin Amash. 
McMorris Rodgers and Conference Vice Chairwoman Lynn Jenkins defended Boehner, saying the matter was handled properly, as conference rules give him sole discretion. Rich Lowry of \"National Review\" asked McCarthy in a phone interview if the House was governable, to which McCarthy replied \"I don’t know. Sometimes you have to hit rock bottom.\" Charlie Dent, a Republican from Pennsylvania who had supported McCarthy, suggested that if Republicans are unable to agree on a candidate, the best option might be for a bipartisan coalition to select a Speaker.\nOnce it appeared certain that Ryan would run, and win an overwhelming majority of the caucus's votes, Boehner rescheduled the Republican caucus vote for October 28. Ryan won the nomination, defeating Webster 200 to 43 in the secret ballot voting. Blackburn and McCarthy each received one vote. The next day, Webster reportedly urged Republicans to vote for Ryan instead of him.\nFinal result.\nOn October 29, Ryan was elected Speaker with 236 of the 432 votes cast. Others receiving votes were Pelosi (184), Webster (9), Jim Cooper, John Lewis, and Colin Powell (1 each). Votes were cast by 432 of the 435 House members.\nFollowing the election, Raúl Labrador, a Freedom Caucus member from Idaho, said that Paul will need to \"realize the honeymoon is over and start bringing us some conservative policy,\" and that \"the final exam for Paul Ryan will be in January 2017, when there is a Speaker election, and we will look at his body of work and determine whether he gets a passing grade or not.\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48122215","title":"Ashfaq Ali Khan","body":"\nAshfaq Ali Khan\n\nAshfaq Ali Khan () is an Indian politician and a member of the 16th Legislative Assembly of Uttar Pradesh of India. He represents the Naugawan Sadat constituency of Uttar Pradesh and is a member of the Samajwadi Party political party.\nEarly life and education.\nAshfaq Ali Khan was born in Sihali Jageer, Uttar Pradesh. He attended the and attained Bachelor of Laws degree.\nPolitical career.\nAshfaq Ali Khan has been a MLA for one term. He represented the Naugawan Sadat constituency and is a member of the Samajwadi Party political party.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48122222","title":"Lai Chi Kok Central (constituency)","body":"\nLai Chi Kok Central (constituency)\n\nLai Chi Kok Central () is one of the 23 constituencies in the Sham Shui Po District of Hong Kong which was created in 2015.\nThe constituency loosely covers Liberté, The Pacifica and Banyan Garden in Lai Chi Kok with the estimated population of 19,882.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48122469","title":"Al-Karimah","body":"\nAl-Karimah\n\nAl-Karimah (; also spelled \"Karto al-Karimeh\") is a small town in northwestern Syria, administratively part of the Tartus Governorate. It is located in the Akkar Plain just north of the border with Lebanon and southeast of al-Hamidiyah. According to the Syria Central Bureau of Statistics (CBS), al-Karimah had a population of 3,461 in the 2004 census. It is the administrative center of the Karimah Subdistrict (\"nahiyah\") which consisted of 12 localities with a collective population of 17,271. Its inhabitants are predominantly Alawites.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48122573","title":"Valga Sports Hall","body":"\nValga Sports Hall\n\nThe Valga Sports Hall () is a multi-purpose indoor arena complex in Valga. It was opened in 2005 and is the current home arena of the Estonian Basketball League team BC Valga. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48122672","title":"Sung Wong Toi (constituency)","body":"\nSung Wong Toi (constituency)\n\nSung Wong Toi () is one of the 24 constituencies in the Kowloon City District of Hong Kong which was created in 2015.\nThe constituency loosely covers Ma Tau Kok with the estimated population of 20,487.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48122792","title":"List of attacks on civilians attributed to United States government forces","body":"\nList of attacks on civilians attributed to United States government forces\n\nThe following is a partial list of attacks on civilians attributed to armed groups under the control of the United States government, including the Army, Navy, Air Force, and North Atlantic Treaty Organization forces under U.S. control. The items on the list are sites widely (though not in all cases universally) considered to be of a civilian nature that were directly (though in some cases mistakenly) targeted, and do not include errant bombs or other collateral damage resulting from imprecise attacks on military targets.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48122878","title":"Pärnu Sports Hall","body":"\nPärnu Sports Hall\n\nThe Pärnu Sports Hall () is a multi-purpose indoor arena complex in Pärnu. The hall was opened in 2009 and is the current home arena of the Estonian Basketball League team KK Pärnu.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48122920","title":"Coach Terminal Station","body":"\nCoach Terminal Station\n\nCoach Terminal Station is an underground metro station in Ningbo, Zhejiang, China. Coach Terminal Station situates on the east of Ningbo Coach Terminal. Construction of the station starts in December 2010 and opened to service in September 26, 2015.\nExits.\nCoach Terminal Station has 3 exits.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48122984","title":"Kai Tak North (constituency)","body":"\nKai Tak North (constituency)\n\nKai Tak North () is one of the 24 constituencies in the Kowloon City District of Hong Kong which was created in 2015.\nThe constituency loosely covers Kai Ching Estate and part of Tak Long Estate in San Po Kong with the estimated population of 16,562.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48123075","title":"Kai Tak South (constituency)","body":"\nKai Tak South (constituency)\n\nKai Tak South () is one of the 24 constituencies in the Kowloon City District of Hong Kong which was created in 2015.\nThe constituency loosely covers large part of Tak Long Estate in San Po Kong and the previous Kai Tak Airport with the estimated population of 14,599.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48123132","title":"New Party (Turkey)","body":"\nNew Party (Turkey)\n\nThe New Party (Turkish: \"Yeni Parti\", YP) was a former political party in Turkey that was founded on 23 June 2008. Adhering to the principles of Kemalism, the party merged with the Rights and Equality Party (HEPAR) in 2012 without contesting any elections. Former leaders include Tuncay Özkan, who led the party despite being imprisoned following the Ergenekon trials. The party's colours were primarily red and the party logo was that of the Sun.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48123206","title":"Yalga, Republic of Mordovia","body":"\nYalga, Republic of Mordovia\n\nYalga () is an urban locality (a work settlement) under the administrative jurisdiction of Oktyabrsky City District of the city of republic significance of Saransk in the Republic of Mordovia, Russia. As of the 2010 Census, its population was 5,672.\nHistory.\nUrban-type settlement status was granted to it in 1984.\nAdministrative and municipal status.\nWithin the framework of administrative divisions, the work settlement of Yalga is incorporated as Yalga Work Settlement, which is subordinated to Oktyabrsky City District of the city of republic significance of Saransk. Within the framework of municipal divisions, Yalga is a part of Saransk Urban Okrug.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48123529","title":"2015 European Inline Speed Skating Championships","body":"\n2015 European Inline Speed Skating Championships\n\nThe 27th European Inline Speed Skating Championships were held in Wörgl, Austria from July 20 to July 26, 2015. Organized by European Confederation of Roller Skating.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48123563","title":"Gem Motion Picture Company","body":"\nGem Motion Picture Company\n\nThe Gem Motion Picture Company was an American silent-era film studio. It was co-founded by filmmaker Stanner E.V. Taylor and his wife, actress Marion Leonard in 1911. After management issues, the company evolved to primarily act as a producer of short comedies starring Billy Quirk.\nDistribution.\nGem film properies produced Taylor and Leonard were sold to the Rex Motion Picture Company, which released them in 1912 under their own banner. The company's films were released by Universal in 1913.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48123598","title":"Khirbet al-Ma'zah","body":"\nKhirbet al-Ma'zah\n\nKhirbet al-Ma'zah () is a town in northwestern Syria, administratively part of the Tartus Governorate. It is located along the road between Safita in the east and Tartus to the west. According to the Syria Central Bureau of Statistics (CBS), Khirbet al-Ma'zah had a population of 4,798 in the 2004 census. It is the administrative center of the Khirbet al-Ma'zah Subdistrict (\"nahiyah\") which consisted of 11 localities with a collective population of 22,897. Its inhabitants are predominantly Alawites.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48123601","title":"Elymus alaskanus","body":"\nElymus alaskanus\n\nElymus alaskanus, more commonly known as Alaskan wheatgrass, is an autogamous perennial that is native to North America and part of the Poaceae family. This complex is widespread and has diverged into different taxa based on morphological and cytological studies.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48123619","title":"Charlie Chaplin's Comedy Capers","body":"\nCharlie Chaplin's Comedy Capers\n\nCharlie Chaplin's Comedy Capers was an American comic strip by Stuart Carothers and later Elzie C. Segar starring Charlie Chaplin. It ran in syndication from 1915 until 1917. It was one of the earliest comic strips inspired by the popularity of a celebrity. \nBackground.\n\"Charlie Chaplin's Comedy Capers\" was published in the Chicago Herald. The comic strip cashed in on the tremendous popularity of the comedian at the time. It was created by Stuart Carothers in March 1915, who drew and wrote the stories until his tragic early death from defenestration. Two cartoonists named \"Warren\" and \"Ramsey\" took over the series until they were replaced by Elzie C. Segar, at that time still an amateur. On February 29, 1916 Segar published his first Chaplin strip. The daily version ran until July 15, 1916. His Sunday version ran longer, from March 12, 1916 until September 16, 1917. It was his first professional cartooning job. Contrary to his predecessors, who mostly borrowed ideas from Chaplin's films, Segar thought up his own jokes. He gave Chaplin a tiny sidekick named \"Luke the Gook\" to act as a straight man to his gags. \nReception.\nDespite Chaplin's popularity the comic strip wasn't a huge succes in the United States, mostly due to the fact that all artists involved were basically amateurs. It fared better in the U.K., where it was published in the weekly comics magazine \"Funny Wonder\" for decades. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48123644","title":"Sau Mau Ping Central (constituency)","body":"\nSau Mau Ping Central (constituency)\n\nSau Mau Ping Central () is one of the 37 constituencies in the Kwun Tong District of Hong Kong which was created in 2015.\nThe constituency loosely covers part of Sau Mau Ping Estate with the estimated population of 15,256.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48123655","title":"Intelsat 34","body":"\nIntelsat 34\n\nINTELSAT 34 or IS-34 is communications satellite built on Space Systems/Loral's 1300-series satellite platform. The satellite will broadcast television to homes in Brazil, distribute video programming for companies like HBO and Fox across Latin America, and beam broadband services to travelers aboard airplanes and ships crossing the North Atlantic Ocean.\nIntelsat 34, unlike its predecessor, does not include the UHF-band that Intelsat had been unable to sell to its intended customer, the U.S. Department of Defense.\nLaunch.\nIntelsat 34 is the 50th Loral-built satellite launched for Intelsat. With a launch mass of 7,275 pounds - about 3.3 metric tons - Intelsat 34 is a replacement for the Intelsat 27 spacecraft lost aboard a Sea Launch mission in 2013. It will take the place of Intelsat's Galaxy 11 and Intelsat 805 spacecraft in orbit, the company's last two relay stations launched before 2000.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48123672","title":"San Francisco Ballet Building","body":"\nSan Francisco Ballet Building\n\nThe San Francisco Ballet Building, located in San Francisco, California, was designed by architect Beverly Willis and completed in 1984. The New York Times identified it as “the first building in the United States to be designed and constructed exclusively for the use of a major ballet company.”\nOverview.\nThe San Francisco Ballet Building is located within the Civic Center, San Francisco. Beverly Willis’s design would later serve as a model for the design of future American ballet companies and schools. Upon completion, the San Francisco Ballet Building became a landmark achievement in the ballet world. The Boston Globe noted, “Dance people don’t merely visit the San Francisco Ballet building: They make pilgrimages to it.”\nBallet History.\nThe San Francisco Ballet was the first professional ballet company in the United States. The company was founded in 1933 as the San Francisco Opera Ballet under the leadership of ballet master Adolph Bolm. In 1942, the ballet separated from the San Francisco Opera to become its own independent company. The company’s performances are currently based in the War Memorial Opera House, San Francisco. It is among the world’s leading dance companies, presenting over 100 performances annually, with a repertoire that spans both classical and contemporary ballet. Along with American Ballet Theatre and the New York City Ballet, San Francisco Ballet has been described as part of the \"triumvirate of great classical companies defining the American style on the world stage today.\"\nWith its origins in turn-of-the-century traveling companies, the San Francisco ballet routinely rented practice studios. 
In the late 1970s, the company was housed in a renovated parking garage on 18th Avenue, San Francisco, in a downstairs studio with ceilings so low that the dancers could not practice lifts for fear of hitting the beams. On the east coast, ballet companies like the American Ballet Theatre, were also housed in rented spaces and buildings shared with other performing arts groups. In 1983, the San Francisco Ballet Association became “the first American ballet company and school to break this pattern by constructing new quarters for itself.\"\nDesign.\nBeverly Willis performed exhaustive research into the function of a ballet building, conducting numerous interviews with dancers on their needs and visiting the studios of major European ballet companies.The building includes facilities to support all of the activities of the company and school with the exception of set storage. The eight rehearsal and classroom studios have 15 feet high ceilings, to accommodate lifts, and average 56x40 feet in size. Additionally, there are administrative offices, a library with audiovisual equipment, and multi-purpose rooms for conferences, academic and choreographic study. Student and company members have physical therapy and workout rooms with gymnastic equipment, locker rooms with showers, separate lounges, and a computer room. Spaces accessible to the public include the ballet shop and a ground-floor studio for community outreach programs.\nWhile the project would serve as a prototype for new ballet schools nationwide, the design was required to extend deference to the classical order of the Civic Center’s architecture, characterized by grandeur of scale, simplicity of geometric forms, and dramatic use of columns. 
The San Francisco City Planning Department developed a set of design criteria for the building that specified a height of 96 feet, the location of cornice line levels, and the color and finishes of exterior materials, to ensure that the design was in context with the Neo-Renaissance architecture of the Civic Center. \nTo accomplish this, Willis incorporated elements of the Neo-Renaissance architectural vocabulary of the Civic Center− the rectangular geometry and the horizontal tripartite divisions of the base, middle and top, whose heights correspond to the opera house. The building’s planned location was on an elongated and rectangular site, one-sixth the size of the adjacent performing arts structures. To be successfully contextual, it needed to appear massive to sustain a visual relationship with the monumental civic center buildings occupying over a square block. Willis sized the facade to monumental, classical proportions. The four story facade equaled in height a typical 8 story office building. The horizontal divisions of the base, midsection and top, as part of the facade, matched the heights of those of the adjacent civic center buildings. The rectangular form of the envelope produced a classical form, into which the ballet’s interior functions fit. The proportion of the plan itself was a three to one classical ratio. The building is clad in a concrete material similar in color and texture to the other contemporary civic center structures.\nBreaking with the classical tradition of symmetry, the proscenium-style main entry is located on the corner of the site. 
The building’s two-story monumental entry at the corner accomplished several objectives: it connected the building with the Civic Center’s master plan axis; it gave the building an identity within the performing arts complex, from the Van Ness Avenue perspective where the Opera and Symphony faced; and it avoided orienting the main entry towards the Opera House’s blank rear wall.\nThe facade came out of the program like an abstraction and manifestation of the idea of ballet. The entry was envisioned as a proscenium arch. The rippling, curved glass within the entry is reminiscent of a stage curtain. The curved balconies over the entry arch are reminiscent of theater box seats. The facade is designed with solids and voids, curves and planes that play in constantly shifting light and shadows. The monumentality of the mass is softened by transparent layers that reveal the creative possibility, awaiting the birth of dance.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48123705","title":"Upper Ngau Tau Kok Estate (constituency)","body":"\nUpper Ngau Tau Kok Estate (constituency)\n\nUpper Ngau Tau Kok Estate () is one of the 37 constituencies in the Kwun Tong District of Hong Kong which was recreated in 2015.\nThe constituency loosely covers part of Upper Ngau Tau Kok Estate with the estimated population of 15,969.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48123865","title":"Lower Ngau Tau Kok Estate (constituency)","body":"\nLower Ngau Tau Kok Estate (constituency)\n\nLower Ngau Tau Kok Estate () is one of the 37 constituencies in the Kwun Tong District of Hong Kong which was created in 2015.\nThe constituency loosely covers part of Lower Ngau Tau Kok Estate with the estimated population of 17,736.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48123867","title":"Georgi Dimitrov bibliography","body":"\nGeorgi Dimitrov bibliography\n\nGeorgi Dimitrov (June 18, 1882 – July 2, 1949) was a Bulgarian communist politician. He was the first communist leader of Bulgaria, from 1946 to 1949. Dimitrov led the Third Comintern (Communist International) under Stalin from 1934 to 1943. He was a theorist of capitalism who expanded Lenin's ideas by arguing that fascism was the dictatorship of the most reactionary elements of financial capitalism.\nThis is a Georgi Dimitrov bibliography, including writings, speeches, letters and others.\nWritings.\nThis is a list of selected writings:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124047","title":"Kuranishi structure","body":"\nKuranishi structure\n\nIn mathematics, especially in topology, a Kuranishi structure is a smooth analogue of scheme structure. If a topological space is endowed with a Kuranishi structure, then locally it can be identified with the zero set of a smooth map formula_1 Kuranishi structure was introduced by Japanese mathematicians Kenji Fukaya and Kaoru Ono in the study of Gromov–Witten invariants in symplectic geometry.\nDefinition.\nLet formula_2 be a compact metrizable topological space. Let formula_3 be a point. A Kuranishi neighborhood of formula_4 (of dimension formula_5) is a 5-tuple\nwhere\nThey should satisfy that formula_12.\nIf formula_13 and formula_6, formula_15 are their Kuranishi neighborhoods respectively, then a coordinate change from formula_16 to formula_17 is a triple\nwhere\nIn addition, they must satisfy the compatibility condition:\nA Kuranishi structure on formula_2 of dimension formula_5 is a collection\nwhere\nIn addition, the coordinate changes must satisfy the cocycle condition, namely, whenever formula_34, we require that\nover the regions where both sides are defined.\nHistory.\nIn Gromov–Witten theory, one needs to define integration over the moduli space of stable maps formula_36(see for example ). They are maps formula_37 from a nodal Riemann surface with genus formula_38 and formula_39 marked points into a symplectic manifold formula_2, such that each component satisfies the Cauchy–Riemann equation\nIf the moduli space is a smooth, compact, oriented manifold or orbifold, then the integration (or a fundamental class) can be defined. When the symplectic manifold formula_2 is semi-positive, this is indeed the case (except for codimension 2 boundaries of the moduli space) if the almost complex structure formula_43 is perturbed generically. 
However, when formula_2 is not semi-positive, the moduli space may contain configurations for which one component is a multiple cover of a holomorphic sphere formula_45 whose intersection with the first Chern class of formula_2 is negative. Such configurations make the moduli space very singular so a fundamental class cannot be defined in the usual way.\nThe notion of Kuranishi structure was a way of defining a virtual fundamental cycle, which plays the same role as a fundamental cycle when the moduli space is cut out transversely. It was first used by Fukaya and Ono in defining the Gromov–Witten invariants and Floer homology, and was further developed when Fukaya, Oh, Ohta, Ono studied the Lagrangian intersection Floer theory.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124067","title":"Jordan North (constituency)","body":"\nJordan North (constituency)\n\nJordan North () is one of the 19 constituencies in the Yau Tsim Mong District of Hong Kong which was created in 2015.\nThe constituency loosely covers Jordan Road with the estimated population of 13,558.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124115","title":"Jazz Suite Inspired by Dylan Thomas' \"Under Milk Wood\"","body":"In a series of articles for \"The Guardian\" newspaper titled \"50 great moments in jazz\", John Fordham wrote of the album: \"Under Milk Wood was an evocative collection of sparky themes inspired by the Dylan Thomas radio play (it's sometimes performed with a narrator reading the parts). And thanks to Tracey's sparing piano and Wellins's softly hooting sax, the rippling tone-poem Starless and Bible Black is widely acclaimed as one of the great jazz performances\".\nRelease History.\nSince the original 1965 mono LP on Columbia, the album has been released on a number of labels, including Blue Note Records. The album was reissued in 2010 on his son, Clark Tracey's ReSteamed Records label, as \"Under Milk Wood: Jazz Suite\". A live version was recorded in 1976 on RCA records, which included a voice narration from the Welsh actor, Donald Houston.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124386","title":"Strongboard Balance","body":"\nStrongboard Balance\n\nStrongBoard Balance is as a springboard and multi-spring balance board.\nOperation.\nConnected at the base, StrongBoard Balance is a one piece apparatus with the springs connected to the board. Unlike traditional balance trainers, there is no tube or roller, which prevents the board from sliding out from underneath or coming apart. StrongBoard Balance’s difference is the targeted layer of stability it adds to traditional strength-training. Through employing various balance techniques, StrongBoard Balance works to strengthen the core, toughen stabilizing muscles and building neuropathic communication. By not allowing stabilization, the user’s muscles never stop working. With a design consisting of a solid base and a flat top, StrongBoard Balance is a tool for exercises including pushups, step ups, squats, and many others.\nUse.\nIt launched in 2014 at the LA Fit Expo and showed at the IHRSA International Convention. Utilizing four compression springs, individuals can use StrongBoard Balance to train using the weight of their own body – in a portable and electricity manner. By engaging core-stabilizing muscles, the board builds upon traditional strengthening methods, and adds a new, plyometric and cardio training element.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124405","title":"Kiss Me (Olly Murs song)","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48124495","title":"7 Letters","body":"\n7 Letters\n\n7 Letters is a 2015 Singaporean drama film directed by seven different directors. It comprises seven short stories celebrating Singapore's 50th anniversary. The film was selected as the Singaporean entry for the Best Foreign Language Film at the 88th Academy Awards but it was not nominated.\nIn January 2016, the film was initially flagged by Malaysian censors before it was due to screen at the Titian Budaya Festival. A successful appeal was made by organisers, CultureLink, against the cuts for the vulgar phrase in Cantonese, “curse your whole family”, in Jack Neo’s segment of the omnibus.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124616","title":"Rainy Cocoa","body":"\nRainy Cocoa\n\n is a bilingual Japanese digital manga series. An anime television series based on the manga began airing in April 2015, and a second season, titled , began in October 2015.\nMedia.\nManga.\nThe manga is available in both Japanese and English, and allows the reader to switch between the two languages for both text and audio. According to the creators, the manga's app has been downloaded from the iTunes Store and Google Play in over 50 different countries.\nAnime.\nAn television anime adaptation was announced in December 2014. The series is directed by Tomomi Mochizuki, Atsuko Takahashi provides the character designs, and Kaoru Kondou is composing the series' music. The series' theme song, \"Rainy Cocoa\", is performed by Hiro Shimono. The series began airing on 5 April 2015, and was simulcast in North America by Funimation.\nA second season was announced in June 2015, titled . Also announced was a crowdfunding campaign to raise 2 million yen to add more characters and cast members. It premiered on 4 October 2015 on Tokyo MX and Sun TV. It will be accompanied by a live-action segment. The second season was also streamed by Funimation.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124627","title":"Luigi Logan Grosu","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48124650","title":"1971 Indiana Hoosiers football team","body":"\n1971 Indiana Hoosiers football team\n\nThe 1971 Indiana Hoosiers football team represented the Indiana Hoosiers in the 1971 college football season. They participated as members of the Big Ten Conference. The Hoosiers played their home games at Seventeenth Street Stadium in Bloomington, Indiana. The team was coached by John Pont, in his seventh year as head coach of the Hoosiers.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124725","title":"Academic Medicine (journal)","body":"\nAcademic Medicine (journal)\n\nAcademic Medicine is the monthly peer-reviewed medical journal of the Association of American Medical Colleges.\nHistory.\nThe journal was established in 1926 as the \"Bulletin of the Association of American Medical Colleges\". It was renamed \"Journal of the Association of American Medical Colleges\" in 1929. In 1951 it briefly became \"Medical Education\" then \"Journal of Medical Education\". In 1989 it took its current name of \"Academic Medicine\".\nIn the course of its history, the journal has had nine editors. David P. Sklar is the present editor-in-chief, appointed in 2013.\nAbstracting and indexing.\nThe journal is abstracted and indexed in:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124730","title":"Yau Ma Tei North (constituency)","body":"\nYau Ma Tei North (constituency)\n\nYau Ma Tei North () is one of the 19 constituencies in the Yau Tsim Mong District of Hong Kong which was first created in 1982 and recreated in 2015.\nThe constituency loosely covers Yau Ma Tei with the estimated population of 12,817.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124792","title":"List of performing artists at the Viña del Mar International Song Festival","body":"\nList of performing artists at the Viña del Mar International Song Festival\n\nThe Viña del Mar International Song Festival () is a music festival that is considered the best and biggest in Latin America and the most important musical event in the Americas which is held annually on the 3rd week of February since 1960 in Viña del Mar, Chile.\nPerforming Artists per year.\n2015.\nTransmitting to date\nPerformers per Country.\nUnited Kingdom.\n(Includes England, Scotland, Wales and Gibraltar).\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124831","title":"Almost Home (Mary Chapin Carpenter song)","body":"\nAlmost Home (Mary Chapin Carpenter song)\n\n\"Almost Home\" is a song co-written and recorded by American country music singer Mary Chapin Carpenter\nContent.\nThe song is a mid-tempo about a woma who \"takes stock of a life lived and comes up short\". It is in the key of B-flat major with an approximate tempo of 96 beats per minute and a chord pattern of F-B-E-B. Carpenter wrote the song with Beth Nielsen Chapman and Annie Roboff, and produced it with Blake Chancey.\nCritical reception.\nDeborah Evans Price of \"Billboard\" reviewed the single with favor, saying that \"it's a vibrant musical outing that could signal a return to prominence for this talented singer/songwriter. Carpenter's evocative vocals infuse any song with passion and integrity, and she's particularly effective on this poignant lyric.\" Alanna Nash of \"Entertainment Weekly\" also described the song favorably in her review of the album, saying that it \"scores the highest at marrying lyrical introspection and rhythmic yearning, one of the benchmarks of her graceful, if circuitous, career.\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124892","title":"Matthew Ramsey (songwriter)","body":"\nMatthew Ramsey (songwriter)\n\nMatthew Ramsey is an American country music songwriter and lead vocalist of the band Old Dominion with several hit songs on country radio to his credit.\nEarly life.\nMatthew Ramsey grew up in Buchanan, VA. He learned to play the drums at a young age before picking up the guitar at age 14.\nCareer.\nHe received a degree in Illustration from Virginia Commonwealth University and then moved to Nashville to pursue songwriting. He met Trevor Rosen in Nashville and the two became members of the group Old Dominion. Ramsey has had several hit songs including The Band Perry’s \"Chainsaw\", Craig Morgan’s “Wake Up Loving You’’, Dierks Bentley’s “Say You Do’’, Kenny Chesney's \"Save It For a Rainy Day\", as well as songs by Sam Hunt and Luke Bryan. The band released its first album in October 2015, with songs that reached the top ten on the country charts.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124910","title":"Center for Pastor Theologians (CPT)","body":"\nCenter for Pastor Theologians (CPT)\n\nThe Center for Pastor Theologians (CPT) is an evangelical Christian organization that is based in Oak Park, Illinois with the stated mission of assisting pastor theologians with “the study and written production of biblical and theological scholarship for the ecclesial renewal of theology and the theological renewal of the church.”\nBackground and Goals.\nThe organization was founded in 2006 by Gerald Hiestand and Todd Wilson, originally with the name The Society for the Advancement of Ecclesial Theology. Ecclesial theology, as described by Hiestand, is \"a theological project born in an ecclesial context, driven by an ecclesial agenda, and prosecuted by ecclesial thinkers; not merely theology about the church--but theology for the church.\"\nThe Center believes that many pastors are either ill-supported to contribute to the theological formation of the broader church, or not expected to do so at all, given the majority of theological scholarship being produced by professors in seminaries and universities.\nThe Center’s offices and symposia are hosted at Calvary Memorial Church in Oak Park, Illinois. Symposia are held for three Fellowships, groups of roughly 20 pastor theologians who gather to discuss a theological text with a noted theologian. At symposia, Fellows also solicit feedback on personal projects.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124943","title":"1987 in Macau","body":"\n1987 in Macau\n\nEvents from the year 1987 in Portuguese Macau.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124967","title":"French legislative election, 1848 (Senegal)","body":"\nFrench legislative election, 1848 (Senegal)\n\nElections to the French National Assembly were held in Senegal between 30 October and 2 November 1848.\nElectoral system.\nThe single Senegalese seat in the National Assembly was created by decree on 5 March 1848. Following an order of 5 November 1830 and a law of 24 April 1833, all free-born people and freed slaves in the Four Communes in Senegal had full civic and political rights, the only French African colony to give such rights until the end of World War II. The right to vote was given to all men over the age of 25 and who could prove they had lived in their municipality for the previous five years. In total 4,706 men registered to vote.\nCampaign.\nThe election was contested by three candidates; former Governor Léandre Bertin du Château, the creole Barthélémy Durand Valantin and Victor Schoelcher, a well-known anti-slavery activist. Although Schoelcher was on the ballot, he was not in Senegal at the time.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48124994","title":"2015–16 Scottish Junior Cup","body":"\n2015–16 Scottish Junior Cup\n\nThe 2015–16 Scottish Junior Cup is the 130th season of the Scottish Junior Cup, the national knockout tournament for member clubs of the Scottish Junior Football Association. The competition is sponsored by ETHX Energy and is known as The ETHXenergy Scottish Junior Cup. The winner of this competition is eligible to enter the following seasons Scottish Cup at the first round stage.\nA total of 158 clubs are entered to this year's competition, three fewer than the previous season. Dropping out are Ballingry Rovers who have folded and Harthill Royal, Luncarty, Portgordon Victoria and Whitehills who are in abeyance. North Region sides Glentanar and Islavale did not enter. New members Easthouses Lily MW and Gartcairn FA Juniors make their debut in the competition while Coupar Angus and Fochabers return to the tournament after a year in abeyance.\nThe six Junior clubs qualified for this season's Scottish Cup, are not included in the draw for the first round:\nAlso qualified automatically are Banks O'Dee and Linlithgow Rose who achieved national club licensing requirements and Girvan who qualify automatically as historic full members of the Scottish Football Association.\nFirst round.\nThe first round draw took place at Hampden Park, Glasgow on 27 August 2015.\nSecond round.\nThe second round draw took place at Mar Hall, Erskine on 6 October 2015.\nThird round.\nThe third round draw took place at The Sun offices in Glasgow on 3 November 2015.\n1 Match played at Pollok F.C.\nReplays.\n2 Match played at Tranent Juniors F.C.\nFourth round.\nThe fourth round draw took place at the Evening Times offices in Glasgow on 9 December 2015. \nFifth round.\nThe fifth round draw will take place in Glasgow City Chambers on 26 January 2016 at 2:00pm.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125053","title":"Space (architecture)","body":"\nSpace (architecture)\n\nSpace is one of the elements of design of architecture, as space is continuously studied for its usage. Architectural designs are created by carving space out of space, creating space out of space, and designing spaces by dividing this space using various tools, such as geometry, colours, and shapes.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125075","title":"Heather Parker","body":"\nHeather Parker\n\nHeather Parker (born September 25, 1978, Boston, Massachusetts, United States) is an American photographer and glitch artist, known for her work in documentary photography, as well as glitch art created from photographs of food. Parker is the cousin of Hoorsenbuhs partner Kether Parker.\nBiography.\nHeather began working with digital media after being formally trained in film photography at Massachusetts College of Art and Design under Abelardo Morell, Frank Gohlke and Laura McPhee. \nParker's documentary work includes photographing artists in and around Boston, deejays around the country, and Vespa rallies.\nThe glitch art that Parker has exhibited lays out defects produced by databending using a combination of audio editing software and photo software.\nParker gained a B.F.A. from the Massachusetts College of Art and Design in 2000 and resides in Chicago and the Fort Point Channel Historic District of Boston. She is a member of the Fort Point Arts Community and was noted in the Boston Globe as part of a campaign to save the historic Old Northern Avenue Bridge.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125092","title":"V Satish","body":"\nV Satish\n\nV Satish (Satish Velankar) is the National Jt. General Secretary (Organisation) of Bharatiya Janata Party (BJP). Currently he is in-charge of Rajasthan State, Bharatiya Janata Party. He is Full-time Worker, Rashtriya Swayamsevak Sangh and has been the senior functionary for the Rashtriya Swayamsevak Sangh.\nEarly life.\nBorn in Nagpur district of Maharashtra on May 23, 1954.\nAssociation with RSS.\nFull-timer for RSS.\nAssociation with the BJP.\nWorking as Jt. General Secretary (Org.) in Amit Shah, National Team of BJP. Currently handling charge of Rajasthan, BJP.\nHe was posted at Bangalore in Karnataka State for handling operations of Bharatiya Janata Party.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125118","title":"Golden Eaglets of Nigeria","body":"\nGolden Eaglets of Nigeria\n\nThe Golden Eaglets of Nigeria is the Nigerian under-17 football team. They won the maiden edition of the FIFA cadet world cup staged in China in 1985. They defeated the former West Germany to win the cup.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125124","title":"Hudson Coutinho","body":"\nHudson Coutinho\n\nHudson José Coutinho (born 12 July 1972), known as Hudson Coutinho, is a Brazilian football manager, currently in charge of Figueirense.\nCareer.\nBorn in Florianópolis, Santa Catarina, Coutinho joined hometown's Figueirense in 2000, as a fitness coach, after a brief spell at Guarani de Palhoça. After nine years at the club – which included being manager for one match as an interim in 2007 – he moved to Náutico.\nIn July 2012, after another fitness coach experiences at Chapecoense, Marcílio Dias and Hercílio Luz, Coutinho was appointed manager of his previous club Guarani. He achieved promotion with the club in the state league, as champions, but was still sacked on 25 February of the following year.\nIn March 2013 Coutinho returned to his former side Figueirense, as an assistant manager. On 19 September 2015 he was named interim manager, replacing sacked René Simões.\nOn 21 September 2015 Coutinho was permanently appointed as manager of \"Figueira\", after a request from the squad.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125143","title":"Petros Velissariou","body":"\nPetros Velissariou\n\nPetros Velissariou (in Greek: Πέτρος Βελισσαρίου; born April 20, 1993) is a Greek professional basketball player who is currently playing for Kavala. He is 1.90 m (6 ft 2 ¾ in) tall.\nClub career.\nAfter playing youth basketball at Mantoulidis, Velissariou started his playing career in 2012, playing with Kavala.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125164","title":"Jennifer Thomas (pianist)","body":"\nJennifer Thomas (pianist)\n\nJennifer Thomas (born June 23, 1977) is an American pianist, violinist, composer, performing artist, and recording artist. She was classically trained at Brigham Young University-Idaho, and started composing in 2003, later releasing her first debut album in 2007. Thomas has issued four albums, the latest 'Winter Symphony' released in November 2015.\nThomas is known for writing and performing piano-centered orchestral music from classical music to classical music crossover and cinematic orchestral. While most of her works are original, she also covers classical pieces as well as pop music and movie soundtracks. Thomas has also composed film scores, where she won the Gold Medal of Excellence in the 2011 Park City Film Music Festival for \"Music in a Short Film\" as well as a 2012 Hollywood Music in Media Award for \"Best Film Score for Documentary/Short\".\nIn 2012 Thomas was named Classical Crossover UK's \"Female Artist of the Year\".\nThomas' third album, \"Illumination\" won \"Album of the Year\" and \"Artist of the Year\" at the 2013 IMC Awards. \nIn October 2015 \"Illumination\" also won the \"Classical Song of the Year\" International Music and Entertainment Association Award and the Enlightened Piano Radio Award for \"Best piano album with instrumentation\" at Carnegie Hall New York - where she performed live at the awards ceremony.\nWinter Symphony - Jennifer Thomas (pianist) album Thomas' fourth album was released in November 2015. 
\nMixed by 5 time Grammy Award winner Brian Vibberts, contributors included Ricky Kej and Taylor Davis (violinist).\nThe album has received many favourable reviews.\nFollowing the album release, Thomas performed concerts at Salt Lake City, Atascocita, Texas and the Benaroya Hall Seattle.\nDiscography.\nAlbums:\nThomas also features on the following albums;\nFilm and TV.\nList:\nEarly life.\nThomas was born in Walla Walla, Washington. She got her first toy piano at the age of 3, and began formal lessons on both the piano and violin at the age of 5, under the tutelage of her mother, Carolyn Southworth. Her brothers also learned piano, violin, and cello from their mother. Jennifer and her older brother played in grade school orchestras, with Southworth as a conductor's assistant. Thomas continued to train classically, and was involved in many recitals and piano adjudications through her teen years. She played with various youth orchestras and high school orchestras. She performed at her high school graduation, and later went to Brigham Young University-Idaho.\nAt Brigham Young University-Idaho, Thomas studied piano under Professor Stephen Allen. She was a member of the university's Piano Ensemble group, accompanied the College choir and many vocal/instrumental students, as well as played violin in the university symphony. Thomas also competed in the University's Concerto Competition, where she took 2nd place performing the Piano Concerto No. 3 (Prokofiev).\nAfter college graduation, Thomas moved to Salt Lake City, Utah, and was a regular performer with the Temple Square Concert Series, and played violin in the Murray, Utah Symphony Orchestra. While performing with the Murray Symphony, Thomas was a featured soloist on the Edward MacDowell Piano Concerto No.2. She eventually moved to Northwest, where she performed as a violinist with the Oregon Pro Arte Chamber Orchestra, and worked for the Seattle Symphony in the Education Department. 
It was during her time working for the Seattle Symphony when she started composing her own original music.\nPersonal life.\nThomas is married to Will Thomas, an ultra-marathon competitor who, in 2015, competed in the 106 mile race Ultra-Trail du Mont-Blanc in France. Together, they have three children and reside in the Seattle Washington (state) area.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125213","title":"Yahmur","body":"\nYahmur\n\nYahmur (; also spelled \"Yahmour\") is a village in northwestern Syria, administratively part of the Tartus Governorate. It is located along the road between Safita in the east and Tartus to the west. According to the Syria Central Bureau of Statistics (CBS), Yahmur had a population of 3,722 in the 2004 census. Its inhabitants are predominantly Alawites. Nearby is Chastel Rouge (Qal'at Yahmur), a Crusader-era castle.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125225","title":"Durston (surname)","body":"\nDurston (surname)\n\nDurston is an English toponymic surname. The name was first recorded in 1641 in \"A Somerset Petition of 1641\". The name is taken from the village of Durston in Somerset. It is derived from the Anglo-Saxon \"deór-tún\", a combination of \"deer\" (\"deór\",) and \"fenced enclosure\" (\"tún\"). The most likely interpretation is \"deer park\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125249","title":"Ram Lal","body":"\nRam Lal\n\nRam Lal is an Indian politician who is the National General Secretary for the Bharatiya Janata Party.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125286","title":"Migration Court","body":"\nMigration Court\n\nA Migration Court is a type of administrative court within the Swedish legal system. The Migration Courts are the courts of appeal for decisions made by the Swedish Migration Agency, for example regarding asylum or residency in Sweden. Decisions by the Migration Courts can be appealed to the Migration Courts of Appeal, which are the supreme appellate courts relating to migration law.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125289","title":"Judith Flemig","body":"\nJudith Flemig\n\nJudith Flemig-Pelzer (born 22 May 1979) is a former German female volleyball player. She was part of the Germany women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 6th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125323","title":"Anja-Nadin Pietrek","body":"\nAnja-Nadin Pietrek\n\nAnja-Nadin Pietrek (born 13 March 1979) is a former German female volleyball player. She was part of the Germany women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 6th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125333","title":"Hayle and Bristol Steam Packet Company","body":"\nHayle and Bristol Steam Packet Company\n\nThe Hayle and Bristol Steam Packet Company operated steam ship services between Hayle, Ilfracombe and Bristol in the mid nineteenth century. Confusingly from 1848 to 1860, the company name was used by two separate operators.\nHistory.\nAlthough a steamer first called at Hayle in 1824, regular weekly services began in 1831, when the \"Hayle Steamship Company\" was formed operating with the wooden vessel \"Herald\", under the command of John Vivian.\nThe engineering company Harvey's of Hayle built the engines for the PS \"Cornwall\" of 1842. When the Great Western Railway arrived in Bristol, this stimulated more travel between London and the South West of England, and the PS \"Cornwall\" was added to the Hayle service under the command of John Vivian. The extra business attracted a rival when Vivian Stevens of St Ives put his PS \"Brilliant\" on to the Hayle to Bristol route. \nThe \"Hayle Steamship Company\" was renamed the \"Hayle and Bristol Steam Packet Company\" in 1848, and confusingly Vivian Stevens with the PS \"Brilliant\" adopted the same title.\nThe original \"Hayle and Bristol Steam Packet Company\" launched a prospectus in 1857 to attract capital investment. The secretary of the new company was Mr John Vivian of Hayle. The company was launched with nominal capital of £28,750 (£ in ) and working capital of £23,000 (£ in ). The company prospectus announced that a First Class A.1. 12 years Iron Steamer was being built at Hayle, by Harvey and Co, capable of carrying 200 Tons of Cargo, with ample accommodation for passengers. The cost of this new steamer was £18,000 (£ in ), and in 1858, the company launched the Cornubia. 
The company also planned to sell the Cornwall for £2,000 (£ in ) when the SS \"Cornubia\" was launched.\nThe additional traffic was short-lived, as the extension of railway services from London and Bristol through into Cornwall was completed when the Royal Albert Bridge was completed and opened on 2 May 1859.\nBoth Hayle and Bristol Steam Packet Companies amalgamated around 1860, probably as a result of traffic diminishing. The company undertook voluntary liquidation following a meeting of the shareholders on 6 November 1861. Steamer services continued, and attempted competition with screw vessels. Having sold off the SS \"Cornubia\", Harveys built and owned the SS \"Bride\" of 1863 and SS \"Bessie\" of 1865. However, the two ships could not compete with rail travel for both passengers and freight, and were moved to other trades. \nThe Hayle to Bristol services reduced and were operated by \"Hosken, Trevithick, Polkinhorn and Company Ltd\" of Penzance which bought the screw steamer \"Norseman\" in 1893. The \"Norseman\" was replaced with the \"M.J. Hedley\", a steam coaster carrying passengers until 1917 on a weekly service linking Bristol, Hayle and Liverpool.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125341","title":"Sylvia Roll","body":"\nSylvia Roll\n\nSylvia Roll (born 29 May 1973) is a former German female volleyball player. She was part of the Germany women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 6th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125360","title":"Christina Schultz","body":"\nChristina Schultz\n\nChristina Schultz (born 10 November 1969) is a former German female volleyball player. She was part of the Germany women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 6th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125396","title":"Maria Kochwa","body":"\nMaria Kochwa\n\nMary Ayuma-Kochwa (born 23 October 1966) is a former Kenyan female volleyball player. She was part of the Kenya women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 11th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125402","title":"2015 World Masters (darts)","body":"\nThe seedings were finalised on completion on 31 August. For the fourth consecutive year, there are 32 seeds (an increase from 8 between 2007–2011) with the Top 16 exempt until the Last 32 stage.\nMen's Draw.\nLast 32 onwards.\nSets are best of 3 legs.\nWomen.\nThe seedings were finalised on completion of the 2014 French Open 29 August. The ladies seeds enter at the start of the competition however can not play each other until the quarter final stage.\nLadies Draw.\nLast 8 onwards.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125484","title":"Firefly protocol","body":"\nFirefly protocol\n\nFirefly protocol may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125500","title":"ICFR, Ltd.","body":"\nICFR, Ltd.\n\nICFR, Ltd. is a company registered in the United Kingdom. The company was founded on February 27, 2014. Although it is officially classified as a “private company limited by guarantee without share capital,” it is intended to act as an advocacy organization focusing on human rights. Its purpose is to “document cases of human rights violations and defend victims” through the use of domestic and international law and “UN human rights mechanisms.”\nIn furtherance of this goal it undertakes public relations and lobbying activities “to impose pressure on governments” that violate human rights, and provides “legal counsel and psychological support for victims of human rights violations.” The company is empowered by its articles of incorporation to fundraise and to contribute to other charities in furtherance of these goals.\nICFR’s official address is in the Westgate House, an office building in London that houses dozens of businesses and charities. Several of these organizations have been tied to extremist groups including the Muslim Brotherhood and Hamas. The most notable of these is the Cordoba Foundation, which Prime Minister David Cameron has described as a “political front for the Muslim Brotherhood.\"\nThe only officer of ICFR is Anas Altikriti, who serves as director. Altikriti, an outspoken supporter of the Muslim Brotherhood, is also president and founder of the Cordoba Foundation.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125525","title":"1976 in Macau","body":"\n1976 in Macau\n\nEvents from the year 1976 in Portuguese Macau.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125553","title":"Kuiba 2","body":"\nKuiba 2\n\nKuiba 2 () is a 2013 Chinese animated fantasy action adventure film directed by Chuan Wang. It was released on May 31, 2013. The film is part of the \"Kuiba\" film series, following \"Kuiba\" (2011) and preceding \"Kuiba 3\" (2014).\nReception.\nThe film earned at the Chinese box office.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125624","title":"Bill Shockley","body":"\nBill Shockley\n\nWilliam Albert “Bill” Shockley Jr. (March 13, 1937 – December 7, 1992) was an American football kicker and halfback who played for four seasons for four different teams, the New York Titans, Buffalo Bills, and the Pittsburgh Steelers. He played college football at West Chester University. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125662","title":"Mark McDowell","body":"\nMark McDowell\n\nMark McDowell (born October 8, 1962) is a Canadian diplomat and the first resident Ambassador of Canada to the Union of the Republic of Myanmar. He is considered an \"Asia hand\" and is a specialist in the fields of public diplomacy and digital diplomacy. He has been characterized as \"an unconventional diplomat\".\nEducation.\nAttracted by its “counterculture atmosphere”, McDowell attended Innis College at the University of Toronto. He received a MA from University of Toronto in East Asian Studies in 1988. He attended the Kennedy School of Government as a Fulbright Scholar, earning a Master of Public Administration in 2008, and stayed on as a visiting Research Scholar at the Ash Institute for Democratic Governance and Innovation.\nMyanmar.\nMcDowell was named Canada's first ever resident ambassador to Myanmar in March 2013. Because of the long period of sanctions imposed by Canada on Myanmar, the relationship between the two countries was very limited and cold.\nSince taking up his job in June 2013, relations have warmed considerably, with Canada naming Myanmar a priority country for both trade and aid and opening a visa office. Ambassador McDowell has focused much of his attention on supporting grassroots democracy and human rights organizations working on issues such as freedom of speech and voter and civic education. He has staked out a leading role for Canada in the area of federalism and minority rights, and in the promotion of LGBT rights in this laboratory for democracy. Canada has also started to cooperate on security related issues like border management and prevention of human trafficking.\nThe Embassy of Canada has had success in rapidly raising Canada's public profile in Burma, through both traditional and social media. 
Its Facebook presence has over 140,000 followers on its Burmese, English, and French pages.\nPublic Diplomacy and E-diplomacy.\nMcDowell is known as an innovator in public diplomacy and e-diplomacy. Canada’s Globe and Mail credits him with \"helping drag the Department of Foreign Affairs into the Internet age”, and Canada’s former Ambassador to China called him “among the most original of thinkers when it comes to using social media”.\nE-diplomacy.\nAmbassador McDowell is a frequent speaker and participant in e-diplomacy conferences, offering a practitioners perspective. In 2015 he spoke at events organized by the foreign ministries of Armenia and the Netherlands.\nHe is known for starting Canada's social media presence in China with \"canadaweibo\" on the Chinese Sina Weibo platform (see www.weibo.com/canadaweibo). Canadaweibo grew from zero to 400,000 followers within two years, becoming the second largest and most influential embassy site in China after the USA’s. Similarly, he has made social media a priority during his posting in Myanmar (see www.facebook.com/CanadainBurma).\nMcDowell's work in e-government is longstanding. He gave the government of Canada's address to the United Nations World Summit on the Information Society in 2002. At that time he also took a leading role in initiatives in Canada related to getting Aboriginal communities online, and disseminating news about the international activities of Canadian Aboriginal peoples.\nPublic Diplomacy.\nMcDowell has worked on public diplomacy throughout his diplomatic career, and was a Director of Public Diplomacy and Domestic Outreach in Canada’s Department of Foreign Affairs.\nHe wrote a brief primer on public diplomacy based on a talk he delivered at the 100th Anniversary Edward R. Murrow Memorial Conference at the Fletcher School for Law and Diplomacy (see www.fletcherforum.org/2012/07/26/32-3/). 
In a 2010 talk at the Fletcher School on the connection between domestic outreach and public diplomacy abroad, he coined the concept of \"total diplomacy\", engaging and partnering with segments of the domestic audience to achieve foreign policy goals. McDowell has been connected with “panda diplomacy” for his work in bringing a pair of Chinese pandas to Canada, and “sports diplomacy” for his public diplomacy in Burma connected with the traditional Burmese sport of chinlone.\nA conversation with McDowell forms one of the chapters of Chinese public diplomacy thinker Zhao Qizheng’s 2012 book “The Wisdom of Public Diplomacy: Cross-Border Dialogues”.\nPrevious Diplomatic Career.\nTaiwan.\nMcDowell served in Taipei from 1997-2001.\nAboriginal Affairs.\nMcDowell was deputy Director for Aboriginal Affairs in the Global Issues Bureau from 2001-2003.\nThailand.\nMcDowell was posted in Thailand from 2003-2007. He managed the Embassy throughout the Indian Ocean Tsunami crisis. During McDowell’s term in Thailand, there was significant unrest in the south of the country, attributed to Muslim terrorist groups. McDowell led Canada’s engagement in this region.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125664","title":"State of Things","body":"\nState of Things\n\nState of Things () is a 1995 Romanian drama film directed by Stere Gulea. The film was selected as the Romanian entry for the Best Foreign Language Film at the 69th Academy Awards, but was not accepted as a nominee.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125688","title":"Murat Özçelik","body":"\nMurat Özçelik\n\nMurat Özçelik (born 1 January 1954) is a Turkish politician, civil servant and diplomat from the Republican People's Party (CHP), who has served as a Member of Parliament for İstanbul's third electoral district since 7 June 2015. He served as the Deputy Leader of the CHP responsible for foreign relations between 3 November 2014 and 11 November 2015. He was part of the CHP delegation during coalition negotiations with the Justice and Development Party following the June 2015 general election. Before entering politics, Özçelik served as the Turkish Consul General at Shanghai from 1997 to 1998, as the Turkish Ambassador to Iraq from 2009 to 2011 and as the Undersecretary of Public Order and Security from 2011 to 2012.\nEarly life and career.\nMurat Özçelik was born on 1 January 1954 in Ankara and graduated from TED Ankara College before going on to study at the Department of Management at the Middle East Technical University (OTDÜ) Faculty of Economics and Administrative Sciences. He is married with two children.\nCivil service career.\nÖzçelik started working at the Ministry of Foreign Affairs in 1983. Between 1990 and 1992, he served as the Cabinet Chief for Turgut Özal, the then-President of Turkey. After serving at numerous other positions, he became the department manager at the Office of Information in 2005, serving concurrently as the foreign affairs deputy spokesperson. On 16 November 2011, he was appointed as the Undersecretary of Public Order and Security. Following a public statement by Özçelik, in which he claimed that he was being pressrued into not doing his job the way he wanted and that he wanted to resign, the government removed him from the position on 17 May 2012. 
He was subsequently appointed as an advisor at the Foreign Ministry and subsequently retired there.\nDiplomatic career.\n2 January 1997, Özçelik became the Turkish Consul General at Shanghai, a position in which he served until 22 September 1998. On 26 December 2006, he became the Assistant Special Representative to Iraq. He became the Special Representative to Iraq in 2007 and was appointed as the Ambassador to Iraq in 2009. He was removed from this position on 22 October 2011 upon the decision of the government.\nPolitical career.\nÖzçelik was a candidate to become a member of the Party Council of the Republican People's Party (CHP) during the party's 18th Extraordinary Convention held on 7 September 2014. However, he failed to win enough votes to enter the council, resulting in the party leader Kemal Kılıçdaroğlu appointing him as a personal advisor. It was alleged that Özçelik had stated in a closed meeting that he had voted for the Peoples' Democratic Party (HDP), though had the support of Kılıçdaroğlu since it was perceived that Kılıçdaroğlu wanted to give the task of forming a strong foreign policy to Özçelik. Numerous members of the party council who won a higher number of votes subsequently resigned from their positions in order to allow Özçelik to take a seat, which he did in October 2014. On 3 November 2014, he was appointed as the Deputy Leader of the CHP responsible for foreign relations. In the June 2015 general election, he was elected as a Member of Parliament for İstanbul's third electoral district. During a Party Council meeting on 24 August 2015, it was alleged that Özçelik had an argument with rival council member Durdu Özbolat, developing into a fight between the two men. This, as well as the fact that Özçelik had not been elected through a nomination primary before the June 2015 election, allegedly contributed to Kılıçdaroğlu's decision to not put him forward as a candidate for the November 2015 general election. 
Özçelik subsequently resigned his Deputy Leader position, but withdrew his resignation shortly after. He resigned as Deputy Leader and from the Party Council on 11 November 2015.\nControversy.\nÖzçelik has been controversial within the CHP for allegedly being in favour of an independent Kurdistan on the southeastern borders of Turkey. He has also been described as having close sympathies with the pro-Kurdish Peoples' Democratic Party (HDP), whom he claimed he, his family and his friends voted for in the June 2015 general election.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125715","title":"The Springing Tiger","body":"\nThe Springing Tiger\n\nThe Springing Tiger is a historical account of the Indian National Army published in 1959. Authored by Col Hugh Toye. The book was published in London by Cassell Publishers, and is considered one of the first Sympathetic Western accounts of the army. Toye worked as an intelligence officer in World War II in Burma, and was tasked with interrogating captured soldiers of the INA by the CSDIC(I). The book is provided with a foreword by Phillip Mason, who in 1946 was the Secretary of the War department in India. The book describes in detail the formation of the INA under the auspices of the F Kikan of Japanese intelligence through the collapse and subsequent revival of the army under Subhas Chandra Bose, its role in the Battles of Imphal and Kohima and the subsequent collapse in the face of Allied Burmese offensive before ending with the death of Subhas Chandra Bose.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125718","title":"William M. Feigenbaum","body":"\nWilliam M. Feigenbaum\n\nWilliam Morris Feigenbaum (December 25, 1886 – April 23, 1949) was an American statistician, journalist and politician from New York.\nLife.\nHe was born on December 25, 1886, in Antwerp, Belgium, the son of Benjamin Feigenbaum (1859–1932) and Matilda (Kaminsky) Feigenbaum, both originally from Warsaw. The family emigrated to the United States and settled in Brooklyn where he attended the public schools and Boys High School. He graduated A.B. from Columbia College in 1907, and A.M. from Columbia University in 1908. He also took courses at Dartmouth College, Wisconsin University and National University School of Law. From 1909 to 1912, he worked in the Bureau of Statistics and Accounts of the Interstate Commerce Commission in Washington, D.C.. In 1912, he returned to New York and worked for the New York Public Service Commission (1st D.).\nHe was a member of the Socialist Party of America. In November 1916, he ran for Congress in the 10th District, but was defeated by the incumbent Republican Reuben L. Haskell.\nIn November 1917, he was elected to the New York State Assembly (Kings Co., 6th D.), defeating the incumbent Republican Nathan D. Shapiro. Feigenbaum polled 3,694 votes, Shapiro polled 3,184 votes, and Democrat Martin Solomon polled 2,217. Feigenbaum was one of ten Socialist members of the 141st New York State Legislature in 1918.\nAfterwards he became the associated editor of \"The New Leader\", and wrote for several newspapers and political magazines.\nIn 1930 and 1932, he ran for the New York State Senate (4th D.) but was defeated both times by Democrat Philip M. Kleinfeld. \nHe died on April 23, 1949, at the Montgomery Nursing Home in Brooklyn.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125759","title":"Iceni Academy (Colchester)","body":"\nIceni Academy (Colchester)\n\nIceni Academy is a junior school in the Shrub End suburb of Colchester. This school was formerly King's Ford Junior School but changed to an Academy status. Children from King's Ford Infant School are the main feeders on to this junior school.\nHistory.\nIceni Academy use to be King's Ford Junior School. However, governors and school representatives made the decision to convert King's Ford into an academy. During the time when the school was King's Ford, the school made poor progress and the school had a bad reputation with scoring low scores with Ofsted. \nOfsted and School Problems.\nKing's Ford were in and out of special measures. In 2012, they received Ofsted Satisfactory, however, in 2014, the school scored Inadequate and required special measures.\nBright Future and Catchment.\nIceni Academy hope to put away the bad memories and start fresh. The catchment area for Iceni Academy is within the Shrub End area. Most children after Year 6 would leave for Thomas Lord Audley School, Philip Morant School and College or the Stanway School.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125763","title":"The Man Who Had His Hair Cut Short (film)","body":"\nThe Man Who Had His Hair Cut Short (film)\n\nThe Man Who Had His Hair Cut Short () is a 1966 Belgian drama film directed by André Delvaux, starring Senne Rouffaer and Beata Tyszkiewicz. It tells the story of a schoolteacher who falls in love with one of his students, and moves away in order to escape his infatuation. The film is based on the 1947 novel with the same title by Johan Daisne.\nThe film was awarded the Sutherland Trophy at the 1966 BFI London Film Festival.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125766","title":"Felix (1996 film)","body":"\nFelix (1996 film)\n\nFelix () is a 1996 Slovenian drama film directed by Božo Šprajc. The film was selected as the Slovenian entry for the Best Foreign Language Film at the 69th Academy Awards, but was not accepted as a nominee.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125787","title":"Al-Rawda, Tartus","body":"\nAl-Rawda, Tartus\n\nAl-Rawda (; also spelled \"Rauda\") is a small town in northwestern Syria, administratively part of the Tartus Governorate. It is situated along the Mediterranean coast and just west of the Syrian Coastal Mountains in between Tartus (to the south) and Baniyas (to the north). According to the Syria Central Bureau of Statistics (CBS), al-Rawda had a population of 3,131 in the 2004 census. It is the administrative center of the Rawda Subdistrict (\"nahiyah\") which consisted of nine localities with a collective population of 11,688. Its inhabitants are predominantly Christians, from various denominations.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125794","title":"Betzy Akersloot-Berg","body":"\nBetzy Akersloot-Berg\n\nBetzy Rezora Akersloot-Berg (16 December 1850, Aurskog - 18 December 1922, Oost-Vlieland) was a Norwegian-born seascape and landscape painter who spent most of her career on a small island in Friesland.\nBiography.\nShe was born to a landowning family. Later, they moved to Christiania where her father became a businessman. Originally, she trained as a nurse, then worked as a combination nurse and missionary among the Sami in Finnmark. However, she found herself attracted to painting and ultimately decided to take lessons at the \"Statens håndverks- og kunstindustriskole\", where she studied with Wilhelm von Hanno and Frits Thaulow. Later, she worked with Otto Sinding and followed him when he moved to Munich in Germany.\nDuring a trip to Vienna, she saw some works by the Dutch marine painter, Hendrik Willem Mesdag, which greatly impressed her. In 1885, she had a chance meeting with him and his family. This led to studies with him at his workshop in The Hague. She became close friends with his wife, Sientje van Houten, who painted a portrait of her. In 1890, she studied briefly with Puvis de Chavannes in Paris.\nThrough them, she met Gooswinus Gerardus Akersloot (1843-1929), the former mayor of Hoevelaken, who had recently lost his wife. They were married in 1893 and, three years later, settled in Oost-Vlieland where they bought the oldest house in town and named it \"Tromp's Huys\", after Admiral Cornelis Tromp. Although isolated, she travelled every summer and was able to participate in exhibitions throughout Western Europe as well as in Czechoslovakia. She remained there until her death in 1922. In addition to painting, she ran a Sunday School and a sewing society for girls.\n\"Tromp's Huys\" became a museum in 1956. 
Most of her approximately 300 works are kept there and sent out for exhibits, including a major retrospective at the Noordelijk Scheepvaartmuseum in 1992, a special exhibition at her birthplace in Aurskog in 1996, and another at the Nordkappmuseet in Honningsvåg, near the place where she worked with the Sami, in 2004.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125812","title":"2008–09 Glasgow Warriors season","body":"\n2008–09 Glasgow Warriors season\n\nThe 2008-09 season saw Glasgow Warriors compete in the competitions: the Magners Celtic League and the European Champions Cup, the Heineken Cup.\nCompetitions.\nMagners Celtic League.\nResults.\nThe all-Welsh fixtures were played mid-week to allow their teams to compete in the Anglo-Welsh Cup.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125836","title":"Bwana (film)","body":"\nBwana (film)\n\nBwana is a 1996 Spanish drama film directed by Imanol Uribe. The film was selected as the Spanish entry for the Best Foreign Language Film at the 69th Academy Awards, but was not accepted as a nominee.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125846","title":"Miles Thompson","body":"\nMiles Thompson\n\nMiles Thompson (born December 8, 1990) is an American professional lacrosse player who played for the University at Albany in NCAA Division I college lacrosse and plays for the Iroquois Nationals in international competition and the Florida Launch of Major League Lacrosse. He won the Tewaaraton Trophy in 2014 (co-winner with his brother Lyle). \nEarly life.\nMiles grew up in the Onondaga Nation, NY, to Doloris and Jerome Thompson. He was one of five children in the family, which included brothers Jeremy and Lyle, and cousin Ty; all four of whom played collegiate lacrosse at an elite level. Miles attended LaFayette High School, and was a standout in their Varsity lacrosse program. After graduation, Miles then attended the University of Albany in Albany, New York, and played alongside his cousin Ty. His brother Jeremy played lacrosse at Syracuse University, while his younger brother Lyle attended LaFayette High School.\nCollege.\nMiles (along with his brother Lyle) is the first Native American player to win the Tewaaraton Trophy; \"tewaaraton\" is the Mohawk term for the precursor of modern lacrosse.\nAs a player for the Iroquois Nationals in the 2014 World Lacrosse Championship, Miles and Lyle helped the Nationals place third, their best-ever result in international competition.\nFlorida Launch.\nMiles Thompson was drafted in the third round, 20th overall in the 2014 MLL Draft by the Rochester Rattlers. He was then traded to the Florida Launch, and was on the active roster with them in their inaugural season. In 2015, the Launch selected Miles' brother Lyle first overall in the 2015 MLL Draft. The brothers' first game together was against the Ohio Machine. They both played a total of eight games for the Launch in the 2015. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125879","title":"Policy Aptitude Test","body":"\nPolicy Aptitude Test\n\nThe Policy Aptitude Test (PAT) is an offline written test held in India. This test scores a person on the bases of \"General Knowledge\", \"Numerical Problem Solving\", \"Policy Aptitude\", \"Logical Reasoning\", \"English Language\" and \"Policy Analysis Ability\". The National Law School of India University, Bengaluru (NLSIU) started this exam and use the test for selecting students for its Public Policy Programme. The test is conducted every year.\nExam format.\nPolicy Aptitude Test (PAT) have two parts. First part is multiple choice section with negative marking. Second part is descriptive analytical writing about a policy issue. Only those who obtain minimum of 40% of marks in the first part will be evaluated for the second part.\nFirst part of Policy Aptitude Test have five components: General Knowledge, Numerical Problem Solving, Policy Aptitude, Logical Reasoning and English Language. Each component have 20 questions. Each question carries 1 mark, and negative marking is -0.25. All components have equal weight.\nSecond part of Policy Aptitude Test is for 50 marks and it concerns descriptive writing about an issue that is provided. The second part examine candidate's policy analysis ability as well as English comprehension. Both parts together, Policy Aptitude Test carries 150 marks. Total duration of Policy Aptitude Test is of two hours.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125890","title":"Dual fluid reactor","body":"\nDual fluid reactor\n\nThe Dual Fluid Reactor (DFR) is the project of a private German research institute, the Institute for Solid-State Nuclear Physics, combining the advantages of the molten salt reactor with the ones of the liquid metal cooled reactor: The fuel is in a liquid metal or molten chloride salt solution, while the cooling is provided by liquid lead. As a fast breeder reactor, the DFR can burn both natural uranium and thorium, as well as recycle nuclear waste. Due to the high thermal conductivity of the molten metal, the DFR is an inherently safe reactor (the decay heat can be removed passively).\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125891","title":"J. Henry Bennett","body":"\nJ. Henry Bennett\n\nJ. Henry Bennett was a member of the Wisconsin State Senate.\nBiography.\nBennett was born on November 18, 1876 and died on April 29, 1956. He was buried in Viroqua, Wisconsin.\nCareer.\nBennett was first elected to the Senate in 1914. Additionally, he was District Attorney of Vernon County, Wisconsin. He was a Republican.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125896","title":"Henriette (1803 ship)","body":"\nHenriette (1803 ship)\n\n\"Henriette\" was a French privateer commissioned in Bordeaux in late 1803. She served in the Bay of Biscay until mid-1804, and then in the Indian Ocean, based at Île de France (now Mauritius). The 74-gun HMS \"Powerful\" captured her in June 1806 off Ceylon.\nFrench service.\nCommissioned in late 1803 under Thomas Henry (or Henri), \"Henriette\" cruised in the Bay of Biscay until June 1804. She then crossed to Île de France, where she undertook three cruises, capturing several large British merchantmen.\nSoon after his arrival at Île de France on 17 August, Henry left Port Louis on a cruise, only to have to return quickly, pursued by and .\nHenry then embarked on 12 September on the first of two more successful cruises. Apparently some of \"Henriette\"s guns, two 12-pounder carronades, came from the East Indiaman \"Admiral Aplin\", which the French privateer \"Psyche\" had captured in January.\nOn 12 October he captured the \"Faza-Soubany\" (or \"Fazzy Soubani\"), of 500 tons (bm), Fryer, master, sailing from Bombay to Bengal.\nThen on 26 October he captured the \"Friendship\". \"Friendship\", of two guns and 380 tons, was carrying a cargo of rice, indigo, and cotton. \nThe next day Henry captured the \"Sha Allum\", of two guns and 380 tons. She was carrying pepper, indigo, and cotton. Two days later he captured the \"Marguerite\", of two guns and 280 tons. She was carrying sugar, indigo, and cotton. \nOn 12 November Henry captured the \"James Sybald\", of ten guns and 1,000 tons; she had a cargo of rice. (\"James Sibald\" had been sailing from Bengal to Bombay.) \"Henriette\" then returned to Port Louis on 10 December.\nHenry and \"Henriette\" left on their second cruise on 9 January 1805. On 3 February they captured the East Indiaman \"Coromandel\". \"Coromandel\" was described as being of 450 tons and armed with fourteen 9-pounder guns. 
\nIn May 1806 \"Lloyd's List\" reported that the French privateers \"Bellone\" (under Jacques François Perroud), \"Henriette\", and \"Caroline\" (under Nicolas Surcouf) had captured a number of merchantmen in the Bay of Bengal: \nThe privateers gave up the \"Robust\" to their prisoners. She arrived at Bengal on 4 December 1805.\nOn 17 September 1805 Henry captured the \"Viper\", of eight guns and 12 swivel guns. \"Lloyd's List\" reported that \"Henrietta\" had captured \"the East India Company's Brig the Viper\" at . A month later, on 13 November, \"Henriette\" captured the \"Phoenix\", of 600 tons. \"Henriette\" returned to Port Louis on 26 March 1806.\nIn April 1806, command of \"Henriette\" passed to Auguste Sagory. \"Henriette\" left Port Louis on 7 April, and on 6 May captured the \"Dawetz-Nissaint\" on 6 May.\nFate.\nOn 13 June HMS \"Powerful\" captured \"Henriette\" off Trincomalee, Ceylon (now Sri Lanka). \"Powerful\" had received intelligence of her presence in the area and had set out from Trincomalee on the 11th and had sighted \"Henriette\" on the morning of the 13th. After an 11-hour chase, during which \"Henriette\" fired her stern guns at \"Powerful\" without effect, \"Powerful\" succeeded in catching up to her quarry, which surrendered without further combat. During the chase, \"Henriette\"s crew had thrown four of her 6-pounder guns overboard in an attempt to lighten her and so gain speed. Head money was paid for \"Henriette\" in January 1814.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125909","title":"Mister Transmission","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48125912","title":"Adriana Pop","body":"\nAdriana Pop\n\nAdriana Pop (born Adriana Rednic; October 22, 1965) is a French-Romanian gymnastics choreographer and former rhythmic gymnast.\nCareer.\nAdriana Rednic was born on October 22, 1965 in the Romanian city of Baia Mare. After taking dancing classes for six years, Adriana was directed into artistic gymnastics classes, joining a club in her city. Afraid of the uneven bars and vault, Pop quickly found that dancing her gift; rather than apparatus gymnastics. Soon after, she was directed into rhythmic gymnastics. At the age of thirteen, in 1979, she joined the Romanian National team in Bucharest.\nPop states, \"The music is important for me because from the music comes the idea for the routine.\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125944","title":"It Could Happen to You (1939 film)","body":"\nIt Could Happen to You (1939 film)\n\nIt Could Happen to You is a 1939 American comedy film directed by Alfred L. Werker and written by Lou Breslow and Allen Rivkin. The film stars Stuart Erwin, Gloria Stuart, Raymond Walburn, Douglas Fowley, June Gale and Clarence Kolb. The film was released on June 8, 1939, by 20th Century Fox.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125964","title":"Raïs Neza Boneza","body":"\nRaïs Neza Boneza\n\nRais Neza Boneza is a Congolese writer and poet (1979). \nHe was born in the Katanga province in Democratic Republic of Congo (Former Zaïre). He is the author of fiction, poetry, articles and academic materials. He is also a peace activist and practitioner. For his contribution to peace and conflict transformation, he was awarded an honorary doctorate degree (Honoris causa) from the Institute of management sciences (ISGM) and the Universite du CEPROMEC in Burundi 2008. He hold a BA in Social Sciences and Master in Humanities from the Derby University.\nHe is co-convener for Africa of the TRANSCEND Global Network; a Peace Development Environment Network. His debut novel \"“White Eldorado, Black Fever”(2013)\" is the only work which has been originally translated from his French native language “ \"Eldorado blanc, Fievre Noire”(2013)\". In his debut novel, he taps in his artistic background, a peace researcher and practitioner to create a work of fiction and fact to bring in the awareness about the conflict-resources direct effects to communities in the Great-Lakes region of Africa.\nReferences.\nAuthor website\nGLOBAL TORMENT\nLa liste d'ecrivains africains par pays\nTRANSCEND Network for Peace and Development\nRais Neza Boneza, Norwegian\nTV show:Emission Majuscule/15 January 2015\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125965","title":"Skoronski","body":"\nSkoronski\n\nSkoronski is a surname. Notable people with the surname include:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125982","title":"Kōriyama City Museum of Art","body":"\nKōriyama City Museum of Art\n\n opened in 1992 in Kōriyama, Fukushima Prefecture, Japan. The collection includes works by Gainsborough, Constable, Turner, Burne-Jones, and Waterhouse, Shiba Kōkan, Takahashi Yuichi, Fujishima Takeji, and Kishida Ryūsei, as well as of artists associated with Kōriyama.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48125985","title":"Ednah Chepngeno","body":"\nEdnah Chepngeno\n\nEdnah Chumo Chepngeno (born 15 July 1977) is a former Kenyan female volleyball player. She was part of the Kenya women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 11th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126024","title":"Margaret Indakala","body":"\nMargaret Indakala\n\nMargaret Indakala (born 24 August 1962) is a former Kenyan female volleyball player. She was part of the Kenya women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 11th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126036","title":"Jacqueline Makokha","body":"\nJacqueline Makokha\n\nJacqueline Makokha or Jackline Makokha (born 15 November 1974) is a former Kenyan female volleyball player. She was part of the Kenya women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 11th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126044","title":"PS Gael (1867)","body":"\nPS Gael (1867)\n\nPS \"Gael\" was a passenger vessel operated by the Great Western Railway from 1884 to 1891 \nHistory.\nThis paddle steamer was launched on 9 March 1864 and completed completed on 11 February 1867 She was named by Miss Minnie Galbraith, daughter of Andrew Galbraith Esq, Johnstone Castle, ex-Provost of Glasgow and spent most of her years in Scotland. She was owned by the Clyde and Campbeltown Steam Packet Joint Stock Company.\nShe was bought in 1884 and operated by the GWR, mainly on its Weymouth routes but also for a time at Milford Haven and from 1887 - 1889 at Penzance for the West Cornwall Steam Ship Company. In 1891 she returned to the Clyde for duties on routes from Glasgow to Oban, Tobermory and Gairloch.\nShe was scrapped in 1924.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126051","title":"Tatyana Gordeyeva","body":"\nTatyana Gordeyeva\n\nTatyana Vladimirovna Gordeyeva (; born June 3, 1973 in Volgograd) is a retired Russian heptathlete. She has won a total of two medals, a silver and a bronze, in heptathlon at the European Cup Super League, and has been selected to compete for Russia at the 2004 Summer Olympics, but later withdrew from the meet after falling at one of the hurdles in the opening heat. Gordeyeva trained under the tutelage of head coach Mikhail Zatselyapin for the national track and field team in combined events, while serving as a member of the Russian Army in her native Volgograd.\nGordeyeva qualified for the Russian squad, along with her teammates Yelena Prokhorova and Svetlana Sokolova, in the women's heptathlon at the 2004 Summer Olympics in Athens. She attained the IAAF Olympic \"A\" standard and a season best of 6235 points at the national meet in Tula to book her place on the Russian team in track and field. Coming to the Games with a number of sustained injuries, Gordeyeva attempted to clear one of the hurdles, and instead crashed straight into it. Thus, she did not finish the 110-metre hurdles heat, and later withdrew from the competition.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126098","title":"Dorcas Nakhomicha Ndasaba","body":"\nDorcas Nakhomicha Ndasaba\n\nDorcas Nakhomicha Ndasaba (born 31 March 1971) is a retired Kenyan female volleyball player. She was part of the Kenya women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 11th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126121","title":"Nancy Waswa","body":"\nNancy Waswa\n\nNancy Lusanji Waswa (born 28 December 1971) is a retired Kenyan female volleyball player. She was part of the Kenya women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 11th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126128","title":"Political Science (disambiguation)","body":"\nPolitical Science (disambiguation)\n\nPolitical Science is a social science dealing with politics and systems of government.\nPolitical Science may also refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126130","title":"Doris Wanjala","body":"\nDoris Wanjala\n\nDoris Wanjala-Wefwafwa (24 December 1966 – 11 December 2007) was a Kenyan female volleyball player. She was part of the Kenya women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 11th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126134","title":"Deborah Frances-White","body":"\nDeborah Frances-White\n\nDeborah Frances-White is a comedian and writer who regularly delivers seminars to women in business on subjects including charisma, diversity and inclusion. She has both British and Australian citizenship.\nEarly life.\nDeborah was born in Australia and adopted at ten days old. She moved to the UK and attended Oxford University and founded improv theatre company The Spontaneity Shop of which she is still a director.\nReligion.\nDeborah became a Jehovah's Witness while still a teenager. Her years in the religion and how she left it were the focus of her 2012 Edinburgh Fringe stand-up comedy show and one of the episodes of her BBC Radio 4 show \"Deborah Frances-White Rolls the Dice\".\nCareer.\nAfter developing a number of improvisation formats at The Spontaneity Shop (including the improvised romantic comedy DreamDate which had a pilot made for ITV) Deborah turned to stand-up comedy. Her first significant solo show was \"How to Get Almost Anyone to Want to Sleep With You\" which she performed at The Edinburgh Festival Fringe in 2007 and at The Melbourne International Comedy Festival in 2008 where she also hosted The Melbourne International Comedy Festival Roadshow.\nDeborah's recent shows have been more personal. \"Cult Following\" (2012) dealt with her experiences as a teenage Jehovah's Witness, \"Half a Can of Worms\" (2013) was about tracking down her biological family and \"Friend of a Friend of Dorothy\" (2015) was about feminism, sexism and homophobia.\nDeborah has continued to develop new improvisation formats. \"Voices in Your Head\" is a show which allows comedians, improvisers and actors to create comedy characters while the audience watches. Guests have included Phill Jupitus, Sara Pascoe, Russell Tovey, Mike McShane, Hannibal Buress and others. 
In 2015 she created \"The Beau Zeaux\" a long-form improvised comedy featuring a rotating cast including Marcus Brigstocke, Thom Tuck, Rachel Parris, Brendan Murphy, Ed Coleman, Milly Thomas and Pippa Evans. Guests have included Russell Tovey and Dan Starkey.\nHer BBC Radio 4 series \"Deborah Frances-White Rolls the Dice\" was broadcast in spring 2015 and featured stories about her adoption, green card marriage, and quest to find her biological family. The episodes were titled Half a Can of Worms, Cult Following, Visa Issues and Who's Your Daddy? In January 2016, The Writers Guild of Great Britain awarded Deborah Best Radio Comedy at their annual ceremony.\nCorporate Work.\nDeborah also regularly appears at corporate events speaking about confidence, charisma, diversity and sexism. Her TEDx talk on Charisma vs Stage-Fright was cited by James Caan as the secret of his presenting skills.\nWriting.\nDeborah is also a screenwriter with commissions from Fox Searchlight, Redwave Films, FremantleMedia, ITV Studios, the BBC and Channel 4. With her writing partner Philippa Waller, she contributed an episode of Young Dracula in 2014. She has co-written two books: \"The Improv Handbook\" with Tom Salinsky and \"Off the Mic\" with Marsha Shandur both published by Bloomsbury. Deborah writes for Standard Issue Magazine.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126135","title":"Ithinumappuram","body":"\nIthinumappuram\n\nIthinumappuram is a Malayalam film released on 18 September 2015 by Agna Media. It is directed, written and produced by Manoj Alunkal. It stars Riyaz Khan and Meera Jasmine in the lead roles.\nPlot.\nThe film follows a girl named Rukmini Nair, played by Meera Jasmine, who is born and brought up in an affluent family. Rukmini's horoscope indicates she is a girl with \"Chovva Dosham\", meaning she was born under a bad sign. When she marries someone her husband will die soon, and so her family must work very hard to find a groom. By luck, Rukmini's family finds a match. However, Rukmini falls in love with a man who works in her home, Karthikeyan (played by Riyaz Khan) and elopes with him against her family's wishes.\nKarthikeyan had set his eyes on Rukmini's inheritance from her family. When he discovers that Rukmini’s family has disinherited her, he becomes enraged and reveals his true colors. Rukmini bore his two children, but is subjected to severe ill treatment by her husband. Though she is strong-willed, she silently bears the abuse and domestic violence. Eventually, Karthikeyan disavows her and elopes with another young woman named Devu, who works alongside him in a factory. Meanwhile, Rukmini is left pregnant with Karthikeyan's third child. The film then follows Rukmini as she deals with subsequent hardships. \nCast.\nCast of the movie:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126151","title":"Emily Wesutila","body":"\nEmily Wesutila\n\nEmily Wesutila (born 8 March 1973) is a retired Kenyan female volleyball player. She was part of the Kenya women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 11th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126160","title":"Clyde Docks Preservation Initiative","body":"\nClyde Docks Preservation Initiative\n\nThe Clyde Docks Preservation Initiative is a non-profit organisation set up in 2015 to establish a lead organisation in efforts to preserve the derelict Govan Graving Docks, Glasgow, Scotland (and other maritime sites on the River Clyde) as a heritage asset for future generations. The organisation aims to restore Govan graving docks as a shipbuilding and maritime heritage park in recognition of the maritime and shipbuilding heritage of the city.\nGovan Graving Docks has been abandoned since closing down in 1987 and while a number of redevelopment proposals for the site have been put forward since none have yet come to fruition.\nThe organisation is working to remedy what it sees as a lack of protection and recognition being afforded to various sites along the River Clyde. Glasgow once led the world in shipbuilding but now the only notable remaining trace of the city's industrial past is the Finnieston Crane and the remaining shipyards at Govan and Scotstoun.\nAs well as preserving the heritage CDPI aims to create a social enterprise / micro-enterprise hub, a cultural quarter and an ecology park area at Govan graving docks along with full restoration of the dry docks to working order and a facility for maintenance of historic ships.\nThe organisation has attracted attention in local and national media, most notably articles in The Sunday Herald, The Big issue magazine and a previous article in the Maritime Journal \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126162","title":"Fernand Ouellette","body":"\nFernand Ouellette\n\n Fernand Ouellette is a French Canadian writer. He is a four-time winner of the Governor General's Awards, having won the Governor General's Award for French-language non-fiction at the 1970 Governor General's Awards for \"Les actes retrouvés\" and at the 1976 Governor General's Awards for \"Les Bas Canada 1791-1840, changements structuraux et crise\", the Governor General's Award for French-language fiction at the 1985 Governor General's Awards for \"Lucie ou un midi en novembre\", and the Governor General's Award for French-language poetry at the 1987 Governor General's Awards for \"Les Heures\".\nLife.\nHe was born in Montreal on 24 September 1930.\nOuellette's papers are kept at the National Library and Archives of Canada in Ottawa.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126177","title":"Fiorella Aíta","body":"\nFiorella Aíta\n\nFiorella Aíta (born 13 July 1977) is a retired Peruvian female volleyball player. She was part of the Peru women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 11th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126188","title":"Milagros Cámere","body":"\nMilagros Cámere\n\nMilagros Camere (born 22 September 1972) is a retired Peruvian female volleyball player. She was part of the Peru women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 11th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126207","title":"Patricia Soto","body":"\nPatricia Soto\n\nDiana Patricia Soto (born 10 February 1980) is a retired Peruvian female volleyball player. She was part of the Peru women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 11th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126224","title":"Milagros Jessenica Uceda","body":"\nMilagros Jessenica Uceda\n\nMilagros Jessenica Uceda (born 14 August 1981) is a retired Peruvian female volleyball player. She was part of the Peru women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 11th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126249","title":"1939 Notre Dame Fighting Irish football team","body":"\n1939 Notre Dame Fighting Irish football team\n\nThe 1939 Notre Dame Fighting Irish football team represented the University of Notre Dame during the 1939 college football season.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126256","title":"Janet Vasconzuelos","body":"\nJanet Vasconzuelos\n\nJanet Daria Vasconzuelo or Janet Daria Vasconzuelos (born 4 July 1969) is a retired Peruvian female volleyball player. She was part of the Peru women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 11th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126272","title":"Muthuswamy","body":"\nMuthuswamy\n\nMuthuswamy is a Tamil name and may refer to\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126278","title":"Mama (Emily Wells album)","body":"\nMama (Emily Wells album)\n\nMama is a studio album by Emily Wells. Released in 2012 through Partisan Records, it was largely well-received by critics. Bring the Noise called the release a \"fine example of what can happen when someone ignores the traditional boundaries of music genres.\" An acoustic version of \"Mama\" was released in on June 11, 2013 in the United States and United Kingdom through Partisan Records.\nCritical reception.\nMusic OMH gave \"Mama\" a score of 4/5/5, writing that the release \"has a freshness and vitality about it that proves startling.\" Beyond the songwriting, \"Impose Magazine\" praised her vocals in the album, writing that it was \"a voice that’s made precious while somehow also being distorted, raspy, repressed and hushed.\" \nGiving it a score of 80/100, In Your Speakers called the \"cathartic,\" writing that \"although Wells does not emulate her jazz and folk influences, she maintains the rawness and the passion of them, one being Bob Dylan.\" Bring the Noise praised the release, giving it 8/10 and calling it both \"one of the most interesting albums of the year so far,\" and a \"fine example of what can happen when someone ignores the traditional boundaries of music genres.\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126288","title":"Yulissa Zamudio","body":"\nYulissa Zamudio\n\nYulissa Noelia Zamudio Orl (born 24 March 1976) is a retired Peruvian female volleyball player. She was part of the Peru women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 11th. She was part of the Peru women's national volleyball team at the 2010 FIVB Volleyball Women's World Championship in Japan. She played with Alianza Lima.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126294","title":"Surasawadee Boonyuen","body":"\nSurasawadee Boonyuen\n\nSurasawadee Boonyuen (, born October 31, 1991 in Udonthani) is an Thai indoor volleyball. She is a member of the Thailand women's national volleyball team.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126296","title":"2009–10 Glasgow Warriors season","body":"\n2009–10 Glasgow Warriors season\n\nThe 2009-10 season saw Glasgow Warriors compete in the competitions: the Magners Celtic League and the European Champions Cup, the Heineken Cup.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126309","title":"Ayesha Dutt","body":"\nAyesha Dutt\n\nAyesha Shroff (born 5 June 1960) is a model, Bollywood actress and Film producer. She is the wife of popular Bollywood actor, Jackie Shroff and mother of Bollywood actor, Tiger Shroff.\nLife.\nShe was born to a Bengali, Ranjan Dutt, an Air vice marshall in Indian Air Force, and Claude Marie Dutt De Cavey, a Belgian.\nAyesha contested as the Miss Young World contest at Manila. She did not make it to the finals, but was elected the most popular girl at the contest by her fellow contestants. She began her career as a model and became successful.\nShe acted in a Bollywood film. She managed her 10% stake in Sony TV, which she sold in 2013.\nPersonal life.\nShe married her longtime boyfriend and Bollywood actor, Jackie Shroff on her birthday on 5 June 1987. She later turned into a film producer. The couple run a media company, Jackie Shroff Entertainment Limited. They jointly owned 10% shares in Sony TV since its launch until 2012 when they sold their stake and ended their 15-year-long association with Sony TV. The Shroffs have two children. They have two children, her elder son is Bollywood actor, Tiger Shroff (born 1990) and a daughter, Krishna (born 1993). \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126318","title":"Chung Sun-hye","body":"\nChung Sun-hye\n\nChung Sun-Hye or Jeong Seon-Hye (; born 17 December 1975) is a retired South Korean female volleyball player. She was part of the South Korea women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 8th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126320","title":"Seifudein Adem","body":"\nSeifudein Adem\n\nSeifudein Adem is a political economist from Ethiopia. He is the Associate Director of Institute of Global Cultural Studies at Binghamton University, where he has been teaching international relations and international political economy with a particular focus on Africa and Asia.\nEducation.\nSeifudein Adem graduated from Addis Ababa University in 1988, with a B.A. (Distinction), majoring in political science. He then left for Japan for further education, where he earned an M.A. in international relations from International University of Japan in 1994, and a Ph.D. in international political economy from University of Tsukuba in 1999.\nSeifudein Adem is proficient in English, Japanese, Russian, Afaan Oromo and Amharic. He also speaks some Chinese.\nCareer.\nSeifudein Adem served as an assistant lecturer at Addis Ababa University (formerly known as Haile Selassie I University), Ethiopia, from 1989 to 1992, and as a graduate teaching assistant at University of Tsukuba, Japan, from 1995 to 1999.\nAfter serving as a Foreign Scholar for two years, he was appointed as an Assistant Professor at University of Tsukuba in 2001. He held the positions of Foreign Scholar and Foreign Professor at University of Tsukuba until he completed his assignment in Japan in December 2005. He had also worked briefly at the United Nations University (UNU) in Tokyo as a researcher and an invited moderator /coordinator of UNU Global Seminars.\nIn January 2006, Seifudein Adem arrived at Binghamton University in Binghamton, New York, to work with Ali Mazrui at the Institute of Global Cultural Studies (IGCS). IGCS was founded by Mazrui in 1991. 
Adem was appointed as the Associate Director of IGCS also in 2006, with a joint teaching appointment in the Department of Political Science.\nWorks.\nSeifudein Adem's fields of interest include international relations of Africa, interactions between Africa and Asia and history and political economy of Ethiopia.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126348","title":"Eoh Yeon-soon","body":"\nEoh Yeon-soon\n\nEoh Yeon-soon (; born 12 December 1973) is a retired South Korean female volleyball player. She was part of the South Korea women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 8th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126381","title":"Kim Guy-hyun","body":"\nKim Guy-hyun\n\nKim Guy-hyun (; born 12 January 1975) is a retired South Korean female volleyball player. She was part of the South Korea women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 8th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126385","title":"C. J. Cochran","body":"\nC. J. Cochran\n\nCarl Howard \"C. J.\" Cochran, Jr. (born 17 September 1991) is an American professional soccer player plays as a goalkeeper for Atlanta Silverbacks in the North American Soccer League.\nCochran was born in Alpharetta, Georgia and played his earlier career with Georgia State Panthers before starting his professional career with Atlanta Silverbacks in 2015.\nPlaying career.\nEarly career.\nCochran started his career with a successful four years at Georgia State Panthers, where he achieved such records as posting the season's all-time record goals-against average of 1.33. Cochran also ended his National Collegiate Athletic Association career with the competition's third-most clean sheets of 11 and with the third-best single-season goals-against average of 1.47 in 2014. While at Georgia State, Cochran also won numerous awards during his time there which included the Sun Belt and College Sports Madness Independent Defensive Player of the Week awards and two Colonial Athletic Association Rookie of the Week awards. In total, Cochran played 4,345 minutes of action with Georgia State which involved 48 starts. With 188 saves during his time there, Cochran comes in the top-10 for most career saves with the Panthers.\nAtlanta Silverbacks.\nIn 2015, Atlanta Silverbacks offered Cochran a trial at the club. After starting pre-season as a trialist, Cochran signed a professional contract with the club. On 4 April 2015, Cochran made his debut for the Atlanta Silverbacks against Indy Eleven in a match that ended 1–1. On 7 July, Cochran was nominated for the NASL Play of the Week award for his save against Martin Nuñez of the Tampa Bay Rowdies.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126401","title":"Vladimir Tsyganko","body":"\nVladimir Tsyganko\n\nVladimir Vladimirovich Tsyganko (; ; also Țâganco, Tziganco, Tziganko or Țiganco; 1887 – 1937) was a Bessarabian, and later Soviet, politician. The son of a distinguished architect, and himself an engineer by vocation, Tsyganko entered politics shortly before the proclamation of a Moldavian Democratic Republic, when he earned a seat in the republican legislature (\"Sfatul Țării\"). He sided with the parliamentary Peasants' Faction, which supported left-wing ideals and pushed for land reform, being generally, and radically, opposed to the more right-wing Moldavian Bloc. Tsyganko was skeptical of the Bloc's plan to unite Bessarabia with Romania, although he possibly supported a federation. His uncompromising stance divided his Faction and led the Romanian Kingdom's authorities to identify him as a major obstruction to the unionist cause. \nIn November 1918, as the Bloc switched its support to unconditional unification and dissolved the regional government bodies, Tsyganko rejected the new regime and moved to Odessa. Allying himself to members of the White movement, with whom he set up a Committee for the Salvation of Bessarabia, attending the Paris Peace Conference to campaign for the reversal of the union. He later settled in Soviet territory, where he helped create a Moldavian Autonomous Soviet Socialist Republic; other members of his family opted to stay behind in Romania. In 1937, Tsyganko fell victim to the Great Purge.\nBiography.\nEarly career.\nTsyganko was born in Kishinev (Chișinău), regional capital of the Bessarabian Governorate, Russian Empire, and was a graduate of Riga Polytechnicum. He returned to his native city where his father Vladimir (? 
– 1919), an architect, designed such landmarks as the Ethnography Museum and Saint Nicholas Church; his brother Nikolai (Nicolai) Vladimirovich (born 1882) was the \"zemstvo\" engineer in Orhei, and from 1909 in Kishinev itself. By 1904, their father was the Director of Monastery Estates in Bessarabia, in which capacity he testified against Russian police after the Kishinev pogrom, accusing them of passivity. In 1916, the Bessarabian journalist Alexis Nour described Tsyganko Sr. as a \"much esteemed [...] Bessarabian intellectual of a Moldavian nationalist hue, but not a separatist\" (\"see Moldovenism\"). Also according to Nour, Nikolai, whom he met personally, could speak only Russian. Romanian politician Duiliu Zamfirescu, who met and debated with Vladimir Vladimirovich in 1918, claimed that the Tsygankos were \"Ruthenian\". He and his adversary talked in French, as Tsyganko \"could not speak a word of Romanian\".\nTsyganko reached political prominence after the October Revolution, which had left Bessarabia to administer itself independently, as a \"Moldavian Democratic Republic\". In January 1918, the local Soviet of Workers' and Soldiers' Deputies began to override the \"Sfatul Țării\" assembly (appointed the previous November) and attempted to bring about Bolshevik rule. This move was swiftly suppressed by a punitive expedition of the Romanian Army. The 3rd Peasants' Congress, assembled few days after the occupation of Chișinău, adopted an anti-secessionist position, dismissed the Moldavian prime-minister Pantelimon Erhan from the position of President of the Peasants' Soviet, and elected a new leadership from among the most vocal opponents of the Romanian intervention. According to the Rumcherod's newspaper, during the opening session, Tsyganko's message on behalf of the local Socialist Revolutionary branch was met with applause and calls to support the Russian Revolution. 
The following day, after demanding the withdrawal of Romanian troops within 24 hours, and negotiating on the issue with the Romanian military, the Congress' Presidium was put under arrest. General Ernest Broșteanu dismissed the immunity of those Peasants' representatives who were also members of \"Sfatul\", and issued a strong warning against further anti-Romanian agitation. Consequently, the following days the Congress selected a new list of \"Sfatul\" representatives, headed by Tsyganko, which comprised mostly moderates.\nClashes with the unionists.\nTsyganko, who was counted among the representatives of the Russian minority, affiliated with the left-wing \"Peasants' Faction\", which stood in opposition to the \"Moldavian Bloc\" of Romanian nationalists. During the debates on land reform, he suggested postponing the discussion until a new government, \"representative of the people's will\", would be approved by a Moldavian Constituent Assembly. Presumably, he feared that pressure from the Romanian troops would affect the extent of the reform. Nevertheless, he became the first chairman of \"Sfatul\"s Agrarian Commission, and in parallel presided upon the Peasants' Soviet. Despite being involved in left-wing politics, Tsyganko would gradually develop a working relationship with Andrei Krupenski, the Polono-Bessarabian landowner and ex-Marshal of Nobility, and Alexandr K. Schmidt, who stood for the conservative side of anti-Romanian agitation; between 1918 and 1920 the three men issued calls for the end of Romanian occupation, and began popularizing their cause in Europe. \nWhen Romanian Premier Alexandru Marghiloman traveled to Bessarabia to canvass for the unionist cause, he found the Peasant Faction divided between followers of Ion Inculeț, who endorsed the Romanian viewpoint, and deputies who sided with Tsyganko. 
Zamfirescu, who traveled with Marghiloman, recalls that Tsyganko \"thrice in one month\" attempted to recall the Republic's Directorate, his moves resisted by Inculeț. He also protested the selection of pro-Romanian students from Kiev and Odessa as representatives of the Transnistrian Moldavians, in which he saw efforts to shake the balance of power inside the \"Sfatul\". Zamfirescu claims to have saved Tsyganko from an undisclosed mortal danger, and then to have conversed with him, trying to gain insight into his political motivations. The latter, he concluded, were \"most phantasmagorical socialist ideas\", not dissuaded by the prospect of \"death, suffering, military disaster, sheer destitution, or degeneracy\". He adds: \"It was late at night, I was experiencing chills, and so I believe I have insulted the convictions of this visionary youth, reassuring him that all opinions lead to a ministerial chair, provided one makes sure to discard them on cue.\"\nDespite proclaiming its independence in late February 1918, the Moldavian Republic was still seen in various circles as subordinate to the neighboring Ukrainian People's Republic. Its Central Rada wished to represent Bessarabia in the preliminary negotiation of the Bucharest peace treaty, imposed by the Central Powers on Romania. The Moldavian Regional assembly reacted by reaffirming its independence and rejecting the division of Bessarabia, against the decisions of Akkerman and Khotin \"zemstva\", which had proclaimed their accession to the Ukraine. A Moldavian delegation was therefore selected to head to Kiev and obtain from the Central Rada official recognition of Moldavia's independence. The delegation, which included the interior minister Vladimir Cristi, the nationalists Nicolae Secară and Teodor Neaga, and Tsyganko as representative of the Peasants' Faction, was prevented from leaving. 
According to the unionist Gheorghe Andronachi, it was Daniel Ciugureanu, the Republic's pro-Romanian prime minister, who intervened with the Romanian Army to hamper the departure, fearing that an international recognition of independence would hinder nationalist plans for union with Romania.\nMarch union vote.\nOn March 27, 1918, when \"Sfatul\" voted to support the union with Romania, Tsyganko effectively abstained. Zamfirescu found it \"unbelievable\" that Romanian-speaking peasants had ever endorsed Tsyganko, who, he claimed, \"systematically opposes Bessarabia's government and Romania's policies, endeavoring for its annexation to the Ukraine\"; however, he also notes that Tsyganko himself accused the Romanians of wanting to hand in Bessarabia to the Ukrainians. A radical project for land reform had received pledges of support from \"Sfatul\" secretary Ion Buzdugan, and also from the Marghiloman himself; consequently, according to historian Alberto Basciani, Tsyganko's critique of unionism became marginal within his own party and Soviet.\nOn behalf of the Peasant Faction, Tsyganko denied the Assembly had the authority to discuss such and issue, declaring his group would refrain from voting, since they considered this a matter for a Constitutional Convention; furthermore, he stated the only admissible terms for a union between the Moldavian and Romanian peoples would be in a federation. Five members of his faction decided to side with the nationalists and voted for the union, while the other 17 present abstained. Researchers are divided in their assessments of Tsyganko's political stance at that early stage. Basciani describes him as one of those who \"opposed with great vehemence the union of Bessarabia with Romania\". 
However, according to Svetlana Suveică, Tsyganko did not object to union with autonomy, and in fact saw it as \"the only solution for avoiding the Bolshevik invasion of the region.\"\nIn November, after the generalization of Romanian military rule in Bessarabia, Tsyganko, as putative \"president\" of the Bessarabian Peasants' Party, with Nicolae Alexandri, Ion Păscăluță, and 37 other \"Sfatul\" members, sent a letter of protest to the Romanian government of Constantin Coandă. This coalition of Romanian Bessarabians and White Russians demanded the immediate recognition and restoration of autonomy, as well as the lifting of the martial law; however, its imperatives were rejected as illegitimate by the central authorities. According to Clark: \"We cannot but applaud the admirable aims of the 40 Deputies, in most of their requests; but at the same time we must wonder at their ingenuousness; they did not foresee the constant turbulence on the Eastern frontier, which even at that time impressed the Roumanians\".\nNovember union vote.\nThe protest arose controversy in political circles. Tsyganko reported a private interview with the Romanian envoy Artur Văitoianu. He quoted the latter as offering a deal: \"You must renounce [autonomy] if only for this sole reason—that you no good Roumanian officials in Bessarabia—that is to say, none who are good nationalists. If you give up autonomy, you will not have a Commissioner-General, but you will have a Bessarabian Chargé d'Affaires, a man of your own character, who will be nominated by the Central Power. The new [Bessarabian] Directorate will remain in office until the meeting of the Pan-Roumanian Constitutional Assembly. 
Does this appeal to you as attractive?\" Also according to Tsyganko, Văitoianu informed the group that they needed to coalesce with Romanian nationalists in front of Great Russian revivalism, and that \"the national idea takes precedence over everything\", implicitly threatening \"Sfatul\" dignitaries.\nAs Suveică writes, it was only at this stage that Tsyganko became an adversary of the unionist camp, placing his hopes in a reestablishment of the Russian Republic, and her re-annexation of Bessarabia. At the last \"Sfatul\" session, on November 25, 1918, unconditional union was proposed for ratification, as one of several measures being voted on, alongside the allocation of offices and a land-reform-law. According to the Peasants' Faction account, also supported by many of the Moldavian nationalists who had signed the earlier protest, the Moldavian Bloc kept the opposition uniformed about there being a \"Sfatul\" session: \"only Mr. V. Tziganko was aware of the fact, and he was informed privately, two hours before the opening of the sitting.\" The Tsyganko group confronted the assembly's president, Halippa, arguing that his election was illegal. They announced another walk-out, to which voices of the Moldavian Bloc responded with rhetorical questions (\"Is this how you intend to solve the agrarian issue?\") and taunts of \"Good riddance!\"\nThe opposition maintained that the walk-out resulted in a lack of quorum: only 48 of 160 deputies were reportedly present, which made the voting results questionable. Tsyganko and his colleagues accused the Bloc of putting up unconditional union for the vote as a rider, at 2.30 AM on the morning of November 26, and counted the votes during considerable and purposeful commotion. Some of the Fraction deputies in the opposition, including Tsyganko and Gavril Buciușcan, actually returned in time to cast their Nay votes. Clark claims that one of the Moldavian Bloc representatives testified that there were enough deputies present. 
According to Moldavian Bloc's Pan Halippa, Tsyganko's walk-out from the Assembly Hall proved to be a miscalculation, as the Peasant Faction's other members returned to vote on land reform, and, subsequently, on the unconditional union. Marghiloman nevertheless gave a contrasting account. He complained that \"not even 30 deputies\" had been present for the vote abrogating the conditions, in spite of \"all the money spent\".\nSalvation Committee.\nIn early 1919, Tsyganko emigrated from what was then being recognized as Romanian territory. He settled in Odessa, a Ukrainian port city, where he established the Peasants' Faction in exile, alongside a dozen other former \"Sfatul\" deputies. He joined efforts with Krupenski and Schmidt, affiliating with their Committee for the Salvation of Bessarabia, whose activities were closely monitored by Romania's secret police, the Siguranța. According to the Moldavian Bloc's Petru Cazacu, they answered indirectly to Anton Denikin, commander of the Volunteer Army. \nThe various groups of Bessarabian autonomists and White loyalists agreed to send a common delegation to the Peace Conference in Paris, where the Allies were debating on recognizing the union. On February 10, the Committee issued a common platform for these organizations, sharing two goals: \"the liberation of Bessarabia from the Romanian annexation and the realization of the aspirations of the people of Bessarabia.\" The latter referred to the region's reintegration into Russia. In April, together with Krupenski and Schmidt, later followed by Mark Slonim and Mihail Savenco, Tsyganko had arrived in Paris. In its addresses to the international media, the group insisted that the union was a putsch by urban intellectuals against the other social classes. It also circulated a protest against the Romanian land reform project, which the Salvation Committee saw as a chauvinistic attack against the landed gentry and the Russian patriots. 
\nAs noted by Suveică, Tsyganko was the only delegation member to belong to a non-aristocratic elite, and nominally an appointee of the \"Central Committee of the Peasants of Bessarabia\". He therefore took some distance from the conservative demands of the Salvation Committee, and in various contexts presented himself as an independent emissary, united with the others mainly in their common support for a plebiscite clause in Bessarabia. However, his autonomism and Krupenski's loyalism were mostly endorsed by the White émigré lobby in Paris, including the likes of Georgy Lvov, Vasily Maklakov, Sergey Sazonov, and Nikolai Tchaikovsky. In his papers, Halippa commented that Tsyganko, the self-proclaimed \"socialist and revolutionary\", had arrived in Paris as a propagandist of Russian nationalism, \"with no connection to the people [of Bessarabia]\". Cazacu also notes that the \"bizarre association\" comprising Tsyganko, Maklakov and Schmidt propagated the contradictory claim that \"Sfatul\" was a \"Bolshevik\" assembly.\nIn June 1919, the French communist organ, \"L'Humanité\", gave exposure to Slonim and Tsyganko's allegations regarding political repression and \"atrocities\" in Bessarabia, as a common protest of the \"democrats and socialists\". Such allegations were responded to by the BPȚ's Ion Pelivan, who wrote the newspaper to argue that Romania's intervention had first of all restored \"liberty and democracy\" in Bessarabia, and that the union expressed \"the free will of the Bessarabian populace, with no outside intervention.\" Countering Tsyganko's claim to speak for the peasants, the pro-Romanian delegation grew to include peasant members such as Ion Codreanu, Gheorghe Năstase, and Sergiu Victor Cujbă.\nLater life.\nMaking his split from the White Russian community a definitive one, Tsyganko eventually settled in the Ukrainian Soviet Socialist Republic. 
In September 1921, he wrote a memorandum on Bessarabia and Romania–Russia relations, which he sent to Leon Trotsky, the Commissar for Military Affairs. His text informed the Russian viewpoint at the negotiations in Warsaw between the Soviets and the Romanians, but also presented personal observations on the social makeup of Bessarabia. Tsyganko argued that the Moldavian Republic's creation and union were attributable to left-wing \"agitators\" such as Inculeț and Pantelimon Erhan. He claimed that multi-ethnic Bessarabia was naturally \"internationalist\", but also rural and \"well-off\", concluding that an anti-Romanian revolt could happen if sustained from across the border. Cazacu noted in 1924 that the dossier compiled by the Bolsheviks and the earlier Salvation Committee drafts used as sources the same documents, including statements by private individuals.\nIn 1924, Tsyganko became a founding figure of the Moldavian Autonomous Soviet Socialist Republic, created on Soviet territory as a Bessarabian rump state. In September 1926, he was at Odessa, where, together with Ivan Krivorukov, he issued a formal protest against Italy's recognition of the Bessarabian union with Romania, and therefore against her \"passage into the anti-Soviet camp\". Nikolai Vladimirovich, meanwhile, remained behind in Romania, working as a conservator for the Historical Monuments Commission, then as Department head for Chișinău City Hall. In early 1929, Nikolai supported the Bessarabian regionalist platform for administrative reform (an initiative by Erhan and Alexandru Mîță). He died some five years later, at age 52, while reading a book. At some point during the 1930s, Vladimir Tsyganko was singled out as a political suspect by the Stalinist regime, and was murdered in 1937, at the height of the Great Purge.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126405","title":"Lee Meong-hee","body":"\nLee Meong-hee\n\nLee Meong-Hee (; born 4 July 1978) is a retired South Korean female volleyball player. She was part of the South Korea women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 8th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126432","title":"Lee Yun-hui","body":"\nLee Yun-hui\n\nLee Yun-Hui (; born 8 October 1980) is a retired South Korean female volleyball player. She was part of the South Korea women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 8th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126439","title":"Caniparola","body":"\nCaniparola\n\nCaniparola is a frazione del comune di Fosdinovo, in province di Massa e Carrara.\nPhysical Geography.\nIt's in the southern part of the comune, at 39 metres above sea level. It's the lowest frazione in the comune and it's displaced along the first part of the provincial street that leads to Fosdinovo from Aurelia Street.\nHistory.\nIn Caniparola, until the XVIII century, there was a tower, that was built at the age of the Bishops of Luni, on the which the Fosdinovo marquess Gabriele III Malaspina, ending his predecessor's project, Carlo Francesco Agostino Malaspina (who died here in 1722) built in 1724 his summer residence, the villa Malaspina. The plain on which this villa was founded was already exploited for agricultural use by Malaspina, who had built here a lot of farmhouses (they are said \"Malaspinian Farmhouses\"). In the mid-eighteenth century, between the end of Gabriele III's marquisate and the beginning of Carlo Emanuele Malaspina's one, some lignite benches were discovered for the mining of the so-called \"Caniparola coal\".\nThe toponym derives from the cultivation of the cannabis (canapa, in Italian) that was held in the area in the past.\nSociety.\nDemographic Evolution.\nDuring the second half of XIX century, this frazione had an outstanding demographic increase (which is corresponded to a likewise increase of the built infrastructures and houses), so that, counted with the near localities (above all Borgetto-Melara), from 2001 onwards it began representing almost the half of the total population of the comune. The only frazione, on the other hand, has a population that would place as the first between the frazioni, but as second compared to Fosdinovo, the chief town. 
Today Caniparola is a residential place, although it still keeps vineyards and olive groves of its agricultural past.\nReligion.\nCaniparola is seat of the Sant'Antonio da Padova Parish, in the diocese of Massa Carrara-Pontremoli. From September 2015, it is part of Fosdinovo Pastoral Unity, within Fivizzano Vicariate. Patron Saint Day is 13 June.\nCulture.\nEducation.\nCaniparola is seat of the detachment of the statal school \"Don Florindo Bonomi\", consisting of kinfergartens, elementary and secondary school. The chief seat is in Fosdinovo.\nSport.\nCaniparola has got a great public gym and a stadium, \"Mulattieri\", placed in the locality Borghetto-Melara, where some football tournaments are held, like Trofeo Città di Fosdinovo and Memoriale Federico Severino. In Caniparola the matches of the chief Fosdinovo volley team, \"Volley C.P.O. Fosdinovo\", are played. The female sector takes part to the regional Championship.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126454","title":"News Is Made at Night","body":"\nNews Is Made at Night\n\nNews Is Made at Night is a 1939 American comedy film directed by Alfred L. Werker and written by John Larkin. The film stars Preston Foster, Lynn Bari, Russell Gleason, George Barbier, Eddie Collins and Minor Watson. The film was released on July 21, 1939, by 20th Century Fox.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126458","title":"Park Mee-kyung","body":"\nPark Mee-kyung\n\nPark Mee-kyung or Park Mi-kyung (; born 13 May 1975 / 6 April 1975) is a retired South Korean female volleyball player. She was part of the South Korea women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 8th. On the club level she played with Hanil Synthetic Fiber, then in 1998 transferred to Korea Highway Corporation.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126463","title":"En Adir","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48126483","title":"Park Soo-jeong","body":"\nPark Soo-jeong\n\nPark Soo-jeong (; born 2 March 1972) is a retired South Korean female volleyball player. She was part of the South Korea women's national volleyball team. She competed with the national team at the 2000 Summer Olympics in Sydney, Australia, finishing 8th.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126543","title":"È arrivata la felicità","body":"\nÈ arrivata la felicità\n\nÈ arrivata la felicità is an Italian television comedy-drama series created by Stefano Bises, Ivan Cotroneo, Monica Rametta; and produced by Publispei and Rai Fiction. The setting of the show are Aventino and Testaccio, two districts in Rome.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126561","title":"3rd New York Volunteer Cavalry","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48126562","title":"List of Indian states by GDP per capita","body":"\nList of Indian states by GDP per capita\n\nThis page lists Indian States by the nominal GDP per capita and the percentage of growth.\nGrowth in GDP per capita.\nThis shows annual growth in each state's GDP per capita for the years between 2004 and 2014. Figures are in rupees.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126580","title":"2015 FA Women's Cup Final","body":"\n2015 FA Women's Cup Final\n\nThe 2015 FA Women's Cup Final was the 45th final of the FA Women's Cup, England's primary cup competition for women's football teams. The showpiece event was the 22nd to be played directly under the auspices of the Football Association (FA) and was named the SSE Women's FA Cup Final for sponsorship reasons. The final was contested between Chelsea Ladies and Notts County Ladies on 1 August 2015 at Wembley Stadium in London. Chelsea made its second final appearance, after losing the 2012 final. Notts County appeared in its first ever final.\nThe match was the first women's final to be staged at Wembley Stadium. Watched by a record crowd of 30,710 and a BBC television audience of nearly two million, Chelsea won the match 1–0, with a first-half goal from Ji So-yun. Chelsea's Eniola Aluko was named player of the match.\nRoute to the final.\nAs FA WSL 1 clubs, both teams entered the competition at the fifth round stage. Chelsea beat Watford (6–0), holders Arsenal (2–1) and Manchester City (1–0) to reach the final. Notts County faced lower-division opponents in all three games, defeating Tottenham Hotspur (4–0), Aston Villa (5–1) and Everton (3–0).\nThe 2015 final marked the second time Chelsea had reached this stage, after losing in 2012 in a penalty shootout against Birmingham City. Notts County had never previously appeared in the final, since its founding in 2014 or as its predecessor Lincoln Ladies.\nMatch.\nAfter a quiet start to the game, Chelsea winger Eniola Aluko applied the first serious pressure of the game with a shot at the 30th minute. A second soon after was deflected by Notts County's goalkeeper Carly Telford. The resulting corner setup Gemma Davison for a shot which went wide. In the 37th minute, Aluko found centre forward Ji So-yun inside the box and set her up for a short range goal. 
Notts County came back on the attack after the half. A long-range shot from midfielder Desiree Scott was deflected and a header by Leanne Crichton in the resulting corner was narrowly cleared off the line. Chelsea hunted for a second goal but Aluko had another shot deflected while midfielder Drew Spence sent a shot wide. In the end So-yun's lone goal proved enough and Chelsea won 1–0.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126606","title":"Sinclair Cutcliffe","body":"\nSinclair Cutcliffe\n\nJohn Sinclair Cutcliffe (August 22, 1930 – November 10, 2007) was a Canadian politician, who served in the Legislative Assembly of Prince Edward Island from 1966 to 1972. A member of the Liberal Party, he was the assemblyman for the district of 2nd Queens.\nBorn and raised in Summerside, Prince Edward Island, he first worked for his father's Cutcliffe Funeral Home and eventually became owner of the business. He also served as president of the provincial Red Cross, as a chief of rescue with the Prince Edward Island Emergency Measures Organization, and as a president of the International Rescue and First Aid Association.\nHe was first elected to the legislature in the 1966 provincial election, serving as a backbench MLA. Reelected in the 1970 provincial election, in his second term he served as deputy speaker of the legislature. He resigned his provincial seat in 1972 to run as a Liberal Party of Canada candidate for Malpeque in the 1972 federal election, but lost to Angus MacLean.\nHe died on November 10, 2007 at the Queen Elizabeth Hospital in Charlottetown.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126611","title":"2015–16 Texas–Rio Grande Valley Vaqueros women's basketball team","body":"\n2015–16 Texas–Rio Grande Valley Vaqueros women's basketball team\n\nThe 2015–16 UTRGV Vaqueros women's basketball team represents the University of Texas Rio Grande Valley during the 2015–16 NCAA Division I women's basketball season. This is head coach Larry Tidwell's third season (1st season) at UTRGV. The Vaqueros play their home games at the UTRGV Fieldhouse and are members of the Western Athletic Conference. This is the first season for UTRGV as an institution. Before the 2015–16 academic year UTRGV was UTPA and the University of Texas at Brownsville. \nPrevious Season.\nThe Broncs finished the season 19–15, 9–5 in final WAC play to finish in third place. They lost in the championship of the WAC Tournament to New Mexico State.\n2015–16 media.\nFor the first time in club history women's basketball games will be televised. 9 of 11 home games will air on TWCS (Ch 323), with 6 of the 9 games airing live. The other two home games will air on the TWCS Alternate Channel (Ch 825). Other games will air on WAC Digital Network or road teams video feeds.\nSchedule and results.\n!colspan=9 style=\"background:#; color:white;\"| Non-conference regular season\n!colspan=9 style=\"background:#; color:white;\"| WAC regular season\n!colspan=9 style=\"background:#; color:white;\"| WAC Women's Tournament\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126612","title":"List of festivals in Oceania","body":"\nList of festivals in Oceania\n\nThe following is an incomplete list of festivals in Oceania, with links to separate lists by country and region where applicable. This list includes festivals of diverse types, including regional festivals, commerce festivals, film festivals, folk festivals, carnivals, pow wows, recurring festivals on holidays, and music festivals. Note that list of music festivals in Oceania redirects here, with music festivals denoted with (music) for countries where there is not a dedicated music section. The list overlaps with list of film festivals in Oceania.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126633","title":"ONE (website)","body":"\nONE (website)\n\nONE is an Israeli website that covers sport news from around the world. According to the IARB (Israel Audience Research Board), it is one of the two biggest sport websites in Israel along with Sport5.co.il. It categorizes news into \"Israeli Football\", \"World Football\", \"Israeli Basketball\", \"World Basketball\" and \"Other Sports\".\nHaim Revivo, Eyal Berkovic, Alon Hazan, Alon Mizrahi and Zvi Sherf are among ONE's columnists.\nONE was founded by Udi Milner and Gil Menkin in 1999; the website's headquarters are located in the BSR Towers in Ramat Gan. The website was founded in order to cover the TV show \"The 91th minute\", which was broadcast on Channel 2.\nAt the beginning of 2000, there was a race between Israeli sport websites; in the end, many of them shut down. ONE survived through investments from the production company Telad. In 2007, Yedioth Ahronoth Group acquired 50% of the ownership of the website.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126650","title":"Uehara Museum of Modern Art","body":"\nUehara Museum of Modern Art\n\nThe Uehara Museum of Modern Art opened in 2000 in Shimoda, Shizuoka Prefecture, Japan, to house the collection of Uehara Shōji of Taisho Pharmaceutical. The collection includes works by Corot, Monet, Cézanne, Renoir, Fujishima Takeji, and Kishida Ryūsei. Adjacent is the Uehara Museum of Buddhist Art, which opened in May 1983.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126722","title":"Dilek Öcalan","body":"\nDilek Öcalan\n\nDilek Öcalan (born 3 October 1987) is a Turkish politician of Kurdish origin from the Peoples' Democratic Party (HDP) who currently serves as a Member of Parliament for the electoral district of Şanlıurfa since 7 June 2015. She is the niece of Abdullah Öcalan, the imprisoned leader of the Kurdistan Workers' Party (PKK) militant organisation that has been in conflict with the Turkish Armed Forces since the 1980s, making both her candidacy and election to Parliament highly controversial.\nEarly life.\nDilek Öcalan was born on 3 October 1987 in Şanlıurfa as the daughter of Fatma Öcalan, the sister of imprisoned PKK leader Abdullah Öcalan. On 23 December 2013, she visited her uncle at İmralı Prison and became known to the media after she gave a press statement detailing the conversation between them. Öcalan has been imprisoned since 1999, serving aggravated life imprisonment under charges of founding and leading a terrorist organisation (namely the PKK, which is recognised as a terrorist organisation by Turkey, the European Union and the United States).\nPolitical career.\nÖcalan first entered politics in 2012, a year before meeting her uncle on the Island of İmralı. During the third congress of the pro-Kurdish Peace and Democracy Party (BDP), she was elected to the party executive while the party changed its name to Democratic Regions Party (DBP) and adopted a fraternal relationship with the Peoples' Democratic Party (HDP).\nMember of Parliament.\nÖcalan's candidacy to become a Member of Parliament despite being the niece of Abdullah Öcalan was heavily controversial, drawing strong opposition from Turkish nationalists. Her candidacy also allegedly caused a split within the Öcalan family. Nevertheless, she was put forward as a HDP candidate for the electoral district of Şanlıurfa, being fielded as the second candidate on the HDP's provincial party list. 
She was subsequently elected in the June 2015 general election to become one of the youngest MPs in the new Parliament, resulting in her being appointed to the temporary Speaker's Council until a new Council could be elected in July.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126732","title":"Antonietta luteorufa","body":"\nAntonietta luteorufa\n\nAntonietta luteorufa is a species of sea slug or aeolid nudibranch, a marine gastropod mollusc in the family Facelinidae.\nDistribution.\nThis nudibranch is known from the Gulf of Naples, Italy.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126763","title":"List of Desperate Housewives Africa episodes","body":"\nList of Desperate Housewives Africa episodes\n\nDesperate Housewives Africa is a Nigerian television Comedy-drama-mystery that premiered on Ebony Life TV on 30 April 2015. It is an adaptation of the American series \"Desperate Housewives\". The majority of the episodes are titled according to the original version which were in turn named after lyrics by composer/lyricist Stephen Sondheim. The show revolves around four housewives namely; Ese De Souza (Nini Wacera), Kiki Obi (Kehinde Bankole), Tari Gambadia (Michelle Dede), and Funke Lawal (Omotu Bissong). The show is showcased from Rume Bello (Marcy Dolapo Oni) point of view who dies at the pilot episode.\nThe first season is slated to have 23 episodes.\nSeries overview.\nSeason one episodes.\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126783","title":"Wallace W. Andrew","body":"\nWallace W. Andrew\n\nWallace W. Andrew (December 25, 1850 – January 18, 1919) was an American businessman and politician.\nBorn in Sheboygan County, Wisconsin, Andrew and his parents moved to Oregon, Wisconsin. Andrew was involved with the grain and livestock businesses. In 1894, Andrew moved with his brothers to Superior, Wisconsin and set up the Deluxe Manufacturing Company. Andrew served in the Wisconsin State Assembly in 1901 and 1905 and was a Republican. At the time of his death in 1919, Andrew was serving on the Douglas County Board of Supervisors and was chairman of the county board. Andrew died at his home in Superior, Wisconsin. \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126794","title":"Alive (Hiromi album)","body":"\nAlive (Hiromi album)\n\nAlive is the third album from Hiromi Uehara's Trio Project featuring bassist Anthony Jackson and drummer Simon Phillips.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126813","title":"No Control (Turbo Fruits album)","body":"\nNo Control (Turbo Fruits album)\n\nNo Control is an album by American band Turbo Fruits, which was released on April 21, 2015. All songs were produced by Jeremy Ferguson, except \"The Way I Want You\" and \"No Reason to Stay\", which were produced by The Black Keys drummer Patrick Carney.\nPersonnel.\nTurbo Fruits\nAdditional personnel\nProduction\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126826","title":"PubNub","body":"\nPubNub\n\nPubNub is a global Data Stream Network (DSN) and realtime infrastructure-as-a-service (IaaS) company based in San Francisco, California. The company makes products for software and hardware developers to build realtime web, mobile, and Internet of Things (IoT) applications.\nPubNub's primary product is a realtime publish/subscribe messaging API built on their global data stream network which is made up of a replicated network of at least 14 data centers located in North America, South America, Europe, and Asia. The network currently serves over 300 million devices and streams more than 750 billion messages per month.\nHistory.\nPubNub was founded in 2010 by Stephen Blum and Todd Greene. PubNub raised $4.5 million in Series A funding from Relay Ventures and TiE Angels in March 2012. They received their $11 million Series B round of funding in September 2013 from Scale Venture Partners, Relay Ventures and TiE Angels. In July 2015, PubNub received their $20 million Series C round of funding led by Sapphire Ventures\nTechnology.\nPubNub utilizes a Publish/Subscribe model for realtime data streaming and device signaling and supports all of the capabilities of WebSockets, Socket.IO, SignalR, WebRTC Data Channel and other streaming protocols. PubNub provides SDKs for over 70 different programming languages and environments including JavaScript, iOS, and Android, as well as JavaScript frameworks such as AngularJS, Ember.js, and Backbone.js. PubNub also provides client libraries for board platforms including Raspberry Pi, Arduino, Texas Instruments, and Microchip.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126834","title":"Elizabeth Buchanan Cowley","body":"\nElizabeth Buchanan Cowley\n\nElizabeth Buchanan Cowley (1874–1945) was an American mathematician.\nCowley was born on May 22, 1874, in Allegheny, Pennsylvania. She had four siblings, but they and her father all died by 1900. Cowley's mother, Mary Junkin Buchanan Cowley, later became a member of the Board of Public Education of Pittsburgh, and was the namesake of the Mary J. Cowley School in Pittsburgh. Cowley's grandfather (Mary Cowley's father) was James Galloway Buchanan, a surgeon in the Union Army.\nCowley earned a bachelor's degree in 1893 from the Indiana State Normal School of Pennsylvania, and became a school teacher. She earned a second bachelor's degree in 1901 and a master's degree in 1902 from Vassar College, and became an instructor at Vassar, studying higher mathematics during the summers at the University of Chicago. In 1908 she completed a doctorate from Columbia University. Her dissertation, on algebraic curves, was supervised by Cassius Jackson Keyser; she became the fourth woman to earn a doctorate in mathematics from Columbia. Continuing to work at Vassar, Cowley was promoted to assistant professor in 1913, and associate professor in 1916. She went on leave in 1926 to assist her mother, and resigned her position at Vassar in 1929, instead becoming a high school teacher in Pittsburgh.\nCowley and her co-author Ida Whiteside won a prize for a 1907 paper they wrote on the orbit of comet C/1825 V1. Another of her publications, in 1926, concerned liquid water pouring puzzles. She was the author of two textbooks on plane and solid geometry, published in 1932 and 1934, and advocated teaching solid geometry to high school students after many colleges had replaced the subject with freshman calculus. 
She published another book in 1941 about public education.\nCowley was an early member of the Mathematical Association of America, and became a member of its board of trustees when it incorporated in 1920.\nShe was an invited speaker at the International Congress of Mathematicians in 1932, speaking there about mathematics education. She also belonged to the American Mathematical Society, German Mathematical Society, and Circolo Matematico di Palermo.\nShe retired from teaching in 1938, had a stroke in 1941, and died on April 13, 1945, in Fort Lauderdale, Florida.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126858","title":"Facelinopsis pacodelucia","body":"\nFacelinopsis pacodelucia\n\nFacelinopsis pacodelucia is a species of sea slug, an aeolid nudibranch, a marine gastropod mollusc in the family Facelinidae.\nDistribution.\nThis species was described from Algeciras harbour, Spain.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126861","title":"2010–11 Glasgow Warriors season","body":"\n2010–11 Glasgow Warriors season\n\nThe 2010-11 season saw Glasgow Warriors compete in the competitions: the Magners Celtic League and the European Champions Cup, the Heineken Cup.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126877","title":"Punjabi nationalism","body":" Delhi, Uttar Pradesh, Jammu and Kashmir and many institutes like schools-colleges in Punjab state itself where Punjabi language is ignored. Punjabi language dialects like Bauria, Bazigari, Bhand, Dhaha, Gojri, Lahanda, Lubana, Odi, Rai Sikhi and Sansi are also becoming extinct in Punjab, India. There is Hindi imposition since 1950s and 1960s in state against Punjabi language. Despite a rich heritage of Punjabi literature, Punjabi Television serial industry in Indian Punjab has totally disappeared.\nPunjabi nationalism in West Punjab.\nIn Pakistani Punjab province, Punjabi Language Movement is a linguistic movement in aimed at reviving the Punjabi language, art, culture and literature in Pakistan. There are several attempts going on by Punjabi society for implementation of Punjabi language as it is completely ignored by authorities in Punjab province. Urdu is preferred medium of education in local schools-colleges as well as Government paperwork which is very threatening for survival of Punjabi language in Punjab, Pakistan. But Urdu is the mother tongue of only about 7.57% Pakistanis. In September 2015, a case was filed in Supreme Court of Pakistan against Government of Punjab, Pakistan as it did not take any step to implement Punjabi language in the province. Punjabi lovers also say that creation of Bangladesh out of Pakistan proves that love of \"Mother-tongue\" is more important than religion. Pakistani Punjabi language film industry is in crisis as filmmakers were not producing Punjabi language films like before 1975 Punjabi films ruled in film industry of Pakistan. Television Channels from Lahore (Punjab's capital city) are all in Urdu instead of Punjabi. There is still 150-year-old unofficial ban on education in Punjabi language in Punjab, Pakistan and Government is ignorant about it thus compelling Punjabi people to protest. 
In August 2015, Pakistan Academy of Letters, International Writer’s Council (IWC) and World Punjabi Congress (WPC) organised \"Khawaja Farid conference\" and demanded Punjabi University should be established in Lahore and Punjabi language should be declared as the medium of instruction at the primary level. In Lahore, every year thousands of punjabis gather on International Mother Language Day seeking an end to the 150-year-old ban on education in Punjabi in Pakistan and against Urdu-isation of Punjab. In September 2015 at Government Emerson College, Multan thousands of aspirants seeking admission protested against the administration for forcing them not to adopt Punjabi and Saraiki dialect as compulsory or optional subjects as usually majority of students prefer Punjabi and Saraiki dialect balancing their marks sheet in BA (third year).\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126881","title":"Time Warner Cable SportsChannel (Texas)","body":"\nTime Warner Cable SportsChannel (Texas)\n\nTime Warner Cable SportsChannel (TWC SportsChannel) is a regional sports network serving Texas. It is broadcast on Channel 323 and 1020 within the state exclusively on Time Warner Cable systems.\nProgramming.\nThe following sporting events are carried by TWC SportsChannel – Texas:\nOther shows that air on TWC SportsChannel:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126887","title":"Chris Gheysens","body":"\nChris Gheysens\n\nChris Gheysens (born 1971) is an American businessman who serves as the President and Chief Executive Officer of Wawa Inc., a privately-held chain of convenience store / gas stations with nearly 700 locations along the East Coast of the United States.\nHe grew up in Vineland, New Jersey and worked in his youth at car washes that his father owned. He attended St. Mary School in East Vineland and then moved on to St. Augustine Preparatory School in Richland, New Jersey, graduating in 1989. After earning a B.S. in accounting from Villanova University in 1993, Gheysens earned an M.B.A. from Saint Joseph's University in 2005, both located in Philadelphia. His family would spend their summers in the Jersey Shore community of Sea Isle City.\nCareer.\nGheysens worked for four years as an auditor in the Philadelphia office of Deloitte LLP, in Philadelphia.\nGheysens was hired by Wawa in 1997 and was named to serve as the company's its chief financial officer and chief administrative officer in 2007. In 2012 he was named as Wawa's president and became the chief financial officer in January 2013, after a 16-month-long transition from his predecessor, Howard Stoeckel. He is identified on his business card as \"Lead Goose\", a riff on the company's logo of a flying goose, a title that he describes as fitting in with the loose corporate culture at Wawa. Gheysens has overseen an extensive remodeling project for the company's stores to establish a \"warmer tone\" for customers, rollout of a mobile app and expansion into North Jersey and Florida.\nAt the Villanova School of Business, Gheysens is a member of the dean's advisory committee. He has also been active with the Southeastern Pennsylvania Chapter of the American Red Cross. In September 2013, Gheysens was named to serve a three-year term on the Economic Advisory Council of the Federal Reserve Bank of Philadelphia. 
In October 2013, he was one of four members added as retail members serving on the Board of Directors of the National Association of Convenience Stores.\nGheysens traveled to Rome in 2015 as part of a delegation coordinating aspects of the papal visit to Philadelphia as part of Pope Francis' 2015 visit to North America. As one of the corporate sponsors of the World Meeting of Families, Wawa was contributing one million bottles of water for those participating at the event.\nHe lived in Washington Township, Gloucester County, New Jersey before moving to Moorestown, New Jersey with his wife and four children.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126889","title":"Francisco Plaza","body":"\nFrancisco Plaza\n\nFrancisco Plaza, also known as Fort Francisco Museum, built in 1862, was the first significant dwelling in the Cuchara Valley at what became La Veta, Colorado. The plaza is now a part of the museum complex. Only the courtyard and the fort building were added to the National Historic Register in 1986. The other structures are new, or were moved to this location during the 1960s.\nHistory.\nThe plaza was originally a U-shaped structure, much modified over the years. It was built by John M. Francisco of Georgia, and his business partner, Henry Daigre, a Frenchman from Quebec, and served as the headquarters for their cattle ranch. The ranch sold beef to the U.S. military forts in the area. The area around the plaza was home to Hispanic workers for the ranch. The plaza served as a supply center to the growing community, occasionally providing protection from Ute Indian attacks.\nThe plaza served as a temporary depot for the Denver and Rio Grande Railroad when it arrived in 1876. The town of La Veta, incorporated at the same time, never grew to more than 800 residents. The plaza became a residence and farm again for John M. Francisco by the 1890s, the partnership with Daigre having ended possibly 20 years prior. Francisco owned the plaza until his death in 1902. It then passed through various family members, and was acquired by the Huerfano County Historical Society in 1958.\nArchitecture.\nThe remaining historic structures were adobe of typical early Hispanic style, built of 18 to 24 inch thick adobe bricks. The building had three sides, each 100 feet long, with the fourth side closed by a fence. Significant changes were made to portions of the building, other buildings were built and rebuilt. The buildings were renovated in the late 1990s.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126908","title":"Giovanni Waal","body":"\nGiovanni Waal\n\nGiovanni Waal (born May 25, 1989) is a Surinamese footballer playing as a Forward for Inter Moengotapoe in the Hoofdklasse, and for the Suriname national team.\nCareer.\nWaal began his career at SV Voorwaarts in Paramaribo, making his debut in the 2009-10 SVB Hoofdklasse season. After two seasons he transferred to SV Leo Victor, finishing the season as the league's joint top scorer together with Ulrich Reding (of SV Boskamp), both finishing with 20 goals each. The following season saw Waal transfer to SV Robinhood where he played for two seasons. In 2014 Waal transferred to Inter Moengotapoe winning the National championship in his first season with his new club.\nInternational career.\nWaal plays International football for Suriname, having made his debut in the final qualifying round of the 2010 Caribbean Cup, in the 2-1 loss against Antigua and Barbuda. He also participated in the team's 2014 FIFA World Cup qualification campaign, making four appearances against Cayman Islands, Dominican Republic and El Salvador, failing to help his team advance to further qualifying rounds. On 9 June 2012 he scored his first goal for the national team in a friendly match against French Guiana which ended in a 2-1 loss. He has also represented Suriname in the 2012 Caribbean Cup qualification, the 2018 FIFA World Cup qualification and the ABCS Tournament.\nCareer statistics.\nInternational performance.\n\"Statistics accurate as of matches played on 16 June 2015\",\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126927","title":"Thank Your Lucky Stars (Beach House album)","body":"\nThank Your Lucky Stars (Beach House album)\n\nThank Your Lucky Stars is the sixth studio album by American dream pop band Beach House. It was co-produced by the band and Chris Coady, and was released on October 16, 2015, on Sub Pop and Bella Union. The album was released less than two months after their fifth studio album, \"Depression Cherry\".\nDescribed by the band as \"not a companion to \"Depression Cherry\", or a surprise, or b-sides,\" \"Thank Your Lucky Stars\" was unexpectedly announced nine days before its release via the band's Twitter account. It received mostly positive reviews from critics.\nBackground and recording.\nThe album was recorded at Studio in the Country in Bogalusa, Louisiana, and mixed at Sonic Ranch in Tornillo, Texas. Although the album was recorded simultaneously alongside \"Depression Cherry\", the band felt that the records should be seen as distinct unconnected works. \nReception.\n\"Thank Your Lucky Stars\" was released to highly positive reviews. At Metacritic, which assigns a normalized rating out of 100 to reviews from mainstream critics, the album has an average score of 80, based on 13 reviews.\nJayson Greene of Pitchfork suggested the songs took on a \"darker edge\" than those from \"Depression Cherry\", judging the songs to feel smaller by having stripped away the typical cathedral-like reverb from the group's previous albums. 
Greene likened the mood of the songs to Beach House's material before they joined Sub Pop, describing the feeling as \"pneumatic, dusty, like they are pulling a blanket around themselves in a heatless attic to ward off a threatening chill.\" Although the \"joy and comfort have vanished\" from the material, Greene claimed that that album is \"still undeniably a Beach House album, a familiar mix of warm tones and chilly sentiments.\" Ultimately, Greene welcomed the addition to the band's repertoire, but suggested that a new album so soon created a dissonance that feels like \"too much of a good thing.\"\nIn a review from \"The A.V. Club\", Corbin Reiff described the album as \"most assuredly a continuation of many of the same motifs and hallmarks of the group's last release.\" Reiff hailed the band's craft, arguing that \"Beach House has mastered the art of space by this point and seems to have an instinct for how long to drag out a keyboard melody or a guitar line before bringing in another element to keep things from bogging down.\" Although he felt \"Depression Cherry\" and \"Thank Your Lucky Stars\" were similar in motif, Reiff praised the band's decision to separate the songs, rather than tack them onto the former. For Reiff, \"Thank Your Lucky Stars\" supports itself as a singular entity where \"the full sonic and emotional weight is tremendous.\"\nWriting for \"Rolling Stone\", Meagan Fredette gave praise to Victoria Legrand's vocals stating that \"her singing on \"Thank Your Lucky Stars\" feels more playful than usual, a welcome lightness that comes across from the first moments of \"Majorette,\" the album's opener\". Elegy to the Void was also singled out as a highlight of the record with Fredette describing the track as \"the album’s crown jewel\" and \"as good a summation as any of what Beach House does best\". 
Emphasising the maturity of the record in comparison to the band's debut, she suggests that \"Like all their albums, this one is full of songs made for dreaming of a bygone love, or humming quietly to a new one\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126935","title":"Alain Ngamayama","body":"\nAlain Ngamayama\n\nAlain Ngamayama is a Polish footballer who plays as a midfielder for Warta Poznań. He is the captain and is widely considered a club hero.\nHe was born to a Zairean father and a Polish mother, but considers himself fully Polish, having been born in Greater Poland. He grew up in Poznań and began in Warta's youth teams. Despite the club's varying fortunes, he stayed with the club throughout his career, barring a short stint for one season early in his career.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126945","title":"Massawepie Mire","body":"\nMassawepie Mire\n\nThe Massawepie Mire is a boreal peatland bog in Piercefield, New York. Located near Massawepie Lake, the mire is the largest bog in New York State. Much of the bog is on the property of Massawepie Scout Camps, and the camp partners with the Nature Conservancy to preserve the ecosystem. The Massawepie Mire is noted for birdwatching, with several species of rare birds occupying the area including spruce grouse, gray jay, Lincoln's sparrow, boreal chickadee, and the two-barred crossbill. Flora includes the carnivorous pitcher plants and sundew, tamarack pines and black spruce trees, as well as the sphagnum moss that makes up the base of the bog.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126947","title":"Calmodulin in Target Binding and Recognition","body":"\nCalmodulin in Target Binding and Recognition\n\nCalmodulin (CaM) is a complex signaling protein that transduces transient calcium ion signals. CaM's binding of calcium ions cause conformational changes, which interact with downstream proteins. Current research indicates that selective protein binding occurs through the mechanism of mutually induced conformational fit, which would explain how calcium dynamics in CaM would modulate its interaction.\nCurrent research on CaM signaling and CaM-BT interaction includes experimental kinetic rate observations and coarse grain/all atom Molecular dynamics simulations. Because protein signaling and protein-protein interaction is a new field of research, many observed interactions cannot be explained through experiment alone. The unification between simulation and experimental results is necessary to expand the predictive power of the theoretical approach and create general laws that explain the mechanics of signaling/protein-protein interactions.\nThe computational approach for modeling macro molecules is very resource intensive. The Hamiltonian equation in molecular dynamic software relates each atom to all other atoms in the system through kinetic, electrostatic, van der Waals, dihedra, bond, etc. energies. For example, the RRK polypeptide (CaMKII residues: 293-313) contains 21 residues and 318 atoms. For a single time step, the molecular dynamics software must perform energy calculations between every atom in the polypeptide, which is ~100,000 calculations. Since the time step must be in the sub picosecond range (to insure stability), several million time steps must be performed to obtain meaningful data.\nTo remedy the large number of calculations involved in all atom simulations, the coarse grain simulation technique can be used. 
Current work from the biophysics group at the University of Houston uses open source coarse grain and all atomic models of CaM and wildtype/mutated binding targets of CaMKII in their research.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126966","title":"The Silk Roads","body":"\nThe Silk Roads\n\nThe Silk Roads: A New History of The World is a 2015 book authored by Peter Frankopan, an academic at the University of Oxford. He presents a new point of view on the center of humanity's rise, opposing the traditional view that considers humanity heir to the Egyptians.\nSummary.\nThe traditional view is that Western civilization descends from the Romans, who were in turn heirs to the Greeks, who, in some accounts, were heirs to the Egyptians. Frankopan argues that the Persian empire was the center point of the rise of humanity. In \"The Silk Roads\", Frankopan seeks to change the reader's view of history and to offer a new perspective.\nAuthor.\nFrankopan is a historian at Oxford University, where he is Senior Research Fellow at Worcester College Oxford and Director of the Oxford Centre for Byzantine Research. He works on the history of the Mediterranean, the Balkans, the Caucasus, Russia and on relations between Christianity and Islam. He also specializes in medieval Greek literature, and translated \"The Alexiad\" for Penguin Classics (2009). Frankopan often writes for the international press, including \"The New York Times\", \"The Washington Post\", \"The Guardian\", \"MoneyWeek\". He has also contributed to TV and Radio documentaries about the Byzantine Empire, Divine Women, Roman Law and the Code of Justinian, the Crusades, Varangian mercenaries and the reign of Ivan the Terrible. His new book is \"The Silk Roads: A New History of the World.\"\nReception.\nReviews of \"The Silk Roads\" by Peter Frankopan were published in The Guardian, The Independent, The Telegraph and The Times.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48126980","title":"Evolution and the Humanities","body":"\nEvolution and the Humanities\n\nEvolution and the Humanities is a 1987 book by David Holbrook that attacks Darwinian evolution. The book rejects reductionist biology and takes influence from Michael Polanyi and vitalist philosophy. \nReception.\nThe book has been heavily criticized by academics. Martin Stuart-Fox noted that Holbrook's criticism of natural selection was a \"cobble together, in a sort of scissors-and-paste criticism... the book contains no vigorous argument at all. Not only is Holbrook very obviously no scientist, he is no philosopher either.\"\nEcologist Arthur M. Shapiro in a review for the National Center for Science Education commented:\nDavid Holbrook, Fellow of Downing College, Cambridge, has written a polemic not so much against evolution as against scientific reductionism (which he sees incarnate in neo-Darwinism). He proceeds from revulsion at the existentialist vision of \"life as a 'scientific accident.' \" He's no creationist but, rather, a from-the-gut free-form vitalist—just as preoccupied with the perceived moral consequences of the Darwinian revolution as any Bible-thumping moralist could be. As usual, he conflates science with scientism and evolution with evolutionism, materialism, and atheism.\"\nThe book is said to have been poorly edited and riddled with errors.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127002","title":"Ryan Walker (cartoonist)","body":"\nRyan Walker (cartoonist)\n\nRyan Walker (1870-1932) was an American political activist and cartoonist. A prolific artist who published political cartoons in a variety of radical newspapers and magazines in the United States, Walker is best remembered as the creator of the recurring character \"Henry Dubb,\" an American worker who ambled through life blithely being victimized by capitalism ostensibly as a result of his blind acceptance of the ideas of the ruling class.\nA member of the Socialist Party of America during his younger years, Walker's political views hardened with the coming of the Great Depression in 1929 and he joined the Communist Party, USA the following year, joining the editorial staff of the party's English-language daily newspaper in New York City. Walker died of pneumonia in June 1932 while on a visit to the Soviet Union.\nBiography.\nEarly years.\nRyan Walker was born in Springfield, Kentucky on December 26, 1870. His father, Edwin Ruthwin Walker, was a farmer who later became a lawyer and moved the family to the Midwestern metropolis of Kansas City, Missouri, where Ryan attended public school.\nShowing a proclivity for art from an early age, submitting his first free lance cartoons to \"Judge\" in 1883, at the age of 13. These were not of sufficiently finished quality to appear in the pages of the magazine, but the ideas were accepted and redrawn into a two page center spread and back cover cartoon by a house artist, for which Walker received a royalty check of $15. He received positive reinforcement from the magazine's editor to continue at the cartooning craft and to hone his drawing skill.\nUpon leaving school Walker studied for a time at the Art Students' League in New York City, before working for a number of years in a series of manual jobs, refining his drawing in his spare time. 
\nWalker's private portfolio grew until in 1895 he was finally able to land his first permanent artistic job, a position in the advertising department of the \"Kansas City Times.\" He showed aptitude with a pen and took an acute interest in political issues and he was shortly made an editorial cartoonist for that paper, remaining in that position until 1898. In that year he moved to St. Louis, Missouri to take a position as cartoonist for the \"St. Louis Republic,\" where he would stay until 1901, taking time to get married to his Kansas City sweetheart, journalist Maud Helena Davis, in October 1899.\nThe year 1901 saw a move to Boston, where he did a stint as cartoonist for the \"Boston Globe,\" leaving after one winter. He subsequently worked as a freelance cartoonist, publishing work in a variety of prominent newspapers and magazines of the day, including the \"New York Times,\"\"Life,\" \"The Arena,\" and \"The Bookman.\" \nWalker moved from freelance to syndicated work in 1904, joining with the Baltimore based International Syndicate as a cartoonist. He would stay with that firm until 1911, when he left to pursue political pursuits fulltime.\nSocialist years.\nFrom 1902 Walker contributed material to a glossy socialist monthly published in New York City during the first five years of the 20th Century, \"The Comrade.\"\nWalker turned a close eye to the social problems of his day and developed politically radical views, declaring in a 1905 interview that\n\"My aim, hope, and life-work is the betterment of my brother man. Nothing else counts. I believe the present economic system is cruel, unjust, and essentially wrong, and wrong is wrong, no matter how it may be disguised... 
I am a Socialist because I believe that Socialism will lead to the development of the greater self, to the out-blossoming of all that is finest and highest in individual life, and that it will secure for all the people a measure of prosperity, happiness, and freedom...\"\nIt was through the pages of the socialist \"Appeal to Reason,\" a mass circulation weekly published in Southeastern Kansas to which he began regularly contributing in 1906, that Walker first gained popular fame. It was in those pages that he first introduced the character \"Henry Dubb,\" an American worker who unthinkingly rejected the ideas of unionism and socialism, only to accept as inevitable his victimization by the violence and corruption of the social system around him. Exposed as a dupe and a fool by his worldly wife and somehow cognizant child, the oblivious and intractable protagonist would respond to his latest existential insult with an unblinking stare into space and the catchphrase \"I'm Henry Dubb!\" — an easy to understand depiction of the effects resulting from so-called false consciousness among the working class.\nWalker would come to publish two collections of Henry Dubb cartoons in hard covers, \"Adventures of Henry Dubb\" (1914) and \"New Adventures of Henry Dubb\" (1915), testimony to the character's enduring appeal among American radicals during the decade of the 1910s.\nIn addition to a steady stream of cartoons, beginning in 1912 Walker toured the country as a stump speaker on behalf of the Socialist Party of America, Walker was effective in his role as a socialist lecturer, so much so that his abilities were lauded by party orator Eugene V. Debs, who declared him a \"great cartoonist\" and \"equally great\" public speaker, who could delight and hold an audience of socialists and non-socialists alike. 
Walker was directly employed by the National Office of the Socialist Party as one of the touring speakers for its Lyceum Bureau from 1915 to 1916, working in close association with Lyceum director and future Communist Party leader L. E. Katterfeld.\nFollowing a conservative turn of the editorial line of the \"Appeal\" during the years of World War I, Walker would take his art and the Henry Dubb character to the pages of the New York City socialist daily \"New York Call\" and later to its successor, the \"New Leader.\" The left wing press being notoriously underfunded, Walker would supplement his socialist-related work with regular employment as the Director of the Art Department of the \"Evening Graphic\" newspaper in New York City, where he was employed from 1924 to 1929.\nCommunist years.\nIn the fall of 1930 Walker joined the Communist Party, USA and assumed a position as a staff cartoonist for \"The Daily Worker,\" the party's New York City-based newspaper. In conjunction with his new role, Walker created a new regularly recurring character for his cartoons, a stolid proletarian known as Bill Worker.\nDeath and legacy.\nDuring a visit to the Soviet Union in the spring of 1932, Ryan Walker fell ill and was forced to be hospitalized. He died of pneumonia at Rotkinsky hospital in Moscow on June 22, 1932. He was 61 years old at the time of his death.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127012","title":"Stubbs Road (constituency)","body":"\nStubbs Road (constituency)\n\nStubbs Road () is one of the 13 constituencies in the Wan Chai District of Hong Kong which was created in 1994.\nThe constituency loosely covers Stubbs Road in Hong Kong Island with the estimated population of 14,203.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127021","title":"Nguyễn Tiến Duy","body":"\nNguyễn Tiến Duy\n\nNguyễn Tiến Duy (born 29 April 1991) is a Vietnamese footballer who plays as a Defender for V-League club Than Quảng Ninh F.C. and the Vietnam national football team.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127022","title":"Chief Justice of Grenada","body":"\nChief Justice of Grenada\n\nThe Chief Justice of Grenada is the head of the Supreme Court of Grenada which consists of the High Court with three justices and a two-tier Court of Appeal. \nThe original High Court of Grenada was replaced by the Windward and Leeward Islands Supreme Court and the Windward and Leeward Islands Court of Appeal in 1939; both of the latter were replaced in 1967 by the Eastern Caribbean Supreme Court which performs both functions. The Eastern Caribbean Supreme Court, known in Grenada as the Supreme Court of Grenada and the West Indies Associated States, is headquartered in St Lucia, and is now the superior court of record for Grenada and the other Caribbean states which comprise the Organisation of Eastern Caribbean States.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127026","title":"TSS St Patrick (1947)","body":"\nTSS St Patrick (1947)\n\nTSS \"St Patrick\" (III) was a passenger vessel operated by the Great Western Railway from 1947 to 1948 and by British Railways from 1948 to 1972.\nHistory.\nShe was built for the Great Western Railway in 1947 as one of a pair of new vessels for the Fishguard to Rosslare service, the other being TSS \"St David\". She replaced a former ship of the same name which had been sunk by torpedo on 13 June 1941. British Railways took ownership in 1948 and she was based in Weymouth. Typically running services to Cherbourg, she was also used in the summer for trips from Torquay to the Channel Islands. In 1963 she was transferred to Southampton for services to St Malo and Le Havre, and in 1965 she moved to Folkestone for the service to Boulogne.\nShe was sold in 1972 to Gerasimos S. Fetouris, in Piraeus, and renamed \"Thermopylae\". She was sold again in 1973 to Agapitos Bros, Piraeus and renamed \"Agapitos I\". She was scrapped in 1980 in Greece.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127028","title":"School violence in Australia","body":"\nSchool violence in Australia\n\nThe Education Minister of the State of Queensland said in July 2009 that the rising levels of violence in schools were \"totally unacceptable\" and admitted that not enough had been done to combat violent behaviour. 55,000 students had been suspended in the state's schools in 2008, nearly a third of which were for \"physical misconduct\".\nIn South Australia, 175 violent attacks against students or staff were recorded in 2008. Students were responsible for deliberately causing 3,000 injuries reported by teachers over two years from 2008 to 2009.\n46% of Principals in Western Australia have been either physically assaulted or witnessed physical violence in schools during 2012. 70% of school leaders had also been threatened with violence. Schools in Western Australia, South Australia and the Northern Territory rated far higher than other states in terms of threats of violence.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127054","title":"Melkwezer dialect","body":"\nMelkwezer dialect\n\nThe Melkwezer dialect (Standard Dutch: \"Melkwezers\", ) is a subdialect of Brabantian spoken in Melkwezer, a town in the Linter municipality.\nPhonology.\nThe phonology of the Melkwezer dialect is similar to that of the Orsmaal-Gussenhoven dialect, but they are not identical. For instance, the diphthong in the Orsmaal-Gussenhoven dialect corresponds to in the Melkwezer dialect.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127102","title":"Here I Am a Stranger","body":"\nHere I Am a Stranger\n\nHere I Am a Stranger is a 1939 American drama film directed by Roy Del Ruth and written by Sam Hellman and Milton Sperling. The film stars Richard Greene, Richard Dix, Brenda Joyce, Roland Young, Gladys George and Kay Aldridge. The film was released on September 28, 1939, by 20th Century Fox.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127104","title":"Shaw Academy","body":"\nShaw Academy\n\nShaw Academy is a professional, online, higher education institution.\nShaw Academy was founded in 2013.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127143","title":"ATIV Software","body":"\nATIV Software\n\nATIV Software is a privately held company based in Santa Rosa, California, that develops the EventPilot® conference and journal mobile apps for iOS, Android and web-based devices. EventPilot conference apps help large meetings go paperless and reach sustainability goals.\nHistory.\nATIV Software was co-founded by Silke Fleischer and Eric Converse in 2010 to provide native apps for events that save meeting organizers time and money.\nProducts and Services.\nEventPilot Conference App\nIn 2014, ATIV Software partnered with Radius Networks to incorporate iBeacon technology with EventPilot conference apps, enabling indoor positioning and proximity-aware notifications that send targeted messages to event attendees based on their indoor location. In 2015, EventPilot released an interactive maps feature and an online itinerary planner.\nEventPilot Journal App\nThe EventPilot Journal App is a native mobile app offering for medical and scientific peer-reviewed publications.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127158","title":"Adam Roxburgh","body":"\nAdam Roxburgh\n\nAdam Roxburgh (born 14 April 1970) is a rugby union coach and former player who made eight appearances for the Scotland national rugby union team. He was known for his entertaining play in rugby sevens games.\nEarly life.\nRoxburgh was born in Edinburgh.\nRugby playing career.\nHe played club rugby for Kelso RFC.\nHe made his international rugby debut on 22 November 1997 against Australia at Murrayfield. His last appearance was against Australia at Brisbane during the 1998 Scotland rugby union tour of Oceania.\nRoxburgh was a talented rugby sevens player. With Kelso he competed in the Dubai Sevens, 1993 Rugby World Cup Sevens and has won three Kings of the Sevens. In 1997, he won the Middlesex Sevens with the Barbarians.\nWhen many of his rugby-playing contemporaries turned professional in 1997, Roxburgh remained with the firm of precision tool makers, Abbey Tool and Gauge in Kelso, who had been his first employer from school. He retired from club rugby in 2005.\nCoaching.\nBy 2008 he was coaching the Kelso sevens team and the Kelso second fifteen. He took over as a head coach at Kelso from 2015.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127164","title":"Moridilla brockii","body":"\nMoridilla brockii\n\nMoridilla brockii is a species of sea slug, an aeolid nudibranch, a marine gastropod mollusc in the family Facelinidae.\nThis species is considered a nomen dubium.\nDistribution.\nThe type locality of \"Moridilla brockii\" is the Sunda Sea which is an old name for the Flores Sea. This species is considered to be widespread in the Indo-Pacific region. It was redescribed from the Gulf of Mannar, India.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127171","title":"Shmuel Shapiro","body":"\nShmuel Shapiro\n\nShmuel Raphael Shapiro (, born 1974 in Aix les Bains, France), known by his stage name Shmuel Shapiro, is a French Chassidic-Jewish singer, composer and musician. He is especially popular in Israel and Europe, from the early 1990s to this day.\nEarly years.\nAt the age of nine, he moved to Israel with his family, studied in the Chassidic Yeshivot of Rachmastrivka and Erloy. Shmuel started his musical career very early. He composed his first song at the age of eleven and became the main soloist of the Erloys choir at seventeen. then he approached the Chabad movement.\nCareer.\nIn 1994, after his marriage, Shmuel studied in a Kollel and founded the orchestra \"Kol Haneguina\" with the famous artists Daniel Mamane and Haim Kirshinboim.\nShmuel then studied music, worked his voice and learned 'Hazanout in the great school of maestro Naftali Hershtik, Elie Jaffe and Benjamin Munk\nFrom 2000 he became the most requested conductor for Jewish choirs in France, to this day.\nHe also took lessons with musicians and opera singers. In 2001, Shmuel became cantor of the Great Synagogue of Migdal Haemek, of the Rav Yitzchak Dovid Grossman. Very dynamic, Shmuel also animated the Israely Radio Kol Hanechama in Jewish thought and music. Shmuel returned to France in 2006 as cantor of the Great Synagogue \"Ohel Avraham\" Montevideo st. (Paris 16e).\nIn 2009, he became director of a choir and member of the board of the \"Nigounit\" music school.\nShmuel was proposed in 2010 a global music project by musician was rejected by him on religious ground..\nShmuel has recorded several music titles during his career and his first album \"Seu Morom\" was recorded in 2013 in France and Israel, with the arranger Didier Atlan. His songs are included in weddings, synagogues and Yeshivot in Israel and other countries. The majority of the CD songs were composed by Shmuel. 
Shmuel's song named \"Ahavat Israel\" was proposed purchase by singers and music professionals worldwide. Finally buying rejected from producer of Shmuel.\nShmuel Shapiro appears regularly with famous singers like Enrico Macias (2013), Yoram Gaon (2008), Avraham Fried (2005), Mordechai Ben David (2004), (2006), Dedi Graucher (2006), Yosi Piamenta (2005), (2006), Ohad Moskowitz (2004), Isaac Bitton (2006), (2000–2003), (2006), yehuda glantz (1999), (2009), Benny Friedman (2013).\nPersonal life.\nShmuel is married and has three children, lives in Paris.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127248","title":"Speed Sisters","body":"\nSpeed Sisters\n\nSpeed Sisters is a 2015 documentary film that follows the all-female Palestinian racing team the Speed Sisters and explores the social issues surrounding their career.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127258","title":"James Marshall Campbell","body":"\nJames Marshall Campbell\n\nJames Marshall Campbell (1895-1977) was dean of the college of arts and sciences at The Catholic University of America. Campbell was a classical scholar, and a member of the department of Greek and Latin. He was on the faculty of the Catholic University from 1945 to 1966.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127272","title":"Valencian People's Union","body":"\nValencian People's Union\n\nThe Valencian People's Union (in Valencian: \"Unitat del Poble Valencià\", UPV) was a political party created in 1984 when the Left Grouping of the Valencian Country (AEPV) and the Nationalist Party of the Valencian Country (PNPV) merged and became a unified party.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127308","title":"DhoomBros","body":"\nDhoomBros\n\nOriginally from Pakistan and currently based in New York, Hussain Asif, Shehryaar Asif, Atif Khan and Waqas Riaz, collectively called the DhoomBros, are known globally for their success through YouTube, and are now also working their drama Hum Kahan Chal Diye along with many other projects. Since creating their first channel (DhoomBros) in 2008, their videos have gathered over 9 million combined views, including videos from their more recent channel (TheDhoomBros) made in 2012. They are particularly known for their satirical takes on everyday Desi lives, parodies of mainstream entertainment, video blogs, short films, and their Mehndi dance performances.\nCareer.\n2008–11: Early beginnings and background.\nThe DhoomBros are a four-member Pakistani-American group that includes \"Hussain Asif\", \"Shehryaar Asif\", \"Atif Khan\", and \"Waqas Riaz\" and they are based in the United States of America. The idea of calling themselves \"DhoomBros\" came within the name itself: “Dhoom” Bros (\"Dhoom\" = \"Blast\" in Hindi). The song “\"Dhoom Again\"”, from the 2006 Bollywood film Dhoom 2 was a popular hit amongst South Asians but the Western world was generally unaware of it. Brothers Shehryaar (informally known as \"Shehry\") and Hussain Asif performed to that song in a school talent show and received recognition from their peers and the school faculty. At this point, they called themselves the DhoomBros. This motivated them to entertain people through dance and various acts and so on June 23, 2008, the DhoomBros officially created their first YouTube channel (DhoomBros) and their official Facebook page. Atif Khan, the group's mutual friend, and Waqas Riaz, the cousin of the Asif brothers, joined later because they had similar interests.\nThey Started Off Making videos such as \"Jimmy And Saleem' and \"The Desi Mobsta Show\". 
They also would upload videos of themselves talking about weird things that have happened to them throughout their week, either at home,at school, or in daily life. \nWhen they started out they had nicknames, Hussain was, \"Desi Mobsta\" or \"Don\". Waqas was \"Daku\", Shehryaar was just \"Shehry\".\nNow, Hussain has a refurbished nickname \"Hussain Superstar\", Atif is \"Ati\" or \"Khan Saab\".\n2012–2013.\nIn 2012, DhoomBros videos became more frequent from \"Stuff Pakistanis Say\", a video that comically represents common Pakistani household events and phrases, to \"Humsafar Best Scenes Parody\", a parody based on the Pakistani drama serial, Humsafar, to the \"Annoying Brown Girls/Guys\" series, videos that show banter that stereotypical Desi teenagers seem to portray.\nIn October 2012, their popularity increased after the DhoomBros released their video, \"Desi Style\", a parody based on South Korean pop artist Psy's hit single, Gangnam Style. The DhoomBros chant in English, Urdu and Punjabi about their everyday Desi American lives, consisting of waking up to their mother’s voice, going to school, and greeting their grandfather, all accompanied with song and dance.\nThe group also experiment outside comical videos. \"Blessings of Ramadan\" is a video portraying three young men who indulge in materialistic aspects of their lives and fall astray from their spirituality by forgetting the significance of the month of Ramadan, the Muslim month of fasting and prayer. In addition, \"The Perfect Memory\" is the DhoomBros' first short film about the unexpected sacrifices one may have to make when it comes to love. Both videos were unlike the group's usual comical parodies, but were still well-garnered by audiences.\nTwo of the members, Shehryaar Asif and Waqas Riaz, are known for uploading occasional video blogs that highlight various aspects of the lives of the DhoomBros, such as showing sneak peeks of their projects and being DJs at work. 
They also document their trips, such as to different cities in the United States of America and their stay in Pakistan. In addition to being YouTube entertainers, the DhoomBros are also DJs and often perform at weddings, mehndi events, and other parties. Apart from their comical videos, their mehndi performances have also gathered many views.\n2014–Present.\nOne of the DhoomBros' most recent popular video is the \"Evolution of Bollywood Dance\", inspired by Penn Masala's Evolution of Bollywood Music. In this video, the DhoomBros recreate the dancing styles that the Bollywood film industry has witnessed over the years from the golden-aged actors From Raj Kapoor to Shammi Kapoor and Jeetendra to Dharmendra and Mithun Chakraborty and to the stars of today such as Hrithik Roshan, Salman Khan, and Shah Rukh Khan.\nAfter debuting in their first venture in the web-series, \"iDeewane\", the DhoomBros are currently in the pre-production status for their Drama: Hum Kahan Chal Diye.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127312","title":"Alcides Greca","body":"\nAlcides Greca\n\nAlcides Greca (February 13, 1889 in San Javier, Saint Faith, Argentina – April 16, 1956 in Rosario, Saint Faith, Argentina) was a lawyer, journalist, cineasta, jurist, teacher, writer and Argentinian politician, that directed the film \"The last malón\" of 1917 and defended the native cause in Saint Faith, in addition to being socialist, radical and adherent of the university reform.\nBiography.\nFirst years.\nAlceides Was born as a second son of the marriage of don Francisco Greca and of donya Magdalena Trucco, immigrant of Italian and French origin, the February 13, 1889, in the town of San Javier, Saint Faith. It Would be part of a numerous family, composed by eleven brothers more: Silvio, Erminda, Francisco, Alejandro, Teodora, Magdalena, Ana, Mercedes, María Isabel, Clorinda and Gilds.\nTo the same city receive his first education, and has as a companions to the native mocovíes, which thing later influenced in his works. For the secondary level moves to the city of Saint Faith, in Inmaculada's School Concepción of the jesuïtes, and finishes the secondary in the National School Simón of Iriondo, being egressat of the first promotion of students.\nStarts of his literary and journalistic career.\nLater it travels to the Silver, Buenos Aires, to study advocacia, and writes his first lines of \"the Evangeli Rebellious\", \"Laurels of the Marsh\", and \"Black Tears.\" Being missing a lot little to receive, abandons his career to be elect deputy for his department in 1912.\nIn 1907, it decides to begin his journalistic career, and founds his first periodic \"The Mocoví\", to San Javier. Next, Alcides would found the periodic \"The Pure Truth\", \"The Paladín north\" and \"The Word\" (antecedent of the current \"The Litorial\"), in 1912, 1914 and 1915 respectively. These last two would be established to the city of Saint Faith. 
Besides, colaboriaría with the newspaper Rosario's \"The Capital\" and the magazine of Juridical and Social Sciences of University of the Seaboard.\nIn the meantime, in 1909, public his first book, \"Words of Quarrel.\" Later, it finishes \"Symphony of the Sky\", a series of hymns in prose, and \"Black Tears\", a history of madness and pain, the year 1910. And in 1915 public \"Laurels of the Marsh\" and \"The Evangeli Rebellious\".\n\"The last malón\".\nIt is reelecto provincial deputy in 1916, and in 1917 films \"The last malón\", feel east the first llargmetratge Argentinian in 35 millimeters that films to the interior of the country. In the same recreates the last native rebellion become in territory santafesino, fruit of the pursuit to the aborigine since the Law of Territories of 1884. It bases in the facts succeïts in the month April 1904. This film is produced in Rosario, for Greca Film Cinematographic Company Rosarina, in Av. Pellegrini To the 1655. Also it finishes his studies by right in The Silver.\nIn 1920 it contracts matrimonico with Rosa Pierri, known how \"Roxana.\" This same year is elect senator, and deputy constituent for the reform of the Provincial Constitution. In 1921 nacé the only son of the couple, Alcibíades Alejandro Greca. \nIt is appointed headline by right Administrative and Municipal Right Compared, in the Faculty of Juridical and Social Sciences of the University of the Seaboard, where would dictate chair for 27 years, comenzandó the July 5, 1921. For these years realises some voyages for the interior of the country, and in 1923 visit Chile, Peru, Bolivia and Uruguay, beside the brothers Ángel and Alfredo Guido. Two years next would be elect national deputy for the second time.\nAlready in 1927 it begins to públicar several books. The first novel públicada would be in this year, \"North Wind\", that deserved elogiosos trials of the national and foreign press. 
In 1929 it appears \"The Tower of the English\", which contains chronic of the voyages realised the year 1923, and in 1932 public \"Tales of the Committee\".\nIt Would be reelectó national deputy in 1930, but can not finalise his mandate because of the coup d'état of the general Uriburu, and the December 9, 1933 is detained and brought to the island Martín García, because of different motívos political. After going out of her, public \"After the alambrado of Martín García\".\nIn Chile, Alcides public \"The Pampa Gringa\", being the protagonist of this novel the south santafesino, in 1936, and, already in Saint Faith, public \"spiritual Tragedy of the Argentinians that today are 20 years old\", as an edition of the UNL.\nHis last years.\nWith his esposa, travel for Europe the year 1951, but have to go back before for a granddaughter's demise. In 1954, jubila as a university teacher, buys a chacra and moves to the city of Oliveros, where devotes to cultivate his horta and garden.\nLater, it would be him diagnosed pancreatitis, and is moved urgently to Rosario's a hospital, but the April 16, 1956 dies in a room of the Italian Hospital.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127331","title":"The Araki","body":"\nThe Araki\n\nThe Araki is a sushi restaurant run by Japanese chef Mitsuhiro Araki which opened in London in 2014. It was awarded two stars in the 2016 Michelin Guide for the UK and Ireland.\nDescription.\nChef Mitsuhiro Araki had previously run a restaurant in Tokyo called Araki for which he held three Michelin stars, but chose to close it in February 2013 in order to pursue a new challenge. He had considered New York, Paris, and Singapore, but chef Joël Robuchon suggested London to him. The move took three years to organise.\nThe interior of the restaurant, designed by the Takenaka Corporation, features a counter made from 200-year-old cypress wood gifted to Araki by Japanese musician Ryuichi Sakamoto. That counter is divided from the kitchen by a pair of green curtains, and the overall look of the interior is based upon the architecture of the Japanese Edo period. There are only fifteen seats – nine at the counter and six in a private dining room. The restaurant formed part of a £250 million redevelopment of the combined office and retail space at Burlington Street.\nFare.\nThe restaurant offers a single choice of a set menu consisting of eleven courses, with two sittings taking place each evening. Araki has modified the style of sushi he has made to take into account European produce, such as salmon sushi, Cornish squid, and langoustines. Other dishes include similar designs to those he used at his previous restaurant, but from sources within Europe, such as his signature tuna sashimi, in which he serves three different cuts of the fish.\nReception.\nChef Jason Atherton called the food at The Araki \"mind blowing\" and said that it was as good as any restaurant in Japan. The Araki was named the best Japanese restaurant in London by \"Tatler\" magazine in their 2015 restaurant guide. 
In September 2015, The Araki was awarded two stars in the 2016 Michelin Guide for the UK and Ireland. It was one of two Japanese restaurants in London to be elevated to the two-star level that year, the other being Umu, which is located a short distance away from The Araki.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127344","title":"Porotos de soja","body":"\nPorotos de soja\n\nPorotos de soja is an Argentinian documentary film produced by the National Institute of Cinema and Audiovisual Arts (INCAA), directed by David Blaustein and Osvaldo Daicich, written by Daicicht. The film premiered on 21 May 2009.\nSynopsis.\nThe film was based on the investigation of Mariana Dosso, Silvina Segundo and Osvaldo Daicich. It examines a conflict between the agricultural producers and the government that occurred in Argentina in 2008.\nThe conflict erupts when the producers, grouped in four employers' organizations, rejected the system of mobile retention to the exports of soy and sunflower established by the Resolution 125. In the new system quotas were replaced by an agreeable pricing standard where the percentage of compensation was equal to or greater than the international pricing standards of the product. One of the arguments was over an alleged fault regarding the Executive Powers ability to implement the measure.\nThe Argentine National Congress established the new system, finalizing the dispute on 17 July 2008.\nThe film presents the opinions of the philosopher Ricardo Forster, the journalist and economist Alfredo Zaiat and the graduate in communication Mariana Moyano.\nProduction.\nThe director declared that the idea of the film was born on April 1, 2008 when he decided to cover an act by President Fernández of Kirchner in support of this resolution. The initial aim was to produce a special program for television but afterwards with the prolongation and deepening of the conflict, it was transformed into a film. 
Produced by the state body National Institute of Cinema and Audiovisual Arts (NICAA) it was premiered in cinemas on 21 May 2009 and was exhibited on the state television channel two days later.\nCritical reception.\nThe newspaper \"La Nación\" highlighted the camera work and said that the directors \"attained to radio-graph this problem that had in check to the population, while sociologists, journalists, politicians and writers expose his points of view about a thematic that had an enormous transcendence for the agricultural sector\". It added that the film attempts \"to clarify some of the most complicated elements that were born from that resolution 125 and visits by means of a photography of undoubted quality fields, stays and places that saw affected by this governmental imposition\" and stands out that \"it shows, in definite, the fight of the men of the field for conserving his belongings, still by the expense of a fight that had few paragons in the history of the country\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127346","title":"Kevin Quinn (actor)","body":"\nKevin Quinn (actor)\n\nKevin Quinn (born May 21, 1997, in Chicago, Illinois) is an American actor known for his starring role in the Disney Channel's \"Bunk'd\".\nCareer.\nHe began his career by appearing in episodes of \"Shameless\" and \"Chicago P.D.\" Before being on Disney, he auditioned for season 12 of \"American Idol\". He wound up being one of the top 60 males in the country. He then played Jonny in Steppenwolf Theater's production of \"Lord of the Flies\", and a boy in a Chicago Shakespeare Theater adaption of \"Henry V\". Quinn's feature film debut was in the 2015 independent film \"Kids and Ghosts\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127369","title":"Av8er Explorer","body":"\nAv8er Explorer\n\nThe Av8er Explorer is a British paramotor that was designed by Paul Taylor and produced by Av8er Limited of Woodford Halse, Northamptonshire for powered paragliding. Now out of production, when it was available the aircraft was supplied complete and ready-to-fly.\nDesign and development.\nThe Explorer was designed to comply with the US FAR 103 Ultralight Vehicles rules as well as European regulations. It features a paraglider-style wing, single-place accommodation and a single engine in pusher configuration. The aircraft is built with special attention to balancing and vibration isolation. The cage assembly includes small wheels to ease ground movement of the motor unit.\nAs is the case with all paramotors, take-off and landing is accomplished by foot. Inflight steering is accomplished via handles that actuate the canopy brakes, creating roll and yaw.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127400","title":"Waulsortian mudmound","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48127469","title":"Av8er Observer Light","body":"\nAv8er Observer Light\n\nThe Av8er Observer Light (or Lite) is a British paramotor that was designed by Paul Taylor and produced by Av8er Limited of Woodford Halse, Northamptonshire for powered paragliding. Now out of production, when it was available the aircraft was supplied complete and ready-to-fly.\nDesign and development.\nThe Observer Light was designed to comply with the US FAR 103 Ultralight Vehicles rules as well as European regulations. It features a paraglider-style wing, single-place accommodation and a single engine in pusher configuration. The aircraft is built with special attention to balancing and vibration isolation. The cage assembly includes small wheels to ease ground movement of the motor unit.\nAs is the case with all paramotors, take-off and landing is accomplished by foot. Inflight steering is accomplished via handles that actuate the canopy brakes, creating roll and yaw.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127474","title":"Masjid An-Noor","body":"\nMasjid An-Noor\n\nMasjid An-Noor, or variations such as Masjid-an-Noor and Masjid-e-Noor, may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127492","title":"Steve Cassano","body":"\nSteve Cassano\n\nSteve Cassano (born March 7, 1947) is an American politician in the state of Connecticut. He is a Democratic member of the Connecticut State Senate, having first been elected in 2010. He previously served as Mayor of Manchester, Connecticut from 1991 to 2005. Cassano is an alumnus of Manchester Community College, Boston State College (BA), the University at Albany, SUNY (MA) and the University of Connecticut (MSW).\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127496","title":"Pedomicrobium ferrugineum","body":"\nPedomicrobium ferrugineum\n\nPedomicrobium ferrugineum is a rod-shaped, aerobic to microaerophillic bacterium from the genus of Pedomicrobium with one polar or supolar flagellum. \"Pedomicrobium ferrugineum\" has been isolated from podzolic soil in north Germany\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127499","title":"Joel Larsson","body":"\nJoel Larsson\n\nJoel Larsson is a Swedish professional \"\" player. He is most known for winning the Pro Tour Magic Origins competition in August 2015, and for his skills in limited formats. Joel had the highest win percentage in the world in limited matches during the 2011-2012 Pro Tour season.\nJoel began playing \"Magic\" in 2005 with the Saviours of Kamigawa set, and qualified for his first Pro Tour in 2010, making his debut at Pro Tour San Diego. Due to his hairdo and appearance, he received the nickname of \"Swedish Kibler\" after the 2013 finals of Pro Tour Gatecrash in Montreal. In Sweden, he often goes by the nickname \"Proel\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127500","title":"List of Ministers of the Interior of the Netherlands","body":"\nList of Ministers of the Interior of the Netherlands\n\nThe Minister of the Interior and Kingdom Relations () is the head of the Ministry of the Interior and Kingdom Relations and a member of the Cabinet of the Netherlands. Ronald Plasterk has been the Minister of the Interior and Kingdom Relations since 5 November 2014.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127505","title":"Joel Edmundson","body":"\nJoel Edmundson\n\nJoel Edmundson (born June 28, 1993) is a Canadian professional ice hockey defenseman who is currently playing for the St. Louis Blues of the National Hockey League (NHL).\nPlaying career.\nEdmundson was chosen in the sixth round, 121st overall, of the 2008 WHL Bantam Draft by the Moose Jaw Warriors. In his WHL rookie season, Edmundson played in 71 games for the Warriors. He scored 2 goals and added 18 assists for 20 points while adding on 95 penalty minutes. He later played for the Kamloops Blazers. In March 2013, Edmundson signed an entry-level contract with the Blues. He played the following two seasons for the Blues' American Hockey League affiliate, the Chicago Wolves.\nIn October 2015, it was it was announced that Edmundson had made the opening night roster of the St. Louis Blues for the 2015–16 NHL season.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127511","title":"The Letters (film)","body":"\nThe Letters (film)\n\nThe Letters is a 2014 American biographical drama film directed and written by William Riead. The film stars Juliet Stevenson, Max von Sydow, Rutger Hauer and Priya Darshini. It was produced by Colin Azzopardi, Tony Cordeaux, and Lisa Riead. It was released theatrically by Freestyle Releasing on December 4, 2015.\nPlot.\nMother Teresa (Juliet Stevenson), recipient of the Nobel Peace Prize, is considered one of the greatest humanitarians of modern times. Her selfless commitment changed hearts, lives and inspired millions throughout the world. The film is told through personal letters she wrote over the last forty years of her life and reveal a troubled and vulnerable woman who grew to feel an isolation and an abandonment by God. The story is told from the point of view of a Vatican priest (Max von Sydow) charged with the task of investigating acts and events following her death. He recounts her life’s work, her political oppression, her religious zeal, and her unbreakable spirit.\nProduction.\nDevelopment.\nRiead began exploring ideas for an inspirational and uplifting film just before the devastating terror attacks of September 11, 2001, forced a realization on him that would come to define his project. “I didn’t know there was that kind of evil in this world until then,” says Riead. “The attacks really brought that home.\"\n\"The Letters\" became a labor of love for Riead during the fourteen years it would take to produce the film. The turning point for Riead was the discovery of a startling cache of heartfelt, formerly confidential letters written by Mother Teresa to her spiritual advisor, the Belgian Jesuit priest Celeste van Exem, over a nearly 50-year correspondence. 
In her letters, some of which have been published in the 2007 book \"Mother Teresa: Come Be My Light\", Teresa revealed a crisis of faith that left her doubting God’s belief in her dedication to the poor. Riead read all of the letters that were available to the public and decided that they would make up the spine of his screenplay.\nCasting.\nWhen the time came to cast the film, Riead had a wealth of actresses clamoring to don Mother Teresa’s habit. To play her confessor, Father van Exem, Riead cast Max von Sydow, the Swedish star who has been a favorite of directors ranging from Ingmar Bergman to Martin Scorsese. When von Sydow asked the director for some insight into the character, Riead gave him a simple but telling answer. “I said, the whole world looked up to Mother Teresa,” he recalls. “And Mother Teresa looked up to Father van Exem. He just looked at me for a long moment, and he said, ‘got it.’ And that was it. He showed up and knew exactly what to do.”\nTo portray the nuns and students of the Loreto Convent, the Bishop of Calcutta, Mother Teresa’s wealthy benefactors, and the residents of the poverty stricken slums, Riead cast professional actors from India’s Bollywood film industry, considered the largest in the world.\nFilming.\nThe film was shot primarily in India, with interiors shot in Goa and second unit filming taking place in Calcutta, Delhi, and Mumbai. The scenes featuring Max von Sydow and Rutger Hauer (as van Exem’s confidant, Father Benjamin Praagh), were shot in a 15th-century London monastery.\nRelease.\n\"The Letters\" premiered at the Sedona Film Festival in February 2014. It was released theatrically in 886 venues on December 4, 2015.\nCritical reception.\n\"The Letters\" has received generally negative reviews from critics. On Rotten Tomatoes, the film has a rating of 30%, based on 33 reviews, with an average rating of 4.4/10. 
The consensus states: \"\"The Letters\" tries to honor Mother Teresa with an unstintingly positive portrayal of her life and works, but ends up smothering a fascinating real-life story under a bland hagiography.\" On Metacritic, the film has a score of 25 out of 100, based on 11 critics, indicating \"generally unfavorable reviews\". \nAt the Sedona Film Festival, the film won the Audience Favorite “Best of the Fest” Award, and the International Catholic Film Festival in Rome, where Riead was honored as Best Director and Juliet Stevenson as Best Actress.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127519","title":"Av8er Orbiter","body":"\nAv8er Orbiter\n\nThe Av8er Orbiter is a British paramotor that was designed by Paul Taylor and produced by Av8er Limited of Woodford Halse, Northamptonshire for powered paragliding. Now out of production, when it was available the aircraft was supplied complete and ready-to-fly.\nDesign and development.\nThe Orbiter was designed to comply with the US FAR 103 Ultralight Vehicles rules as well as European regulations. It features a paraglider-style wing, single-place accommodation and a single engine in pusher configuration. The aircraft is built with special attention to balancing and vibration isolation. The cage assembly includes small wheels to ease ground movement of the motor unit.\nAs is the case with all paramotors, take-off and landing is accomplished by foot. Inflight steering is accomplished via handles that actuate the canopy brakes, creating roll and yaw.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127533","title":"Haydock railway station","body":"\nHaydock railway station\n\nHaydock railway station served the village of Haydock, formerly in Lancashire, now in Merseyside), England.\nThe station was on the Liverpool, St Helens and South Lancashire Railway line from Lowton St Mary's to the original St Helens Central railway station where it was crossed by what is now the A599 in the centre of the village.\nEast of the station was the Haydock Colliery Tunnel, the only tunnel on the line. It was built at the railway's expense using the 'cut and cover' method. Its sole purpose was to burrow beneath Haydock Colliery's tracks.\nHistory.\nOpened by the Liverpool, St Helens and South Lancashire Railway, as part of the Great Central Railway, it became part of the London and North Eastern Railway during the Grouping of 1923. The line and station passed to the Eastern Region of British Railways on nationalisation in 1948, being transferred to the London Midland Region later that year.\nThe line through the station was originally double track and the station had two platforms. In the 1930s the down (St Helens-bound) track was changed into a long siding and all trains to and from St Helens used the up line. The station's down side shelter and signs were removed.\nServices.\nIn 1922 five \"down\" (towards St Helens) trains called at the station, Mondays to Saturdays. These called at all stations from Manchester Central to St Helens via Glazebrook and Culcheth. The \"up\" service was similar.\nBy 1948 four trains plied between St Helens Central and Manchester Central, calling at all stations, Monday to Friday, reduced to three on Saturdays. \nA fuller selection of public and working timetables has now been published. 
Among other things this suggests that Sunday services ran until 1914, but had ceased by 1922 never to return.\nClosure.\nThe station was closed to passenger traffic by the British Railways Board in 1952, though goods traffic through to St Helens lingered on until 1965, when the tracks west of Ashton-in-Makerfield were abandoned. A short stretch from Ashton through the Haydock station site to a new Shell distribution depot was reinstated in 1968. This ceased being rail-served in 1983, whereafter the line was cut back to Lowton Metals' scrapyard at Ashton. Tracks were eventually lifted. \nThe site today.\nBy 2003 modern housing had completely obliterated the station site.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127535","title":"2016 FedEx Cup Playoffs","body":"\n2016 FedEx Cup Playoffs\n\nThe 2016 FedEx Cup Playoffs, the series of four golf tournaments that will determine the season champion on the U.S.-based PGA Tour, will be played from August 25 to September 25. It includes the following four events:\nThese will be the tenth FedEx Cup playoffs since their inception in 2007.\nThe point distributions can be seen here.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127539","title":"Dave Porter (politician)","body":"\nDave Porter (politician)\n\nDave Porter is a former Canadian politician, who served in the Legislative Assembly of Yukon from 1982 to 1989. He was a member of the Yukon New Democratic Party.\nHe was first elected in the 1982 election as MLA for Campbell. He shifted to the district of Watson Lake for the 1985 election, in which he was reelected, and served as House Leader and Deputy Premier in the government of Tony Penikett.\nHe did not run for reelection in the 1989 election. He was then appointed as executive director of the Yukon Human Rights Commission.\nPorter later served as CEO of the BC First Nations Energy and Mining Council, and as chief negotiator for the Kaska Dena Council.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127546","title":"The Velours","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48127553","title":"Tokio Emoto","body":"\nTokio Emoto\n\n is a Japanese actor who is represented by the talent agency, Knockout.\nBiography.\nEmoto's father is Akira Emoto, his mother is Kazue Tsunogae, and his brother is Tasuku Emoto. He is left-handed.\nIn 2003, Emoto had his acting debut in the film, \"Jam Films S\".\nUp until around 2011, he maintained a part-time job in Shimokitazawa while acting. As of July 2015, his job was in a T-shirt shop.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127557","title":"P2P Global Investments","body":"\nP2P Global Investments\n\nP2P Global Investments () is a large British investment trust dedicated to investments in consumer and small and medium sized enterprise loans and in corporate trade receivables. Established in 2014, the company is a constituent of the FTSE 250 Index. The chairman is Stuart Cruickshank.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127571","title":"Vladimir Spirin","body":"\nVladimir Spirin\n\nVladimir Semionovich Spirin (Russian: Владимир Семёнович Спирин) (born May 5, 1929 - died May 17, 2002) was a Russian philologist, sinologist, historian, lecturer of Saint Petersburg State University, researcher at Saint Petersburg's branch of the Institute of Oriental Studies of the Russian Academy of Sciences, Saint Petersburg Russia, Candidate of Sciences (equiv. Ph.D.). His primary scientific interests resided in the field of classical Chinese philology and Chinese philosophy.\nBiography.\nDr. Spirin graduated in 1952 from the East Asian Studies Department at the Saint Petersburg State University and started to work as a researcher at Saint Petersburg's (then Leningrad) branch of the Institute of Oriental Studies of the Russian Academy of Sciences, where he worked until his death. Since 1957, he had been a member of the research group that worked on description of Dunhuang manuscripts, preserved in Russia (other members were Dr. Lev Menshikov, S.A. Schcolyar, etc.) In the 1960s, during the time of the Cultural Revolution, he conducted studies in China for nine months. He defended his doctoral thesis (Candidate of Sciences, Philosophy) in 1970, under the title of \"On Methodological Problems of Studying the Classic Chinese Philosophy: In Relation to the Analysis of Text Structures\". Since 1977 and until 1990s, he taught the Classic Chinese Philosophy to philosophy students at the Saint Petersburg State University, as an invited lecturer.\nHis main area of research had been methodological problems of studying classic Chinese texts. He developed an original structural approach to the texts, and discovered various types of textological structures in the classic Chinese culture. 
His method of graphic description of textual structures, providing simplicity and easy visualization, according to some researchers, reminds graphic methods of logical description such as Lambert's lines or Eiler's circles, as well as the implementation of graphic description in thermodynamics by Clapeyron. Spirin's work strongly influenced the study of Chinese culture in Russia, especially the younger generation of sinologists, working in Moscow (based in Leningrad he was not in permanent direct contact with these researchers). For example, according to A. Kobzev, Spirin's structural semiotic approach was intensively used by A.Karapetiantz. Spirin also influenced such Russian researchers as A.Kobzev, A.Krushinsky, M.Isayeva, V.Dorofeeva-Lichtman, etc.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127608","title":"Hungarian presidential election, 2000","body":"\nHungarian presidential election, 2000\n\nAn indirect presidential election was held in Hungary on 5–6 June 2000. The only candidate was legal scholar Ferenc Mádl, who was nominated by the first cabinet of Viktor Orbán, composing Fidesz, FKGP and MDF. The left-wing (MSZP and SZDSZ) and the far-right (MIÉP) opposition parties did not nominee a candidate. After three rounds, Mádl was elected President of Hungary, taking the office on 4 August in that year. \nFirst and second rounds.\nIn the first two rounds, two-thirds majority requirement needed to elect the president, according to the Constitution.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127617","title":"Av8er Limited","body":"\nAv8er Limited\n\nAv8er Limited () was a British aircraft manufacturer based in Woodford Halse, Northamptonshire and founded by Paul Taylor. The company specialized in the design and manufacture of paramotors in the form of ready-to-fly aircraft for the US FAR 103 Ultralight Vehicles and European rules.\nThe company seems to have been founded about 2001 and gone out of business in 2011.\nAv8er produced a range of paramotors noted for their lightness and attention to detail, in particular balancing and vibration isolating features. The models included the Explorer, Orbiter, Observer and Titan.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127634","title":"WD-40 Company","body":"\nWD-40 Company\n\nWD-40 Company is a San Diego, CA-based manufacturer of household chemicals, including its signature lubricant, WD-40, as well as 3-In-One Oil, Lava, Spot Shot, X-14, Carpet Fresh, and 2000 Flushes. It markets its products in more than 160 countries.\nHistory.\nRocket Chemical Company was founded in 1953. In 1969, John S. Barry, on becoming President and CEO, changed the name to \"WD-40 Company\" after what was then its only product. Barry, who died July 3, 2009, reportedly made the name change on the basis that the Rocket Chemical Company did not make rockets. The company went public in 1973. Its NASDAQ stock symbol is (). \nProducts.\nIn addition to its flagship WD-40 product, the WD-40 Company has acquired several household-products companies, adding such brand names as 3-In-One Oil, Lava, Spot Shot, X-14, Carpet Fresh, and 2000 Flushes to its roster.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127669","title":"Fenethazine","body":"\nFenethazine\n\nFenethazine (INN) (brand names Anergen, Contralergial, Ethysine, Etisine, Lisergan, Lysergan; former developmental code names RP-3015, SC-1627, WY-1143), also known as phenethazinum, is a first-generation antihistamine of the phenothiazine group. Promethazine, and subsequently chlorpromazine, were derived from fenethazine. Fenethazine, in turn, was derived from phenbenzamine.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127671","title":"1932–33 Connecticut Aggies men's basketball team","body":"\n1932–33 Connecticut Aggies men's basketball team\n\nThe 1932–33 Connecticut Aggies men's basketball team represented Connecticut Agricultural College, now the University of Connecticut, in the 1932–33 collegiate men's basketball season. The Aggies completed the season with a 4–12 overall record. The Aggies were members of the New England Conference, where they ended the season with a 0–4 record. The Aggies played their home games at Hawley Armory in Storrs, Connecticut, and were led by second-year head coach John J. Heldman, Jr..\nSchedule.\n!colspan=12 style=\"\"| Regular Season\nSchedule Source:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127674","title":"Paul Fouracre","body":"\nPaul Fouracre\n\nPaul J. Fouracre is professor of medieval history at the University of Manchester. His research interests relate to early medieval history, the history of the Franks, law and custom in medieval societies, charters, hagiography, serf-lord relations in the eleventh century, and the cost of the liturgy.\nFouracre was co-ordinating editor of \"Early Medieval Europe\" from 2005 to 2009 and editor of the first volume of \"The New Cambridge Medieval History\" (2005). He is editor of the \"Bulletin of the John Rylands Library\". He is a Member of the Chetham Society, serving as a Member of Council since 2004 and as President since 2005.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127710","title":"Hooton Tennis Club","body":"\nHooton Tennis Club\n\nHooton Tennis Club is a four-piece indie-rock band from the Wirral consisting of Ryan Murphy (vocals/guitar), James Madden (vocals/guitar), Callum McFadden (bass) and Harry Chalmers (drums) formed in 2013. They are signed to Heavenly Recordings and have released one album and a number of singles.\nBiography.\nThe band members first met in secondary school, although Madden and McFadden had known each other prior to that at primary school. Towards the end of 2013 the four began to write songs together. In January they were featured on the BBC Introducing in Merseyside, after which they were picked up by the not-for-profit The Label Recordings based at Edge Hill University. They recorded a four-track EP \"I Was a Punk in Europe (But My Mum Didn’t Mind)\", which was described as \"\"'trash-indie psychedelic'. In September 2014 it was announced that the band had signed with Heavenly Recordings. In February 2015 they released their first single \"Jasper/Standing Knees\". It was followed by second single, \"Kathleen Sat On The Arm Of Her Favourite Chair\". Their debut album \"Highest Point In Cliff Town\" was produced by Bill Ryder-Jones. The name of the band was taken from a tennis courts in Little Sutton. The band have played headlining shows around the UK and Europe.\nDiscography.\nAlbums.\n\"Highest Point In Cliff Town\" (2015, Heavenly Recordings)\nEPs.\n\"Long-Barrelled Saturday\" (2013)\n\"I Was A Punk In Europe (But My Mum Didn’t Mind)\" (2013)\n\"Oh Phantom, Please Don't!\" (2014 as \"Hootin' Terrors Klub\")\nSingles.\n\"Jasper/Standing Knees\" (2015)\n\"Kathleen Sat On The Arm Of Her Favourite Chair\" (2015)\n\"P.O.W.E.R.F.U.L. P.I.E.R.R.E.\" (2015)\n\"Barstool Blues\" (by Neil Young) (split with The Wytches) (2015)\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127715","title":"St. Lucie Canal (C-44)","body":"\nSt. Lucie Canal (C-44)\n\nThe St. Lucie Canal (C-44) is a man-made canal built in 1916 in Martin County, Florida to divert floodwaters from Lake Okeechobee via the canal to the South Fork of the St. Lucie River and into the St. Lucie Estuary, a component of the Indian River Lagoon, which connects to the Atlantic Ocean. Resulting from this connection, restoration projects in the St. Lucie River are the northernmost component of the Comprehensive Everglades Restoration Plan.\nThe C-44 has been a source of contention since its construction in 1916.\nThere are three major structures along the C-44: the S-308 lock and dam structure; the S-153 structure; and S-80 lock and dam structure. The St. Lucie Canal (C-44) can be referred to as the St. Lucie Canal, C-44, C-44 Canal, or the Okeechobee Waterway. The C-44 has a drainage basin of 185 square miles.\nHistory.\nConstruction began on the St. Lucie Canal (C-44) in 1916 and was completed in 1924. The original purpose of the canal was to allow for an improved way to divert floodwaters from Lake Okeechobee. The canal was originally designed to flow into Manatee Pocket instead of the South Fork of the St. Lucie River.\nRecords indicate that people have been complaining about the impacts of the C-44 since the early 1950s.\nDescription.\nThe St. Lucie Canal (C-44) connects to Lake Okeechobee at Port Mayaca. The capacity for the St. Lucie Canal (C-44) is 8 feet and 9,000 cubic feet per second; the result of a the St. Lucie Canal (C-44) second deepening in 1949. In 1933, 16 fixed spillways were approved for construction to reduce shoaling.\nMajor Structures.\nS-308.\nThe S-308 lock and dam structure is located at the western end of the St. Lucie Canal (C-44) and connects to the shore of Lake Okeechobee.\nS-153.\nThe S-153 is designed to discharge into the St. Lucie Canal (C-44). 
The S-153 regulates water levels in the Levee 65 Borrow Canal The Levee 65 Borrow Canal is located on the edge of Lake Okeechobee and north of the St. Lucie Canal (C-44).\nS-80.\nThe S-80 structure is a lock and dam structure located at the eastern end of the St. Lucie Canal (C-44). This structure was completed in 1944.\nWater Flows.\nAccording to the Florida Department of Environmental Protection, the St. Lucie Canal (C-44) flows both east to the St. Lucie Estuary and west to Lake Okeechobee \"on about an equal basis.\"\nIn 1924, the original flow capacity was 5,000 cubic feet per second. \nIn 1937, the canal was deepened to 6 feet to provide a navigable passage to Lake Okeechobee, and the flow capacity is unknown to this author.\nIn 1949, the canal was deepened to 8 feet, which increased the flow capacity to 9,000 cubic feet per second.\nEnvironment.\nOne of the major problems resulting from C-44 is too much freshwater discharged from C-44 to the St. Lucie Estuary to control the water levels of Lake Okeechobee.\nEstuary Salinity.\nLarge discharges from Lake Okeechobee into C-44 cause salinity levels to drop rapidly, killing many species in the estuaries.\nTurbidity.\nHigh flow rates result in erosion and the transport of sediment into the estuary that can smother benthic habitats. The increased turbidity also results in sediment filling navigation channels.\nC-44 Basin.\nThe C-44 Basin is 117,000 acres. Drainage from these acres into the St. Lucie Canal also create water quality problems for the St. Lucie Estuary.\nNavigation.\nIn 1937, the St. Lucie Canal (C-44) was deepened to 6 feet.\nThe St. Lucie Canal (C-44) connects to the Caloosahatchee Waterway, which connects Lake Okeechobee to the Gulf of Mexico at Fort Myers, Florida.\nTimeline.\n1916: Construction begins on St. Lucie Canal (C-44).\n1924: Original construction is completed, providing a flow capacity of 5,000 cubic feet per second.\n1937: the St. 
Lucie Canal (C-44) was deepened to 6 feet to allow for vessel navigation to and from Lake Okeechobee. 1949: the canal was deepened to 8 feet, which increased the flow capacity to 9,000 cubic feet per second.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127775","title":"Joseph Kenneth Ssebaggala","body":"\nJoseph Kenneth Ssebaggala\n\nJoseph Kenneth Ssebaggala \"Joseph S KEN\" (born 1983) is a Ugandan film director, screenwriter. In 2008 he started taking film training and workshops, like the Durban Talent Campus 2011. As a writer, producer and director he runs a film company called Zenken Films, under which he has produced two of his feature films: Master on Duty and That Small Piece. He is the recent winner of Best Director in the 2015 Uganda Film Festival with his House Arrest. He's is yet to direct the first Ugandan erotic film Not Just a Boy in which he is rumored to cast screenwriter-cum-actor Usama Mukwaya.\nHis 2015 Call 112 and House arrest were nominated in the 2016 AMVCA for best East African film, Best Lighting, and overall film of the year making him the most nominated Uganda so far in the Awards.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127784","title":"Gallot","body":"\nGallot\n\nGallot is a surname. Notable people with the surname include:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127802","title":"Charles F. Orthwein","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48127821","title":"1933–34 Connecticut Aggies men's basketball team","body":"\n1933–34 Connecticut Aggies men's basketball team\n\nThe 1933–34 Connecticut Aggies men's basketball team represented Connecticut State College, now the University of Connecticut, in the 1933–34 collegiate men's basketball season. The Aggies completed the season with a 5–10 overall record. The Aggies were members of the New England Conference, where they ended the season with a 1–2 record. The Aggies played their home games at Hawley Armory in Storrs, Connecticut, and were led by third-year head coach John J. Heldman, Jr.\nSchedule.\n!colspan=12 style=\"\"| Regular Season\nSchedule Source:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127861","title":"Bakhtiyar Duyshobekov","body":"\nBakhtiyar Duyshobekov\n\nBakhtiyar Duyshobekov (born 3 June 1995) is a Kyrgyzstani footballer who plays as a Midfielder for Abdysh-Ata Kant and Kyrgyzstan.\nCareer Statistics.\nInternational.\n\"Statistics accurate as of match played 17 November 2015\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127862","title":"Ladmirault","body":"\nLadmirault\n\nLadmirault is a surname. Notable people with the surname include:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127906","title":"Longspring Wood","body":"\nLongspring Wood\n\nLongspring Wood is a 1.2 hectare nature reserve managed by the Herts and Middlesex Wildlife Trust in Kings Langley in Hertfordshire.\nThe main trees in this small wood are oak, ash, wild cherry and hazel, and there is a display of bluebells in the spring. Birds include warblers, finches and tits, and there are mammals such as foxes and badgers.\nThere is access by a footpath between houses in Toms Lane.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127927","title":"Raycen Raines","body":"\nRaycen Raines\n\nRaycen AmericanHorse Raines: Navy Veteran, Entrepreneur and Businessman. Enrolled member of the Oglala Sioux Tribe and advocate for local grass roots Tribal and community economic development. \nProfessional Background\nAfter serving in the US Navy as a young man, Raines has settled into his grandfather’s footsteps as a Native businessman and advocate for Native American social issues. Raines has been in the financial and insurance industry since 2000 and has been working towards economic development specific to Indian Country since 2005.\nEarly in his career Raines focused on personal finance for individual Native Americans. Specifically, on programs which focus on Native American health care, insurance, retirement, and long term care with Retirement Protection Strategies, Inc. The company provided financial planning for in Native American communities, with the goal of bringing self-reliance to Native American communities through a combination of traditional strategies and modern business concepts.\nUnder the mentorship of many well-known leaders in Tribal economic development and finance, such as financier Valerie Red Horse and attorney Dennis Ickes, Raines transitioned away from personal finance to tribal finance and economic development. Developing expertise in a variety of tribal economic development vehicles such as Tribal Section 17 corporations, Tribal Economic Development Bonds, and federal 8(a) contracting preferences.\nRaines served a Project Director for Nations Business Group, a business development firm located in Washington, DC lead then by tribal business leader Pete Homer. 
Raines was an advocate of the firm’s regional development model that worked with local tribal businesses to identify new revenue streams, and to obtain federal contracts though the SBA 8(a) program, backed with partnerships from major corporations.\nIn 2012 Raines decided to take his unique set of Tribal economic development skills back to his father’s reservation, the Pine Ridge\nIndian Reservation, and work more directly on tribal community economic development. Raines lives in the Wakpamni Lake Community on the Pine Ridge Indian Reservation and serves as an economic development consultant to the local tribal municipal government.\nPersonal Background \nBorn on October 23, 1975 in Salem, Oregon and raised primarily in Juneau, Alaska where his mother worked for the Indian Health Service. All four of Raines’s grandparents were teachers at the Chemewa Indian School in Oregon, where his parents subsequently met. Raines’s mother, Elizabeth Coburn, was born to Blackfeet (Margaret Pepion) and Klamath (Joseph Francis Coburn) parents, and is now with the Bureau of Indian Affairs (BIA). Raines’s father, William Clifford Ballard, was born to Oglala Sioux (Evelyn Clifford) and Cherokee (John K. Ballard) parents, and currently with the Indian Health Service (IHS).\nRaines was greatly influenced by his grandparents and elders who served as tribal chairmen, council members, and Native entrepreneurs and business leaders. His grandmother’s sister, Eloise Cobell, (of the $3.4 billion Cobell settlement) helped encourage and guide him towards his efforts in economic development. His maternal grandfather Joseph Coburn was a Klamath tribal chairman and helped lead the restoration of the Klamath tribe.\nRaines was predominately raised by his mother, step-father Chris Rummell, and maternal grandparents. A strained relationship with his birth father eventually led to Raines changing his surname. 
Raines’ is also a member of the Blue Bird family of the Wakpamni Lake Community.\nCriticism.\nRaines was under scrutiny when he began pursuing online payday lending as a means of bringing in more money for the Pine Ridge Reservation. However, many members of the Wakpamni Native American community feel the negative attention towards Raines is a fear campaign, because the tribe is attempting new economic strides. While a lawsuit was filed and an initial judgment was awarded to the Black Hills Sioux Nation Treaty Council on January 18, 2015, the judgment and restraining order were subsequently reversed and dropped on June 28, 2015 and formal apologies were issued to Raycen Raines and his partners (Docket # CIV-11-0359K of the Oglala Sioux Tribal Court). \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127930","title":"1934–35 Connecticut State Huskies men's basketball team","body":"\n1934–35 Connecticut State Huskies men's basketball team\n\nThe 1934–35 Connecticut State Huskies men's basketball team represented Connecticut State College, now the University of Connecticut, in the 1934–35 collegiate men's basketball season. This was the first year that the team was named the Huskies. The Huskies completed the season with a 7–8 overall record. The Huskies were members of the New England Conference, where they ended the season with a 1–2 record. The Huskies played their home games at Hawley Armory in Storrs, Connecticut, and were led by fourth-year head coach John J. Heldman, Jr..\nSchedule.\n!colspan=12 style=\"\"| Regular Season\nSchedule Source:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127932","title":"Them Boys","body":"\nThem Boys\n\n\"Them Boys\" is a song co-written and recorded by American country rock artist Brantley Gilbert. It was released in January 2011 as the second single from his second studio album \"Halfway to Heaven\". Gilbert wrote the song with Colt Ford and Mike Dekle.\nContent.\nThe song is a country rock song about observing a younger generation not understanding life. Towards the end, the narrator realizes his grandparents would've also said the same thing.\nCritical reception.\nIn her review of the album, Sarah Wyland of \"CountryMusicOnline.net\" gave the song a positive review, praising the lyrics and writing that \"“Them Boys” is another co-write with Dekle and Ford about 'those boys' that ride up and down Main Street with their music turned up and not a care in the world. It is a more mainstream sounding track that ends with 'them boys' reminiscing about days gone by while sitting around the wood stove in the hardware store. The album is dedicated to Brantley's grandfather and it's worth wondering if “Them Boys” is, at least in some way, about him.\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127941","title":"2016 BMW PGA Championship","body":"\n2016 BMW PGA Championship\n\nThe 2016 BMW PGA Championship will be the 62nd edition of the BMW PGA Championship, an annual golf tournament on the European Tour, held 26–29 May at the West Course of Wentworth Club in Virginia Water, Surrey, England, a suburb southwest of London.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127945","title":"Reversion (2015 film)","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48127960","title":"2014 FA Women's Cup Final","body":"\n2014 FA Women's Cup Final\n\nThe 2014 FA Women's Cup Final was the 44th final of the FA Women's Cup, England's primary cup competition for women's football teams. The showpiece event was the 21st to be played directly under the auspices of the Football Association (FA). The final was contested between Arsenal Ladies and Everton Ladies on 1 June 2014 at in Milton Keynes. Holders Arsenal made its 14th final appearance, after winning the 2013 final. Everton was appearing in its fifth final.\nAs FA WSL 1 clubs, both teams entered the competition at the fifth round stage. Arsenal beat Gillingham (2–0), Birmingham City (2–1) and Chelsea (5–3) to reach the final. Everton defeated Cardiff City (3–1), Liverpool (2–0) and Notts County (2–1). \n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127961","title":"Norway (song)","body":"\nNorway (song)\n\n\"Norway\" is a song by American dream pop band Beach House, from their third studio album, \"Teen Dream\". The song was released on January 18, 2010, with \"Baby\" as its B-side. The song was released as a free download on the band's site on November 17, 2009, before its commercial release.\nReception.\n\"Norway\" received very positive reviews from contemporary music critics. The song was chosen upon release as Pitchfork Media's \"Best New Track\". Aaron Leitko stated that, \"'Norway', the lead track from \"Teen Dream\", the duo's Sub Pop debut, raises the temperature a few degrees. A percussive intro yields to an explosion of twinkling guitars and a chorus of woozy backing vocals. The core elements of Beach House's sound-- the drum machine, the thrift store keyboards-- are still present; they're just a few ticks faster. This makes a big difference. As it turns out, Beach House goes from dour to exuberant in just a few BPM.\" Leitko continues by saying, \"Legrand, whose vocals have been saddled with Nico comparisons, can finally breathe a sigh of relief, too. The 1960s chanteuse's shadow is nowhere to be found here. 'You let us in the wooden house/ To share in all the wealth,' sings Legrand over a carsick slide guitar riff. No, 'Norway' is radiant with the sunshiny 70s pop vibes. It's Stevie Nicks territory, for sure. Climate change has come to Beach House, and the weather suits them beautifully.\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48127978","title":"Golden Lotus Award for Best Supporting Actress","body":"\nGolden Lotus Award for Best Supporting Actress\n\nGolden Lotus Award for Best Supporting Actress () is the main category of Competition of Golden Lotus Awards. Awarding to supporting actress(es) who have outstanding performance in motion pictures.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128004","title":"Irving Bibo","body":"\nIrving Bibo\n\nIrving Bibo (August 22, 1889 – May 2, 1962) was an American composer and songwriter. He wrote tunes for the Ziegfeld Follies (among them, \"Huggable, Kissable You\", \"Forever and a Day\" and \"Cherie\"), Greenwich Village Follies and other theatrical productions in the 1920s, scores for more than 300 motion pictures, and college songs.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128005","title":"1957 U.S. National Championships – Women's Singles","body":"\n1957 U.S. National Championships – Women's Singles\n\nFirst-seeded Althea Gibson defeated second-seeded Louise Brough 6–3, 6–2 in the final to win the Women's Singles tennis title at the 1957 U.S. National Championships.\nSeeds.\nThe seeded players are listed below. Althea Gibson is the champion; others show in brackets the round in which they were eliminated.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128008","title":"Toll of the Desert","body":"\nToll of the Desert\n\nThe Toll of the Desert is an American Western film starring Fred Kohler, Jr.\nPlot.\nWhen a cowboy's family is killed by Indians, he becomes an outlaw and hired gunman. Unbeknownst to him, his son survives the Indian attack and grows up to become a lawman who eventually has to hunt down his outlaw father.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128021","title":"1606 in Sweden","body":"\n1606 in Sweden\n\nEvents from the year 1606 in Sweden\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128036","title":"I-70 Killer","body":"\nI-70 Killer\n\nThe I-70 killer is an unidentified American serial killer who is known to have killed six store clerks in the Midwest in the spring of 1992. His nickname derives from the fact that several of the stores in which his victims worked were located a few miles off of Interstate 70 (I-70).\nHis victims were usually young, petite, brunette women. One of his victims was a man but he is believed to have mistaken the man for a woman as he often wore a ponytail. All of the stores attacked were speciality stores and were usually only robbed of a few hundred dollars. He is also suspected of shooting 3 more store clerks in Texas during 1993 and 1994, one of whom survived.\nDespite the case being featured on Unsolved Mysteries and Dark Minds, the killer has yet to have been identified and investigators have not publicly identified any suspects.\n1992 murder spree.\nThe killing spree began on April 8, 1992 with the murder of 26-year-old Payless ShoeSource manager Robin Fuldauer in Indianapolis. She was alone at the time of being shot and was murdered sometime between 1:30 and 2:00 p.m.\nThe next two murders occurred on April 11 at the La Bride d’Elegance bridal shop in Wichita. The victims were Patricia Smith, 23 and the store's owner, 32-year-old Patricia Majors. As this was the only case involving multiple victims, investigators believe the killer thought there was only one woman in the store. The women had stayed past normal closing time of 6 p.m. to allow a male customer to pick up a cummerbund. Sometime after 6 p.m., the women allowed the killer into the store, thinking he was the customer. After the women were murdered, the actual customer arrived to pick up the cummerbund and came to face-to-face with the I-70 killer. The I-70 killer let the man go,\nwho immediately notified police once the killer left. 
He would later provide details for a composite sketch.\nOn April 27, Michael McCown, 40, was killed in his mother Sylvia's ceramics store in Terre Haute, Indiana. McCown was the only man killed during spree and it is believed by investigators that the I-70 killer mistook him for a woman because of the store's name and because McCown wore a ponytail\nOn May 4, 24-year-old Nancy Kitzmiller was killed while working alone at Boot Village, a footwear shop in St. Charles, Missouri. She opened up the shop at noon and was found dead by customers at 2:30 p.m.\nThe final confirmed murder occurred on May 7 in Raytown, Missouri. The victim was 37-year-old Sarah Blessing who was working in her gift shop, Store of Many Colors. The murder occurred during the day, and the owner of video store next to the Kitzmiller's shop saw the killer enter the shop, heard a pop, and saw the killer leave. He then discovered Blessing's body after checking to see what had occurred in the store. A clerk at a nearby grocery store also saw the killer and saw him climbing a hill towards I-70 after the murder.\nPossible murders in Texas.\nInvestigators believe the I-70 killer may be responsible for two murders in 1993, and an attempted murder in 1994, all of which occurred in Texas. The two murder victims were 51-year-old Mary Ann Glasscock, who was killed on September 25, 1993 in Fort Worth at the Emporium Antiques store, and 22-year-old Amy Vess, who was shot dead in a dance apparel store in Arlington on November 1.\nThe surviving victim was Vicki Webb, 35, who was shot on January 15, 1994 in Houston at the Alternatives gift shop. She briefly talked to the shooter before he shot her in the back of the head. The bullet did not penetrate into Webb's head due to a large vertebra being hit. 
The shooter attempted to shoot her again, but his gun misfired, and left presuming Webb to be dead.\nThe modus operandi of the Texas killer was very similar to the I-70 killer and used a .22-caliber firearm, the same caliber as the I-70 killer. However, ballistics test determined that gun used in the Texas murders was not the same as the one used in the I-70 killings, so investigators have not been able to confirm that the I-70 killer was responsible for the shootings in Texas.\nInvestigation.\nThe murders were conclusively linked after a St. Charles detective suspected a connection. All of the murders were committed with a .22-caliber firearm and the victims were usually petite, young women with long dark hair. Aside from the Wichita murders, all the victims were alone while murdered and shot in the back of the head. None of the scenes had any signs of sexual assault and while all stores were robbed, robbery appeared to be a secondary motive as all the stores were small speciality stores, which would not have had as much money as larger stores.\nBased on witness testimonies, police strongly believe the murder weapon may have been an Intratec Scorpion pistol or an Erma Werke ET22 pistol, however they have not been able to rule out any other .22-caliber firearm models. The ammunition used in the killings was .22-caliber CCI copper-clad lead bullets. The cartridges of the bullets had been polished with jeweler's rouge.\nMidwest authorities linked the killer to the shootings in Texas in 1994, but Texas authorities were not convinced of a connection as different guns were used in each spree.\nBased on witness descriptions, investigators were able to produce to two composite sketches of the killer and a physical description of the suspect. The I-70 killer was described as being a white man in his twenties or thirties, 5'7\" (1.70 m) to 5'9\" (1.75 m) tall, thin and having lazy eyelids and sandy blond or reddish hair in 1992. 
If he still alive, he would be in his fifties or late forties.\nPolice have not publicly identified any suspects and the case has been classified as a cold case.\nPopular culture.\nThe case has been featured on \"Unsolved Mysteries\" and Investigation Discovery's \"Dark Minds\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128090","title":"Ronen Shilo","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48128094","title":"Brent Bailey","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48128109","title":"1958 U.S. National Championships – Women's Singles","body":"\n1958 U.S. National Championships – Women's Singles\n\nFirst-seeded Althea Gibson defeated Darlene Hard 3–6, 6–1, 6–2 in the final to win the Women's Singles tennis title at the 1958 U.S. National Championships.\nSeeds.\nThe seeded players are listed below. Althea Gibson is the champion; others show in brackets the round in which they were eliminated.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128110","title":"Kainton, South Australia","body":"\nKainton, South Australia\n\nKainton is a small town situated about 10 km south of Paskeville in the upper Yorke Peninsula.\nThe Kainton school closed in 1907, but the \"Hundred of Clinton School\" was renamed \"Kainton School\" in 1915.\nKainton is located within the federal Division of Grey, the state electoral district of Goyder and the local government area known as the Yorke Peninsula Council.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128127","title":"Jay Karas","body":"\nJay Karas\n\nJay Karas is American film director and television director. His resume primarily consists of directing live telecasts and stand-up comedy specials. In recent years he moved on to directing episodic television, directing episodes of \"Parks and Recreation\", \"Raising Hope\", \"Awkward\", \"The Fosters\", \"Brooklyn Nine-Nine\" and \"Workaholics\".\nIn 2014, Karas made his feature film directing debut with the film \"Break Point\", starring Jeremy Sisto and David Walton.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128138","title":"Sergey Nikolaev (cyclist)","body":"\nSergey Nikolaev (cyclist)\n\nSergey Nikolaev (born February 5, 1988 in Moscow) is a Russian cyclist riding for Itera-Katusha.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128226","title":"Daniella Smith","body":"\nDaniella Smith\n\nDaniella Smith (born July 30, 1972, Kaikohe, New Zealand) is a New Zealand former professional boxer, the first International Boxing Federation Women's World Champion and is the second New Zealand born person to win a boxing world title. Smith is also ranked pound-for-pound number one in New Zealand of all time in the Women devision.\nIn 1999, Smith started her career as an amateur. In a space of six years she has fought in forty fights, winning multiple titles including the gold at the national championships four times. She also competed in 2002 World Championships in Turkey, even though she was not successful on winning a medal, she still won a gold medal in 2004 at the Oceania Games. In 2005 Smith made her pro debut against World Kicking Champion Sue Glassey. In 2006, Smith won against Glassey for the second time, but this time to capture her first pro boxing title (vacant NZPBA Women's light middleweight title). In 2010, Smith fought for the first time as a pro outside New Zealand, winning against Jennifer Retzke in Germany and becoming the first International Boxing Federation Women's World Champion. Smith defended her title against Noni Tenge in South Africa seven months after winning the title, but lost the bout. In 2013 Smith attempted to capture her second world title against Arlene Blencowe for the vacant Women's International Boxing Association World super lightweight title and the vacant World Boxing Federation female welterweight title, but Smith was unsuccessful in capturing the titles. In 2014, Smith fought her last fight against Gentiane Lupi. This is the second time that Smith has fought Lupi, but this time for the vacant NZPBA women's lightweight title, but Smith was unsuccessful. These days Smith co-owns a boxing gym called Boxing Alley. Smith also trains corporate and amateur boxers.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128230","title":"Villa Madero","body":"\nVilla Madero\n\nVilla Madero is a town in the Madero Municipality, in the State of Michoacán, Mexico. Established in 1868 with the name of Cruz De Caminos. According to tradition the first inhabitant of the place was a man named Armas, he is now considered the town's founder. The land where the town currently sits belonged to La Hacienda De La Concepcion. The village is the point of intersection of the paths that lead to Acuitzio, Etucuaro, Curuchancio and Tacambaro, this is why it became known as Cruz De Caminos (Cross Roads).\nCruz De Caminos, was in 1901 part of Acuitzio Del Canje. On July 27, 1914, Cruz De Caminos applied under the Municipality Erection Act. On October 12, 1914, the agreement to raise it to a municipality with the name of Madero was ratified.\nIn present time, Villa Madero is becoming famous due to a great festival named \"La Feria del Mezcal\". This is about a traditional beverage \"mezcal\" produced in Etucuaro, a town that is part of the Madero municipality. During this festival, producers give free samples of their product. There is also a grand vast of traditional food stands, different sports activities, a parade and at night people gather in a ballroom to dance with live music.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128255","title":"Myth (song)","body":"\nMyth (song)\n\n\"Myth\" is a song by American dream pop band Beach House, from the band's fourth studio album, \"Bloom\". The song was released as a single on March 26, 2012. The song surfaced on the band's website on March 7, 2012, before its commercial release.\nReception.\n\"Myth\" received very positive reviews from contemporary music critics. The song was chosen upon release as Pitchfork Media's \"Best New Track\". Larry Fitzmaurice stated that, \"On a surface level, there's no mistaking \"Myth\" for a Beach House song. All the sonic elements that have travelled with the Baltimore dream-pop duo during their steady ascent over the last five years are intact: Alex Scally's narcotic guitar, a steady backbeat, and Victoria Legrand's smoky ache of a voice. What sets \"Myth\" as another sonic evolution for Beach House, then, is all in the details.\" Fitzmaurice continues by saying, \"The layers of echo surrounding Legrand's voice during its chorus, as well as the gauzy glow wrapped around everything, give the impression that the airy expansiveness of 2010's Teen Dream has contracted, but somehow the sound is just as \"big\", if not bigger, than before. \"What comes after this momentary bliss?\" Legrand croons at one point. Hopefully, we'll find out soon enough.\"\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128284","title":"The Escape (1939 film)","body":"\nThe Escape (1939 film)\n\nThe Escape is a 1939 American action film directed by Ricardo Cortez and written by Robert Ellis and Helen Logan. The film stars Kane Richmond, Amanda Duff, June Gale, Edward Norris, Henry Armetta and Frank Reicher. The film was released on October 6, 1939, by 20th Century Fox.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128298","title":"David Bain (disambiguation)","body":"\nDavid Bain (disambiguation)\n\nDavid Bain is a New Zealand man who was acquitted of murder in 2009. The name may also refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128318","title":"Moyer's Landfill","body":"\nMoyer's Landfill\n\nMoyer's Landfill was a privately owned landfill in Collegeville, Pennsylvania, United States. It was originally farmland outside the town. In the 1940s the owner started accepting trash and municipal waste as a way to make additional money. The original landfill was 39 acres and did not have a liner to protect the land from contaminate. A liner was added to a new section in the late 1970s. Over time, the landfill accepted sewage, and industrial wastes which contained hazardous substances in addition to municipal waste. The site was closed by the EPA in 1981, and was one of the first \"Superfund\" sites added to the National Priorities List.\nHistory.\nThe Site had been operating as a municipal landfill from the early 1940s until April 1981. The landfill accepted municipal waste, sewage, and a variety of solid and liquid hazardous wastes (e.g. polychlorinated biphenyls (PCBs), products containing dioxin, paint solvents, and similar material). The original landfill was a section of the farm with no liner to prevent material from seeping into the soil. In the original landfill any waste was simply dumped and covered with dirt.\nIn 1972 when the Pennsylvania Department of Environmental Protection () rules became more restrictive, the site was cited for violations. To achieve compliance, pipes were added to drain leachate to two earthen basins which were pumped into trucks for treatment and disposal. Due to leakage from the basins, the system was modified to pump all the leachate to a concrete basin where it was sprayed over the top of the landfill.\nIn the late 1970s, the landfill owners submitted a request to enlarge the landfill which was granted. Work started to enlarge the landfill in 1977, and included an asphalt liner to protect the soil from hazardous materials. 
Dumping was reportedly limited to this new area from 1977 to early 1981.\nBefore remediation, contaminants were spread by rain water soaking into the landfill, some of which may have reached the ground water. Run-off from the landfill also carried contaminates to local streams (Skippack Creek and Perkiomen Creek).\nLocal residents tried for years to get the landfill closed. In the late 1970s 450 families united to try to close what they called \"Mount Trashmore\". They packed the local zoning board meetings, wrote letters to several environmental protection agencies, and had lawn signs printed up to close the dump.\nIn the lawsuit \"O'LEARY v. Moyer's Landfill, Inc., 523 F. Supp. 642 (E.D. Pa. 1981)\" it states \"this suit was brought in part because DER has, in plaintiffs' view, been ineffective in alleviating the dangers plaintiffs perceive at the landfill\".\nThe site was finally closed by the PA DEP in early 1981.\nExtent of the contamination.\nAnalysis of the leachate dates back to 1972, this analysis was conducted to design an aerated lagoon to treat the liquid. After being designated a Superfund site, tests found heavy metals and organic chemicals. These chemicals included Benzene, toluene, Trichloroethylene, tetrachloroethylene and chlorobenzene. All of which are associated with industrial solvents. Samples from the landfill had a total of 86 priority pollutants and 16 metals. Water samples were taken from the Skippack and Perkiomen Creeks and chemicals found in the landfill were also found in both streams. A remediation study was funded at a total cost of $681,000\nThe result of the remediation survey in 1985 an estimate was made that the cost of a cleanup would be $15 million and an additional $340,000 a year for operation and maintenance. By 1994 the price tag has been increased to $45 million for the cleanup.\nCompletion.\nOn May 27, 2014 The Environmental Protection Agency (EPA) region III removed Moyer's Landfill from the National Priorities List. 
The site is no longer considered a Superfund site. The site consists of open land surrounded by trees on steep slopes. The landfill is fenced off and has leachate collection tanks. There are no development plans.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128332","title":"Lunch Time Heroes","body":"\nLunch Time Heroes\n\nLunch Time Heroes is a 2015 Nigerian family comedy film directed by Seyi Babatope, and starring Dakore Akande, Omoni Oboli, Diana Yekinni, Tina Mba and Tope Tedela.\nThe film tells the story of Banke (Diana Yekinni), a corp member who has been posted to teach in a high school, and she has to gain the respect and attention of students and faculty that don’t want her around.\nProduction and release.\n\"Lunch Time Heroes\" was shot in Lagos for 16 days. Some of the child actors used in the film were sourced through local churches, and none had a previous professional acting experience. Before the commencement of principal photography, the director, Babatope had got the child actors on film set to play around, in order to desensitize them to the cameras, dollies, cables, lights and the peculiarities of filming environment.\nOnset photos for \"Lunch Time Heroes\" was released to the public online in March 2015. Trailer for the film was released in July 2015. It premiered at FilmHouse Cinema, Surulere, Lagos on 23 August 2015; with general theatrical release on 28 August 2015. The theme soundtrack for the film, titled \"I Believe\" by Capital Femi, was released online on 28 August 2015, along with its music video, which features the casts of the film.\nCritical reception.\nThe film has been met with mixed critical reception. Amarachukwu Iwuala of \"360Nobs\" commends the film's screenplay, character development and soundtrack, but criticizes the film for having several inconsistencies in its storytelling. She concludes: \"Much as the story of \"Lunch Time Heroes\" is foreseeable, owing to the title of the film and the information on the promotional materials, one nevertheless enjoys the journey that leads to the final destination\". Yvonne Anoruo praises the soundtrack, but notes the lack originality, and several inconsistencies. 
She comments: \"\"Lunch Time Heroes\" comes with a very simple plot, and with very predictable twists and turns. It is so focused on staying true to its subject matter and with rather rigid dialogues that it is altogether stiff. At the end of it, one realises that save a few characters, the others are largely flat. There were a lot of improvisations in measures that takes away from the movie. The final product does not elicit any feelings beyond the ordinary and if any, it totters on the edge of basic. Ultimately, for what it lacks everywhere else, the movie makes up for with very adorable child actors\". Jite Efemuaye comments: \"\"Lunch Time Heroes\" is a good effort which is undermined by a less than dedicated attention to detail on the director’s part. Even with all its limitations, it is an entertaining movie, one that can be enjoyed by all members of the family, but it is easily forgettable\". Yvonne Williams of \"Nollywood Observer\" comments: \"Although \"Lunch Time Heroes\" wows with its uncommon storyline and brilliant performances from Dakore Akande and Tina Mba, it falls short in its delivery – somewhat un-contagious forced humour, thinness of the plot, overacting amongst other things. However, it no doubt would be a welcome delight for the youth and the young at heart\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128374","title":"Borgeaud","body":"\nBorgeaud\n\nBorgeaud is a surname. Notable people with the surname include:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128380","title":"Maelifell","body":"\nMaelifell\n\nMount Mælifell, also called as Measure-Hill, is located in Southern Iceland and is about 800 meters tall.\nMount Mælifell is reachable only by a four-wheeled vehicle and is on the southern Fjallabak road next to the glacier Mýrdalsjökull, the road is usually wet and sometimes completely flooded.\nIt is listed as one of the amazing places on the earth by \"Amazing places on earth\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128387","title":"Svetislav Tisa Milosavljević","body":"\nSvetislav Tisa Milosavljević\n\nBan Svetislav Tisa Milosavljević, or Бан Светислав Тиса Милосављевић, (Born in Niš on 7. 9. 1882 - Died in Belgrade on 28. 7. 1960) was a military architect. He was the eldest son of a wealthy Niš dealer Tome Milosavljevic and his wife Basil Popović. \nMilitary career.\nSvetislav planned to become an engineer, but his father's financial collapse forced him into the military profession. He became an authority on military traffic, while advancing at the end of 1925 to the rank of Brigadier General.\nBanja Luka.\nHe came to Banja Luka on 8 November 1929. In a short time with a substantial state financial aid he helped develop the Banovina, and in particular Banja Luka.\nHis greatest accomplishments include the Banska Palace (now the city administration), Governor's Palace, the Theatre (founded in 1930 and today's building built 1934), Public Health Institute, the facilities and the Teacher's School of Agriculture, the east wing of the then Grammar School, and seven residential buildings for officers (in today's Alley St. Sava and at the Post Office). He helped establish the Banate Museum, Association for Tourism and Craft and the Chamber of Commerce.\nAlthough not a direct investor, builder or founder, Milosavljevic gained credit for the emergence of the Banja Luka town park with a monument to Peter Kocic, for upgrading the hotel Bosnia, paving and street lighting and construction of Sokolski Dom, City Municipality and the Hotel Palace.\nAfter becoming viceroy, Milosavljevic only once visited Banja Luka - Ascension Day, May 18, 1939, when he accepted the invitation of the Banja Luka Orthodox parish and came to the cathedral shrine.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128396","title":"HD 164595 b","body":"\nHD 164595 b\n\nHD 164595 b is a confirmed exoplanet orbiting around the Sun-like star HD 164595 every 40 days some 94.36 light-years away. It has a mass of 16 Earth masses, most likely due to its high mass it could be a Mini-Neptune, however depending on the planet's density it could be a Mega-World that could be like a terrestrial planet or it could be made out of volatile compressed into a solid form.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128399","title":"ID Dunedin Fashion Week","body":"\nID Dunedin Fashion Week\n\niD Dunedin Fashion Week is an annual festival of fashion held in the New Zealand city of Dunedin, usually in March or April. The festival has been held regularly since its inception in 2000. The 2015 show included 35 events, and attracted over 8000 people from around New Zealand and overseas.\nFashion Week includes a series of events around Dunedin and its Otago environs, such as tours, talks, and exhibitions, and features two major award shows. The first of these is the iD International Emerging Designer Awards, held in conjunction with Otago Polytechnic, which is a one-night show held at Dunedin Town Hall. Entry is restricted to recent graduates or current final-year students in fashion related courses, and regularly attracts new designers from around the world.\nThe week culminates in the second major show, the iD Dunedin Fashion Show. This two-night show takes place at Dunedin Railway Station, and the main platform is turned into one of the world's longest catwalks, a little over in length. The show is restricted to current commercial designers, and includes international guest designer selections - including major names, although its primary focus is on local competitive entries.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128419","title":"AudioComics Company","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48128442","title":"Osaka Tōin Junior and Senior High School","body":"\nOsaka Tōin Junior and Senior High School\n\n is a private co-educational junior and senior high school located in Daitō City, Osaka Prefecture, Japan. The high school was founded in 1983 by Osaka Sangyo University.\nHistory.\nOsaka Tōin Senior High School was founded as the Daitō campus of Osaka Sangyo University Senior High School in 1983, during a period of rapid increase in the number of high school students in Japan. The school commenced with 150 students enrolled in two streams; a regular course and dedicated physical education course. The school became independent from Osaka Sangyo University Senior High School in 1988 and an integrated junior high school was opened in 1995.\nClub activities.\nBaseball.\nThe school's baseball club was formed in 1988. In 1991, only the club's fourth year of existence, Osaka Tōin participated in the spring invitational tournament for the first time. The school advanced to the quarter finals, with the highlight of the tournament being ace Yukihiko Wada pitching a no-hit, shutout in the first round match against Sendai Ikuei High School. In the same year, the school won the \"Summer Koshien\" national championships, defeating Okinawa Fisheries High School 13-8 in the final. Osaka Tōin was the 14th school to win the chamionship in their first year of qualifying for the tournament. 
Wada and future Yomiuri Giants member Yoshihiro Seo pitched in the championship match against Okinawa Fisheries ace Rin Ōno; fellow future Yomiuri Giant Makoto Hagiwara hit the only home run of the match.\nThe school won its second national championship in 2008, defeating Shizuoka Prefecture's Tokoha Kikukgawa Senior High School 17-0 in the final.\nIn 2012, Osaka Tōin became the seventh school in history to win the spring invitational and summer national tournaments in the same year, defeating Aomori Prefecture's Kōsei Gakuin in the final of both tournaments. It was the first time that two schools met in the final of both tournaments in the same year. Future Hanshin Tigers ace Shintaro Fujinami was the star of the tournament, pitching shutouts in both the semi-final and final. In the autumn of 2012, Osaka Tōin was joint-champion of the National Sports Festival along with Sendai Ikuei, becoming the third school in history to win the \"triple crown\" in one year. Lost time due to rain earlier in the tournament forced tournament organizers to announce that the winners of the two semi-finals would be named joint champions.\nAt the 2014 summer tournament, the school won for the fourth time, defeating Mie High School 4-3 in the final.\nFormer members of the Osaka Toin baseball team have played for eleven of the twelve Japanese professional baseball teams (see list of alumni below). Sho Nakata and Tsuyoshi Nishioka have played on the Japan national team and Nishioka spent two seasons with the Minnesota Twins of the MLB.\nBrass band.\nThe brass band club was formed in 2005 and in the same year took the gold prize at the Kansai Brass Band Contest. In 2006 and 2007, the band represented the Kansai region in the high school division of the All-Japan Band Competition, taking the silver award on both occasions. In 2008 the band did not qualify for the national competition, but returned in 2009 and won their first gold award. 
The band continued this success with consecutive wins at the 2010 and 2011 competitions. In 2008 the band also won silver in its first appearance at the All Japan Marching Contest. It followed this with by winning gold at the 2009 and 2010 events. As a result of this success, the band receives many requests for public performances and is well known throughout Japan despite its short history.\nSoccer.\nThe school's soccer club was founded in 2005. It qualified for the soccer tournament of the national high school sports championships in 2007 and reached the quarter finals of the same tournament in 2008. The club also qualified for the 2008 All Japan High School Soccer Tournament and advanced to the second round.\nThe girls' soccer club was formed in 2006. It has qualified for the national championships several times since its first appearance in 2007; in 2011 the club finished runners-up, losing to Tokiwagi Gakuen High School 1–3 in the final.\nRugby.\nThe school rugby club was formed in 1988. In 1995, it qualified for the National High School Rugby Tournament for the first time. In 2013 the club won the 14th Spring Invitational Tournament, its first championship win at the national level, defeating Tokai University Gyosei High School 33-14 in the final. In 2015 the club were runners-up in the spring invitational tournament, this time losing to Tokai Gyosei 0–21 in the final.\nGolf.\nIn 1999 the boys' golf team won the 20th annual All Japan High School Golf Tournament.\nBasketball.\nThe boys' and girls' basketball teams each made their first appearance at the summer All Japan High School Basketball Tournament in 2014, with the boys' team advancing to the second round and the girls' team advancing to the third round. The girls' team also qualified for the \"Winter Cup\" tournament for the first time in 2014.\nTrack and field.\nThe track and field club was formed in 2011 as the \"ekiden\" club. 
The club changed its name to the track and field club in the following year. In November 2013 the club won the Osaka Prefecture ekiden qualification race and finished 22nd in the national championship in the following month.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128445","title":"Clube Náutico da Beira","body":"\nClube Náutico da Beira\n\nClube Náutico da Beira is a club located in Beira, Mozambique which features a restaurant, tennis court, pool, water-sports, and a boat warehouse.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128462","title":"Wildflower (Hank Crawford album)","body":"\nWildflower (Hank Crawford album)\n\nWildflower is the fourteenth album led by saxophonist Hank Crawford and his third released on the Kudu label in 1973.\nReception.\nAllMusic awarded the album 4 stars stating \"\"Wildflower\" is indispensable as a shining example of '70s groove jazz at its best\".\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128468","title":"Juan Antonio Suanzes","body":"\nJuan Antonio Suanzes\n\nJuan Antonio Suanzes Fernández (20 May 1891 – 6 December 1977) was a Spanish naval engineer. Before the Spanish Civil War (1936–39) he directed a shipyard. During the civil war he offered his services to the Nationalist side, and was made Minister of Industry and Commerce from 1938 to 1939. He was again Minister of Industry and Commerce from 1945 to 1951.\nEarly years (1891–1936).\nJuan Antonio Suanzes Fernández was born in Ferrol, Coruña, on 20 May 1891.\nHe was the oldest of six children in a family with naval traditions.\nHis father, Saturnino Sunazes Carpegna, belonged to the General Corps of the navy.\nHe attended a religious school for his early education.\nAt the age of 12 he entered the naval school in Ferrol.\nHe was promoted to midshipman (1906), frigate ensign (1908) and navy Ensign (1909).\nAt times he was assigned to ships such as the \"Numancia\", \"Pelayo\", \"Carlos V\" and \"Reina Regente\".\nIn 1913 he was appointed as a lieutenant to the battleship \"España\".\nIn 1915 Suanzes began to study naval engineering in Ferrol.\nIn 1917 he was a captain of naval engineers, and a teacher at the Naval Military School of San Fernando in Cadiz.\nIn 1920 he was named director of the Cartagena shipyard of the \"Sociedad Española de Construcción Naval\" (SECN, Spanish Society of Naval Construction).\nHe was appointed commander of engineers in 1921.\nIn 1922 he was made a supernumerary of the navy so he could devote himself to his work for the private company.\nHe was in charge of the SECN shipyard at Cartagena until 1926, then was transferred to run the shipyard in Ferrol. In January 1932 he moved to Madrid with his family.\nIn Madrid he was Inspector General of Construction for the company. 
A profound patriot, he became increasingly disturbed at the British ownership position in the SECN, which he felt was trying to prevent it from evolving into an independent Spanish operation.\nIn 1934 Suanzes left the SECN due to what he called the \"intolerable interference of the English\", referring to Vickers, one of the SECN proprietors.\nHe created a small company named \"Estudios, Proyectos y Reparaciones\" (EPYR), then obtained the position of Director General of Boetticher y Navarro, S.A. (BYNSA).\nCivil War (1936–39).\nAt the start of the Spanish Civil War (1936–39) BYNSA was taken over by the Ministry of Defense. In late October 1936 Suanzes took refuge in the Polish embassy. \nHe left there in March 1937 and traveled via Valencia, Marseille and San Sebastián to Salamanca, where he placed himself at the disposal of General Francisco Franco.\nSuanzes was named colonel of naval engineers in charge of salvage.\nIn June 1937 he was in Rome, where he asked Admiral Odoardo Somigli to help refurbish the Spanish naval vessels.\nHis request was refused at first, but Benito Mussolini intervened and Suanzes was able to get a series of ships overhauled and rearmed by the Italians.\nFranco appointed him Minister of Industry and Commerce on 31 January 1938.\nThe ministry was based in Bilbao, and the main task was recovery of industries in the areas that were coming under the control of Franco's forces.\nOn 9 August 1939 he was replaced in a cabinet reshuffle by Luis Alarcón de Lastra.\nLater career (1939–77).\nThe law of 1 September 1939 created the Office of Construction and of Naval Military Industries in the Ministry of the Navy. On 23 September 1939 Suanzes was made head of this organization, and became a member of the National Defense Council. His goal was to end existing contracts with the navy and start a new organization responsible for naval military construction. The Minister of the Navy, Salvador Moreno, delayed all his projects. 
He resigned in July 1941.\nThe \"Instituto Nacional de Industria\" (INI, National Institute of Industry) was created on 25 September 1941, and on 17 October 1941 Suanzes was named president of the institute.\nSuanzes was appointed Minister of Industry and Commerce on 20 July 1945, while remaining president of the INI.\nHe held office as Minister until 19 July 1951, when he was replaced in a cabinet shuffle by Joaquín Planell Riera (Industry) and Manuel Arburúa de la Miyar (Commerce).\nHe remained president of the INI until 1963, when Franco accepted his resignation.\nAlthough working in the INI, Suanzes remained a naval officer and became a Brigadier General in 1950.\nIn 1940 he became a member of the \"Consejo Superior de Investigaciones Científicas\" (CSIC, High Council for Scientific Research). \nHe became a member of the board of \"Juan de la Cierva\", and was named president of this company in 1942, holding that position for over twenty years.\nIn 1956 he was appointed the first president of the \"Escuela de Organización Industrial\" (EOI, School of Industrial Organization), holding office until 1963.\nIn 1956 he was appointed first president of the Spanish National Committee of the World Energy Conference, a position he held for the remainder of his life.\nIn 1960 Franco granted Suanzes and his heirs the title of \"Marqués de Suances\".\nIn 1963 he resigned from the INI and withdrew from all public activity.\nHe died in Madrid on 6 December 1977 at the age of 86.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128518","title":"1938 U.S. National Championships – Women's Singles","body":"\n1938 U.S. National Championships – Women's Singles\n\nSecond-seeded Alice Marble defeated Nancye Wynne 6–0, 6–3 in the final to win the Women's Singles tennis title at the 1938 U.S. National Championships.\nSeeds.\nThe tournament used two lists of eight players for seeding the women's singles event; one for U.S. players and one for foreign players. Alice Marble is the champion; others show in brackets the round in which they were eliminated.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128534","title":"Chilla Bulbeck","body":"\nChilla Bulbeck\n\nMargaret Chilla Bulbeck (born 1951) was the emeritus professor of women's studies at Adelaide University from 1997 until 2008, and has published widely on issues of gender and difference.\nEducation.\nBulbeck gained a degree in economics from the University of Adelaide (1972), a master of arts (1975) and a Ph.D. in Sociology (1980) from the Australian National University, and an LL.B. from the University of Queensland (1991).\nPolitical career.\nAfter retiring from academic life, Bulbeck entered politics as a full-time volunteer for The Greens (WA), becoming their Secretary and co-editor of their newsletter. She also ran, unsuccessfully in the Western Australian state election, 2013 for the district of Mandurah.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128542","title":"List of 2004 box office number-one films in Mexico","body":"\nList of 2004 box office number-one films in Mexico\n\nThis is a list of films which placed number one at the weekend box office for the year 2004.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128552","title":"Suanzes","body":"\nSuanzes\n\nSuanzes may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128553","title":"Bruce Judson","body":"\nBruce Judson\n\nBruce Judson (born 1958 in New York City) is an American author, media innovator, and public policy analyst.\nEducation.\nJudson received his Bachelor’s degree from Dartmouth College, in Policy Studies in 1980, where he studied with the environmentalist Donella Meadows. In 1984, he received his Juris Doctor from the Yale Law School and his MBA from the Yale School of Management. At the Yale Law School, he was the co-founder and Editor-in-Chief of the \"Yale Journal on Regulation\" and a Senior Editor of the \"Yale Law Journal\".\nCareer.\nJudson started his career as a consultant and founding member of the New York office of the Boston Consulting Group. In 1989, Judson joined Time Inc. Magazines, where he was appointed the Company’s first corporate Director of Marketing. After the merger of Time Inc. and Warner Communications led to the creation of Time Warner Inc., Judson’s corporate marketing department served as the focal point for Time Warner’s initiative to provide advertisers with advertising programs, involving entities throughout the media conglomerate.\nLater, with the creation of Time Inc. New Media, Judson was appointed General Manager, where he was one of the co-founders of the Pathfinder (website). Walter Isaacson, then President of Time Inc. New Media, and the subsequent biographer of Steve Jobs, credits Judson with inventing the concept of the Web banner ad, which established the standardized system that enabled the rapid growth of Internet advertising.\nWhile working at Time Inc. New Media, Judson wrote \"NetMarketing\", which became a nationwide bestseller, and was excerpted in \"Advertising Age\". He was named by \"Advertising Age\" as one of the nation’s \"Cybermarketing Leaders.\" Judson’s activities at Time Inc. 
New Media are described in Michael Wolff’s bestselling book, \"Burn Rate.\"\nAfter leaving Time Inc., Judson accepted an appointment at the Yale School of Management as a Faculty Fellow, and was later promoted to Senior Faculty Fellow. At Yale, he developed and taught a clinical course offering free consulting to small businesses. Judson also served as one of the founding faculty members of the Yale Publishing Course, and as the first entrepreneur-in-residence at the Yale Entrepreneurial Institute.\nIn 1999, Scribner published, \"HyperWars\" which Judson co-authored. The book asserted that significant changes in corporate strategies would be required for success in the coming Internet era. \"HyperWars\" was selected by Soundview Executive Book Summaries as one of the best business books published in the year of its release.\nIn 2004, HarperBusiness published Judson’s book, \"Go it Alone!\" which argued that the combination of software-as-a-service, automation, and outsourcing, enabled by the Internet would fundamentally alter the nature of entrepreneurship and small business success. In the book, Judson also asserted that as a result of automated leverage created by the Internet, small groups of people or individuals, working on their own, would be able to build high revenue businesses. The book was recognized by \"Library Journal\" as one of the best business books published in the year of its release, while Judson’s ideas on the future of entrepreneurship were the subject of dedicated interviews in business publications, such as \"The Wall Street Journal\"and \"Entrepreneur\" magazine.\nJudson later partnered with HarperBusiness, to test the value of making the full text of \"Go It Alone!\" available free online, with advertising support. 
This first-of-its-kind effort in book publishing was featured in a \"US News and World Report\" cover story.\nIn 2012, the continuing significance of the ideas in \"Go It Alone\" was recognized by \"Entrepreneur\" magazine, which dedicated a feature story to the book, and its continuing popularity, at a time when the \"half-life of business books\" is short, while the website LifeHack recommended the book, twelve years after its initial publication, in a May 2016 article.\nWhile involved at Yale and writing books, Judson was also active in developing independent businesses, including Web-Clipping (co-founder), (an early online news clipping service for businesses), the business broadband marketplace Speed Anywhere., and a mobile Web site development firm.\nJudson's book, \"It Could Happen Here\", was published in 2009 by HarperCollins. The book argued that growing and extreme economic inequality in the United States was a societal danger. Judson worked with historical and social science research to construct a model which indicated that highly unequal societies are characterized by political polarization, anger, lack of trust, political paralysis, a collapsing middle class and potentially political instability. The book appeared two years before Occupy Wall Street led economic inequality to be considered a mainstream political issue, and at the time the significance of growing economic inequality was often disregarded or seen as unlikely to continue.\nJudson was subsequently appointed a Braintruster at the Roosevelt Institute, where he launched a column titled \"Restoring Capitalism\" for the Institute’s website. Articles from the column were syndicated in online media including \"The Business Insider\" and \"The Huffington Post\".\nAs of December 2015, Judson is a Senior Adviser to Tern Plc.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128557","title":"Haxhi Ymer Kashari","body":"\nHaxhi Ymer Kashari\n\nHaxhi Ymer Kashari known also as Ymer Mustafa Kashari was an Albanian poet of the Bejtexhinj movement of the 18th century.\nHaxhi Ymer was born in Tirana in early 18th century. Back then part of the Sanjak of Scutari of the Ottoman Empire, Tirana was already flourishing as an oriental-style town. Haxhi Ymer was a sheikh (Sufi leader) of the Qadiri order of Sufism, a less spread order going towards extinction in Albania. Most of his work is lost because of earlier lack of interest in him. His name Haxhi indicates that he had completed his hajj in Mecca. He used the pen name Suzi. The outer facade of the portal of Et'hem Bey Mosque in Tirana has an inscription written by him with his pen-name as signature.\nHaxhi Ymer was a \"bejte\" poet who wrote in two languages: Albanian and Turkish. From a few odes that are saved to date, one is of special interest. It is named \"Alif\" and it is one of a kind due to the specific structure it introduced to Albanian poetry of those times. The poem is based on the letters of the Arabic alphabet and thus has 28 verses, each verse starts with a unique letter in alphabetic order. The first starts with \"alif\" and the last with \"yā’\". This type of verse introduced by Haxhi Ymer became a tradition in Albanian poetry and had many followers.\nThough heavily laden with Oriental vocabulary, his work has linguistic significance due to the specific Tirana area Gheg dialect of the Albanian language (part of the Central Gheg branch), being the oldest written piece in this dialect.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128569","title":"Joe Chenelly","body":"\nJoe Chenelly\n\nJoseph Randy \"Joe\" Chenelly (born October 2, 1976) is an American journalist and political adviser. He is now directing the \"Warriors for Webb\" grassroots movement of the Jim Webb campaign for U.S. president. He is also assistant national director of communications for Disabled American Veterans.\nChenelly covers military and veterans matters, on staff with the Military Times newspapers and Gannet News, reporting on operations in the Middle East, Southwest Asia, Africa, as well as disaster relief in Louisiana, Mississippi and Texas in the aftermath of Hurricane Katrina.\nChenelly was named one of the 100 \"most influential journalists covering armed violence\". He was the first U.S. Marine combat correspondent to step into enemy territory after September 11, 2001, documenting American military action and providing it for broadcast throughout the international media.\nChenelly was the first military reporter in Pakistan and Afghanistan after the terrorist attacks in the United States. He also reported from the frontlines with American and allied forces in Kuwait and Iraq as that war began in 2003. Chenelly was on the ground for the start of both Operation Enduring Freedom and Operation Iraqi Freedom. After returning to Washington to cover the wars from the policy aspect, he headed back to field reporting, corresponding live from the Louisiana Superdome and flooded streets of New Orleans as a civilian reporter in the immediate aftermath of Hurricane Katrina.\nAs part of the first conventional U.S. ground force to enter Afghanistan, he was the first to provide combat footage of Operation Enduring Freedom,[2] the first to report from inside a coalition detention facility in Afghanistan[2], the first to report an Iraqi man had given American forces information about where U.S. Army prisoner of war Pfc. 
Jessica Lynch was being held, the first to report that the other American prisoners of war had been rescued, and he was the first to report FEMA and the National Guard had pulled out of the Louisiana Superdome in New Orleans following Hurricane Katrina.\nChenelly is now assistant national director of communications for the Disabled American Veterans (DAV) in Washington, D.C. On November 6, 2012, he was elected to a four-year term on the Calvert County Board of Education (District 1).\nChenelly was named Calvert County (MD) Man of the Year by the county's Republican Central Committee in May 2013.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128615","title":"Germania Flugzeugwerke","body":"\nGermania Flugzeugwerke\n\nGermania Flugzeugwerke GmbH was a German aircraft manufacturer during World War I. The company was established in 1914 at Leipzig. During 1915 and 1916, the company produced license built Rumpler C.I reconnaissance biplanes for the Luftstreitkräfte at Leipzig-Mockau Airport. The company also repaired other types of aircraft and maintained their own flight school to train pilots. The following types of 1919 were not yet reichsluftamt with an approval for the civil aviation: DFW C V, Ru. C I a, Germ. C IV. There were 17 aircraft of the Germania Reichsluftamt aircraft works when approved.\nThe company was liquidated in 1922 after the Treaty of Versailles.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128616","title":"Pedomicrobium manganicum","body":"\nPedomicrobium manganicum\n\nPedomicrobium manganicum is a bacterium from the genus of Pedomicrobium which was isolated from quartzite rock pool in France. \"Pedomicrobium manganicum\" has the ability to bind MnO2\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128626","title":"Pennsylvania School of Horticulture for Women","body":""}
{"url":"https://en.wikipedia.org/wiki?curid=48128644","title":"Victoria Angelova","body":"\nVictoria Angelova\n\nVictoria Angelova Vinarova (sometimes written Viktoria Angelova, , 1902–1947) was the first female architect of Bulgaria. She is credited with having built the first modern, national art gallery in the Balkans.\nBiography.\nVictoria Angelova was born on 20 November 1902 in Veliko Tarnovo, Bulgaria to Vasil Angelov, a merchant who had been educated in England. He named his daughter after Queen Victoria in homage. She graduated from the Vienna University of Technology and the Dresden Polytechnic. At the age of 24, she returned to Sofia and was working as an intern at the Ministry of Public Works when she won a contest for her first major commission. In 1933, Angelova married a fellow architect, Boris Vinarov and they set up a practice in Sofia. \nAngelova worked during a period when most public projects were awarded after competitions which were open nationally. She designed buildings throughout the country, but is primarily known for those in Sofia. She was awarded the Order of Civil Merit for her architectural contributions to the country. In 1944, the couple's home was bombed and they lost many of their personal effects, including their architectural drawings. They evacuated to Turnovo, where Angelova became ill with a severe case of pneumonia. Believing she had recovered, they returned to Sophia in 1946, but Angelova relapsed and died on 27 December 1947. Her husband died three months later.\nSelected projects.\nMinistry of Public Buildings, Roads and Public Works.\n The ministry held a contest in 1926 for designs of a new office building for the Ministry of Public Buildings, Roads and Public Works. Although Angelova won the contest, she was required to have the experienced architects and Yordan Yordanov () oversee her work. 
The building covered an entire city block known as \"Slaveykov Square\" and was bounded by \"GS Rakovski\", \"William Gladstone\" and \"Han Krum \" streets. Construction began in 1928 and was completed four years later.\nThe design was Neoclassical and featured towering marble columns and mosaic floor tiles. Flanking the entrance were two statues, one female figure representing architecture and one male figure representing construction, as well as three stone heads in altorilievo adorning the doorways. The sculptures were completed by Mikhail Ivanov, Stephen Peychev and . The wide corridors and high ceilings are offset by stained glass designed by and made in Munich by F. Seiler. Today it houses the Metropolitan Library and the \"Renaissance Theater\" on one side and several doctors' and dentists' offices on the other.\nNational Art Gallery.\nFrom 1934 to 1941, Angelova worked on the National Art Gallery. The building was completed in 1942 and opened featuring a first floor which housed Renaissance paintings by Stanislav Dospevski, Nikolai Pavlovich, Hristo Tsokev, Zahari Zograf, as well as handcrafts from regions noted for folk artworks, such as Tryavna, Samokov and others. The second floor focused on contemporary Bulgarian art featuring painters and sculptors from the early 20th century. When completed, the building was recognized as the first modern, national art gallery in the Balkans. It was bombed in 1944 and completely destroyed, along with its contents, which included the complete works of leading Bulgarian sculptor \nSea Casino of Burgas.\n In 1936, Atanas Sirekov, the mayor of Burgas, initiated a design contest for a casino on Burgas Bay. Seventeen architects competed and Angelova won with a design she called \"333\". The building required a complex design due to the steep slope of the site and its panoramic view of the entire gulf area. 
Completed in 1938, the inauguration was attended by dignitaries from throughout the country, who received a special travel discount of 70% off the price of train tickets to attend. The building was abandoned in the late 1990s, but after almost 20 years of neglect, was restored and opened as a cultural center in 2011. The renovation project won the “Building of the Year” award for 2011.\nRaduntsi Lung Hospital.\nIn 1937 after a lengthy study had taken place, an act was passed for the construction of a tubercular sanatorium in the village of . The Pulmonary Hospital was to be the largest facility of its kind in the Balkans and located 650 meters above sea level. Angelova won the contract for the construction of the hospital and building was to begin shortly before World War II started. Ground was broken in 1939, but in 1940 after four stories were built, further construction was suspended until after the war ended. Construction resumed on 9 September 1944 but was not completed until 1955, nearly a decade after Angelova's death. The first patients were received at the hospital on 1 November 1955. Financial problems which began in 2013, forced the closure of the hospital in 2015.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128666","title":"Pack Up Your Troubles (1939 film)","body":"\nPack Up Your Troubles (1939 film)\n\nPack Up Your Troubles is a 1939 American comedy film directed by H. Bruce Humberstone and written by Lou Breslow and Owen Francis. The film stars Jane Withers, The Ritz Brothers, Lynn Bari, Joseph Schildkraut, Stanley Fields, Fritz Leiber and Lionel Royce. The film was released on October 20, 1939, by 20th Century Fox.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128692","title":"Chari Budruk","body":"\nChari Budruk\n\nChari Budruk is a village in the Palghar district of Maharashtra, India. It is located in the Vikramgad taluka.\nDemographics.\nAccording to the 2011 census of India, Chari Budruk has 87 households. The effective literacy rate (i.e. the literacy rate of population excluding children aged 6 and below) is 63.74%.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128695","title":"Satkor","body":"\nSatkor\n\nSatkor is a village in the Palghar district of Maharashtra, India. It is located in the Vikramgad taluka.\nDemographics.\nAccording to the 2011 census of India, Satkor has 278 households. The effective literacy rate (i.e. the literacy rate of population excluding children aged 6 and below) is 69.88%.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128700","title":"Dolhari Khurd","body":"\nDolhari Khurd\n\nDolhari Khurd is a village in the Palghar district of Maharashtra, India. It is located in the Vikramgad taluka.\nDemographics.\nAccording to the 2011 census of India, Dolhari Khurd has 449 households. The effective literacy rate (i.e. the literacy rate of population excluding children aged 6 and below) is 60.55%.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128705","title":"Apti Budruk","body":"\nApti Budruk\n\nApti Budruk is a village in the Palghar district of Maharashtra, India. It is located in the Vikramgad taluka.\nDemographics.\nAccording to the 2011 census of India, Apti Budruk has 249 households. The effective literacy rate (i.e. the literacy rate of population excluding children aged 6 and below) is 57.54%.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128712","title":"Uparale","body":"\nUparale\n\nUparale is a village in the Palghar district of Maharashtra, India. It is located in the Vikramgad taluka.\nDemographics.\nAccording to the 2011 census of India, Uparale has 273 households. The effective literacy rate (i.e. the literacy rate of population excluding children aged 6 and below) is 60.2%.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128717","title":"Sawade","body":"\nSawade\n\nSawade is a village in the Palghar district of Maharashtra, India. It is located in the Vikramgad taluka.\nDemographics.\nAccording to the 2011 census of India, Sawade has 556 households. The effective literacy rate (i.e. the literacy rate of population excluding children aged 6 and below) is 57.63%.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128719","title":"Gadadhe","body":"\nGadadhe\n\nGadadhe is a village in the Palghar district of Maharashtra, India. It is located in the Vikramgad taluka.\nDemographics.\nAccording to the 2011 census of India, Gadadhe has 172 households. The effective literacy rate (i.e. the literacy rate of population excluding children aged 6 and below) is 60.48%.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128723","title":"Nagzari, Vikramgad","body":"\nNagzari, Vikramgad\n\nNagzari is a village in the Palghar district of Maharashtra, India. It is located in the Vikramgad taluka.\nDemographics.\nAccording to the 2011 census of India, Nagzari has 40 households. The effective literacy rate (i.e. the literacy rate of population excluding children aged 6 and below) is 92.78%.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128726","title":"Yashwantnagar","body":"\nYashwantnagar\n\nYashwantnagar is a village in the Palghar district of Maharashtra, India. It is located in the Vikramgad taluka.\nDemographics.\nAccording to the 2011 census of India, Yashwantnagar has 375 households. The effective literacy rate (i.e. the literacy rate of population excluding children aged 6 and below) is 76.36%.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128732","title":"Octav Dessila","body":"\nOctav Dessila\n\nOctav Dessila (December 4, 1895–July 29, 1976) was a Romanian novelist and playwright.\nBorn in Bucharest, his parents were Iorgu Dessila, a \"Căile Ferate Române\" employee, and his wife Aristița (\"née\" Gheorghiu). He was part of the first class to graduate from the military high school at Dealu Monastery, and became an officer in the Romanian Land Forces. His first novel was \"Dragomir Valahul\" (1927), followed by \"Zvetlana\" (1930), \"București, orașul prăbușirilor\" (1930), \"Neastâmpăr\" (1934), \"Turbă\" (1936), \"Cartea cu minciuni\" (1936), \"Două chemări\" (vol. I-II, 1936), \"Iubim\" (vol. I-III, 1941-1943) and \"Porți fără număr\" (vol. I-II, 1946). He also wrote plays: \"Un om care dă palme vieții\" (1938) and \"Mihai Viteazul\" (1967). He belonged to the Romanian Writers' Society from 1931 to 1948, winning its prize in 1935; he was also a member of the Romanian Writers' Union from 1967. In 1937, he won the Romanian Academy's I. Al. Brătescu-Voinești prize. \"Iubim\" was the last in a string of commercial successes; revised and republished in 1970, it did not even attract attention from readers of its genre, suggesting the obsolete nature of Dessila's literary output.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128742","title":"Corky Tharp","body":"\nCorky Tharp\n\nThomas Allen \"Corky\" Tharp (April 19, 1931 – April 3, 2003) was an American football defensive back who played one season for the New York Titans of the American Football League. He played college football at the University of Alabama for the Alabama Crimson Tide football team.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128764","title":"David Gailey","body":"\nDavid Gailey\n\nDavid Gailey (1807 - 1881) was one of a number of Enrolled Pensioner Guards (EPGs) who came to the Swan River Colony between 1850 and 1868. Their role was to guard and oversee the work of the prisoners transported to Western Australia.\nIn common with many of the Enrolled Pensioner Guards, Gailey was Irish and Catholic. He was born in Old Ross County in Watford in 1807. In December 1825, at the age of 18 years, he enlisted in the British Army, serving as a private in the 18th Regiment. He served for 20 years and was discharged in September 1846. He was 39 years of age. His record indicates his character was \"extremely good\" and he was awarded three good conduct badges. He was described as in height, with a fair complexion, grey eyes and hair dark. He married Margaret Hannen and in 1849 they had a son named John.\nIn 1851 Gailey and his family travelled with a number of other Pensioner Guards to the settlement of Toodyay, where they were temporarily housed in A-framed straw huts and allotted plots of land. These allotments were later transferred to the permanent Convict Hiring Depot, upstream of the town. Thirteen allotments, S1 to S13, were marked out, and from 1852 to 1856 two-roomed brick cottages were erected. The Gaileys, whose family had increased with the birth of two daughters, Anna in 1851 and Ellen in 1856, were allocated one of the first three cottages to be completed. The Depot became known as the Pensioner Village. Canon Raffaele Martelli, who had been appointed in 1855 by Bishop Salvado to look after Toodyay’s Catholic community, occupied one of the cottages for a short time.\nWhen more Pensioner Guard families arrived at the Depot, Martelli had to vacate the cottage and return to the townsite, where he was offered Gailey’s straw hut as temporary quarters. 
Martelli kept regular correspondence with Salvado and in one letter he thanks the bishop for sending a jar of butter that he wanted to give to Gailey. Martelli’s correspondence reveals a high regard for Gailey. \nIn 1858, Gailey and many other Enrolled Pensioner Guards in the colony contributed to the Indian Relief Fund that had been set up in England following the Indian Mutiny of 1857. Many of the EPGs had served in India with the British Army before their retirement. The mutiny led to the ending of the East India Company in 1858, and the establishment of the British Raj.\nIn 1860 the new town of Newcastle, located around the Convict Hiring Depot, had been surveyed. Gailey was allocated Lot S7 of , and purchased Lot 17 consisting of . This lot was located across the road from what became the Sisters of Mercy Convent, and at the southern end of Lot 17, the Roman Catholic St John the Baptist church was erected in 1863. Possibly around the same time a Catholic Presbytery was built across the road from the church on Lot S19.\nDuring the 1860s Gailey employed four ticket-of-leave men, conducted a small school, and worked as a bootmaker. He offered to take in the Quinlan children, Timothy (born February 1861) and his sister Mary when their mother died while giving birth to twins. Their father was up north with a government party at the time. When their father also died the children were placed with Joseph Thomas Reilly, a prominent Catholic newspaperman and active citizen, who raised them with his own children. Timothy Quinlan went on to become a prominent politician and husband to Daniel Connor's daughter Teresa.\nGailey continued to be a resident in Toodyay, dying on 18 April 1881.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128767","title":"Arif Hajili","body":"\nArif Hajili\n\nArif Hajili () (born January 22, 1962), is a prominent Azerbaijani politician and leader of Equality Party \"(Müsavat)\", the largest opposition party in Azerbaijan.\nBiography.\nArif Hajili was born in 1962 in the Yukhari Tala village of Zagatala region. He graduated the Journalism Faculty of Baku State University. He worked as an editor at Zagatala radio station in 1983-1988. He was one of the leaders of the independence movement of Azerbaijan. Was a member of the Supreme Council of Azerbaijan in 1990-1995. Was a member of the Parliament of Azerbaijan. He was a Chairman of the Supreme Body of the PFA in 1991-1992. At various times he was a Deputy Head of the \"Musavat\" party on organizational matters. He worked as a State Advisor for the territorial government and the control of Azerbaijan during the reign of Elchibey in 1992-1993. Was arrested a number of times during the rule of Aliyevs. A former prisoner conscience. He has been the head of the Executive Office of \"Musavat\" party, a member of its supreme body - Divan. since 2006. He was elected Head of the party at the VIII Congress in 2014.\nCurrently a chairman of the Musavat Party.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128774","title":"Udland Church","body":"\nUdland Church\n\n \nUdland Church () is a parish church in Haugesund municipality in Rogaland county, Norway. It is located in the town of Haugesund. The church is part of the Skåre parish in the Haugaland deanery in the Diocese of Stavanger. The stone/brick church was built in 2002 by the architect Thomas Brekke. The church seats about 450 people.\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128789","title":"Alfia","body":"\nAlfia\n\nAlfia may refer to:\n\n"}
{"url":"https://en.wikipedia.org/wiki?curid=48128792","title":"Great Smoky Mountains Study","body":"\nGreat Smoky Mountains Study\n\nThe Great Smoky Mountains Study is a longitudinal study led by William Copeland (professor) from Duke University Medical Center that started in 1993 and ended in 2003. It followed 1,420 children from western North Carolina. Participants were interviewed at up to nine points in time - first aged 9 to 16, and again at ages 19–21.\nDuring the study, about one quarter of the families saw a dramatic and unexpected increase in income. The study showed that among these children, instances of behavioral and emotional disorders decreased, and conscientiousness and agreeableness increased. Randall Akee remarked that \"It would be almost impossible to replicate this kind of longitudinal study”.\n\n"}


================================================
FILE: bitpacker/Cargo.toml
================================================
[package]
name = "tantivy-bitpacker"
version = "0.9.0"
edition = "2024"
authors = ["Paul Masurel <paul.masurel@gmail.com>"]
license = "MIT"
categories = []
description = """Tantivy-sub crate: bitpacking"""
repository = "https://github.com/quickwit-oss/tantivy"
keywords = []
documentation = "https://docs.rs/tantivy-bitpacker/latest/tantivy_bitpacker"
homepage = "https://github.com/quickwit-oss/tantivy"


# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html

[dependencies]
bitpacking = { version = "0.9.2", default-features = false, features = ["bitpacker1x"] }

[dev-dependencies]
rand = "0.9"
proptest = "1"


================================================
FILE: bitpacker/benches/bench.rs
================================================
#![feature(test)]

extern crate test;

#[cfg(test)]
mod tests {
    use rand::rng;
    use rand::seq::IteratorRandom;
    use tantivy_bitpacker::{BitPacker, BitUnpacker, BlockedBitpacker};
    use test::Bencher;

    /// Builds a buffer holding `num_els` zero values bit-packed at `bit_width`
    /// bits each.
    ///
    /// The packer is flushed once, after the last value, so that consecutive
    /// values are contiguous at the bit level. This is the layout that
    /// `BitUnpacker::get` addresses (value `idx` starts `idx * bit_width` bits
    /// into the buffer).
    #[inline(never)]
    fn create_bitpacked_data(bit_width: u8, num_els: u32) -> Vec<u8> {
        let mut bitpacker = BitPacker::new();
        let mut buffer = Vec::new();
        for _ in 0..num_els {
            // the values do not matter.
            bitpacker.write(0u64, bit_width, &mut buffer).unwrap();
        }
        // Flushing inside the loop would pad every single value to a whole
        // byte, which is not a bit-packed layout.
        bitpacker.flush(&mut buffer).unwrap();
        buffer
    }

    /// Benchmarks random-access reads of 3-bit values through `BitUnpacker::get`.
    #[bench]
    fn bench_bitpacking_read(b: &mut Bencher) {
        let bit_width = 3;
        let num_els = 1_000_000u32;
        let bit_unpacker = BitUnpacker::new(bit_width);
        let data = create_bitpacked_data(bit_width, num_els);
        // A random selection of 100_000 indices taken from `0..num_els`.
        let idxs: Vec<u32> = (0..num_els).choose_multiple(&mut rng(), 100_000);
        b.iter(|| {
            // The sum is returned so that the reads have an observable result.
            idxs.iter().fold(0u64, |acc, &idx| {
                acc.wrapping_add(bit_unpacker.get(idx, &data[..]))
            })
        });
    }

    /// Benchmarks sequential reads of every value stored in a `BlockedBitpacker`.
    #[bench]
    fn bench_blockedbitp_read(b: &mut Bencher) {
        let mut packer = BlockedBitpacker::new();
        // Store the squares 0, 1, 4, ..., 21500^2.
        (0..=21500).for_each(|val| {
            packer.add(val * val);
        });
        b.iter(|| {
            // The sum is returned so that the reads have an observable result.
            (0..=21500).fold(0u64, |acc, idx| acc.wrapping_add(packer.get(idx)))
        });
    }

    /// Benchmarks filling a fresh `BlockedBitpacker` with 21501 squares.
    #[bench]
    fn bench_blockedbitp_create(b: &mut Bencher) {
        b.iter(|| {
            let mut packer = BlockedBitpacker::new();
            (0..=21500).for_each(|val| {
                packer.add(val * val);
            });
            // Returned so that building the packer has an observable result.
            packer
        });
    }
}


================================================
FILE: bitpacker/src/bitpacker.rs
================================================
use std::io;
use std::ops::{Range, RangeInclusive};

use bitpacking::{BitPacker as ExternalBitPackerTrait, BitPacker1x};

/// Streaming writer that packs integers, lowest bit first, into a
/// little-endian byte stream.
///
/// Bits are accumulated in a 64-bit scratch word, which is written to the
/// output each time it fills up.
pub struct BitPacker {
    /// Bits accepted by `write` that have not reached the output yet.
    mini_buffer: u64,
    /// Number of low bits of `mini_buffer` currently holding data.
    mini_buffer_written: usize,
}

impl Default for BitPacker {
    fn default() -> Self {
        Self::new()
    }
}

impl BitPacker {
    /// Creates a bit packer with an empty scratch word.
    pub fn new() -> BitPacker {
        BitPacker {
            mini_buffer: 0,
            mini_buffer_written: 0,
        }
    }

    /// Appends `val`, encoded on `num_bits` bits, to the stream.
    ///
    /// `val` is not masked here: the caller has to make sure it fits in
    /// `num_bits` bits. Complete 8-byte words are written to `output` as
    /// soon as they are available; the remaining bits stay buffered until
    /// `flush` or `close` is called.
    ///
    /// # Errors
    ///
    /// Returns any error reported by `output.write_all`.
    #[inline]
    pub fn write<TWrite: io::Write + ?Sized>(
        &mut self,
        val: u64,
        num_bits: u8,
        output: &mut TWrite,
    ) -> io::Result<()> {
        let pending = self.mini_buffer_written;
        let filled = pending + usize::from(num_bits);
        if filled <= 64 {
            // The value fits entirely in the scratch word.
            self.mini_buffer |= val << pending;
            self.mini_buffer_written = filled;
            if filled == 64 {
                // The word is exactly full: emit it and start a new one.
                output.write_all(&self.mini_buffer.to_le_bytes())?;
                self.mini_buffer = 0;
                self.mini_buffer_written = 0;
            }
            return Ok(());
        }
        // The value straddles two words: its low bits complete the current
        // word, its high bits start the next one.
        self.mini_buffer |= val.wrapping_shl(pending as u32);
        output.write_all(&self.mini_buffer.to_le_bytes())?;
        self.mini_buffer = val.wrapping_shr((64 - pending) as u32);
        self.mini_buffer_written = filled - 64;
        Ok(())
    }

    /// Writes the buffered bits, padded with zero bits up to the next byte
    /// boundary, and resets the scratch word. Does nothing if no bit is
    /// pending.
    ///
    /// # Errors
    ///
    /// Returns any error reported by `output.write_all`.
    pub fn flush<TWrite: io::Write + ?Sized>(&mut self, output: &mut TWrite) -> io::Result<()> {
        if self.mini_buffer_written == 0 {
            return Ok(());
        }
        let byte_len = self.mini_buffer_written.div_ceil(8);
        output.write_all(&self.mini_buffer.to_le_bytes()[..byte_len])?;
        self.mini_buffer = 0;
        self.mini_buffer_written = 0;
        Ok(())
    }

    /// Terminates the stream. This currently only flushes the pending bits.
    pub fn close<TWrite: io::Write + ?Sized>(&mut self, output: &mut TWrite) -> io::Result<()> {
        self.flush(output)
    }
}

/// Reader for values that were bit-packed with a single, fixed bit width.
#[derive(Debug, Default, Clone, Copy)]
pub struct BitUnpacker {
    /// Width, in bits, of every packed value.
    num_bits: usize,
    /// Mask that keeps the `num_bits` lowest bits of a `u64`.
    mask: u64,
}

impl BitUnpacker {
    /// Creates a bit unpacker that assumes the same bit width for all values.
    ///
    /// The bit unpacker works by doing an unaligned read of 8 bytes.
    /// For this reason, values of `num_bits` in `57..=63` are forbidden.
    /// A width of 64 is accepted.
    ///
    /// # Panics
    ///
    /// Panics if `num_bits` is greater than 56 and different from 64.
    pub fn new(num_bits: u8) -> BitUnpacker {
        assert!(num_bits <= 7 * 8 || num_bits == 64);
        let mask = match num_bits {
            // `1u64 << 64` would overflow, so the full mask is spelled out.
            64 => u64::MAX,
            width => (1u64 << width) - 1,
        };
        BitUnpacker {
            num_bits: num_bits.into(),
            mask,
        }
    }

    /// Returns the number of bits used by each packed value.
    pub fn bit_width(&self) -> u8 {
        // `new` receives the width as a `u8`, so this cast does not truncate
        // for unpackers built through it.
        self.num_bits as u8
    }

    /// Returns the value stored at position `idx` of the bit-packed `data`.
    ///
    /// Whenever 8 bytes are available at the byte offset of the value, it is
    /// extracted from a single little-endian `u64` load. Otherwise the read
    /// is delegated to `get_slow_path`, except for a bit width of 0, for
    /// which 0 is returned directly.
    #[inline]
    pub fn get(&self, idx: u32, data: &[u8]) -> u64 {
        let bit_pos = idx as usize * self.num_bits;
        let byte_pos = bit_pos >> 3;
        let shift = bit_pos & 7;
        if byte_pos + 8 <= data.len() {
            let word: [u8; 8] = (&data[byte_pos..byte_pos + 8]).try_into().unwrap();
            return (u64::from_le_bytes(word) >> shift) & self.mask;
        }
        if self.num_bits == 0 {
            return 0;
        }
        self.get_slow_path(byte_pos, shift as u32, data)
    }

    /// Reads a value for which fewer than 8 bytes remain in `data` after
    /// `addr`: the remaining bytes are copied into a zero-padded 8-byte
    /// buffer before being decoded.
    ///
    /// `addr` is the byte offset of the value and `bit_shift` its bit offset
    /// within that byte.
    #[inline(never)]
    fn get_slow_path(&self, addr: usize, bit_shift: u32, data: &[u8]) -> u64 {
        let remaining = data.len() - addr;
        // This function is only meant for reads that cannot load 8 bytes.
        debug_assert!(remaining < 8);
        let mut padded = [0u8; 8];
        padded[..remaining].copy_from_slice(&data[addr..]);
        (u64::from_le_bytes(padded) >> bit_shift) & self.mask
    }

    /// Decodes the range of bitpacked `u32` values with idx
    /// in `[start_idx, start_idx + output.len())` into `output`.
    ///
    /// # Panics
    ///
    /// This method panics if `num_bits` is > 32, or if `data` does not
    /// contain all of the requested values.
    fn get_batch_u32s(&self, start_idx: u32, data: &[u8], output: &mut [u32]) {
        assert!(
            self.bit_width() <= 32,
            "Bitwidth must be <= 32 to use this method."
        );

        let end_idx: u32 = start_idx + output.len() as u32;

        // We use `usize` here to avoid overflow issues.
        let end_bit_read = (end_idx as usize) * self.num_bits;
        let end_byte_read = end_bit_read.div_ceil(8);
        assert!(
            end_byte_read <= data.len(),
            "Requested index is out of bounds."
        );

        // Simple slow implementation of get_batch_u32s, to deal with our ramps.
        let get_batch_ramp = |start_idx: u32, output: &mut [u32]| {
            for (out, idx) in output.iter_mut().zip(start_idx..) {
                *out = self.get(idx, data) as u32;
            }
        };

        // We use an unrolled routine to decode 32 values at once.
        // We therefore decompose our range of values to decode into three ranges:
        // - Entrance ramp: [start_idx, highway_start) (up to 7 values)
        // - Highway: [highway_start, highway_end) (a length multiple of 32s)
        // - Exit ramp: [highway_end, start_idx + output.len()) (up to 31 values)

        // We want the highway to start aligned with a byte boundary.
        // A sufficient condition is to start with an idx that is a multiple of 8,
        // so highway start is the closest multiple of 8 that is >= start_idx.
        //
        // The outer parentheses matter: `%` binds tighter than `-`, and without
        // them an already aligned `start_idx` would get a ramp of 8 instead of 0.
        let entrance_ramp_len: u32 = (8 - (start_idx % 8)) % 8;

        let highway_start: u32 = start_idx + entrance_ramp_len;

        if highway_start + (BitPacker1x::BLOCK_LEN as u32) > end_idx {
            // We don't have enough values to have even a single block of highway.
            // Let's just supply the values the simple way.
            get_batch_ramp(start_idx, output);
            return;
        }

        let num_blocks: usize = (end_idx - highway_start) as usize / BitPacker1x::BLOCK_LEN;

        // Entrance ramp
        get_batch_ramp(start_idx, &mut output[..entrance_ramp_len as usize]);

        // Highway
        let mut offset = (highway_start as usize * self.num_bits) / 8;
        let mut output_cursor = (highway_start - start_idx) as usize;
        for _ in 0..num_blocks {
            // `decompress` returns the number of bytes it consumed.
            offset += BitPacker1x.decompress(
                &data[offset..],
                &mut output[output_cursor..],
                self.num_bits as u8,
            );
            output_cursor += BitPacker1x::BLOCK_LEN;
        }

        // Exit ramp
        let highway_end: u32 = highway_start + (num_blocks * BitPacker1x::BLOCK_LEN) as u32;
        get_batch_ramp(highway_end, &mut output[output_cursor..]);
    }

    /// Fills `positions` with the ids of `id_range` selected for the value
    /// range `range`.
    ///
    /// Bit widths above 32 go through the one-value-at-a-time implementation.
    /// Narrower widths use the batch `u32` implementation, after clamping
    /// `range` to the `u32` domain. A range starting above `u32::MAX` cannot
    /// match any value there, so `positions` is simply emptied.
    pub fn get_ids_for_value_range(
        &self,
        range: RangeInclusive<u64>,
        id_range: Range<u32>,
        data: &[u8],
        positions: &mut Vec<u32>,
    ) {
        if self.bit_width() > 32 {
            self.get_ids_for_value_range_slow(range, id_range, data, positions);
            return;
        }
        let (lower, upper) = range.into_inner();
        let Ok(lower) = u32::try_from(lower) else {
            positions.clear();
            return;
        };
        // Saturate the upper bound at `u32::MAX`.
        let upper = u32::try_from(upper).unwrap_or(u32::MAX);
        self.get_ids_for_value_range_fast(lower..=upper, id_range, data, positions)
    }

    /// Replaces the content of `positions` with the ids of `id_range` whose
    /// value lies within `range`, decoding one value per `get` call.
    fn get_ids_for_value_range_slow(
        &self,
        range: RangeInclusive<u64>,
        id_range: Range<u32>,
        data: &[u8],
        positions: &mut Vec<u32>,
    ) {
        positions.clear();
        // If we cared we could make this branchless, but the slow
        // implementation should rarely kick in.
        positions.extend(id_range.filter(|&id| range.contains(&self.get(id, data))));
    }

    /// Batch implementation for bit widths of at most 32.
    ///
    /// `positions` first receives the decoded value of every id in
    /// `id_range`, and is then handed to `filter_vec_in_place` together with
    /// `value_range` and the first id.
    // NOTE(review): `filter_vec_in_place` presumably replaces the values with
    // the ids of the matching ones -- confirm against `filter_vec`.
    fn get_ids_for_value_range_fast(
        &self,
        value_range: RangeInclusive<u32>,
        id_range: Range<u32>,
        data: &[u8],
        positions: &mut Vec<u32>,
    ) {
        let first_id = id_range.start;
        let num_ids = id_range.len();
        positions.resize(num_ids, 0u32);
        self.get_batch_u32s(first_id, data, positions);
        crate::filter_vec::filter_vec_in_place(value_range, first_id, positions)
    }
}

#[cfg(test)]
mod test {
    use super::{BitPacker, BitUnpacker};

    /// Packs `len` deterministic values on `num_bits` bits each.
    ///
    /// Returns the matching unpacker, the values that were written and the
    /// packed bytes. Also checks that the packed length is the expected one.
    fn create_bitpacker(len: usize, num_bits: u8) -> (BitUnpacker, Vec<u64>, Vec<u8>) {
        let max_val: u64 = (1u64 << num_bits as u64) - 1u64;
        // Values cycle through `0..max_val`; a zero width can only hold 0.
        let vals: Vec<u64> = (0u64..len as u64)
            .map(|i| match max_val {
                0 => 0,
                modulus => i % modulus,
            })
            .collect();
        let mut data = Vec::new();
        let mut bitpacker = BitPacker::new();
        for val in vals.iter().copied() {
            bitpacker.write(val, num_bits, &mut data).unwrap();
        }
        bitpacker.close(&mut data).unwrap();
        let expected_len = ((num_bits as usize) * len).div_ceil(8);
        assert_eq!(data.len(), expected_len);
        (BitUnpacker::new(num_bits), vals, data)
    }

    /// Packs `len` values on `num_bits` bits and checks that each of them is
    /// read back unchanged.
    fn test_bitpacker_util(len: usize, num_bits: u8) {
        let (bitunpacker, vals, data) = create_bitpacker(len, num_bits);
        for (idx, &expected) in (0u32..).zip(vals.iter()) {
            assert_eq!(bitunpacker.get(idx, &data), expected);
        }
    }

    /// Round-trips a few `(len, num_bits)` combinations.
    #[test]
    fn test_bitpacker() {
        for (len, num_bits) in [(10, 3), (10, 0), (10, 1), (6, 14), (1000, 14)] {
            test_bitpacker_util(len, num_bits);
        }
    }

    use proptest::prelude::*;

    /// Strategy generating bit widths: 0, 1, any value in `2..56`, 56 and 64.
    ///
    /// These all satisfy the assertion in `BitUnpacker::new`
    /// (`num_bits <= 56 || num_bits == 64`).
    fn num_bits_strategy() -> impl Strategy<Value = u8> {
        prop_oneof!(Just(0), Just(1), 2u8..56u8, Just(56), Just(64),)
    }

    /// Strategy generating a bit width together with a vector of values,
    /// all of which fit in that width.
    ///
    /// The vector length is drawn from `0..100`.
    fn vals_strategy() -> impl Strategy<Value = (u8, Vec<u64>)> {
        (num_bits_strategy(), 0usize..100usize).prop_flat_map(|(num_bits, len)| {
            // Largest value representable on `num_bits` bits. 64 is handled
            // separately because `1u64 << 64` overflows.
            let max_val = if num_bits == 64 {
                u64::MAX
            } else {
                (1u64 << num_bits as u32) - 1
            };
            let vals = proptest::collection::vec(0..=max_val, len);
            vals.prop_map(move |vals| (num_bits, vals))
        })
    }

    /// Packs `vals` on `num_bits` bits, then checks the size of the packed
    /// buffer and that every value is read back unchanged.
    fn test_bitpacker_aux(num_bits: u8, vals: &[u64]) {
        let mut buffer: Vec<u8> = Vec::new();
        let mut bitpacker = BitPacker::new();
        for val in vals.iter().copied() {
            bitpacker.write(val, num_bits, &mut buffer).unwrap();
        }
        bitpacker.flush(&mut buffer).unwrap();
        let expected_len = (vals.len() * num_bits as usize).div_ceil(8);
        assert_eq!(buffer.len(), expected_len);
        let bitunpacker = BitUnpacker::new(num_bits);
        // Largest value representable on `num_bits` bits.
        let max_val = match num_bits {
            64 => u64::MAX,
            width => (1u64 << width) - 1,
        };
        for (idx, &val) in (0u32..).zip(vals) {
            assert!(val <= max_val);
            assert_eq!(bitunpacker.get(idx, &buffer), val);
        }
    }

    // Property test: for any bit width and values produced by
    // `vals_strategy`, packing then unpacking returns the original values.
    proptest::proptest! {
        #[test]
        fn test_bitpacker_proptest((num_bits, vals) in vals_strategy()) {
            test_bitpacker_aux(num_bits, &vals);
        }
    }

    /// `get_batch_u32s` must reject bit widths that do not fit in a `u32`.
    #[test]
    #[should_panic]
    fn test_get_batch_panics_over_32_bits() {
        let data = [0u8; 8];
        let mut output = [0u32; 1];
        BitUnpacker::new(33).get_batch_u32s(0, &data, &mut output);
    }

    /// Reading the last 3 of the 32 one-bit values held by 4 bytes is allowed.
    #[test]
    fn test_get_batch_limit() {
        let data = [0u8; 4];
        let mut output = [0u32; 3];
        BitUnpacker::new(1).get_batch_u32s(8 * 4 - 3, &data, &mut output);
    }

    /// Reading a single bit past the end of the data must panic.
    #[test]
    #[should_panic]
    fn test_get_batch_panics_when_off_scope() {
        let data = [0u8; 4];
        let mut output = [0u32; 3];
        // We are missing exactly one bit.
        BitUnpacker::new(1).get_batch_u32s(8 * 4 - 2, &data, &mut output);
    }

    // Property test: for every bit width in `0..=32`, `get_batch_u32s`
    // returns the packed values for several batch lengths and start offsets.
    proptest::proptest! {
        #[test]
        fn test_get_batch_u32s_proptest(num_bits in 0u8..=32u8) {
            // Mask keeping the `num_bits` lowest bits of a `u32`.
            let mask =
                if num_bits == 32u8 {
                    u32::MAX
                } else {
                    (1u32 << num_bits) - 1
                };
            let mut buffer: Vec<u8> = Vec::new();
            let mut bitpacker = BitPacker::new();
            // Pack the values 0..100, each truncated to `num_bits` bits.
            for val in 0..100 {
                bitpacker.write(val & mask as u64, num_bits, &mut buffer).unwrap();
            }
            bitpacker.flush(&mut buffer).unwrap();
            let bitunpacker = BitUnpacker::new(num_bits);
            let mut output: Vec<u32> = Vec::new();
            // The largest request ends at idx 31 + 64 = 95, within the 100
            // packed values.
            for len in [0, 1, 2, 32, 33, 34, 64] {
                for start_idx in 0u32..32u32 {
                    output.resize(len, 0);
                    bitunpacker.get_batch_u32s(start_idx, &buffer, &mut output);
                    // Each decoded entry is a `u32` value (not a byte): the
                    // value at idx `i` is `i` truncated to `num_bits` bits.
                    for (i, output_byte) in output.iter().enumerate() {
                        let expected = (start_idx + i as u32) & mask;
                        assert_eq!(*output_byte, expected);
                    }
                }
            }
        }
    }
}


================================================
FILE: bitpacker/src/blocked_bitpacker.rs
================================================
use super::bitpacker::BitPacker;
use super::compute_num_bits;
use crate::{BitUnpacker, minmax};

/// Number of values buffered before they are bit-packed together as one block.
const BLOCK_SIZE: usize = 128;

/// `BlockedBitpacker` compresses `u64` values in blocks of `BLOCK_SIZE`
/// (128) elements, while keeping a per-block index so that any element can
/// still be accessed by its position.
///
/// Each block is stored as the difference to the block's minimum value,
/// bit-packed with the smallest bit width that fits the block.
#[derive(Debug, Clone)]
pub struct BlockedBitpacker {
    // Bit-packed blocks, back to back, followed by 8 bytes of zero padding.
    compressed_blocks: Vec<u8>,
    // Uncompressed values, collected until `BLOCK_SIZE` of them are available.
    buffer: Vec<u64>,
    // One entry per compressed block: where it starts, its bit width and
    // the base value to add back when reading.
    offset_and_bits: Vec<BlockedBitpackerEntryMetaData>,
}
impl Default for BlockedBitpacker {
    fn default() -> Self {
        BlockedBitpacker::new()
    }
}

/// `BlockedBitpackerEntryMetaData` describes one compressed block.
///
/// The byte offset of the block and its bit width are packed into a single
/// `u64` bit field: the bit width lives in the top 8 bits and the offset in
/// the lower 56 bits.
///
/// This saves some space, since 7 bytes are more than enough for the
/// offset, and it also keeps the access fast because of alignment.
#[derive(Debug, Clone, Default)]
struct BlockedBitpackerEntryMetaData {
    // Bit width (top byte) and byte offset (low 7 bytes) of the block.
    encoded: u64,
    // Value subtracted from every element before packing, added back on read.
    base_value: u64,
}

impl BlockedBitpackerEntryMetaData {
    /// Packs `num_bits` into the top byte of a `u64` and `offset` into the
    /// remaining 56 bits. `offset` is expected to fit in 56 bits; higher
    /// bits would overlap with the bit width.
    fn new(offset: u64, num_bits: u8, base_value: u64) -> Self {
        let bit_width_field = u64::from(num_bits) << 56;
        Self {
            encoded: bit_width_field | offset,
            base_value,
        }
    }
    /// Byte offset of the block: the low 56 bits of the packed word.
    fn offset(&self) -> u64 {
        const OFFSET_MASK: u64 = u64::MAX >> 8;
        self.encoded & OFFSET_MASK
    }
    /// Bit width of the block: the most significant byte of the packed word.
    fn num_bits(&self) -> u8 {
        let [top_byte, ..] = self.encoded.to_be_bytes();
        top_byte
    }
    /// Value to add back to every unpacked element of the block.
    fn base_value(&self) -> u64 {
        self.base_value
    }
}

/// Checks that every field given to `BlockedBitpackerEntryMetaData::new` is
/// read back unchanged, including at the widest values the packed fields
/// can hold.
#[test]
fn metadata_test() {
    let meta = BlockedBitpackerEntryMetaData::new(50000, 6, 40000);
    assert_eq!(meta.offset(), 50000);
    assert_eq!(meta.num_bits(), 6);
    assert_eq!(meta.base_value(), 40000);

    // Largest 56-bit offset next to a 64-bit width: the two packed fields
    // must not bleed into each other.
    let max_offset = (1u64 << 56) - 1;
    let meta = BlockedBitpackerEntryMetaData::new(max_offset, 64, u64::MAX);
    assert_eq!(meta.offset(), max_offset);
    assert_eq!(meta.num_bits(), 64);
    assert_eq!(meta.base_value(), u64::MAX);
}

/// Number of bytes reserved by the heap buffer of `items`, computed from
/// its capacity rather than its length.
fn mem_usage<T>(items: &Vec<T>) -> usize {
    let bytes_per_item = std::mem::size_of::<T>();
    items.capacity() * bytes_per_item
}

impl BlockedBitpacker {
    /// Number of zero bytes kept at the end of `compressed_blocks` as
    /// padding for the bitpacker.
    const PADDING_BYTES: usize = 8;

    /// Creates an empty `BlockedBitpacker`.
    ///
    /// `compressed_blocks` starts with the trailing padding already in
    /// place, so that `flush` can always remove and re-add it.
    pub fn new() -> Self {
        Self {
            compressed_blocks: vec![0; Self::PADDING_BYTES],
            buffer: vec![],
            offset_and_bits: vec![],
        }
    }

    /// The memory used (inclusive childs)
    pub fn mem_usage(&self) -> usize {
        std::mem::size_of::<BlockedBitpacker>()
            + self.compressed_blocks.capacity()
            + mem_usage(&self.offset_and_bits)
            + mem_usage(&self.buffer)
    }

    /// Appends `val`. Once `BLOCK_SIZE` values are buffered, they are
    /// compressed into a new block.
    #[inline]
    pub fn add(&mut self, val: u64) {
        self.buffer.push(val);
        if self.buffer.len() == BLOCK_SIZE {
            self.flush();
        }
    }

    /// Compresses the buffered values into a new block and clears the
    /// buffer. Does nothing if the buffer is empty.
    ///
    /// `get` and `iter` locate a value by dividing its index by
    /// `BLOCK_SIZE`, i.e. they assume that every compressed block holds
    /// exactly `BLOCK_SIZE` values. Flushing a partially filled buffer and
    /// then adding more values breaks that assumption.
    pub fn flush(&mut self) {
        let Some((min_value, max_value)) = minmax(self.buffer.iter().copied()) else {
            return;
        };
        let num_bits_block = compute_num_bits(max_value - min_value);
        // todo performance: the padding handling could be done better, e.g. use a slice and
        // return num_bytes written from bitpacker
        //
        // Remove the padding, so that the new block starts right after the
        // previous one.
        let offset = self.compressed_blocks.len() - Self::PADDING_BYTES;
        self.compressed_blocks.truncate(offset);
        let mut bit_packer = BitPacker::new();
        // todo performance: for some bit_width we
        // can encode multiple vals into the
        // mini_buffer before checking to flush
        // (to be done in BitPacker)
        for &val in &self.buffer {
            bit_packer
                .write(val - min_value, num_bits_block, &mut self.compressed_blocks)
                .expect("cannot write bitpacking to output"); // write to in memory can't fail
        }
        bit_packer
            .flush(&mut self.compressed_blocks)
            .expect("cannot flush bitpacking to output"); // write to in memory can't fail
        self.offset_and_bits
            .push(BlockedBitpackerEntryMetaData::new(
                offset as u64,
                num_bits_block,
                min_value,
            ));

        self.buffer.clear();
        // Add the padding for the bitpacker back.
        let padded_len = self.compressed_blocks.len() + Self::PADDING_BYTES;
        self.compressed_blocks.resize(padded_len, 0);
    }

    /// Returns the value at position `idx` (in insertion order).
    ///
    /// Values of compressed blocks are unpacked on the fly; values that are
    /// still in the pending buffer are read directly.
    ///
    /// # Panics
    ///
    /// Panics if `idx` points into the pending buffer but past its end. In
    /// debug builds it also panics if `idx` points past the pending block
    /// altogether, instead of silently returning an unrelated buffered
    /// value.
    #[inline]
    pub fn get(&self, idx: usize) -> u64 {
        let metadata_pos = idx / BLOCK_SIZE;
        let pos_in_block = idx % BLOCK_SIZE;
        if let Some(metadata) = self.offset_and_bits.get(metadata_pos) {
            let unpacked = BitUnpacker::new(metadata.num_bits()).get(
                pos_in_block as u32,
                &self.compressed_blocks[metadata.offset() as usize..],
            );
            unpacked + metadata.base_value()
        } else {
            // Only the block right after the last compressed one is backed
            // by the pending buffer.
            debug_assert_eq!(
                metadata_pos,
                self.offset_and_bits.len(),
                "index {} is out of bounds",
                idx
            );
            self.buffer[pos_in_block]
        }
    }

    /// Iterates over all values in insertion order: first the values of
    /// the compressed blocks, then the ones still in the pending buffer.
    pub fn iter(&self) -> impl Iterator<Item = u64> + '_ {
        // todo performance: we could decompress a whole block and cache it instead
        let bitpacked_elems = self.offset_and_bits.len() * BLOCK_SIZE;

        (0..bitpacked_elems)
            .map(move |idx| self.get(idx))
            .chain(self.buffer.iter().cloned())
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// A fresh bitpacker yields no value.
    #[test]
    fn blocked_bitpacker_empty() {
        let packer = BlockedBitpacker::new();
        let collected: Vec<u64> = packer.iter().collect();
        assert_eq!(collected, Vec::<u64>::new());
    }

    /// A single value stays in the pending buffer and is still readable.
    #[test]
    fn blocked_bitpacker_one() {
        let mut packer = BlockedBitpacker::new();
        packer.add(50000);
        assert_eq!(packer.get(0), 50000);
        let collected: Vec<u64> = packer.iter().collect();
        assert_eq!(collected, vec![50000]);
    }

    /// 21500 values: many compressed blocks followed by a partially filled
    /// buffer.
    #[test]
    fn blocked_bitpacker_test() {
        const NUM_VALS: u64 = 21500;
        let mut packer = BlockedBitpacker::new();
        (0..NUM_VALS).for_each(|val| packer.add(val));
        for expected in 0..NUM_VALS {
            assert_eq!(packer.get(expected as usize), expected);
        }
        assert_eq!(packer.iter().count(), NUM_VALS as usize);
        assert_eq!(packer.iter().last(), Some(NUM_VALS - 1));
    }
}


================================================
FILE: bitpacker/src/filter_vec/avx2.rs
================================================
//! SIMD filtering of a vector as described in the following blog post.
//! <https://quickwit.io/blog/filtering%20a%20vector%20with%20simd%20instructions%20avx-2%20and%20avx-512>
use std::arch::x86_64::{
    __m256i as DataType, _mm256_add_epi32 as op_add, _mm256_cmpgt_epi32 as op_greater,
    _mm256_lddqu_si256 as load_unaligned, _mm256_or_si256 as op_or, _mm256_set1_epi32 as set1,
    _mm256_storeu_si256 as store_unaligned, _mm256_xor_si256 as op_xor, *,
};
use std::ops::RangeInclusive;

/// Number of `u32` lanes in one 256-bit AVX2 word.
const NUM_LANES: usize = 8;

/// Top bit of a 32-bit integer. XOR-ing a `u32` with it gives an `i32`
/// that sorts the same way, see `u32_to_i32`.
const HIGHEST_BIT: u32 = 1 << 31;

/// Maps a `u32` to an `i32` by flipping its top bit, so that comparing the
/// results as signed integers gives the same order as comparing the inputs
/// as unsigned integers.
#[inline]
fn u32_to_i32(val: u32) -> i32 {
    let top_bit_flipped: u32 = val ^ HIGHEST_BIT;
    top_bit_flipped as i32
}

/// Lane-wise version of [`u32_to_i32`]: flips the top bit of each of the
/// eight 32-bit lanes of `vals_u32x8s`.
///
/// # Safety
///
/// This runs an AVX2 intrinsic. NOTE(review): the caller presumably has to
/// make sure AVX2 is available on the current CPU.
#[inline]
unsafe fn u32_to_i32_avx2(vals_u32x8s: DataType) -> DataType {
    const TOP_BIT_PER_LANE: DataType = from_u32x8([HIGHEST_BIT; NUM_LANES]);
    // SAFETY: the XOR works on register values only; AVX2 availability is
    // part of this function's contract.
    unsafe { op_xor(vals_u32x8s, TOP_BIT_PER_LANE) }
}

/// AVX2 implementation of the in-place filter.
///
/// On entry, `output` holds the values to test. On exit, it holds
/// `offset + i` for every position `i` whose value was inside `range`, in
/// increasing order of `i`, and is truncated to the number of matches.
///
/// Complete groups of `NUM_LANES` values go through `filter_vec_avx2_aux`;
/// the remaining tail is handled by a scalar loop.
///
/// NOTE(review): this function is not `unsafe` but runs AVX2 code
/// unconditionally; callers presumably have to check that AVX2 is available
/// before calling it.
pub fn filter_vec_in_place(range: RangeInclusive<u32>, offset: u32, output: &mut Vec<u32>) {
    // We use a monotonic mapping from u32 to i32 to make the comparison possible in AVX2.
    let range_i32: RangeInclusive<i32> = u32_to_i32(*range.start())..=u32_to_i32(*range.end());
    // Number of complete 8-lane words. Only those are processed with SIMD.
    let num_words = output.len() / NUM_LANES;
    // The same buffer is passed as input and as output: the SIMD loop
    // writes at most as many ids as it has already read values, so the
    // write position never gets ahead of the read position.
    let mut output_len = unsafe {
        filter_vec_avx2_aux(
            output.as_ptr() as *const __m256i,
            range_i32,
            output.as_mut_ptr(),
            offset,
            num_words,
        )
    };
    // Scalar pass over the values that did not fill a complete word.
    let reminder_start = num_words * NUM_LANES;
    for i in reminder_start..output.len() {
        // The value is read before the write below, as both may target the
        // same slot.
        let val = output[i];
        // Branch-free: the id is always written, but the cursor only moves
        // forward when the value is in range.
        output[output_len] = offset + i as u32;
        output_len += if range.contains(&val) { 1 } else { 0 };
    }
    output.truncate(output_len);
}

/// SIMD core of the filter: processes `num_words` words of eight `u32`
/// values each.
///
/// For every value inside `range` (both already mapped to the signed
/// domain for the bounds, see `u32_to_i32`), the id `offset + position` is
/// appended at `output`. Returns the number of ids written.
///
/// # Safety
///
/// - The function is compiled with the `avx2` target feature enabled.
/// - `input` is read `num_words` times, 256 bits at a time (unaligned
///   loads).
/// - Each iteration stores a full 256-bit word at the current write
///   position, even though only the first `added_len` lanes are kept.
///   `output` must therefore be writable for 8 lanes past the write
///   position.
#[target_feature(enable = "avx2")]
unsafe fn filter_vec_avx2_aux(
    mut input: *const __m256i,
    range: RangeInclusive<i32>,
    output: *mut u32,
    offset: u32,
    num_words: usize,
) -> usize {
    let mut output_tail = output;
    // Bounds of the range, broadcast to all lanes.
    let range_simd = set1(*range.start())..=set1(*range.end());
    // Ids of the eight values of the current word.
    let mut ids = from_u32x8([
        offset,
        offset + 1,
        offset + 2,
        offset + 3,
        offset + 4,
        offset + 5,
        offset + 6,
        offset + 7,
    ]);
    // Added to `ids` after each word, to get the ids of the next word.
    const SHIFT: __m256i = from_u32x8([NUM_LANES as u32; NUM_LANES]);
    for _ in 0..num_words {
        unsafe {
            let word = load_unaligned(input);
            // Move to the signed domain, as AVX2 only has signed comparisons.
            let word = u32_to_i32_avx2(word);
            // Bit `i` is set if lane `i` is inside the range.
            let keeper_bitset = compute_filter_bitset(word, range_simd.clone());
            let added_len = keeper_bitset.count_ones();
            // Pack the ids of the kept lanes at the front of the word.
            let filtered_doc_ids = compact(ids, keeper_bitset);
            // All eight lanes are stored, but the tail only advances by the
            // number of kept ids: the extra lanes get overwritten by the
            // next store, or are left past the returned length.
            store_unaligned(output_tail as *mut __m256i, filtered_doc_ids);
            output_tail = output_tail.offset(added_len as isize);
            ids = op_add(ids, SHIFT);
            input = input.offset(1);
        }
    }
    // Number of `u32` written, as the distance between the tail and the start.
    unsafe { output_tail.offset_from(output) as usize }
}

/// Moves the lanes of `data` selected by `mask` (bit `i` set means lane `i`
/// is kept) to the front, preserving their order. The permutation is looked
/// up in `MASK_TO_PERMUTATION`.
#[inline]
#[target_feature(enable = "avx2")]
unsafe fn compact(data: DataType, mask: u8) -> DataType {
    _mm256_permutevar8x32_epi32(data, MASK_TO_PERMUTATION[usize::from(mask)])
}

/// Returns a bitset in which bit `i` is set if and only if lane `i` of `val`
/// lies inside `range` (bounds included), using signed 32-bit comparisons.
#[inline]
#[target_feature(enable = "avx2")]
unsafe fn compute_filter_bitset(val: __m256i, range: std::ops::RangeInclusive<__m256i>) -> u8 {
    let (lower, upper) = (*range.start(), *range.end());
    let below = op_greater(lower, val);
    let above = op_greater(val, upper);
    // A lane is all ones if its value is out of the range.
    let outside = op_or(below, above);
    // `movemask` gathers the top bit of each lane into the low 8 bits.
    let outside_bits = std::arch::x86_64::_mm256_movemask_ps(_mm256_castsi256_ps(outside)) as u8;
    !outside_bits
}

/// Gives access to a 256-bit SIMD word either as a whole or as its eight
/// `u32` lanes.
union U32x8 {
    vector: DataType,
    vals: [u32; NUM_LANES],
}

/// Builds a SIMD word out of its eight `u32` lanes. Being a `const fn`, it
/// can be used to define SIMD constants.
const fn from_u32x8(vals: [u32; NUM_LANES]) -> DataType {
    let lanes = U32x8 { vals };
    // SAFETY: both fields are 32 bytes of plain integer data, so reading
    // the lanes back as a vector is valid for any bit pattern.
    unsafe { lanes.vector }
}

/// Permutations used by `compact`, indexed by an 8-bit keep mask.
///
/// The entry at index `m` lists, in increasing order, the positions of the
/// bits set in `m`, and is then padded with zeros up to eight lanes. For
/// instance, the entry for `0b0000_0101` starts with `0, 2`.
const MASK_TO_PERMUTATION: [DataType; 256] = [
    from_u32x8([0, 0, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 0, 0, 0, 0, 0, 0, 0]),
    from_u32x8([1, 0, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 0, 0, 0, 0, 0, 0]),
    from_u32x8([2, 0, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 0, 0, 0, 0, 0, 0]),
    from_u32x8([1, 2, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 0, 0, 0, 0, 0]),
    from_u32x8([3, 0, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 3, 0, 0, 0, 0, 0, 0]),
    from_u32x8([1, 3, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 3, 0, 0, 0, 0, 0]),
    from_u32x8([2, 3, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 3, 0, 0, 0, 0, 0]),
    from_u32x8([1, 2, 3, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 3, 0, 0, 0, 0]),
    from_u32x8([4, 0, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 4, 0, 0, 0, 0, 0, 0]),
    from_u32x8([1, 4, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 4, 0, 0, 0, 0, 0]),
    from_u32x8([2, 4, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 4, 0, 0, 0, 0, 0]),
    from_u32x8([1, 2, 4, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 4, 0, 0, 0, 0]),
    from_u32x8([3, 4, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 3, 4, 0, 0, 0, 0, 0]),
    from_u32x8([1, 3, 4, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 3, 4, 0, 0, 0, 0]),
    from_u32x8([2, 3, 4, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 3, 4, 0, 0, 0, 0]),
    from_u32x8([1, 2, 3, 4, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 3, 4, 0, 0, 0]),
    from_u32x8([5, 0, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 5, 0, 0, 0, 0, 0, 0]),
    from_u32x8([1, 5, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 5, 0, 0, 0, 0, 0]),
    from_u32x8([2, 5, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 5, 0, 0, 0, 0, 0]),
    from_u32x8([1, 2, 5, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 5, 0, 0, 0, 0]),
    from_u32x8([3, 5, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 3, 5, 0, 0, 0, 0, 0]),
    from_u32x8([1, 3, 5, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 3, 5, 0, 0, 0, 0]),
    from_u32x8([2, 3, 5, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 3, 5, 0, 0, 0, 0]),
    from_u32x8([1, 2, 3, 5, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 3, 5, 0, 0, 0]),
    from_u32x8([4, 5, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 4, 5, 0, 0, 0, 0, 0]),
    from_u32x8([1, 4, 5, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 4, 5, 0, 0, 0, 0]),
    from_u32x8([2, 4, 5, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 4, 5, 0, 0, 0, 0]),
    from_u32x8([1, 2, 4, 5, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 4, 5, 0, 0, 0]),
    from_u32x8([3, 4, 5, 0, 0, 0, 0, 0]),
    from_u32x8([0, 3, 4, 5, 0, 0, 0, 0]),
    from_u32x8([1, 3, 4, 5, 0, 0, 0, 0]),
    from_u32x8([0, 1, 3, 4, 5, 0, 0, 0]),
    from_u32x8([2, 3, 4, 5, 0, 0, 0, 0]),
    from_u32x8([0, 2, 3, 4, 5, 0, 0, 0]),
    from_u32x8([1, 2, 3, 4, 5, 0, 0, 0]),
    from_u32x8([0, 1, 2, 3, 4, 5, 0, 0]),
    from_u32x8([6, 0, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 6, 0, 0, 0, 0, 0, 0]),
    from_u32x8([1, 6, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 6, 0, 0, 0, 0, 0]),
    from_u32x8([2, 6, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 6, 0, 0, 0, 0, 0]),
    from_u32x8([1, 2, 6, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 6, 0, 0, 0, 0]),
    from_u32x8([3, 6, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 3, 6, 0, 0, 0, 0, 0]),
    from_u32x8([1, 3, 6, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 3, 6, 0, 0, 0, 0]),
    from_u32x8([2, 3, 6, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 3, 6, 0, 0, 0, 0]),
    from_u32x8([1, 2, 3, 6, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 3, 6, 0, 0, 0]),
    from_u32x8([4, 6, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 4, 6, 0, 0, 0, 0, 0]),
    from_u32x8([1, 4, 6, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 4, 6, 0, 0, 0, 0]),
    from_u32x8([2, 4, 6, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 4, 6, 0, 0, 0, 0]),
    from_u32x8([1, 2, 4, 6, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 4, 6, 0, 0, 0]),
    from_u32x8([3, 4, 6, 0, 0, 0, 0, 0]),
    from_u32x8([0, 3, 4, 6, 0, 0, 0, 0]),
    from_u32x8([1, 3, 4, 6, 0, 0, 0, 0]),
    from_u32x8([0, 1, 3, 4, 6, 0, 0, 0]),
    from_u32x8([2, 3, 4, 6, 0, 0, 0, 0]),
    from_u32x8([0, 2, 3, 4, 6, 0, 0, 0]),
    from_u32x8([1, 2, 3, 4, 6, 0, 0, 0]),
    from_u32x8([0, 1, 2, 3, 4, 6, 0, 0]),
    from_u32x8([5, 6, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 5, 6, 0, 0, 0, 0, 0]),
    from_u32x8([1, 5, 6, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 5, 6, 0, 0, 0, 0]),
    from_u32x8([2, 5, 6, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 5, 6, 0, 0, 0, 0]),
    from_u32x8([1, 2, 5, 6, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 5, 6, 0, 0, 0]),
    from_u32x8([3, 5, 6, 0, 0, 0, 0, 0]),
    from_u32x8([0, 3, 5, 6, 0, 0, 0, 0]),
    from_u32x8([1, 3, 5, 6, 0, 0, 0, 0]),
    from_u32x8([0, 1, 3, 5, 6, 0, 0, 0]),
    from_u32x8([2, 3, 5, 6, 0, 0, 0, 0]),
    from_u32x8([0, 2, 3, 5, 6, 0, 0, 0]),
    from_u32x8([1, 2, 3, 5, 6, 0, 0, 0]),
    from_u32x8([0, 1, 2, 3, 5, 6, 0, 0]),
    from_u32x8([4, 5, 6, 0, 0, 0, 0, 0]),
    from_u32x8([0, 4, 5, 6, 0, 0, 0, 0]),
    from_u32x8([1, 4, 5, 6, 0, 0, 0, 0]),
    from_u32x8([0, 1, 4, 5, 6, 0, 0, 0]),
    from_u32x8([2, 4, 5, 6, 0, 0, 0, 0]),
    from_u32x8([0, 2, 4, 5, 6, 0, 0, 0]),
    from_u32x8([1, 2, 4, 5, 6, 0, 0, 0]),
    from_u32x8([0, 1, 2, 4, 5, 6, 0, 0]),
    from_u32x8([3, 4, 5, 6, 0, 0, 0, 0]),
    from_u32x8([0, 3, 4, 5, 6, 0, 0, 0]),
    from_u32x8([1, 3, 4, 5, 6, 0, 0, 0]),
    from_u32x8([0, 1, 3, 4, 5, 6, 0, 0]),
    from_u32x8([2, 3, 4, 5, 6, 0, 0, 0]),
    from_u32x8([0, 2, 3, 4, 5, 6, 0, 0]),
    from_u32x8([1, 2, 3, 4, 5, 6, 0, 0]),
    from_u32x8([0, 1, 2, 3, 4, 5, 6, 0]),
    from_u32x8([7, 0, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 7, 0, 0, 0, 0, 0, 0]),
    from_u32x8([1, 7, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 7, 0, 0, 0, 0, 0]),
    from_u32x8([2, 7, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 7, 0, 0, 0, 0, 0]),
    from_u32x8([1, 2, 7, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 7, 0, 0, 0, 0]),
    from_u32x8([3, 7, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 3, 7, 0, 0, 0, 0, 0]),
    from_u32x8([1, 3, 7, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 3, 7, 0, 0, 0, 0]),
    from_u32x8([2, 3, 7, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 3, 7, 0, 0, 0, 0]),
    from_u32x8([1, 2, 3, 7, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 3, 7, 0, 0, 0]),
    from_u32x8([4, 7, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 4, 7, 0, 0, 0, 0, 0]),
    from_u32x8([1, 4, 7, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 4, 7, 0, 0, 0, 0]),
    from_u32x8([2, 4, 7, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 4, 7, 0, 0, 0, 0]),
    from_u32x8([1, 2, 4, 7, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 4, 7, 0, 0, 0]),
    from_u32x8([3, 4, 7, 0, 0, 0, 0, 0]),
    from_u32x8([0, 3, 4, 7, 0, 0, 0, 0]),
    from_u32x8([1, 3, 4, 7, 0, 0, 0, 0]),
    from_u32x8([0, 1, 3, 4, 7, 0, 0, 0]),
    from_u32x8([2, 3, 4, 7, 0, 0, 0, 0]),
    from_u32x8([0, 2, 3, 4, 7, 0, 0, 0]),
    from_u32x8([1, 2, 3, 4, 7, 0, 0, 0]),
    from_u32x8([0, 1, 2, 3, 4, 7, 0, 0]),
    from_u32x8([5, 7, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 5, 7, 0, 0, 0, 0, 0]),
    from_u32x8([1, 5, 7, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 5, 7, 0, 0, 0, 0]),
    from_u32x8([2, 5, 7, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 5, 7, 0, 0, 0, 0]),
    from_u32x8([1, 2, 5, 7, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 5, 7, 0, 0, 0]),
    from_u32x8([3, 5, 7, 0, 0, 0, 0, 0]),
    from_u32x8([0, 3, 5, 7, 0, 0, 0, 0]),
    from_u32x8([1, 3, 5, 7, 0, 0, 0, 0]),
    from_u32x8([0, 1, 3, 5, 7, 0, 0, 0]),
    from_u32x8([2, 3, 5, 7, 0, 0, 0, 0]),
    from_u32x8([0, 2, 3, 5, 7, 0, 0, 0]),
    from_u32x8([1, 2, 3, 5, 7, 0, 0, 0]),
    from_u32x8([0, 1, 2, 3, 5, 7, 0, 0]),
    from_u32x8([4, 5, 7, 0, 0, 0, 0, 0]),
    from_u32x8([0, 4, 5, 7, 0, 0, 0, 0]),
    from_u32x8([1, 4, 5, 7, 0, 0, 0, 0]),
    from_u32x8([0, 1, 4, 5, 7, 0, 0, 0]),
    from_u32x8([2, 4, 5, 7, 0, 0, 0, 0]),
    from_u32x8([0, 2, 4, 5, 7, 0, 0, 0]),
    from_u32x8([1, 2, 4, 5, 7, 0, 0, 0]),
    from_u32x8([0, 1, 2, 4, 5, 7, 0, 0]),
    from_u32x8([3, 4, 5, 7, 0, 0, 0, 0]),
    from_u32x8([0, 3, 4, 5, 7, 0, 0, 0]),
    from_u32x8([1, 3, 4, 5, 7, 0, 0, 0]),
    from_u32x8([0, 1, 3, 4, 5, 7, 0, 0]),
    from_u32x8([2, 3, 4, 5, 7, 0, 0, 0]),
    from_u32x8([0, 2, 3, 4, 5, 7, 0, 0]),
    from_u32x8([1, 2, 3, 4, 5, 7, 0, 0]),
    from_u32x8([0, 1, 2, 3, 4, 5, 7, 0]),
    from_u32x8([6, 7, 0, 0, 0, 0, 0, 0]),
    from_u32x8([0, 6, 7, 0, 0, 0, 0, 0]),
    from_u32x8([1, 6, 7, 0, 0, 0, 0, 0]),
    from_u32x8([0, 1, 6, 7, 0, 0, 0, 0]),
    from_u32x8([2, 6, 7, 0, 0, 0, 0, 0]),
    from_u32x8([0, 2, 6, 7, 0, 0, 0, 0]),
    from_u32x8([1, 2, 6, 7, 0, 0, 0, 0]),
    from_u32x8([0, 1, 2, 6, 7, 0, 0, 0]),
    from_u32x8([3, 6, 7, 0, 0, 0, 0, 0]),
    from_u32x8([0, 3, 6, 7, 0, 0, 0, 0]),
    from_u32x8([1, 3, 6, 7, 0, 0, 0, 0]),
    from_u32x8([0, 1, 3, 6, 7, 0, 0, 0]),
    from_u32x8([2, 3, 6, 7, 0, 0, 0, 0]),
    from_u32x8([0, 2, 3, 6, 7, 0, 0, 0]),
    from_u32x8([1, 2, 3, 6, 7, 0, 0, 0]),
    from_u32x8([0, 1, 2, 3, 6, 7, 0, 0]),
    from_u32x8([4, 6, 7, 0, 0, 0, 0, 0]),
    from_u32x8([0, 4, 6, 7, 0, 0, 0, 0]),
    from_u32x8([1, 4, 6, 7, 0, 0, 0, 0]),
    from_u32x8([0, 1, 4, 6, 7, 0, 0, 0]),
    from_u32x8([2, 4, 6, 7, 0, 0, 0, 0]),
    from_u32x8([0, 2, 4, 6, 7, 0, 0, 0]),
    from_u32x8([1, 2, 4, 6, 7, 0, 0, 0]),
    from_u32x8([0, 1, 2, 4, 6, 7, 0, 0]),
    from_u32x8([3, 4, 6, 7, 0, 0, 0, 0]),
    from_u32x8([0, 3, 4, 6, 7, 0, 0, 0]),
    from_u32x8([1, 3, 4, 6, 7, 0, 0, 0]),
    from_u32x8([0, 1, 3, 4, 6, 7, 0, 0]),
    from_u32x8([2, 3, 4, 6, 7, 0, 0, 0]),
    from_u32x8([0, 2, 3, 4, 6, 7, 0, 0]),
    from_u32x8([1, 2, 3, 4, 6, 7, 0, 0]),
    from_u32x8([0, 1, 2, 3, 4, 6, 7, 0]),
    from_u32x8([5, 6, 7, 0, 0, 0, 0, 0]),
    from_u32x8([0, 5, 6, 7, 0, 0, 0, 0]),
    from_u32x8([1, 5, 6, 7, 0, 0, 0, 0]),
    from_u32x8([0, 1, 5, 6, 7, 0, 0, 0]),
    from_u32x8([2, 5, 6, 7, 0, 0, 0, 0]),
    from_u32x8([0, 2, 5, 6, 7, 0, 0, 0]),
    from_u32x8([1, 2, 5, 6, 7, 0, 0, 0]),
    from_u32x8([0, 1, 2, 5, 6, 7, 0, 0]),
    from_u32x8([3, 5, 6, 7, 0, 0, 0, 0]),
    from_u32x8([0, 3, 5, 6, 7, 0, 0, 0]),
    from_u32x8([1, 3, 5, 6, 7, 0, 0, 0]),
    from_u32x8([0, 1, 3, 5, 6, 7, 0, 0]),
    from_u32x8([2, 3, 5, 6, 7, 0, 0, 0]),
    from_u32x8([0, 2, 3, 5, 6, 7, 0, 0]),
    from_u32x8([1, 2, 3, 5, 6, 7, 0, 0]),
    from_u32x8([0, 1, 2, 3, 5, 6, 7, 0]),
    from_u32x8([4, 5, 6, 7, 0, 0, 0, 0]),
    from_u32x8([0, 4, 5, 6, 7, 0, 0, 0]),
    from_u32x8([1, 4, 5, 6, 7, 0, 0, 0]),
    from_u32x8([0, 1, 4, 5, 6, 7, 0, 0]),
    from_u32x8([2, 4, 5, 6, 7, 0, 0, 0]),
    from_u32x8([0, 2, 4, 5, 6, 7, 0, 0]),
    from_u32x8([1, 2, 4, 5, 6, 7, 0, 0]),
    from_u32x8([0, 1, 2, 4, 5, 6, 7, 0]),
    from_u32x8([3, 4, 5, 6, 7, 0, 0, 0]),
    from_u32x8([0, 3, 4, 5, 6, 7, 0, 0]),
    from_u32x8([1, 3, 4, 5, 6, 7, 0, 0]),
    from_u32x8([0, 1, 3, 4, 5, 6, 7, 0]),
    from_u32x8([2, 3, 4, 5, 6, 7, 0, 0]),
    from_u32x8([0, 2, 3, 4, 5, 6, 7, 0]),
    from_u32x8([1, 2, 3, 4, 5, 6, 7, 0]),
    from_u32x8([0, 1, 2, 3, 4, 5, 6, 7]),
];


================================================
FILE: bitpacker/src/filter_vec/mod.rs
================================================
use std::ops::RangeInclusive;

#[cfg(target_arch = "x86_64")]
mod avx2;

mod scalar;

/// The implementations of `filter_vec_in_place`, one per supported
/// instruction set.
///
/// The `u8` discriminant is the code used to cache the selected
/// implementation in an atomic (see `get_best_available_instruction_set`).
#[derive(Clone, Copy, Eq, PartialEq, Debug)]
#[repr(u8)]
enum FilterImplPerInstructionSet {
    // Only compiled in on x86_64.
    #[cfg(target_arch = "x86_64")]
    AVX2 = 0u8,
    // Portable implementation, always available.
    Scalar = 1u8,
}

impl FilterImplPerInstructionSet {
    #[inline]
    pub fn is_available(&self) -> bool {
        match *self {
            #[cfg(target_arch = "x86_64")]
            FilterImplPerInstructionSet::AVX2 => is_x86_feature_detected!("avx2"),
            FilterImplPerInstructionSet::Scalar => true,
        }
    }
}

// List of the implementations compiled for this target, in order of
// preference (most preferred first).
#[cfg(target_arch = "x86_64")]
const IMPLS: [FilterImplPerInstructionSet; 2] = [
    FilterImplPerInstructionSet::AVX2,
    FilterImplPerInstructionSet::Scalar,
];

// On other architectures, only the scalar implementation exists.
#[cfg(not(target_arch = "x86_64"))]
const IMPLS: [FilterImplPerInstructionSet; 1] = [FilterImplPerInstructionSet::Scalar];

impl FilterImplPerInstructionSet {
    /// Decodes a code obtained with `as u8`. Every code other than the one
    /// of `AVX2` decodes to `Scalar`.
    #[inline]
    #[allow(unused_variables)] // on non-x86_64, code is unused.
    fn from(code: u8) -> FilterImplPerInstructionSet {
        #[cfg(target_arch = "x86_64")]
        if code == Self::AVX2 as u8 {
            return Self::AVX2;
        }
        Self::Scalar
    }

    /// Runs this implementation of the in-place filter on `output`.
    #[inline]
    fn filter_vec_in_place(self, range: RangeInclusive<u32>, offset: u32, output: &mut Vec<u32>) {
        match self {
            #[cfg(target_arch = "x86_64")]
            Self::AVX2 => avx2::filter_vec_in_place(range, offset, output),
            Self::Scalar => scalar::filter_vec_in_place(range, offset, output),
        }
    }
}

/// Returns the first implementation of `IMPLS` that is available on the
/// current CPU.
///
/// The result is cached as a `u8` code in a static atomic, `u8::MAX`
/// meaning "not computed yet", so that the detection does not run on every
/// call.
#[inline]
fn get_best_available_instruction_set() -> FilterImplPerInstructionSet {
    use std::sync::atomic::{AtomicU8, Ordering};
    const NOT_COMPUTED: u8 = u8::MAX;
    static INSTRUCTION_SET_BYTE: AtomicU8 = AtomicU8::new(NOT_COMPUTED);

    let cached_code: u8 = INSTRUCTION_SET_BYTE.load(Ordering::Relaxed);
    if cached_code != NOT_COMPUTED {
        return FilterImplPerInstructionSet::from(cached_code);
    }
    // Let's initialize the instruction set and cache it.
    let detected = IMPLS
        .into_iter()
        .find(FilterImplPerInstructionSet::is_available)
        .unwrap();
    INSTRUCTION_SET_BYTE.store(detected as u8, Ordering::Relaxed);
    detected
}

/// Replaces the content of `output` with `offset + i` for every position
/// `i` whose value lies inside `range`, using the best implementation
/// available on the current CPU.
pub fn filter_vec_in_place(range: RangeInclusive<u32>, offset: u32, output: &mut Vec<u32>) {
    let filter_impl = get_best_available_instruction_set();
    filter_impl.filter_vec_in_place(range, offset, output);
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_get_best_available_instruction_set() {
        // This does not test much unfortunately.
        // We just make sure the function returns without crashing and returns the same result.
        let instruction_set = get_best_available_instruction_set();
        assert_eq!(get_best_available_instruction_set(), instruction_set);
    }

    // Every variant must survive the round trip through its `u8` code.
    #[cfg(target_arch = "x86_64")]
    #[test]
    fn test_instruction_set_to_code_from_code() {
        for instruction_set in [
            FilterImplPerInstructionSet::AVX2,
            FilterImplPerInstructionSet::Scalar,
        ] {
            let code = instruction_set as u8;
            assert_eq!(instruction_set, FilterImplPerInstructionSet::from(code));
        }
    }

    // Filtering an empty vector leaves it empty.
    fn test_filter_impl_empty_aux(filter_impl: FilterImplPerInstructionSet) {
        let mut output = vec![];
        filter_impl.filter_vec_in_place(0..=u32::MAX, 0, &mut output);
        assert_eq!(&output, &[]);
    }

    // Nine values: one complete 8-lane word plus a remainder of one value.
    // The result holds the positions of the values inside `3..=10`.
    fn test_filter_impl_simple_aux(filter_impl: FilterImplPerInstructionSet) {
        let mut output = vec![3, 2, 1, 5, 11, 2, 5, 10, 2];
        filter_impl.filter_vec_in_place(3..=10, 0, &mut output);
        assert_eq!(&output, &[0, 3, 6, 7]);
    }

    // Same input as above, but all the positions are shifted by `offset`.
    fn test_filter_impl_simple_aux_shifted(filter_impl: FilterImplPerInstructionSet) {
        let mut output = vec![3, 2, 1, 5, 11, 2, 5, 10, 2];
        filter_impl.filter_vec_in_place(3..=10, 10, &mut output);
        assert_eq!(&output, &[10, 13, 16, 17]);
    }

    // Values and bounds above `i32::MAX` must be compared as unsigned.
    fn test_filter_impl_simple_outside_i32_range(filter_impl: FilterImplPerInstructionSet) {
        let mut output = vec![u32::MAX, i32::MAX as u32 + 1, 0, 1, 3, 1, 1, 1, 1];
        filter_impl.filter_vec_in_place(1..=i32::MAX as u32 + 1u32, 0, &mut output);
        assert_eq!(&output, &[1, 3, 4, 5, 6, 7, 8]);
    }

    // Runs all the cases above against the given implementation.
    fn test_filter_impl_test_suite(filter_impl: FilterImplPerInstructionSet) {
        test_filter_impl_empty_aux(filter_impl);
        test_filter_impl_simple_aux(filter_impl);
        test_filter_impl_simple_aux_shifted(filter_impl);
        test_filter_impl_simple_outside_i32_range(filter_impl);
    }

    // Silently passes when the CPU running the test does not support AVX2.
    #[test]
    #[cfg(target_arch = "x86_64")]
    fn test_filter_implementation_avx2() {
        if FilterImplPerInstructionSet::AVX2.is_available() {
            test_filter_impl_test_suite(FilterImplPerInstructionSet::AVX2);
        }
    }

    #[test]
    fn test_filter_implementation_scalar() {
        test_filter_impl_test_suite(FilterImplPerInstructionSet::Scalar);
    }

    // The AVX2 and scalar implementations must agree on arbitrary ranges
    // (including ranges with `start > end`) and on vectors of up to 29
    // values.
    #[cfg(target_arch = "x86_64")]
    proptest::proptest! {
        #[test]
        fn test_filter_compare_scalar_and_avx2_impl_proptest(
            start in proptest::prelude::any::<u32>(),
            end in proptest::prelude::any::<u32>(),
            offset in 0u32..2u32,
            mut vals in proptest::collection::vec(0..u32::MAX, 0..30)) {
            if FilterImplPerInstructionSet::AVX2.is_available() {
                let mut vals_clone = vals.clone();
                FilterImplPerInstructionSet::AVX2.filter_vec_in_place(start..=end, offset, &mut vals);
                FilterImplPerInstructionSet::Scalar.filter_vec_in_place(start..=end, offset, &mut vals_clone);
                assert_eq!(&vals, &vals_clone);
            }
       }
    }
}


================================================
FILE: bitpacker/src/filter_vec/scalar.rs
================================================
use std::ops::RangeInclusive;

/// Scalar implementation of the in-place filter.
///
/// On entry, `output` holds the values to test. On exit, it holds
/// `offset + i` for every position `i` whose value was inside `range`, in
/// increasing order of `i`, and is truncated to the number of matches.
pub fn filter_vec_in_place(range: RangeInclusive<u32>, offset: u32, output: &mut Vec<u32>) {
    // Branch-free compaction: the id is always written at the cursor, but
    // the cursor only moves forward when the value is kept. The cursor is
    // never ahead of `idx`, so no unread value gets overwritten.
    let mut num_kept = 0usize;
    for idx in 0..output.len() {
        let is_kept = range.contains(&output[idx]);
        output[num_kept] = offset + idx as u32;
        num_kept += usize::from(is_kept);
    }
    output.truncate(num_kept);
}


================================================
FILE: bitpacker/src/lib.rs
================================================
mod bitpacker;
mod blocked_bitpacker;
mod filter_vec;

use std::cmp::Ordering;

pub use crate::bitpacker::{BitPacker, BitUnpacker};
pub use crate::blocked_bitpacker::BlockedBitpacker;

/// Computes the number of bits that will be used for bitpacking.
///
/// In general, this is the minimum number of bits required to represent
/// the amplitude `n`.
///
/// e.g. If the amplitude is 10, all values fit on 4 bits.
///
/// There is one exception. For optimization reasons, a packed value must
/// span over at most 8 bytes.
///
/// Spanning over 9 bytes would be possible otherwise, for instance with an
/// amplitude of 63 bits: the second value would start on bit 63 (which
/// belongs to byte 7) and end in byte 15, hence 9 bytes (from byte 7 to
/// byte 15 included).
///
/// To avoid this, the number of bits is forced to 64 whenever the minimum
/// is greater than `64 - 8 = 56` bits.
///
/// Note that this only affects rare use cases with a very large range of
/// values. Even then, the extra cost is at most 12% compared to the
/// optimal number of bits.
pub fn compute_num_bits(n: u64) -> u8 {
    const MAX_PACKED_WIDTH: u32 = 64 - 8;
    let amplitude = u64::BITS - n.leading_zeros();
    if amplitude > MAX_PACKED_WIDTH {
        return 64;
    }
    amplitude as u8
}

/// Computes the `(min, max)` of an iterator of `PartialOrd` values.
/// Returns `None` if the iterator yields no value that is comparable to
/// itself.
///
/// For values implementing `Ord` (in a way consistent with their
/// `PartialOrd` impl), this function behaves as expected.
///
/// For values with a partial ordering only, the behavior is non-trivial
/// and may depend on the order of the values.
/// For floats however, it simply returns the same result as if the NaN
/// values were skipped.
pub fn minmax<I, T>(mut vals: I) -> Option<(T, T)>
where
    I: Iterator<Item = T>,
    T: Copy + PartialOrd,
{
    // The seed is the first value that is equal to itself: this skips the
    // leading NaN values when working with a float type.
    let seed = vals.find(|val| val.partial_cmp(val) == Some(Ordering::Equal))?;
    let min_and_max = vals.fold((seed, seed), |(min_so_far, max_so_far), val| {
        // A value that cannot be compared (e.g. NaN) replaces neither bound.
        let is_new_min = val.partial_cmp(&min_so_far) == Some(Ordering::Less);
        let is_new_max = val.partial_cmp(&max_so_far) == Some(Ordering::Greater);
        (
            if is_new_min { val } else { min_so_far },
            if is_new_max { val } else { max_so_far },
        )
    });
    Some(min_and_max)
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_compute_num_bits() {
        assert_eq!(compute_num_bits(1), 1u8);
        assert_eq!(compute_num_bits(0), 0u8);
        assert_eq!(compute_num_bits(2), 2u8);
        assert_eq!(compute_num_bits(3), 2u8);
        assert_eq!(compute_num_bits(4), 3u8);
        assert_eq!(compute_num_bits(255), 8u8);
        assert_eq!(compute_num_bits(256), 9u8);
        assert_eq!(compute_num_bits(5_000_000_000), 33u8);
    }

    /// Amplitudes of up to 56 bits are kept as is; anything wider is
    /// rounded up to 64 bits.
    #[test]
    fn test_compute_num_bits_above_56_bits() {
        assert_eq!(compute_num_bits((1u64 << 56) - 1), 56u8);
        assert_eq!(compute_num_bits(1u64 << 56), 64u8);
        assert_eq!(compute_num_bits(1u64 << 63), 64u8);
        assert_eq!(compute_num_bits(u64::MAX), 64u8);
    }

    #[test]
    fn test_minmax_empty() {
        let vals: Vec<u32> = vec![];
        assert_eq!(minmax(vals.into_iter()), None);
    }

    #[test]
    fn test_minmax_one() {
        assert_eq!(minmax(vec![1].into_iter()), Some((1, 1)));
    }

    #[test]
    fn test_minmax_two() {
        assert_eq!(minmax(vec![1, 2].into_iter()), Some((1, 2)));
        assert_eq!(minmax(vec![2, 1].into_iter()), Some((1, 2)));
    }

    #[test]
    fn test_minmax_nan() {
        assert_eq!(
            minmax(vec![f64::NAN, 1f64, 2f64].into_iter()),
            Some((1f64, 2f64))
        );
        assert_eq!(
            minmax(vec![2f64, f64::NAN, 1f64].into_iter()),
            Some((1f64, 2f64))
        );
        assert_eq!(
            minmax(vec![2f64, 1f64, f64::NAN].into_iter()),
            Some((1f64, 2f64))
        );
    }

    /// With nothing but NaN values, there is no min nor max to return.
    #[test]
    fn test_minmax_only_nan() {
        assert_eq!(minmax(vec![f64::NAN, f64::NAN].into_iter()), None);
    }

    #[test]
    fn test_minmax_inf() {
        assert_eq!(
            minmax(vec![f64::INFINITY, 1f64, 2f64].into_iter()),
            Some((1f64, f64::INFINITY))
        );
        assert_eq!(
            minmax(vec![-f64::INFINITY, 1f64, 2f64].into_iter()),
            Some((-f64::INFINITY, 2f64))
        );
        assert_eq!(
            minmax(vec![2f64, f64::INFINITY, 1f64].into_iter()),
            Some((1f64, f64::INFINITY))
        );
        assert_eq!(
            minmax(vec![2f64, 1f64, -f64::INFINITY].into_iter()),
            Some((-f64::INFINITY, 2f64))
        );
    }
}


================================================
FILE: cliff.toml
================================================
# configuration file for git-cliff
# see https://github.com/orhun/git-cliff#configuration-file

[remote.github]
owner = "quickwit-oss"
repo = "tantivy"

[changelog]
# changelog header
header = """
"""
# template for the changelog body
# https://tera.netlify.app/docs/#introduction
body = """
## What's Changed

{%- if version %} in {{ version }}{%- endif -%}
{% for commit in commits %}
  {% if commit.remote.pr_title -%}
    {%- set commit_message = commit.remote.pr_title -%}
  {%- else -%}
    {%- set commit_message = commit.message -%}
  {%- endif -%}
  - {{ commit_message | split(pat="\n") | first | trim }}\
    {% if commit.remote.pr_number %} \
      [#{{ commit.remote.pr_number }}]({{ self::remote_url() }}/pull/{{ commit.remote.pr_number }}){% if commit.remote.username %}(@{{ commit.remote.username }}){%- endif -%} \
    {%- endif %}
{%- endfor -%}

{% if github.contributors | filter(attribute="is_first_time", value=true) | length != 0 %}
  {% raw %}\n{% endraw -%}
  ## New Contributors
{%- endif %}\
{% for contributor in github.contributors | filter(attribute="is_first_time", value=true) %}
  * @{{ contributor.username }} made their first contribution
    {%- if contributor.pr_number %} in \
      [#{{ contributor.pr_number }}]({{ self::remote_url() }}/pull/{{ contributor.pr_number }}) \
    {%- endif %}
{%- endfor -%}

{% if version %}
    {% if previous.version %}
      **Full Changelog**: {{ self::remote_url() }}/compare/{{ previous.version }}...{{ version }}
    {% endif %}
{% else -%}
  {% raw %}\n{% endraw %}
{% endif %}

{%- macro remote_url() -%}
  https://github.com/{{ remote.github.owner }}/{{ remote.github.repo }}
{%- endmacro -%}
"""
# remove the leading and trailing whitespace from the template
trim = true
# changelog footer
footer = """
"""

postprocessors = [
]

[git]
# parse the commits based on https://www.conventionalcommits.org
# This is required or commit.message contains the whole commit message and not just the title
conventional_commits = false
# filter out the commits that are not conventional
filter_unconventional = true
# process each line of a commit as an individual commit
split_commits = false
# regex for preprocessing the commit messages
commit_preprocessors = [
    { pattern = '\((\w+\s)?#([0-9]+)\)', replace = ""},
]
#link_parsers = [
    #{ pattern = "#(\\d+)", href = "https://github.com/quickwit-oss/tantivy/pulls/$1"},
#]
# regex for parsing and grouping commits
# protect breaking changes from being skipped due to matching a skipping commit_parser
protect_breaking_commits = false
# filter out the commits that are not matched by commit parsers
filter_commits = false
# glob pattern for matching git tags
tag_pattern = "v[0-9]*"
# regex for skipping tags
skip_tags = "v0.1.0-beta.1"
# regex for ignoring tags
ignore_tags = ""
# sort the tags topologically
topo_order = false
# sort the commits inside sections by oldest/newest order
sort_commits = "newest"
# limit the number of commits included in the changelog.
# limit_commits = 42


================================================
FILE: columnar/Cargo.toml
================================================
[package]
name = "tantivy-columnar"
version = "0.6.0"
edition = "2024"
license = "MIT"
homepage = "https://github.com/quickwit-oss/tantivy"
repository = "https://github.com/quickwit-oss/tantivy"
description = "column oriented storage for tantivy"
categories = ["database-implementations", "data-structures", "compression"]

[dependencies]
itertools = "0.14.0"
fastdivide = "0.4.0"

stacker = { version= "0.6", path = "../stacker", package="tantivy-stacker"}
sstable = { version= "0.6", path = "../sstable", package = "tantivy-sstable" }
common = { version= "0.10", path = "../common", package = "tantivy-common" }
tantivy-bitpacker = { version= "0.9", path = "../bitpacker/" }
serde = "1.0.152"
downcast-rs = "2.0.1"

[dev-dependencies]
proptest = "1"
more-asserts = "0.3.1"
rand = "0.9"
binggan = "0.14.0"

[[bench]]
name = "bench_merge"
harness = false

[[bench]]
name = "bench_access"
harness = false

[[bench]]
name = "bench_first_vals"
harness = false

[[bench]]
name = "bench_values_u64"
harness = false

[[bench]]
name = "bench_values_u128"
harness = false

[[bench]]
name = "bench_create_column_values"
harness = false

[[bench]]
name = "bench_column_values_get"
harness = false

[[bench]]
name = "bench_optional_index"
harness = false

[features]
zstd-compression = ["sstable/zstd-compression"]


================================================
FILE: columnar/README.md
================================================
# Columnar format

This crate describes columnar format used in tantivy.

## Goals

This format is special in the following way.
- it needs to be compact
- accessing a specific column does not require loading the entire columnar. It can be done in 2 to 3 random accesses.
- columns of several types can be associated with the same column name.
- it needs to support columns with different types `(str, u64, i64, f64)`
and different cardinality `(required, optional, multivalued)`.
- columns, once loaded, offer cheap random access.
- it is designed to allow range queries.

# Coercion rules

Users can create a columnar by inserting rows to a `ColumnarWriter`,
and serializing it into a `Write` object.
Nothing prevents a user from recording values with different type to the same `column_name`.

In that case, `tantivy-columnar`'s behavior is as follows:
- JsonValues are grouped into 3 types (String, Number, bool).
Values that correspond to different groups are mapped to different columns. For instance, String values are treated independently
from Number or boolean values. `tantivy-columnar` will simply emit several columns associated to a given column_name.
- Only one column for a given json value type is emitted. If number values with different number types are recorded (e.g. u64, i64, f64),
`tantivy-columnar` will pick the first type that can represent the set of appended values, with the following priority order (`i64`, `u64`, `f64`).
`i64` is picked over `u64` as it is likely to yield fewer changes of type. Most use cases strictly requiring `u64` show the
restriction on 50% of the values (e.g. a 64-bit hash). On the other hand, a lot of use cases can show rare negative values.

# Columnar format

This columnar format may have more than one column (with different types) associated to the same `column_name` (see [Coercion rules](#coercion-rules) above).
The `(column_name, column_type)` couple however uniquely identifies a column.
That couple is serialized as a column `column_key`.  The format of that key is:
`[column_name][ZERO_BYTE][column_type_header: u8]`

```
COLUMNAR:=
    [COLUMNAR_DATA]
    [COLUMNAR_KEY_TO_DATA_INDEX]
    [COLUMNAR_FOOTER];


# Columns are sorted by their column key.
COLUMNAR_DATA:=
    [COLUMN_DATA]+;

COLUMNAR_FOOTER := [RANGE_SSTABLE_BYTES_LEN: 8 bytes little endian]

```

The columnar file starts by the actual column data, concatenated one after the other,
sorted by column key.

An sstable associates
`(column name, column_cardinality, column_type)` to a range of bytes.

Column name may not contain the zero byte `\0`.

Listing all columns associated to `column_name` can therefore
be done by listing all keys prefixed by
`[column_name][ZERO_BYTE]`

The associated range of bytes refer to a range of bytes

This crate exposes a columnar format for tantivy.
This format is described in README.md


The crate introduces the following concepts.

`Columnar` is an equivalent of a dataframe.
It maps `column_key` to `Column`.

A `Column<T>` associates a `RowId` (u32) to any
number of values.

This is made possible by wrapping a `ColumnIndex` and a `ColumnValue` object.
The `ColumnValue<T>` represents a mapping that associates each `RowId` to
exactly one single value.

The `ColumnIndex` then maps each RowId to a set of `RowId` in the
`ColumnValue`.

For optimization and compression purposes, the `ColumnIndex` has three
possible representations, each for a different cardinality.

- Full

All RowId have exactly one value. The ColumnIndex is the trivial mapping.

- Optional

All RowIds can have at most one value. The ColumnIndex is the trivial mapping `ColumnRowId -> Option<ColumnValueRowId>`.

- Multivalued

All RowIds can have any number of values.
The column index is mapping values to a range.


All these objects are implemented and unit tested independently
in their own module:

- columnar
- column_index
- column_values
- column


================================================
FILE: columnar/benches/bench_access.rs
================================================
use binggan::{InputGroup, black_box};
use common::*;
use tantivy_columnar::Column;

pub mod common;

const NUM_DOCS: u32 = 2_000_000;

/// Generates a columnar holding a single `"price"` column with the given
/// cardinality and number of docs, then opens the first column registered
/// under that name through `open_u64_lenient`.
///
/// Panics if the column cannot be read or opened.
pub fn generate_columnar_and_open(card: Card, num_docs: u32) -> Column {
    const COLUMN_NAME: &str = "price";
    let columnar = generate_columnar_with_name(card, num_docs, COLUMN_NAME);
    let handles = columnar.read_columns(COLUMN_NAME).unwrap();
    let maybe_column = handles[0].open_u64_lenient().unwrap();
    maybe_column.unwrap()
}

fn main() {
    let mut inputs = Vec::new();

    let mut add_card = |card1: Card| {
        inputs.push((
            card1.to_string(),
            generate_columnar_and_open(card1, NUM_DOCS),
        ));
    };

    add_card(Card::MultiSparse);
    add_card(Card::Multi);
    add_card(Card::Sparse);
    add_card(Card::Dense);
    add_card(Card::Full);

    bench_group(InputGroup::new_with_inputs(inputs));
}

/// Registers two column access benchmarks on `runner` and runs the group.
///
/// Both benchmarks walk over the doc ids `0..NUM_DOCS` and sum the values they
/// read, passing the sum to `black_box` so the reads are not optimized away.
fn bench_group(mut runner: InputGroup<Column>) {
    // Reads every value of every doc, one doc at a time.
    runner.register("access_values_for_doc", |column| {
        let mut sum = 0;
        for i in 0..NUM_DOCS {
            for value in column.values_for_doc(i) {
                sum += value;
            }
        }
        black_box(sum);
    });
    // Reads docs in batches of `BLOCK_SIZE` consecutive doc ids via `first_vals`.
    runner.register("access_first_vals", |column| {
        let mut sum = 0;
        const BLOCK_SIZE: usize = 32;
        // Scratch buffers, allocated once and reused for every batch.
        let mut docs = vec![0; BLOCK_SIZE];
        let mut buffer = vec![None; BLOCK_SIZE];
        for i in (0..NUM_DOCS).step_by(BLOCK_SIZE) {
            // fill docs
            #[allow(clippy::needless_range_loop)]
            for idx in 0..BLOCK_SIZE {
                docs[idx] = idx as u32 + i;
            }

            column.first_vals(&docs, &mut buffer);
            // Entries left as `None` contribute nothing to the sum.
            for val in buffer.iter() {
                let Some(val) = val else { continue };
                sum += *val;
            }
        }

        black_box(sum);
    });
    runner.run();
}


================================================
FILE: columnar/benches/bench_column_values_get.rs
================================================
use std::sync::Arc;

use binggan::{InputGroup, black_box};
use rand::rngs::StdRng;
use rand::{Rng, SeedableRng};
use tantivy_columnar::ColumnValues;
use tantivy_columnar::column_values::{CodecType, serialize_and_load_u64_based_column_values};

/// Produces the benchmark dataset: a noisy increasing sequence with a few
/// outliers spliced in.
///
/// The generator is seeded with a constant, so every call yields the same data.
fn get_data() -> Vec<u64> {
    let mut rng = StdRng::seed_from_u64(2u64);

    // Base sequence: each number in `100..55_000` plus a random `u8` offset.
    let mut values: Vec<u64> = Vec::new();
    for num in 100..55_000_u64 {
        values.push(num + rng.random::<u8>() as u64);
    }

    // One large value at the end, then outliers inserted at fixed positions.
    values.push(99_000);
    let outliers: [(usize, u64); 5] = [
        (1000, 2000),
        (2000, 100),
        (3000, 4100),
        (4000, 100),
        (5000, 800),
    ];
    for (position, outlier) in outliers {
        values.insert(position, outlier);
    }
    values
}

/// Yields the positions `0, 1, ..., 19_999` looked up by the benchmark.
///
/// Marked `#[inline(never)]` so the iterator is produced by an actual call.
#[inline(never)]
fn value_iter() -> impl Iterator<Item = u64> {
    const NUM_LOOKUPS: u64 = 20_000;
    0..NUM_LOOKUPS
}

type Col = Arc<dyn ColumnValues<u64>>;

/// Benchmarks `get_val` on the same dataset serialized with each codec.
fn main() {
    let data = get_data();
    // One input per codec: the data is serialized with that single codec and
    // loaded back as a `ColumnValues` object.
    let inputs: Vec<(String, Col)> = vec![
        (
            "bitpacked".to_string(),
            serialize_and_load_u64_based_column_values(&data.as_slice(), &[CodecType::Bitpacked]),
        ),
        (
            "linear".to_string(),
            serialize_and_load_u64_based_column_values(&data.as_slice(), &[CodecType::Linear]),
        ),
        (
            "blockwise_linear".to_string(),
            serialize_and_load_u64_based_column_values(
                &data.as_slice(),
                &[CodecType::BlockwiseLinear],
            ),
        ),
    ];

    let mut group: InputGroup<Col> = InputGroup::new_with_inputs(inputs);

    // Looks up every position produced by `value_iter` and sums the results;
    // `wrapping_add` keeps the accumulation free of overflow panics.
    group.register("fastfield_get", |col: &Col| {
        let mut sum = 0u64;
        for pos in value_iter() {
            sum = sum.wrapping_add(col.get_val(pos as u32));
        }
        black_box(sum);
    });

    group.run();
}


================================================
FILE: columnar/benches/bench_create_column_values.rs
================================================
use binggan::{InputGroup, black_box};
use rand::rngs::StdRng;
use rand::{Rng, SeedableRng};
use tantivy_columnar::column_values::{CodecType, serialize_u64_based_column_values};

/// Returns the values to serialize: the numbers `100..55_000`, each shifted by
/// a random `u8`, followed by `99_000`, with five outliers inserted afterwards.
///
/// The random generator uses a fixed seed, so the output is reproducible.
fn get_data() -> Vec<u64> {
    let mut rng = StdRng::seed_from_u64(2u64);
    let mut data: Vec<u64> = Vec::new();
    data.extend((100..55_000_u64).map(|base| base + rng.random::<u8>() as u64));
    data.push(99_000);

    // Insertions are applied in this exact order; each one shifts the tail.
    const INSERTIONS: [(usize, u64); 5] = [
        (1000, 2000),
        (2000, 100),
        (3000, 4100),
        (4000, 100),
        (5000, 800),
    ];
    for &(index, value) in INSERTIONS.iter() {
        data.insert(index, value);
    }
    data
}

/// Benchmarks the serialization of the same dataset with each codec.
fn main() {
    let data = get_data();
    // Each input pairs a codec with its own copy of the data.
    let mut group: InputGroup<(CodecType, Vec<u64>)> = InputGroup::new_with_inputs(vec![
        (
            "bitpacked codec".to_string(),
            (CodecType::Bitpacked, data.clone()),
        ),
        (
            "linear codec".to_string(),
            (CodecType::Linear, data.clone()),
        ),
        (
            "blockwise linear codec".to_string(),
            (CodecType::BlockwiseLinear, data.clone()),
        ),
    ]);

    // Serializes into a fresh buffer on every run; `data.0` is the codec and
    // `data.1` the values.
    group.register("serialize column_values", |data| {
        let mut buffer = Vec::new();
        serialize_u64_based_column_values(&data.1.as_slice(), &[data.0], &mut buffer).unwrap();
        black_box(buffer.len());
    });

    group.run();
}


================================================
FILE: columnar/benches/bench_first_vals.rs
================================================
use std::sync::Arc;

use binggan::{InputGroup, black_box};
use rand::prelude::*;
use tantivy_columnar::column_values::{CodecType, serialize_and_load_u64_based_column_values};
use tantivy_columnar::*;

/// The three columns built by `get_test_columns`, one per cardinality.
struct Columns {
    /// Column read back from `"optional_values"` (a value on every other doc).
    pub optional: Column,
    /// Column read back from `"full_values"` (one value per doc).
    pub full: Column,
    /// Column read back from `"multi_values"` (two values per doc).
    pub multi: Column,
}

fn get_test_columns() -> Columns {
    let data = generate_permutation();
    let mut dataframe_writer = ColumnarWriter::default();
    for (idx, val) in data.iter().enumerate() {
        dataframe_writer.record_numerical(idx as u32, "full_values", NumericalValue::U64(*val));
        if idx % 2 == 0 {
            dataframe_writer.record_numerical(
                idx as u32,
                "optional_values",
                NumericalValue::U64(*val),
            );
        }
        dataframe_writer.record_numerical(idx as u32, "multi_values", NumericalValue::U64(*val));
        dataframe_writer.record_numerical(idx as u32, "multi_values", NumericalValue::U64(*val));
    }
    let mut buffer: Vec<u8> = Vec::new();
    dataframe_writer
        .serialize(data.len() as u32, &mut buffer)
        .unwrap();
    let columnar = ColumnarReader::open(buffer).unwrap();

    let cols: Vec<DynamicColumnHandle> = columnar.read_columns("optional_values").unwrap();
    assert_eq!(cols.len(), 1);
    let optional = cols[0].open_u64_lenient().unwrap().unwrap();
    assert_eq!(optional.index.get_cardinality(), Cardinality::Optional);

    let cols: Vec<DynamicColumnHandle> = columnar.read_columns("full_values").unwrap();
    assert_eq!(cols.len(), 1);
    let column_full = cols[0].open_u64_lenient().unwrap().unwrap();
    assert_eq!(column_full.index.get_cardinality(), Cardinality::Full);

    let cols: Vec<DynamicColumnHandle> = columnar.read_columns("multi_values").unwrap();
    assert_eq!(cols.len(), 1);
    let multi = cols[0].open_u64_lenient().unwrap().unwrap();
    assert_eq!(multi.index.get_cardinality(), Cardinality::Multivalued);

    Columns {
        optional,
        full: column_full,
        multi,
    }
}

const NUM_VALUES: u64 = 100_000;
/// Returns the numbers `0..NUM_VALUES` shuffled with a fixed seed, so every
/// call produces the same permutation.
fn generate_permutation() -> Vec<u64> {
    let mut rng = StdRng::from_seed([1u8; 32]);
    let mut values = Vec::from_iter(0u64..NUM_VALUES);
    values.shuffle(&mut rng);
    values
}

/// Serializes `column` using only `codec_type` and loads the result back as a
/// `ColumnValues` object.
pub fn serialize_and_load(column: &[u64], codec_type: CodecType) -> Arc<dyn ColumnValues<u64>> {
    let allowed_codecs = [codec_type];
    serialize_and_load_u64_based_column_values(&column, &allowed_codecs)
}

/// Benchmarks `Column::first` on a full, an optional and a multivalued column.
fn main() {
    let Columns {
        optional,
        full,
        multi,
    } = get_test_columns();

    let inputs = vec![
        ("full".to_string(), full),
        ("optional".to_string(), optional),
        ("multi".to_string(), multi),
    ];

    let mut group = InputGroup::new_with_inputs(inputs);

    // Calls `first` for every row id in `0..NUM_VALUES`; rows without a value
    // count as 0 in the sum.
    group.register("first_full_scan", |column| {
        let mut sum = 0u64;
        for i in 0..NUM_VALUES as u32 {
            let val = column.first(i);
            sum += val.unwrap_or(0);
        }
        black_box(sum);
    });

    // Fills a block of 64 entries with one `first` call per doc id in `0..64`.
    group.register("first_block_single_calls", |column| {
        let mut block: Vec<Option<u64>> = vec![None; 64];
        let fetch_docids = (0..64).collect::<Vec<_>>();
        for i in 0..fetch_docids.len() {
            block[i] = column.first(fetch_docids[i]);
        }
        black_box(block[0]);
    });

    group.run();
}


================================================
FILE: columnar/benches/bench_merge.rs
================================================
pub mod common;

use binggan::BenchRunner;
use common::{Card, generate_columnar_with_name};
use tantivy_columnar::*;

const NUM_DOCS: u32 = 100_000;

/// Benchmarks `merge_columnar` on pairs of columnars with various
/// cardinality combinations.
fn main() {
    let mut inputs = Vec::new();

    // Generates two columnars of `NUM_DOCS` docs, each with a "price" column of
    // the requested cardinality, and stores the pair under a descriptive name.
    let mut add_combo = |card1: Card, card2: Card| {
        inputs.push((
            format!("merge_{card1}_and_{card2}"),
            vec![
                generate_columnar_with_name(card1, NUM_DOCS, "price"),
                generate_columnar_with_name(card2, NUM_DOCS, "price"),
            ],
        ));
    };

    add_combo(Card::Multi, Card::Multi);
    add_combo(Card::MultiSparse, Card::MultiSparse);
    add_combo(Card::Dense, Card::Dense);
    add_combo(Card::Sparse, Card::Sparse);
    add_combo(Card::Sparse, Card::Dense);
    add_combo(Card::MultiSparse, Card::Dense);
    add_combo(Card::MultiSparse, Card::Sparse);
    add_combo(Card::Multi, Card::Dense);
    add_combo(Card::Multi, Card::Sparse);

    let mut runner: BenchRunner = BenchRunner::new();
    let mut group = runner.new_group();
    // One benchmark per pair: stack the two columnars and merge them into an
    // in-memory buffer.
    for (input_name, columnar_readers) in inputs.iter() {
        group.register_with_input(
            input_name,
            columnar_readers,
            move |columnar_readers: &Vec<ColumnarReader>| {
                let mut out = Vec::new();
                let columnar_readers = columnar_readers.iter().collect::<Vec<_>>();
                let merge_row_order = StackMergeOrder::stack(&columnar_readers[..]);

                merge_columnar(&columnar_readers, &[], merge_row_order.into(), &mut out).unwrap();
                // The closure returns the size of the merged output.
                Some(out.len() as u64)
            },
        );
    }
    group.run();
}


================================================
FILE: columnar/benches/bench_optional_index.rs
================================================
use binggan::{InputGroup, black_box};
use rand::rngs::StdRng;
use rand::{Rng, SeedableRng};
use tantivy_columnar::column_index::{OptionalIndex, Set};

const TOTAL_NUM_VALUES: u32 = 1_000_000;

/// Builds an `OptionalIndex` over `TOTAL_NUM_VALUES` rows in which each row is
/// non-null with probability `fill_ratio`.
///
/// The random generator uses a fixed seed, so a given ratio always yields the
/// same index.
fn gen_optional_index(fill_ratio: f64) -> OptionalIndex {
    let mut rng: StdRng = StdRng::from_seed([1u8; 32]);
    let mut non_null_rows: Vec<u32> = Vec::new();
    // Exactly one random draw per row, in row order.
    for row_id in 0..TOTAL_NUM_VALUES {
        if rng.random_bool(fill_ratio) {
            non_null_rows.push(row_id);
        }
    }
    OptionalIndex::for_test(TOTAL_NUM_VALUES, &non_null_rows)
}

/// Returns an iterator of increasing positions below `end`.
///
/// The cursor starts at `start` and, before each item, advances by a random
/// step drawn from `avg_step_size - avg_deviation..=avg_step_size + avg_deviation`.
/// `start` itself is therefore never yielded. Iteration stops at the first
/// position that reaches `end`. The random generator uses a fixed seed.
fn random_range_iterator(
    start: u32,
    end: u32,
    avg_step_size: u32,
    avg_deviation: u32,
) -> impl Iterator<Item = u32> {
    let mut rng: StdRng = StdRng::from_seed([1u8; 32]);
    let mut cursor = start;
    std::iter::from_fn(move || {
        let min_step = avg_step_size - avg_deviation;
        let max_step = avg_step_size + avg_deviation;
        cursor += rng.random_range(min_step..=max_step);
        (cursor < end).then_some(cursor)
    })
}

/// Returns random increasing positions in `0..num_values` whose average step
/// is `1 / (percent / 100)`, i.e. roughly `percent` percent of the positions.
///
/// Steps vary between 1 and `2 * step_size - 1`.
fn n_percent_step_iterator(percent: f32, num_values: u32) -> impl Iterator<Item = u32> {
    let step_size = (1f32 / (percent / 100.0)) as u32;
    // Largest deviation that still keeps every step at least 1.
    let max_deviation = step_size - 1;
    random_range_iterator(0, num_values, step_size, max_deviation)
}

/// Walks over `0..TOTAL_NUM_VALUES` with a constant step of `avg_step_size`
/// (zero deviation) and resolves each visited position against `codec`.
fn walk_over_data(codec: &OptionalIndex, avg_step_size: u32) -> Option<u32> {
    let positions = random_range_iterator(0, TOTAL_NUM_VALUES, avg_step_size, 0);
    walk_over_data_from_positions(codec, positions)
}

/// Calls `rank_if_exists` on `codec` for every position and returns the first
/// `Some` result, if any.
///
/// The lookup is deliberately evaluated for every position (eager `or`), even
/// once a result has been found: the lookups are what the benchmark measures.
fn walk_over_data_from_positions(
    codec: &OptionalIndex,
    positions: impl Iterator<Item = u32>,
) -> Option<u32> {
    positions.fold(None, |first_hit: Option<u32>, position| {
        first_hit.or(codec.rank_if_exists(position))
    })
}

/// Benchmarks `OptionalIndex` lookups in both directions for several fill
/// ratios.
fn main() {
    // Build separate inputs for each fill ratio.
    let inputs: Vec<(String, OptionalIndex)> = vec![
        ("fill=1%".to_string(), gen_optional_index(0.01)),
        ("fill=5%".to_string(), gen_optional_index(0.05)),
        ("fill=10%".to_string(), gen_optional_index(0.10)),
        ("fill=50%".to_string(), gen_optional_index(0.50)),
        ("fill=90%".to_string(), gen_optional_index(0.90)),
    ];

    let mut group: InputGroup<OptionalIndex> = InputGroup::new_with_inputs(inputs);

    // Translate orig->codec (rank_if_exists) with sampling
    // NOTE(review): the step sizes passed below are 100 and 1000, i.e. one
    // position out of 100 / 1000 is visited — confirm the "10pct"/"1pct"
    // labels match the intended sampling rate.
    group.register("orig_to_codec_10pct_hit", |codec: &OptionalIndex| {
        black_box(walk_over_data(codec, 100));
    });
    group.register("orig_to_codec_1pct_hit", |codec: &OptionalIndex| {
        black_box(walk_over_data(codec, 1000));
    });
    group.register("orig_to_codec_full_scan", |codec: &OptionalIndex| {
        black_box(walk_over_data_from_positions(codec, 0..TOTAL_NUM_VALUES));
    });

    // Translate codec->orig (select/select_batch) on sampled ranks
    //
    // Picks roughly `percent_hit` percent of the ranks in `0..num_non_nulls`
    // (all of them when `percent_hit` is exactly 100) and translates them in
    // place with a single `select_batch` call.
    fn bench_translate_codec_to_orig_util(codec: &OptionalIndex, percent_hit: f32) {
        let num_non_nulls = codec.num_non_nulls();
        let idxs: Vec<u32> = if percent_hit == 100.0f32 {
            (0..num_non_nulls).collect()
        } else {
            n_percent_step_iterator(percent_hit, num_non_nulls).collect()
        };
        // `select_batch` works on a mutable slice, so the ranks are copied into
        // a separate output buffer first.
        let mut output = vec![0u32; idxs.len()];
        output.copy_from_slice(&idxs[..]);
        codec.select_batch(&mut output);
        black_box(output);
    }

    group.register("codec_to_orig_0.005pct_hit", |codec: &OptionalIndex| {
        bench_translate_codec_to_orig_util(codec, 0.005);
    });
    group.register("codec_to_orig_10pct_hit", |codec: &OptionalIndex| {
        bench_translate_codec_to_orig_util(codec, 10.0);
    });
    group.register("codec_to_orig_full_scan", |codec: &OptionalIndex| {
        bench_translate_codec_to_orig_util(codec, 100.0);
    });

    group.run();
}


================================================
FILE: columnar/benches/bench_values_u128.rs
================================================
use std::ops::RangeInclusive;
use std::sync::Arc;

use binggan::{InputGroup, black_box};
use common::OwnedBytes;
use rand::rngs::StdRng;
use rand::seq::SliceRandom;
use rand::{Rng, SeedableRng, random};
use tantivy_columnar::ColumnValues;

// TODO does this make sense for IPv6 ?
/// Returns 100_000 values of the form `i + noise`, where `noise` is a random
/// `u16`, in shuffled order.
///
/// The noise comes from the unseeded `random` function, so the values differ
/// between runs; only the shuffle uses a fixed seed.
fn generate_random() -> Vec<u64> {
    let mut values: Vec<u64> = Vec::new();
    for base in 0u64..100_000u64 {
        values.push(base + random::<u16>() as u64);
    }
    let mut shuffle_rng = StdRng::from_seed([1u8; 32]);
    values.shuffle(&mut shuffle_rng);
    values
}

/// Builds a `u128` column from the values of `generate_random`, each widened
/// from `u64` to `u128`.
fn get_u128_column_random() -> Arc<dyn ColumnValues<u128>> {
    let widened: Vec<u128> = generate_random().into_iter().map(u128::from).collect();
    get_u128_column_from_data(&widened)
}

/// Serializes `data` as a `u128` column into memory and opens the serialized
/// bytes as a `ColumnValues<u128>`.
///
/// Panics if serialization or opening fails.
fn get_u128_column_from_data(data: &[u128]) -> Arc<dyn ColumnValues<u128>> {
    let mut serialized: Vec<u8> = Vec::new();
    tantivy_columnar::column_values::serialize_column_values_u128(&data, &mut serialized)
        .unwrap();
    let bytes = OwnedBytes::new(serialized);
    tantivy_columnar::column_values::open_u128_mapped::<u128>(bytes).unwrap()
}

const FIFTY_PERCENT_RANGE: RangeInclusive<u64> = 1..=50;
const SINGLE_ITEM: u64 = 90;
const SINGLE_ITEM_RANGE: RangeInclusive<u64> = 90..=90;

/// Returns 300_000 random values drawn from `1..=100` plus one extra
/// `SINGLE_ITEM`, shuffled and widened to `u128`.
///
/// Both the draws and the shuffle use the same fixed-seed generator.
fn get_data_50percent_item() -> Vec<u128> {
    let mut rng = StdRng::from_seed([1u8; 32]);

    let mut values: Vec<u64> = (0..300_000)
        .map(|_| rng.random_range(1..=100))
        .collect();
    values.push(SINGLE_ITEM);
    values.shuffle(&mut rng);
    values.into_iter().map(u128::from).collect()
}

/// Benchmarks range lookups and value access on `u128` columns.
fn main() {
    let data = get_data_50percent_item();
    let column_range = get_u128_column_from_data(&data);
    let column_random = get_u128_column_random();

    // Everything the benchmarks need, bundled into a single input.
    struct Inputs {
        // Raw values backing `column_range`; only its length is used below.
        data: Vec<u128>,
        // Column built from `data`, used by the range benchmarks.
        column_range: Arc<dyn ColumnValues<u128>>,
        // Column built from `generate_random`, used by the access benchmarks.
        column_random: Arc<dyn ColumnValues<u128>>,
    }

    let inputs = Inputs {
        data,
        column_range,
        column_random,
    };
    let mut group: InputGroup<Inputs> =
        InputGroup::new_with_inputs(vec![("u128 benches".to_string(), inputs)]);

    // Collects the row ids whose value lies in `FIFTY_PERCENT_RANGE`.
    group.register(
        "intfastfield_getrange_u128_50percent_hit",
        |inp: &Inputs| {
            let mut positions = Vec::new();
            inp.column_range.get_row_ids_for_value_range(
                *FIFTY_PERCENT_RANGE.start() as u128..=*FIFTY_PERCENT_RANGE.end() as u128,
                0..inp.data.len() as u32,
                &mut positions,
            );
            black_box(positions.len());
        },
    );

    // Collects the row ids whose value lies in `SINGLE_ITEM_RANGE`.
    group.register("intfastfield_getrange_u128_single_hit", |inp: &Inputs| {
        let mut positions = Vec::new();
        inp.column_range.get_row_ids_for_value_range(
            *SINGLE_ITEM_RANGE.start() as u128..=*SINGLE_ITEM_RANGE.end() as u128,
            0..inp.data.len() as u32,
            &mut positions,
        );
        black_box(positions.len());
    });

    // Uses the widest possible value range, so every value is inside it.
    group.register("intfastfield_getrange_u128_hit_all", |inp: &Inputs| {
        let mut positions = Vec::new();
        inp.column_range.get_row_ids_for_value_range(
            0..=u128::MAX,
            0..inp.data.len() as u32,
            &mut positions,
        );
        black_box(positions.len());
    });

    // Reads every value of the random column in order.
    group.register("intfastfield_scan_all_fflookup_u128", |inp: &Inputs| {
        let mut a = 0u128;
        for i in 0u64..inp.column_random.num_vals() as u64 {
            a += inp.column_random.get_val(i as u32);
        }
        black_box(a);
    });

    // Reads every fifth value of the random column.
    group.register("intfastfield_jumpy_stride5_u128", |inp: &Inputs| {
        let n = inp.column_random.num_vals();
        let mut a = 0u128;
        for i in (0..n / 5).map(|val| val * 5) {
            a += inp.column_random.get_val(i);
        }
        black_box(a);
    });

    group.run();
}


================================================
FILE: columnar/benches/bench_values_u64.rs
================================================
use std::ops::RangeInclusive;
use std::sync::Arc;

use binggan::{InputGroup, black_box};
use rand::prelude::*;
use tantivy_columnar::column_values::{CodecType, serialize_and_load_u64_based_column_values};
use tantivy_columnar::*;

/// Returns the numbers `0..100_000` in shuffled order.
///
/// Warning: the shuffle uses a fixed seed, so every call returns the same
/// permutation.
fn generate_permutation() -> Vec<u64> {
    let mut rng = StdRng::from_seed([1u8; 32]);
    let mut values = Vec::from_iter(0u64..100_000u64);
    values.shuffle(&mut rng);
    values
}

/// Returns the multiples of 1000 from `1_000` up to `99_999_000` in shuffled
/// order, i.e. values sharing a common divisor of 1000.
///
/// Warning: the shuffle uses a fixed seed, so every call returns the same
/// permutation.
fn generate_permutation_gcd() -> Vec<u64> {
    let mut rng = StdRng::from_seed([1u8; 32]);
    let mut multiples: Vec<u64> = Vec::new();
    for factor in 1u64..100_000u64 {
        multiples.push(factor * 1000);
    }
    multiples.shuffle(&mut rng);
    multiples
}

/// Round-trips `column` through serialization, restricted to the single codec
/// `codec_type`, and returns the loaded column values.
pub fn serialize_and_load(column: &[u64], codec_type: CodecType) -> Arc<dyn ColumnValues<u64>> {
    let codec_types = [codec_type];
    serialize_and_load_u64_based_column_values(&column, &codec_types)
}

const FIFTY_PERCENT_RANGE: RangeInclusive<u64> = 1..=50;
const SINGLE_ITEM: u64 = 90;
const SINGLE_ITEM_RANGE: RangeInclusive<u64> = 90..=90;
const ONE_PERCENT_ITEM_RANGE: RangeInclusive<u64> = 49..=49;

/// Returns 300_000 values drawn uniformly from `1..=100`, plus one extra
/// `SINGLE_ITEM`, in shuffled order and widened to `u128`.
///
/// A single fixed-seed generator drives both the draws and the shuffle.
fn get_data_50percent_item() -> Vec<u128> {
    let mut rng = StdRng::from_seed([1u8; 32]);

    let mut values: Vec<u64> = std::iter::repeat_with(|| rng.random_range(1..=100))
        .take(300_000)
        .collect();
    values.push(SINGLE_ITEM);

    values.shuffle(&mut rng);
    values.into_iter().map(u128::from).collect()
}

type VecCol = (Vec<u64>, Arc<dyn ColumnValues<u64>>);

/// Compares value access on a plain `Vec<u64>` with access through a
/// bitpacked column, for a permutation and for a permutation of multiples of
/// 1000.
fn bench_access() {
    let permutation = generate_permutation();
    let column_perm: Arc<dyn ColumnValues<u64>> =
        serialize_and_load(&permutation, CodecType::Bitpacked);

    let permutation_gcd = generate_permutation_gcd();
    let column_perm_gcd: Arc<dyn ColumnValues<u64>> =
        serialize_and_load(&permutation_gcd, CodecType::Bitpacked);

    // Each input is the raw vector (`.0`) paired with the column built from it (`.1`).
    let mut group: InputGroup<VecCol> = InputGroup::new_with_inputs(vec![
        (
            "access".to_string(),
            (permutation.clone(), column_perm.clone()),
        ),
        (
            "access_gcd".to_string(),
            (permutation_gcd.clone(), column_perm_gcd.clone()),
        ),
    ]);

    // Baseline: every 7th element of the raw vector.
    group.register("stride7_vec", |inp: &VecCol| {
        let n = inp.0.len();
        let mut a = 0u64;
        for i in (0..n / 7).map(|val| val * 7) {
            a += inp.0[i];
        }
        black_box(a);
    });

    // Baseline: every element of the raw vector.
    group.register("fullscan_vec", |inp: &VecCol| {
        let mut a = 0u64;
        for i in 0..inp.0.len() {
            a += inp.0[i];
        }
        black_box(a);
    });

    // Every 7th value, read through the column.
    group.register("stride7_column_values", |inp: &VecCol| {
        let n = inp.1.num_vals() as usize;
        let mut a = 0u64;
        for i in (0..n / 7).map(|val| val * 7) {
            a += inp.1.get_val(i as u32);
        }
        black_box(a);
    });

    // Every value, read through the column.
    group.register("fullscan_column_values", |inp: &VecCol| {
        let mut a = 0u64;
        let n = inp.1.num_vals() as usize;
        for i in 0..n {
            a += inp.1.get_val(i as u32);
        }
        black_box(a);
    });

    group.run();
}

/// Benchmarks `get_row_ids_for_value_range` on a bitpacked column for value
/// ranges of different selectivity.
fn bench_range() {
    // The generator returns `u128` values; they are narrowed back to `u64` here.
    let data_50 = get_data_50percent_item();
    let data_u64 = data_50.iter().map(|el| *el as u64).collect::<Vec<_>>();
    let column_data: Arc<dyn ColumnValues<u64>> =
        serialize_and_load(&data_u64, CodecType::Bitpacked);

    let mut group: InputGroup<Arc<dyn ColumnValues<u64>>> =
        InputGroup::new_with_inputs(vec![("dist_50pct_item".to_string(), column_data.clone())]);

    // Values in `FIFTY_PERCENT_RANGE`, searched over all rows.
    group.register(
        "fastfield_getrange_u64_50percent_hit",
        |col: &Arc<dyn ColumnValues<u64>>| {
            let mut positions = Vec::new();
            col.get_row_ids_for_value_range(FIFTY_PERCENT_RANGE, 0..col.num_vals(), &mut positions);
            black_box(positions.len());
        },
    );

    // Values in `ONE_PERCENT_ITEM_RANGE`, searched over all rows.
    group.register(
        "fastfield_getrange_u64_1percent_hit",
        |col: &Arc<dyn ColumnValues<u64>>| {
            let mut positions = Vec::new();
            col.get_row_ids_for_value_range(
                ONE_PERCENT_ITEM_RANGE,
                0..col.num_vals(),
                &mut positions,
            );
            black_box(positions.len());
        },
    );

    // Values in `SINGLE_ITEM_RANGE`, searched over all rows.
    group.register(
        "fastfield_getrange_u64_single_hit",
        |col: &Arc<dyn ColumnValues<u64>>| {
            let mut positions = Vec::new();
            col.get_row_ids_for_value_range(SINGLE_ITEM_RANGE, 0..col.num_vals(), &mut positions);
            black_box(positions.len());
        },
    );

    // Widest possible value range, so every value is inside it.
    group.register(
        "fastfield_getrange_u64_hit_all",
        |col: &Arc<dyn ColumnValues<u64>>| {
            let mut positions = Vec::new();
            col.get_row_ids_for_value_range(0..=u64::MAX, 0..col.num_vals(), &mut positions);
            black_box(positions.len());
        },
    );

    group.run();
}

/// Runs the access benchmarks followed by the range benchmarks.
fn main() {
    bench_access();
    bench_range();
}


================================================
FILE: columnar/benches/common.rs
================================================
extern crate tantivy_columnar;

use core::fmt;
use std::fmt::{Display, Formatter};

use tantivy_columnar::{ColumnarReader, ColumnarWriter};

/// Value distribution of a generated benchmark column.
pub enum Card {
    /// A value on one doc out of 13, with extra values on the first doc.
    MultiSparse,
    /// Two values on every doc.
    Multi,
    /// A value on one doc out of 13.
    Sparse,
    /// A value on one doc out of 12.
    Dense,
    /// Exactly one value on every doc.
    Full,
}

impl Display for Card {
    /// Writes the human-readable label used in benchmark names.
    fn fmt(&self, f: &mut Formatter) -> fmt::Result {
        let label = match self {
            Card::MultiSparse => "multi sparse 1/13",
            Card::Multi => "multi 2x",
            Card::Sparse => "sparse 1/13",
            Card::Dense => "dense 1/12",
            Card::Full => "full",
        };
        f.write_str(label)
    }
}
/// Generates an in-memory columnar of `num_docs` docs with a single numerical
/// column named `column_name`, populated according to `card`, and opens it.
///
/// Every recorded value is the doc id itself, except for the two extra values
/// (`10`) recorded on doc 0 for `Card::MultiSparse`.
pub fn generate_columnar_with_name(card: Card, num_docs: u32, column_name: &str) -> ColumnarReader {
    let mut writer = ColumnarWriter::default();

    // Extra values on the first doc are what make the sparse column multivalued.
    if matches!(card, Card::MultiSparse) {
        for _ in 0..2 {
            writer.record_numerical(0, column_name, 10u64);
        }
    }

    for doc in 0..num_docs {
        // Number of values to record for this doc.
        let num_values = match card {
            Card::MultiSparse | Card::Sparse if doc % 13 == 0 => 1,
            Card::Dense if doc % 12 == 0 => 1,
            Card::Full => 1,
            Card::Multi => 2,
            Card::MultiSparse | Card::Sparse | Card::Dense => 0,
        };
        for _ in 0..num_values {
            writer.record_numerical(doc, column_name, doc as u64);
        }
    }

    let mut serialized: Vec<u8> = Vec::new();
    writer.serialize(num_docs, &mut serialized).unwrap();
    ColumnarReader::open(serialized).unwrap()
}


================================================
FILE: columnar/columnar-cli/Cargo.toml
================================================
[package]
name = "tantivy-columnar-cli"
version = "0.1.0"
edition = "2021"
license = "MIT"

[dependencies]
columnar = {path="../", package="tantivy-columnar"}
serde_json = "1"
serde_json_borrow = {git="https://github.com/PSeitz/serde_json_borrow/"}

[workspace]
members = []

[profile.release]
debug = true


================================================
FILE: columnar/columnar-cli/src/main.rs
================================================
use columnar::ColumnarWriter;
use columnar::NumericalValue;
use serde_json_borrow;
use std::fs::File;
use std::io;
use std::io::BufRead;
use std::io::BufReader;
use std::time::Instant;

/// Tracks the dotted path of the JSON field currently being visited.
///
/// `path` holds every pushed segment, each one prefixed with a `.` (e.g. `.a.b`), and
/// `stack` remembers the length `path` had before each push so that `pop` can undo it.
#[derive(Default)]
struct JsonStack {
    path: String,
    stack: Vec<usize>,
}

impl JsonStack {
    /// Enters the child field `seg`, appending `.seg` to the current path.
    fn push(&mut self, seg: &str) {
        self.stack.push(self.path.len());
        self.path.push('.');
        self.path.push_str(seg);
    }

    /// Leaves the most recently pushed field. Does nothing if no field is open.
    fn pop(&mut self) {
        if let Some(len) = self.stack.pop() {
            self.path.truncate(len);
        }
    }

    /// Returns the current path without its leading `.`.
    ///
    /// When nothing has been pushed (e.g. while visiting a top-level scalar), the
    /// path is the empty string. Slicing with `[1..]` would panic in that case.
    fn path(&self) -> &str {
        self.path.strip_prefix('.').unwrap_or("")
    }
}

fn append_json_to_columnar(
    doc: u32,
    json_value: &serde_json_borrow::Value,
    columnar: &mut ColumnarWriter,
    stack: &mut JsonStack,
) -> usize {
    let mut count = 0;
    match json_value {
        serde_json_borrow::Value::Null => {}
        serde_json_borrow::Value::Bool(val) => {
            columnar.record_numerical(
                doc,
                stack.path(),
                NumericalValue::from(if *val { 1u64 } else { 0u64 }),
            );
            count += 1;
        }
        serde_json_borrow::Value::Number(num) => {
            let numerical_value: NumericalValue = if let Some(num_i64) = num.as_i64() {
                num_i64.into()
            } else if let Some(num_u64) = num.as_u64() {
                num_u64.into()
            } else if let Some(num_f64) = num.as_f64() {
                num_f64.into()
            } else {
                panic!();
            };
            count += 1;
            columnar.record_numerical(
                doc,
                stack.path(),
                numerical_value,
            );
        }
        serde_json_borrow::Value::Str(msg) => {
            columnar.record_str(
                doc,
                stack.path(),
                msg,
            );
            count += 1;
        },
        serde_json_borrow::Value::Array(vals) => {
            for val in vals {
                count += append_json_to_columnar(doc, val, columnar, stack);
            }
        },
        serde_json_borrow::Value::Object(json_map) => {
            for (child_key, child_val) in json_map {
                stack.push(child_key);
                count += append_json_to_columnar(doc, child_val, columnar, stack);
                stack.pop();
            }
        },
    }
    count
}

/// Builds a columnar out of the newline-delimited JSON file `gh_small.json`, and prints
/// timings and size statistics.
///
/// Each line that parses as JSON becomes one row. After serialization the columnar is
/// reopened, and every column larger than 1 MB is listed.
fn main() -> io::Result<()> {
    let file = File::open("gh_small.json")?;
    let mut reader = BufReader::new(file);
    let mut line = String::with_capacity(100);
    let mut columnar = columnar::ColumnarWriter::default();
    let mut doc = 0;
    let start = Instant::now();
    let mut stack = JsonStack::default();
    let mut total_count = 0;

    let start_build = Instant::now();
    loop {
        line.clear();
        let len = reader.read_line(&mut line)?;
        if len == 0 {
            break;
        }
        // Lines that are not valid JSON are skipped and do not consume a row id.
        let Ok(json_value) = serde_json::from_str::<serde_json_borrow::Value>(&line) else { continue; };
        total_count += append_json_to_columnar(doc, &json_value, &mut columnar, &mut stack);
        doc += 1;
    }
    println!("Build in {:?}", start_build.elapsed());

    println!("value count {total_count}");

    let mut buffer = Vec::new();
    let start_serialize = Instant::now();
    // `ColumnarWriter::serialize` takes the number of rows and the output writer.
    columnar.serialize(doc, &mut buffer)?;
    println!("Serialized in {:?}", start_serialize.elapsed());
    println!("num docs: {doc}, {:?}", start.elapsed());
    println!("buffer len {} MB", buffer.len() / 1_000_000);
    let columnar = columnar::ColumnarReader::open(buffer)?;
    for (column_name, dynamic_column) in columnar.list_columns()? {
        let num_bytes = dynamic_column.num_bytes();
        let typ = dynamic_column.column_type();
        // Only report the columns that weigh more than 1 MB.
        if num_bytes > 1_000_000 {
            println!("{column_name} {typ:?}  {} KB", num_bytes / 1_000);
        }
    }
    println!("{} columns", columnar.num_columns());
    Ok(())
}


================================================
FILE: columnar/columnar-cli-inspect/Cargo.toml
================================================
[package]
name = "tantivy-columnar-inspect"
version = "0.1.0"
edition = "2021"
license = "MIT"

[dependencies]
tantivy = {path="../..", package="tantivy"}
columnar = {path="../", package="tantivy-columnar"}
common = {path="../../common", package="tantivy-common"}

[workspace]
members = []

[profile.release]
debug = true
#debug-assertions = true
#overflow-checks = true


================================================
FILE: columnar/columnar-cli-inspect/src/main.rs
================================================
use columnar::ColumnarReader;
use common::file_slice::{FileSlice, WrapFile};
use std::io;
use std::path::Path;
use tantivy::directory::footer::Footer;

/// Command-line entry point: opens the columnar file given as first argument and
/// validates it.
///
/// Returns an `InvalidInput` error if no path was passed on the command line.
fn main() -> io::Result<()> {
    println!("Opens a columnar file written by tantivy and validates it.");
    let Some(path) = std::env::args().nth(1) else {
        return Err(io::Error::new(
            io::ErrorKind::InvalidInput,
            "missing argument: expected the path of the columnar file to inspect",
        ));
    };

    println!("Reading {:?}", Path::new(&path));
    let _reader = open_and_validate_columnar(&path)?;

    Ok(())
}

/// Prints summary statistics about `reader` and sanity-checks its string columns.
///
/// Every column is opened. For each string column, the number of values, the number
/// of terms in the dictionary and the largest term ordinal are printed, and every
/// ordinal is checked to be smaller than the number of terms.
///
/// Panics if the columns cannot be listed or opened, or if an ordinal is out of range.
pub fn validate_columnar_reader(reader: &ColumnarReader) {
    println!("num_rows: {}", reader.num_rows());
    let columns = reader.list_columns().unwrap();
    println!("num columns: {:?}", columns.len());
    for (col_name, column_handle) in columns {
        match column_handle.open().unwrap() {
            columnar::DynamicColumn::Str(str_column) => {
                let ord_values = &str_column.ords().values;
                let num_vals = ord_values.num_vals();
                let num_terms_dict = str_column.num_terms() as u64;
                let max_ord = ord_values.iter().max().unwrap_or_default();
                println!("{col_name:35}  num_vals {num_vals:10} \t num_terms_dict {num_terms_dict:8} max_ord: {max_ord:8}",);
                ord_values
                    .iter()
                    .for_each(|ord| assert!(ord < num_terms_dict));
            }
            // Opening the column is the only check performed on the other types.
            columnar::DynamicColumn::Bool(_)
            | columnar::DynamicColumn::I64(_)
            | columnar::DynamicColumn::U64(_)
            | columnar::DynamicColumn::F64(_)
            | columnar::DynamicColumn::IpAddr(_)
            | columnar::DynamicColumn::DateTime(_)
            | columnar::DynamicColumn::Bytes(_) => {}
        }
    }
}

/// Opens a columnar file that was written by tantivy and validates it.
///
/// The tantivy footer is stripped from the file before the remaining bytes are
/// opened as a columnar.
///
/// # Errors
///
/// Returns an error if the file cannot be opened, if its footer cannot be extracted,
/// or if the columnar itself cannot be opened.
///
/// # Panics
///
/// Panics if the validation of the opened columnar fails.
pub fn open_and_validate_columnar(path: &str) -> io::Result<ColumnarReader> {
    let wrap_file = WrapFile::new(std::fs::File::open(path)?)?;
    let slice = FileSlice::new(std::sync::Arc::new(wrap_file));
    // Failures are reported to the caller instead of panicking: this function
    // already returns an `io::Result`.
    let (_footer, slice) = Footer::extract_footer(slice)?;
    let reader = ColumnarReader::open(slice)?;
    validate_columnar_reader(&reader);
    Ok(reader)
}


================================================
FILE: columnar/src/TODO.md
================================================
# zero to one

* revisit line codec
* add columns from schema on merge
* Plugging JSON
* replug examples
* move datetime to quickwit common
* switch to nanos
* reintroduce the gcd map.

# Perf and Size
* remove alloc in `ord_to_term`
* multivalued range queries restart from the beginning all of the time.
* re-add ZSTD compression for dictionaries
no systematic monotonic mapping
consider removing multilinear
f32?
adhoc solution for bool?
add metrics helper for aggregate. sum(row_id)
review inline absence/presence
improve perf of select using PDEP
compare with roaring bitmap/elias fano etc etc.
SIMD range? (see blog post)
Add alignment?
Consider another codec to bridge the gap between few and 5k elements

# Cleanup and rationalization
in benchmark, unify percent vs ratio, f32 vs f64.
investigate if should have better errors? io::Error is overused at the moment.
rename rank/select in unit tests
Review the public API via cargo doc
go through TODOs
remove all  doc_id occurrences -> row_id
use the rank & select naming in unit tests branch.
multi-linear -> blockwise
linear codec -> simply a multiplication for the index column
rename columnar to something more explicit, like column_dictionary or columnar_table
rename fastfield -> column
document changes
rationalization FastFieldValue, HasColumnType
isolate u128_based and uniform naming

# Other
fix and enhance columnar-cli

# Santa Claus
autodetect datetime ipaddr, plug customizable tokenizer.


================================================
FILE: columnar/src/block_accessor.rs
================================================
use std::cmp::Ordering;

use crate::{Column, DocId, RowId};

/// Reusable buffers to fetch the values of a block of docs from a [`Column`].
///
/// The buffers are refreshed by `fetch_block` / `fetch_block_with_missing` and read
/// back through `iter_vals` / `iter_docid_vals`.
#[derive(Debug, Default, Clone)]
pub struct ColumnBlockAccessor<T> {
    /// Values fetched by the last call to `fetch_block`.
    val_cache: Vec<T>,
    /// For columns that are not full: the docid of each entry of `val_cache`.
    docid_cache: Vec<DocId>,
    /// Scratch buffer holding the docs for which no value was found.
    missing_docids_cache: Vec<DocId>,
    /// For columns that are not full: the row ids the values were read from.
    row_id_cache: Vec<RowId>,
}

impl<T: PartialOrd + Copy + std::fmt::Debug + Send + Sync + 'static + Default>
    ColumnBlockAccessor<T>
{
    /// Loads the values of `docs` from `accessor` into the internal buffers.
    ///
    /// For a full column, the values are read directly using the docids. Otherwise
    /// the docs are first translated into (docid, row id) pairs, and the values are
    /// read from those row ids.
    #[inline]
    pub fn fetch_block<'a>(&'a mut self, docs: &'a [u32], accessor: &Column<T>) {
        if accessor.index.get_cardinality().is_full() {
            self.val_cache.resize(docs.len(), T::default());
            accessor.values.get_vals(docs, &mut self.val_cache);
            return;
        }
        self.docid_cache.clear();
        self.row_id_cache.clear();
        accessor.row_ids_for_docs(docs, &mut self.docid_cache, &mut self.row_id_cache);
        let num_rows = self.row_id_cache.len();
        self.val_cache.resize(num_rows, T::default());
        accessor
            .values
            .get_vals(&self.row_id_cache, &mut self.val_cache);
    }

    /// Same as `fetch_block`, but docs without any value additionally get the
    /// `missing` value, if one is provided.
    ///
    /// The docs without a value are appended at the end of the docid buffer, along
    /// with `missing` at the end of the value buffer.
    #[inline]
    pub fn fetch_block_with_missing(
        &mut self,
        docs: &[u32],
        accessor: &Column<T>,
        missing: Option<T>,
    ) {
        self.fetch_block(docs, accessor);
        // A full column has no missing values.
        if accessor.index.get_cardinality().is_full() {
            return;
        }
        let missing = match missing {
            Some(missing) => missing,
            None => return,
        };

        // Comparing the number of fetched docids with the number of docs is enough to
        // detect missing docs, except for multivalued columns which always need a scan.
        let needs_scan = accessor.index.get_cardinality().is_multivalue()
            || docs.len() != self.docid_cache.len();
        if !needs_scan {
            return;
        }

        self.missing_docids_cache.clear();
        let missing_docids = &mut self.missing_docids_cache;
        let vals = &mut self.val_cache;
        find_missing_docs(docs, &self.docid_cache, |doc| {
            missing_docids.push(doc);
            vals.push(missing);
        });
        self.docid_cache
            .extend(self.missing_docids_cache.iter().copied());
    }

    /// Returns an iterator over the fetched values.
    #[inline]
    pub fn iter_vals(&self) -> impl Iterator<Item = T> + '_ {
        self.val_cache.iter().copied()
    }

    #[inline]
    /// Returns an iterator over the docids and values
    /// The passed in `docs` slice needs to be the same slice that was passed to `fetch_block` or
    /// `fetch_block_with_missing`.
    ///
    /// The docs is used if the column is full (each docs has exactly one value), otherwise the
    /// internal docid vec is used for the iterator, which e.g. may contain duplicate docs.
    pub fn iter_docid_vals<'a>(
        &'a self,
        docs: &'a [u32],
        accessor: &Column<T>,
    ) -> impl Iterator<Item = (DocId, T)> + 'a + use<'a, T> {
        let doc_ids: &'a [u32] = if accessor.index.get_cardinality().is_full() {
            docs
        } else {
            &self.docid_cache
        };
        doc_ids.iter().copied().zip(self.val_cache.iter().copied())
    }
}

/// Calls `callback` with every doc of `docs` that has no matching entry in `hits`.
///
/// Both `docs` and `hits` are expected to be sorted, and `hits` to only contain docids
/// present in `docs`. The missing docs are reported in the order of `docs`.
fn find_missing_docs<F>(docs: &[u32], hits: &[u32], mut callback: F)
where F: FnMut(u32) {
    // Position of the first hit that has not been consumed yet.
    let mut hit_pos = 0;
    for &doc in docs {
        let is_hit = loop {
            match hits.get(hit_pos).map(|hit| hit.cmp(&doc)) {
                // This hit is before `doc`: skip it.
                Some(Ordering::Less) => hit_pos += 1,
                // `doc` is matched by this hit, which gets consumed.
                Some(Ordering::Equal) => {
                    hit_pos += 1;
                    break true;
                }
                // The remaining hits (if any) are all after `doc`.
                Some(Ordering::Greater) | None => break false,
            }
        };
        if !is_hit {
            callback(doc);
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Runs `find_missing_docs` and gathers the reported docids, in callback order.
    fn collect_missing(docs: &[u32], hits: &[u32]) -> Vec<u32> {
        let mut missing = Vec::new();
        find_missing_docs(docs, hits, |doc| missing.push(doc));
        missing
    }

    #[test]
    fn test_find_missing_docs() {
        let docs: Vec<u32> = (1..=10).collect();
        let hits = [2, 4, 6, 8, 10];
        assert_eq!(collect_missing(&docs, &hits), vec![1, 3, 5, 7, 9]);
    }

    #[test]
    fn test_find_missing_docs_empty() {
        let hits = [2, 4, 6, 8, 10];
        assert_eq!(collect_missing(&[], &hits), Vec::<u32>::new());
    }

    #[test]
    fn test_find_missing_docs_all_missing() {
        let docs = [1, 2, 3, 4, 5];
        assert_eq!(collect_missing(&docs, &[]), vec![1, 2, 3, 4, 5]);
    }
}


================================================
FILE: columnar/src/column/dictionary_encoded.rs
================================================
use std::ops::Deref;
use std::sync::Arc;
use std::{fmt, io};

use sstable::{Dictionary, VoidSSTable};

use crate::RowId;
use crate::column::Column;

/// Dictionary encoded column.
///
/// The column simply gives access to a regular u64-column in which the values
/// are term ordinals.
///
/// These ordinals are ids that uniquely identify the bytes stored in the column:
/// the `dictionary` maps an ordinal back to its bytes. These ordinals are small.
///
/// NOTE(review): the previous wording stated that ordinals are "sorted in the same
/// order as the term_ord_column"; presumably this meant that ordinals follow the
/// order of the terms in the dictionary — confirm.
#[derive(Clone)]
pub struct BytesColumn {
    pub(crate) dictionary: Arc<Dictionary<VoidSSTable>>,
    pub(crate) term_ord_column: Column<u64>,
}

impl fmt::Debug for BytesColumn {
    /// Formats the term-ordinal column only; the dictionary is left out.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        let mut debug_struct = f.debug_struct("BytesColumn");
        debug_struct.field("term_ord_column", &self.term_ord_column);
        debug_struct.finish()
    }
}

impl BytesColumn {
    /// Creates a column covering `num_docs` docs, with an empty dictionary and no value.
    pub fn empty(num_docs: u32) -> BytesColumn {
        let dictionary = Arc::new(Dictionary::empty());
        let term_ord_column = Column::build_empty_column(num_docs);
        Self {
            dictionary,
            term_ord_column,
        }
    }

    /// Fills the given `output` buffer with the term associated to the ordinal `ord`.
    ///
    /// Returns `false` if the term does not exist (e.g. `term_ord` is greater or equal to the
    /// overall number of terms).
    pub fn ord_to_bytes(&self, ord: u64, output: &mut Vec<u8>) -> io::Result<bool> {
        let dictionary: &Dictionary<VoidSSTable> = &self.dictionary;
        dictionary.ord_to_term(ord, output)
    }

    /// Returns the number of rows in the column.
    pub fn num_rows(&self) -> RowId {
        self.ords().num_docs()
    }

    /// Returns an iterator over the term ordinals of the row `row_id`.
    pub fn term_ords(&self, row_id: RowId) -> impl Iterator<Item = u64> + '_ {
        self.term_ord_column.values_for_doc(row_id)
    }

    /// Returns the column of ordinals
    pub fn ords(&self) -> &Column<u64> {
        &self.term_ord_column
    }

    /// Returns the number of terms in the dictionary.
    pub fn num_terms(&self) -> usize {
        self.dictionary().num_terms()
    }

    /// Returns the dictionary mapping ordinals to terms.
    pub fn dictionary(&self) -> &Dictionary<VoidSSTable> {
        &self.dictionary
    }
}

/// A [`BytesColumn`] whose terms are read back as strings (see `ord_to_str`, which
/// checks that the term is valid UTF-8).
#[derive(Clone)]
pub struct StrColumn(BytesColumn);

impl fmt::Debug for StrColumn {
    /// Prints the wrapped term-ordinal column; the dictionary is not shown.
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let ord_column = &self.0.term_ord_column;
        write!(f, "{ord_column:?}")
    }
}

impl From<StrColumn> for BytesColumn {
    fn from(str_column: StrColumn) -> BytesColumn {
        str_column.0
    }
}

impl StrColumn {
    /// Wraps a [`BytesColumn`] so that its terms can be read as strings.
    ///
    /// No validation happens here: terms are checked to be valid UTF-8 when they are
    /// read through `ord_to_str`.
    pub fn wrap(bytes_column: BytesColumn) -> StrColumn {
        StrColumn(bytes_column)
    }

    /// Returns the dictionary mapping ordinals to terms.
    pub fn dictionary(&self) -> &Dictionary<VoidSSTable> {
        self.0.dictionary.as_ref()
    }

    /// Fills `output` with the term associated to the ordinal `term_ord`.
    ///
    /// Returns `Ok(false)` and leaves `output` empty if the dictionary reports that the
    /// term does not exist.
    ///
    /// # Errors
    ///
    /// Returns the error of the dictionary lookup if it fails, or an `InvalidData`
    /// error if the term is not valid UTF-8. `output` is left empty in both cases.
    pub fn ord_to_str(&self, term_ord: u64, output: &mut String) -> io::Result<bool> {
        // Take the bytes of `output` out to reuse its allocation. Meanwhile `output`
        // is a valid empty string, so no exit path can expose bytes that were not
        // validated, and no `unsafe` is needed.
        let mut buf = std::mem::take(output).into_bytes();
        let found = self.0.dictionary.ord_to_term(term_ord, &mut buf)?;
        if !found {
            buf.clear();
            // An empty buffer is always valid UTF-8: this hands the allocation back.
            *output = String::from_utf8(buf).unwrap_or_default();
            return Ok(false);
        }
        // TODO consider remove checks if it hurts performance.
        match String::from_utf8(buf) {
            Ok(term) => {
                *output = term;
                Ok(true)
            }
            Err(_) => Err(io::Error::new(
                io::ErrorKind::InvalidData,
                "Not valid utf-8",
            )),
        }
    }
}

impl Deref for StrColumn {
    type Target = BytesColumn;

    fn deref(&self) -> &Self::Target {
        &self.0
    }
}


================================================
FILE: columnar/src/column/mod.rs
================================================
mod dictionary_encoded;
mod serialize;

use std::fmt::{self, Debug};
use std::io::Write;
use std::ops::{Range, RangeInclusive};
use std::sync::Arc;

use common::BinarySerializable;
pub use dictionary_encoded::{BytesColumn, StrColumn};
pub use serialize::{
    open_column_bytes, open_column_str, open_column_u64, open_column_u128,
    open_column_u128_as_compact_u64, serialize_column_mappable_to_u64,
    serialize_column_mappable_to_u128,
};

use crate::column_index::{ColumnIndex, Set};
use crate::column_values::monotonic_mapping::StrictlyMonotonicMappingToInternal;
use crate::column_values::{ColumnValues, monotonic_map_column};
use crate::{Cardinality, DocId, EmptyColumnValues, MonotonicallyMappableToU64, RowId};

/// A column associating zero, one or several values of type `T` to each doc.
///
/// `index` maps a doc to the row ids of its values, and `values` stores the values
/// themselves, addressed by row id.
#[derive(Clone)]
pub struct Column<T = u64> {
    /// Maps docs to the row ids of their values.
    pub index: ColumnIndex,
    /// The values of the column, addressed by row id.
    pub values: Arc<dyn ColumnValues<T>>,
}

impl<T: Debug + PartialOrd + Send + Sync + Copy + 'static> Debug for Column<T> {
    /// Formats the column as a map from docid to the list of its values.
    /// Docs without any value are omitted.
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let mut debug_map = f.debug_map();
        for doc_id in 0..self.num_docs() {
            let vals: Vec<T> = self.values_for_doc(doc_id).collect();
            if !vals.is_empty() {
                debug_map.entry(&doc_id, &vals);
            }
        }
        debug_map.finish()
    }
}

impl<T: PartialOrd + Default> Column<T> {
    /// Builds a column covering `num_docs` docs, none of which has a value.
    pub fn build_empty_column(num_docs: u32) -> Column<T> {
        let index = ColumnIndex::Empty { num_docs };
        Column {
            index,
            values: Arc::new(EmptyColumnValues),
        }
    }
}

impl<T: MonotonicallyMappableToU64> Column<T> {
    /// Converts the column into a `u64` column by wrapping its values into the
    /// monotonic mapping of `T` to its internal representation. The index is unchanged.
    pub fn to_u64_monotonic(self) -> Column<u64> {
        let Column { index, values } = self;
        let mapping = StrictlyMonotonicMappingToInternal::<T>::new();
        Column {
            index,
            values: Arc::new(monotonic_map_column(values, mapping)),
        }
    }
}

impl<T: PartialOrd + Copy + Debug + Send + Sync + 'static> Column<T> {
    /// Returns the cardinality of the column, as reported by its index.
    #[inline]
    pub fn get_cardinality(&self) -> Cardinality {
        self.index.get_cardinality()
    }

    /// Returns the number of docs covered by the column.
    pub fn num_docs(&self) -> RowId {
        match &self.index {
            ColumnIndex::Empty { num_docs } => *num_docs,
            ColumnIndex::Full => self.values.num_vals(),
            ColumnIndex::Optional(optional_index) => optional_index.num_docs(),
            ColumnIndex::Multivalued(col_index) => {
                // The multivalued index contains all value start row_id,
                // and one extra value at the end with the overall number of rows.
                col_index.num_docs()
            }
        }
    }

    /// Returns the minimum value, as reported by the underlying values.
    pub fn min_value(&self) -> T {
        self.values.min_value()
    }

    /// Returns the maximum value, as reported by the underlying values.
    pub fn max_value(&self) -> T {
        self.values.max_value()
    }

    /// Returns the first value of `doc_id`, or `None` if the doc has no value.
    #[inline]
    pub fn first(&self, doc_id: DocId) -> Option<T> {
        self.values_for_doc(doc_id).next()
    }

    /// Load the first value for each docid in the provided slice.
    ///
    /// `output[i]` receives the first value of `docids[i]`, or `None` if that doc has
    /// no value. Slots are always overwritten, so that `output` can be reused from one
    /// call to the next without leaking stale values.
    #[inline]
    pub fn first_vals(&self, docids: &[DocId], output: &mut [Option<T>]) {
        match &self.index {
            ColumnIndex::Empty { .. } => {
                // No doc has a value: reset the slots matching `docids`.
                for slot in output.iter_mut().take(docids.len()) {
                    *slot = None;
                }
            }
            ColumnIndex::Full => self.values.get_vals_opt(docids, output),
            ColumnIndex::Optional(optional_index) => {
                for (i, docid) in docids.iter().enumerate() {
                    output[i] = optional_index
                        .rank_if_exists(*docid)
                        .map(|rowid| self.values.get_val(rowid));
                }
            }
            ColumnIndex::Multivalued(multivalued_index) => {
                for (i, docid) in docids.iter().enumerate() {
                    let range = multivalued_index.range(*docid);
                    let is_empty = range.start == range.end;
                    // Write `None` explicitly for docs without values, like the
                    // `Optional` branch does, instead of keeping the previous content.
                    output[i] = if is_empty {
                        None
                    } else {
                        Some(self.values.get_val(range.start))
                    };
                }
            }
        }
    }

    /// Translates a block of docids to row_ids.
    ///
    /// returns the row_ids and the matching docids on the same index
    /// e.g.
    /// DocId In:  [0, 5, 6]
    /// DocId Out: [0, 0, 6, 6]
    /// RowId Out: [0, 1, 2, 3]
    #[inline]
    pub fn row_ids_for_docs(
        &self,
        doc_ids: &[DocId],
        doc_ids_out: &mut Vec<DocId>,
        row_ids: &mut Vec<RowId>,
    ) {
        self.index.docids_to_rowids(doc_ids, doc_ids_out, row_ids)
    }

    /// Get an iterator over the values for the provided docid.
    #[inline]
    pub fn values_for_doc(&self, doc_id: DocId) -> impl Iterator<Item = T> + '_ {
        self.index
            .value_row_ids(doc_id)
            .map(|value_row_id: RowId| self.values.get_val(value_row_id))
    }

    /// Get the docids of values which are in the provided value and docid range.
    ///
    /// `doc_ids` is first filled with the matching row ids, which are then converted
    /// in place into docids.
    #[inline]
    pub fn get_docids_for_value_range(
        &self,
        value_range: RangeInclusive<T>,
        selected_docid_range: Range<u32>,
        doc_ids: &mut Vec<u32>,
    ) {
        // convert passed docid range to row id range
        let rowid_range = self
            .index
            .docid_range_to_rowids(selected_docid_range.clone());

        // Load rows
        self.values
            .get_row_ids_for_value_range(value_range, rowid_range, doc_ids);
        // Convert rows to docids
        self.index
            .select_batch_in_place(selected_docid_range.start, doc_ids);
    }

    /// Converts the column into column values holding, for each doc, its first value,
    /// or `default_value` if the doc has no value.
    pub fn first_or_default_col(self, default_value: T) -> Arc<dyn ColumnValues<T>> {
        Arc::new(FirstValueWithDefault {
            column: self,
            default_value,
        })
    }
}

impl BinarySerializable for Cardinality {
    /// Writes the cardinality as its code.
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> std::io::Result<()> {
        let cardinality_code = self.to_code();
        cardinality_code.serialize(writer)
    }

    /// Reads a `u8` code and converts it back into a cardinality.
    /// Fails if the code cannot be read or is not a valid cardinality code.
    fn deserialize<R: std::io::Read>(reader: &mut R) -> std::io::Result<Self> {
        let cardinality_code = u8::deserialize(reader)?;
        Ok(Cardinality::try_from_code(cardinality_code)?)
    }
}

// TODO simplify or optimize
/// Exposes a [`Column`] as column values holding, for each doc, the first value of
/// the doc, or `default_value` if the doc has no value.
struct FirstValueWithDefault<T: Copy> {
    /// The wrapped column.
    column: Column<T>,
    /// Value returned for the docs without any value.
    default_value: T,
}

impl<T: PartialOrd + Debug + Send + Sync + Copy + 'static> ColumnValues<T>
    for FirstValueWithDefault<T>
{
    /// Returns the first value of the doc `idx`, or the default value if it has none.
    #[inline(always)]
    fn get_val(&self, idx: u32) -> T {
        match self.column.first(idx) {
            Some(first_value) => first_value,
            None => self.default_value,
        }
    }

    /// Returns the minimum value of the wrapped column.
    ///
    /// NOTE(review): `default_value` is not taken into account here — confirm that
    /// callers do not expect it to be covered by the bounds.
    fn min_value(&self) -> T {
        self.column.min_value()
    }

    /// Returns the maximum value of the wrapped column.
    ///
    /// NOTE(review): `default_value` is not taken into account here either.
    fn max_value(&self) -> T {
        self.column.max_value()
    }

    /// Returns the number of docs of the wrapped column, except for an empty column
    /// for which `0` is returned.
    ///
    /// NOTE(review): `Column::num_docs` returns `num_docs` for an empty index while
    /// this returns `0` — confirm that the difference is intended.
    fn num_vals(&self) -> u32 {
        let column_index = &self.column.index;
        match column_index {
            ColumnIndex::Empty { .. } => 0u32,
            ColumnIndex::Full => self.column.values.num_vals(),
            ColumnIndex::Optional(index) => index.num_docs(),
            ColumnIndex::Multivalued(index) => index.num_docs(),
        }
    }
}


================================================
FILE: columnar/src/column/serialize.rs
================================================
use std::io;
use std::io::Write;
use std::sync::Arc;

use common::OwnedBytes;
use sstable::Dictionary;

use crate::column::{BytesColumn, Column};
use crate::column_index::{SerializableColumnIndex, serialize_column_index};
use crate::column_values::{
    CodecType, MonotonicallyMappableToU64, MonotonicallyMappableToU128,
    load_u64_based_column_values, serialize_column_values_u128, serialize_u64_based_column_values,
};
use crate::iterable::Iterable;
use crate::{StrColumn, Version};

/// Serializes a column whose values are mappable to `u128`.
///
/// The column index is written first, then the values, then the byte length of the
/// column index in little-endian order.
pub fn serialize_column_mappable_to_u128<T: MonotonicallyMappableToU128>(
    column_index: SerializableColumnIndex<'_>,
    iterable: &dyn Iterable<T>,
    output: &mut impl Write,
) -> io::Result<()> {
    let index_num_bytes = serialize_column_index(column_index, output)?;
    serialize_column_values_u128(iterable, output)?;
    let footer = index_num_bytes.to_le_bytes();
    output.write_all(&footer)
}

/// Serializes a column whose values are mappable to `u64`.
///
/// The column index is written first, then the values (using the bitpacked or the
/// blockwise linear codec), then the byte length of the column index in
/// little-endian order.
pub fn serialize_column_mappable_to_u64<T: MonotonicallyMappableToU64>(
    column_index: SerializableColumnIndex<'_>,
    column_values: &impl Iterable<T>,
    output: &mut impl Write,
) -> io::Result<()> {
    let index_num_bytes = serialize_column_index(column_index, output)?;
    let candidate_codecs = [CodecType::Bitpacked, CodecType::BlockwiseLinear];
    serialize_u64_based_column_values(column_values, &candidate_codecs, output)?;
    let footer = index_num_bytes.to_le_bytes();
    output.write_all(&footer)
}

/// Opens a column whose values are mappable to `u64`.
///
/// `bytes` is expected to hold the column index, followed by the column values,
/// followed by the byte length of the column index as a little-endian `u32`.
///
/// # Errors
///
/// Returns an `InvalidData` error if `bytes` is too short to hold that layout, and
/// forwards the errors met when opening the column index or the column values.
pub fn open_column_u64<T: MonotonicallyMappableToU64>(
    bytes: OwnedBytes,
    format_version: Version,
) -> io::Result<Column<T>> {
    const FOOTER_NUM_BYTES: usize = std::mem::size_of::<u32>();
    // Validate the lengths before splitting, so that truncated or corrupted data is
    // reported as an error.
    let total_num_bytes = bytes.as_slice().len();
    if total_num_bytes < FOOTER_NUM_BYTES {
        return Err(io::Error::new(
            io::ErrorKind::InvalidData,
            format!("column data is too short ({total_num_bytes} bytes) to hold its footer"),
        ));
    }
    let (body, column_index_num_bytes_payload) = bytes.rsplit(FOOTER_NUM_BYTES);
    let column_index_num_bytes = u32::from_le_bytes(
        column_index_num_bytes_payload
            .as_slice()
            .try_into()
            .expect("the footer was split off as exactly 4 bytes"),
    ) as usize;
    let body_num_bytes = body.as_slice().len();
    if column_index_num_bytes > body_num_bytes {
        return Err(io::Error::new(
            io::ErrorKind::InvalidData,
            format!(
                "column index length ({column_index_num_bytes} bytes) exceeds the column data \
                 ({body_num_bytes} bytes)"
            ),
        ));
    }
    let (column_index_data, column_values_data) = body.split(column_index_num_bytes);
    let column_index = crate::column_index::open_column_index(column_index_data, format_version)?;
    let column_values = load_u64_based_column_values(column_values_data)?;
    Ok(Column {
        index: column_index,
        values: column_values,
    })
}

/// Opens a column whose values are mappable to `u128`.
///
/// `bytes` is expected to hold the column index, followed by the column values,
/// followed by the byte length of the column index as a little-endian `u32`.
///
/// # Errors
///
/// Returns an `InvalidData` error if `bytes` is too short to hold that layout, and
/// forwards the errors met when opening the column index or the column values.
pub fn open_column_u128<T: MonotonicallyMappableToU128>(
    bytes: OwnedBytes,
    format_version: Version,
) -> io::Result<Column<T>> {
    const FOOTER_NUM_BYTES: usize = std::mem::size_of::<u32>();
    // Validate the lengths before splitting, so that truncated or corrupted data is
    // reported as an error.
    let total_num_bytes = bytes.as_slice().len();
    if total_num_bytes < FOOTER_NUM_BYTES {
        return Err(io::Error::new(
            io::ErrorKind::InvalidData,
            format!("column data is too short ({total_num_bytes} bytes) to hold its footer"),
        ));
    }
    let (body, column_index_num_bytes_payload) = bytes.rsplit(FOOTER_NUM_BYTES);
    let column_index_num_bytes = u32::from_le_bytes(
        column_index_num_bytes_payload
            .as_slice()
            .try_into()
            .expect("the footer was split off as exactly 4 bytes"),
    ) as usize;
    let body_num_bytes = body.as_slice().len();
    if column_index_num_bytes > body_num_bytes {
        return Err(io::Error::new(
            io::ErrorKind::InvalidData,
            format!(
                "column index length ({column_index_num_bytes} bytes) exceeds the column data \
                 ({body_num_bytes} bytes)"
            ),
        ));
    }
    let (column_index_data, column_values_data) = body.split(column_index_num_bytes);
    let column_index = crate::column_index::open_column_index(column_index_data, format_version)?;
    let column_values = crate::column_values::open_u128_mapped(column_values_data)?;
    Ok(Column {
        index: column_index,
        values: column_values,
    })
}

/// Open the column as u64.
///
/// See [`crate::column_values::open_u128_as_compact_u64`] for more details.
///
/// `bytes` is expected to hold the column index, followed by the column values,
/// followed by the byte length of the column index as a little-endian `u32`.
///
/// # Errors
///
/// Returns an `InvalidData` error if `bytes` is too short to hold that layout, and
/// forwards the errors met when opening the column index or the column values.
pub fn open_column_u128_as_compact_u64(
    bytes: OwnedBytes,
    format_version: Version,
) -> io::Result<Column<u64>> {
    const FOOTER_NUM_BYTES: usize = std::mem::size_of::<u32>();
    // Validate the lengths before splitting, so that truncated or corrupted data is
    // reported as an error.
    let total_num_bytes = bytes.as_slice().len();
    if total_num_bytes < FOOTER_NUM_BYTES {
        return Err(io::Error::new(
            io::ErrorKind::InvalidData,
            format!("column data is too short ({total_num_bytes} bytes) to hold its footer"),
        ));
    }
    let (body, column_index_num_bytes_payload) = bytes.rsplit(FOOTER_NUM_BYTES);
    let column_index_num_bytes = u32::from_le_bytes(
        column_index_num_bytes_payload
            .as_slice()
            .try_into()
            .expect("the footer was split off as exactly 4 bytes"),
    ) as usize;
    let body_num_bytes = body.as_slice().len();
    if column_index_num_bytes > body_num_bytes {
        return Err(io::Error::new(
            io::ErrorKind::InvalidData,
            format!(
                "column index length ({column_index_num_bytes} bytes) exceeds the column data \
                 ({body_num_bytes} bytes)"
            ),
        ));
    }
    let (column_index_data, column_values_data) = body.split(column_index_num_bytes);
    let column_index = crate::column_index::open_column_index(column_index_data, format_version)?;
    let column_values = crate::column_values::open_u128_as_compact_u64(column_values_data)?;
    Ok(Column {
        index: column_index,
        values: column_values,
    })
}

/// Opens a dictionary encoded bytes column.
///
/// `data` is expected to hold the dictionary, followed by the column of term
/// ordinals, followed by the byte length of the dictionary as a little-endian `u32`.
///
/// # Errors
///
/// Returns an `InvalidData` error if `data` is too short to hold that layout, and
/// forwards the errors met when opening the dictionary or the term ordinal column.
pub fn open_column_bytes(data: OwnedBytes, format_version: Version) -> io::Result<BytesColumn> {
    const FOOTER_NUM_BYTES: usize = std::mem::size_of::<u32>();
    // Validate the lengths before splitting, so that truncated or corrupted data is
    // reported as an error.
    let total_num_bytes = data.as_slice().len();
    if total_num_bytes < FOOTER_NUM_BYTES {
        return Err(io::Error::new(
            io::ErrorKind::InvalidData,
            format!("bytes column data is too short ({total_num_bytes} bytes) to hold its footer"),
        ));
    }
    let (body, dictionary_len_bytes) = data.rsplit(FOOTER_NUM_BYTES);
    let dictionary_len = u32::from_le_bytes(
        dictionary_len_bytes
            .as_slice()
            .try_into()
            .expect("the footer was split off as exactly 4 bytes"),
    ) as usize;
    let body_num_bytes = body.as_slice().len();
    if dictionary_len > body_num_bytes {
        return Err(io::Error::new(
            io::ErrorKind::InvalidData,
            format!(
                "dictionary length ({dictionary_len} bytes) exceeds the bytes column data \
                 ({body_num_bytes} bytes)"
            ),
        ));
    }
    let (dictionary_bytes, column_bytes) = body.split(dictionary_len);
    let dictionary = Arc::new(Dictionary::from_bytes(dictionary_bytes)?);
    let term_ord_column = crate::column::open_column_u64::<u64>(column_bytes, format_version)?;
    Ok(BytesColumn {
        dictionary,
        term_ord_column,
    })
}

/// Opens a dictionary encoded string column: the data is opened as a bytes column,
/// which is then wrapped into a [`StrColumn`].
pub fn open_column_str(data: OwnedBytes, format_version: Version) -> io::Result<StrColumn> {
    open_column_bytes(data, format_version).map(StrColumn::wrap)
}


================================================
FILE: columnar/src/column_index/merge/mod.rs
================================================
mod shuffled;
mod stacked;

use common::ReadOnlyBitSet;
use shuffled::merge_column_index_shuffled;
use stacked::merge_column_index_stacked;

use crate::column_index::SerializableColumnIndex;
use crate::{Cardinality, ColumnIndex, MergeRowOrder};

/// Detects the cardinality of a single column index, once restricted to the docs
/// that are alive.
///
/// Without an alive bitset, this is the cardinality of the column index itself.
fn detect_cardinality_single_column_index(
    column_index: &ColumnIndex,
    alive_bitset_opt: &Option<ReadOnlyBitSet>,
) -> Cardinality {
    let cardinality_before_deletes = column_index.get_cardinality();
    let alive_bitset = match alive_bitset_opt {
        Some(alive_bitset) if cardinality_before_deletes != Cardinality::Full => alive_bitset,
        // Either there are no deletes, or the column is "Full".
        //
        // The columnar cardinality can only become more restrictive in the presence of
        // deletes (where cardinality sorted from the more restrictive to the least
        // restrictive are Full, Optional, Multivalued), so a "Full" column is guaranteed
        // to stay "Full" after deletes.
        _ => return cardinality_before_deletes,
    };
    let mut cardinality_so_far = Cardinality::Full;
    for doc_id in alive_bitset.iter() {
        let row_cardinality = match column_index.value_row_ids(doc_id).len() {
            0 => Cardinality::Optional,
            1 => Cardinality::Full,
            _ => Cardinality::Multivalued,
        };
        if row_cardinality > cardinality_so_far {
            cardinality_so_far = row_cardinality;
        }
        // Once the original cardinality is reached, no improvement is possible
        // anymore: exit early.
        if cardinality_so_far >= cardinality_before_deletes {
            return cardinality_before_deletes;
        }
    }
    cardinality_so_far
}

/// Detects the cardinality of the column index resulting from the merge of
/// `column_indexes`.
///
/// For a stacked merge, this is the least restrictive cardinality among the inputs
/// (`Full` if there is no input). For a shuffled merge, the cardinality of each input
/// is first recomputed over its alive docs.
fn detect_cardinality(
    column_indexes: &[ColumnIndex],
    merge_row_order: &MergeRowOrder,
) -> Cardinality {
    match merge_row_order {
        MergeRowOrder::Stack(_) => column_indexes
            .iter()
            .map(|column_index| column_index.get_cardinality())
            .max()
            .unwrap_or(Cardinality::Full),
        MergeRowOrder::Shuffled(shuffle_merge_order) => {
            let alive_bitsets = shuffle_merge_order.alive_bitsets.iter();
            let mut merged_cardinality = Cardinality::Full;
            for (column_index, alive_bitset_opt) in column_indexes.iter().zip(alive_bitsets) {
                match detect_cardinality_single_column_index(column_index, alive_bitset_opt) {
                    // Nothing is less restrictive than multivalued: stop right away.
                    Cardinality::Multivalued => return Cardinality::Multivalued,
                    cardinality => merged_cardinality = merged_cardinality.max(cardinality),
                }
            }
            merged_cardinality
        }
    }
}

/// Merges the given column indexes into a single serializable column index,
/// following `merge_row_order`.
///
/// The cardinality of the merged index is detected up front. For shuffled merges,
/// the detection only looks at the docs that are alive.
pub fn merge_column_index<'a>(
    columns: &'a [ColumnIndex],
    merge_row_order: &'a MergeRowOrder,
) -> SerializableColumnIndex<'a> {
    let merged_cardinality = detect_cardinality(columns, merge_row_order);
    match merge_row_order {
        MergeRowOrder::Stack(stack_order) => {
            merge_column_index_stacked(columns, merged_cardinality, stack_order)
        }
        MergeRowOrder::Shuffled(shuffled_order) => {
            merge_column_index_shuffled(columns, merged_cardinality, shuffled_order)
        }
    }
}

// TODO actually, the shuffled code path is a bit too general.
// In practice, we do not really shuffle everything.
// The merge order restricted to a specific column keeps the original row order.
//
// This may offer some optimization that we have not explored yet.

// Unit tests for cardinality detection and for the merge of multivalued column indexes.
#[cfg(test)]
mod tests {
    use common::OwnedBytes;

    use crate::column_index::merge::detect_cardinality;
    use crate::column_index::multivalued_index::{
        MultiValueIndex, open_multivalued_index, serialize_multivalued_index,
    };
    use crate::column_index::{OptionalIndex, SerializableColumnIndex, merge_column_index};
    use crate::{
        Cardinality, ColumnIndex, MergeRowOrder, RowAddr, RowId, ShuffleMergeOrder, StackMergeOrder,
    };

    // Checks the cardinality detected for stacked merges over various input combinations.
    #[test]
    fn test_detect_cardinality() {
        // No input at all: the result falls back to `Cardinality::Full`.
        assert_eq!(
            detect_cardinality(&[], &StackMergeOrder::stack_for_test(&[]).into()),
            Cardinality::Full
        );
        let optional_index: ColumnIndex = OptionalIndex::for_test(1, &[]).into();
        let multivalued_index: ColumnIndex = MultiValueIndex::for_test(&[0, 1]).into();
        // Optional + empty column over zero docs.
        assert_eq!(
            detect_cardinality(
                &[optional_index.clone(), ColumnIndex::Empty { num_docs: 0 }],
                &StackMergeOrder::stack_for_test(&[1, 0]).into()
            ),
            Cardinality::Optional
        );
        // Optional + full.
        assert_eq!(
            detect_cardinality(
                &[optional_index.clone(), ColumnIndex::Full],
                &StackMergeOrder::stack_for_test(&[1, 1]).into()
            ),
            Cardinality::Optional
        );
        // Multivalued + empty column over zero docs.
        assert_eq!(
            detect_cardinality(
                &[
                    multivalued_index.clone(),
                    ColumnIndex::Empty { num_docs: 0 }
                ],
                &StackMergeOrder::stack_for_test(&[1, 0]).into()
            ),
            Cardinality::Multivalued
        );
        // Multivalued + optional, in both orders.
        assert_eq!(
            detect_cardinality(
                &[multivalued_index.clone(), optional_index.clone()],
                &StackMergeOrder::stack_for_test(&[1, 1]).into()
            ),
            Cardinality::Multivalued
        );
        assert_eq!(
            detect_cardinality(
                &[optional_index, multivalued_index],
                &StackMergeOrder::stack_for_test(&[1, 1]).into()
            ),
            Cardinality::Multivalued
        );
    }

    // Single segment with start offsets [0, 2, 5] (2 values, then 3 values), merged in the
    // order row 1, row 0. The merged value counts are 3 then 2, hence start offsets [0, 3, 5].
    #[test]
    fn test_merge_index_multivalued_sorted() {
        let column_indexes: Vec<ColumnIndex> = vec![MultiValueIndex::for_test(&[0, 2, 5]).into()];
        let merge_row_order: MergeRowOrder = ShuffleMergeOrder::for_test(
            &[2],
            vec![
                RowAddr {
                    segment_ord: 0u32,
                    row_id: 1u32,
                },
                RowAddr {
                    segment_ord: 0u32,
                    row_id: 0u32,
                },
            ],
        )
        .into();
        let merged_column_index = merge_column_index(&column_indexes[..], &merge_row_order);
        let SerializableColumnIndex::Multivalued(start_index_iterable) = merged_column_index else {
            panic!("Expected a multivalued index")
        };
        // Round-trip through serialization to inspect the resulting start offsets.
        let mut output = Vec::new();
        serialize_multivalued_index(&start_index_iterable, &mut output).unwrap();
        let multivalue =
            open_multivalued_index(OwnedBytes::new(output), crate::Version::V2).unwrap();
        let start_indexes: Vec<RowId> = multivalue.get_start_index_column().iter().collect();
        assert_eq!(&start_indexes, &[0, 3, 5]);
    }

    // Three segments, the middle one being empty. The merge order picks (segment 2, row 1) with
    // 3 values, (segment 0, row 0) with 2 values and (segment 2, row 0) with 1 value, hence
    // start offsets [0, 3, 5, 6].
    #[test]
    fn test_merge_index_multivalued_sorted_several_segment() {
        let column_indexes: Vec<ColumnIndex> = vec![
            MultiValueIndex::for_test(&[0, 2, 5]).into(),
            ColumnIndex::Empty { num_docs: 0 },
            MultiValueIndex::for_test(&[0, 1, 4]).into(),
        ];
        let merge_row_order: MergeRowOrder = ShuffleMergeOrder::for_test(
            &[2, 0, 2],
            vec![
                RowAddr {
                    segment_ord: 2u32,
                    row_id: 1u32,
                },
                RowAddr {
                    segment_ord: 0u32,
                    row_id: 0u32,
                },
                RowAddr {
                    segment_ord: 2u32,
                    row_id: 0u32,
                },
            ],
        )
        .into();

        let merged_column_index = merge_column_index(&column_indexes[..], &merge_row_order);
        let SerializableColumnIndex::Multivalued(start_index_iterable) = merged_column_index else {
            panic!("Expected a multivalued index")
        };
        // Round-trip through serialization to inspect the resulting start offsets.
        let mut output = Vec::new();
        serialize_multivalued_index(&start_index_iterable, &mut output).unwrap();
        let multivalue =
            open_multivalued_index(OwnedBytes::new(output), crate::Version::V2).unwrap();
        let start_indexes: Vec<RowId> = multivalue.get_start_index_column().iter().collect();
        assert_eq!(&start_indexes, &[0, 3, 5, 6]);
    }
}


================================================
FILE: columnar/src/column_index/merge/shuffled.rs
================================================
use std::iter;

use crate::column_index::{
    SerializableColumnIndex, SerializableMultivalueIndex, SerializableOptionalIndex, Set,
};
use crate::iterable::Iterable;
use crate::{Cardinality, ColumnIndex, RowId, ShuffleMergeOrder};

pub fn merge_column_index_shuffled<'a>(
    column_indexes: &'a [ColumnIndex],
    cardinality_after_merge: Cardinality,
    shuffle_merge_order: &'a ShuffleMergeOrder,
) -> SerializableColumnIndex<'a> {
    match cardinality_after_merge {
        Cardinality::Full => SerializableColumnIndex::Full,
        Cardinality::Optional => {
            let non_null_row_ids =
                merge_column_index_shuffled_optional(column_indexes, shuffle_merge_order);
            SerializableColumnIndex::Optional(SerializableOptionalIndex {
                non_null_row_ids,
                num_rows: shuffle_merge_order.num_rows(),
            })
        }
        Cardinality::Multivalued => {
            let non_null_row_ids =
                merge_column_index_shuffled_optional(column_indexes, shuffle_merge_order);
            SerializableColumnIndex::Multivalued(SerializableMultivalueIndex {
                doc_ids_with_values: SerializableOptionalIndex {
                    non_null_row_ids,
                    num_rows: shuffle_merge_order.num_rows(),
                },
                start_offsets: merge_column_index_shuffled_multivalued(
                    column_indexes,
                    shuffle_merge_order,
                ),
            })
        }
    }
}

/// Merges several column indexes into one, ordering rows according to the `merge_order` passed
/// as argument.
///
/// The returned iterable yields the new row ids of the rows holding at least one value. It is
/// used both for optional outputs and for the optional part of multivalued outputs.
///
/// While it is true that the `merge_order` may imply deletes, and hence could in theory turn a
/// multivalued index into an optional one, this function does not attempt any such downgrade.
fn merge_column_index_shuffled_optional<'a>(
    column_indexes: &'a [ColumnIndex],
    merge_order: &'a ShuffleMergeOrder,
) -> Box<dyn Iterable<RowId> + 'a> {
    let shuffled_index = ShuffledIndex {
        column_indexes,
        merge_order,
    };
    Box::new(shuffled_index)
}

/// Iterable over the new row ids that hold at least one value after a shuffled merge.
struct ShuffledIndex<'a> {
    /// One column index per merged segment, addressed by `RowAddr::segment_ord`.
    column_indexes: &'a [ColumnIndex],
    /// Gives, for each new row, the address of the row it comes from.
    merge_order: &'a ShuffleMergeOrder,
}

impl Iterable<u32> for ShuffledIndex<'_> {
    /// Walks the rows in their new order and keeps the position of those whose original row
    /// has a value.
    fn boxed_iter(&self) -> Box<dyn Iterator<Item = u32> + '_> {
        let rows_with_values = self
            .merge_order
            .iter_new_to_old_row_addrs()
            .enumerate()
            .filter_map(|(new_row_id, old_row_addr)| {
                let source_index = &self.column_indexes[old_row_addr.segment_ord as usize];
                source_index
                    .has_value(old_row_addr.row_id)
                    .then_some(new_row_id as u32)
            });
        Box::new(rows_with_values)
    }
}

/// Returns the iterable producing the start offsets of a multivalued index after a shuffled
/// merge.
fn merge_column_index_shuffled_multivalued<'a>(
    column_indexes: &'a [ColumnIndex],
    merge_order: &'a ShuffleMergeOrder,
) -> Box<dyn Iterable<RowId> + 'a> {
    let shuffled_start_offsets = ShuffledMultivaluedIndex {
        column_indexes,
        merge_order,
    };
    Box::new(shuffled_start_offsets)
}

/// Iterable over the start offsets of a multivalued index after a shuffled merge.
struct ShuffledMultivaluedIndex<'a> {
    /// One column index per merged segment, addressed by `RowAddr::segment_ord`.
    column_indexes: &'a [ColumnIndex],
    /// Gives, for each new row, the address of the row it comes from.
    merge_order: &'a ShuffleMergeOrder,
}

/// Yields, for each row in the merged order, the number of values of the row it comes from.
///
/// Rows without any value yield 0.
fn iter_num_values<'a>(
    column_indexes: &'a [ColumnIndex],
    merge_order: &'a ShuffleMergeOrder,
) -> impl Iterator<Item = u32> + 'a {
    merge_order
        .iter_new_to_old_row_addrs()
        .map(move |old_row_addr| {
            let old_row_id = old_row_addr.row_id;
            match &column_indexes[old_row_addr.segment_ord as usize] {
                ColumnIndex::Empty { .. } => 0u32,
                ColumnIndex::Full => 1u32,
                ColumnIndex::Optional(optional_index) => {
                    if optional_index.contains(old_row_id) {
                        1u32
                    } else {
                        0u32
                    }
                }
                ColumnIndex::Multivalued(multivalued_index) => {
                    let value_range = multivalued_index.range(old_row_id);
                    value_range.len() as u32
                }
            }
        })
}

/// Turns an iterator over the number of values of each row into an iterator of start offsets.
///
/// The output always starts with 0, followed by one cumulated offset per row holding at least
/// one value.
///
/// Rows with 0 values are skipped, as these are covered by the optional index of the
/// multivalue index.
fn integrate_num_vals(num_vals: impl Iterator<Item = u32>) -> impl Iterator<Item = RowId> {
    let mut running_total: u32 = 0;
    let cumulated_offsets = num_vals.filter_map(move |row_num_vals| {
        if row_num_vals == 0 {
            return None;
        }
        running_total += row_num_vals;
        Some(running_total)
    });
    iter::once(0u32).chain(cumulated_offsets)
}

impl Iterable<u32> for ShuffledMultivaluedIndex<'_> {
    /// Yields the start offsets of the merged multivalued index: the cumulated number of values
    /// of the rows, taken in their new order.
    fn boxed_iter(&self) -> Box<dyn Iterator<Item = u32> + '_> {
        Box::new(integrate_num_vals(iter_num_values(
            self.column_indexes,
            self.merge_order,
        )))
    }
}

// Unit tests for the shuffled merge of column indexes.
#[cfg(test)]
mod tests {
    use super::*;
    use crate::RowAddr;
    use crate::column_index::OptionalIndex;

    // An empty input still yields the initial 0 offset.
    #[test]
    fn test_integrate_num_vals_empty() {
        assert!(integrate_num_vals(iter::empty()).eq(iter::once(0)));
    }

    #[test]
    fn test_integrate_num_vals_one_el() {
        assert!(integrate_num_vals(iter::once(10)).eq([0, 10].into_iter()));
    }

    // The row with 0 values does not produce any offset.
    #[test]
    fn test_integrate_num_vals_several() {
        assert!(integrate_num_vals([3, 0, 10, 20].into_iter()).eq([0, 3, 13, 33].into_iter()));
    }

    // Merges an optional column and a full column. The first new row comes from
    // (segment 0, row 1) and the second one from (segment 1, row 0); only the second new row is
    // expected to hold a value.
    #[test]
    fn test_merge_column_index_optional_shuffle() {
        // Presumably: 2 rows, with row 0 as the only non-null row — confirm against
        // `OptionalIndex::for_test`.
        let optional_index: ColumnIndex = OptionalIndex::for_test(2, &[0]).into();
        let column_indexes = [optional_index, ColumnIndex::Full];
        let row_addrs = vec![
            RowAddr {
                segment_ord: 0u32,
                row_id: 1u32,
            },
            RowAddr {
                segment_ord: 1u32,
                row_id: 0u32,
            },
        ];
        let shuffle_merge_order = ShuffleMergeOrder::for_test(&[2, 1], row_addrs);
        let serializable_index = merge_column_index_shuffled(
            &column_indexes[..],
            Cardinality::Optional,
            &shuffle_merge_order,
        );
        let SerializableColumnIndex::Optional(SerializableOptionalIndex {
            non_null_row_ids,
            num_rows,
        }) = serializable_index
        else {
            panic!()
        };
        assert_eq!(num_rows, 2);
        let non_null_rows: Vec<RowId> = non_null_row_ids.boxed_iter().collect();
        assert_eq!(&non_null_rows, &[1]);
    }
}


================================================
FILE: columnar/src/column_index/merge/stacked.rs
================================================
use std::ops::Range;

use crate::column_index::SerializableColumnIndex;
use crate::column_index::multivalued_index::{MultiValueIndex, SerializableMultivalueIndex};
use crate::column_index::serialize::SerializableOptionalIndex;
use crate::iterable::Iterable;
use crate::{Cardinality, ColumnIndex, RowId, StackMergeOrder};

/// Simple case:
/// The new mapping just consists in stacking the different column indexes.
///
/// There are no sort nor deletes involved.
pub fn merge_column_index_stacked<'a>(
    columns: &'a [ColumnIndex],
    cardinality_after_merge: Cardinality,
    stack_merge_order: &'a StackMergeOrder,
) -> SerializableColumnIndex<'a> {
    match cardinality_after_merge {
        Cardinality::Full => SerializableColumnIndex::Full,
        Cardinality::Optional => SerializableColumnIndex::Optional(SerializableOptionalIndex {
            non_null_row_ids: Box::new(StackedOptionalIndex {
                columns,
                stack_merge_order,
            }),
            num_rows: stack_merge_order.num_rows(),
        }),
        Cardinality::Multivalued => {
            let serializable_multivalue_index =
                make_serializable_multivalued_index(columns, stack_merge_order);
            SerializableColumnIndex::Multivalued(serializable_multivalue_index)
        }
    }
}

/// Iterable over the doc ids holding at least one value once the column indexes are stacked.
struct StackedDocIdsWithValues<'a> {
    /// The column indexes being stacked, in stacking order.
    column_indexes: &'a [ColumnIndex],
    /// Gives the range of merged doc ids covered by each column index.
    stack_merge_order: &'a StackMergeOrder,
}

impl Iterable<u32> for StackedDocIdsWithValues<'_> {
    /// Chains, for each column index in turn, its doc ids with values shifted into the merged
    /// doc id space.
    fn boxed_iter(&self) -> Box<dyn Iterator<Item = u32> + '_> {
        let stacked_doc_ids =
            self.column_indexes
                .iter()
                .enumerate()
                .flat_map(|(columnar_id, column_index)| {
                    let doc_range = self.stack_merge_order.columnar_range(columnar_id);
                    get_doc_ids_with_values(column_index, doc_range)
                });
        Box::new(stacked_doc_ids)
    }
}

/// Returns the merged doc ids of the docs of `column_index` holding at least one value.
///
/// `doc_range` is the range of merged doc ids assigned to this column index: local doc ids are
/// shifted by `doc_range.start`.
fn get_doc_ids_with_values<'a>(
    column_index: &'a ColumnIndex,
    doc_range: Range<u32>,
) -> Box<dyn Iterator<Item = u32> + 'a> {
    let first_doc = doc_range.start;
    match column_index {
        ColumnIndex::Empty { .. } => Box::new(std::iter::empty()),
        // Every doc of the range has a value.
        ColumnIndex::Full => Box::new(doc_range),
        ColumnIndex::Optional(optional_index) => Box::new(
            optional_index
                .iter_non_null_docs()
                .map(move |local_doc| local_doc + first_doc),
        ),
        // V1 has no optional index: docs whose value range is empty are filtered out.
        ColumnIndex::Multivalued(MultiValueIndex::MultiValueIndexV1(v1_index)) => Box::new(
            (0..v1_index.num_docs())
                .filter(move |&local_doc| !v1_index.range(local_doc).is_empty())
                .map(move |local_doc| local_doc + first_doc),
        ),
        ColumnIndex::Multivalued(MultiValueIndex::MultiValueIndexV2(v2_index)) => Box::new(
            v2_index
                .optional_index
                .iter_non_null_docs()
                .map(move |local_doc| local_doc + first_doc),
        ),
    }
}

/// Builds the optional index of the docs holding at least one value after stacking
/// `column_indexes`.
fn stack_doc_ids_with_values<'a>(
    column_indexes: &'a [ColumnIndex],
    stack_merge_order: &'a StackMergeOrder,
) -> SerializableOptionalIndex<'a> {
    let stacked_doc_ids = StackedDocIdsWithValues {
        column_indexes,
        stack_merge_order,
    };
    SerializableOptionalIndex {
        num_rows: stack_merge_order.num_rows(),
        non_null_row_ids: Box::new(stacked_doc_ids),
    }
}

/// Iterable over the start offsets of a multivalued index once the column indexes are stacked.
struct StackedStartOffsets<'a> {
    /// The column indexes being stacked, in stacking order.
    column_indexes: &'a [ColumnIndex],
    /// Gives the range of merged doc ids covered by each column index.
    stack_merge_order: &'a StackMergeOrder,
}

/// Yields the number of values of each doc of `column_index` that holds at least one value.
///
/// Docs without values never produce an entry: they are described by the optional index built
/// by `get_doc_ids_with_values`, and the start offsets derived from this iterator must line up
/// with it.
///
/// `num_docs` is the number of docs covered by the column index. It is only needed for
/// `ColumnIndex::Full`, which does not store it.
fn get_num_values_iterator<'a>(
    column_index: &'a ColumnIndex,
    num_docs: u32,
) -> Box<dyn Iterator<Item = u32> + 'a> {
    match column_index {
        ColumnIndex::Empty { .. } => Box::new(std::iter::empty()),
        ColumnIndex::Full => Box::new(std::iter::repeat_n(1u32, num_docs as usize)),
        ColumnIndex::Optional(optional_index) => Box::new(std::iter::repeat_n(
            1u32,
            optional_index.num_non_nulls() as usize,
        )),
        ColumnIndex::Multivalued(multivalued_index) => Box::new(
            multivalued_index
                .get_start_index_column()
                .iter()
                // Differences between consecutive start offsets are the number of values.
                .scan(0u32, |previous_start_offset, current_start_offset| {
                    let num_vals = current_start_offset - *previous_start_offset;
                    *previous_start_offset = current_start_offset;
                    Some(num_vals)
                })
                // The first start offset is the initial 0 and does not describe any doc.
                .skip(1)
                // A V1 index stores one start offset per doc, including docs without values.
                // Those docs are skipped by `get_doc_ids_with_values`, so they must not emit a
                // (zero-length) entry here either. A V2 index only stores offsets for docs with
                // values, so this filter is a no-op for it.
                .filter(|num_vals| *num_vals != 0),
        ),
    }
}

impl Iterable<u32> for StackedStartOffsets<'_> {
    /// Yields 0, followed by the cumulated number of values of the stacked column indexes.
    fn boxed_iter(&self) -> Box<dyn Iterator<Item = u32> + '_> {
        let num_values_per_doc =
            self.column_indexes
                .iter()
                .enumerate()
                .flat_map(|(columnar_id, column_index)| {
                    let num_docs =
                        self.stack_merge_order.columnar_range(columnar_id).len() as u32;
                    get_num_values_iterator(column_index, num_docs)
                });
        let mut running_total = 0u32;
        let cumulated_offsets = num_values_per_doc.map(move |num_values| {
            running_total += num_values;
            running_total
        });
        Box::new(std::iter::once(0u32).chain(cumulated_offsets))
    }
}

/// Returns the iterable producing the start offsets of the stacked multivalued index.
fn stack_start_offsets<'a>(
    column_indexes: &'a [ColumnIndex],
    stack_merge_order: &'a StackMergeOrder,
) -> Box<dyn Iterable<u32> + 'a> {
    let stacked_start_offsets = StackedStartOffsets {
        column_indexes,
        stack_merge_order,
    };
    Box::new(stacked_start_offsets)
}

/// Assembles the two parts of a stacked multivalued index: the optional index of the docs with
/// values, and the start offsets of their values.
fn make_serializable_multivalued_index<'a>(
    columns: &'a [ColumnIndex],
    stack_merge_order: &'a StackMergeOrder,
) -> SerializableMultivalueIndex<'a> {
    let doc_ids_with_values = stack_doc_ids_with_values(columns, stack_merge_order);
    let start_offsets = stack_start_offsets(columns, stack_merge_order);
    SerializableMultivalueIndex {
        doc_ids_with_values,
        start_offsets,
    }
}

/// Iterable over the non-null row ids of an optional index once the column indexes are stacked.
struct StackedOptionalIndex<'a> {
    /// The column indexes being stacked, in stacking order.
    columns: &'a [ColumnIndex],
    /// Gives the range of merged row ids covered by each column index.
    stack_merge_order: &'a StackMergeOrder,
}

impl<'a> Iterable<RowId> for StackedOptionalIndex<'a> {
    /// Chains the non-null rows of each column index, shifted into the merged row id space.
    ///
    /// # Panics
    ///
    /// Panics (lazily, when the iterator reaches it) if one of the column indexes is
    /// multivalued.
    fn boxed_iter(&self) -> Box<dyn Iterator<Item = RowId> + 'a> {
        // Copy the `'a` references out of `self` so that the iterator does not borrow `self`.
        let columns: &'a [ColumnIndex] = self.columns;
        let stack_merge_order: &'a StackMergeOrder = self.stack_merge_order;
        let stacked_rows = columns.iter().enumerate().flat_map(
            move |(columnar_id, column_index)| -> Box<dyn Iterator<Item = RowId> + 'a> {
                let columnar_row_range = stack_merge_order.columnar_range(columnar_id);
                match column_index {
                    ColumnIndex::Empty { .. } => Box::new(std::iter::empty()),
                    ColumnIndex::Full => Box::new(columnar_row_range),
                    ColumnIndex::Optional(optional_index) => {
                        let first_row = columnar_row_range.start;
                        Box::new(
                            optional_index
                                .iter_non_null_docs()
                                .map(move |row_id: RowId| first_row + row_id),
                        )
                    }
                    ColumnIndex::Multivalued(_) => {
                        panic!("No multivalued index is allowed when stacking column index")
                    }
                }
            },
        );
        Box::new(stacked_rows)
    }
}


================================================
FILE: columnar/src/column_index/mod.rs
================================================
//! # `column_index`
//!
//! `column_index` provides rank and select operations to associate positions when not all
//! documents have exactly one element.

mod merge;
mod multivalued_index;
mod optional_index;
mod serialize;

use std::ops::Range;

pub use merge::merge_column_index;
pub(crate) use multivalued_index::SerializableMultivalueIndex;
pub use optional_index::{OptionalIndex, Set};
pub use serialize::{
    SerializableColumnIndex, SerializableOptionalIndex, open_column_index, serialize_column_index,
};

use crate::column_index::multivalued_index::MultiValueIndex;
use crate::{Cardinality, DocId, RowId};

/// Describes which docs have values in a column, and where those values are located.
#[derive(Clone, Debug)]
pub enum ColumnIndex {
    /// No doc has any value.
    Empty {
        /// Presumably the number of docs covered by the column; `get_cardinality` treats the
        /// value 0 as a full column.
        num_docs: u32,
    },
    /// Every doc has exactly one value: the row id of a value is the doc id itself.
    Full,
    /// Each doc has at most one value.
    Optional(OptionalIndex),
    /// Each doc may have any number of values.
    ///
    /// In addition, at index num_rows, an extra value is added
    /// containing the overall number of values.
    Multivalued(MultiValueIndex),
}

impl From<OptionalIndex> for ColumnIndex {
    fn from(optional_index: OptionalIndex) -> ColumnIndex {
        ColumnIndex::Optional(optional_index)
    }
}

impl From<MultiValueIndex> for ColumnIndex {
    fn from(multi_value_index: MultiValueIndex) -> ColumnIndex {
        ColumnIndex::Multivalued(multi_value_index)
    }
}

impl ColumnIndex {
    /// Returns the cardinality of the column index.
    ///
    /// By convention, if the column contains no docs, we consider that it is
    /// full. An empty column over at least one doc is reported as optional.
    #[inline]
    pub fn get_cardinality(&self) -> Cardinality {
        match self {
            ColumnIndex::Full | ColumnIndex::Empty { num_docs: 0 } => Cardinality::Full,
            ColumnIndex::Empty { .. } | ColumnIndex::Optional(_) => Cardinality::Optional,
            ColumnIndex::Multivalued(_) => Cardinality::Multivalued,
        }
    }

    /// Returns true if and only if there is at least one value associated to the row.
    pub fn has_value(&self, doc_id: DocId) -> bool {
        match self {
            ColumnIndex::Empty { .. } => false,
            ColumnIndex::Full => true,
            ColumnIndex::Optional(optional_index) => optional_index.contains(doc_id),
            ColumnIndex::Multivalued(multivalued_index) => {
                let value_range = multivalued_index.range(doc_id);
                !value_range.is_empty()
            }
        }
    }

    /// Returns the range of row ids holding the values of `doc_id`.
    ///
    /// The range is empty (`0..0`) when the doc has no value.
    pub fn value_row_ids(&self, doc_id: DocId) -> Range<RowId> {
        match self {
            ColumnIndex::Empty { .. } => 0..0,
            ColumnIndex::Full => doc_id..doc_id + 1,
            ColumnIndex::Optional(optional_index) => optional_index
                .rank_if_exists(doc_id)
                .map_or(0..0, |row_id| row_id..row_id + 1),
            ColumnIndex::Multivalued(multivalued_index) => multivalued_index.range(doc_id),
        }
    }

    /// Translates a block of doc ids to row ids.
    ///
    /// The row ids are appended to `row_ids`, and the doc id matching each of them is appended
    /// to `doc_ids_out` at the same position, e.g.
    /// DocId In:  [0, 5, 6]
    /// DocId Out: [0, 0, 6, 6]
    /// RowId Out: [0, 1, 2, 3]
    #[inline]
    pub fn docids_to_rowids(
        &self,
        doc_ids: &[DocId],
        doc_ids_out: &mut Vec<DocId>,
        row_ids: &mut Vec<RowId>,
    ) {
        match self {
            ColumnIndex::Empty { .. } => {}
            ColumnIndex::Full => {
                // Doc ids and row ids coincide.
                doc_ids_out.extend_from_slice(doc_ids);
                row_ids.extend_from_slice(doc_ids);
            }
            ColumnIndex::Optional(optional_index) => {
                for &doc_id in doc_ids {
                    let Some(row_id) = optional_index.rank_if_exists(doc_id) else {
                        continue;
                    };
                    doc_ids_out.push(doc_id);
                    row_ids.push(row_id);
                }
            }
            ColumnIndex::Multivalued(multivalued_index) => {
                for &doc_id in doc_ids {
                    // The doc id is repeated once per value of the doc.
                    let value_range = multivalued_index.range(doc_id);
                    doc_ids_out.extend(std::iter::repeat_n(doc_id, value_range.len()));
                    row_ids.extend(value_range);
                }
            }
        }
    }

    /// Translates a range of doc ids into the range of row ids holding their values.
    pub fn docid_range_to_rowids(&self, doc_id_range: Range<DocId>) -> Range<RowId> {
        let Range {
            start: doc_start,
            end: doc_end,
        } = doc_id_range;
        match self {
            ColumnIndex::Empty { .. } => 0..0,
            ColumnIndex::Full => doc_start..doc_end,
            ColumnIndex::Optional(optional_index) => {
                let row_start = optional_index.rank(doc_start);
                let row_end = optional_index.rank(doc_end);
                row_start..row_end
            }
            ColumnIndex::Multivalued(MultiValueIndex::MultiValueIndexV1(index)) => {
                let row_start = index.start_index_column.get_val(doc_start);
                let row_end = index.start_index_column.get_val(doc_end);
                row_start..row_end
            }
            ColumnIndex::Multivalued(MultiValueIndex::MultiValueIndexV2(index)) => {
                // The optional index is used to select the next docs that are valid, i.e. that
                // exist in the optional index because they have values. Several cases arise:
                //
                // * The range only covers docs without values: `rank` gives, for both bounds,
                //   the next doc outside the range with a value. Both bounds get the same rank,
                //   hence an empty range.
                //
                // * Neither bound has values, but docs in between do: `rank` gives the next doc
                //   with a value for each bound.
                //
                // * One or both bounds have values: `rank` on the end bound gives the next
                //   value, which matches how the `start_index_column` works. We get the start
                //   of the values of the next doc, which is used as the exclusive end.
                let rank_start = index.optional_index.rank(doc_start);
                let row_start = index.start_index_column.get_val(rank_start);
                let rank_end = index.optional_index.rank(doc_end);
                let row_end = index.start_index_column.get_val(rank_end);
                row_start..row_end
            }
        }
    }

    /// Converts in place the content of `rank_ids`, delegating to the underlying index.
    ///
    /// * `Empty`: `rank_ids` is cleared.
    /// * `Full`: nothing to do, value index and row index are the same.
    /// * `Optional` and `Multivalued`: the conversion is delegated to `select_batch` and
    ///   `select_batch_in_place` respectively. `doc_id_start` is only used by the multivalued
    ///   case.
    pub fn select_batch_in_place(&self, doc_id_start: DocId, rank_ids: &mut Vec<RowId>) {
        match self {
            ColumnIndex::Empty { .. } => rank_ids.clear(),
            ColumnIndex::Full => {}
            ColumnIndex::Optional(optional_index) => {
                optional_index.select_batch(rank_ids.as_mut_slice());
            }
            ColumnIndex::Multivalued(multivalued_index) => {
                multivalued_index.select_batch_in_place(doc_id_start, rank_ids)
            }
        }
    }
}

// Unit tests for `ColumnIndex`.
#[cfg(test)]
mod tests {
    use crate::{Cardinality, ColumnIndex};

    // An empty column is full when it covers zero docs, and optional otherwise.
    #[test]
    fn test_column_index_get_cardinality() {
        assert_eq!(
            ColumnIndex::Empty { num_docs: 0 }.get_cardinality(),
            Cardinality::Full
        );
        assert_eq!(ColumnIndex::Full.get_cardinality(), Cardinality::Full);
        assert_eq!(
            ColumnIndex::Empty { num_docs: 1 }.get_cardinality(),
            Cardinality::Optional
        );
    }
}


================================================
FILE: columnar/src/column_index/multivalued_index.rs
================================================
use std::io;
use std::io::Write;
use std::ops::Range;
use std::sync::Arc;

use common::{CountingWriter, OwnedBytes};

use super::optional_index::{open_optional_index, serialize_optional_index};
use super::{OptionalIndex, SerializableOptionalIndex, Set};
use crate::column_values::{
    CodecType, ColumnValues, load_u64_based_column_values, serialize_u64_based_column_values,
};
use crate::iterable::Iterable;
use crate::{DocId, RowId, Version};

/// The two parts of a multivalued index, ready to be serialized by
/// `serialize_multivalued_index`.
pub struct SerializableMultivalueIndex<'a> {
    /// Optional index of the docs holding at least one value.
    pub doc_ids_with_values: SerializableOptionalIndex<'a>,
    /// Start offsets of the values, serialized as a u64-based column.
    pub start_offsets: Box<dyn Iterable<u32> + 'a>,
}

/// Serializes a multivalued index into `output`.
///
/// The layout is, in order:
/// 1. the optional index of the docs with values;
/// 2. the start offsets column (bitpacked or linear codec);
/// 3. the length in bytes of the optional index, as a little-endian `u32`.
pub fn serialize_multivalued_index(
    multivalued_index: &SerializableMultivalueIndex,
    output: &mut impl Write,
) -> io::Result<()> {
    let doc_ids_with_values = &multivalued_index.doc_ids_with_values;
    // Count the bytes written by the optional index: its length goes into the footer.
    let mut count_writer = CountingWriter::wrap(output);
    serialize_optional_index(
        &*doc_ids_with_values.non_null_row_ids,
        doc_ids_with_values.num_rows,
        &mut count_writer,
    )?;
    let optional_len = count_writer.written_bytes() as u32;
    let output = count_writer.finish();
    serialize_u64_based_column_values(
        &*multivalued_index.start_offsets,
        &[CodecType::Bitpacked, CodecType::Linear],
        output,
    )?;
    let footer = optional_len.to_le_bytes();
    output.write_all(&footer)?;
    Ok(())
}

/// Opens a multivalued index from its serialized form.
///
/// * `Version::V1`: `bytes` only contains the start offsets column.
/// * `Version::V2`: `bytes` contains the optional index, then the start offsets column, then a
///   4-byte little-endian footer holding the length of the optional index (see
///   `serialize_multivalued_index`).
///
/// # Errors
///
/// Returns an `io::ErrorKind::InvalidData` error if a V2 payload is too short to hold its
/// footer, or if the footer announces an optional index longer than the payload. Errors from
/// opening the optional index or the start offsets column are propagated.
pub fn open_multivalued_index(
    bytes: OwnedBytes,
    format_version: Version,
) -> io::Result<MultiValueIndex> {
    match format_version {
        Version::V1 => {
            let start_index_column: Arc<dyn ColumnValues<RowId>> =
                load_u64_based_column_values(bytes)?;
            Ok(MultiValueIndex::MultiValueIndexV1(MultiValueIndexV1 {
                start_index_column,
            }))
        }
        Version::V2 => {
            const FOOTER_LEN: usize = std::mem::size_of::<u32>();
            // Splitting panics on out-of-range lengths: validate them first so that truncated
            // or corrupted data surfaces as an error.
            if bytes.len() < FOOTER_LEN {
                return Err(io::Error::new(
                    io::ErrorKind::InvalidData,
                    "multivalued index is too short to contain its footer",
                ));
            }
            let (body_bytes, footer_bytes) = bytes.rsplit(FOOTER_LEN);
            let optional_index_len = u32::from_le_bytes(
                footer_bytes
                    .as_slice()
                    .try_into()
                    .expect("the footer is exactly 4 bytes long"),
            ) as usize;
            if optional_index_len > body_bytes.len() {
                return Err(io::Error::new(
                    io::ErrorKind::InvalidData,
                    "multivalued index footer announces an optional index longer than the data",
                ));
            }
            let (optional_index_bytes, start_index_bytes) = body_bytes.split(optional_index_len);
            let optional_index = open_optional_index(optional_index_bytes)?;
            let start_index_column: Arc<dyn ColumnValues<RowId>> =
                load_u64_based_column_values(start_index_bytes)?;
            Ok(MultiValueIndex::MultiValueIndexV2(MultiValueIndexV2 {
                optional_index,
                start_index_column,
            }))
        }
    }
}

#[derive(Clone)]
/// Index to resolve value range for given doc_id.
/// Starts at 0.
///
/// There is one variant per serialization format version (see `open_multivalued_index`).
pub enum MultiValueIndex {
    /// Format V1: only a start offsets column.
    MultiValueIndexV1(MultiValueIndexV1),
    /// Format V2: an optional index of the docs with values, plus a start offsets column.
    MultiValueIndexV2(MultiValueIndexV2),
}

#[derive(Clone)]
/// Index to resolve value range for given doc_id.
/// Starts at 0.
///
/// In this format the start offsets column holds one entry per doc, plus a final entry.
pub struct MultiValueIndexV1 {
    /// Start offset of the values of each doc; entry `doc_id + 1` is the end of the values of
    /// `doc_id`.
    pub start_index_column: Arc<dyn crate::ColumnValues<RowId>>,
}

impl MultiValueIndexV1 {
    /// Returns `[start, end)`, such that the values associated with
    /// the given document are `start..end`.
    ///
    /// Doc ids beyond the number of docs yield the empty range `0..0`.
    #[inline]
    pub(crate) fn range(&self, doc_id: DocId) -> Range<RowId> {
        if doc_id < self.num_docs() {
            let start = self.start_index_column.get_val(doc_id);
            let end = self.start_index_column.get_val(doc_id + 1);
            start..end
        } else {
            0..0
        }
    }

    /// Returns the number of documents in the index, i.e. the number of start offsets minus
    /// one.
    #[inline]
    pub fn num_docs(&self) -> u32 {
        let num_start_offsets = self.start_index_column.num_vals();
        num_start_offsets - 1
    }

    /// Converts a list of ranks (row ids of values) in a 1:n index to the corresponding list of
    /// docids. Ranks are converted in place to docids, and each docid is kept only once.
    ///
    /// Since there is no index for value pos -> docid, but docid -> value pos range, we scan
    /// the index, starting from `docid_start`.
    ///
    /// Correctness: ranks need to be sorted. The start offsets column needs to contain
    /// monotonically increasing positions.
    ///
    /// # Panics
    ///
    /// Panics if the first rank is located before the values of `docid_start`.
    ///
    /// TODO: Instead of a linear scan we can employ a exponential search into binary search to
    /// match a docid to its value position.
    pub(crate) fn select_batch_in_place(&self, docid_start: DocId, ranks: &mut Vec<u32>) {
        let Some(&first_rank) = ranks.first() else {
            return;
        };
        assert!(self.start_index_column.get_val(docid_start) <= first_rank);

        let mut doc = docid_start;
        let mut previous_doc: Option<DocId> = None;
        // Number of distinct docids written so far at the beginning of `ranks`.
        let mut num_written = 0;
        for read_idx in 0..ranks.len() {
            let rank = ranks[read_idx];
            // Advance to the doc whose value range contains `rank`.
            while self.start_index_column.get_val(doc + 1) <= rank {
                doc += 1;
            }
            // `num_written <= read_idx`, so no unread rank gets overwritten.
            ranks[num_written] = doc;
            if previous_doc != Some(doc) {
                num_written += 1;
            }
            previous_doc = Some(doc);
        }
        ranks.truncate(num_written);
    }
}

#[derive(Clone)]
/// Index to resolve value range for given doc_id.
/// Starts at 0.
///
/// In this format, docs without values are left out of the start offsets column: the rank of a
/// doc in `optional_index` is the position to look up in `start_index_column`.
pub struct MultiValueIndexV2 {
    /// The docs holding at least one value.
    pub optional_index: OptionalIndex,
    /// Start offsets of the values, addressed by rank in `optional_index`.
    pub start_index_column: Arc<dyn crate::ColumnValues<RowId>>,
}

impl std::fmt::Debug for MultiValueIndex {
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        let index = match self {
            MultiValueIndex::MultiValueIndexV1(idx) => &idx.start_index_column,
            MultiValueIndex::MultiValueIndexV2(idx) => &idx.start_index_column,
        };
        f.debug_struct("MultiValuedIndex")
            .field("num_rows", &index.num_vals())
            .finish_non_exhaustive()
    }
}

impl MultiValueIndex {
    /// Builds a V2 index from per-document start offsets by serializing and reopening it.
    ///
    /// `start_offsets[doc]..start_offsets[doc + 1]` is the value range of `doc`, so the slice
    /// holds one more entry than there are documents.
    ///
    /// # Panics
    ///
    /// Panics if `start_offsets` is empty or does not start with `0`.
    pub fn for_test(start_offsets: &[RowId]) -> MultiValueIndex {
        assert!(!start_offsets.is_empty());
        assert_eq!(start_offsets[0], 0);
        let mut doc_with_values = Vec::new();
        let mut compact_start_offsets: Vec<u32> = vec![0];
        // Only documents with at least one value get an entry in the compacted offsets.
        for (doc, bounds) in start_offsets.windows(2).enumerate() {
            let (start, end) = (bounds[0], bounds[1]);
            if start < end {
                doc_with_values.push(doc as RowId);
                compact_start_offsets.push(end);
            }
        }
        let num_rows = start_offsets.len() as u32 - 1;
        let serializable_multivalued_index = SerializableMultivalueIndex {
            doc_ids_with_values: SerializableOptionalIndex {
                non_null_row_ids: Box::new(&doc_with_values[..]),
                num_rows,
            },
            start_offsets: Box::new(&compact_start_offsets[..]),
        };
        let mut buffer = Vec::new();
        serialize_multivalued_index(&serializable_multivalued_index, &mut buffer).unwrap();
        open_multivalued_index(OwnedBytes::new(buffer), Version::V2).unwrap()
    }

    /// Returns the start offset column of the underlying index, whatever its version.
    pub fn get_start_index_column(&self) -> &Arc<dyn crate::ColumnValues<RowId>> {
        match self {
            Self::MultiValueIndexV1(v1) => &v1.start_index_column,
            Self::MultiValueIndexV2(v2) => &v2.start_index_column,
        }
    }

    /// Returns the half-open row id range `start..end` holding the values of `doc_id`.
    #[inline]
    pub(crate) fn range(&self, doc_id: DocId) -> Range<RowId> {
        match self {
            Self::MultiValueIndexV1(v1) => v1.range(doc_id),
            Self::MultiValueIndexV2(v2) => v2.range(doc_id),
        }
    }

    /// Returns the number of documents in the index.
    #[inline]
    pub fn num_docs(&self) -> u32 {
        match self {
            Self::MultiValueIndexV1(v1) => v1.num_docs(),
            Self::MultiValueIndexV2(v2) => v2.num_docs(),
        }
    }

    /// Returns an iterator over the doc ids that have at least one value, in increasing order.
    pub fn iter_non_null_docs(&self) -> Box<dyn Iterator<Item = DocId> + '_> {
        match self {
            Self::MultiValueIndexV1(v1) => {
                // This is not the most efficient way to do this, but it's legacy code:
                // every document is probed and kept if its value range is not empty.
                let start_offsets = &v1.start_index_column;
                let docs_with_values = (0..v1.num_docs())
                    .filter(move |&doc| start_offsets.get_val(doc + 1) > start_offsets.get_val(doc));
                Box::new(docs_with_values)
            }
            Self::MultiValueIndexV2(v2) => Box::new(v2.optional_index.iter_non_null_docs()),
        }
    }

    /// Replaces, in place, a sorted list of ranks (row ids of values) with the deduplicated
    /// list of doc ids owning those values.
    ///
    /// There is no value position -> doc id index, only doc id -> value position range, so the
    /// index is scanned, starting at `docid_start`.
    ///
    /// Correctness: `ranks` needs to be sorted, and the index needs to contain monotonically
    /// increasing positions.
    ///
    /// TODO: Instead of a linear scan we can employ an exponential search into binary search to
    /// match a docid to its value position.
    pub(crate) fn select_batch_in_place(&self, docid_start: DocId, ranks: &mut Vec<u32>) {
        match self {
            Self::MultiValueIndexV1(v1) => v1.select_batch_in_place(docid_start, ranks),
            Self::MultiValueIndexV2(v2) => v2.select_batch_in_place(docid_start, ranks),
        }
    }
}
impl MultiValueIndexV2 {
    /// Returns `[start, end)`, such that the values associated with
    /// the given document are `start..end`.
    ///
    /// Documents without any value (or outside of the index) yield the empty range `0..0`.
    #[inline]
    pub(crate) fn range(&self, doc_id: DocId) -> Range<RowId> {
        let Some(rank) = self.optional_index.rank_if_exists(doc_id) else {
            return 0..0;
        };
        let start = self.start_index_column.get_val(rank);
        let end = self.start_index_column.get_val(rank + 1);
        start..end
    }

    /// Returns the number of documents in the index.
    #[inline]
    pub fn num_docs(&self) -> u32 {
        self.optional_index.num_docs()
    }

    /// Converts a list of ranks (row ids of values) in a 1:n index to the corresponding list of
    /// docids. Positions are converted inplace to docids.
    ///
    /// Since there is no index for value pos -> docid, but docid -> value pos range, we scan the
    /// index.
    ///
    /// The conversion runs in two steps: value ranks are first mapped to the position of their
    /// owning document in `start_index_column` (deduplicated), then those positions are mapped
    /// to doc ids through the optional index.
    ///
    /// Correctness: positions needs to be sorted. idx_reader needs to contain monotonically
    /// increasing positions.
    ///
    /// TODO: Instead of a linear scan we can employ a exponential search into binary search to
    /// match a docid to its value position.
    pub(crate) fn select_batch_in_place(&self, docid_start: DocId, ranks: &mut Vec<u32>) {
        let Some(&first_rank) = ranks.first() else {
            return;
        };
        let mut cur_pos_in_idx = self.optional_index.rank(docid_start);
        let mut last_pos_in_idx = None;

        assert!(cur_pos_in_idx <= first_rank);

        let mut write_pos = 0;
        for i in 0..ranks.len() {
            let pos = ranks[i];
            // Advance until the value range of the current entry ends past `pos`.
            while self.start_index_column.get_val(cur_pos_in_idx + 1) <= pos {
                cur_pos_in_idx += 1;
            }
            ranks[write_pos] = cur_pos_in_idx;
            // Consecutive values of the same document collapse into a single entry.
            if last_pos_in_idx != Some(cur_pos_in_idx) {
                write_pos += 1;
            }
            last_pos_in_idx = Some(cur_pos_in_idx);
        }
        ranks.truncate(write_pos);

        // `ranks` now holds strictly increasing positions, which is what the select cursor
        // behind `select_batch` requires. Unlike calling `select` for every position, the
        // cursor does not rescan the block metadata from the first block each time.
        self.optional_index.select_batch(ranks);
    }
}

#[cfg(test)]
mod tests {
    use std::ops::Range;

    use super::MultiValueIndex;
    use crate::{ColumnarReader, DynamicColumn};

    /// Runs `select_batch_in_place` on a copy of `positions`, scanning from
    /// `doc_id_range.start`, and returns the resulting doc ids.
    fn index_to_pos_helper(
        index: &MultiValueIndex,
        doc_id_range: Range<u32>,
        positions: &[u32],
    ) -> Vec<u32> {
        let mut doc_ids = Vec::from(positions);
        index.select_batch_in_place(doc_id_range.start, &mut doc_ids);
        doc_ids
    }

    #[test]
    fn test_positions_to_docid() {
        let index = MultiValueIndex::for_test(&[0, 10, 12, 15, 22, 23]);
        assert_eq!(index.num_docs(), 5);

        // The same positions resolve to the same docs whether the scan starts at doc 0 or 1.
        let positions = &[10u32, 11, 15, 20, 21, 22];
        for doc_start in [0u32, 1] {
            assert_eq!(
                index_to_pos_helper(&index, doc_start..5, positions),
                vec![1, 3, 4]
            );
        }

        // (first doc of the scan, value positions, expected doc ids)
        let cases: [(u32, Vec<u32>, Vec<u32>); 6] = [
            (0, vec![9], vec![0]),
            (1, vec![10], vec![1]),
            (1, vec![11], vec![1]),
            (2, vec![12], vec![2]),
            (2, vec![12, 14], vec![2]),
            (2, vec![12, 14, 15], vec![2, 3]),
        ];
        for (doc_start, value_positions, expected_docs) in cases {
            assert_eq!(
                index_to_pos_helper(&index, doc_start..5, &value_positions),
                expected_docs
            );
        }
    }

    #[test]
    fn test_range_to_rowids() {
        use crate::ColumnarWriter;

        let mut columnar_writer = ColumnarWriter::default();

        // This column gets coerced to u64. Docs 1 and 5 hold two values each.
        for doc in [1, 5] {
            columnar_writer.record_numerical(doc, "full", u64::MAX);
            columnar_writer.record_numerical(doc, "full", u64::MAX);
        }

        let mut wrt: Vec<u8> = Vec::new();
        columnar_writer.serialize(7, &mut wrt).unwrap();

        let reader = ColumnarReader::open(wrt).unwrap();
        // Open the column as u64
        let column = reader.read_columns("full").unwrap()[0]
            .open()
            .unwrap()
            .coerce_numerical(crate::NumericalType::U64)
            .unwrap();
        let DynamicColumn::U64(column) = column else {
            panic!();
        };

        // (doc id range, expected row id range)
        let row_id_cases = [
            (1..2, 0..2),
            (0..2, 0..2),
            (0..4, 0..2),
            (3..4, 2..2),
            (1..6, 0..4),
            (3..6, 2..4),
            (0..6, 0..4),
            (0..6, 0..4),
        ];
        for (doc_id_range, expected_row_ids) in row_id_cases {
            let row_id_range = column.index.docid_range_to_rowids(doc_id_range);
            assert_eq!(row_id_range, expected_row_ids);
        }

        let check = |range, expected| {
            let full_range = 0..=u64::MAX;
            let mut docids = Vec::new();
            column.get_docids_for_value_range(full_range, range, &mut docids);
            assert_eq!(docids, expected);
        };

        // The two checks below are currently disabled.
        // check(0..1, vec![]);
        // check(0..2, vec![1]);
        check(1..2, vec![1]);
    }
}


================================================
FILE: columnar/src/column_index/optional_index/mod.rs
================================================
use std::io;
use std::sync::Arc;

mod set;
mod set_block;

use common::{BinarySerializable, OwnedBytes, VInt};
pub use set::{SelectCursor, Set, SetCodec};
use set_block::{
    DENSE_BLOCK_NUM_BYTES, DenseBlock, DenseBlockCodec, SparseBlock, SparseBlockCodec,
};

use crate::iterable::Iterable;
use crate::{DocId, RowId};

/// The threshold for the number of elements after which we switch to dense block encoding.
///
/// We simply pick the value that minimizes the size of the blocks: a sparse block takes two
/// bytes per element, a dense block always takes `DENSE_BLOCK_NUM_BYTES`.
const DENSE_BLOCK_THRESHOLD: u32 =
    set_block::DENSE_BLOCK_NUM_BYTES / std::mem::size_of::<u16>() as u32; //< 5_120

/// Number of row ids addressed by a single block (`1 << 16`).
const ELEMENTS_PER_BLOCK: u32 = u16::MAX as u32 + 1;

/// In-memory description of one block, computed when the index is opened.
#[derive(Copy, Clone, Debug)]
struct BlockMeta {
    /// Total number of non-null rows stored in the blocks preceding this one.
    non_null_rows_before_block: u32,
    /// Offset of the block's first byte within the block data.
    start_byte_offset: u32,
    /// Encoding of the block; it also determines the block's length in bytes.
    block_variant: BlockVariant,
}

/// Encoding used for a block of the optional index.
#[derive(Clone, Copy, Debug)]
enum BlockVariant {
    /// Fixed-size dense encoding.
    Dense,
    /// List of `num_vals` in-block row ids, two bytes each.
    Sparse { num_vals: u16 },
}

impl BlockVariant {
    /// Variant used for blocks that do not contain any value: a sparse block without elements.
    pub fn empty() -> Self {
        BlockVariant::Sparse { num_vals: 0 }
    }

    /// Number of bytes the block occupies in the serialized block data.
    pub fn num_bytes_in_block(&self) -> u32 {
        if let BlockVariant::Sparse { num_vals } = *self {
            return u32::from(num_vals) * 2;
        }
        set_block::DENSE_BLOCK_NUM_BYTES
    }
}

/// This codec is inspired by roaring bitmaps.
/// In the dense blocks, however, in order to accelerate `select`
/// we interleave an offset over two bytes. (more on this lower)
///
/// The lower 16 bits of doc ids are stored as u16 while the upper 16 bits are given by the block
/// id. Each block contains 1<<16 docids.
///
/// # Serialized Data Layout
/// The data starts with the number of rows, encoded as a VInt, followed by the block data. Each
/// block is either dense or sparse encoded, depending on the number of values in the block. A
/// block is sparse when it contains less than DENSE_BLOCK_THRESHOLD (5120) values.
/// [Sparse data block | dense data block, .. #repeat*; Desc: Either a sparse or dense encoded
/// block]
/// ### Sparse block data
/// [u16 LE, .. #repeat*; Desc: Positions with values in a block]
/// ### Dense block data
/// [Dense codec for the whole block; Desc: Similar to a bitvec(0..ELEMENTS_PER_BLOCK) + Metadata
/// for faster lookups. See dense.rs]
///
/// The data is followed by block metadata, to know which area of the raw block data belongs to
/// which block. Only metadata for blocks with elements is recorded to
/// keep the overhead low for scenarios with many very sparse columns. The block metadata consists
/// of the block index and the number of values in the block. Since we don't store empty blocks
/// num_vals is decremented by 1 when stored, e.g. a stored 0 means 1 value.
///
/// The last u16 is storing the number of metadata blocks.
/// [VInt; Desc: num rows][u16 LE, .. #repeat*; Desc: Positions with values in a block][(u16 LE,
/// u16 LE), .. #repeat*; Desc: (Block Id u16, Num Elements - 1 u16)][u16 LE; Desc: num blocks
/// with values u16]
///
/// # Opening
/// When opening the data layout, the block metadata is expanded to a slice of `BlockMeta`, where
/// the index is the block index; blocks without values get an empty sparse entry. For each block
/// `start_byte_offset` and `non_null_rows_before_block` are computed.
#[derive(Clone)]
pub struct OptionalIndex {
    /// Total number of rows (null or not) covered by the index.
    num_docs: RowId,
    /// Number of rows holding a value.
    num_non_null_docs: RowId,
    /// Concatenated sparse/dense block payloads.
    block_data: OwnedBytes,
    /// One entry per block, indexed by block id.
    block_metas: Arc<[BlockMeta]>,
}

impl Iterable<u32> for &OptionalIndex {
    /// Iterates over the row ids that hold a value.
    fn boxed_iter(&self) -> Box<dyn Iterator<Item = u32> + '_> {
        let non_null_docs = self.iter_non_null_docs();
        Box::new(non_null_docs)
    }
}

impl std::fmt::Debug for OptionalIndex {
    /// Prints the row counts only; block data and block metadata are omitted.
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        let mut debug_struct = f.debug_struct("OptionalIndex");
        debug_struct.field("num_docs", &self.num_docs);
        debug_struct.field("num_non_null_docs", &self.num_non_null_docs);
        debug_struct.finish_non_exhaustive()
    }
}

/// Splits a value address into lower and upper 16bits.
/// The lower 16 bits are the value in the block
/// The upper 16 bits are the block index
#[derive(Copy, Debug, Clone)]
struct RowAddr {
    /// Index of the block containing the row (`row_id / ELEMENTS_PER_BLOCK`).
    block_id: u16,
    /// Position of the row within its block (`row_id % ELEMENTS_PER_BLOCK`).
    in_block_row_id: u16,
}

/// Decomposes a row id into the id of its block and its position inside that block.
#[inline(always)]
fn row_addr_from_row_id(row_id: RowId) -> RowAddr {
    let block_id = (row_id / ELEMENTS_PER_BLOCK) as u16;
    let in_block_row_id = (row_id % ELEMENTS_PER_BLOCK) as u16;
    RowAddr {
        block_id,
        in_block_row_id,
    }
}

/// Select cursor over a single block, wrapping the cursor of either encoding.
enum BlockSelectCursor<'a> {
    Dense(<DenseBlock<'a> as Set<u16>>::SelectCursor<'a>),
    Sparse(<SparseBlock<'a> as Set<u16>>::SelectCursor<'a>),
}

impl BlockSelectCursor<'_> {
    /// Forwards `select` to the cursor of the wrapped block.
    fn select(&mut self, rank: u16) -> u16 {
        match self {
            Self::Dense(cursor) => cursor.select(rank),
            Self::Sparse(cursor) => cursor.select(rank),
        }
    }
}
/// Cursor answering successive `select` calls on an `OptionalIndex`.
///
/// It keeps the last visited block loaded, and only searches for another block once the
/// requested rank reaches `current_block_end_rank`.
pub struct OptionalIndexSelectCursor<'a> {
    /// Cursor over the currently loaded block.
    current_block_cursor: BlockSelectCursor<'a>,
    /// Id of the currently loaded block.
    current_block_id: u16,
    // The current block is guaranteed to contain ranks < end_rank.
    current_block_end_rank: RowId,
    /// Index this cursor reads from.
    optional_index: &'a OptionalIndex,
    /// Row id of the first row of the current block.
    block_doc_idx_start: RowId,
    /// Despite its name, this holds the number of NON-null rows before the current block: it is
    /// assigned from `BlockMeta::non_null_rows_before_block` and subtracted from the requested
    /// rank to obtain the rank within the block.
    num_null_rows_before_block: RowId,
}

impl OptionalIndexSelectCursor<'_> {
    /// Makes sure the block containing `rank` is the one currently loaded.
    ///
    /// The search for the block starts at the current block.
    fn search_and_load_block(&mut self, rank: RowId) {
        if rank < self.current_block_end_rank {
            // we are already in the right block
            return;
        }
        let optional_index = self.optional_index;
        let block_id = optional_index.find_block(rank, self.current_block_id);
        let block_pos = block_id as usize;
        let block_meta = optional_index.block_metas[block_pos];

        self.current_block_id = block_id;
        // The next block's offset is the first rank past this block; the last block is
        // unbounded.
        self.current_block_end_rank = optional_index
            .block_metas
            .get(block_pos + 1)
            .map_or(u32::MAX, |next_meta| next_meta.non_null_rows_before_block);
        self.block_doc_idx_start = u32::from(block_id) * ELEMENTS_PER_BLOCK;
        self.num_null_rows_before_block = block_meta.non_null_rows_before_block;
        self.current_block_cursor = match optional_index.block(block_meta) {
            Block::Dense(dense_block) => BlockSelectCursor::Dense(dense_block.select_cursor()),
            Block::Sparse(sparse_block) => BlockSelectCursor::Sparse(sparse_block.select_cursor()),
        };
    }
}

impl SelectCursor<RowId> for OptionalIndexSelectCursor<'_> {
    fn select(&mut self, rank: RowId) -> RowId {
        self.search_and_load_block(rank);
        let index_in_block = (rank - self.num_null_rows_before_block) as u16;
        self.current_block_cursor.select(index_in_block) as RowId + self.block_doc_idx_start
    }
}

impl Set<RowId> for OptionalIndex {
    type SelectCursor<'b>
        = OptionalIndexSelectCursor<'b>
    where Self: 'b;

    /// Checks whether the value at `row_id` is not null.
    ///
    /// Any `row_id` is allowed: a row id whose block lies past the end of the index is reported
    /// as absent, consistently with `rank` and `rank_if_exists`.
    #[inline]
    fn contains(&self, row_id: RowId) -> bool {
        let RowAddr {
            block_id,
            in_block_row_id,
        } = row_addr_from_row_id(row_id);
        let Some(&block_meta) = self.block_metas.get(block_id as usize) else {
            return false;
        };
        match self.block(block_meta) {
            Block::Dense(dense_block) => dense_block.contains(in_block_row_id),
            Block::Sparse(sparse_block) => sparse_block.contains(in_block_row_id),
        }
    }

    /// Returns the rank computed for `doc_id`: the number of non-null rows before its block
    /// plus its rank within that block.
    ///
    /// Any value doc_id is allowed.
    /// In particular, doc_id = num_rows: every doc id at or past `num_docs()` has rank
    /// `num_non_nulls()`.
    #[inline]
    fn rank(&self, doc_id: DocId) -> RowId {
        if doc_id >= self.num_docs() {
            return self.num_non_nulls();
        }
        let RowAddr {
            block_id,
            in_block_row_id,
        } = row_addr_from_row_id(doc_id);
        let block_meta = self.block_metas[block_id as usize];
        let block = self.block(block_meta);

        let block_offset_row_id = match block {
            Block::Dense(dense_block) => dense_block.rank(in_block_row_id),
            Block::Sparse(sparse_block) => sparse_block.rank(in_block_row_id),
        } as u32;
        block_meta.non_null_rows_before_block + block_offset_row_id
    }

    /// Returns the rank of `doc_id` if it holds a value, `None` otherwise.
    ///
    /// Any value doc_id is allowed: doc ids past the last block yield `None`.
    #[inline]
    fn rank_if_exists(&self, doc_id: DocId) -> Option<RowId> {
        let RowAddr {
            block_id,
            in_block_row_id,
        } = row_addr_from_row_id(doc_id);
        let block_meta = *self.block_metas.get(block_id as usize)?;
        let block = self.block(block_meta);
        let block_offset_row_id = match block {
            Block::Dense(dense_block) => dense_block.rank_if_exists(in_block_row_id),
            Block::Sparse(sparse_block) => sparse_block.rank_if_exists(in_block_row_id),
        }? as u32;
        Some(block_meta.non_null_rows_before_block + block_offset_row_id)
    }

    /// Returns the row id of the `rank`-th non-null row.
    ///
    /// The block is searched from the first block on every call; use `select_cursor` to resolve
    /// several increasing ranks.
    #[inline]
    fn select(&self, rank: RowId) -> RowId {
        let block_pos = self.find_block(rank, 0);
        let block_doc_idx_start = (block_pos as u32) * ELEMENTS_PER_BLOCK;
        let block_meta = self.block_metas[block_pos as usize];
        let block: Block<'_> = self.block(block_meta);
        let index_in_block = (rank - block_meta.non_null_rows_before_block) as u16;
        let in_block_rank = match block {
            Block::Dense(dense_block) => dense_block.select(index_in_block),
            Block::Sparse(sparse_block) => sparse_block.select(index_in_block),
        };
        block_doc_idx_start + in_block_rank as u32
    }

    /// Creates a cursor that has no block loaded yet; the first `select` loads one.
    fn select_cursor(&self) -> OptionalIndexSelectCursor<'_> {
        OptionalIndexSelectCursor {
            current_block_cursor: BlockSelectCursor::Sparse(
                SparseBlockCodec::open(b"").select_cursor(),
            ),
            current_block_id: 0u16,
            current_block_end_rank: 0u32, //< this is sufficient to force the first load
            optional_index: self,
            block_doc_idx_start: 0u32,
            num_null_rows_before_block: 0u32,
        }
    }
}

impl OptionalIndex {
    /// Builds an index over `num_rows` rows in which exactly `row_ids` hold a value, by
    /// serializing and reopening it.
    ///
    /// # Panics
    ///
    /// Panics if the last row id is not smaller than `num_rows`.
    pub fn for_test(num_rows: RowId, row_ids: &[RowId]) -> OptionalIndex {
        assert!(
            row_ids
                .last()
                .copied()
                .map(|last_row_id| last_row_id < num_rows)
                .unwrap_or(true)
        );
        let mut buffer = Vec::new();
        serialize_optional_index(&row_ids, num_rows, &mut buffer).unwrap();
        let bytes = OwnedBytes::new(buffer);
        open_optional_index(bytes).unwrap()
    }

    /// Total number of rows (null or not) covered by the index.
    pub fn num_docs(&self) -> RowId {
        self.num_docs
    }

    /// Number of rows holding a value.
    pub fn num_non_nulls(&self) -> RowId {
        self.num_non_null_docs
    }

    /// Iterates over the row ids holding a value.
    pub fn iter_non_null_docs(&self) -> impl Iterator<Item = RowId> + '_ {
        // TODO optimize. We could iterate over the blocks directly.
        // We use the dense value ids and retrieve the doc ids via select.
        let mut select_batch = self.select_cursor();
        (0..self.num_non_null_docs).map(move |rank| select_batch.select(rank))
    }

    /// Replaces every rank of `ranks` by the row id of the corresponding non-null row.
    ///
    /// A single select cursor is used for the whole batch, so the ranks have to be increasing.
    pub fn select_batch(&self, ranks: &mut [RowId]) {
        let mut select_cursor = self.select_cursor();
        for rank in ranks.iter_mut() {
            *rank = select_cursor.select(*rank);
        }
    }

    /// Opens the block described by `block_meta` on top of the block data.
    #[inline]
    fn block(&self, block_meta: BlockMeta) -> Block<'_> {
        let BlockMeta {
            start_byte_offset,
            block_variant,
            ..
        } = block_meta;
        let start_byte_offset = start_byte_offset as usize;
        let bytes = self.block_data.as_slice();
        match block_variant {
            BlockVariant::Dense => Block::Dense(DenseBlockCodec::open(
                &bytes[start_byte_offset..start_byte_offset + DENSE_BLOCK_NUM_BYTES as usize],
            )),
            BlockVariant::Sparse { num_vals } => {
                let end_byte_offset = start_byte_offset + num_vals as usize * 2;
                let sparse_bytes = &bytes[start_byte_offset..end_byte_offset];
                Block::Sparse(SparseBlockCodec::open(sparse_bytes))
            }
        }
    }

    /// Returns the position of the block containing the non-null row of rank `dense_idx`.
    ///
    /// The scan starts at `start_block_pos` and stops at the first block that starts past
    /// `dense_idx`; the block right before it is the answer. When no such block exists, the
    /// last block is returned.
    #[inline]
    fn find_block(&self, dense_idx: u32, start_block_pos: u16) -> u16 {
        // Block positions are scanned as `usize`: an index can hold up to `1 << 16` blocks,
        // a count that does not fit in a `u16`.
        let num_blocks = self.block_metas.len();
        let first_block_past_idx = (start_block_pos as usize..num_blocks)
            .find(|&block_pos| self.block_metas[block_pos].non_null_rows_before_block > dense_idx)
            .unwrap_or(num_blocks);
        (first_block_past_idx - 1) as u16
    }

    // TODO Add a good API for the codec_idx to original_idx translation.
    // The Iterator API is a probably a bad idea
}

/// A block of the optional index, opened on top of the block data with either encoding.
#[derive(Copy, Clone)]
enum Block<'a> {
    Dense(DenseBlock<'a>),
    Sparse(SparseBlock<'a>),
}

/// Writes the in-block row ids of one block, picking the sparse or the dense encoding from
/// the number of elements.
fn serialize_optional_index_block(block_els: &[u16], out: &mut impl io::Write) -> io::Result<()> {
    let elements = block_els.iter().copied();
    if is_sparse(block_els.len() as u32) {
        SparseBlockCodec::serialize(elements, out)
    } else {
        DenseBlockCodec::serialize(elements, out)
    }
}

/// Serializes the set of non-null rows of a column of `num_rows` rows.
///
/// The output consists of the row count (VInt), the block payloads, one metadata entry per
/// non-empty block and, last, the number of metadata entries as a u16.
///
/// `non_null_rows` is expected to yield row ids in increasing order: a new block is started
/// whenever the block id of a row differs from the one of the previous row.
///
/// # Errors
///
/// Returns any error of the underlying writer, and an `InvalidInput` error if the number of
/// non-empty blocks does not fit in the u16 footer.
pub fn serialize_optional_index<W: io::Write>(
    non_null_rows: &dyn Iterable<RowId>,
    num_rows: RowId,
    output: &mut W,
) -> io::Result<()> {
    VInt(num_rows as u64).serialize(output)?;

    let mut rows_it = non_null_rows.boxed_iter();
    let mut block_metadata: Vec<SerializedBlockMeta> = Vec::new();
    let mut current_block = Vec::new();

    // An index without any non-null row has no block at all: it is just the row count
    // followed by a zero block count. Past this point `current_block` is never empty.
    let Some(idx) = rows_it.next() else {
        output.write_all(&0u16.to_le_bytes())?;
        return Ok(());
    };

    let row_addr = row_addr_from_row_id(idx);

    let mut current_block_id = row_addr.block_id;
    current_block.push(row_addr.in_block_row_id);

    for idx in rows_it {
        let value_addr = row_addr_from_row_id(idx);
        if current_block_id != value_addr.block_id {
            // The row belongs to another block: flush the one accumulated so far.
            serialize_optional_index_block(&current_block[..], output)?;
            block_metadata.push(SerializedBlockMeta {
                block_id: current_block_id,
                num_non_null_rows: current_block.len() as u32,
            });
            current_block.clear();
            current_block_id = value_addr.block_id;
        }
        current_block.push(value_addr.in_block_row_id);
    }

    // handle last block
    serialize_optional_index_block(&current_block[..], output)?;

    block_metadata.push(SerializedBlockMeta {
        block_id: current_block_id,
        num_non_null_rows: current_block.len() as u32,
    });

    // The footer stores the block count on two bytes. Truncating it silently would produce
    // an index that cannot be read back.
    let num_blocks = u16::try_from(block_metadata.len()).map_err(|_| {
        io::Error::new(
            io::ErrorKind::InvalidInput,
            "too many non-empty blocks in optional index",
        )
    })?;

    for block in &block_metadata {
        output.write_all(&block.to_bytes())?;
    }

    output.write_all(&num_blocks.to_le_bytes())?;

    Ok(())
}

/// Size in bytes of a serialized block metadata entry: block id (u16) + row count (u16).
const SERIALIZED_BLOCK_META_NUM_BYTES: usize = 4;

/// Metadata stored for every non-empty block.
#[derive(Clone, Copy, Debug)]
struct SerializedBlockMeta {
    block_id: u16,
    num_non_null_rows: u32, //< takes values in 1..=(u16::MAX + 1)
}

// TODO unit tests
impl SerializedBlockMeta {
    /// Decodes an entry: block id first, then the number of non-null rows minus one, both as
    /// little-endian u16.
    #[inline]
    fn from_bytes(bytes: [u8; SERIALIZED_BLOCK_META_NUM_BYTES]) -> SerializedBlockMeta {
        let [block_id_lo, block_id_hi, num_rows_lo, num_rows_hi] = bytes;
        let block_id = u16::from_le_bytes([block_id_lo, block_id_hi]);
        // Undo the `- 1` applied by `to_bytes`.
        let num_non_null_rows = u32::from(u16::from_le_bytes([num_rows_lo, num_rows_hi])) + 1u32;
        SerializedBlockMeta {
            block_id,
            num_non_null_rows,
        }
    }

    /// Encodes the entry.
    ///
    /// # Panics
    ///
    /// Panics if `num_non_null_rows` is not within `1..=(1 << 16)`.
    #[inline]
    fn to_bytes(self) -> [u8; SERIALIZED_BLOCK_META_NUM_BYTES] {
        assert!(self.num_non_null_rows > 0);
        // We don't store empty blocks, therefore we can subtract 1.
        // This way we will be able to use u16 when the number of elements is 1 << 16 or u16::MAX+1
        let stored_num_rows = u16::try_from(self.num_non_null_rows - 1u32)
            .expect("a block holds at most 1 << 16 rows");
        let mut bytes = [0u8; SERIALIZED_BLOCK_META_NUM_BYTES];
        bytes[0..2].copy_from_slice(&self.block_id.to_le_bytes());
        bytes[2..4].copy_from_slice(&stored_num_rows.to_le_bytes());
        bytes
    }
}

/// Tells whether a block holding `num_rows_in_block` values uses the sparse encoding, i.e.
/// whether it is strictly below `DENSE_BLOCK_THRESHOLD`.
#[inline]
fn is_sparse(num_rows_in_block: u32) -> bool {
    DENSE_BLOCK_THRESHOLD > num_rows_in_block
}

/// Expands the serialized metadata of the non-empty blocks into one `BlockMeta` per block.
///
/// Blocks without serialized metadata (before, between and after the non-empty blocks, up to
/// the block count implied by `num_rows`) are filled with empty sparse blocks.
///
/// Returns the block metadata along with the total number of non-null rows.
fn deserialize_optional_index_block_metadatas(
    data: &[u8],
    num_rows: u32,
) -> (Box<[BlockMeta]>, u32) {
    // Entry used for blocks that hold no value.
    let empty_block_meta = |non_null_rows_before_block: u32, start_byte_offset: u32| BlockMeta {
        non_null_rows_before_block,
        start_byte_offset,
        block_variant: BlockVariant::empty(),
    };

    let num_serialized_blocks = data.len() / SERIALIZED_BLOCK_META_NUM_BYTES;
    let mut block_metas: Vec<BlockMeta> = Vec::with_capacity(num_serialized_blocks + 1);
    let mut byte_cursor = 0u32;
    let mut num_non_nulls_so_far = 0u32;

    for raw_meta in data.chunks_exact(SERIALIZED_BLOCK_META_NUM_BYTES) {
        let serialized = SerializedBlockMeta::from_bytes(raw_meta.try_into().unwrap());
        // Pad with empty blocks up to the id of this block.
        block_metas.resize(
            serialized.block_id as usize,
            empty_block_meta(num_non_nulls_so_far, byte_cursor),
        );
        let block_variant = match serialized.num_non_null_rows {
            num_vals if is_sparse(num_vals) => BlockVariant::Sparse {
                num_vals: num_vals as u16,
            },
            _ => BlockVariant::Dense,
        };
        block_metas.push(BlockMeta {
            non_null_rows_before_block: num_non_nulls_so_far,
            start_byte_offset: byte_cursor,
            block_variant,
        });
        byte_cursor += block_variant.num_bytes_in_block();
        num_non_nulls_so_far += serialized.num_non_null_rows;
    }

    // Trailing blocks without any value.
    let total_num_blocks = num_rows.div_ceil(ELEMENTS_PER_BLOCK) as usize;
    block_metas.resize(
        total_num_blocks,
        empty_block_meta(num_non_nulls_so_far, byte_cursor),
    );
    (block_metas.into_boxed_slice(), num_non_nulls_so_far)
}

/// Opens an optional index serialized by `serialize_optional_index`.
///
/// The number of non-empty blocks is read from the last two bytes, the number of rows from the
/// leading VInt; the block metadata sits right before the footer and the block data in between.
///
/// # Errors
///
/// Returns an error if the data is too short to hold its footer or its block metadata, or if
/// the row count cannot be decoded.
pub fn open_optional_index(bytes: OwnedBytes) -> io::Result<OptionalIndex> {
    const NUM_BLOCKS_FOOTER_NUM_BYTES: usize = 2;
    if bytes.len() < NUM_BLOCKS_FOOTER_NUM_BYTES {
        return Err(io::Error::new(
            io::ErrorKind::UnexpectedEof,
            "optional index is too short to contain its block count",
        ));
    }
    let (mut bytes, num_non_empty_blocks_bytes) = bytes.rsplit(NUM_BLOCKS_FOOTER_NUM_BYTES);
    let num_non_empty_blocks =
        u16::from_le_bytes(num_non_empty_blocks_bytes.as_slice().try_into().unwrap());
    let num_docs = VInt::deserialize_u64(&mut bytes)? as u32;
    let block_metas_num_bytes = num_non_empty_blocks as usize * SERIALIZED_BLOCK_META_NUM_BYTES;
    if bytes.len() < block_metas_num_bytes {
        return Err(io::Error::new(
            io::ErrorKind::UnexpectedEof,
            "optional index is too short to contain its block metadata",
        ));
    }
    let (block_data, block_metas) = bytes.rsplit(block_metas_num_bytes);
    let (block_metas, num_non_null_docs) =
        deserialize_optional_index_block_metadatas(block_metas.as_slice(), num_docs);
    let optional_index = OptionalIndex {
        num_docs,
        num_non_null_docs,
        block_data,
        block_metas: block_metas.into(),
    };
    Ok(optional_index)
}

#[cfg(test)]
mod tests;


================================================
FILE: columnar/src/column_index/optional_index/set.rs
================================================
use std::io;

/// A codec makes it possible to serialize a set of
/// elements, and open the resulting Set representation.
pub trait SetCodec {
    /// Type of the elements of the set.
    type Item: Copy + TryFrom<usize> + Eq + std::hash::Hash + std::fmt::Debug;
    /// Read-only view over the serialized set.
    type Reader<'a>: Set<Self::Item>;

    /// Serializes a set of unique sorted elements.
    ///
    /// May panic if the elements are not sorted.
    fn serialize(els: impl Iterator<Item = Self::Item>, wrt: impl io::Write) -> io::Result<()>;

    /// Opens a set over the bytes produced by `serialize`.
    fn open(data: &[u8]) -> Self::Reader<'_>;
}

/// Stateful object that makes it possible to compute several select in a row,
/// provided the rank passed as argument are increasing.
pub trait SelectCursor<T> {
    /// Returns the `rank`-th element of the set.
    ///
    /// May panic if rank is greater than the number of elements in the Set,
    /// or if rank is < than value provided in the previous call.
    fn select(&mut self, rank: T) -> T;
}

/// Read-only sorted set of elements supporting membership, `rank` and `select` queries.
pub trait Set<T> {
    /// Cursor type used to run several `select` calls with increasing ranks.
    type SelectCursor<'b>: SelectCursor<T>
    where Self: 'b;

    /// Returns true if the element is contained in the Set.
    fn contains(&self, el: T) -> bool;

    /// Returns the element's rank (its position in the set).
    /// If the set does not contain the element, it will return the next existing element's rank.
    fn rank(&self, el: T) -> T;

    /// If the set contains `el`, returns the element's rank (its position in the set).
    /// If the set does not contain the element, it returns `None`.
    fn rank_if_exists(&self, el: T) -> Option<T>;

    /// Return the rank-th value stored in this bitmap.
    ///
    /// # Panics
    ///
    /// May panic if rank is greater or equal to the number of
    /// elements in the Set.
    fn select(&self, rank: T) -> T;

    /// Creates a brand new select cursor.
    fn select_cursor(&self) -> Self::SelectCursor<'_>;
}


================================================
FILE: columnar/src/column_index/optional_index/set_block/dense.rs
================================================
use std::io::{self, Write};

use common::BinarySerializable;

use crate::column_index::optional_index::{ELEMENTS_PER_BLOCK, SelectCursor, Set, SetCodec};

/// Returns true if bit `n` (0 being the least significant bit) of `input` is set.
#[inline(always)]
fn get_bit_at(input: u64, n: u16) -> bool {
    (input >> n) & 1 == 1
}

/// Sets bit `n` (0 being the least significant bit) of `input`, leaving the other bits as is.
#[inline]
fn set_bit_at(input: &mut u64, n: u16) {
    let mask = 1u64 << n;
    *input |= mask;
}

/// For the `DenseCodec`, `data` contains the encoded mini blocks.
/// Each mini block consists of [u8; 10]. The first 8 bytes is a bitvec for 64 elements.
/// The last 2 bytes are the offset, the number of set bits so far.
///
/// When translating the original index to a dense index, the correct block can be computed
/// directly `orig_idx/64`. Inside the block the position is `orig_idx%64`.
///
/// When translating a dense index to the original index, we can use the offset to find the correct
/// block. Direct computation is not possible, but we can employ a linear or binary search.
const ELEMENTS_PER_MINI_BLOCK: u16 = 64;
const MINI_BLOCK_BITVEC_NUM_BYTES: usize = 8;
const MINI_BLOCK_OFFSET_NUM_BYTES: usize = 2;
pub const MINI_BLOCK_NUM_BYTES: usize = MINI_BLOCK_BITVEC_NUM_BYTES + MINI_BLOCK_OFFSET_NUM_BYTES;

/// Number of bytes in a dense block: one mini block per 64 elements of the block.
pub const DENSE_BLOCK_NUM_BYTES: u32 =
    (ELEMENTS_PER_BLOCK / ELEMENTS_PER_MINI_BLOCK as u32) * MINI_BLOCK_NUM_BYTES as u32;

/// Codec storing a set of `u16` as a fixed-size sequence of bitvec mini-blocks.
pub struct DenseBlockCodec;

impl SetCodec for DenseBlockCodec {
    type Item = u16;
    type Reader<'a> = DenseBlock<'a>;

    /// Writes `els` in the dense block format by delegating to `serialize_dense_codec`.
    fn serialize(els: impl Iterator<Item = u16>, wrt: impl io::Write) -> io::Result<()> {
        serialize_dense_codec(els, wrt)
    }

    /// Wraps `data` into a `DenseBlock` reader without copying it.
    ///
    /// # Panics
    ///
    /// Panics if `data` is not exactly `DENSE_BLOCK_NUM_BYTES` bytes long.
    #[inline]
    fn open(data: &[u8]) -> Self::Reader<'_> {
        let expected_num_bytes = DENSE_BLOCK_NUM_BYTES as usize;
        assert_eq!(data.len(), expected_num_bytes);
        DenseBlock(data)
    }
}

/// Interprets `bitvec` as a set of integers within `0..=63` and, given an element `el`,
/// returns the number of elements of the set that are strictly lower than `el`.
///
/// # Panics
///
/// May panic or return a wrong result if `el >= 64`.
#[inline(always)]
fn rank_u64(bitvec: u64, el: u16) -> u16 {
    debug_assert!(el < 64);
    // Keep only the bits at positions `0..el`, then count them.
    let mask = (1u64 << el) - 1;
    (bitvec & mask).count_ones() as u16
}

/// Returns the position of the `rank`-th set bit of `bitvec` (`rank` starts at 0).
///
/// The `rank` lowest set bits are cleared one by one; the position of the lowest remaining
/// set bit is the answer. `bitvec` is expected to hold more than `rank` set bits.
#[inline(always)]
fn select_u64(mut bitvec: u64, rank: u16) -> u16 {
    let mut bits_to_clear = rank;
    while bits_to_clear > 0 {
        // `x & (x - 1)` clears the lowest set bit of `x`.
        bitvec &= bitvec - 1;
        bits_to_clear -= 1;
    }
    bitvec.trailing_zeros() as u16
}

// TODO test the following solution on Intel... on Ryzen Zen <3 it is a catastrophe.
// #[target_feature(enable = "bmi2")]
// unsafe fn select_bitvec_unsafe(bitvec: u64, rank: u16) -> u16 {
//     let pdep = _pdep_u64(1u64 << rank, bitvec);
//     pdep.trailing_zeros() as u16
// }

/// Decoded form of one mini-block: a 64-bit bitvec and the rank stored next to it.
#[derive(Clone, Copy, Debug)]
struct DenseMiniBlock {
    /// One bit per element covered by this mini-block.
    bitvec: u64,
    /// Rank value serialized right after the bitvec.
    rank: u16,
}

impl DenseMiniBlock {
    /// Decodes a mini-block: little-endian bitvec first, little-endian rank second.
    fn from_bytes(data: [u8; MINI_BLOCK_NUM_BYTES]) -> Self {
        let (bitvec_bytes, rank_bytes) = data.split_at(MINI_BLOCK_BITVEC_NUM_BYTES);
        DenseMiniBlock {
            bitvec: u64::from_le_bytes(bitvec_bytes.try_into().unwrap()),
            rank: u16::from_le_bytes(rank_bytes.try_into().unwrap()),
        }
    }

    /// Encodes the mini-block with the layout read back by `from_bytes`.
    fn to_bytes(self) -> [u8; MINI_BLOCK_NUM_BYTES] {
        let mut bytes = [0u8; MINI_BLOCK_NUM_BYTES];
        let (bitvec_bytes, rank_bytes) = bytes.split_at_mut(MINI_BLOCK_BITVEC_NUM_BYTES);
        bitvec_bytes.copy_from_slice(&self.bitvec.to_le_bytes());
        rank_bytes.copy_from_slice(&self.rank.to_le_bytes());
        bytes
    }
}

/// Read-only view over the serialized bytes of a dense block.
///
/// The wrapped slice is read as a sequence of `MINI_BLOCK_NUM_BYTES`-long mini-blocks.
#[derive(Copy, Clone)]
pub struct DenseBlock<'a>(&'a [u8]);

/// Cursor answering `select` queries on a dense block.
///
/// It remembers the mini-block of its previous answer, and the next lookup starts scanning
/// from that mini-block instead of from the beginning of the block.
pub struct DenseBlockSelectCursor<'a> {
    /// Mini-block from which the next lookup starts scanning.
    block_id: u16,
    /// Block being queried.
    dense_block: DenseBlock<'a>,
}

impl SelectCursor<u16> for DenseBlockSelectCursor<'_> {
    /// Returns the element of given `rank`.
    ///
    /// # Panics
    ///
    /// Panics if no mini-block at or after the remembered one has a stored rank `<= rank`.
    #[inline]
    fn select(&mut self, rank: u16) -> u16 {
        let mini_block_id = self
            .dense_block
            .find_miniblock_containing_rank(rank, self.block_id)
            .unwrap();
        self.block_id = mini_block_id;
        let mini_block = self.dense_block.mini_block(mini_block_id);
        let rank_in_mini_block = rank - mini_block.rank;
        let pos_in_mini_block = select_u64(mini_block.bitvec, rank_in_mini_block);
        mini_block_id * ELEMENTS_PER_MINI_BLOCK + pos_in_mini_block
    }
}

impl<'a> Set<u16> for DenseBlock<'a> {
    type SelectCursor<'b>
        = DenseBlockSelectCursor<'a>
    where Self: 'b;

    /// Returns whether the bit of `el` is set in the mini-block covering it.
    #[inline(always)]
    fn contains(&self, el: u16) -> bool {
        let mini_block = self.mini_block(el / ELEMENTS_PER_MINI_BLOCK);
        get_bit_at(mini_block.bitvec, el % ELEMENTS_PER_MINI_BLOCK)
    }

    /// Returns the rank of `el` if its bit is set, `None` otherwise.
    #[inline(always)]
    fn rank_if_exists(&self, el: u16) -> Option<u16> {
        let mini_block = self.mini_block(el / ELEMENTS_PER_MINI_BLOCK);
        let bit_pos = el % ELEMENTS_PER_MINI_BLOCK;
        let rank = mini_block.rank + rank_u64(mini_block.bitvec, bit_pos);
        get_bit_at(mini_block.bitvec, bit_pos).then_some(rank)
    }

    /// Returns the rank stored in the mini-block of `el` plus the number of bits set before
    /// `el` within that mini-block.
    #[inline(always)]
    fn rank(&self, el: u16) -> u16 {
        let mini_block = self.mini_block(el / ELEMENTS_PER_MINI_BLOCK);
        let ones_before_el = rank_u64(mini_block.bitvec, el % ELEMENTS_PER_MINI_BLOCK);
        mini_block.rank + ones_before_el
    }

    /// Returns the element of given `rank`, scanning the mini-blocks from the first one.
    ///
    /// # Panics
    ///
    /// Panics if no mini-block has a stored rank `<= rank`.
    #[inline(always)]
    fn select(&self, rank: u16) -> u16 {
        let mini_block_id = self.find_miniblock_containing_rank(rank, 0).unwrap();
        let mini_block = self.mini_block(mini_block_id);
        let pos_in_mini_block = select_u64(mini_block.bitvec, rank - mini_block.rank);
        mini_block_id * ELEMENTS_PER_MINI_BLOCK + pos_in_mini_block
    }

    /// Creates a cursor positioned on the first mini-block.
    #[inline(always)]
    fn select_cursor(&self) -> Self::SelectCursor<'_> {
        DenseBlockSelectCursor {
            dense_block: *self,
            block_id: 0,
        }
    }
}

impl DenseBlock<'_> {
    /// Decodes the mini-block number `mini_block_id`.
    ///
    /// # Panics
    ///
    /// Panics if the mini-block lies outside of the wrapped data.
    #[inline]
    fn mini_block(&self, mini_block_id: u16) -> DenseMiniBlock {
        let start = mini_block_id as usize * MINI_BLOCK_NUM_BYTES;
        let end = start + MINI_BLOCK_NUM_BYTES;
        let mini_block_bytes: [u8; MINI_BLOCK_NUM_BYTES] = self.0[start..end].try_into().unwrap();
        DenseMiniBlock::from_bytes(mini_block_bytes)
    }

    /// Iterates over `(mini_block_id, mini_block)` pairs, starting at `from_block_id`.
    #[inline]
    fn iter_miniblocks(
        &self,
        from_block_id: u16,
    ) -> impl Iterator<Item = (u16, DenseMiniBlock)> + '_ {
        let raw_mini_blocks = self.0.chunks_exact(MINI_BLOCK_NUM_BYTES).enumerate();
        raw_mini_blocks
            .skip(from_block_id as usize)
            .map(|(mini_block_id, raw)| {
                let raw: [u8; MINI_BLOCK_NUM_BYTES] = raw.try_into().unwrap();
                (mini_block_id as u16, DenseMiniBlock::from_bytes(raw))
            })
    }

    /// Finds the mini-block containing the element of given `rank`.
    ///
    /// Mini-blocks are scanned linearly from `from_block_id` for as long as their stored rank
    /// is `<= rank`; the id of the last one visited is returned. Returns `None` if the very
    /// first scanned mini-block already has a stored rank greater than `rank` (or if there is
    /// no mini-block to scan).
    ///
    /// # Correctness
    /// `rank` needs to be smaller than the number of values in the block.
    #[inline]
    fn find_miniblock_containing_rank(&self, rank: u16, from_block_id: u16) -> Option<u16> {
        let mut containing_block_id = None;
        for (mini_block_id, mini_block) in self.iter_miniblocks(from_block_id) {
            if mini_block.rank > rank {
                break;
            }
            containing_block_id = Some(mini_block_id);
        }
        containing_block_id
    }
}

/// Serializes the set of elements `els` as a dense block.
///
/// One mini-block is written for every mini-block id in `0..=u16::MAX / 64`: its bitvec,
/// followed by the number of elements found in the mini-blocks written before it.
///
/// The mini-block cursor only ever moves forward, so `els` has to yield its elements in
/// increasing order.
pub fn serialize_dense_codec(
    els: impl Iterator<Item = u16>,
    mut output: impl Write,
) -> io::Result<()> {
    let mut rank_so_far: u16 = 0;
    let mut pending_bitvec: u64 = 0;
    let mut next_mini_block_id: u16 = 0;
    for el in els {
        let target_mini_block_id = el / ELEMENTS_PER_MINI_BLOCK;
        // Flush every mini-block located before the one holding `el`.
        while next_mini_block_id < target_mini_block_id {
            let mini_block = DenseMiniBlock {
                bitvec: pending_bitvec,
                rank: rank_so_far,
            };
            output.write_all(&mini_block.to_bytes())?;
            rank_so_far += pending_bitvec.count_ones() as u16;
            pending_bitvec = 0;
            next_mini_block_id += 1;
        }
        set_bit_at(&mut pending_bitvec, el % ELEMENTS_PER_MINI_BLOCK);
    }
    // Flush the mini-block in progress, then pad with empty mini-blocks up to the last id.
    let last_mini_block_id = u16::MAX / ELEMENTS_PER_MINI_BLOCK;
    while next_mini_block_id <= last_mini_block_id {
        pending_bitvec.serialize(&mut output)?;
        rank_so_far.serialize(&mut output)?;
        // The addition wraps around to 0 exactly when all bits of the block are set.
        // This is harmless: the value computed after the last mini-block is never written.
        rank_so_far = rank_so_far.wrapping_add(pending_bitvec.count_ones() as u16);
        pending_bitvec = 0;
        next_mini_block_id += 1;
    }
    Ok(())
}

#[cfg(test)]
mod tests {
    use super::*;

    /// `select_u64` returns the position of the n-th set bit.
    #[test]
    fn test_select_bitvec() {
        // (bitvec, rank, expected position)
        let cases: [(u64, u16, u16); 6] = [
            (1u64, 0, 0),
            (2u64, 0, 1),
            (4u64, 0, 2),
            (8u64, 0, 3),
            (1 | 8u64, 0, 0),
            (1 | 8u64, 1, 3),
        ];
        for (bitvec, rank, expected) in cases {
            assert_eq!(select_u64(bitvec, rank), expected);
        }
    }

    /// With every bit set, the rank of an element is the element itself.
    #[test]
    fn test_count_ones() {
        for el in 0u16..64u16 {
            assert_eq!(rank_u64(u64::MAX, el), el);
        }
    }

    /// Pins the size of a serialized dense block.
    #[test]
    fn test_dense() {
        assert_eq!(DENSE_BLOCK_NUM_BYTES, 10_240);
    }
}


================================================
FILE: columnar/src/column_index/optional_index/set_block/mod.rs
================================================
mod dense;
mod sparse;

pub use dense::{DENSE_BLOCK_NUM_BYTES, DenseBlock, DenseBlockCodec};
pub use sparse::{SparseBlock, SparseBlockCodec};

#[cfg(test)]
mod tests;


================================================
FILE: columnar/src/column_index/optional_index/set_block/sparse.rs
================================================
use crate::column_index::optional_index::{SelectCursor, Set, SetCodec};

/// Codec storing a set of `u16` as the plain list of its elements.
pub struct SparseBlockCodec;

impl SetCodec for SparseBlockCodec {
    type Item = u16;
    type Reader<'a> = SparseBlock<'a>;

    /// Writes every element as 2 little-endian bytes, in iteration order.
    fn serialize(
        els: impl Iterator<Item = u16>,
        mut wrt: impl std::io::Write,
    ) -> std::io::Result<()> {
        for el_bytes in els.map(u16::to_le_bytes) {
            wrt.write_all(&el_bytes)?;
        }
        Ok(())
    }

    /// Wraps `data` into a `SparseBlock` reader without copying or validating it.
    fn open(data: &[u8]) -> Self::Reader<'_> {
        SparseBlock(data)
    }
}

/// Read-only view over a sparse block: consecutive little-endian `u16` elements.
#[derive(Copy, Clone)]
pub struct SparseBlock<'a>(&'a [u8]);

impl<'a> SelectCursor<u16> for SparseBlock<'a> {
    /// Stateless cursor: simply forwards to `Set::select`.
    #[inline]
    fn select(&mut self, rank: u16) -> u16 {
        <Self as Set<u16>>::select(self, rank)
    }
}

impl Set<u16> for SparseBlock<'_> {
    type SelectCursor<'b>
        = Self
    where Self: 'b;

    /// Returns whether `el` is found by the binary search over the stored elements.
    #[inline(always)]
    fn contains(&self, el: u16) -> bool {
        matches!(self.binary_search(el), Ok(_))
    }

    /// Returns the position of `el` among the stored elements, or `None` if it is absent.
    #[inline(always)]
    fn rank_if_exists(&self, el: u16) -> Option<u16> {
        match self.binary_search(el) {
            Ok(position) => Some(position),
            Err(_) => None,
        }
    }

    /// Returns the position of `el` if it is stored, and otherwise the position at which the
    /// binary search ended.
    #[inline(always)]
    fn rank(&self, el: u16) -> u16 {
        match self.binary_search(el) {
            Ok(position) | Err(position) => position,
        }
    }

    /// Reads the element stored at position `rank`.
    ///
    /// # Panics
    ///
    /// Panics if `rank` is out of bounds.
    #[inline(always)]
    fn select(&self, rank: u16) -> u16 {
        let start = rank as usize * 2;
        let element_bytes: [u8; 2] = self.0[start..start + 2].try_into().unwrap();
        u16::from_le_bytes(element_bytes)
    }

    /// The block is its own (stateless) select cursor.
    #[inline(always)]
    fn select_cursor(&self) -> Self::SelectCursor<'_> {
        *self
    }
}

/// Reads the little-endian `u16` stored in `data` at `byte_position..byte_position + 2`.
///
/// # Panics
///
/// Panics if that range is out of bounds.
#[inline(always)]
fn get_u16(data: &[u8], byte_position: usize) -> u16 {
    let end = byte_position + 2;
    let mut raw = [0u8; 2];
    raw.copy_from_slice(&data[byte_position..end]);
    u16::from_le_bytes(raw)
}

impl SparseBlock<'_> {
    /// Reads the element stored at position `idx` of `data`.
    #[inline(always)]
    fn value_at_idx(&self, data: &[u8], idx: u16) -> u16 {
        get_u16(data, idx as usize * 2)
    }

    /// Number of elements in the block (2 bytes per element).
    #[inline]
    fn num_vals(&self) -> u16 {
        let num_bytes = self.0.len();
        (num_bytes / 2) as u16
    }

    /// Looks for `target` in the block.
    ///
    /// Returns `Ok(position)` if it is found, and otherwise `Err(position)` with the position
    /// at which the search ended.
    #[inline]
    #[expect(clippy::comparison_chain)]
    fn binary_search(&self, target: u16) -> Result<u16, u16> {
        let data: &[u8] = self.0;
        let mut lo = 0u16;
        let mut hi = self.num_vals();
        // TODO try different implem.
        //  e.g. exponential search into binary search
        while lo < hi {
            let mid = lo + (hi - lo) / 2;

            // TODO do boundary check only once, and then use an
            // unsafe `value_at_idx`
            let mid_val = self.value_at_idx(data, mid);

            if target > mid_val {
                lo = mid + 1;
            } else if target < mid_val {
                hi = mid;
            } else {
                return Ok(mid);
            }
        }
        Err(lo)
    }
}


================================================
FILE: columnar/src/column_index/optional_index/set_block/tests.rs
================================================
use std::collections::HashMap;

use crate::column_index::optional_index::set_block::dense::DENSE_BLOCK_NUM_BYTES;
use crate::column_index::optional_index::set_block::{DenseBlockCodec, SparseBlockCodec};
use crate::column_index::optional_index::{SelectCursor, Set, SetCodec};

/// Serializes `vals` with the codec `C`, reopens the result, and checks `contains`,
/// `rank_if_exists`, `rank` and `select` against a straightforward model for every `u16`.
///
/// Returns the number of bytes of the serialized set.
fn test_set_helper<C: SetCodec<Item = u16>>(vals: &[u16]) -> usize {
    let mut buffer = Vec::new();
    C::serialize(vals.iter().copied(), &mut buffer).unwrap();
    let tested_set = C::open(buffer.as_slice());
    let hash_set: HashMap<C::Item, C::Item> = vals
        .iter()
        .copied()
        .enumerate()
        .map(|(ord, val)| (val, C::Item::try_from(ord).ok().unwrap()))
        .collect();
    // Expected rank of the probed value: the length of the leading run of `vals` that is
    // strictly lower than it. Probed values only grow, so this run only grows too and can be
    // tracked incrementally instead of being rescanned for each of the 65,536 probes.
    let mut num_leading_smaller = 0usize;
    for val in 0u16..=u16::MAX {
        while num_leading_smaller < vals.len() && vals[num_leading_smaller] < val {
            num_leading_smaller += 1;
        }
        assert_eq!(tested_set.contains(val), hash_set.contains_key(&val));
        assert_eq!(tested_set.rank_if_exists(val), hash_set.get(&val).copied());
        assert_eq!(tested_set.rank(val), num_leading_smaller as u16);
    }
    for (rank, val) in vals.iter().enumerate() {
        assert_eq!(tested_set.select(rank as u16), *val);
    }
    buffer.len()
}

/// An empty set still serializes to a full-size dense block.
#[test]
fn test_dense_block_set_u16_empty() {
    let no_vals: [u16; 0] = [];
    let serialized_len = test_set_helper::<DenseBlockCodec>(&no_vals);
    assert_eq!(serialized_len, DENSE_BLOCK_NUM_BYTES as usize);
}

/// A set holding only the largest element serializes to a full-size dense block.
#[test]
fn test_dense_block_set_u16_max() {
    let only_max = [u16::MAX];
    let serialized_len = test_set_helper::<DenseBlockCodec>(&only_max);
    assert_eq!(serialized_len, DENSE_BLOCK_NUM_BYTES as usize);
}

/// An empty set serializes to nothing with the sparse codec.
#[test]
fn test_sparse_block_set_u16_empty() {
    let no_vals: [u16; 0] = [];
    let serialized_len = test_set_helper::<SparseBlockCodec>(&no_vals);
    assert_eq!(serialized_len, 0);
}

/// A single element takes 2 bytes with the sparse codec.
#[test]
fn test_sparse_block_set_u16_max() {
    let only_max = [u16::MAX];
    let serialized_len = test_set_helper::<SparseBlockCodec>(&only_max);
    assert_eq!(serialized_len, 2);
}

use proptest::prelude::*;

proptest! {
    // A single case: `test_set_helper` probes the whole `u16` range on every run.
    #![proptest_config(ProptestConfig::with_cases(1))]
    #[test]
    fn test_prop_test_dense(els in proptest::collection::btree_set(0..=u16::MAX, 0..=u16::MAX as usize)) {
        // A `BTreeSet` iterates in increasing order.
        let sorted_vals: Vec<u16> = els.iter().copied().collect();
        let serialized_len = test_set_helper::<DenseBlockCodec>(&sorted_vals);
        assert_eq!(serialized_len, DENSE_BLOCK_NUM_BYTES as usize);
    }

    #[test]
    fn test_prop_test_sparse(els in proptest::collection::btree_set(0..=u16::MAX, 0..=u16::MAX as usize)) {
        // A `BTreeSet` iterates in increasing order.
        let sorted_vals: Vec<u16> = els.iter().copied().collect();
        let serialized_len = test_set_helper::<SparseBlockCodec>(&sorted_vals);
        assert_eq!(serialized_len, sorted_vals.len() * 2);
    }
}

/// The select cursor of a dense block maps the first ranks back to the original elements.
#[test]
fn test_simple_translate_codec_codec_idx_to_original_idx_dense() {
    let els: [u16; 6] = [1, 3, 17, 32, 30_000, 30_001];
    let mut buffer = Vec::new();
    DenseBlockCodec::serialize(els.iter().copied(), &mut buffer).unwrap();
    let tested_set = DenseBlockCodec::open(buffer.as_slice());
    assert!(tested_set.contains(1));
    let mut select_cursor = tested_set.select_cursor();
    // Only the first three ranks are checked.
    for (rank, expected) in els.iter().copied().enumerate().take(3) {
        assert_eq!(select_cursor.select(rank as u16), expected);
    }
}

/// The select cursor of a sparse block maps ranks back to the original elements.
#[test]
fn test_simple_translate_codec_idx_to_original_idx_sparse() {
    let els: [u16; 3] = [1, 3, 17];
    let mut buffer = Vec::new();
    SparseBlockCodec::serialize(els.iter().copied(), &mut buffer).unwrap();
    let tested_set = SparseBlockCodec::open(buffer.as_slice());
    assert!(tested_set.contains(1));
    let mut select_cursor = tested_set.select_cursor();
    // `SparseBlock` is both a `Set` and a `SelectCursor`: name the trait explicitly.
    for (rank, expected) in els.iter().copied().enumerate() {
        assert_eq!(SelectCursor::select(&mut select_cursor, rank as u16), expected);
    }
}

/// With the elements `0..150` all present, `select(rank)` is the identity.
#[test]
fn test_simple_translate_codec_idx_to_original_idx_dense() {
    let mut buffer = Vec::new();
    DenseBlockCodec::serialize(0u16..150u16, &mut buffer).unwrap();
    let tested_set = DenseBlockCodec::open(buffer.as_slice());
    assert!(tested_set.contains(1));
    let mut select_cursor = tested_set.select_cursor();
    for rank in 0u16..150u16 {
        let selected = select_cursor.select(rank);
        assert_eq!(rank, selected);
    }
}

/// Checks `rank` and `rank_if_exists` on a dense block holding the elements 1 and 10.
#[test]
fn test_simple_translate_idx_to_value_idx_dense() {
    let els: [u16; 2] = [1, 10];
    let mut buffer = Vec::new();
    DenseBlockCodec::serialize(els.iter().copied(), &mut buffer).unwrap();
    let tested_set = DenseBlockCodec::open(buffer.as_slice());
    assert!(tested_set.contains(1));
    assert!(!tested_set.contains(2));
    // Everything up to the first element has rank 0.
    for el in 0..=1 {
        assert_eq!(tested_set.rank(el), 0);
    }
    for missing_el in 2..10 {
        // elements that don't exist get the rank of the next existing one
        assert_eq!(tested_set.rank_if_exists(missing_el), None);
        assert_eq!(tested_set.rank(missing_el), 1);
    }
    assert_eq!(tested_set.rank(10), 1);
}

/// Checks `rank`, `rank_if_exists` and `select` on a sparse block holding 1 and 10.
#[test]
fn test_simple_translate_idx_to_value_idx_sparse() {
    let els: [u16; 2] = [1, 10];
    let mut buffer = Vec::new();
    SparseBlockCodec::serialize(els.iter().copied(), &mut buffer).unwrap();
    let tested_set = SparseBlockCodec::open(buffer.as_slice());
    assert!(tested_set.contains(1));
    assert!(!tested_set.contains(2));
    // Everything up to the first element has rank 0, which selects the first element.
    for el in 0..=1 {
        assert_eq!(tested_set.rank(el), 0);
        assert_eq!(tested_set.select(tested_set.rank(el)), 1);
    }
    for missing_el in 2..10 {
        // elements that don't exist get the rank of the next existing one
        assert_eq!(tested_set.rank_if_exists(missing_el), None);
        assert_eq!(tested_set.rank(missing_el), 1);
        assert_eq!(tested_set.select(tested_set.rank(missing_el)), 10);
    }
    assert_eq!(tested_set.rank(10), 1);
    assert_eq!(tested_set.select(tested_set.rank(10)), 10);
}


================================================
FILE: columnar/src/column_index/optional_index/tests.rs
================================================
use proptest::prelude::*;
use proptest::{prop_oneof, proptest};

use super::*;
use crate::{ColumnarReader, ColumnarWriter, DynamicColumnHandle};

/// Regression test for a panic in `docid_range_to_rowids` when `docid == num_docs`,
/// exercised right around the block boundary.
#[test]
fn test_optional_index_bug_2293() {
    let num_docs_around_block_boundary = [
        ELEMENTS_PER_BLOCK - 1,
        ELEMENTS_PER_BLOCK,
        ELEMENTS_PER_BLOCK + 1,
    ];
    for num_docs in num_docs_around_block_boundary {
        test_optional_index_with_num_docs(num_docs);
    }
}
/// Writes a columnar with a single `score` value and `num_docs` rows, reopens it, and calls
/// `docid_range_to_rowids` over the whole doc range to check that it does not panic.
fn test_optional_index_with_num_docs(num_docs: u32) {
    let mut columnar_writer = ColumnarWriter::default();
    columnar_writer.record_numerical(100, "score", 80i64);
    let mut serialized: Vec<u8> = Vec::new();
    columnar_writer.serialize(num_docs, &mut serialized).unwrap();

    let columnar_reader = ColumnarReader::open(serialized).unwrap();
    assert_eq!(columnar_reader.num_columns(), 1);
    let score_columns: Vec<DynamicColumnHandle> = columnar_reader.read_columns("score").unwrap();
    assert_eq!(score_columns.len(), 1);

    let score_column = score_columns[0].open().unwrap();
    score_column
        .column_index()
        .docid_range_to_rowids(0..num_docs);
}

/// Pins the value of `DENSE_BLOCK_THRESHOLD`.
#[test]
fn test_dense_block_threshold() {
    let expected_threshold = 5_120;
    assert_eq!(super::DENSE_BLOCK_THRESHOLD, expected_threshold);
}

fn random_bitvec() -> BoxedStrategy<Vec<bool>> {
    prop_oneof![
        1 => prop::collection::vec(proptest::bool::weighted(1.0), 0..100),
        1 => prop::collection::vec(proptest::bool::weighted(0.00), 0..(ELEMENTS_PER_BLOCK as usize * 3)), // empty blocks
        1 => prop::collection::vec(proptest::bool::weighted(1.00), 0..(ELEMENTS_PER_BLOCK as usize + 10)), // full block
        1 => prop::collection::vec(proptest::bool::weighted(0.01), 0..100),
        1 => prop::collection::vec(proptest::bool::weighted(0.01), 0..u16::MAX as usize),
        8 => vec![any::<bool>()],
    ]
    .boxed()
}

proptest! {
    #![proptest_config(ProptestConfig::with_cases(50))]
    #[test]
    fn test_with_random_bitvecs(bitvec1 in random_bitvec(), bitvec2 in random_bitvec(), bitvec3 in random_bitvec()) {
        // Glue the three generated bit vectors together, in order.
        let bitvec: Vec<bool> = [bitvec1, bitvec2, bitvec3].concat();
        test_null_index(&bitvec[..]);
    }
}

/// With the rows `10..2 * ELEMENTS_PER_BLOCK` all set, the element of rank `r` is `r + 10`.
/// Checked for the rank 65_472.
#[test]
fn test_with_random_sets_simple() {
    let vals = 10..ELEMENTS_PER_BLOCK * 2;
    let mut out: Vec<u8> = Vec::new();
    serialize_optional_index(&vals, 100, &mut out).unwrap();
    let null_index = open_optional_index(OwnedBytes::new(out)).unwrap();
    let mut select_cursor = null_index.select_cursor();
    for rank in 65_472u32..65_473u32 {
        let expected_el = rank + 10;
        assert_eq!(select_cursor.select(rank), expected_el);
    }
}

/// A single row without value.
#[test]
fn test_optional_index_trailing_empty_blocks() {
    let single_unset_row = [false];
    test_null_index(&single_unset_row);
}

/// A whole block of rows without value, followed by one row with a value.
#[test]
fn test_optional_index_one_block_false() {
    let mut bits = vec![false; ELEMENTS_PER_BLOCK as usize];
    bits.push(true);
    test_null_index(&bits);
}

/// A whole block of rows with a value, followed by one more row with a value.
#[test]
fn test_optional_index_one_block_true() {
    let mut bits = vec![true; ELEMENTS_PER_BLOCK as usize];
    bits.push(true);
    test_null_index(&bits);
}

/// Test-only adapter: a slice of booleans is iterated as the positions of its `true` entries.
impl<'a> Iterable<RowId> for &'a [bool] {
    fn boxed_iter(&self) -> Box<dyn Iterator<Item = RowId> + 'a> {
        let set_positions = self
            .iter()
            .enumerate()
            .filter_map(|(pos, &is_set)| is_set.then_some(pos as u32));
        Box::new(set_positions)
    }
}

/// Serializes `data` as an optional index (row `i` has a value iff `data[i]` is `true`),
/// reopens it, and checks `select`, `rank_if_exists` and `contains` against `data`.
fn test_null_index(data: &[bool]) {
    let mut out: Vec<u8> = Vec::new();
    serialize_optional_index(&data, data.len() as RowId, &mut out).unwrap();
    let null_index = open_optional_index(OwnedBytes::new(out)).unwrap();
    let orig_idx_with_value: Vec<u32> = data
        .iter()
        .enumerate()
        .filter_map(|(pos, &has_value)| has_value.then_some(pos as u32))
        .collect();

    // Every rank selects the matching original row.
    let mut select_iter = null_index.select_cursor();
    for (rank, &expected_row) in orig_idx_with_value.iter().enumerate() {
        assert_eq!(select_iter.select(rank as u32), expected_row);
    }

    // About 100 samples of rows with a value.
    let rank_step = (orig_idx_with_value.len() / 100).max(1);
    for (rank, &row) in orig_idx_with_value.iter().enumerate().step_by(rank_step) {
        assert_eq!(null_index.rank_if_exists(row), Some(rank as u32));
    }

    // 100 samples
    let row_step = (data.len() / 100).max(1);
    for (row, &has_value) in data.iter().enumerate().step_by(row_step) {
        assert_eq!(null_index.contains(row as u32), has_value);
    }
}

/// The select cursor maps ranks back to row ids.
#[test]
fn test_optional_index_test_translation() {
    let row_ids = [0, 2];
    let optional_index = OptionalIndex::for_test(4, &row_ids);
    let mut select_cursor = optional_index.select_cursor();
    for (rank, expected_row) in row_ids.iter().copied().enumerate() {
        assert_eq!(select_cursor.select(rank as u32), expected_row);
    }
}

/// `rank_if_exists` maps row ids with a value to their rank.
#[test]
fn test_optional_index_translate() {
    let row_ids = [0, 2];
    let optional_index = OptionalIndex::for_test(4, &row_ids);
    for (rank, row_id) in row_ids.iter().copied().enumerate() {
        assert_eq!(optional_index.rank_if_exists(row_id), Some(rank as u32));
    }
}

/// `contains` on a 4-row index whose rows 0 and 2 have a value.
#[test]
fn test_optional_index_small() {
    let optional_index = OptionalIndex::for_test(4, &[0, 2]);
    for row_with_value in [0, 2] {
        assert!(optional_index.contains(row_with_value));
    }
    for row_without_value in [1, 3] {
        assert!(!optional_index.contains(row_without_value));
    }
}

/// `contains` on an index whose only values are the first two rows of the second block.
#[test]
fn test_optional_index_large() {
    let rows_with_value = [ELEMENTS_PER_BLOCK, ELEMENTS_PER_BLOCK + 1];
    let optional_index = OptionalIndex::for_test(ELEMENTS_PER_BLOCK + 2, &rows_with_value);
    for row_without_value in [0, 100, ELEMENTS_PER_BLOCK - 1] {
        assert!(!optional_index.contains(row_without_value));
    }
    for row_with_value in rows_with_value {
        assert!(optional_index.contains(row_with_value));
    }
}

/// Builds an index of `num_rows` rows with values at `row_ids`, then checks `num_docs` and
/// that `iter_non_null_docs` yields exactly `row_ids`, in order.
fn test_optional_index_iter_aux(row_ids: &[RowId], num_rows: RowId) {
    let optional_index = OptionalIndex::for_test(num_rows, row_ids);
    assert_eq!(optional_index.num_docs(), num_rows);
    let non_null_docs = optional_index.iter_non_null_docs();
    assert!(non_null_docs.eq(row_ids.iter().copied()));
}

/// Iterating over an index without any row.
#[test]
fn test_optional_index_iter_empty() {
    let no_rows: [RowId; 0] = [];
    test_optional_index_iter_aux(&no_rows, 0u32);
}

/// Builds an index with values at `row_ids` (and just enough rows to hold the last one), then
/// checks `rank` and `rank_if_exists` on every value and on its direct neighbours.
fn test_optional_index_rank_aux(row_ids: &[RowId]) {
    let num_rows = row_ids.last().copied().unwrap_or(0u32) + 1;
    let null_index = OptionalIndex::for_test(num_rows, row_ids);
    assert_eq!(null_index.num_docs(), num_rows);
    for (rank, row_val) in row_ids.iter().copied().enumerate() {
        let rank = rank as u32;
        assert_eq!(null_index.rank(row_val), rank);
        assert_eq!(null_index.rank_if_exists(row_val), Some(rank));
        // A missing row right before `row_val` shares its rank.
        if row_val > 0 && !null_index.contains(row_val - 1) {
            assert_eq!(null_index.rank(row_val - 1), rank);
        }
        assert_eq!(null_index.rank(row_val + 1), rank + 1);
    }
}

/// Rank checks on tiny indexes and on one lone value followed by `ELEMENTS_PER_BLOCK`
/// consecutive values.
#[test]
fn test_optional_index_rank() {
    test_optional_index_rank_aux(&[1u32]);
    test_optional_index_rank_aux(&[0u32, 1u32]);
    let consecutive_rows = (0..ELEMENTS_PER_BLOCK).map(|i| i + ELEMENTS_PER_BLOCK + 1);
    let block: Vec<u32> = std::iter::once(3u32).chain(consecutive_rows).collect();
    test_optional_index_rank_aux(&block);
}

/// Iterating over indexes holding a single value.
#[test]
fn test_optional_index_iter_empty_one() {
    let cases: [(RowId, RowId); 2] = [(1, 2u32), (100_000, 200_000u32)];
    for (row_id, num_rows) in cases {
        test_optional_index_iter_aux(&[row_id], num_rows);
    }
}

/// Iterating over one lone value followed by `ELEMENTS_PER_BLOCK` consecutive values.
#[test]
fn test_optional_index_iter_dense_block() {
    let consecutive_rows = (0..ELEMENTS_PER_BLOCK).map(|i| i + ELEMENTS_PER_BLOCK + 1);
    let block: Vec<u32> = std::iter::once(3u32).chain(consecutive_rows).collect();
    test_optional_index_iter_aux(&block, 3 * ELEMENTS_PER_BLOCK);
}

/// Sanity check of the `OptionalIndex::for_test` constructor.
#[test]
fn test_optional_index_for_tests() {
    let optional_index = OptionalIndex::for_test(4, &[1, 2]);
    for row_without_value in [0, 3] {
        assert!(!optional_index.contains(row_without_value));
    }
    for row_with_value in [1, 2] {
        assert!(optional_index.contains(row_with_value));
    }
    assert_eq!(optional_index.num_docs(), 4);
}


================================================
FILE: columnar/src/column_index/serialize.rs
================================================
use std::io;
use std::io::Write;

use common::{CountingWriter, OwnedBytes};

use super::OptionalIndex;
use super::multivalued_index::SerializableMultivalueIndex;
use crate::column_index::ColumnIndex;
use crate::column_index::multivalued_index::serialize_multivalued_index;
use crate::column_index::optional_index::serialize_optional_index;
use crate::iterable::Iterable;
use crate::{Cardinality, RowId, Version};

/// Everything needed to serialize an optional index.
pub struct SerializableOptionalIndex<'a> {
    /// Iterable over the ids of the rows that are not null.
    pub non_null_row_ids: Box<dyn Iterable<RowId> + 'a>,
    /// Number of rows of the index.
    pub num_rows: RowId,
}

impl<'a> From<&'a OptionalIndex> for SerializableOptionalIndex<'a> {
    /// Borrows an opened `OptionalIndex` so that it can be serialized again.
    fn from(optional_index: &'a OptionalIndex) -> Self {
        let non_null_row_ids: Box<dyn Iterable<RowId> + 'a> = Box::new(optional_index);
        let num_rows = optional_index.num_docs();
        Self {
            non_null_row_ids,
            num_rows,
        }
    }
}

/// A column index ready to be serialized, one variant per cardinality.
pub enum SerializableColumnIndex<'a> {
    /// Nothing is stored besides the cardinality code.
    Full,
    /// Serialized as an optional index.
    Optional(SerializableOptionalIndex<'a>),
    /// Serialized as a multivalued index.
    Multivalued(SerializableMultivalueIndex<'a>),
}

impl SerializableColumnIndex<'_> {
    /// Returns the cardinality matching the variant.
    pub fn get_cardinality(&self) -> Cardinality {
        match self {
            Self::Full => Cardinality::Full,
            Self::Optional(_) => Cardinality::Optional,
            Self::Multivalued(_) => Cardinality::Multivalued,
        }
    }
}

/// Serializes a column index.
///
/// Writes one byte holding the cardinality code, followed by the payload of the index (none
/// for a full column). Returns the number of bytes written, as a `u32`.
pub fn serialize_column_index(
    column_index: SerializableColumnIndex,
    output: &mut impl Write,
) -> io::Result<u32> {
    let mut counting_writer = CountingWriter::wrap(output);
    let cardinality_code = column_index.get_cardinality().to_code();
    counting_writer.write_all(&[cardinality_code])?;
    match column_index {
        SerializableColumnIndex::Full => {}
        SerializableColumnIndex::Optional(optional_index) => {
            let SerializableOptionalIndex {
                non_null_row_ids,
                num_rows,
            } = optional_index;
            serialize_optional_index(non_null_row_ids.as_ref(), num_rows, &mut counting_writer)?;
        }
        SerializableColumnIndex::Multivalued(multivalued_index) => {
            serialize_multivalued_index(&multivalued_index, &mut counting_writer)?;
        }
    }
    Ok(counting_writer.written_bytes() as u32)
}

/// Opens a serialized column index.
///
/// The first byte is the cardinality code; the remaining bytes are handed over to the reader
/// matching that cardinality.
///
/// # Errors
///
/// Returns an `UnexpectedEof` error if `bytes` is empty, and forwards the errors raised while
/// decoding the cardinality code or opening the underlying index.
pub fn open_column_index(
    mut bytes: OwnedBytes,
    format_version: Version,
) -> io::Result<ColumnIndex> {
    if bytes.is_empty() {
        let empty_buffer_error = io::Error::new(
            io::ErrorKind::UnexpectedEof,
            "Failed to deserialize column index. Empty buffer.",
        );
        return Err(empty_buffer_error);
    }
    let cardinality = Cardinality::try_from_code(bytes[0])?;
    bytes.advance(1);
    let column_index = match cardinality {
        Cardinality::Full => ColumnIndex::Full,
        Cardinality::Optional => {
            ColumnIndex::Optional(super::optional_index::open_optional_index(bytes)?)
        }
        Cardinality::Multivalued => ColumnIndex::Multivalued(
            super::multivalued_index::open_multivalued_index(bytes, format_version)?,
        ),
    };
    Ok(column_index)
}

// TODO unit tests


================================================
FILE: columnar/src/column_values/merge.rs
================================================
use std::fmt::Debug;
use std::sync::Arc;

use crate::iterable::Iterable;
use crate::{ColumnIndex, ColumnValues, MergeRowOrder};

/// Values of a column resulting from the merge of several columns, exposed as an `Iterable`.
pub(crate) struct MergedColumnValues<'a, T> {
    /// Column index of each input, addressed by segment ordinal.
    pub(crate) column_indexes: &'a [ColumnIndex],
    /// Values of each input, addressed by segment ordinal. `None` entries yield no value.
    pub(crate) column_values: &'a [Option<Arc<dyn ColumnValues<T>>>],
    /// Order in which the rows of the inputs are laid out in the merged column.
    pub(crate) merge_row_order: &'a MergeRowOrder,
}

impl<T: Copy + PartialOrd + Debug + 'static> Iterable<T> for MergedColumnValues<'_, T> {
    /// Iterates over the merged values.
    ///
    /// - `Stack`: the values of each input are chained one after the other, in input order.
    /// - `Shuffled`: for every row address of the new-to-old mapping, the values attached to
    ///   that row in its input are emitted.
    fn boxed_iter(&self) -> Box<dyn Iterator<Item = T> + '_> {
        match self.merge_row_order {
            MergeRowOrder::Stack(_) => {
                let stacked_values = self
                    .column_values
                    .iter()
                    .flatten()
                    .flat_map(|column_value| column_value.iter());
                Box::new(stacked_values)
            }
            MergeRowOrder::Shuffled(shuffle_merge_order) => {
                let value_ranges = shuffle_merge_order
                    .iter_new_to_old_row_addrs()
                    .filter_map(|row_addr| {
                        let segment_ord = row_addr.segment_ord as usize;
                        let column_index = &self.column_indexes[segment_ord];
                        let column_values = self.column_values[segment_ord].as_ref()?;
                        let value_range = column_index.value_row_ids(row_addr.row_id);
                        Some((value_range, column_values))
                    });
                let shuffled_values = value_ranges.flat_map(|(value_range, column_values)| {
                    value_range
                        .into_iter()
                        .map(|val| column_values.get_val(val))
                });
                Box::new(shuffled_values)
            }
        }
    }
}


================================================
FILE: columnar/src/column_values/mod.rs
================================================
#![warn(missing_docs)]

//! # `fastfield_codecs`
//!
//! - Columnar storage of data for tantivy [`crate::Column`].
//! - Encode data in different codecs.
//! - Monotonically map values to u64/u128

use std::fmt::Debug;
use std::ops::{Range, RangeInclusive};
use std::sync::Arc;

use downcast_rs::DowncastSync;
pub use monotonic_mapping::{MonotonicallyMappableToU64, StrictlyMonotonicFn};
pub use monotonic_mapping_u128::MonotonicallyMappableToU128;

mod merge;
pub(crate) mod monotonic_mapping;
pub(crate) mod monotonic_mapping_u128;
mod stats;
mod u128_based;
mod u64_based;
mod vec_column;

mod monotonic_column;

pub(crate) use merge::MergedColumnValues;
pub use stats::ColumnStats;
pub use u64_based::{
    ALL_U64_CODEC_TYPES, CodecType, load_u64_based_column_values,
    serialize_and_load_u64_based_column_values, serialize_u64_based_column_values,
};
pub use u128_based::{
    CompactHit, CompactSpaceU64Accessor, open_u128_as_compact_u64, open_u128_mapped,
    serialize_column_values_u128,
};
pub use vec_column::VecColumn;

pub use self::monotonic_column::monotonic_map_column;
use crate::RowId;

/// `ColumnValues` provides access to a dense field column.
///
/// A `Column` is just a wrapper over a `ColumnValues` and a `ColumnIndex`.
///
/// Any method that has both a default and a specialized implementation needs to be called in
/// the wrappers that implement the trait (`Arc` and `MonotonicMappingColumn`); otherwise the
/// wrapper falls back to the default implementation below.
pub trait ColumnValues<T: PartialOrd = u64>: Send + Sync + DowncastSync {
    /// Returns the value associated with the given idx.
    ///
    /// This accessor should return as fast as possible.
    ///
    /// # Panics
    ///
    /// May panic if `idx` is greater than the column length.
    fn get_val(&self, idx: u32) -> T;

    /// Allows to push down multiple fetch calls, to avoid dynamic dispatch overhead.
    ///
    /// `output[i]` receives the value stored at `indexes[i]`.
    ///
    /// # Panics
    ///
    /// Panics if `indexes` and `output` do not have the same length.
    /// May panic if any index is greater than the column length.
    fn get_vals(&self, indexes: &[u32], output: &mut [T]) {
        assert!(indexes.len() == output.len());
        // Process the bulk of the input four values at a time.
        let out_and_idx_chunks = output.chunks_exact_mut(4).zip(indexes.chunks_exact(4));
        for (out_x4, idx_x4) in out_and_idx_chunks {
            out_x4[0] = self.get_val(idx_x4[0]);
            out_x4[1] = self.get_val(idx_x4[1]);
            out_x4[2] = self.get_val(idx_x4[2]);
            out_x4[3] = self.get_val(idx_x4[3]);
        }

        // Handle the (at most three) trailing values that did not fill a chunk of four.
        let out_and_idx_chunks = output
            .chunks_exact_mut(4)
            .into_remainder()
            .iter_mut()
            .zip(indexes.chunks_exact(4).remainder());
        for (out, idx) in out_and_idx_chunks {
            *out = self.get_val(*idx);
        }
    }

    /// Allows to push down multiple fetch calls, to avoid dynamic dispatch overhead.
    /// The slightly weird `Option<T>` in output allows pushdown to full columns.
    ///
    /// `output[i]` receives `Some(value stored at indexes[i])`.
    ///
    /// # Panics
    ///
    /// Panics if `indexes` and `output` do not have the same length.
    /// May panic if any index is greater than the column length.
    fn get_vals_opt(&self, indexes: &[u32], output: &mut [Option<T>]) {
        assert!(indexes.len() == output.len());
        // Process the bulk of the input four values at a time.
        let out_and_idx_chunks = output.chunks_exact_mut(4).zip(indexes.chunks_exact(4));
        for (out_x4, idx_x4) in out_and_idx_chunks {
            out_x4[0] = Some(self.get_val(idx_x4[0]));
            out_x4[1] = Some(self.get_val(idx_x4[1]));
            out_x4[2] = Some(self.get_val(idx_x4[2]));
            out_x4[3] = Some(self.get_val(idx_x4[3]));
        }
        // Handle the (at most three) trailing values that did not fill a chunk of four.
        let out_and_idx_chunks = output
            .chunks_exact_mut(4)
            .into_remainder()
            .iter_mut()
            .zip(indexes.chunks_exact(4).remainder());
        for (out, idx) in out_and_idx_chunks {
            *out = Some(self.get_val(*idx));
        }
    }

    /// Fills an output buffer with the fast field values
    /// associated with the `DocId` going from
    /// `start` to `start + output.len()`.
    ///
    /// # Panics
    ///
    /// Must panic if `start + output.len()` is greater than
    /// the segment's `maxdoc`.
    #[inline(always)]
    fn get_range(&self, start: u64, output: &mut [T]) {
        for (out, idx) in output.iter_mut().zip(start..) {
            // `get_val` addresses values with a `u32`, hence the narrowing cast.
            *out = self.get_val(idx as u32);
        }
    }

    /// Appends to `row_id_hits` the row ids, within `row_id_range`, of the values that are in
    /// the provided value range.
    ///
    /// The end of `row_id_range` is clamped to `num_vals()`.
    ///
    /// Note that position == docid for single value fast fields
    fn get_row_ids_for_value_range(
        &self,
        value_range: RangeInclusive<T>,
        row_id_range: Range<RowId>,
        row_id_hits: &mut Vec<RowId>,
    ) {
        let row_id_range = row_id_range.start..row_id_range.end.min(self.num_vals());
        for idx in row_id_range {
            let val = self.get_val(idx);
            if value_range.contains(&val) {
                row_id_hits.push(idx);
            }
        }
    }

    /// Returns a lower bound for this column of values.
    ///
    /// All values are guaranteed to be greater than or equal to `.min_value()`,
    /// but this value is not necessarily the best boundary value.
    ///
    /// We have
    /// ∀i < self.num_vals(), self.get_val(i) >= self.min_value()
    /// But we don't have necessarily
    /// ∃i < self.num_vals(), self.get_val(i) == self.min_value()
    fn min_value(&self) -> T;

    /// Returns an upper bound for this column of values.
    ///
    /// All values are guaranteed to be lower than or equal to `.max_value()`,
    /// but this value is not necessarily the best boundary value.
    ///
    /// We have
    /// ∀i < self.num_vals(), self.get_val(i) <= self.max_value()
    /// But we don't have necessarily
    /// ∃i < self.num_vals(), self.get_val(i) == self.max_value()
    fn max_value(&self) -> T;

    /// The number of values in the column.
    fn num_vals(&self) -> u32;

    /// Returns an iterator over all the values of the column, in index order.
    fn iter<'a>(&'a self) -> Box<dyn Iterator<Item = T> + 'a> {
        Box::new((0..self.num_vals()).map(|idx| self.get_val(idx)))
    }
}
downcast_rs::impl_downcast!(sync ColumnValues<T> where T: PartialOrd);

/// A column of values that does not hold any value.
pub struct EmptyColumnValues;

impl<T: PartialOrd + Default> ColumnValues<T> for EmptyColumnValues {
    /// Always panics: there is no value to return.
    fn get_val(&self, _idx: u32) -> T {
        panic!("Internal Error: Called get_val of empty column.")
    }

    /// Returns the default value of `T`.
    fn min_value(&self) -> T {
        Default::default()
    }

    /// Returns the default value of `T`.
    fn max_value(&self) -> T {
        Default::default()
    }

    /// An empty column holds zero values.
    fn num_vals(&self) -> u32 {
        0u32
    }
}

/// Forwards every `ColumnValues` method to the column behind the `Arc`.
///
/// Methods that have a default implementation in the trait are forwarded explicitly as well.
/// Without the explicit forwarding, the wrapper would run the trait's default implementation,
/// bypassing any specialized implementation of the wrapped column and going through the trait
/// object once per value instead of once per call.
impl<T: Copy + PartialOrd + Debug + 'static> ColumnValues<T> for Arc<dyn ColumnValues<T>> {
    #[inline(always)]
    fn get_val(&self, idx: u32) -> T {
        self.as_ref().get_val(idx)
    }

    #[inline(always)]
    fn get_vals(&self, indexes: &[u32], output: &mut [T]) {
        self.as_ref().get_vals(indexes, output)
    }

    #[inline(always)]
    fn get_vals_opt(&self, indexes: &[u32], output: &mut [Option<T>]) {
        self.as_ref().get_vals_opt(indexes, output)
    }

    #[inline(always)]
    fn min_value(&self) -> T {
        self.as_ref().min_value()
    }

    #[inline(always)]
    fn max_value(&self) -> T {
        self.as_ref().max_value()
    }

    #[inline(always)]
    fn num_vals(&self) -> u32 {
        self.as_ref().num_vals()
    }

    #[inline(always)]
    fn iter<'b>(&'b self) -> Box<dyn Iterator<Item = T> + 'b> {
        self.as_ref().iter()
    }

    #[inline(always)]
    fn get_range(&self, start: u64, output: &mut [T]) {
        self.as_ref().get_range(start, output)
    }

    #[inline(always)]
    fn get_row_ids_for_value_range(
        &self,
        range: RangeInclusive<T>,
        doc_id_range: Range<u32>,
        positions: &mut Vec<u32>,
    ) {
        self.as_ref()
            .get_row_ids_for_value_range(range, doc_id_range, positions)
    }
}


================================================
FILE: columnar/src/column_values/monotonic_column.rs
================================================
use std::fmt::Debug;
use std::marker::PhantomData;
use std::ops::{Range, RangeInclusive};

use crate::ColumnValues;
use crate::column_values::monotonic_mapping::StrictlyMonotonicFn;

/// A `ColumnValues` view that applies `monotonic_mapping` on top of the values of
/// `from_column`.
///
/// `Input` is the value type of the wrapped column. It is only carried as a marker.
struct MonotonicMappingColumn<C, T, Input> {
    // The wrapped column, yielding `Input` values.
    from_column: C,
    // The mapping applied to every value read from `from_column`.
    monotonic_mapping: T,
    _phantom: PhantomData<Input>,
}

/// Creates a view of a column transformed by a strictly monotonic mapping. See
/// [`StrictlyMonotonicFn`].
///
/// E.g. apply a gcd monotonic_mapping([100, 200, 300]) == [1, 2, 3]
/// monotonic_mapping.mapping() is expected to be injective, and we should always have
/// monotonic_mapping.inverse(monotonic_mapping.mapping(el)) == el
///
/// The inverse of the mapping is required for `ColumnValues::get_row_ids_for_value_range`:
/// the user provides the value range in the output space, and both bounds need to be mapped
/// back with `inverse` before calling the underlying column.
///
/// Note that when opening a codec, the monotonic_mapping should be the inverse of the mapping
/// during serialization. And therefore the monotonic_mapping_inv when opening is the same as
/// monotonic_mapping during serialization.
pub fn monotonic_map_column<C, T, Input, Output>(
    from_column: C,
    monotonic_mapping: T,
) -> impl ColumnValues<Output>
where
    C: ColumnValues<Input> + 'static,
    T: StrictlyMonotonicFn<Input, Output> + Send + Sync + 'static,
    Input: PartialOrd + Debug + Send + Sync + Clone + 'static,
    Output: PartialOrd + Debug + Send + Sync + Clone + 'static,
{
    MonotonicMappingColumn {
        from_column,
        monotonic_mapping,
        _phantom: PhantomData,
    }
}

/// Exposes the wrapped column with `monotonic_mapping.mapping` applied to every value read,
/// and `monotonic_mapping.inverse` applied to every value passed down to the wrapped column.
impl<C, T, Input, Output> ColumnValues<Output> for MonotonicMappingColumn<C, T, Input>
where
    C: ColumnValues<Input> + 'static,
    T: StrictlyMonotonicFn<Input, Output> + Send + Sync + 'static,
    Input: PartialOrd + Send + Debug + Sync + Clone + 'static,
    Output: PartialOrd + Send + Debug + Sync + Clone + 'static,
{
    #[inline(always)]
    fn get_val(&self, idx: u32) -> Output {
        self.monotonic_mapping
            .mapping(self.from_column.get_val(idx))
    }

    fn min_value(&self) -> Output {
        self.monotonic_mapping
            .mapping(self.from_column.min_value())
    }

    fn max_value(&self) -> Output {
        self.monotonic_mapping
            .mapping(self.from_column.max_value())
    }

    fn num_vals(&self) -> u32 {
        self.from_column.num_vals()
    }

    fn iter(&self) -> Box<dyn Iterator<Item = Output> + '_> {
        let source_values = self.from_column.iter();
        Box::new(source_values.map(|el| self.monotonic_mapping.mapping(el)))
    }

    fn get_row_ids_for_value_range(
        &self,
        range: RangeInclusive<Output>,
        doc_id_range: Range<u32>,
        positions: &mut Vec<u32>,
    ) {
        // The requested bounds live in the output space: bring them back into the space of
        // the wrapped column before delegating.
        let lower_bound = self.monotonic_mapping.inverse(range.start().clone());
        let upper_bound = self.monotonic_mapping.inverse(range.end().clone());
        self.from_column.get_row_ids_for_value_range(
            lower_bound..=upper_bound,
            doc_id_range,
            positions,
        )
    }

    // We voluntarily do not implement get_range as it yields a regression,
    // and we do not have any specialized implementation anyway.
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::column_values::VecColumn;
    use crate::column_values::monotonic_mapping::{
        StrictlyMonotonicMappingInverter, StrictlyMonotonicMappingToInternal,
    };

    // Checks that `iter()` on a mapped column yields the same values as `get_val()`.
    #[test]
    fn test_monotonic_mapping_iter() {
        let vals: Vec<u64> = (0..100u64).map(|el| el * 10).collect();
        let col = VecColumn::from(vals);
        let mapped = monotonic_map_column(
            col,
            StrictlyMonotonicMappingInverter::from(StrictlyMonotonicMappingToInternal::<i64>::new()),
        );
        let val_i64s: Vec<u64> = mapped.iter().collect();
        for i in 0..100 {
            assert_eq!(val_i64s[i as usize], mapped.get_val(i));
        }
    }
}


================================================
FILE: columnar/src/column_values/monotonic_mapping.rs
================================================
use std::fmt::Debug;
use std::marker::PhantomData;

use common::DateTime;

use super::MonotonicallyMappableToU128;
use crate::RowId;

/// Monotonically maps a value to the u64 value space.
/// The monotonic mapping enables `PartialOrd` on the u64 space without conversion back to the
/// original space.
pub trait MonotonicallyMappableToU64: 'static + PartialOrd + Debug + Copy + Send + Sync {
    /// Converts a value to u64.
    ///
    /// Internally all fast field values are encoded as u64.
    fn to_u64(self) -> u64;

    /// Converts a value from u64.
    ///
    /// Internally all fast field values are encoded as u64.
    /// **Note: To be used for converting encoded Term, Posting values.**
    fn from_u64(val: u64) -> Self;
}

/// Values need to be strictly monotonically mapped to an `Internal` value (u64 or u128) that
/// can be used in fast field codecs.
///
/// The monotonic mapping is required so that `PartialOrd` can be used on `Internal` without
/// converting to `External`.
///
/// All strictly monotonic functions are invertible because they are guaranteed to have a one-to-one
/// mapping from their range to their domain. The `inverse` method is required when opening a codec,
/// so a value can be converted back to its original domain (e.g. ip address or f64) from its
/// internal representation.
pub trait StrictlyMonotonicFn<External, Internal> {
    /// Strictly monotonically maps the value from External to Internal.
    fn mapping(&self, inp: External) -> Internal;
    /// Inverse of `mapping`. Maps the value from Internal to External.
    fn inverse(&self, out: Internal) -> External;
}

/// Turns a `StrictlyMonotonicFn<A, B>` into a `StrictlyMonotonicFn<B, A>` by swapping its
/// `mapping` and `inverse` functions.
///
/// # Warning
///
/// This type comes with a footgun. A type being strictly monotonic does not impose that the inverse
/// mapping is strictly monotonic over the entire space External. e.g. a -> a * 2. Use at your own
/// risks.
pub(crate) struct StrictlyMonotonicMappingInverter<T> {
    orig_mapping: T,
}

impl<T> From<T> for StrictlyMonotonicMappingInverter<T> {
    /// Wraps `orig_mapping` into its inverted counterpart.
    fn from(orig_mapping: T) -> Self {
        StrictlyMonotonicMappingInverter { orig_mapping }
    }
}

impl<Src, Dst, T> StrictlyMonotonicFn<Dst, Src> for StrictlyMonotonicMappingInverter<T>
where T: StrictlyMonotonicFn<Src, Dst>
{
    /// Applies the `inverse` of the wrapped mapping.
    #[inline(always)]
    fn mapping(&self, val: Dst) -> Src {
        <T as StrictlyMonotonicFn<Src, Dst>>::inverse(&self.orig_mapping, val)
    }

    /// Applies the `mapping` of the wrapped mapping.
    #[inline(always)]
    fn inverse(&self, val: Src) -> Dst {
        <T as StrictlyMonotonicFn<Src, Dst>>::mapping(&self.orig_mapping, val)
    }
}

/// Applies the strictly monotonic mapping from `T` without any additional changes.
pub(crate) struct StrictlyMonotonicMappingToInternal<T> {
    _phantom: PhantomData<T>,
}

impl<T> StrictlyMonotonicMappingToInternal<T> {
    /// Creates the (stateless) mapping.
    pub(crate) fn new() -> StrictlyMonotonicMappingToInternal<T> {
        StrictlyMonotonicMappingToInternal {
            _phantom: PhantomData,
        }
    }
}

/// Mapping to and from the u128 space, relying on [`MonotonicallyMappableToU128`].
impl<External, T> StrictlyMonotonicFn<External, u128> for StrictlyMonotonicMappingToInternal<T>
where
    External: MonotonicallyMappableToU128,
    T: MonotonicallyMappableToU128,
{
    #[inline(always)]
    fn mapping(&self, inp: External) -> u128 {
        inp.to_u128()
    }

    #[inline(always)]
    fn inverse(&self, out: u128) -> External {
        <External as MonotonicallyMappableToU128>::from_u128(out)
    }
}

/// Mapping to and from the u64 space, relying on [`MonotonicallyMappableToU64`].
impl<External, T> StrictlyMonotonicFn<External, u64> for StrictlyMonotonicMappingToInternal<T>
where
    External: MonotonicallyMappableToU64,
    T: MonotonicallyMappableToU64,
{
    #[inline(always)]
    fn mapping(&self, inp: External) -> u64 {
        inp.to_u64()
    }

    #[inline(always)]
    fn inverse(&self, out: u64) -> External {
        <External as MonotonicallyMappableToU64>::from_u64(out)
    }
}

// `u64` is already in the internal space: both directions are the identity.
impl MonotonicallyMappableToU64 for u64 {
    #[inline(always)]
    fn to_u64(self) -> u64 {
        self
    }

    #[inline(always)]
    fn from_u64(val: u64) -> Self {
        val
    }
}

// `i64` values go through `common::i64_to_u64` / `common::u64_to_i64`.
impl MonotonicallyMappableToU64 for i64 {
    #[inline(always)]
    fn to_u64(self) -> u64 {
        common::i64_to_u64(self)
    }

    #[inline(always)]
    fn from_u64(val: u64) -> Self {
        common::u64_to_i64(val)
    }
}

// `DateTime` values are mapped through their nanosecond timestamp (`into_timestamp_nanos` /
// `from_timestamp_nanos`), which is then converted like any other `i64`.
impl MonotonicallyMappableToU64 for DateTime {
    #[inline(always)]
    fn to_u64(self) -> u64 {
        common::i64_to_u64(self.into_timestamp_nanos())
    }

    #[inline(always)]
    fn from_u64(val: u64) -> Self {
        DateTime::from_timestamp_nanos(common::u64_to_i64(val))
    }
}

// `false` maps to 0 and `true` maps to 1. On the way back, any non-zero value is `true`.
impl MonotonicallyMappableToU64 for bool {
    #[inline(always)]
    fn to_u64(self) -> u64 {
        if self { 1 } else { 0 }
    }

    #[inline(always)]
    fn from_u64(val: u64) -> Self {
        val != 0
    }
}

// `RowId` is widened losslessly to u64. The way back uses an `as` cast, which truncates any
// value that does not fit into a `RowId`.
impl MonotonicallyMappableToU64 for RowId {
    #[inline(always)]
    fn to_u64(self) -> u64 {
        u64::from(self)
    }

    #[inline(always)]
    fn from_u64(val: u64) -> RowId {
        val as RowId
    }
}

// TODO remove me.
// Tantivy should refuse NaN values and work with NotNaN internally.
//
// `f64` values go through `common::f64_to_u64` / `common::u64_to_f64`.
impl MonotonicallyMappableToU64 for f64 {
    #[inline(always)]
    fn to_u64(self) -> u64 {
        common::f64_to_u64(self)
    }

    #[inline(always)]
    fn from_u64(val: u64) -> Self {
        common::u64_to_f64(val)
    }
}

#[cfg(test)]
mod tests {

    use super::*;

    // Checks that `inverse(mapping(val)) == val` for the mappings to the internal space.
    #[test]
    fn strictly_monotonic_test() {
        // identity mapping
        test_round_trip(&StrictlyMonotonicMappingToInternal::<u64>::new(), 100u64);
        // round trip to i64
        test_round_trip(&StrictlyMonotonicMappingToInternal::<i64>::new(), 100u64);
        // TODO
        // identity mapping
        // test_round_trip(&StrictlyMonotonicMappingToInternal::<u128>::new(), 100u128);
    }

    // Asserts that mapping `test_val` and then inverting the result gives back `test_val`.
    fn test_round_trip<T: StrictlyMonotonicFn<K, L>, K: std::fmt::Debug + Eq + Copy, L>(
        mapping: &T,
        test_val: K,
    ) {
        assert_eq!(mapping.inverse(mapping.mapping(test_val)), test_val);
    }
}


================================================
FILE: columnar/src/column_values/monotonic_mapping_u128.rs
================================================
use std::fmt::Debug;
use std::net::Ipv6Addr;

/// Monotonically maps a value to the u128 value space.
/// The monotonic mapping enables `PartialOrd` on the u128 space without conversion back to the
/// original space.
pub trait MonotonicallyMappableToU128: 'static + PartialOrd + Copy + Debug + Send + Sync {
    /// Converts a value to its u128 representation.
    fn to_u128(self) -> u128;

    /// Converts a value back from its u128 representation.
    ///
    /// **Note: To be used for converting encoded Term, Posting values.**
    fn from_u128(val: u128) -> Self;
}

// `u128` is already in the internal space: both directions are the identity.
impl MonotonicallyMappableToU128 for u128 {
    fn to_u128(self) -> u128 {
        self
    }

    fn from_u128(val: u128) -> Self {
        val
    }
}

// An IPv6 address is mapped to the u128 formed by its 16 octets, read in big-endian order.
impl MonotonicallyMappableToU128 for Ipv6Addr {
    fn to_u128(self) -> u128 {
        ip_to_u128(self)
    }

    fn from_u128(val: u128) -> Self {
        // `From<u128>` lays the integer out in big-endian order, like `to_be_bytes()` would.
        Ipv6Addr::from(val)
    }
}

/// Converts an IPv6 address into the u128 formed by its 16 octets, read in big-endian order.
fn ip_to_u128(ip_addr: Ipv6Addr) -> u128 {
    u128::from(ip_addr)
}


================================================
FILE: columnar/src/column_values/stats.rs
================================================
use std::io;
use std::io::Write;
use std::num::NonZeroU64;

use common::{BinarySerializable, VInt};

use crate::RowId;

/// Column statistics.
///
/// The serialized form stores `min_value`, `gcd`, the amplitude divided by `gcd`, and
/// `num_rows`; `max_value` is reconstructed when deserializing.
#[derive(Debug, Clone, Eq, PartialEq)]
pub struct ColumnStats {
    /// GCD of the elements `el - min(column)`.
    pub gcd: NonZeroU64,
    /// Minimum value of the column.
    pub min_value: u64,
    /// Maximum value of the column.
    pub max_value: u64,
    /// Number of rows in the column.
    pub num_rows: RowId,
}

impl ColumnStats {
    /// Width of the value range, i.e. `max_value - min_value`.
    pub fn amplitude(&self) -> u64 {
        let Self {
            min_value,
            max_value,
            ..
        } = self;
        max_value - min_value
    }
}

impl BinarySerializable for ColumnStats {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        VInt(self.min_value).serialize(writer)?;
        VInt(self.gcd.get()).serialize(writer)?;
        VInt(self.amplitude() / self.gcd).serialize(writer)?;
        VInt(self.num_rows as u64).serialize(writer)?;
        Ok(())
    }

    fn deserialize<R: io::Read>(reader: &mut R) -> io::Result<Self> {
        let min_value = VInt::deserialize(reader)?.0;
        let gcd = VInt::deserialize(reader)?.0;
        let gcd = NonZeroU64::new(gcd)
            .ok_or_else(|| io::Error::new(io::ErrorKind::InvalidData, "GCD of 0 is forbidden"))?;
        let amplitude = VInt::deserialize(reader)?.0 * gcd.get();
        let max_value = min_value + amplitude;
        let num_rows = VInt::deserialize(reader)?.0 as RowId;
        Ok(ColumnStats {
            min_value,
            max_value,
            num_rows,
            gcd,
        })
    }
}

#[cfg(test)]
mod tests {
    use std::num::NonZeroU64;

    use common::BinarySerializable;

    use crate::column_values::ColumnStats;

    // Serializes `stats`, checks that the output is exactly `num_bytes` long, and checks that
    // deserializing it gives back the same stats.
    #[track_caller]
    fn test_stats_ser_deser_aux(stats: &ColumnStats, num_bytes: usize) {
        let mut buffer: Vec<u8> = Vec::new();
        stats.serialize(&mut buffer).unwrap();
        assert_eq!(buffer.len(), num_bytes);
        let deser_stats = ColumnStats::deserialize(&mut &buffer[..]).unwrap();
        assert_eq!(stats, &deser_stats);
    }

    #[test]
    fn test_stats_serialization() {
        test_stats_ser_deser_aux(
            &(ColumnStats {
                gcd: NonZeroU64::new(3).unwrap(),
                min_value: 1,
                max_value: 3001,
                num_rows: 10,
            }),
            5,
        );
        test_stats_ser_deser_aux(
            &(ColumnStats {
                gcd: NonZeroU64::new(1_000).unwrap(),
                min_value: 1,
                max_value: 3001,
                num_rows: 10,
            }),
            5,
        );
        // Stats of an empty column.
        test_stats_ser_deser_aux(
            &(ColumnStats {
                gcd: NonZeroU64::new(1).unwrap(),
                min_value: 0,
                max_value: 0,
                num_rows: 0,
            }),
            4,
        );
    }
}


================================================
FILE: columnar/src/column_values/u128_based/compact_space/blank_range.rs
================================================
use std::ops::RangeInclusive;

/// An unoccupied range of the value space, i.e. a gap in the data.
///
/// Instances are built with `try_into()` / `try_from()`, which rejects ranges holding fewer
/// than 3 values.
///
/// The ordering of `BlankRange` is the ordering of their sizes.
#[derive(Debug, Eq, PartialEq, Clone)]
pub(crate) struct BlankRange {
    blank_range: RangeInclusive<u128>,
}

impl TryFrom<RangeInclusive<u128>> for BlankRange {
    type Error = &'static str;

    /// Accepts `range` only if `end - start >= 2`. Reversed ranges are rejected as well.
    fn try_from(range: RangeInclusive<u128>) -> Result<Self, Self::Error> {
        // Distance between both bounds; saturates to 0 for a reversed range.
        let distance = range.end().saturating_sub(*range.start());
        if distance >= 2 {
            Ok(BlankRange { blank_range: range })
        } else {
            Err("invalid range")
        }
    }
}

impl BlankRange {
    /// Number of values covered by the blank (both bounds included).
    pub(crate) fn blank_size(&self) -> u128 {
        let (first, last) = (self.blank_range.start(), self.blank_range.end());
        last - first + 1
    }

    /// Returns a copy of the underlying range.
    pub(crate) fn blank_range(&self) -> RangeInclusive<u128> {
        self.blank_range.clone()
    }
}

impl Ord for BlankRange {
    fn cmp(&self, other: &Self) -> std::cmp::Ordering {
        let own_size = self.blank_size();
        let other_size = other.blank_size();
        own_size.cmp(&other_size)
    }
}

impl PartialOrd for BlankRange {
    fn partial_cmp(&self, other: &Self) -> Option<std::cmp::Ordering> {
        Some(Ord::cmp(self, other))
    }
}


================================================
FILE: columnar/src/column_values/u128_based/compact_space/build_compact_space.rs
================================================
use std::collections::{BTreeSet, BinaryHeap};
use std::iter;
use std::ops::RangeInclusive;

use itertools::Itertools;

use super::blank_range::BlankRange;
use super::{CompactSpace, RangeMapping};

/// Put the blanks for the sorted values into a binary heap
fn get_blanks(values_sorted: &BTreeSet<u128>) -> BinaryHeap<BlankRange> {
    let mut blanks: BinaryHeap<BlankRange> = BinaryHeap::new();
    for (first, second) in values_sorted.iter().copied().tuple_windows() {
        // Correctness Overflow: the values are deduped and sorted (BTreeSet property), that means
        // there's always space between two values.
        let blank_range = first + 1..=second - 1;
        let blank_range: Result<BlankRange, _> = blank_range.try_into();
        if let Ok(blank_range) = blank_range {
            blanks.push(blank_range);
        }
    }

    blanks
}

/// Accumulates ("stages") blanks, keeping track of the sum of their sizes, until they are
/// drained.
struct BlankCollector {
    blanks: Vec<BlankRange>,
    staged_blanks_sum: u128,
}

impl BlankCollector {
    /// Creates a collector without any staged blank.
    fn new() -> Self {
        BlankCollector {
            blanks: Vec::new(),
            staged_blanks_sum: 0,
        }
    }

    /// Stages `blank` and accounts for its size.
    fn stage_blank(&mut self, blank: BlankRange) {
        let size = blank.blank_size();
        self.staged_blanks_sum += size;
        self.blanks.push(blank);
    }

    /// Resets the staged size to 0 and returns an iterator removing all the staged blanks.
    fn drain(&mut self) -> impl Iterator<Item = BlankRange> + '_ {
        self.staged_blanks_sum = 0;
        self.blanks.drain(..)
    }

    /// Sum of the sizes of the currently staged blanks.
    fn staged_blanks_sum(&self) -> u128 {
        self.staged_blanks_sum
    }

    /// Number of currently staged blanks.
    fn num_staged_blanks(&self) -> usize {
        self.blanks.len()
    }
}
/// Number of bits required to represent `val`: the position of its highest set bit, or 0 if
/// `val` is 0.
fn num_bits(val: u128) -> u8 {
    let significant_bits = u128::BITS - val.leading_zeros();
    significant_bits as u8
}

/// Builds the compact space covering `values_deduped_sorted`.
///
/// Blanks (gaps between the values) are collected, largest first, and removed from the compact
/// space if this saves more bits than their metadata costs.
///
/// * `values_deduped_sorted` - the distinct values of the column.
/// * `total_num_values` - the number of values of the column; each bit removed from the
///   amplitude of the compact space is counted as saved once per value.
/// * `cost_per_blank` - the estimated metadata cost, in bits, of one blank.
///
/// # Panics
///
/// Panics if the amplitude of the resulting compact space does not fit into 32 bits.
pub fn get_compact_space(
    values_deduped_sorted: &BTreeSet<u128>,
    total_num_values: u32,
    cost_per_blank: usize,
) -> CompactSpace {
    let mut compact_space_builder = CompactSpaceBuilder::new();

    // We start with a space that is limited to min_value..=max_value.
    // Without any value, there is nothing to cover.
    let (Some(&min_value), Some(&max_value)) = (
        values_deduped_sorted.first(),
        values_deduped_sorted.last(),
    ) else {
        return compact_space_builder.finish();
    };

    let mut blanks: BinaryHeap<BlankRange> = get_blanks(values_deduped_sorted);

    // +1 for null, in case min and max covers the whole space, we are off by one.
    let mut amplitude_compact_space = (max_value - min_value).saturating_add(1);
    if min_value != 0 {
        compact_space_builder.add_blanks(iter::once(0..=min_value - 1));
    }
    if max_value != u128::MAX {
        compact_space_builder.add_blanks(iter::once(max_value + 1..=u128::MAX));
    }

    let mut amplitude_bits: u8 = num_bits(amplitude_compact_space);

    let mut blank_collector = BlankCollector::new();

    // We will stage blanks until they reduce the compact space by at least 1 bit and then flush
    // them if the metadata cost is lower than the total number of saved bits.
    // Binary heap to process the gaps by their size
    while let Some(blank_range) = blanks.pop() {
        blank_collector.stage_blank(blank_range);

        let staged_spaces_sum: u128 = blank_collector.staged_blanks_sum();
        let amplitude_new_compact_space = amplitude_compact_space - staged_spaces_sum;
        let amplitude_new_bits = num_bits(amplitude_new_compact_space);

        if amplitude_bits == amplitude_new_bits {
            continue;
        }
        let saved_bits = (amplitude_bits - amplitude_new_bits) as usize * total_num_values as usize;
        // TODO: Maybe calculate exact cost of blanks and run this more expensive computation only,
        // when amplitude_new_bits changes
        let cost = blank_collector.num_staged_blanks() * cost_per_blank;

        // We want to end up with a compact space that fits into 32 bits.
        // In order to deal with pathological cases, we force the algorithm to keep
        // refining the compact space until the number of amplitude bits is at most 32.
        //
        // The worst case scenario happens for a large number of u128s regularly
        // spread over the full u128 space.
        //
        // This change will force the algorithm to degenerate into dictionary encoding.
        if amplitude_bits <= 32 && cost >= saved_bits {
            // Continue here, since although we walk over the blanks by size,
            // we can potentially save a lot at the last bits, which are smaller blanks
            //
            // E.g. if the first range reduces the compact space by 1000 from 2000 to 1000, which
            // saves 11-10=1 bit and the next range reduces the compact space by 950 to
            // 50, which saves 10-6=4 bit
            continue;
        }

        amplitude_compact_space = amplitude_new_compact_space;
        amplitude_bits = amplitude_new_bits;
        compact_space_builder.add_blanks(blank_collector.drain().map(|blank| blank.blank_range()));
    }

    assert!(amplitude_bits <= 32);

    // Special case, when we did not collect any blank because:
    // * the data is empty (early exit)
    // * the algorithm decided it is not worth the cost, which can be the case for single values
    //
    // We drain one collected blank unconditionally, so the empty case is reserved for empty
    // data, and therefore an empty compact_space means the data is empty and no data is covered
    // (conversely to all data) and we can assign null to it.
    if compact_space_builder.is_empty() {
        compact_space_builder.add_blanks(
            blank_collector
                .drain()
                .map(|blank| blank.blank_range())
                .take(1),
        );
    }

    let compact_space = compact_space_builder.finish();
    if max_value - min_value != u128::MAX {
        debug_assert_eq!(
            compact_space.amplitude_compact_space(),
            amplitude_compact_space
        );
    }
    compact_space
}

/// Accumulates the blanks (ranges of the value space that are not covered) from which
/// `finish()` derives the covered ranges of the `CompactSpace`.
#[derive(Debug, Clone, Eq, PartialEq)]
struct CompactSpaceBuilder {
    // The blanks added so far, in insertion order. They get sorted in `finish()`.
    blanks: Vec<RangeInclusive<u128>>,
}

impl CompactSpaceBuilder {
    /// Creates a new compact space builder without any blank.
    fn new() -> Self {
        Self { blanks: Vec::new() }
    }

    /// Assumes that repeated add_blank calls don't overlap and are not adjacent,
    /// e.g. [3..=5, 5..=10] is not allowed
    ///
    /// Both of those assumptions are true when blanks are produced from sorted values.
    fn add_blanks(&mut self, blank: impl Iterator<Item = RangeInclusive<u128>>) {
        self.blanks.extend(blank);
    }

    /// Returns true if no blank has been added yet.
    fn is_empty(&self) -> bool {
        self.blanks.is_empty()
    }

    /// Converts the blanks to covered space and assigns the compact values.
    ///
    /// The covered space is the complement of the blanks. Compact value 0 is reserved for
    /// `null`, so the first covered range starts at compact value 1.
    ///
    /// # Panics
    ///
    /// Panics if two blanks overlap or are adjacent.
    fn finish(mut self) -> CompactSpace {
        // sort by start. ranges are not allowed to overlap
        self.blanks.sort_unstable_by_key(|blank| *blank.start());

        let mut covered_space = Vec::with_capacity(self.blanks.len());

        // beginning of the blanks
        if let Some(first_blank_start) = self.blanks.first().map(RangeInclusive::start)
            && *first_blank_start != 0
        {
            covered_space.push(0..=first_blank_start - 1);
        }

        // Between the blanks
        let between_blanks = self.blanks.iter().tuple_windows().map(|(left, right)| {
            assert!(
                left.end() < right.start(),
                "overlapping or adjacent ranges detected"
            );
            *left.end() + 1..=*right.start() - 1
        });
        covered_space.extend(between_blanks);

        // end of the blanks
        if let Some(last_blank_end) = self.blanks.last().map(RangeInclusive::end)
            && *last_blank_end != u128::MAX
        {
            covered_space.push(last_blank_end + 1..=u128::MAX);
        }

        if covered_space.is_empty() {
            covered_space.push(0..=0); // empty data case
        };

        let mut compact_start: u32 = 1; // 0 is reserved for `null`
        let mut ranges_mapping: Vec<RangeMapping> = Vec::with_capacity(covered_space.len());
        for cov in covered_space {
            let range_mapping = super::RangeMapping {
                value_range: cov,
                compact_start,
            };
            // The next covered range starts right after this one in the compact space.
            let covered_range_len = range_mapping.range_length();
            ranges_mapping.push(range_mapping);
            compact_start += covered_range_len;
        }
        CompactSpace { ranges_mapping }
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::column_values::u128_based::compact_space::COST_PER_BLANK_IN_BITS;

    // The heap pops the blanks by decreasing size, regardless of their position.
    #[test]
    fn test_binary_heap_pop_order() {
        let mut blanks: BinaryHeap<BlankRange> = BinaryHeap::new();
        blanks.push((0..=10).try_into().unwrap());
        blanks.push((100..=200).try_into().unwrap());
        blanks.push((100..=110).try_into().unwrap());
        assert_eq!(blanks.pop().unwrap().blank_size(), 101);
        assert_eq!(blanks.pop().unwrap().blank_size(), 11);
    }

    // A few values regularly spread over a 34-bit wide space must still end up in a compact
    // space that fits into 32 bits.
    #[test]
    fn test_worst_case_scenario() {
        let vals: BTreeSet<u128> = (0..8).map(|i| i * ((1u128 << 34) / 8)).collect();
        let compact_space = get_compact_space(&vals, vals.len() as u32, COST_PER_BLANK_IN_BITS);
        assert!(compact_space.amplitude_compact_space() < u32::MAX as u128);
    }
}


================================================
FILE: columnar/src/column_values/u128_based/compact_space/mod.rs
================================================
/// This codec takes a large number space (u128) and reduces it to a compact number space.
///
/// It will find spaces in the number range. For example:
///
/// 100, 101, 102, 103, 104, 50000, 50001
/// could be mapped to
/// 100..104 -> 0..4
/// 50000..50001 -> 5..6
///
/// Compact space 0..=6 requires far fewer bits than 100..=50001
///
/// The codec is created to compress ip addresses, but may be employed in other use cases.
use std::{
    cmp::Ordering,
    collections::BTreeSet,
    io::{self, Write},
    ops::{Range, RangeInclusive},
};

mod blank_range;
mod build_compact_space;

use build_compact_space::get_compact_space;
use common::{BinarySerializable, CountingWriter, OwnedBytes, VInt, VIntU128};
use tantivy_bitpacker::{BitPacker, BitUnpacker};

use crate::RowId;
use crate::column_values::ColumnValues;

/// Estimated cost, in bits, of storing one blank.
///
/// The real cost is hard to pin down: since blanks are delta encoded, the actual cost of a
/// blank depends on the number of blanks.
///
/// The number was chosen by looking at a real dataset. It is optimized for larger datasets.
const COST_PER_BLANK_IN_BITS: usize = 36;

/// The list of value ranges that make up the compact space.
///
/// Each entry maps one inclusive range of the original u128 space to a run of consecutive
/// compact `u32` values. The lookup methods binary-search this list, so the entries are
/// expected to be ordered by value range (and therefore by `compact_start`).
#[derive(Debug, Clone, Eq, PartialEq)]
pub struct CompactSpace {
    ranges_mapping: Vec<RangeMapping>,
}

/// One contiguous range of the original value space together with the compact value assigned
/// to its first element: `value_range` is mapped onto
/// `compact_start..=compact_start + range_length() - 1`.
#[derive(Debug, Clone, Eq, PartialEq)]
struct RangeMapping {
    value_range: RangeInclusive<u128>,
    compact_start: u32,
}
impl RangeMapping {
    /// Number of values contained in `value_range`, both bounds included.
    fn range_length(&self) -> u32 {
        let (first, last) = (*self.value_range.start(), *self.value_range.end());
        let distance = last - first;
        distance as u32 + 1
    }

    /// The compact value assigned to the last value of this range.
    fn compact_end(&self) -> u32 {
        let length = self.range_length();
        self.compact_start + length - 1
    }
}

impl BinarySerializable for CompactSpace {
    /// Writes the number of ranges, followed by two delta-encoded `VIntU128` per range: the
    /// distance from the previously written boundary to the start of the range, then the
    /// distance from that start to the end of the range.
    fn serialize<W: io::Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        VInt(self.ranges_mapping.len() as u64).serialize(writer)?;

        // Last boundary written so far; every boundary is stored relative to it.
        let mut prev_value = 0;
        for value_range in self
            .ranges_mapping
            .iter()
            .map(|range_mapping| &range_mapping.value_range)
        {
            let blank_delta_start = value_range.start() - prev_value;
            VIntU128(blank_delta_start).serialize(writer)?;
            prev_value = *value_range.start();

            let blank_delta_end = value_range.end() - prev_value;
            VIntU128(blank_delta_end).serialize(writer)?;
            prev_value = *value_range.end();
        }

        Ok(())
    }

    /// Reads back what `serialize` wrote and rebuilds the compact positions, which are not
    /// stored: the first range starts at compact value 1 and each following range starts right
    /// after the previous one.
    ///
    /// # Errors
    /// Besides I/O errors, returns `InvalidData` if the accumulated deltas do not fit in a
    /// `u128`, which can only happen with corrupted input.
    fn deserialize<R: io::Read>(reader: &mut R) -> io::Result<Self> {
        // The deltas are read from storage: a corrupted file must surface as an error rather
        // than overflow (panic in debug builds, silent wrap-around in release builds).
        let overflow_error = || {
            io::Error::new(
                io::ErrorKind::InvalidData,
                "compact space range boundary overflows u128",
            )
        };

        let num_ranges = VInt::deserialize(reader)?.0;
        let mut ranges_mapping: Vec<RangeMapping> = vec![];
        let mut value = 0u128;
        let mut compact_start = 1u32; // 0 is reserved for `null`
        for _ in 0..num_ranges {
            let blank_delta_start = VIntU128::deserialize(reader)?.0;
            value = value
                .checked_add(blank_delta_start)
                .ok_or_else(overflow_error)?;
            let blank_start = value;

            let blank_delta_end = VIntU128::deserialize(reader)?.0;
            value = value
                .checked_add(blank_delta_end)
                .ok_or_else(overflow_error)?;
            let blank_end = value;

            let range_mapping = RangeMapping {
                value_range: blank_start..=blank_end,
                compact_start,
            };
            let range_length = range_mapping.range_length();
            ranges_mapping.push(range_mapping);
            compact_start += range_length;
        }

        Ok(Self { ranges_mapping })
    }
}

impl CompactSpace {
    /// Amplitude is the value range of the compact space including the sentinel value used to
    /// identify null values. The compact space is 0..=amplitude .
    ///
    /// It's only used to verify we don't exceed u64 number space, which would indicate a bug.
    fn amplitude_compact_space(&self) -> u128 {
        self.ranges_mapping
            .last()
            .map(|last_range| last_range.compact_end() as u128)
            .unwrap_or(1) // compact space starts at 1, 0 == null
    }

    fn get_range_mapping(&self, pos: usize) -> &RangeMapping {
        &self.ranges_mapping[pos]
    }

    /// Returns either Ok(the value in the compact space) or if it is outside the compact space the
    /// Err(position where it would be inserted)
    fn u128_to_compact(&self, value: u128) -> Result<u32, usize> {
        self.ranges_mapping
            .binary_search_by(|probe| {
                let value_range: &RangeInclusive<u128> = &probe.value_range;
                if value < *value_range.start() {
                    Ordering::Greater
                } else if value > *value_range.end() {
                    Ordering::Less
                } else {
                    Ordering::Equal
                }
            })
            .map(|pos| {
                let range_mapping = &self.ranges_mapping[pos];
                let pos_in_range: u32 = (value - range_mapping.value_range.start()) as u32;
                range_mapping.compact_start + pos_in_range
            })
    }

    /// Unpacks a value from compact space u32 to u128 space
    fn compact_to_u128(&self, compact: u32) -> u128 {
        let pos = self
            .ranges_mapping
            .binary_search_by_key(&compact, |range_mapping| range_mapping.compact_start)
            // Correctness: Overflow. The first range starts at compact space 0, the error from
            // binary search can never be 0
            .unwrap_or_else(|e| e - 1);

        let range_mapping = &self.ranges_mapping[pos];
        let diff = compact - range_mapping.compact_start;
        range_mapping.value_range.start() + diff as u128
    }
}

/// Compressor of the compact space codec.
///
/// It is created by `train_from`, which computes the codec parameters from the values, and is
/// consumed by `compress_into`, which writes the bit-packed values followed by the footer.
pub struct CompactSpaceCompressor {
    params: IPCodecParams,
}

/// Parameters of the compact space codec. They are serialized into the footer of the column.
#[derive(Debug, Clone)]
pub struct IPCodecParams {
    /// Mapping between the original u128 values and the compact u32 values.
    compact_space: CompactSpace,
    /// Unpacker configured for `num_bits`; it is rebuilt on deserialization, not stored.
    bit_unpacker: BitUnpacker,
    /// Smallest value of the column (0 if the column is empty).
    min_value: u128,
    /// Largest value of the column (0 if the column is empty).
    max_value: u128,
    /// Total number of values, duplicates included.
    num_vals: RowId,
    /// Number of bits used to bit-pack one compact value.
    num_bits: u8,
}

impl CompactSpaceCompressor {
    /// Total number of values seen during training, duplicates included.
    pub fn num_vals(&self) -> RowId {
        self.params.num_vals
    }

    /// Computes the codec parameters from a first pass over the values.
    ///
    /// All distinct values are gathered in a sorted set, which may cost a lot of memory.
    ///
    /// # Panics
    /// Panics if the largest value does not map to the last value of the compact space, which
    /// would indicate a bug in the construction of the compact space.
    pub fn train_from(iter: impl Iterator<Item = u128>) -> Self {
        let mut values_sorted = BTreeSet::new();
        // Total number of values, with their redundancy.
        let mut total_num_values = 0u32;
        iter.for_each(|val| {
            total_num_values += 1u32;
            values_sorted.insert(val);
        });
        // An empty column falls back to 0 for both bounds.
        let min_value = values_sorted.first().copied().unwrap_or(0);
        let max_value = values_sorted.last().copied().unwrap_or(0);

        let compact_space =
            get_compact_space(&values_sorted, total_num_values, COST_PER_BLANK_IN_BITS);
        let amplitude_compact_space = compact_space.amplitude_compact_space();

        assert!(
            amplitude_compact_space <= u64::MAX as u128,
            "case unsupported."
        );

        let num_bits = tantivy_bitpacker::compute_num_bits(amplitude_compact_space as u64);

        // The largest value has to land exactly on the last compact value.
        let compact_max = compact_space
            .u128_to_compact(max_value)
            .expect("could not convert max value to compact space");
        assert_eq!(compact_max, amplitude_compact_space as u32);

        let params = IPCodecParams {
            compact_space,
            bit_unpacker: BitUnpacker::new(num_bits),
            min_value,
            max_value,
            num_vals: total_num_values,
            num_bits,
        };
        CompactSpaceCompressor { params }
    }

    /// Writes the serialized parameters followed by their length in bytes as a `u32`.
    fn write_footer(self, writer: &mut impl Write) -> io::Result<()> {
        let mut counting_writer = CountingWriter::wrap(writer);
        self.params.serialize(&mut counting_writer)?;

        let footer_len = counting_writer.written_bytes() as u32;
        footer_len.serialize(&mut counting_writer)?;

        Ok(())
    }

    /// Bit-packs the compact representation of every value of `vals` into `write`, then appends
    /// the footer.
    ///
    /// # Errors
    /// Returns `InvalidData` if a value is not part of the compact space, and forwards any
    /// error of the underlying writer.
    pub fn compress_into(
        self,
        vals: impl Iterator<Item = u128>,
        write: &mut impl Write,
    ) -> io::Result<()> {
        let num_bits = self.params.num_bits;
        let mut bitpacker = BitPacker::default();
        for val in vals {
            let Ok(compact) = self.params.compact_space.u128_to_compact(val) else {
                return Err(io::Error::new(
                    io::ErrorKind::InvalidData,
                    "Could not convert value to compact_space. This is a bug.",
                ));
            };
            bitpacker.write(u64::from(compact), num_bits, write)?;
        }
        bitpacker.close(write)?;
        self.write_footer(write)
    }
}

/// Reader of a column written with the compact space codec.
#[derive(Debug, Clone)]
pub struct CompactSpaceDecompressor {
    /// The complete column bytes (bit-packed values, footer and footer length).
    data: OwnedBytes,
    /// The codec parameters read from the footer.
    params: IPCodecParams,
}

impl BinarySerializable for IPCodecParams {
    fn serialize<W: io::Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        // header flags for future optional dictionary encoding
        let footer_flags = 0u64;
        footer_flags.serialize(writer)?;

        VIntU128(self.min_value).serialize(writer)?;
        VIntU128(self.max_value).serialize(writer)?;
        VIntU128(self.num_vals as u128).serialize(writer)?;
        self.num_bits.serialize(writer)?;

        self.compact_space.serialize(writer)?;

        Ok(())
    }

    fn deserialize<R: io::Read>(reader: &mut R) -> io::Result<Self> {
        let _header_flags = u64::deserialize(reader)?;
        let min_value = VIntU128::deserialize(reader)?.0;
        let max_value = VIntU128::deserialize(reader)?.0;
        let num_vals = VIntU128::deserialize(reader)?.0 as u32;
        let num_bits = u8::deserialize(reader)?;
        let compact_space = CompactSpace::deserialize(reader)?;

        Ok(Self {
            compact_space,
            bit_unpacker: BitUnpacker::new(num_bits),
            min_value,
            max_value,
            num_vals,
            num_bits,
        })
    }
}

/// Represents the result of looking up a u128 value in the compact space.
///
/// If the value is not part of the compact space, the lookup falls forward: the first compact
/// value of the next range is reported instead, or `AfterLast` if there is no such range.
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
pub enum CompactHit {
    /// The value exists in the compact space
    Exact(u32),
    /// The value does not exist in the compact space, but the next higher value does
    Next(u32),
    /// The value is greater than the maximum compact value
    AfterLast,
}

/// Gives access to the compact space compressed values as u64, i.e. without converting them
/// back to u128.
///
/// Working on u64 is faster than working on u128, and it lets u128 columns be handled like u64
/// columns, with `open_u64_lenient` acting as a uniform access interface.
///
/// Use `compact_to_u128` to convert one of the internal u64 values to u128.
pub struct CompactSpaceU64Accessor(CompactSpaceDecompressor);
impl CompactSpaceU64Accessor {
    /// Opens the column stored in `data`; see `CompactSpaceDecompressor::open`.
    pub(crate) fn open(data: OwnedBytes) -> io::Result<CompactSpaceU64Accessor> {
        CompactSpaceDecompressor::open(data).map(CompactSpaceU64Accessor)
    }
    /// Maps a value of the compact space back to the u128 value it stands for.
    pub fn compact_to_u128(&self, compact: u32) -> u128 {
        let Self(decompressor) = self;
        decompressor.compact_to_u128(compact)
    }

    /// Looks up `value` in the compact space, falling forward to the next compact value if
    /// `value` itself is not part of it.
    pub fn u128_to_next_compact(&self, value: u128) -> CompactHit {
        let Self(decompressor) = self;
        decompressor.u128_to_next_compact(value)
    }
}

impl ColumnValues<u64> for CompactSpaceU64Accessor {
    /// Returns the compact value stored for `doc`, widened to u64.
    #[inline]
    fn get_val(&self, doc: u32) -> u64 {
        u64::from(self.0.get_compact(doc))
    }

    /// Compact value of the smallest u128 value of the column.
    fn min_value(&self) -> u64 {
        let smallest = self.0.min_value();
        u64::from(self.0.u128_to_compact(smallest).unwrap())
    }

    /// Compact value of the largest u128 value of the column.
    fn max_value(&self) -> u64 {
        let largest = self.0.max_value();
        u64::from(self.0.u128_to_compact(largest).unwrap())
    }

    fn num_vals(&self) -> u32 {
        self.0.params.num_vals
    }

    #[inline]
    fn iter(&self) -> Box<dyn Iterator<Item = u64> + '_> {
        let compact_values = self.0.iter_compact();
        Box::new(compact_values.map(u64::from))
    }

    /// `value_range` is expressed in compact values. Its bounds are converted to u128 and the
    /// lookup is delegated to the u128 implementation of the wrapped decompressor.
    #[inline]
    fn get_row_ids_for_value_range(
        &self,
        value_range: RangeInclusive<u64>,
        position_range: Range<u32>,
        positions: &mut Vec<u32>,
    ) {
        let lower = self.0.compact_to_u128(*value_range.start() as u32);
        let upper = self.0.compact_to_u128(*value_range.end() as u32);
        self.0
            .get_row_ids_for_value_range(lower..=upper, position_range, positions)
    }
}

impl ColumnValues<u128> for CompactSpaceDecompressor {
    #[inline]
    fn get_val(&self, doc: u32) -> u128 {
        let compact = self.get_compact(doc);
        self.compact_to_u128(compact)
    }

    fn min_value(&self) -> u128 {
        self.params.min_value
    }

    fn max_value(&self) -> u128 {
        self.params.max_value
    }

    fn num_vals(&self) -> u32 {
        self.params.num_vals
    }

    #[inline]
    fn iter(&self) -> Box<dyn Iterator<Item = u128> + '_> {
        Box::new(self.iter())
    }

    /// Appends to `positions` the row ids within `position_range` whose value lies in
    /// `value_range`.
    ///
    /// The u128 bounds are first translated to compact values, then the search runs on the
    /// bit-packed compact values.
    #[inline]
    fn get_row_ids_for_value_range(
        &self,
        value_range: RangeInclusive<u128>,
        position_range: Range<u32>,
        positions: &mut Vec<u32>,
    ) {
        let (from_value, to_value) = (*value_range.start(), *value_range.end());
        if from_value > to_value {
            return;
        }
        // Never look past the last row of the column.
        let clamped_end = position_range.end.min(self.num_vals());
        let position_range = position_range.start..clamped_end;
        assert!(to_value >= from_value);
        let lookup_from = self.u128_to_compact(from_value);
        let lookup_to = self.u128_to_compact(to_value);

        // Quick return: if both bounds fall into the same non-mapped space, the range cannot
        // cover any value.
        if matches!(
            (lookup_to, lookup_from),
            (Err(gap_to), Err(gap_from)) if gap_to == gap_from
        ) {
            return;
        }

        let compact_from = match lookup_from {
            Ok(compact) => compact,
            // Lower bound in a non-mapped space: start at the first value of the next range.
            // Correctness (out of bounds): an index of `last_index + 1` implies that the upper
            // bound maps into the same non-mapped space, which exited early above.
            Err(next_range_idx) => {
                self.params
                    .compact_space
                    .get_range_mapping(next_range_idx)
                    .compact_start
            }
        };
        let compact_to = match lookup_to {
            Ok(compact) => compact,
            // Upper bound in a non-mapped space: stop at the last value of the previous range.
            // Correctness (underflow): an index of 0 implies that the lower bound maps into the
            // same non-mapped space, which exited early above.
            Err(next_range_idx) => {
                let previous_range_idx = next_range_idx - 1;
                self.params
                    .compact_space
                    .get_range_mapping(previous_range_idx)
                    .compact_end()
            }
        };

        self.get_positions_for_compact_value_range(
            compact_from..=compact_to,
            position_range,
            positions,
        );
    }
}

impl CompactSpaceDecompressor {
    /// Opens a column written by `CompactSpaceCompressor::compress_into`.
    ///
    /// The expected layout is `[bit-packed values][footer][footer length as u32]`.
    ///
    /// # Errors
    /// Returns `InvalidData` if `data` is too short to hold the footer length or the footer it
    /// announces, and forwards any error raised while deserializing the footer.
    pub fn open(data: OwnedBytes) -> io::Result<CompactSpaceDecompressor> {
        const FOOTER_LEN_NUM_BYTES: usize = 4;

        // Truncated or corrupted data must be reported as an error, not as a panic caused by an
        // underflowing subtraction or an out-of-bounds slice.
        let footer_len_offset = data
            .len()
            .checked_sub(FOOTER_LEN_NUM_BYTES)
            .ok_or_else(|| {
                io::Error::new(
                    io::ErrorKind::InvalidData,
                    "compact space column is too short to contain a footer length",
                )
            })?;
        let (data_slice, footer_len_bytes) = data.split_at(footer_len_offset);
        let footer_len = u32::deserialize(&mut &footer_len_bytes[..])?;

        let footer_offset = data_slice
            .len()
            .checked_sub(footer_len as usize)
            .ok_or_else(|| {
                io::Error::new(
                    io::ErrorKind::InvalidData,
                    "compact space footer length exceeds the size of the column data",
                )
            })?;
        let data_footer = &data_slice[footer_offset..];
        let params = IPCodecParams::deserialize(&mut &data_footer[..])?;
        let decompressor = CompactSpaceDecompressor { data, params };

        Ok(decompressor)
    }

    /// Converting to compact space for the decompressor is more complex, since we may get values
    /// which are outside the compact space. e.g. if we map
    /// 1000 => 5
    /// 2000 => 6
    ///
    /// and we want a mapping for 1005, there is no equivalent compact space. We instead return an
    /// error with the index of the next range.
    fn u128_to_compact(&self, value: u128) -> Result<u32, usize> {
        self.params.compact_space.u128_to_compact(value)
    }

    /// Finds the next compact space value for a given u128 value.
    ///
    /// Returns `Exact` if `value` is part of the compact space, `Next` with the first compact
    /// value of the following range if it is not, and `AfterLast` if no range follows.
    pub fn u128_to_next_compact(&self, value: u128) -> CompactHit {
        match self.u128_to_compact(value) {
            Ok(compact) => CompactHit::Exact(compact),
            Err(pos) => {
                if pos >= self.params.compact_space.ranges_mapping.len() {
                    CompactHit::AfterLast
                } else {
                    let next_range = &self.params.compact_space.ranges_mapping[pos];
                    CompactHit::Next(next_range.compact_start)
                }
            }
        }
    }

    /// Converts a compact value back to the u128 value it stands for.
    fn compact_to_u128(&self, compact: u32) -> u128 {
        self.params.compact_space.compact_to_u128(compact)
    }

    /// Iterates over the compact values of all rows, in row order.
    #[inline]
    fn iter_compact(&self) -> impl Iterator<Item = u32> + '_ {
        (0..self.params.num_vals)
            .map(move |idx| self.params.bit_unpacker.get(idx, &self.data) as u32)
    }

    /// Iterates over the u128 values of all rows, in row order.
    #[inline]
    fn iter(&self) -> impl Iterator<Item = u128> + '_ {
        // TODO: Performance. It would be better to iterate on the ranges and check existence via
        // the bit_unpacker.
        self.iter_compact()
            .map(|compact| self.compact_to_u128(compact))
    }

    /// Returns the compact value stored at row `idx`.
    #[inline]
    pub fn get_compact(&self, idx: u32) -> u32 {
        self.params.bit_unpacker.get(idx, &self.data) as u32
    }

    /// Returns the u128 value stored at row `idx`.
    #[inline]
    pub fn get(&self, idx: u32) -> u128 {
        let compact = self.get_compact(idx);
        self.compact_to_u128(compact)
    }

    /// Smallest value of the column, as recorded in the footer.
    pub fn min_value(&self) -> u128 {
        self.params.min_value
    }

    /// Largest value of the column, as recorded in the footer.
    pub fn max_value(&self) -> u128 {
        self.params.max_value
    }

    /// Appends to `positions` the rows of `position_range` whose compact value lies in
    /// `value_range`.
    fn get_positions_for_compact_value_range(
        &self,
        value_range: RangeInclusive<u32>,
        position_range: Range<u32>,
        positions: &mut Vec<u32>,
    ) {
        self.params.bit_unpacker.get_ids_for_value_range(
            *value_range.start() as u64..=*value_range.end() as u64,
            position_range,
            &self.data,
            positions,
        );
    }
}

#[cfg(test)]
mod tests {

    use itertools::Itertools;

    use super::*;
    use crate::column_values::u128_based::U128Header;
    use crate::column_values::{open_u128_mapped, serialize_column_values_u128};

    // Builds a compact space directly and checks the mapping in both directions, the contiguity
    // of the compact ranges and the serialization round trip.
    #[test]
    fn compact_space_test() {
        let ips: BTreeSet<u128> = [
            2u128, 4u128, 1000, 1001, 1002, 1003, 1004, 1005, 1008, 1010, 1012, 1260,
        ]
        .into_iter()
        .collect();
        let compact_space = get_compact_space(&ips, ips.len() as u32, 11);
        let amplitude = compact_space.amplitude_compact_space();
        assert_eq!(amplitude, 17);
        assert_eq!(1, compact_space.u128_to_compact(2).unwrap());
        assert_eq!(2, compact_space.u128_to_compact(3).unwrap());
        assert_eq!(compact_space.u128_to_compact(100).unwrap_err(), 1);

        // Each range must start right after the end of the previous one.
        for (num1, num2) in (0..3).tuple_windows() {
            assert_eq!(
                compact_space.get_range_mapping(num1).compact_end() + 1,
                compact_space.get_range_mapping(num2).compact_start
            );
        }

        let mut output: Vec<u8> = Vec::new();
        compact_space.serialize(&mut output).unwrap();

        assert_eq!(
            compact_space,
            CompactSpace::deserialize(&mut &output[..]).unwrap()
        );

        for ip in ips {
            let compact = compact_space.u128_to_compact(ip).unwrap();
            assert_eq!(compact_space.compact_to_u128(compact), ip);
        }
    }

    // Two far apart values and a cost of 1 bit per blank must give an amplitude of 2.
    #[test]
    fn compact_space_amplitude_test() {
        let ips = &[100000u128, 1000000].into_iter().collect();
        let compact_space = get_compact_space(ips, ips.len() as u32, 1);
        let amplitude = compact_space.amplitude_compact_space();
        assert_eq!(amplitude, 2);
    }

    // Opens the serialized column `data` and checks that every row decodes to the value of
    // `expected`, and that range lookups around every value return the expected positions.
    fn test_all(mut data: OwnedBytes, expected: &[u128]) {
        // Consume the header so that `data` starts at the codec payload.
        let _header = U128Header::deserialize(&mut data);
        let decompressor = CompactSpaceDecompressor::open(data).unwrap();
        for (idx, expected_val) in expected.iter().cloned().enumerate() {
            let val = decompressor.get(idx as u32);
            assert_eq!(val, expected_val);

            // Compares the range lookup against a plain scan of `expected`.
            let test_range = |range: RangeInclusive<u128>| {
                let expected_positions = expected
                    .iter()
                    .positions(|val| range.contains(val))
                    .map(|pos| pos as u32)
                    .collect::<Vec<_>>();
                let mut positions = Vec::new();
                decompressor.get_row_ids_for_value_range(
                    range,
                    0..decompressor.num_vals(),
                    &mut positions,
                );
                assert_eq!(positions, expected_positions);
            };

            test_range(expected_val.saturating_sub(1)..=expected_val);
            test_range(expected_val..=expected_val);
            test_range(expected_val..=expected_val.saturating_add(1));
            test_range(expected_val.saturating_sub(1)..=expected_val.saturating_add(1));
        }
    }

    // Serializes `u128_vals`, runs `test_all` on the result and returns the serialized bytes
    // (header included).
    fn test_aux_vals(u128_vals: &[u128]) -> OwnedBytes {
        let mut out = Vec::new();
        serialize_column_values_u128(&u128_vals, &mut out).unwrap();
        let data = OwnedBytes::new(out);
        test_all(data.clone(), u128_vals);
        data
    }

    // Range lookups on unsorted values, including bounds that fall between mapped ranges.
    #[test]
    fn test_range_1() {
        let vals = &[
            1u128,
            100u128,
            3u128,
            99999u128,
            100000u128,
            100001u128,
            4_000_211_221u128,
            4_000_211_222u128,
            333u128,
        ];
        let mut data = test_aux_vals(vals);

        let _header = U128Header::deserialize(&mut data);
        let decomp = CompactSpaceDecompressor::open(data).unwrap();
        let complete_range = 0..vals.len() as u32;
        // Every value must be found at its own position when the row range is just that row.
        for (pos, val) in vals.iter().enumerate() {
            let val = *val;
            let pos = pos as u32;
            let mut positions = Vec::new();
            decomp.get_row_ids_for_value_range(val..=val, pos..pos + 1, &mut positions);
            assert_eq!(positions, vec![pos]);
        }

        // handle docid range out of bounds
        let positions: Vec<u32> = get_positions_for_value_range_helper(&decomp, 0..=1, 1..u32::MAX);
        assert!(positions.is_empty());

        let positions =
            get_positions_for_value_range_helper(&decomp, 0..=1, complete_range.clone());
        assert_eq!(positions, vec![0]);
        let positions =
            get_positions_for_value_range_helper(&decomp, 0..=2, complete_range.clone());
        assert_eq!(positions, vec![0]);
        let positions =
            get_positions_for_value_range_helper(&decomp, 0..=3, complete_range.clone());
        assert_eq!(positions, vec![0, 2]);
        assert_eq!(
            get_positions_for_value_range_helper(
                &decomp,
                99999u128..=99999u128,
                complete_range.clone()
            ),
            vec![3]
        );
        assert_eq!(
            get_positions_for_value_range_helper(
                &decomp,
                99999u128..=100000u128,
                complete_range.clone()
            ),
            vec![3, 4]
        );
        assert_eq!(
            get_positions_for_value_range_helper(
                &decomp,
                99998u128..=100000u128,
                complete_range.clone()
            ),
            vec![3, 4]
        );
        assert_eq!(
            &get_positions_for_value_range_helper(
                &decomp,
                99998u128..=99999u128,
                complete_range.clone()
            ),
            &[3]
        );
        assert!(
            get_positions_for_value_range_helper(
                &decomp,
                99998u128..=99998u128,
                complete_range.clone()
            )
            .is_empty()
        );
        assert_eq!(
            &get_positions_for_value_range_helper(
                &decomp,
                333u128..=333u128,
                complete_range.clone()
            ),
            &[8]
        );
        assert_eq!(
            &get_positions_for_value_range_helper(
                &decomp,
                332u128..=333u128,
                complete_range.clone()
            ),
            &[8]
        );
        assert_eq!(
            &get_positions_for_value_range_helper(
                &decomp,
                332u128..=334u128,
                complete_range.clone()
            ),
            &[8]
        );
        assert_eq!(
            &get_positions_for_value_range_helper(
                &decomp,
                333u128..=334u128,
                complete_range.clone()
            ),
            &[8]
        );

        assert_eq!(
            &get_positions_for_value_range_helper(
                &decomp,
                4_000_211_221u128..=5_000_000_000u128,
                complete_range
            ),
            &[6, 7]
        );
    }

    // An empty column must serialize and open without error.
    #[test]
    fn test_empty() {
        let vals = &[];
        let data = test_aux_vals(vals);
        let _decomp = CompactSpaceDecompressor::open(data).unwrap();
    }

    // Range lookups whose lower bound lies before the first value of the column.
    #[test]
    fn test_range_2() {
        let vals = &[
            100u128,
            99999u128,
            100000u128,
            100001u128,
            4_000_211_221u128,
            4_000_211_222u128,
            333u128,
        ];
        let mut data = test_aux_vals(vals);
        let _header = U128Header::deserialize(&mut data);
        let decomp = CompactSpaceDecompressor::open(data).unwrap();
        let complete_range = 0..vals.len() as u32;
        assert!(
            &get_positions_for_value_range_helper(&decomp, 0..=5, complete_range.clone())
                .is_empty(),
        );
        assert_eq!(
            &get_positions_for_value_range_helper(&decomp, 0..=100, complete_range.clone()),
            &[0]
        );
        assert_eq!(
            &get_positions_for_value_range_helper(&decomp, 0..=105, complete_range),
            &[0]
        );
    }

    // Convenience wrapper around `get_row_ids_for_value_range` returning the positions as a
    // fresh `Vec`.
    fn get_positions_for_value_range_helper<C: ColumnValues<T> + ?Sized, T: PartialOrd>(
        column: &C,
        value_range: RangeInclusive<T>,
        doc_id_range: Range<u32>,
    ) -> Vec<u32> {
        let mut positions = Vec::new();
        column.get_row_ids_for_value_range(value_range, doc_id_range, &mut positions);
        positions
    }

    // Same kind of range lookups, but through the column returned by `open_u128_mapped`.
    #[test]
    fn test_range_3() {
        let vals = &[
            200u128,
            201,
            202,
            203,
            204,
            204,
            206,
            207,
            208,
            209,
            210,
            1_000_000,
            5_000_000_000,
        ];
        let mut out = Vec::new();
        serialize_column_values_u128(&&vals[..], &mut out).unwrap();
        let decomp = open_u128_mapped(OwnedBytes::new(out)).unwrap();
        let complete_range = 0..vals.len() as u32;

        assert_eq!(
            get_positions_for_value_range_helper(&*decomp, 199..=200, complete_range.clone()),
            vec![0]
        );

        assert_eq!(
            get_positions_for_value_range_helper(&*decomp, 199..=201, complete_range.clone()),
            vec![0, 1]
        );

        assert_eq!(
            get_positions_for_value_range_helper(&*decomp, 200..=200, complete_range.clone()),
            vec![0]
        );

        assert_eq!(
            get_positions_for_value_range_helper(&*decomp, 1_000_000..=1_000_000, complete_range),
            vec![11]
        );
    }

    // Single value just below `i64::MAX`.
    #[test]
    fn test_bug1() {
        let vals = &[9223372036854775806];
        let _data = test_aux_vals(vals);
    }

    // Single value equal to `u128::MAX`.
    #[test]
    fn test_bug2() {
        let vals = &[340282366920938463463374607431768211455u128];
        let _data = test_aux_vals(vals);
    }

    // Single value equal to `u128::MAX - 1`.
    #[test]
    fn test_bug3() {
        let vals = &[340282366920938463463374607431768211454];
        let _data = test_aux_vals(vals);
    }

    // Both extremes of the u128 space in one column.
    #[test]
    fn test_bug4() {
        let vals = &[340282366920938463463374607431768211455, 0];
        let _data = test_aux_vals(vals);
    }

    // Many copies of one value, preceded by a large gap starting at 0.
    #[test]
    fn test_first_large_gaps() {
        let vals = &[1_000_000_000u128; 100];
        let _data = test_aux_vals(vals);
    }

    // Covers the three outcomes of `u128_to_next_compact`: `Exact`, `Next` and `AfterLast`.
    #[test]
    fn test_u128_to_next_compact() {
        let vals = &[100u128, 200u128, 1_000_000_000u128, 1_000_000_100u128];
        let mut data = test_aux_vals(vals);

        let _header = U128Header::deserialize(&mut data);
        let decomp = CompactSpaceDecompressor::open(data).unwrap();

        // Test value that's already in a range
        let compact_100 = decomp.u128_to_compact(100).unwrap();
        assert_eq!(
            decomp.u128_to_next_compact(100),
            CompactHit::Exact(compact_100)
        );

        // Test value between two ranges
        let compact_million = decomp.u128_to_compact(1_000_000_000).unwrap();
        assert_eq!(
            decomp.u128_to_next_compact(250),
            CompactHit::Next(compact_million)
        );

        // Test value before the first range
        assert_eq!(
            decomp.u128_to_next_compact(50),
            CompactHit::Next(compact_100)
        );

        // Test value after the last range
        assert_eq!(
            decomp.u128_to_next_compact(10_000_000_000),
            CompactHit::AfterLast
        );
    }

    use proptest::prelude::*;

    // Mostly arbitrary u128 values, with extra weight on values near `u128::MAX`, `i64::MAX`,
    // `i128::MAX` and 0.
    fn num_strategy() -> impl Strategy<Value = u128> {
        prop_oneof![
            1 => prop::num::u128::ANY.prop_map(|num| u128::MAX - (num % 10) ),
            1 => prop::num::u128::ANY.prop_map(|num| i64::MAX as u128 + 5 - (num % 10) ),
            1 => prop::num::u128::ANY.prop_map(|num| i128::MAX as u128 + 5 - (num % 10) ),
            1 => prop::num::u128::ANY.prop_map(|num| num % 10 ),
            20 => prop::num::u128::ANY,
        ]
    }

    proptest! {
        #![proptest_config(ProptestConfig::with_cases(10))]

        // Round trip and range lookups on random columns of 1 to 999 values.
        #[test]
        fn compress_decompress_random(vals in proptest::collection::vec(num_strategy() , 1..1000)) {
            let _data = test_aux_vals(&vals);
        }
    }
}


================================================
FILE: columnar/src/column_values/u128_based/mod.rs
================================================
use std::fmt::Debug;
use std::io;
use std::io::Write;
use std::sync::Arc;

mod compact_space;

use common::{BinarySerializable, OwnedBytes, VInt};
pub use compact_space::{
    CompactHit, CompactSpaceCompressor, CompactSpaceDecompressor, CompactSpaceU64Accessor,
};

use crate::column_values::monotonic_map_column;
use crate::column_values::monotonic_mapping::{
    StrictlyMonotonicMappingInverter, StrictlyMonotonicMappingToInternal,
};
use crate::iterable::Iterable;
use crate::{ColumnValues, MonotonicallyMappableToU128};

/// Header written in front of a serialized u128 column: the number of values, followed by the
/// codec used to encode them.
#[derive(Debug, Copy, Clone, PartialEq, Eq)]
pub(crate) struct U128Header {
    /// Number of values in the column.
    pub num_vals: u32,
    /// Codec the values are encoded with.
    pub codec_type: U128FastFieldCodecType,
}

impl BinarySerializable for U128Header {
    fn serialize<W: io::Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        VInt(self.num_vals as u64).serialize(writer)?;
        self.codec_type.serialize(writer)?;
        Ok(())
    }

    fn deserialize<R: io::Read>(reader: &mut R) -> io::Result<Self> {
        let num_vals = VInt::deserialize(reader)?.0 as u32;
        let codec_type = U128FastFieldCodecType::deserialize(reader)?;
        Ok(U128Header {
            num_vals,
            codec_type,
        })
    }
}

/// Serializes the values of `iterable`, converted to u128, with the compact space codec.
///
/// The values are iterated twice: a first pass trains the compressor, a second pass writes the
/// compressed values after the header.
pub fn serialize_column_values_u128<T: MonotonicallyMappableToU128>(
    iterable: &dyn Iterable<T>,
    output: &mut impl io::Write,
) -> io::Result<()> {
    // Yields a fresh iterator over the u128 representation of the values on every call.
    let u128_values = || {
        iterable
            .boxed_iter()
            .map(MonotonicallyMappableToU128::to_u128)
    };

    let compressor = CompactSpaceCompressor::train_from(u128_values());
    let header = U128Header {
        num_vals: compressor.num_vals(),
        codec_type: U128FastFieldCodecType::CompactSpace,
    };
    header.serialize(output)?;
    compressor.compress_into(u128_values(), output)
}

#[derive(PartialEq, Eq, PartialOrd, Ord, Debug, Clone, Copy)]
#[repr(u8)]
/// Available codecs to encode data that was converted to u128 (via
/// [`MonotonicallyMappableToU128`]).
///
/// The `u8` discriminant of a variant is the code written when the codec type is serialized.
pub(crate) enum U128FastFieldCodecType {
    /// This codec takes a large number space (u128) and reduces it to a compact number space, by
    /// removing the holes.
    CompactSpace = 1,
}

impl BinarySerializable for U128FastFieldCodecType {
    /// Writes the codec as its one-byte code.
    fn serialize<W: Write + ?Sized>(&self, wrt: &mut W) -> io::Result<()> {
        self.to_code().serialize(wrt)
    }

    /// Reads a one-byte code and maps it back to a codec type.
    ///
    /// # Errors
    /// Returns an [`io::ErrorKind::InvalidData`] error naming the offending code if it does not
    /// match any known codec.
    fn deserialize<R: io::Read>(reader: &mut R) -> io::Result<Self> {
        let code = u8::deserialize(reader)?;
        // `io::Error::new` does not format its message: the message has to be built with
        // `format!` for the code to actually appear in it.
        Self::from_code(code).ok_or_else(|| {
            io::Error::new(
                io::ErrorKind::InvalidData,
                format!("Unknown code `{code}`."),
            )
        })
    }
}

impl U128FastFieldCodecType {
    /// Returns the one-byte code identifying this codec.
    pub(crate) fn to_code(self) -> u8 {
        self as u8
    }

    /// Returns the codec identified by `code`, or `None` if the code is unknown.
    pub(crate) fn from_code(code: u8) -> Option<Self> {
        if code == Self::CompactSpace.to_code() {
            Some(Self::CompactSpace)
        } else {
            None
        }
    }
}

/// Returns the correct codec reader wrapped in the `Arc` for the data.
///
/// The header is read from the front of `bytes`; the remaining bytes are handed to the
/// compact space decompressor, whose u128 output is mapped back to `T`.
///
/// # Errors
/// Returns an error if the header or the decompressor cannot be read from `bytes`.
///
/// # Panics
/// Asserts that the codec type stored in the header is `CompactSpace`.
pub fn open_u128_mapped<T: MonotonicallyMappableToU128 + Debug>(
    mut bytes: OwnedBytes,
) -> io::Result<Arc<dyn ColumnValues<T>>> {
    let header = U128Header::deserialize(&mut bytes)?;
    assert_eq!(header.codec_type, U128FastFieldCodecType::CompactSpace);
    let reader = CompactSpaceDecompressor::open(bytes)?;
    // Inverting the "T -> internal u128" mapping yields the "u128 -> T" mapping applied on read.
    let inverted: StrictlyMonotonicMappingInverter<StrictlyMonotonicMappingToInternal<T>> =
        StrictlyMonotonicMappingToInternal::<T>::new().into();
    Ok(Arc::new(monotonic_map_column(reader, inverted)))
}

/// Returns the u64 representation of the u128 data.
/// The internal representation of the data as u64 is useful for faster processing.
///
/// In order to convert to u128 back cast to `CompactSpaceU64Accessor` and call
/// `compact_to_u128`.
///
/// # Errors
/// Returns an error if the header or the accessor cannot be read from `bytes`.
///
/// # Panics
/// Asserts that the codec type stored in the header is `CompactSpace`.
///
/// # Notice
/// In case there are new codecs added, check for usages of `CompactSpaceDecompressorU64` and
/// also handle the new codecs.
pub fn open_u128_as_compact_u64(mut bytes: OwnedBytes) -> io::Result<Arc<dyn ColumnValues<u64>>> {
    let header = U128Header::deserialize(&mut bytes)?;
    assert_eq!(header.codec_type, U128FastFieldCodecType::CompactSpace);
    let reader = CompactSpaceU64Accessor::open(bytes)?;
    Ok(Arc::new(reader))
}

#[cfg(test)]
pub(crate) mod tests {
    use super::*;
    use crate::column_values::CodecType;
    use crate::column_values::u64_based::{
        ALL_U64_CODEC_TYPES, serialize_and_load_u64_based_column_values,
        serialize_u64_based_column_values,
    };

    /// A header must survive a serialize / deserialize round trip unchanged.
    #[test]
    fn test_serialize_deserialize_u128_header() {
        let original = U128Header {
            num_vals: 11,
            codec_type: U128FastFieldCodecType::CompactSpace,
        };
        let mut out = Vec::new();
        original.serialize(&mut out).unwrap();
        let restored = U128Header::deserialize(&mut &out[..]).unwrap();
        assert_eq!(restored, original);
    }

    /// Values written through the u64-based serializer must be read back identically.
    #[test]
    fn test_serialize_deserialize() {
        let original = [1u64, 5u64, 10u64];
        let restored: Vec<u64> =
            serialize_and_load_u64_based_column_values(&&original[..], &ALL_U64_CODEC_TYPES)
                .iter()
                .collect();
        assert_eq!(&restored, &original[..]);
    }

    /// Pins the serialized size of a two-value bool column.
    #[test]
    fn test_fastfield_bool_size_bitwidth_1() {
        let mut buffer = Vec::new();
        serialize_u64_based_column_values::<bool>(
            &&[false, true][..],
            &ALL_U64_CODEC_TYPES,
            &mut buffer,
        )
        .unwrap();
        // TODO put the header as a footer so that it serves as a padding.
        // 5 bytes of header, 1 byte of value.
        // NOTE(review): this comment used to also mention 7 bytes of padding, but the asserted
        // length below does not include any padding.
        assert_eq!(buffer.len(), 5 + 1);
    }

    /// Pins the serialized size of a bool column.
    ///
    /// NOTE(review): the input is the same `[false, true]` as in
    /// `test_fastfield_bool_size_bitwidth_1`, even though the name refers to a bit width of 0 --
    /// confirm this is intended.
    #[test]
    fn test_fastfield_bool_bit_size_bitwidth_0() {
        let mut buffer = Vec::new();
        serialize_u64_based_column_values::<bool>(
            &&[false, true][..],
            &ALL_U64_CODEC_TYPES,
            &mut buffer,
        )
        .unwrap();
        // The asserted length is 6 bytes in total.
        // NOTE(review): the previous comment described this as "6 bytes of header, 0 bytes of
        // value, 7 bytes of padding", which does not add up to the asserted length.
        assert_eq!(buffer.len(), 6);
    }

    /// Values that are all multiples of 1000 must be bitpacked after dividing by their gcd.
    #[test]
    fn test_fastfield_gcd() {
        let mut buffer = Vec::new();
        let vals: Vec<u64> = (0..80).map(|val| (val % 7) * 1_000u64).collect();
        serialize_u64_based_column_values(&&vals[..], &[CodecType::Bitpacked], &mut buffer)
            .unwrap();
        // Values are stored over 3 bits.
        assert_eq!(buffer.len(), 6 + (3 * 80 / 8));
    }
}


================================================
FILE: columnar/src/column_values/u64_based/bitpacked.rs
================================================
use std::io::{self, Write};
use std::num::NonZeroU64;
use std::ops::{Range, RangeInclusive};

use common::{BinarySerializable, OwnedBytes};
use fastdivide::DividerU64;
use tantivy_bitpacker::{BitPacker, BitUnpacker, compute_num_bits};

use crate::column_values::u64_based::{ColumnCodec, ColumnCodecEstimator, ColumnStats};
use crate::{ColumnValues, RowId};

/// Reader for a column encoded with the bitpacked codec.
///
/// A value is decoded as `stats.min_value + stats.gcd * bitpacked_value`.
#[derive(Clone)]
pub struct BitpackedReader {
    /// Bytes holding the bitpacked values (what remains once the stats have been read).
    data: OwnedBytes,
    /// Unpacker configured with the bit width derived from the column stats.
    bit_unpacker: BitUnpacker,
    /// Column statistics (min, max, gcd, number of rows) read from the front of the data.
    stats: ColumnStats,
}

/// Returns `n / q` rounded up to the next integer.
#[inline(always)]
const fn div_ceil(n: u64, q: NonZeroU64) -> u64 {
    // Mirrors the (then unstable) implementation of the rust standard library.
    let divisor = q.get();
    let quotient = n / divisor;
    if n % divisor == 0 {
        quotient
    } else {
        quotient + 1
    }
}

// The bitpacked codec applies a linear transformation `f` over data that are bitpacked.
// f is defined by:
// f: bitpacked -> stats.min_value + stats.gcd * bitpacked
//
// In order to run range queries, we invert the transformation.
// `transform_range_before_linear_transformation` returns the range of values
// [min_bitpacked_value..max_bitpacked_value] such that
// f(bitpacked) ∈ [min_value, max_value] <=> bitpacked ∈ [min_bitpacked_value, max_bitpacked_value]
//
// Returns `None` when no value of the column can possibly fall in `range`: either `range` is
// empty, or it lies entirely outside of `[stats.min_value, stats.max_value]`.
fn transform_range_before_linear_transformation(
    stats: &ColumnStats,
    range: RangeInclusive<u64>,
) -> Option<RangeInclusive<u64>> {
    if range.is_empty() {
        return None;
    }
    // A range lying entirely below the column minimum must be rejected here: the saturating
    // subtractions below would otherwise collapse it to `0..=0`, which wrongly matches every
    // row whose value is `stats.min_value`.
    if *range.end() < stats.min_value {
        return None;
    }
    // Symmetrically, nothing can match a range lying entirely above the column maximum.
    if *range.start() > stats.max_value {
        return None;
    }
    // The range start may still be below `min_value`, hence the saturating subtraction.
    let shifted_start = range.start().saturating_sub(stats.min_value);
    let shifted_end = range.end().saturating_sub(stats.min_value);
    // Round the start up and the end down, so that only multiples of the gcd that are inside
    // of the shifted range are kept.
    let start_before_gcd_multiplication: u64 = div_ceil(shifted_start, stats.gcd);
    let end_before_gcd_multiplication: u64 = shifted_end / stats.gcd;
    Some(start_before_gcd_multiplication..=end_before_gcd_multiplication)
}

impl ColumnValues for BitpackedReader {
    /// Decodes the value of row `doc`: `min_value + gcd * bitpacked_value`.
    #[inline(always)]
    fn get_val(&self, doc: u32) -> u64 {
        let bitpacked = self.bit_unpacker.get(doc, &self.data);
        self.stats.min_value + self.stats.gcd.get() * bitpacked
    }

    /// Smallest value of the column, as recorded in the stats.
    #[inline]
    fn min_value(&self) -> u64 {
        self.stats.min_value
    }

    /// Largest value of the column, as recorded in the stats.
    #[inline]
    fn max_value(&self) -> u64 {
        self.stats.max_value
    }

    /// Number of rows of the column, as recorded in the stats.
    #[inline]
    fn num_vals(&self) -> RowId {
        self.stats.num_rows
    }

    /// Collects into `positions` the rows of `doc_id_range` whose value is within `range`.
    ///
    /// The value range is first translated into the bitpacked space, so that the comparison
    /// can be delegated to the bit unpacker. If the translation yields no range, `positions`
    /// is cleared.
    fn get_row_ids_for_value_range(
        &self,
        range: RangeInclusive<u64>,
        doc_id_range: Range<u32>,
        positions: &mut Vec<u32>,
    ) {
        match transform_range_before_linear_transformation(&self.stats, range) {
            Some(bitpacked_range) => {
                self.bit_unpacker.get_ids_for_value_range(
                    bitpacked_range,
                    doc_id_range,
                    &self.data,
                    positions,
                );
            }
            None => {
                positions.clear();
            }
        }
    }
}

/// Number of bits needed per value: the bit width of the column amplitude once divided by the
/// gcd.
fn num_bits(stats: &ColumnStats) -> u8 {
    let reduced_amplitude = stats.amplitude() / stats.gcd;
    compute_num_bits(reduced_amplitude)
}

/// Estimator and serializer of the bitpacked codec.
///
/// It is stateless: everything it needs is derived from the column stats.
#[derive(Default)]
pub struct BitpackedCodecEstimator;

impl ColumnCodecEstimator for BitpackedCodecEstimator {
    /// Nothing to collect: the estimate only depends on the stats.
    fn collect(&mut self, _value: u64) {}

    /// Size of the stats plus the bitpacked values, rounded up to a whole number of bytes.
    fn estimate(&self, stats: &ColumnStats) -> Option<u64> {
        let bits_per_value = num_bits(stats) as u64;
        let total_bits = stats.num_rows as u64 * bits_per_value;
        Some(stats.num_bytes() + total_bits.div_ceil(8))
    }

    /// Writes the stats, followed by every value shifted by `min_value`, divided by the gcd
    /// and bitpacked.
    fn serialize(
        &self,
        stats: &ColumnStats,
        vals: &mut dyn Iterator<Item = u64>,
        wrt: &mut dyn Write,
    ) -> io::Result<()> {
        stats.serialize(wrt)?;
        let bit_width = num_bits(stats);
        let gcd_divider = DividerU64::divide_by(stats.gcd.get());
        let mut packer = BitPacker::new();
        for val in vals {
            let reduced_val = gcd_divider.divide(val - stats.min_value);
            packer.write(reduced_val, bit_width, wrt)?;
        }
        packer.close(wrt)?;
        Ok(())
    }
}

/// Codec storing every value bitpacked, after subtracting the minimum and dividing by the gcd.
pub struct BitpackedCodec;

impl ColumnCodec for BitpackedCodec {
    type ColumnValues = BitpackedReader;
    type Estimator = BitpackedCodecEstimator;

    /// Opens a fast field given a file.
    ///
    /// The stats are read from the front of `data`; the bit width is derived from them.
    fn load(mut data: OwnedBytes) -> io::Result<Self::ColumnValues> {
        let stats = ColumnStats::deserialize(&mut data)?;
        let bit_unpacker = BitUnpacker::new(num_bits(&stats));
        let reader = BitpackedReader {
            data,
            bit_unpacker,
            stats,
        };
        Ok(reader)
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::column_values::u64_based::tests::create_and_validate;

    /// Small data set without a common divisor.
    #[test]
    fn test_with_codec_data_sets_simple() {
        create_and_validate::<BitpackedCodec>(&[4, 3, 12], "name");
    }

    /// Small data set where every value is a multiple of 1000.
    #[test]
    fn test_with_codec_data_sets_simple_gcd() {
        create_and_validate::<BitpackedCodec>(&[1000, 2000, 3000], "name");
    }

    /// Runs the shared codec data sets, in their original and in reversed order.
    #[test]
    fn test_with_codec_data_sets() {
        let data_sets = crate::column_values::u64_based::tests::get_codec_test_datasets();
        for (mut data, name) in data_sets {
            create_and_validate::<BitpackedCodec>(&data, name);
            data.reverse();
            create_and_validate::<BitpackedCodec>(&data, name);
        }
    }

    /// Runs 500 random data sets of 1 to 256 values, in both orders.
    #[test]
    fn bitpacked_fast_field_rand() {
        for _ in 0..500 {
            let mut data = (0..1 + rand::random::<u8>() as usize)
                .map(|_| rand::random::<i64>() as u64 / 2)
                .collect::<Vec<_>>();
            create_and_validate::<BitpackedCodec>(&data, "rand");
            data.reverse();
            create_and_validate::<BitpackedCodec>(&data, "rand");
        }
    }
}


================================================
FILE: columnar/src/column_values/u64_based/blockwise_linear.rs
================================================
use std::io::Write;
use std::sync::Arc;
use std::{io, iter};

use common::{BinarySerializable, CountingWriter, DeserializeFrom, OwnedBytes};
use fastdivide::DividerU64;
use tantivy_bitpacker::{BitPacker, BitUnpacker, compute_num_bits};

use crate::MonotonicallyMappableToU64;
use crate::column_values::u64_based::line::Line;
use crate::column_values::u64_based::{ColumnCodec, ColumnCodecEstimator, ColumnStats};
use crate::column_values::{ColumnValues, VecColumn};

/// Number of values per block; each block gets its own line and its own bit width.
const BLOCK_SIZE: u32 = 512u32;

/// Metadata of one block of (at most) `BLOCK_SIZE` values.
#[derive(Debug, Default)]
struct Block {
    /// Line approximating the values of the block.
    line: Line,
    /// Unpacker for the bitpacked differences between the values and the line.
    bit_unpacker: BitUnpacker,
    /// Byte offset of the block's bitpacked values within the data section.
    /// It is not serialized: it is recomputed when the column is loaded.
    data_start_offset: usize,
}

impl BinarySerializable for Block {
    /// Writes the line followed by the bit width. `data_start_offset` is not written.
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        self.line.serialize(writer)?;
        let bit_width = self.bit_unpacker.bit_width();
        bit_width.serialize(writer)?;
        Ok(())
    }

    /// Reads the line and the bit width. `data_start_offset` is left at 0 and has to be
    /// filled in by the caller.
    fn deserialize<R: io::Read>(reader: &mut R) -> io::Result<Self> {
        let line = Line::deserialize(reader)?;
        let bit_unpacker = BitUnpacker::new(u8::deserialize(reader)?);
        Ok(Self {
            line,
            bit_unpacker,
            data_start_offset: 0,
        })
    }
}

/// Number of blocks of `BLOCK_SIZE` values needed to hold `num_vals` values (the last block
/// may be partially filled).
fn compute_num_blocks(num_vals: u32) -> u32 {
    num_vals.div_ceil(BLOCK_SIZE)
}

/// Estimator and serializer of the blockwise linear codec.
pub struct BlockwiseLinearEstimator {
    /// Values collected for the block currently being filled.
    block: Vec<u64>,
    /// Running estimate of the number of bytes taken by the bitpacked values.
    values_num_bytes: u64,
    /// Running estimate of the number of bytes taken by the per-block metadata.
    meta_num_bytes: u64,
}

impl Default for BlockwiseLinearEstimator {
    fn default() -> Self {
        Self {
            block: Vec::with_capacity(BLOCK_SIZE as usize),
            values_num_bytes: 0u64,
            meta_num_bytes: 0u64,
        }
    }
}

impl BlockwiseLinearEstimator {
    /// Adds the estimated size of the currently buffered block to the running totals.
    ///
    /// Does nothing if no value is buffered. The buffered values are left in place.
    fn flush_block_estimate(&mut self) {
        if self.block.is_empty() {
            return;
        }
        // The buffer is lent to a `VecColumn` to train the line, then taken back.
        let column = VecColumn::from(std::mem::take(&mut self.block));
        let line = Line::train(&column);
        self.block = column.into();

        // The largest difference to the line dictates the bit width of the block.
        let largest_diff = self
            .block
            .iter()
            .enumerate()
            .map(|(pos, val)| val.wrapping_sub(line.eval(pos as u32)))
            .max()
            .unwrap_or(0u64);
        let bit_width = compute_num_bits(largest_diff) as usize;
        let block_num_bits = bit_width * self.block.len();
        self.values_num_bytes += (block_num_bits + 7) as u64 / 8;
        // One byte for the bit width, plus the serialized line.
        self.meta_num_bytes += 1 + line.num_bytes();
    }
}

impl ColumnCodecEstimator for BlockwiseLinearEstimator {
    /// Buffers `value`. Once a full block of `BLOCK_SIZE` values has been buffered, its
    /// estimated size is added to the running totals and the buffer is emptied.
    fn collect(&mut self, value: u64) {
        self.block.push(value);
        if self.block.len() == BLOCK_SIZE as usize {
            self.flush_block_estimate();
            self.block.clear();
        }
    }
    /// Estimated serialized size in bytes.
    ///
    /// The blocks were estimated on raw values, whereas `serialize` divides the values by the
    /// gcd first: the estimated gain of that division is subtracted here.
    fn estimate(&self, stats: &ColumnStats) -> Option<u64> {
        // The constant 4 presumably accounts for the `u32` footer length written at the very
        // end by `serialize`.
        let mut estimate = 4 + stats.num_bytes() + self.meta_num_bytes + self.values_num_bytes;
        if stats.gcd.get() > 1 {
            // Roughly `floor(log2(gcd))` bits saved per row, converted to bytes.
            let estimate_gain_from_gcd =
                (stats.gcd.get() as f32).log2().floor() * stats.num_rows as f32 / 8.0f32;
            estimate = estimate.saturating_sub(estimate_gain_from_gcd as u64);
        }
        Some(estimate)
    }

    /// Accounts for the last, possibly partially filled, block.
    fn finalize(&mut self) {
        self.flush_block_estimate();
    }

    /// Serializes the column.
    ///
    /// Layout, in order: the stats, the bitpacked values of all of the blocks, the metadata
    /// (line and bit width) of every block, and finally the byte length of that metadata as
    /// a `u32`.
    ///
    /// # Panics
    /// Panics if `vals` yields fewer values than announced by `stats.num_rows` in such a way
    /// that a block ends up empty.
    fn serialize(
        &self,
        stats: &ColumnStats,
        mut vals: &mut dyn Iterator<Item = u64>,
        wrt: &mut dyn Write,
    ) -> io::Result<()> {
        stats.serialize(wrt)?;
        let mut buffer = Vec::with_capacity(BLOCK_SIZE as usize);
        let num_blocks = compute_num_blocks(stats.num_rows) as usize;
        let mut blocks = Vec::with_capacity(num_blocks);

        let mut bit_packer = BitPacker::new();

        let gcd_divider = DividerU64::divide_by(stats.gcd.get());

        for _ in 0..num_blocks {
            // Pull the values of the next block (fewer than `BLOCK_SIZE` for the last one).
            buffer.clear();
            buffer.extend(
                (&mut vals)
                    .map(MonotonicallyMappableToU64::to_u64)
                    .take(BLOCK_SIZE as usize),
            );

            // Normalize: shift by the column minimum, then divide by the gcd.
            for buffer_val in buffer.iter_mut() {
                *buffer_val = gcd_divider.divide(*buffer_val - stats.min_value);
            }

            let line = Line::train(&VecColumn::from(buffer.to_vec()));

            assert!(!buffer.is_empty());

            // Only the (wrapping) difference to the line is stored.
            for (i, buffer_val) in buffer.iter_mut().enumerate() {
                let interpolated_val = line.eval(i as u32);
                *buffer_val = buffer_val.wrapping_sub(interpolated_val);
            }

            // The block is not empty (asserted above), so `max()` always returns a value.
            let bit_width = buffer.iter().copied().map(compute_num_bits).max().unwrap();

            for &buffer_val in &buffer {
                bit_packer.write(buffer_val, bit_width, wrt)?;
            }

            // `data_start_offset` is not serialized, it is recomputed when loading.
            blocks.push(Block {
                line,
                bit_unpacker: BitUnpacker::new(bit_width),
                data_start_offset: 0,
            });
        }

        bit_packer.close(wrt)?;

        assert_eq!(blocks.len(), num_blocks);

        // The footer: the metadata of every block, followed by its own length in bytes. The
        // length is captured before being written, so it does not count itself.
        let mut counting_wrt = CountingWriter::wrap(wrt);
        for block in &blocks {
            block.serialize(&mut counting_wrt)?;
        }
        let footer_len = counting_wrt.written_bytes();
        (footer_len as u32).serialize(&mut counting_wrt)?;

        Ok(())
    }
}

/// Codec splitting the column into blocks of `BLOCK_SIZE` values, each approximated by its
/// own line; only the bitpacked differences to that line are stored.
pub struct BlockwiseLinearCodec;

impl ColumnCodec<u64> for BlockwiseLinearCodec {
    type ColumnValues = BlockwiseLinearReader;

    type Estimator = BlockwiseLinearEstimator;

    /// Opens a column serialized by `BlockwiseLinearEstimator::serialize`.
    ///
    /// # Panics
    /// NOTE(review): the footer arithmetic below is unchecked. Data shorter than 4 bytes
    /// after the stats, or a footer length larger than the available data, presumably leads
    /// to a panic rather than to an `io::Error` -- confirm whether corrupted data has to be
    /// supported here.
    fn load(mut bytes: OwnedBytes) -> io::Result<Self::ColumnValues> {
        let stats = ColumnStats::deserialize(&mut bytes)?;
        // The last 4 bytes hold the length of the footer (the per-block metadata).
        let footer_len: u32 = (&bytes[bytes.len() - 4..]).deserialize()?;
        let footer_offset = bytes.len() - 4 - footer_len as usize;
        let (data, mut footer) = bytes.split(footer_offset);
        let num_blocks = compute_num_blocks(stats.num_rows);
        let mut blocks: Vec<Block> = iter::repeat_with(|| Block::deserialize(&mut footer))
            .take(num_blocks as usize)
            .collect::<io::Result<_>>()?;
        // Rebuild the start offset of every block: a block is accounted for as `BLOCK_SIZE`
        // values of `bit_width` bits each.
        let mut start_offset = 0;
        for block in &mut blocks {
            block.data_start_offset = start_offset;
            start_offset += (block.bit_unpacker.bit_width() as usize) * BLOCK_SIZE as usize / 8;
        }
        Ok(BlockwiseLinearReader {
            blocks: blocks.into_boxed_slice().into(),
            data,
            stats,
        })
    }
}

/// Reader for a column encoded with the blockwise linear codec.
#[derive(Clone)]
pub struct BlockwiseLinearReader {
    /// Metadata (line, bit width, data offset) of every block, shared between clones.
    blocks: Arc<[Block]>,
    /// Bitpacked values of all of the blocks.
    data: OwnedBytes,
    /// Column statistics read from the front of the serialized column.
    stats: ColumnStats,
}

impl ColumnValues for BlockwiseLinearReader {
    /// Decodes the value of row `idx`.
    ///
    /// The line of the block is evaluated at the position of the row within the block, the
    /// bitpacked difference is added to it, and the normalization is undone:
    /// `min_value + gcd * (line + difference)`.
    #[inline(always)]
    fn get_val(&self, idx: u32) -> u64 {
        let pos_in_block = idx % BLOCK_SIZE;
        let block = &self.blocks[(idx / BLOCK_SIZE) as usize];
        let predicted: u64 = block.line.eval(pos_in_block);
        let block_data = &self.data[block.data_start_offset..];
        let stored_diff = block.bit_unpacker.get(pos_in_block, block_data);
        // TODO optimize me! the line parameters could be tweaked to include the multiplication and
        // remove the dependency.
        let normalized_val = predicted.wrapping_add(stored_diff);
        let gcd = self.stats.gcd.get();
        self.stats.min_value + gcd.wrapping_mul(normalized_val)
    }

    /// Smallest value of the column, as recorded in the stats.
    #[inline(always)]
    fn min_value(&self) -> u64 {
        self.stats.min_value
    }

    /// Largest value of the column, as recorded in the stats.
    #[inline(always)]
    fn max_value(&self) -> u64 {
        self.stats.max_value
    }

    /// Number of rows of the column, as recorded in the stats.
    #[inline(always)]
    fn num_vals(&self) -> u32 {
        self.stats.num_rows
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::column_values::u64_based::tests::create_and_validate;

    /// Small data set without a common divisor; the codec is expected to be applicable.
    #[test]
    fn test_with_codec_data_sets_simple() {
        create_and_validate::<BlockwiseLinearCodec>(
            &[11, 20, 40, 20, 10, 10, 10, 10, 10, 10],
            "simple test",
        )
        .unwrap();
    }

    /// Small data set where every value is a multiple of 10; pins the compression rate.
    #[test]
    fn test_with_codec_data_sets_simple_gcd() {
        let (_, actual_compression_rate) = create_and_validate::<BlockwiseLinearCodec>(
            &[10, 20, 40, 20, 10, 10, 10, 10, 10, 10],
            "name",
        )
        .unwrap();
        assert_eq!(actual_compression_rate, 0.175);
    }

    /// Runs the shared codec data sets, in their original and in reversed order.
    #[test]
    fn test_with_codec_data_sets() {
        let data_sets = crate::column_values::u64_based::tests::get_codec_test_datasets();
        for (mut data, name) in data_sets {
            create_and_validate::<BlockwiseLinearCodec>(&data, name);
            data.reverse();
            create_and_validate::<BlockwiseLinearCodec>(&data, name);
        }
    }

    /// Runs 500 random data sets of 1 to 256 values, in both orders.
    #[test]
    fn test_blockwise_linear_fast_field_rand() {
        for _ in 0..500 {
            let mut data = (0..1 + rand::random::<u8>() as usize)
                .map(|_| rand::random::<i64>() as u64 / 2)
                .collect::<Vec<_>>();
            create_and_validate::<BlockwiseLinearCodec>(&data, "rand");
            data.reverse();
            create_and_validate::<BlockwiseLinearCodec>(&data, "rand");
        }
    }
}


================================================
FILE: columnar/src/column_values/u64_based/line.rs
================================================
use std::io;
use std::num::NonZeroU32;

use common::{BinarySerializable, VInt};

use crate::column_values::ColumnValues;

/// Offset (`2^32 - 1`) subtracted from the first value in `Line::train_from` to build the
/// translation used when picking the intercept.
///
/// NOTE(review): a comment in `Line::train_from` describes the translation as `y0 - 2^63`,
/// which does not match this value -- confirm which one is intended.
const MID_POINT: u64 = (1u64 << 32) - 1u64;

/// `Line` describes a line function `y = ax + b` using integer
/// arithmetic.
///
/// The slope is in fact a decimal number, split into a 32-bit integer part
/// and a 32-bit fractional part (fixed point).
///
/// The multiplication then becomes:
/// `y = ((m * x) >> 32) + b`
///
/// All of the operations are wrapping.
#[derive(Debug, Clone, Copy, Default)]
pub struct Line {
    /// Fixed-point slope: the upper 32 bits are the integer part, the lower 32 bits the
    /// fractional part.
    pub(crate) slope: u64,
    /// Value of the line at `x = 0`.
    pub(crate) intercept: u64,
}

/// Computes the fixed-point slope of the line going from `y0` to `y1` in `num_vals` steps.
///
/// The difference between `y1` and `y0` is interpreted in wrapping arithmetic, which makes
/// the function invariant by translation:
/// `
///   compute_slope(y0, y1)
/// = compute_slope(y0 + X % 2^64, y1 + X % 2^64)
/// `
///
/// Returns 0 if the absolute difference does not fit in 32 bits.
fn compute_slope(y0: u64, y1: u64, num_vals: NonZeroU32) -> u64 {
    // Largest absolute difference (exclusive) that can be shifted by 32 bits without
    // overflowing.
    const ABS_DY_LIMIT: u64 = 1 << 32;

    let forward_delta = y1.wrapping_sub(y0);
    // A wrapping difference in the lower half of the space is seen as an increase.
    let is_increasing = forward_delta <= (1 << 63);
    let abs_dy = if is_increasing {
        forward_delta
    } else {
        y0.wrapping_sub(y1)
    };
    if abs_dy >= ABS_DY_LIMIT {
        // This is outside of the realm we handle: bail out with a flat line.
        return 0u64;
    }

    let num_steps = num_vals.get() as u64;
    let abs_slope = (abs_dy << 32) / num_steps;
    if is_increasing {
        return abs_slope;
    }
    // The complement does indeed create the opposite, decreasing, slope...
    //
    // Intuitively (without the bitshifts and % u64::MAX)
    // ```
    //    (x + shift)*(u64::MAX - abs_slope)
    // -  (x * (u64::MAX - abs_slope))
    // = - shift * abs_slope
    // ```
    u64::MAX - abs_slope
}

impl Line {
    /// Evaluates the line at `x`, in wrapping arithmetic.
    #[inline(always)]
    pub fn eval(&self, x: u32) -> u64 {
        let scaled = (x as u64).wrapping_mul(self.slope);
        // Dropping the 32 fractional bits leaves a 32-bit value, which is sign-extended so
        // that decreasing slopes yield (wrapping) negative offsets.
        let linear_part = (scaled >> 32) as i32 as u64;
        self.intercept.wrapping_add(linear_part)
    }

    /// Trains a line from the first value, the last value and the number of values.
    ///
    /// The slope only depends on `first_val`, `last_val` and `num_vals`. The intercept is
    /// only computed from the provided positions and values.
    ///
    /// Returns the default line if `num_vals` is 1.
    pub fn train_from(
        first_val: u64,
        last_val: u64,
        num_vals: u32,
        positions_and_values: impl Iterator<Item = (u64, u64)>,
    ) -> Self {
        let Some(idx_last_val) = NonZeroU32::new(num_vals - 1) else {
            return Line::default();
        };

        // We first independently pick our slope.
        let slope = compute_slope(first_val, last_val, idx_last_val);

        // The slope is picked. Note that it does not have to be perfect.
        // What is left is to compute the best intercept.
        //
        // Intuitively, the best intercept is such that the line passes through one of the
        // `(i, ys[i])`.
        //
        // The best intercept therefore has the form
        // `ys[i] - line.eval(i)` (using wrapping arithmetic), where `line` has the slope picked
        // above and a null intercept. Our task is just to pick the candidate that minimizes
        // our error.
        //
        // Without sorting our values, this is a difficult problem.
        // We however rely on the following trick...
        //
        // We only focus on the case where the interpolation is half decent.
        // If the line interpolation is doing its job on a dataset suited for it,
        // we can hope that the maximum error won't be larger than `u64::MAX / 2`.
        //
        // In other words, even without the intercept, the candidates will all be within an
        // interval that takes less than half of the modulo space of `u64`.
        //
        // Our task is therefore to identify this interval.
        // Here we simply translate all of the candidates by `first_val - MID_POINT` and pick
        // the min.
        let slope_only = Line {
            slope,
            intercept: 0,
        };
        let heuristic_shift = first_val.wrapping_sub(MID_POINT);
        let intercept = positions_and_values
            .map(|(pos, y)| y.wrapping_sub(slope_only.eval(pos as u32)))
            .min_by_key(|&candidate| candidate.wrapping_sub(heuristic_shift))
            .unwrap_or(0u64); //< Never happens.
        Line { slope, intercept }
    }

    /// Returns a line that attempts to approximate a function
    /// f: i in 0..[ys.num_vals()) -> ys[i].
    ///
    /// - The approximation is always lower than the actual value. Or more rigorously, formally
    ///   `f(i).wrapping_sub(ys[i])` is small for any i in [0..ys.len()).
    /// - It computes without panicking for any value of it.
    ///
    /// This function is only invariable by translation if all of the
    /// `ys` are packaged into half of the space. (See the heuristic in `train_from`)
    /// TODO USE array
    pub fn train(ys: &dyn ColumnValues) -> Self {
        let num_vals = ys.num_vals();
        let first_val = ys.iter().next().unwrap();
        let last_val = ys.iter().nth(num_vals as usize - 1).unwrap();
        let positions_and_values = ys.iter().enumerate().map(|(pos, val)| (pos as u64, val));
        Self::train_from(first_val, last_val, num_vals, positions_and_values)
    }
}

impl BinarySerializable for Line {
    fn serialize<W: io::Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        VInt(self.slope).serialize(writer)?;
        VInt(self.intercept).serialize(writer)?;
        Ok(())
    }

    fn deserialize<R: io::Read>(reader: &mut R) -> io::Result<Self> {
        let slope = VInt::deserialize(reader)?.0;
        let intercept = VInt::deserialize(reader)?.0;
        Ok(Line { slope, intercept })
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::column_values::VecColumn;

    /// Test training a line and ensuring that the maximum difference between
    /// the data points and the line is `expected`.
    ///
    /// This function operates translation over the data for better coverage: a few fixed
    /// translations, plus every value of `ys` itself.
    #[track_caller]
    fn test_line_interpol_with_translation(ys: &[u64], expected: Option<u64>) {
        let mut translations = vec![0, 100, u64::MAX / 2, u64::MAX, u64::MAX - 1];
        translations.extend_from_slice(ys);
        for translation in translations {
            let translated_ys: Vec<u64> = ys
                .iter()
                .copied()
                .map(|y| y.wrapping_add(translation))
                .collect();
            let largest_err = test_eval_max_err(&translated_ys);
            assert_eq!(largest_err, expected);
        }
    }

    /// Trains a line on `ys` and returns the largest (wrapping) difference between a value
    /// and the line, or `None` if `ys` is empty.
    fn test_eval_max_err(ys: &[u64]) -> Option<u64> {
        let line = Line::train(&VecColumn::from(ys.to_vec()));
        ys.iter()
            .enumerate()
            .map(|(x, y)| y.wrapping_sub(line.eval(x as u32)))
            .max()
    }

    #[test]
    fn test_train() {
        test_line_interpol_with_translation(&[11, 11, 11, 12, 12, 13], Some(1));
        test_line_interpol_with_translation(&[13, 12, 12, 11, 11, 11], Some(1));
        // NOTE(review): the two following cases are identical.
        test_line_interpol_with_translation(&[13, 13, 12, 11, 11, 11], Some(1));
        test_line_interpol_with_translation(&[13, 13, 12, 11, 11, 11], Some(1));
        // Data wrapping around `u64::MAX`.
        test_line_interpol_with_translation(&[u64::MAX - 1, 0, 0, 1], Some(1));
        test_line_interpol_with_translation(&[u64::MAX - 1, u64::MAX, 0, 1], Some(0));
        test_line_interpol_with_translation(&[0, 1, 2, 3, 5], Some(0));
        test_line_interpol_with_translation(&[1, 2, 3, 4], Some(0));

        // Perfectly linear data must be interpolated without any error.
        let data: Vec<u64> = (0..255).collect();
        test_line_interpol_with_translation(&data, Some(0));
        let data: Vec<u64> = (0..255).map(|el| el * 2).collect();
        test_line_interpol_with_translation(&data, Some(0));
    }
}


================================================
FILE: columnar/src/column_values/u64_based/linear.rs
================================================
use std::io;

use common::{BinarySerializable, OwnedBytes};
use tantivy_bitpacker::{BitPacker, BitUnpacker, compute_num_bits};

use super::ColumnValues;
use super::line::Line;
use crate::RowId;
use crate::column_values::VecColumn;
use crate::column_values::u64_based::{ColumnCodec, ColumnCodecEstimator, ColumnStats};

/// Half of the `u64` space. Deviations from the line are shifted by this amount while they
/// are collected, and the shift is undone on the intercept in `finalize`.
const HALF_SPACE: u64 = u64::MAX / 2;
/// Number of values buffered by the estimator before the line gets trained.
const LINE_ESTIMATION_BLOCK_LEN: usize = 512;

/// Reader for a column encoded with the linear codec.
///
/// A value is decoded as the line evaluated at the row id, plus a bitpacked difference.
#[derive(Clone)]
pub struct LinearReader {
    /// Bitpacked differences (what remains once the stats and the parameters have been read).
    data: OwnedBytes,
    /// The line, and the unpacker for the differences.
    linear_params: LinearParams,
    /// Column statistics read from the front of the serialized column.
    stats: ColumnStats,
}

impl ColumnValues for LinearReader {
    #[inline]
    fn get_val(&self, doc: u32) -> u64 {
        let interpoled_val: u64 = self.linear_params.line.eval(doc);
        let bitpacked_diff = self.linear_params.bit_unpacker.get(doc, &self.data);
        interpoled_val.wrapping_add(bitpacked_diff)
    }

    #[inline(always)]
    fn min_value(&self) -> u64 {
        self.stats.min_value
    }

    #[inline(always)]
    fn max_value(&self) -> u64 {
        self.stats.max_value
    }

    #[inline]
    fn num_vals(&self) -> u32 {
        self.stats.num_rows
    }
}

/// Fastfield codec which tries to guess values by linear interpolation
/// and stores the difference bitpacked.
///
/// A single line is used for the whole column.
pub struct LinearCodec;

/// Parameters of the linear codec, serialized right after the column stats.
#[derive(Debug, Clone)]
struct LinearParams {
    /// Line approximating the values of the column.
    line: Line,
    /// Unpacker for the bitpacked differences; only its bit width is serialized.
    bit_unpacker: BitUnpacker,
}

impl BinarySerializable for LinearParams {
    fn serialize<W: io::Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        self.line.serialize(writer)?;
        self.bit_unpacker.bit_width().serialize(writer)?;
        Ok(())
    }

    fn deserialize<R: io::Read>(reader: &mut R) -> io::Result<Self> {
        let line = Line::deserialize(reader)?;
        let bit_width = u8::deserialize(reader)?;
        Ok(Self {
            line,
            bit_unpacker: BitUnpacker::new(bit_width),
        })
    }
}

/// Estimator and serializer of the linear codec.
///
/// The first `LINE_ESTIMATION_BLOCK_LEN` values are buffered to train the line. Once the line
/// is known, only the smallest and largest deviations from it are tracked.
pub struct LinearCodecEstimator {
    /// Values buffered until the line gets trained.
    block: Vec<u64>,
    /// The trained line, or `None` as long as too few values have been collected.
    line: Option<Line>,
    /// Number of values compared against the line so far (i.e. the next row id).
    row_id: RowId,
    /// Smallest deviation observed (deviations are shifted by `HALF_SPACE`).
    min_deviation: u64,
    /// Largest deviation observed (deviations are shifted by `HALF_SPACE`).
    max_deviation: u64,
    /// First value compared against the line.
    first_val: u64,
    /// Last value compared against the line.
    last_val: u64,
}

impl Default for LinearCodecEstimator {
    /// Creates an estimator with no line trained yet.
    ///
    /// The deviation bounds start inverted (`min` at `u64::MAX`, `max` at `u64::MIN`), so
    /// that the first observed deviation replaces both of them.
    fn default() -> LinearCodecEstimator {
        let block = Vec::with_capacity(LINE_ESTIMATION_BLOCK_LEN);
        Self {
            block,
            line: None,
            row_id: 0,
            min_deviation: u64::MAX,
            max_deviation: u64::MIN,
            first_val: 0,
            last_val: 0,
        }
    }
}

impl ColumnCodecEstimator for LinearCodecEstimator {
    /// Moves the intercept of the line so that the smallest observed deviation maps to 0:
    /// the `HALF_SPACE` shift applied while collecting is undone at the same time.
    ///
    /// Does nothing if no line was trained.
    fn finalize(&mut self) {
        if let Some(line) = self.line.as_mut() {
            line.intercept = line
                .intercept
                .wrapping_add(self.min_deviation)
                .wrapping_sub(HALF_SPACE);
        }
    }

    /// Estimated serialized size in bytes: the stats, the parameters, and the bitpacked
    /// differences.
    ///
    /// Returns `None` if no line was trained, i.e. if fewer than `LINE_ESTIMATION_BLOCK_LEN`
    /// values were collected.
    fn estimate(&self, stats: &ColumnStats) -> Option<u64> {
        let line = self.line?;
        // The spread of the deviations dictates the number of bits needed per value.
        let amplitude = self.max_deviation - self.min_deviation;
        let num_bits = compute_num_bits(amplitude);
        let linear_params = LinearParams {
            line,
            bit_unpacker: BitUnpacker::new(num_bits),
        };
        Some(
            stats.num_bytes()
                + linear_params.num_bytes()
                + (num_bits as u64 * stats.num_rows as u64).div_ceil(8),
        )
    }

    /// Serializes the column: the stats, the parameters (line and bit width), then for every
    /// value its (wrapping) difference to the line, bitpacked.
    ///
    /// # Panics
    /// Panics if no line was trained (see `estimate`, which returns `None` in that case).
    fn serialize(
        &self,
        stats: &ColumnStats,
        vals: &mut dyn Iterator<Item = u64>,
        wrt: &mut dyn io::Write,
    ) -> io::Result<()> {
        stats.serialize(wrt)?;
        let line = self.line.unwrap();
        let amplitude = self.max_deviation - self.min_deviation;
        let num_bits = compute_num_bits(amplitude);
        let linear_params = LinearParams {
            line,
            bit_unpacker: BitUnpacker::new(num_bits),
        };
        linear_params.serialize(wrt)?;
        let mut bit_packer = BitPacker::new();
        for (pos, value) in vals.enumerate() {
            let calculated_value = line.eval(pos as u32);
            let offset = value.wrapping_sub(calculated_value);
            bit_packer.write(offset, num_bits, wrt)?;
        }
        bit_packer.close(wrt)?;
        Ok(())
    }

    /// Collects one value: it is buffered as long as the line is not trained, and compared
    /// against the line afterwards.
    fn collect(&mut self, value: u64) {
        if let Some(line) = self.line {
            self.collect_after_line_estimation(&line, value);
        } else {
            self.collect_before_line_estimation(value);
        }
    }
}

impl LinearCodecEstimator {
    /// Compares `value` (the value of row `self.row_id`) against `line` and updates the
    /// deviation bounds, then moves on to the next row.
    #[inline]
    fn collect_after_line_estimation(&mut self, line: &Line, value: u64) {
        let interpoled_val: u64 = line.eval(self.row_id);
        // The deviation is shifted by `HALF_SPACE`, so that values slightly below the line do
        // not wrap around to huge numbers when tracking the min and the max.
        let deviation = value.wrapping_add(HALF_SPACE).wrapping_sub(interpoled_val);
        self.min_deviation = self.min_deviation.min(deviation);
        self.max_deviation = self.max_deviation.max(deviation);
        if self.row_id == 0 {
            self.first_val = value;
        }
        self.last_val = value;
        self.row_id += 1u32;
    }

    /// Buffers `value`. Once `LINE_ESTIMATION_BLOCK_LEN` values are buffered, the line is
    /// trained on them and all of them are replayed against it.
    #[inline]
    fn collect_before_line_estimation(&mut self, value: u64) {
        self.block.push(value);
        if self.block.len() == LINE_ESTIMATION_BLOCK_LEN {
            // The buffer is lent to a `VecColumn` to train the line, then taken back.
            let column = VecColumn::from(std::mem::take(&mut self.block));
            let line = Line::train(&column);
            self.block = column.into();
            // Taking the buffer out leaves `self.block` empty from now on.
            let block = std::mem::take(&mut self.block);
            for val in block {
                self.collect_after_line_estimation(&line, val);
            }
            self.line = Some(line);
        }
    }
}

impl ColumnCodec for LinearCodec {
    type ColumnValues = LinearReader;

    type Estimator = LinearCodecEstimator;

    /// Opens a column serialized with the linear codec.
    ///
    /// The column stats and then the linear parameters are read from the front of `data`;
    /// the `data` handle, as left by those two reads, is handed to the reader.
    ///
    /// # Errors
    /// Returns the error of whichever deserialization step fails first.
    fn load(mut data: OwnedBytes) -> io::Result<Self::ColumnValues> {
        let column_stats = ColumnStats::deserialize(&mut data)?;
        let params = LinearParams::deserialize(&mut data)?;
        let reader = LinearReader {
            stats: column_stats,
            linear_params: params,
            data,
        };
        Ok(reader)
    }
}

#[cfg(test)]
mod tests {
    use rand::RngCore;

    use super::*;
    use crate::column_values::u64_based::tests::{create_and_validate, get_codec_test_datasets};

    /// Round-trips exactly `LINE_ESTIMATION_BLOCK_LEN` consecutive values starting at 100.
    #[test]
    fn test_compression_simple() {
        let vals: Vec<u64> = (100u64..)
            .take(super::LINE_ESTIMATION_BLOCK_LEN)
            .collect();
        create_and_validate::<LinearCodec>(&vals, "simple monotonically large").unwrap();
    }

    /// Checks both the estimated and the actual compression rate on a consecutive range.
    #[test]
    fn test_compression() {
        let data: Vec<u64> = (10..=6_000_u64).collect();
        let rates = create_and_validate::<LinearCodec>(&data, "simple monotonically large");
        let (estimate, actual_compression) = rates.unwrap();
        assert_le!(actual_compression, 0.001);
        assert_le!(estimate, 0.02);
    }

    /// Round-trips every shared dataset, in its original and in its reversed order.
    #[test]
    fn test_with_codec_datasets() {
        for (mut data, name) in get_codec_test_datasets() {
            create_and_validate::<LinearCodec>(&data, name);
            data.reverse();
            create_and_validate::<LinearCodec>(&data, name);
        }
    }

    #[test]
    fn linear_interpol_fast_field_test_large_amplitude() {
        let half = i64::MAX as u64 / 2;
        let third = i64::MAX as u64 / 3;
        let data = [half, third, half];
        create_and_validate::<LinearCodec>(&data, "large amplitude");
    }

    #[test]
    fn overflow_error_test() {
        let data: [u64; 4] = [1572656989877777, 1170935903116329, 720575940379279, 0];
        create_and_validate::<LinearCodec>(&data, "overflow test");
    }

    #[test]
    fn linear_interpol_fast_concave_data() {
        let data: [u64; 8] = [0, 1, 2, 5, 8, 10, 20, 50];
        create_and_validate::<LinearCodec>(&data, "concave data");
    }

    #[test]
    fn linear_interpol_fast_convex_data() {
        let data: [u64; 6] = [0, 40, 60, 70, 75, 77];
        create_and_validate::<LinearCodec>(&data, "convex data");
    }

    #[test]
    fn linear_interpol_fast_field_test_simple() {
        let data: Vec<u64> = (10..=20_u64).collect();
        create_and_validate::<LinearCodec>(&data, "simple monotonically");
    }

    /// Round-trips 50 batches of 10 000 random values, each batch in both orders.
    #[test]
    fn linear_interpol_fast_field_rand() {
        let mut rng = rand::rng();
        for _ in 0..50 {
            let mut data: Vec<u64> = std::iter::repeat_with(|| rng.next_u64())
                .take(10_000)
                .collect();
            create_and_validate::<LinearCodec>(&data, "random");
            data.reverse();
            create_and_validate::<LinearCodec>(&data, "random");
        }
    }
}


================================================
FILE: columnar/src/column_values/u64_based/mod.rs
================================================
mod bitpacked;
mod blockwise_linear;
mod line;
mod linear;
mod stats_collector;

use std::io;
use std::io::Write;
use std::sync::Arc;

use common::{BinarySerializable, OwnedBytes};

use crate::column_values::monotonic_mapping::{
    StrictlyMonotonicMappingInverter, StrictlyMonotonicMappingToInternal,
};
pub use crate::column_values::u64_based::bitpacked::BitpackedCodec;
pub use crate::column_values::u64_based::blockwise_linear::BlockwiseLinearCodec;
pub use crate::column_values::u64_based::linear::LinearCodec;
pub use crate::column_values::u64_based::stats_collector::StatsCollector;
use crate::column_values::{ColumnStats, monotonic_map_column};
use crate::iterable::Iterable;
use crate::{ColumnValues, MonotonicallyMappableToU64};

/// A `ColumnCodecEstimator` is in charge of gathering all
/// data required to serialize a column.
///
/// This happens during a first pass over the elements of the column.
/// During that pass, every column estimator receives a call to its
/// `.collect(el)` for each element.
///
/// After this first pass, `.finalize()` is called.
/// `.estimate(..)` should then return an accurate estimation of the
/// size of the serialized column (were we to pick this codec).
/// `.serialize(..)` then serializes the column using this codec.
pub trait ColumnCodecEstimator<T = u64>: 'static {
    /// Records a new value for estimation.
    /// This method will be called for each element of the column during
    /// `estimation`.
    ///
    /// Note that the value is always received as a `u64`, regardless of `T`.
    fn collect(&mut self, value: u64);
    /// Finalizes the first pass phase.
    ///
    /// The default implementation does nothing.
    fn finalize(&mut self) {}
    /// Returns an accurate estimation of the number of bytes that will
    /// be used to represent this column.
    ///
    /// An estimator that returns `None` is not considered when
    /// `serialize_u64_based_column_values` picks the codec to use.
    fn estimate(&self, stats: &ColumnStats) -> Option<u64>;
    /// Serializes the column using the given codec.
    /// This constitutes a second pass over the columns values.
    ///
    /// `stats` are the column statistics, `vals` yields the values to write and
    /// `wrt` is the output the serialized column is written to.
    fn serialize(
        &self,
        stats: &ColumnStats,
        vals: &mut dyn Iterator<Item = T>,
        wrt: &mut dyn io::Write,
    ) -> io::Result<()>;
}

/// A column codec describes a column serialization format.
///
/// It ties together the reader type used to access a serialized column
/// (`ColumnValues`) and the estimator used to size and write it (`Estimator`).
pub trait ColumnCodec<T: PartialOrd = u64> {
    /// Specialized `ColumnValues` type.
    type ColumnValues: ColumnValues<T> + 'static;
    /// `Estimator` for the given codec.
    type Estimator: ColumnCodecEstimator + Default;

    /// Loads a column that has been serialized using this codec.
    fn load(bytes: OwnedBytes) -> io::Result<Self::ColumnValues>;

    /// Returns an estimator.
    ///
    /// The default implementation returns `Self::Estimator::default()`.
    fn estimator() -> Self::Estimator {
        Self::Estimator::default()
    }

    /// Returns a boxed estimator.
    ///
    /// The default implementation boxes the result of [`ColumnCodec::estimator`].
    fn boxed_estimator() -> Box<dyn ColumnCodecEstimator> {
        Box::new(Self::estimator())
    }
}

/// Available codecs to use to encode the u64 (via [`MonotonicallyMappableToU64`]) converted data.
///
/// The `u8` discriminant of each variant is the code written as the first byte of a
/// serialized column and read back when loading it, so existing values must not change.
#[derive(PartialEq, Eq, PartialOrd, Ord, Debug, Clone, Copy)]
#[repr(u8)]
pub enum CodecType {
    /// Bitpack all values in the value range. The number of bits is defined by the amplitude
    /// `column.max_value() - column.min_value()`
    Bitpacked = 0u8,
    /// Linear interpolation puts a line between the first and last value and then bitpacks the
    /// values by the offset from the line. The number of bits is defined by the max deviation from
    /// the line.
    Linear = 1u8,
    /// Same as [`CodecType::Linear`], but encodes in blocks of 512 elements.
    BlockwiseLinear = 2u8,
}

/// List of all available u64-based codecs.
///
/// Contains every variant of [`CodecType`], ordered by increasing code.
pub const ALL_U64_CODEC_TYPES: [CodecType; 3] = [
    CodecType::Bitpacked,
    CodecType::Linear,
    CodecType::BlockwiseLinear,
];

impl CodecType {
    /// Returns the one-byte code identifying this codec (its enum discriminant).
    fn to_code(self) -> u8 {
        self as u8
    }

    /// Maps a one-byte code back to its codec, or `None` if the code is unknown.
    fn try_from_code(code: u8) -> Option<CodecType> {
        let codec_type = match code {
            0u8 => CodecType::Bitpacked,
            1u8 => CodecType::Linear,
            2u8 => CodecType::BlockwiseLinear,
            _ => return None,
        };
        Some(codec_type)
    }

    /// Opens `bytes` with the reader of this codec and exposes the values as `T`.
    ///
    /// `bytes` must not include the leading codec code byte.
    fn load<T: MonotonicallyMappableToU64>(
        &self,
        bytes: OwnedBytes,
    ) -> io::Result<Arc<dyn ColumnValues<T>>> {
        match *self {
            CodecType::Bitpacked => load_specific_codec::<BitpackedCodec, T>(bytes),
            CodecType::Linear => load_specific_codec::<LinearCodec, T>(bytes),
            CodecType::BlockwiseLinear => load_specific_codec::<BlockwiseLinearCodec, T>(bytes),
        }
    }
}

/// Loads a column with the codec `C` and wraps it so that its values are exposed as `T`.
///
/// # Errors
/// Forwards any error returned by `C::load`.
fn load_specific_codec<C: ColumnCodec, T: MonotonicallyMappableToU64>(
    bytes: OwnedBytes,
) -> io::Result<Arc<dyn ColumnValues<T>>> {
    let u64_reader = C::load(bytes)?;
    // Inverse of the mapping from `T` to the internal representation.
    let to_typed =
        StrictlyMonotonicMappingInverter::from(StrictlyMonotonicMappingToInternal::<T>::new());
    let typed_reader = monotonic_map_column(u64_reader, to_typed);
    Ok(Arc::new(typed_reader))
}

impl CodecType {
    /// Returns a boxed codec estimator associated to a given `CodecType`.
    ///
    /// Each call creates a fresh estimator through the codec's `boxed_estimator()`.
    pub fn estimator(&self) -> Box<dyn ColumnCodecEstimator> {
        match *self {
            CodecType::Bitpacked => BitpackedCodec::boxed_estimator(),
            CodecType::Linear => LinearCodec::boxed_estimator(),
            CodecType::BlockwiseLinear => BlockwiseLinearCodec::boxed_estimator(),
        }
    }
}

/// Serializes a given column of u64-mapped values.
///
/// The column is iterated twice. The first pass feeds the statistics collector and one
/// estimator per entry of `codec_types`. The codec with the smallest estimated size is then
/// selected, its one-byte code is written to `wrt`, and a second pass over `vals` lets the
/// selected estimator write the column itself.
///
/// # Errors
/// Returns an `InvalidData` error if no codec of `codec_types` provides an estimate, and
/// forwards any error raised while writing to `wrt`.
pub fn serialize_u64_based_column_values<T: MonotonicallyMappableToU64>(
    vals: &dyn Iterable<T>,
    codec_types: &[CodecType],
    wrt: &mut dyn Write,
) -> io::Result<()> {
    let mut stats_collector = StatsCollector::default();
    let mut estimators: Vec<(CodecType, Box<dyn ColumnCodecEstimator>)> = codec_types
        .iter()
        .map(|&codec_type| (codec_type, codec_type.estimator()))
        .collect();

    // First pass: every value goes to the stats collector and to each estimator.
    for val_u64 in vals.boxed_iter().map(MonotonicallyMappableToU64::to_u64) {
        stats_collector.collect(val_u64);
        estimators
            .iter_mut()
            .for_each(|(_, estimator)| estimator.collect(val_u64));
    }
    estimators
        .iter_mut()
        .for_each(|(_, estimator)| estimator.finalize());

    // Keep only the codecs able to provide an estimate, and pick the smallest one.
    let stats = stats_collector.stats();
    let cheapest = estimators
        .into_iter()
        .filter_map(|(codec_type, estimator)| {
            let num_bytes = estimator.estimate(&stats)?;
            Some((num_bytes, codec_type, estimator))
        })
        .min_by_key(|candidate| candidate.0);
    let Some((_, best_codec, best_codec_estimator)) = cheapest else {
        return Err(io::Error::new(
            io::ErrorKind::InvalidData,
            "No available applicable codec.",
        ));
    };

    // The codec code comes first, followed by the codec specific payload (second pass).
    best_codec.to_code().serialize(wrt)?;
    let mut u64_vals = vals.boxed_iter().map(MonotonicallyMappableToU64::to_u64);
    best_codec_estimator.serialize(&stats, &mut u64_vals, wrt)?;
    Ok(())
}

/// Load u64-based column values.
///
/// The first byte of `bytes` identifies the codec; the remaining bytes are handed to that
/// codec's loader.
///
/// # Errors
/// Returns an `InvalidData` error if `bytes` is empty or if its first byte is not a known
/// codec code, and forwards any error returned by the codec loader.
pub fn load_u64_based_column_values<T: MonotonicallyMappableToU64>(
    mut bytes: OwnedBytes,
) -> io::Result<Arc<dyn ColumnValues<T>>> {
    let Some(codec_type) = bytes
        .first()
        .copied()
        .and_then(CodecType::try_from_code)
    else {
        return Err(io::Error::new(
            io::ErrorKind::InvalidData,
            "Failed to read codec type",
        ));
    };
    // Skip the codec code byte.
    bytes.advance(1);
    codec_type.load(bytes)
}

/// Helper function to serialize a column (picking the best of `codec_types`) into an
/// in-memory buffer and then open it again.
///
/// # Panics
/// Panics if either the serialization or the loading fails.
pub fn serialize_and_load_u64_based_column_values<T: MonotonicallyMappableToU64>(
    vals: &dyn Iterable,
    codec_types: &[CodecType],
) -> Arc<dyn ColumnValues<T>> {
    let mut serialized = Vec::new();
    serialize_u64_based_column_values(vals, codec_types, &mut serialized).unwrap();
    let bytes = OwnedBytes::new(serialized);
    load_u64_based_column_values::<T>(bytes).unwrap()
}

#[cfg(test)]
mod tests;


================================================
FILE: columnar/src/column_values/u64_based/stats_collector.rs
================================================
use std::num::NonZeroU64;

use fastdivide::DividerU64;

use crate::RowId;
use crate::column_values::ColumnStats;

/// Computes the greatest common divisor of two non-zero numbers.
///
/// It is recommended, but not required, to feed values such that `large >= small`:
/// when they are passed the other way around, the first iteration simply swaps them.
fn compute_gcd(mut large: NonZeroU64, mut small: NonZeroU64) -> NonZeroU64 {
    // Euclid's algorithm: iterate until the remainder reaches zero.
    while let Some(remainder) = NonZeroU64::new(large.get() % small.get()) {
        large = small;
        small = remainder;
    }
    small
}

/// Accumulates the statistics of a column (min, max, number of rows and gcd) one value
/// at a time.
#[derive(Default)]
pub struct StatsCollector {
    /// `(min, max)` of the values collected so far, `None` until a value is collected.
    min_max_opt: Option<(u64, u64)>,
    /// Number of values collected so far.
    num_rows: RowId,
    // We measure the GCD of the difference between the values and the minimal value.
    // This is the same as computing the difference between the values and the first value.
    //
    // This way, we can compress i64-converted-to-u64 (e.g. timestamp that were supplied in
    // seconds, only to be converted in nanoseconds).
    //
    // The gcd is stored along with a precomputed divider for it.
    increment_gcd_opt: Option<(NonZeroU64, DividerU64)>,
    /// First value collected, used as the reference point for the gcd computation.
    first_value_opt: Option<u64>,
}

impl StatsCollector {
    /// Builds the `ColumnStats` for the values collected so far.
    ///
    /// If nothing was collected, min and max are both `0`. The gcd is `1` as long as no
    /// non-zero difference with the first value has been observed.
    pub fn stats(&self) -> ColumnStats {
        let (min_value, max_value) = self.min_max_opt.unwrap_or((0u64, 0u64));
        let gcd = match &self.increment_gcd_opt {
            Some((increment_gcd, _)) => *increment_gcd,
            None => NonZeroU64::new(1u64).unwrap(),
        };
        ColumnStats {
            min_value,
            max_value,
            num_rows: self.num_rows,
            gcd,
        }
    }

    /// Folds the distance between `value` and the first collected value into the running gcd.
    #[inline]
    fn update_increment_gcd(&mut self, value: u64) {
        let first_value = match self.first_value_opt {
            Some(first_value) => first_value,
            None => {
                // The very first value only serves as the reference point.
                self.first_value_opt = Some(value);
                return;
            }
        };
        let delta = match NonZeroU64::new(value.abs_diff(first_value)) {
            Some(delta) => delta,
            // A null difference does not affect the gcd.
            None => return,
        };
        match self.increment_gcd_opt {
            // First non-zero difference: it is the gcd for now.
            None => self.set_increment_gcd(delta),
            // A gcd of 1 cannot get any smaller.
            Some((gcd, _)) if gcd.get() == 1 => {}
            Some((gcd, gcd_divider)) => {
                let quotient = gcd_divider.divide(delta.get());
                let remainder = delta.get() - quotient * gcd.get();
                // The gcd only changes if it does not divide the new difference.
                if remainder != 0 {
                    let new_gcd = compute_gcd(delta, gcd);
                    self.set_increment_gcd(new_gcd);
                }
            }
        }
    }

    /// Stores `gcd` along with a divider precomputed for it.
    fn set_increment_gcd(&mut self, gcd: NonZeroU64) {
        self.increment_gcd_opt = Some((gcd, DividerU64::divide_by(gcd.get())));
    }

    /// Records one value: updates min/max, the row count and the gcd.
    pub fn collect(&mut self, value: u64) {
        let updated_min_max = match self.min_max_opt {
            Some((min, max)) => (min.min(value), max.max(value)),
            None => (value, value),
        };
        self.min_max_opt = Some(updated_min_max);
        self.num_rows += 1;
        self.update_increment_gcd(value);
    }
}

#[cfg(test)]
mod tests {
    use std::num::NonZeroU64;

    use crate::column_values::u64_based::ColumnStats;
    use crate::column_values::u64_based::stats_collector::{StatsCollector, compute_gcd};

    /// Runs a fresh `StatsCollector` over `vals` and returns the resulting stats.
    fn compute_stats(vals: impl Iterator<Item = u64>) -> ColumnStats {
        let mut stats_collector = StatsCollector::default();
        for val in vals {
            stats_collector.collect(val);
        }
        stats_collector.stats()
    }

    /// Returns the gcd reported by the stats of `vals`.
    fn find_gcd(vals: impl Iterator<Item = u64>) -> u64 {
        compute_stats(vals).gcd.get()
    }

    #[test]
    fn test_compute_gcd() {
        // Every case is checked with both argument orders.
        let test_compute_gcd_aux = |large, small, expected| {
            let large = NonZeroU64::new(large).unwrap();
            let small = NonZeroU64::new(small).unwrap();
            let expected = NonZeroU64::new(expected).unwrap();
            assert_eq!(compute_gcd(small, large), expected);
            assert_eq!(compute_gcd(large, small), expected);
        };
        test_compute_gcd_aux(1, 4, 1);
        test_compute_gcd_aux(2, 4, 2);
        test_compute_gcd_aux(10, 25, 5);
        test_compute_gcd_aux(25, 25, 25);
    }

    #[test]
    fn test_gcd() {
        assert_eq!(find_gcd([0].into_iter()), 1);
        assert_eq!(find_gcd([0, 10].into_iter()), 10);
        assert_eq!(find_gcd([10, 0].into_iter()), 10);
        assert_eq!(find_gcd([].into_iter()), 1);
        assert_eq!(find_gcd([15, 30, 5, 10].into_iter()), 5);
        assert_eq!(find_gcd([15, 16, 10].into_iter()), 1);
        assert_eq!(find_gcd([0, 5, 5, 5].into_iter()), 5);
        assert_eq!(find_gcd([0, 0].into_iter()), 1);
        // The gcd is computed on the differences with the first value (here 1).
        assert_eq!(find_gcd([1, 10, 4, 1, 7, 10].into_iter()), 3);
        assert_eq!(find_gcd([1, 10, 0, 4, 1, 7, 10].into_iter()), 1);
    }

    #[test]
    fn test_stats() {
        // Empty column.
        assert_eq!(
            compute_stats([].into_iter()),
            ColumnStats {
                gcd: NonZeroU64::new(1).unwrap(),
                min_value: 0,
                max_value: 0,
                num_rows: 0
            }
        );
        // Single value: there is no difference to compute a gcd from.
        assert_eq!(
            compute_stats([5].into_iter()),
            ColumnStats {
                gcd: NonZeroU64::new(1).unwrap(),
                min_value: 5,
                max_value: 5,
                num_rows: 1
            }
        );
        assert_eq!(
            compute_stats([0, 1].into_iter()),
            ColumnStats {
                gcd: NonZeroU64::new(1).unwrap(),
                min_value: 0,
                max_value: 1,
                num_rows: 2
            }
        );
        assert_eq!(
            compute_stats([10, 20, 30].into_iter()),
            ColumnStats {
                gcd: NonZeroU64::new(10).unwrap(),
                min_value: 10,
                max_value: 30,
                num_rows: 3
            }
        );
        // Repeated values are fine.
        assert_eq!(
            compute_stats([10, 50, 10, 30].into_iter()),
            ColumnStats {
                gcd: NonZeroU64::new(20).unwrap(),
                min_value: 10,
                max_value: 50,
                num_rows: 4
            }
        );
        // The first value is not the minimum.
        assert_eq!(
            compute_stats([10, 0, 30].into_iter()),
            ColumnStats {
                gcd: NonZeroU64::new(10).unwrap(),
                min_value: 0,
                max_value: 30,
                num_rows: 3
            }
        );
    }
}


================================================
FILE: columnar/src/column_values/u64_based/tests.rs
================================================
use proptest::prelude::*;
use proptest::{prop_oneof, proptest};
use rand::Rng;

/// Serializes three values with two candidate codecs, checks the serialized size and reads
/// the values back.
#[test]
fn test_serialize_and_load_simple() {
    let vals: [u64; 3] = [1, 2, 5];
    let mut serialized = Vec::new();
    serialize_u64_based_column_values(
        &&vals[..],
        &[CodecType::Bitpacked, CodecType::BlockwiseLinear],
        &mut serialized,
    )
    .unwrap();
    assert_eq!(serialized.len(), 7);
    let col = load_u64_based_column_values::<u64>(OwnedBytes::new(serialized)).unwrap();
    assert_eq!(col.num_vals(), 3);
    for (row, expected) in vals.iter().copied().enumerate() {
        assert_eq!(col.get_val(row as u32), expected);
    }
}

/// An empty `i64` column must be serializable by at least one codec, and must report
/// `i64::MIN` as both its min and max once loaded.
#[test]
fn test_empty_column_i64() {
    let no_vals: [i64; 0] = [];
    let mut num_acceptable_codecs = 0;
    for codec in ALL_U64_CODEC_TYPES {
        let mut serialized = Vec::new();
        let outcome = serialize_u64_based_column_values(&&no_vals[..], &[codec], &mut serialized);
        // Codecs that cannot handle an empty column are simply skipped.
        if outcome.is_ok() {
            num_acceptable_codecs += 1;
            let col = load_u64_based_column_values::<i64>(OwnedBytes::new(serialized)).unwrap();
            assert_eq!(col.num_vals(), 0);
            assert_eq!(col.min_value(), i64::MIN);
            assert_eq!(col.max_value(), i64::MIN);
        }
    }
    assert!(num_acceptable_codecs > 0);
}

/// An empty `u64` column must be serializable by at least one codec, and must report
/// `u64::MIN` as both its min and max once loaded.
#[test]
fn test_empty_column_u64() {
    let no_vals: [u64; 0] = [];
    let mut num_acceptable_codecs = 0;
    for codec in ALL_U64_CODEC_TYPES {
        let mut serialized = Vec::new();
        let outcome = serialize_u64_based_column_values(&&no_vals[..], &[codec], &mut serialized);
        // Codecs that cannot handle an empty column are simply skipped.
        if outcome.is_ok() {
            num_acceptable_codecs += 1;
            let col = load_u64_based_column_values::<u64>(OwnedBytes::new(serialized)).unwrap();
            assert_eq!(col.num_vals(), 0);
            assert_eq!(col.min_value(), u64::MIN);
            assert_eq!(col.max_value(), u64::MIN);
        }
    }
    assert!(num_acceptable_codecs > 0);
}

/// An empty `f64` column must be serializable by at least one codec. Once loaded, its min
/// and max are currently NaN.
#[test]
fn test_empty_column_f64() {
    let no_vals: [f64; 0] = [];
    let mut num_acceptable_codecs = 0;
    for codec in ALL_U64_CODEC_TYPES {
        let mut serialized = Vec::new();
        let outcome = serialize_u64_based_column_values(&&no_vals[..], &[codec], &mut serialized);
        // Codecs that cannot handle an empty column are simply skipped.
        if outcome.is_ok() {
            num_acceptable_codecs += 1;
            let col = load_u64_based_column_values::<f64>(OwnedBytes::new(serialized)).unwrap();
            assert_eq!(col.num_vals(), 0);
            // FIXME. f64::MIN would be better!
            assert!(col.min_value().is_nan());
            assert!(col.max_value().is_nan());
        }
    }
    assert!(num_acceptable_codecs > 0);
}

/// Serializes `vals` with the codec `TColumnCodec`, loads the result back and checks that
/// every access path of the reader returns the original values.
///
/// Returns `None` if the codec's estimator does not provide an estimate. Otherwise returns
/// `(estimated compression rate, actual compression rate)`.
///
/// `name` is only used to identify the data set in assertion messages.
///
/// # Panics
/// Panics if the serialization or the loading fails, if a value read back differs from the
/// original, or if the estimate is off by 10% or more for payloads larger than 1000 bytes.
pub(crate) fn create_and_validate<TColumnCodec: ColumnCodec>(
    vals: &[u64],
    name: &str,
) -> Option<(f32, f32)> {
    // First pass: gather the stats and feed the estimator.
    let mut stats_collector = StatsCollector::default();
    let mut codec_estimator = TColumnCodec::Estimator::default();
    vals.boxed_iter().for_each(|val| {
        stats_collector.collect(val);
        codec_estimator.collect(val);
    });
    codec_estimator.finalize();
    let stats = stats_collector.stats();
    let estimation = codec_estimator.estimate(&stats)?;

    // Second pass: serialize, then open what was just written.
    let mut serialized = Vec::new();
    codec_estimator
        .serialize(&stats, vals.boxed_iter().as_mut(), &mut serialized)
        .unwrap();
    let actual_compression = serialized.len() as u64;
    let reader = TColumnCodec::load(OwnedBytes::new(serialized)).unwrap();
    assert_eq!(reader.num_vals(), vals.len() as u32);

    // Point lookups, through `get_val` and through a single-element `get_vals`.
    let mut fetched = Vec::new();
    for (doc, &orig_val) in vals.iter().enumerate() {
        let doc = doc as u32;
        let val = reader.get_val(doc);
        assert_eq!(
            val, orig_val,
            "val `{val}` does not match orig_val {orig_val:?}, in data set {name}, data `{vals:?}`",
        );

        fetched.resize(1, 0);
        reader.get_vals(&[doc], &mut fetched);
        let val = fetched[0];
        assert_eq!(
            val, orig_val,
            "val `{val}` does not match orig_val {orig_val:?}, in data set {name}, data `{vals:?}`",
        );
    }

    // Bulk lookup of every row at once.
    let all_docs: Vec<u32> = (0..vals.len() as u32).collect();
    fetched.resize(all_docs.len(), 0);
    reader.get_vals(&all_docs, &mut fetched);
    assert_eq!(vals, fetched);

    // Value lookup: search for the value of a randomly picked row.
    if !vals.is_empty() {
        let test_rand_idx = rand::rng().random_range(0..=vals.len() - 1);
        let probe = vals[test_rand_idx];
        let expected_positions: Vec<u32> = (0..vals.len() as u32)
            .filter(|&pos| vals[pos as usize] == probe)
            .collect();
        let mut positions = Vec::new();
        reader.get_row_ids_for_value_range(probe..=probe, 0..vals.len() as u32, &mut positions);
        assert_eq!(expected_positions, positions);
    }

    // The estimate is only checked on payloads large enough for it to be meaningful.
    if actual_compression > 1000 {
        assert!(relative_difference(estimation, actual_compression) < 0.10f32);
    }
    let estimated_rate = compression_rate(estimation, stats.num_rows);
    let actual_rate = compression_rate(actual_compression, stats.num_rows);
    Some((estimated_rate, actual_rate))
}

/// Ratio between `num_bytes` and the size of `num_values` uncompressed values (8 bytes each).
fn compression_rate(num_bytes: u64, num_values: u32) -> f32 {
    let uncompressed_num_bytes = num_values as f32 * 8.0;
    num_bytes as f32 / uncompressed_num_bytes
}

/// Absolute difference between `left` and `right`, relative to their mean.
fn relative_difference(left: u64, right: u64) -> f32 {
    let (left, right) = (left as f32, right as f32);
    let gap = (left - right).abs();
    let sum = left + right;
    2.0f32 * gap / sum
}

// Property tests on small inputs (1 to 9 values drawn from `num_strategy`), 100 cases each:
// every codec must round-trip the generated data through `create_and_validate`.
proptest! {
    #![proptest_config(ProptestConfig::with_cases(100))]

    #[test]
    fn test_proptest_small_bitpacked(data in proptest::collection::vec(num_strategy(), 1..10)) {
        create_and_validate::<BitpackedCodec>(&data, "proptest bitpacked");
    }

    #[test]
    fn test_proptest_small_linear(data in proptest::collection::vec(num_strategy(), 1..10)) {
        create_and_validate::<LinearCodec>(&data, "proptest linearinterpol");
    }


    #[test]
    fn test_proptest_small_blockwise_linear(data in proptest::collection::vec(num_strategy(), 1..10)) {
        create_and_validate::<BlockwiseLinearCodec>(&data, "proptest multilinearinterpol");
    }
}

/// Fixed two-value example (values around `2^63`) for the blockwise linear codec.
#[test]
fn test_small_blockwise_linear_example() {
    let data: [u64; 2] = [9223372036854775808, 9223370937344622593];
    create_and_validate::<BlockwiseLinearCodec>(&data, "proptest multilinearinterpol");
}

// Property tests on larger inputs (1 to 5999 values drawn from `num_strategy`), 10 cases
// each: every codec must round-trip the generated data through `create_and_validate`.
proptest! {
    #![proptest_config(ProptestConfig::with_cases(10))]

    #[test]
    fn test_proptest_large_bitpacked(data in proptest::collection::vec(num_strategy(), 1..6000)) {
        create_and_validate::<BitpackedCodec>(&data, "proptest bitpacked");
    }

    #[test]
    fn test_proptest_large_linear(data in proptest::collection::vec(num_strategy(), 1..6000)) {
        create_and_validate::<LinearCodec>(&data, "proptest linearinterpol");
    }

    #[test]
    fn test_proptest_large_blockwise_linear(data in proptest::collection::vec(num_strategy(), 1..6000)) {
        create_and_validate::<BlockwiseLinearCodec>(&data, "proptest multilinearinterpol");
    }
}

/// Strategy generating `u64` values with a bias towards both ends of the range.
///
/// With weight 1 each, values are taken from the 10 largest and from the 10 smallest
/// `u64`; with weight 20, any `u64` is generated.
fn num_strategy() -> impl Strategy<Value = u64> {
    prop_oneof![
        1 => prop::num::u64::ANY.prop_map(|raw| u64::MAX - (raw % 10)),
        1 => prop::num::u64::ANY.prop_map(|raw| raw % 10),
        20 => prop::num::u64::ANY,
    ]
}

/// Returns the named data sets shared by the codec tests, as `(values, name)` pairs.
pub fn get_codec_test_datasets() -> Vec<(Vec<u64>, &'static str)> {
    vec![
        (
            (10..=10_000_u64).collect::<Vec<_>>(),
            "simple monotonically increasing",
        ),
        (
            vec![5, 6, 7, 8, 9, 10, 99, 100],
            "offset in linear interpol",
        ),
        (vec![5, 50, 3, 13, 1, 1000, 35], "rand small"),
        (vec![10], "single value"),
        (
            vec![1572656989877777, 1170935903116329, 720575940379279, 0],
            "overflow error",
        ),
    ]
}

/// Runs `create_and_validate` for the codec `C` over every shared data set and prints the
/// estimated and actual compression rates (or `Disabled` when the codec gives no estimate).
fn test_codec<C: ColumnCodec>() {
    let codec_name = std::any::type_name::<C>();
    for (data, dataset_name) in get_codec_test_datasets() {
        let result = match tests::create_and_validate::<C>(&data, dataset_name) {
            Some((estimate, actual)) => format!("Estimate `{estimate}` Actual `{actual}`"),
            None => "Disabled".to_string(),
        };
        println!("Codec {codec_name}, DataSet {dataset_name}, {result}");
    }
}
/// Validates `BitpackedCodec` against all the shared data sets.
#[test]
fn test_codec_bitpacking() {
    test_codec::<BitpackedCodec>();
}
/// Validates `LinearCodec` against all the shared data sets.
#[test]
fn test_codec_interpolation() {
    test_codec::<LinearCodec>();
}
/// Validates `BlockwiseLinearCodec` against all the shared data sets.
#[test]
fn test_codec_multi_interpolation() {
    test_codec::<BlockwiseLinearCodec>();
}

use super::*;

/// Returns the compression rate estimated by the codec `C` for `vals`, i.e. the estimated
/// number of bytes divided by 8 bytes per value.
///
/// Returns `None` if the codec provides no estimate or if `vals` is empty.
fn estimate<C: ColumnCodec>(vals: &[u64]) -> Option<f32> {
    let mut stats_collector = StatsCollector::default();
    let mut estimator = C::Estimator::default();
    vals.iter().copied().for_each(|val| {
        stats_collector.collect(val);
        estimator.collect(val);
    });
    estimator.finalize();
    let stats = stats_collector.stats();
    let num_bytes = estimator.estimate(&stats)?;
    (stats.num_rows != 0).then(|| num_bytes as f32 / (8.0 * stats.num_rows as f32))
}

/// On a consecutive range, the linear codec must be estimated as the cheapest of the
/// three codecs.
#[test]
fn estimation_good_interpolation_case() {
    let data: Vec<u64> = (10..=20000_u64).collect();

    let linear_rate = estimate::<LinearCodec>(&data).unwrap();
    assert_le!(linear_rate, 0.01);

    let blockwise_linear_rate = estimate::<BlockwiseLinearCodec>(&data).unwrap();
    assert_le!(blockwise_linear_rate, 0.2);
    assert_lt!(linear_rate, blockwise_linear_rate);

    let bitpacked_rate = estimate::<BitpackedCodec>(&data).unwrap();
    assert_lt!(linear_rate, bitpacked_rate);
}

/// A consecutive range followed by one large outlier: bitpacking must not be estimated as
/// more expensive than linear interpolation.
#[test]
fn estimation_test_bad_interpolation_case_monotonically_increasing() {
    let mut data: Vec<u64> = (201..=20000_u64).collect();
    data.push(1_000_000);

    // In this case linear interpolation cannot actually be worse than bitpacking,
    // but the estimator adds some threshold, which leads to a worse estimate.
    let linear_rate = estimate::<LinearCodec>(&data[..]).unwrap();
    assert_le!(linear_rate, 0.35);

    let bitpacked_rate = estimate::<BitpackedCodec>(&data).unwrap();
    assert_le!(bitpacked_rate, 0.32);
    assert_le!(bitpacked_rate, linear_rate);
}

/// Every code accepted by `try_from_code` must map back to itself through `to_code`, and
/// exactly three codes must be accepted.
#[test]
fn test_fast_field_codec_type_to_code() {
    let known_codecs: Vec<(u8, CodecType)> = (0..=255u8)
        .filter_map(|code| CodecType::try_from_code(code).map(|codec_type| (code, codec_type)))
        .collect();
    for &(code, codec_type) in &known_codecs {
        assert_eq!(codec_type.to_code(), code);
    }
    assert_eq!(known_codecs.len(), 3);
}

/// Serializes `num_vals` multiples of 1000 (starting at -4000) as `i64` with `codec_type`,
/// checks the values read back, then checks that replacing the last value with 1001
/// yields a larger serialized column.
fn test_fastfield_gcd_i64_with_codec(codec_type: CodecType, num_vals: usize) -> io::Result<()> {
    let last_multiple = (num_vals as i64) - 5;
    let mut vals: Vec<i64> = (-4..=last_multiple).map(|val| val * 1000).collect();

    let mut with_gcd: Vec<u8> = Vec::new();
    crate::column_values::serialize_u64_based_column_values(
        &&vals[..],
        &[codec_type],
        &mut with_gcd,
    )?;
    let with_gcd = OwnedBytes::new(with_gcd);
    let column = crate::column_values::load_u64_based_column_values::<i64>(with_gcd.clone())?;
    for (row, expected) in [-4000i64, -3000i64, -2000i64].into_iter().enumerate() {
        assert_eq!(column.get_val(row as u32), expected);
    }
    assert_eq!(column.max_value(), last_multiple * 1000);
    assert_eq!(column.min_value(), -4000i64);

    // Can't apply gcd
    vals.pop();
    vals.push(1001i64);
    let mut without_gcd = Vec::new();
    crate::column_values::serialize_u64_based_column_values(
        &&vals[..],
        &[codec_type],
        &mut without_gcd,
    )?;
    let without_gcd = OwnedBytes::new(without_gcd);
    assert!(without_gcd.len() > with_gcd.len());

    Ok(())
}

/// Runs the `i64` gcd scenario with 5500 values for each codec.
#[test]
fn test_fastfield_gcd_i64() -> io::Result<()> {
    let codec_types = [
        CodecType::Bitpacked,
        CodecType::BlockwiseLinear,
        CodecType::Linear,
    ];
    for codec_type in codec_types {
        test_fastfield_gcd_i64_with_codec(codec_type, 5500)?;
    }
    Ok(())
}

/// Serializes the `num_vals` first positive multiples of 1000 as `u64` with `codec_type`,
/// checks the values read back, then checks that replacing the last value with 1001
/// yields a larger serialized column.
fn test_fastfield_gcd_u64_with_codec(codec_type: CodecType, num_vals: usize) -> io::Result<()> {
    let mut vals: Vec<u64> = (1..=num_vals).map(|i| i as u64 * 1000u64).collect();

    let mut with_gcd: Vec<u8> = Vec::new();
    crate::column_values::serialize_u64_based_column_values(
        &&vals[..],
        &[codec_type],
        &mut with_gcd,
    )?;
    let with_gcd = OwnedBytes::new(with_gcd);
    let column = crate::column_values::load_u64_based_column_values::<u64>(with_gcd.clone())?;
    for (row, expected) in [1000u64, 2000u64, 3000u64].into_iter().enumerate() {
        assert_eq!(column.get_val(row as u32), expected);
    }
    assert_eq!(column.max_value(), num_vals as u64 * 1000);
    assert_eq!(column.min_value(), 1000u64);

    // Can't apply gcd
    vals.pop();
    vals.push(1001u64);
    let mut without_gcd = Vec::new();
    crate::column_values::serialize_u64_based_column_values(
        &&vals[..],
        &[codec_type],
        &mut without_gcd,
    )?;
    let without_gcd = OwnedBytes::new(without_gcd);
    assert!(without_gcd.len() > with_gcd.len());
    Ok(())
}

/// Runs the `u64` gcd scenario with 5500 values for each codec.
#[test]
fn test_fastfield_gcd_u64() -> io::Result<()> {
    let codec_types = [
        CodecType::Bitpacked,
        CodecType::BlockwiseLinear,
        CodecType::Linear,
    ];
    for codec_type in codec_types {
        test_fastfield_gcd_u64_with_codec(codec_type, 5500)?;
    }
    Ok(())
}

/// Round-trips three values through the serialize-and-load helper with every codec
/// available for selection.
#[test]
pub fn test_fastfield2() {
    let vals: [u64; 3] = [100u64, 200u64, 300u64];
    let test_fastfield = crate::column_values::serialize_and_load_u64_based_column_values::<u64>(
        &&vals[..],
        &ALL_U64_CODEC_TYPES,
    );
    for (row, expected) in vals.into_iter().enumerate() {
        assert_eq!(test_fastfield.get_val(row as u32), expected);
    }
}


================================================
FILE: columnar/src/column_values/vec_column.rs
================================================
use std::fmt::Debug;

use tantivy_bitpacker::minmax;

use crate::ColumnValues;

/// VecColumn provides `Column` over a `Vec<T>`.
///
/// The minimum and maximum values are stored alongside the values, so that
/// `min_value()` and `max_value()` do not need to scan them.
pub struct VecColumn<T = u64> {
    /// The values of the column, indexed by position.
    pub(crate) values: Vec<T>,
    /// Value reported by `min_value()`.
    pub(crate) min_value: T,
    /// Value reported by `max_value()`.
    pub(crate) max_value: T,
}

impl<T: Copy + PartialOrd + Send + Sync + Debug + 'static> ColumnValues<T> for VecColumn<T> {
    /// Returns the value at `position`.
    ///
    /// Panics if `position` is out of bounds.
    fn get_val(&self, position: u32) -> T {
        let idx = position as usize;
        self.values[idx]
    }

    /// Iterates over all the values, in position order.
    fn iter(&self) -> Box<dyn Iterator<Item = T> + '_> {
        let all_values = self.values.iter().copied();
        Box::new(all_values)
    }

    /// Returns the stored minimum.
    fn min_value(&self) -> T {
        self.min_value
    }

    /// Returns the stored maximum.
    fn max_value(&self) -> T {
        self.max_value
    }

    /// Returns the number of values, truncated to `u32`.
    fn num_vals(&self) -> u32 {
        self.values.len() as u32
    }

    /// Fills `output` with the `output.len()` values starting at position `start`.
    ///
    /// Panics if that range goes past the end of the column.
    fn get_range(&self, start: u64, output: &mut [T]) {
        let tail = &self.values[start as usize..];
        let len = output.len();
        output.copy_from_slice(&tail[..len])
    }
}

impl<T: Copy + PartialOrd + Default> From<Vec<T>> for VecColumn<T> {
    fn from(values: Vec<T>) -> Self {
        let (min_value, max_value) = minmax(values.iter().copied()).unwrap_or_default();
        Self {
            values,
            min_value,
            max_value,
        }
    }
}
impl From<VecColumn> for Vec<u64> {
    fn from(column: VecColumn) -> Self {
        column.values
    }
}


================================================
FILE: columnar/src/columnar/column_type.rs
================================================
use std::fmt;
use std::fmt::Debug;
use std::net::Ipv6Addr;

use serde::{Deserialize, Serialize};

use crate::InvalidData;
use crate::value::NumericalType;

/// The type of a column.
///
/// The explicit discriminant of each variant is the code returned by
/// `ColumnType::to_code` and accepted by `ColumnType::try_from_code`.
///
/// Any changes need to be propagated to `COLUMN_TYPES`.
#[derive(Hash, Eq, PartialEq, Debug, Clone, Copy, Ord, PartialOrd, Serialize, Deserialize)]
#[repr(u8)]
pub enum ColumnType {
    I64 = 0u8,
    U64 = 1u8,
    F64 = 2u8,
    Bytes = 3u8,
    Str = 4u8,
    Bool = 5u8,
    IpAddr = 6u8,
    DateTime = 7u8,
}

impl fmt::Display for ColumnType {
    /// Writes the short lowercase name of the column type (e.g. `i64`, `ip`).
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.write_str(match self {
            ColumnType::I64 => "i64",
            ColumnType::U64 => "u64",
            ColumnType::F64 => "f64",
            ColumnType::Bytes => "bytes",
            ColumnType::Str => "str",
            ColumnType::Bool => "bool",
            ColumnType::IpAddr => "ip",
            ColumnType::DateTime => "datetime",
        })
    }
}

// All the column types, indexed by their code.
//
// `ColumnType::try_from_code` looks a code up by indexing into this array, so
// the order needs to match _exactly_ the order in the enum: the entry at
// index `i` must be the variant whose discriminant is `i`.
const COLUMN_TYPES: [ColumnType; 8] = [
    ColumnType::I64,
    ColumnType::U64,
    ColumnType::F64,
    ColumnType::Bytes,
    ColumnType::Str,
    ColumnType::Bool,
    ColumnType::IpAddr,
    ColumnType::DateTime,
];

impl ColumnType {
    /// Returns the one-byte code of this column type, i.e. its discriminant.
    pub fn to_code(self) -> u8 {
        self as u8
    }

    /// Returns true if and only if this is `ColumnType::DateTime`.
    pub fn is_date_time(&self) -> bool {
        matches!(self, ColumnType::DateTime)
    }

    /// Returns the column type associated with `code`, or `InvalidData` if
    /// `code` is not the code of any column type.
    pub(crate) fn try_from_code(code: u8) -> Result<ColumnType, InvalidData> {
        match COLUMN_TYPES.get(usize::from(code)) {
            Some(&column_type) => Ok(column_type),
            None => Err(InvalidData),
        }
    }
}

impl From<NumericalType> for ColumnType {
    fn from(numerical_type: NumericalType) -> Self {
        match numerical_type {
            NumericalType::I64 => ColumnType::I64,
            NumericalType::U64 => ColumnType::U64,
            NumericalType::F64 => ColumnType::F64,
        }
    }
}

impl ColumnType {
    /// Returns the numerical type matching this column type, or `None` if the
    /// column type is not one of `I64`, `U64` or `F64`.
    pub fn numerical_type(&self) -> Option<NumericalType> {
        let numerical_type = match *self {
            Self::I64 => NumericalType::I64,
            Self::U64 => NumericalType::U64,
            Self::F64 => NumericalType::F64,
            Self::Bytes | Self::Str | Self::Bool | Self::IpAddr | Self::DateTime => return None,
        };
        Some(numerical_type)
    }
}

// TODO remove if possible
/// Implemented by the Rust value types that map to a `ColumnType`.
pub trait HasAssociatedColumnType: 'static + Debug + Send + Sync + Copy + PartialOrd {
    /// The `ColumnType` associated with `Self`.
    fn column_type() -> ColumnType;
    /// The default value for `Self`.
    fn default_value() -> Self;
}

impl HasAssociatedColumnType for u64 {
    /// `u64` values are stored in `ColumnType::U64` columns.
    fn column_type() -> ColumnType {
        ColumnType::U64
    }

    /// The default `u64` value is zero.
    fn default_value() -> Self {
        0
    }
}

impl HasAssociatedColumnType for i64 {
    /// `i64` values are stored in `ColumnType::I64` columns.
    fn column_type() -> ColumnType {
        ColumnType::I64
    }

    /// The default `i64` value is zero.
    fn default_value() -> Self {
        0
    }
}

impl HasAssociatedColumnType for f64 {
    /// `f64` values are stored in `ColumnType::F64` columns.
    fn column_type() -> ColumnType {
        ColumnType::F64
    }

    /// The default `f64` value is (positive) zero.
    fn default_value() -> Self {
        0.0
    }
}

impl HasAssociatedColumnType for bool {
    /// `bool` values are stored in `ColumnType::Bool` columns.
    fn column_type() -> ColumnType {
        ColumnType::Bool
    }

    /// The default `bool` value is `false`.
    fn default_value() -> Self {
        false
    }
}

impl HasAssociatedColumnType for common::DateTime {
    /// `DateTime` values are stored in `ColumnType::DateTime` columns.
    fn column_type() -> ColumnType {
        ColumnType::DateTime
    }

    /// The default value is whatever `DateTime`'s `Default` implementation returns.
    fn default_value() -> Self {
        <Self as Default>::default()
    }
}

impl HasAssociatedColumnType for Ipv6Addr {
    /// `Ipv6Addr` values are stored in `ColumnType::IpAddr` columns.
    fn column_type() -> ColumnType {
        ColumnType::IpAddr
    }

    /// The default value is the all-zero address (`::`).
    fn default_value() -> Self {
        Ipv6Addr::UNSPECIFIED
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::Cardinality;

    /// Checks that codes and column types round-trip, and that `COLUMN_TYPES`
    /// is ordered by code.
    #[test]
    fn test_column_type_to_code() {
        for (code, expected_column_type) in COLUMN_TYPES.iter().copied().enumerate() {
            let code = code as u8;
            // `try_from_code` indexes into `COLUMN_TYPES`, so comparing its
            // result with `COLUMN_TYPES[code]` alone proves nothing. The
            // discriminant check is what verifies that the array order
            // matches the enum.
            assert_eq!(expected_column_type.to_code(), code);
            // Every code below `COLUMN_TYPES.len()` must be accepted.
            assert_eq!(
                ColumnType::try_from_code(code).ok(),
                Some(expected_column_type)
            );
        }
        for code in COLUMN_TYPES.len() as u8..=u8::MAX {
            assert!(ColumnType::try_from_code(code).is_err());
        }
    }

    /// Checks that every valid cardinality code round-trips and that there
    /// are exactly three of them.
    #[test]
    fn test_cardinality_to_code() {
        let mut num_cardinality = 0;
        for code in u8::MIN..=u8::MAX {
            if let Ok(cardinality) = Cardinality::try_from_code(code) {
                assert_eq!(cardinality.to_code(), code);
                num_cardinality += 1;
            }
        }
        assert_eq!(num_cardinality, 3);
    }
}


================================================
FILE: columnar/src/columnar/format_version.rs
================================================
use core::fmt;
use std::fmt::{Display, Formatter};

use crate::InvalidData;

/// Length in bytes of the version footer: a `u32` version code plus the magic bytes.
pub const VERSION_FOOTER_NUM_BYTES: usize = MAGIC_BYTES.len() + std::mem::size_of::<u32>();

/// We end the file with these 4 bytes just to somewhat identify that
/// this is indeed a columnar file.
///
/// `parse_footer` rejects any footer whose last 4 bytes differ from these.
const MAGIC_BYTES: [u8; 4] = [2, 113, 119, 66];

/// Builds the version footer: the current version code as 4 little-endian
/// bytes, followed by the 4 magic bytes.
pub fn footer() -> [u8; VERSION_FOOTER_NUM_BYTES] {
    let mut footer_bytes = [0u8; VERSION_FOOTER_NUM_BYTES];
    let (version_part, magic_part) = footer_bytes.split_at_mut(4);
    version_part.copy_from_slice(&CURRENT_VERSION.to_bytes());
    magic_part.copy_from_slice(&MAGIC_BYTES);
    footer_bytes
}

pub fn parse_footer(footer_bytes: [u8; VERSION_FOOTER_NUM_BYTES]) -> Result<Version, InvalidData> {
    if footer_bytes[4..8] != MAGIC_BYTES {
        return Err(InvalidData);
    }
    Version::try_from_bytes(footer_bytes[0..4].try_into().unwrap())
}

/// The format version written by `footer()`.
pub const CURRENT_VERSION: Version = Version::V2;

/// Version of the columnar format.
///
/// The discriminant is the `u32` code that is serialized, in little-endian, in
/// the footer.
#[derive(Debug, Copy, Clone, Eq, PartialEq)]
#[repr(u32)]
pub enum Version {
    V1 = 1u32,
    V2 = 2u32,
}

impl Display for Version {
    /// Writes the version as `v1` or `v2`.
    fn fmt(&self, f: &mut Formatter) -> fmt::Result {
        let label = match self {
            Version::V1 => "v1",
            Version::V2 => "v2",
        };
        f.write_str(label)
    }
}

impl Version {
    /// Encodes the version code as 4 little-endian bytes.
    fn to_bytes(self) -> [u8; 4] {
        let code = self as u32;
        code.to_le_bytes()
    }

    /// Decodes a version from 4 little-endian bytes.
    ///
    /// Returns `InvalidData` if the code does not match any known version.
    fn try_from_bytes(bytes: [u8; 4]) -> Result<Version, InvalidData> {
        match u32::from_le_bytes(bytes) {
            code if code == Version::V1 as u32 => Ok(Version::V1),
            code if code == Version::V2 as u32 => Ok(Version::V2),
            _ => Err(InvalidData),
        }
    }
}

#[cfg(test)]
mod tests {
    use std::collections::HashSet;

    use super::*;

    /// The footer we write must parse back to `Version::V2`.
    #[test]
    fn test_footer_deserialization() {
        let parsed_version: Version = parse_footer(footer()).unwrap();
        assert_eq!(Version::V2, parsed_version);
    }

    /// Probes codes in `0..255`, shifted by each of the four byte offsets:
    /// every code that decodes must re-encode to the same bytes, and exactly
    /// two codes must decode.
    #[test]
    fn test_version_serialization() {
        let mut valid_versions: HashSet<u32> = HashSet::new();
        for offset in [0u32, 1 << 8, 1 << 16, 1 << 24] {
            for low_byte in 0u32..255 {
                let code = low_byte + offset;
                let code_bytes = code.to_le_bytes();
                if let Ok(version) = Version::try_from_bytes(code_bytes) {
                    assert_eq!(version.to_bytes(), code_bytes);
                    valid_versions.insert(code);
                }
            }
        }
        assert_eq!(valid_versions.len(), 2);
    }
}


================================================
FILE: columnar/src/columnar/merge/merge_dict_column.rs
================================================
use std::io::{self, Write};

use common::{BitSet, CountingWriter, ReadOnlyBitSet};
use sstable::{SSTable, Streamer, TermOrdinal, VoidSSTable};

use super::term_merger::{TermMerger, TermsWithSegmentOrd};
use crate::column::serialize_column_mappable_to_u64;
use crate::column_index::SerializableColumnIndex;
use crate::iterable::Iterable;
use crate::{BytesColumn, MergeRowOrder, ShuffleMergeOrder};

// Serialize [Dictionary, Column, dictionary num bytes U32::LE]
// Column: [Column Index, Column Values, column index num bytes U32::LE]
/// Merges several bytes/str columns into `output`.
///
/// The merged dictionary is written first, then the column of remapped term
/// ordinals, and finally the length of the dictionary in bytes as a
/// little-endian `u32`.
///
/// # Errors
///
/// Returns an error if any write fails, or if the serialized dictionary is too
/// large for its length to fit in the `u32` footer.
pub fn merge_bytes_or_str_column(
    column_index: SerializableColumnIndex<'_>,
    bytes_columns: &[Option<BytesColumn>],
    merge_row_order: &MergeRowOrder,
    output: &mut impl Write,
) -> io::Result<()> {
    // Serialize dict and generate mapping for values
    let mut output = CountingWriter::wrap(output);
    // TODO !!! Remove useless terms.
    let term_ord_mapping = serialize_merged_dict(bytes_columns, merge_row_order, &mut output)?;
    // A plain `as u32` cast would silently truncate the length and yield a
    // column whose footer points to the wrong offset.
    let dictionary_num_bytes: u32 = u32::try_from(output.written_bytes()).map_err(|_| {
        io::Error::new(
            io::ErrorKind::InvalidInput,
            "Merged dictionary is too large: its length in bytes does not fit in a u32.",
        )
    })?;
    let output = output.finish();
    let remapped_term_ordinals_values = RemappedTermOrdinalsValues {
        bytes_columns,
        term_ord_mapping: &term_ord_mapping,
        merge_row_order,
    };
    serialize_column_mappable_to_u64(column_index, &remapped_term_ordinals_values, output)?;
    output.write_all(&dictionary_num_bytes.to_le_bytes())?;
    Ok(())
}

/// Iterable over the term ordinals of the merged column: the term ordinals of
/// the input columns, remapped to their ordinal in the merged dictionary.
struct RemappedTermOrdinalsValues<'a> {
    /// The input columns, one slot per segment. `None` if the segment has no such column.
    bytes_columns: &'a [Option<BytesColumn>],
    /// For each segment, the mapping from old term ordinals to merged term ordinals.
    term_ord_mapping: &'a TermOrdinalMapping,
    /// Decides in which order the rows (and hence their term ordinals) are emitted.
    merge_row_order: &'a MergeRowOrder,
}

impl Iterable for RemappedTermOrdinalsValues<'_> {
    /// Dispatches to the stacked or shuffled iteration, depending on the merge row order.
    fn boxed_iter(&self) -> Box<dyn Iterator<Item = u64> + '_> {
        match self.merge_row_order {
            MergeRowOrder::Shuffled(shuffle_merge_order) => {
                self.boxed_iter_shuffled(shuffle_merge_order)
            }
            MergeRowOrder::Stack(_) => self.boxed_iter_stacked(),
        }
    }
}

impl RemappedTermOrdinalsValues<'_> {
    /// Emits, segment after segment, every term ordinal of each present
    /// column, remapped to its ordinal in the merged dictionary.
    ///
    /// Segments without a column are skipped.
    fn boxed_iter_stacked(&self) -> Box<dyn Iterator<Item = u64> + '_> {
        let present_columns = self.bytes_columns.iter().enumerate().filter_map(
            |(seg_ord, bytes_column_opt)| {
                bytes_column_opt
                    .as_ref()
                    .map(|bytes_column| (seg_ord, bytes_column))
            },
        );
        let remapped_term_ords = present_columns.flat_map(move |(seg_ord, bytes_column)| {
            let new_term_ords = self.term_ord_mapping.get_segment(seg_ord as u32);
            bytes_column
                .ords()
                .values
                .iter()
                .map(move |old_term_ord| new_term_ords[old_term_ord as usize])
        });
        Box::new(remapped_term_ords)
    }

    /// Emits the remapped term ordinals following the new row order: for each
    /// new row, the term ordinals of the old row it comes from.
    ///
    /// Rows coming from a segment without a column emit nothing.
    fn boxed_iter_shuffled<'b>(
        &'b self,
        shuffle_merge_order: &'b ShuffleMergeOrder,
    ) -> Box<dyn Iterator<Item = u64> + 'b> {
        Box::new(
            shuffle_merge_order
                .iter_new_to_old_row_addrs()
                .flat_map(move |old_addr| {
                    // Old term ordinal -> merged term ordinal, for the segment of this row.
                    let new_term_ords = self.term_ord_mapping.get_segment(old_addr.segment_ord);
                    self.bytes_columns[old_addr.segment_ord as usize]
                        .as_ref()
                        .into_iter()
                        .flat_map(move |bytes_column| {
                            bytes_column
                                .term_ords(old_addr.row_id)
                                .map(|old_term_ord: u64| new_term_ords[old_term_ord as usize])
                        })
                }),
        )
    }
}

/// Computes the set of term ordinals of `column` that are referenced by at
/// least one of the rows listed in `row_bitset`.
fn compute_term_bitset(column: &BytesColumn, row_bitset: &ReadOnlyBitSet) -> BitSet {
    let mut term_bitset = BitSet::with_max_value(column.dictionary().num_terms() as u32);
    for row_id in row_bitset.iter() {
        column
            .term_ord_column
            .values_for_doc(row_id)
            .into_iter()
            .for_each(|term_ord| {
                term_bitset.insert(term_ord as u32);
            });
    }
    term_bitset
}

/// Returns true if the term the merger currently points to must be kept.
///
/// A term is kept as soon as one of the segments containing it either has no
/// term bitset, or has a bitset that contains the term ordinal.
fn is_term_present(bitsets: &[Option<BitSet>], term_merger: &TermMerger) -> bool {
    term_merger
        .matching_segments()
        .any(
            |(segment_ord, from_term_ord)| match bitsets[segment_ord].as_ref() {
                Some(bitset) => bitset.contains(from_term_ord as u32),
                None => true,
            },
        )
}

/// Merges the dictionaries of `bytes_columns` into a single dictionary
/// written to `output`, and returns the mapping from the old term ordinals of
/// each segment to the merged term ordinals.
///
/// With a `Stack` merge order, every term is kept. With a `Shuffled` merge
/// order, terms for which `is_term_present` returns false are left out of the
/// merged dictionary.
fn serialize_merged_dict(
    bytes_columns: &[Option<BytesColumn>],
    merge_row_order: &MergeRowOrder,
    output: &mut impl Write,
) -> io::Result<TermOrdinalMapping> {
    let mut term_ord_mapping = TermOrdinalMapping::default();

    // One term stream per segment. Segments without a column get an empty stream.
    let mut field_term_streams = Vec::new();
    for (segment_ord, column_opt) in bytes_columns.iter().enumerate() {
        let terms: Streamer<VoidSSTable> = match column_opt {
            Some(column) => {
                term_ord_mapping.add_segment(column.dictionary.num_terms());
                column.dictionary.stream()?
            }
            None => {
                term_ord_mapping.add_segment(0);
                Streamer::empty()
            }
        };
        field_term_streams.push(TermsWithSegmentOrd { terms, segment_ord });
    }

    let mut merged_terms = TermMerger::new(field_term_streams);
    let mut sstable_builder = sstable::VoidSSTable::writer(output);

    // `None` means that no term is filtered out.
    let term_bitsets_opt: Option<Vec<Option<BitSet>>> = match merge_row_order {
        MergeRowOrder::Stack(_) => None,
        MergeRowOrder::Shuffled(shuffle_merge_order) => {
            assert_eq!(shuffle_merge_order.alive_bitsets.len(), bytes_columns.len());
            let term_bitsets = shuffle_merge_order
                .alive_bitsets
                .iter()
                .zip(bytes_columns.iter())
                .map(
                    |(alive_bitset_opt, bytes_column_opt)| match (alive_bitset_opt, bytes_column_opt)
                    {
                        (Some(alive_bitset), Some(bytes_column)) => {
                            Some(compute_term_bitset(bytes_column, alive_bitset))
                        }
                        _ => None,
                    },
                )
                .collect();
            Some(term_bitsets)
        }
    };

    let mut current_term_ord = 0;
    while merged_terms.advance() {
        let term_bytes: &[u8] = merged_terms.key();
        if let Some(term_bitsets) = term_bitsets_opt.as_deref() {
            if !is_term_present(term_bitsets, &merged_terms) {
                continue;
            }
        }
        sstable_builder.insert(term_bytes, &())?;
        for (segment_ord, from_term_ord) in merged_terms.matching_segments() {
            term_ord_mapping.register_from_to(segment_ord, from_term_ord, current_term_ord);
        }
        current_term_ord += 1;
    }
    sstable_builder.finish()?;
    Ok(term_ord_mapping)
}

/// Maps, for each segment, the term ordinals of that segment to the term
/// ordinals of the merged dictionary.
#[derive(Default, Debug)]
struct TermOrdinalMapping {
    /// Contains the new term ordinals for each segment.
    ///
    /// `per_segment_new_term_ordinals[segment_ord][old_term_ord]` is the new term ordinal.
    per_segment_new_term_ordinals: Vec<Vec<TermOrdinal>>,
}

impl TermOrdinalMapping {
    /// Appends a segment with `max_term_ord` entries, all initialized to the
    /// default term ordinal.
    fn add_segment(&mut self, max_term_ord: usize) {
        let new_term_ordinals = vec![TermOrdinal::default(); max_term_ord];
        self.per_segment_new_term_ordinals.push(new_term_ordinals);
    }

    /// Records that, in segment `segment_ord`, the term `from_ord` becomes `to_ord`.
    fn register_from_to(&mut self, segment_ord: usize, from_ord: TermOrdinal, to_ord: TermOrdinal) {
        let segment_mapping = &mut self.per_segment_new_term_ordinals[segment_ord];
        segment_mapping[from_ord as usize] = to_ord;
    }

    /// Returns the new term ordinals of segment `segment_ord`, indexed by old term ordinal.
    fn get_segment(&self, segment_ord: u32) -> &[TermOrdinal] {
        let segment_mapping = &self.per_segment_new_term_ordinals[segment_ord as usize];
        segment_mapping.as_slice()
    }
}


================================================
FILE: columnar/src/columnar/merge/merge_mapping.rs
================================================
use std::ops::Range;

use common::{BitSet, OwnedBytes, ReadOnlyBitSet};

use crate::{ColumnarReader, RowAddr, RowId};

/// Merge order in which the rows of the columnars are stacked one after the other.
pub struct StackMergeOrder {
    // Running total of the number of rows: `cumulated_row_ids[i]` is the
    // number of rows of the columnars `0..=i`.
    //
    // This does not start at 0. The first entry is the number of
    // rows in the first columnar.
    cumulated_row_ids: Vec<RowId>,
}

impl StackMergeOrder {
    /// Builds a stack merge order straight from the number of rows of each columnar.
    #[cfg(test)]
    pub fn stack_for_test(num_rows_per_columnar: &[u32]) -> StackMergeOrder {
        let cumulated_row_ids: Vec<RowId> = num_rows_per_columnar
            .iter()
            .scan(0, |cumulated_row_id, &num_rows| {
                *cumulated_row_id += num_rows;
                Some(*cumulated_row_id)
            })
            .collect();
        StackMergeOrder { cumulated_row_ids }
    }

    /// Builds the merge order that stacks the rows of `columnars`, in order.
    pub fn stack(columnars: &[&ColumnarReader]) -> StackMergeOrder {
        let cumulated_row_ids: Vec<RowId> = columnars
            .iter()
            .scan(0, |cumulated_row_id, columnar| {
                *cumulated_row_id += columnar.num_docs();
                Some(*cumulated_row_id)
            })
            .collect();
        StackMergeOrder { cumulated_row_ids }
    }

    /// Total number of rows after the merge (0 if there is no columnar).
    pub fn num_rows(&self) -> RowId {
        match self.cumulated_row_ids.last() {
            Some(&total_num_rows) => total_num_rows,
            None => 0,
        }
    }

    /// Row id, in the merged columnar, of the first row of columnar `columnar_id`.
    pub fn offset(&self, columnar_id: usize) -> RowId {
        match columnar_id.checked_sub(1) {
            Some(previous_columnar_id) => self.cumulated_row_ids[previous_columnar_id],
            None => 0,
        }
    }

    /// Range of row ids, in the merged columnar, holding the rows of columnar `columnar_id`.
    pub fn columnar_range(&self, columnar_id: usize) -> Range<RowId> {
        let start = self.offset(columnar_id);
        let end = self.offset(columnar_id + 1);
        start..end
    }
}

/// Describes how the rows of the input columnars are laid out in the merged columnar.
pub enum MergeRowOrder {
    /// Columnar tables are simply stacked one above the other.
    /// If the i-th entry of `columnar_readers` has n_row_i rows, then
    /// in the resulting columnar,
    /// rows [0..n_row_0) contain the rows of `columnar_readers[0]`, in order,
    /// rows [n_row_0..n_row_0 + n_row_1) contain the rows of `columnar_readers[1]`, in order.
    /// ..
    /// No document is deleted.
    Stack(StackMergeOrder),
    /// Some more complex mapping, that may interleave rows from the different readers,
    /// drop rows, or do both.
    Shuffled(ShuffleMergeOrder),
}

impl From<StackMergeOrder> for MergeRowOrder {
    fn from(stack_merge_order: StackMergeOrder) -> MergeRowOrder {
        MergeRowOrder::Stack(stack_merge_order)
    }
}

impl From<ShuffleMergeOrder> for MergeRowOrder {
    fn from(shuffle_merge_order: ShuffleMergeOrder) -> MergeRowOrder {
        MergeRowOrder::Shuffled(shuffle_merge_order)
    }
}

impl MergeRowOrder {
    pub fn num_rows(&self) -> RowId {
        match self {
            MergeRowOrder::Stack(stack_row_order) => stack_row_order.num_rows(),
            MergeRowOrder::Shuffled(complex_mapping) => complex_mapping.num_rows(),
        }
    }
}

/// Merge order described by an explicit mapping from new row ids to old row addresses.
pub struct ShuffleMergeOrder {
    /// For each row of the merged columnar, the address (segment and row id)
    /// of the row it comes from.
    pub new_row_id_to_old_row_id: Vec<RowAddr>,
    /// One optional bitset of row ids per segment.
    pub alive_bitsets: Vec<Option<ReadOnlyBitSet>>,
}

impl ShuffleMergeOrder {
    /// Builds a shuffle merge order from the mapping alone.
    ///
    /// The alive bitset of each segment is derived from the mapping: it
    /// contains exactly the rows of that segment that the mapping refers to.
    pub fn for_test(
        segment_num_rows: &[RowId],
        new_row_id_to_old_row_id: Vec<RowAddr>,
    ) -> ShuffleMergeOrder {
        let mut row_bitsets: Vec<BitSet> = Vec::with_capacity(segment_num_rows.len());
        for &num_rows in segment_num_rows {
            row_bitsets.push(BitSet::with_max_value(num_rows));
        }
        for row_addr in &new_row_id_to_old_row_id {
            row_bitsets[row_addr.segment_ord as usize].insert(row_addr.row_id);
        }
        // Round-trip each bitset through its serialized form to get a `ReadOnlyBitSet`.
        let mut alive_bitsets: Vec<Option<ReadOnlyBitSet>> = Vec::with_capacity(row_bitsets.len());
        for row_bitset in row_bitsets {
            let mut buffer = Vec::new();
            row_bitset.serialize(&mut buffer).unwrap();
            let data = OwnedBytes::new(buffer);
            alive_bitsets.push(Some(ReadOnlyBitSet::open(data)));
        }
        ShuffleMergeOrder {
            new_row_id_to_old_row_id,
            alive_bitsets,
        }
    }

    /// Number of rows of the merged columnar, i.e. the length of the mapping.
    pub fn num_rows(&self) -> RowId {
        let num_rows = self.new_row_id_to_old_row_id.len();
        num_rows as RowId
    }

    /// Iterates over the old row addresses, in the order of the new row ids.
    pub fn iter_new_to_old_row_addrs(&self) -> impl Iterator<Item = RowAddr> + '_ {
        self.new_row_id_to_old_row_id.as_slice().iter().copied()
    }
}


================================================
FILE: columnar/src/columnar/merge/mod.rs
================================================
mod merge_dict_column;
mod merge_mapping;
mod term_merger;

use std::collections::{BTreeMap, HashSet};
use std::io;
use std::net::Ipv6Addr;
use std::sync::Arc;

pub use merge_mapping::{MergeRowOrder, ShuffleMergeOrder, StackMergeOrder};

use super::writer::ColumnarSerializer;
use crate::column::{serialize_column_mappable_to_u64, serialize_column_mappable_to_u128};
use crate::column_values::MergedColumnValues;
use crate::columnar::ColumnarReader;
use crate::columnar::merge::merge_dict_column::merge_bytes_or_str_column;
use crate::columnar::writer::CompatibleNumericalTypes;
use crate::dynamic_column::DynamicColumn;
use crate::{
    BytesColumn, Column, ColumnIndex, ColumnType, ColumnValues, DynamicColumnHandle, NumericalType,
    NumericalValue,
};

/// Column types are grouped into different categories.
/// After merge, all columns belonging to the same category are coerced to
/// the same column type.
///
/// In practice, only numerical columns are coerced into one type today:
/// every other category maps to a single column type.
///
/// See also [README.md].
///
/// The ordering has to match the ordering of the variants in [ColumnType].
#[derive(Copy, Clone, Eq, PartialOrd, Ord, PartialEq, Hash, Debug)]
pub(crate) enum ColumnTypeCategory {
    Numerical,
    Bytes,
    Str,
    Bool,
    IpAddr,
    DateTime,
}

impl From<ColumnType> for ColumnTypeCategory {
    /// Returns the category of a column type: `I64`, `U64` and `F64` are all
    /// `Numerical`, every other column type has a category of its own.
    fn from(column_type: ColumnType) -> Self {
        match column_type {
            ColumnType::I64 | ColumnType::U64 | ColumnType::F64 => Self::Numerical,
            ColumnType::Bytes => Self::Bytes,
            ColumnType::Str => Self::Str,
            ColumnType::Bool => Self::Bool,
            ColumnType::IpAddr => Self::IpAddr,
            ColumnType::DateTime => Self::DateTime,
        }
    }
}

/// Merges several columnar tables together.
///
/// If several columns with the same name have conflicting numerical types in the
/// input columnars, the first compatible type out of i64, u64, f64 (in that order) is used.
///
/// `required_columns` makes it possible to ensure that some columns will be present in the
/// resulting columnar. When a required column is a numerical column type, one of two things can
/// happen:
/// - If the required column type is compatible with all of the input columnars, the merged
///   columnar simply coerces the input columns and uses the required column type.
/// - If the required column type is incompatible with one of the input columnars, the merge
///   fails with an InvalidData error.
///
/// `merge_row_order` makes it possible to remove or reorder rows in the resulting
/// `Columnar` table.
///
/// Reminder: a string and a numerical column may bear the same column name. This is not
/// considered a conflict.
pub fn merge_columnar(
    columnar_readers: &[&ColumnarReader],
    required_columns: &[(String, ColumnType)],
    merge_row_order: MergeRowOrder,
    output: &mut impl io::Write,
) -> io::Result<()> {
    let mut serializer = ColumnarSerializer::new(output);
    let num_docs_per_columnar: Vec<u32> = columnar_readers
        .iter()
        .map(|reader| reader.num_docs())
        .collect();

    let columns_to_merge = group_columns_for_merge(columnar_readers, required_columns)?;
    for ((column_name, _column_type_category), column_handles) in columns_to_merge {
        let grouped_columns = column_handles.open(&merge_row_order)?;
        if grouped_columns.is_empty() {
            // Nothing to write for this column.
            continue;
        }

        let column_type_after_merge = grouped_columns.column_type_after_merge();
        let mut columns = grouped_columns.columns;
        // Make sure the number of columns is the same as the number of columnar readers.
        // Or num_docs_per_columnar would be incorrect.
        assert_eq!(columns.len(), columnar_readers.len());
        coerce_columns(column_type_after_merge, &mut columns)?;

        let mut column_serializer =
            serializer.start_serialize_column(column_name.as_bytes(), column_type_after_merge);
        merge_column(
            column_type_after_merge,
            &num_docs_per_columnar,
            columns,
            &merge_row_order,
            &mut column_serializer,
        )?;
        column_serializer.finalize()?;
    }

    let num_rows_after_merge = merge_row_order.num_rows();
    serializer.finalize(num_rows_after_merge)?;
    Ok(())
}

/// Converts a dynamic column into a `Column<u64>` via `to_u64_monotonic`.
///
/// Returns `None` for the `IpAddr`, `Bytes` and `Str` variants.
fn dynamic_column_to_u64_monotonic(dynamic_column: DynamicColumn) -> Option<Column<u64>> {
    let u64_column = match dynamic_column {
        DynamicColumn::Bool(column) => column.to_u64_monotonic(),
        DynamicColumn::I64(column) => column.to_u64_monotonic(),
        DynamicColumn::U64(column) => column.to_u64_monotonic(),
        DynamicColumn::F64(column) => column.to_u64_monotonic(),
        DynamicColumn::DateTime(column) => column.to_u64_monotonic(),
        DynamicColumn::IpAddr(_) | DynamicColumn::Bytes(_) | DynamicColumn::Str(_) => {
            return None;
        }
    };
    Some(u64_column)
}

fn merge_column(
    column_type: ColumnType,
    num_docs_per_column: &[u32],
    columns_to_merge: Vec<Option<DynamicColumn>>,
    merge_row_order: &MergeRowOrder,
    wrt: &mut impl io::Write,
) -> io::Result<()> {
    match column_type {
        ColumnType::I64
        | ColumnType::U64
        | ColumnType::F64
        | ColumnType::DateTime
        | ColumnType::Bool => {
            let mut column_indexes: Vec<ColumnIndex> = Vec::with_capacity(columns_to_merge.len());
            let mut column_values: Vec<Option<Arc<dyn ColumnValues>>> =
                Vec::with_capacity(columns_to_merge.len());
            for (i, dynamic_column_opt) in columns_to_merge.into_iter().enumerate() {
                match dynamic_column_opt.and_then(dynamic_column_to_u64_monotonic) {
                    Some(Column { index: idx, values }) => {
                        column_indexes.push(idx);
                        column_values.push(Some(values));
                    }
                    None => {
                        column_indexes.push(ColumnIndex::Empty {
                            num_docs: num_docs_per_column[i],
                        });
                        column_values.push(None);
                    }
                }
            }
            let merged_column_index =
                crate::column_index::merge_column_index(&column_indexes[..], merge_row_order);
            let merge_column_values = MergedColumnValues {
                column_indexes: &column_indexes[..],
                column_values: &column_values[..],
                merge_row_order,
            };
            serialize_column_mappable_to_u64(merged_column_index, &merge_column_values, wrt)?;
        }
        ColumnType::IpAddr => {
            let mut column_indexes: Vec<ColumnIndex> = Vec::with_capacity(columns_to_merge.len());
            let mut column_values: Vec<Option<Arc<dyn ColumnValues<Ipv6Addr>>>> =
                Vec::with_capacity(columns_to_merge.len());
            for (i, dynamic_column_opt) in columns_to_merge.into_iter().enumerate() {
                if let Some(DynamicColumn::IpAddr(Column { index: idx, values })) =
                    dynamic_column_opt
                {
                    column_indexes.push(idx);
                    column_values.push(Some(values));
                } else {
                    column_indexes.push(ColumnIndex::Empty {
                        num_docs: num_docs_per_column[i],
                    });
                    column_values.push(None);
                }
            }

            let merged_column_index =
                crate::column_index::merge_column_index(&column_indexes[..], merge_row_order);
            let merge_column_values = MergedColumnValues {
                column_indexes: &column_indexes[..],
                column_values: &column_values,
                merge_row_order,
            };

            serialize_column_mappable_to_u128(merged_column_index, &merge_column_values, wrt)?;
        }
        ColumnType::Bytes | ColumnType::Str => {
            let mut column_indexes: Vec<ColumnIndex> = Vec::with_capacity(columns_to_merge.len());
            let mut bytes_columns: Vec<Option<BytesColumn>> =
                Vec::with_capacity(columns_to_merge.len());
            for (i, dynamic_column_opt) in columns_to_merge.into_iter().enumerate() {
                match dynamic_column_opt {
                    Some(DynamicColumn::Str(str_column)) => {
                        column_indexes.push(str_column.term_ord_column.index.clone());
                        bytes_columns.push(Some(str_column.into()));
                    }
                    Some(DynamicColumn::Bytes(bytes_column)) => {
                        column_indexes.push(bytes_column.term_ord_column.index.clone());
                        bytes_columns.push(Some(bytes_column));
                    }
                    _ => {
                        column_indexes.push(ColumnIndex::Empty {
                            num_docs: num_docs_per_column[i],
                        });
                        bytes_columns.push(None);
                    }
                }
            }
            let merged_column_index =
                crate::column_index::merge_column_index(&column_indexes[..], merge_row_order);
            merge_bytes_or_str_column(merged_column_index, &bytes_columns, merge_row_order, wrt)?;
        }
    }
    Ok(())
}

/// The opened columns of one column group, ready to be merged.
struct GroupedColumns {
    /// If set, the column type the merged column must have.
    required_column_type: Option<ColumnType>,
    /// The columns of the group. `None` marks a slot with no column to merge.
    columns: Vec<Option<DynamicColumn>>,
}

impl GroupedColumns {
    /// Checks whether the column group can be skipped during serialization:
    /// no column type is required and none of the slots holds a column.
    fn is_empty(&self) -> bool {
        let has_any_column = self.columns.iter().any(Option::is_some);
        self.required_column_type.is_none() && !has_any_column
    }

    /// Returns the column type after merge.
    ///
    /// The required column type wins if there is one. Otherwise, if all the
    /// columns share a single type, that type is returned. Failing that, the
    /// columns must all be numerical and their common numerical type is used.
    ///
    /// This method does not check if the column types can actually be coerced to
    /// this type.
    fn column_type_after_merge(&self) -> ColumnType {
        if let Some(required_type) = self.required_column_type {
            return required_type;
        }
        let present_columns = || self.columns.iter().flatten();
        let distinct_types: HashSet<ColumnType> = present_columns()
            .map(|column| column.column_type())
            .collect();
        let mut distinct_types_iter = distinct_types.into_iter();
        if let (Some(single_type), None) = (distinct_types_iter.next(), distinct_types_iter.next())
        {
            return single_type;
        }
        // At the moment, only the numerical column type category has more than one possible
        // column type.
        assert!(
            present_columns().all(|el| ColumnTypeCategory::from(el.column_type())
                == ColumnTypeCategory::Numerical)
        );
        merged_numerical_columns_type(present_columns()).into()
    }
}

/// The column handles of one column group, before the columns are opened.
struct GroupedColumnsHandle {
    /// If set, the column type the merged column must have.
    required_column_type: Option<ColumnType>,
    /// One slot per columnar. `None` if no column was set for that columnar.
    columns: Vec<Option<DynamicColumnHandle>>,
}

impl GroupedColumnsHandle {
    /// Creates a group with one empty slot per columnar and no required type.
    fn new(num_columnars: usize) -> Self {
        let columns = vec![None; num_columnars];
        GroupedColumnsHandle {
            required_column_type: None,
            columns,
        }
    }

    /// Opens every registered column handle and returns the resulting `GroupedColumns`.
    ///
    /// Columns that end up with 0 documents after the merge are replaced by `None`.
    /// That way, we make sure they don't end up influencing the merge type or
    /// creating empty columns.
    ///
    /// # Errors
    /// Returns the first error hit while opening a column.
    fn open(self, merge_row_order: &MergeRowOrder) -> io::Result<GroupedColumns> {
        let columns = self
            .columns
            .iter()
            .enumerate()
            .map(
                |(columnar_id, handle_opt)| -> io::Result<Option<DynamicColumn>> {
                    let Some(handle) = handle_opt else {
                        return Ok(None);
                    };
                    let opened_column = handle.open()?;
                    let keep = !is_empty_after_merge(merge_row_order, &opened_column, columnar_id);
                    Ok(keep.then_some(opened_column))
                },
            )
            .collect::<io::Result<Vec<Option<DynamicColumn>>>>()?;
        Ok(GroupedColumns {
            required_column_type: self.required_column_type,
            columns,
        })
    }

    /// Set the dynamic column for a given columnar.
    fn set_column(&mut self, columnar_id: usize, column: DynamicColumnHandle) {
        let slot = &mut self.columns[columnar_id];
        *slot = Some(column);
    }

    /// Force the existence of a column, as well as its type.
    ///
    /// # Errors
    /// Returns an `InvalidInput` error if a different type was already required
    /// for this group.
    fn require_type(&mut self, required_type: ColumnType) -> io::Result<()> {
        match self.required_column_type {
            None => {
                self.required_column_type = Some(required_type);
                Ok(())
            }
            // This was just a duplicate in the `required_columns`.
            // Nothing to do.
            Some(already_required) if already_required == required_type => Ok(()),
            Some(_) => Err(io::Error::new(
                io::ErrorKind::InvalidInput,
                "Required column conflicts with another required column of the same type \
                 category.",
            )),
        }
    }
}

/// Returns the type of the merged numerical column.
///
/// This function picks the first numerical type out of i64, u64, f64 (order matters
/// here), that is compatible with all the `columns`.
///
/// Compatibility is decided from the (min, max) bounds reported by each column, as
/// returned by `min_max_if_numerical`.
///
/// # Panics
/// Panics if one of the columns is not numerical.
fn merged_numerical_columns_type<'a>(
    columns: impl Iterator<Item = &'a DynamicColumn>,
) -> NumericalType {
    let mut compatible_numerical_types = CompatibleNumericalTypes::default();
    for column in columns {
        let (min_value, max_value) =
            min_max_if_numerical(column).expect("All columns are required to be numerical");
        // Only the two bounds are fed in: every value of the column lies between them.
        compatible_numerical_types.accept_value(min_value);
        compatible_numerical_types.accept_value(max_value);
    }
    compatible_numerical_types.to_numerical_type()
}

/// Returns `true` if `column`, taken from the columnar number `columnar_ord`, holds no
/// value anymore once the merge described by `merge_row_order` has been applied.
fn is_empty_after_merge(
    merge_row_order: &MergeRowOrder,
    column: &DynamicColumn,
    columnar_ord: usize,
) -> bool {
    // It was empty before the merge.
    if column.num_values() == 0u32 {
        return true;
    }
    let alive_bitset_opt = match merge_row_order {
        // If we are stacking the columnar, no rows are being deleted.
        MergeRowOrder::Stack(_) => return false,
        MergeRowOrder::Shuffled(shuffled) => &shuffled.alive_bitsets[columnar_ord],
    };
    let Some(alive_bitset) = alive_bitset_opt else {
        // No document is being deleted.
        // The shuffle is applying a permutation.
        return false;
    };
    match column.column_index() {
        ColumnIndex::Empty { .. } => true,
        ColumnIndex::Full => alive_bitset.len() == 0,
        // Empty unless at least one doc holding a value is still alive.
        ColumnIndex::Optional(optional_index) => !optional_index
            .iter_non_null_docs()
            .any(|doc| alive_bitset.contains(doc)),
        // Empty if every alive doc has an empty range of values.
        ColumnIndex::Multivalued(multivalued_index) => alive_bitset
            .iter()
            .all(|alive_docid| multivalued_index.range(alive_docid).is_empty()),
    }
}

/// Iterates over the columns of the columnar readers, grouped by column name.
/// Key functionality is that `open` of the Columns is done lazy per group.
fn group_columns_for_merge<'a>(
    columnar_readers: &'a [&'a ColumnarReader],
    required_columns: &'a [(String, ColumnType)],
) -> io::Result<BTreeMap<(String, ColumnTypeCategory), GroupedColumnsHandle>> {
    let mut columns: BTreeMap<(String, ColumnTypeCategory), GroupedColumnsHandle> = BTreeMap::new();

    for &(ref column_name, column_type) in required_columns {
        columns
            .entry((column_name.clone(), column_type.into()))
            .or_insert_with(|| GroupedColumnsHandle::new(columnar_readers.len()))
            .require_type(column_type)?;
    }

    for (columnar_id, columnar_reader) in columnar_readers.iter().enumerate() {
        let column_name_and_handle = columnar_reader.iter_columns()?;

        for (column_name, handle) in column_name_and_handle {
            let column_category: ColumnTypeCategory = handle.column_type().into();
            columns
                .entry((column_name, column_category))
                .or_insert_with(|| GroupedColumnsHandle::new(columnar_readers.len()))
                .set_column(columnar_id, handle);
        }
    }
    Ok(columns)
}

/// Coerces, in place, every present column of `columns` to `column_type`.
///
/// # Errors
/// Stops at the first column that cannot be coerced and returns its error. The slot of
/// that column is left set to `None`.
fn coerce_columns(
    column_type: ColumnType,
    columns: &mut [Option<DynamicColumn>],
) -> io::Result<()> {
    for slot in columns {
        *slot = slot
            .take()
            .map(|column| coerce_column(column_type, column))
            .transpose()?;
    }
    Ok(())
}

/// Coerces `column` to `column_type`.
///
/// If `column_type` is a numerical type, the column goes through `coerce_numerical`.
/// Otherwise no conversion is attempted: the column is returned untouched provided it
/// already has the requested type.
///
/// # Errors
/// Returns an `InvalidInput` error naming both types if the column cannot be coerced.
fn coerce_column(column_type: ColumnType, column: DynamicColumn) -> io::Result<DynamicColumn> {
    // Captured upfront: `coerce_numerical` consumes the column, and the error message
    // needs the original type.
    let original_type = column.column_type();
    let coercion_error = || {
        io::Error::new(
            io::ErrorKind::InvalidInput,
            format!("Cannot coerce column of type `{original_type:?}` to `{column_type:?}`"),
        )
    };
    if let Some(numerical_type) = column_type.numerical_type() {
        column
            .coerce_numerical(numerical_type)
            .ok_or_else(coercion_error)
    } else {
        if original_type != column_type {
            return Err(coercion_error());
        }
        Ok(column)
    }
}

/// Returns the (min, max) of a column provided it is numerical (i64, u64, f64), and
/// `None` for any other column type.
///
/// The min and the max are simply the numerical value as defined by `ColumnValue::min_value()`,
/// and `ColumnValue::max_value()`.
///
/// It is important to note that these values are only guaranteed to be lower/upper bound
/// (as opposed to min/max value).
/// If a column is empty, the min and max values are currently set to 0.
fn min_max_if_numerical(column: &DynamicColumn) -> Option<(NumericalValue, NumericalValue)> {
    let bounds: (NumericalValue, NumericalValue) = match column {
        DynamicColumn::I64(i64_column) => (
            i64_column.min_value().into(),
            i64_column.max_value().into(),
        ),
        DynamicColumn::U64(u64_column) => (
            u64_column.min_value().into(),
            u64_column.max_value().into(),
        ),
        DynamicColumn::F64(f64_column) => (
            f64_column.min_value().into(),
            f64_column.max_value().into(),
        ),
        DynamicColumn::Bool(_)
        | DynamicColumn::IpAddr(_)
        | DynamicColumn::DateTime(_)
        | DynamicColumn::Bytes(_)
        | DynamicColumn::Str(_) => return None,
    };
    Some(bounds)
}

#[cfg(test)]
mod tests;


================================================
FILE: columnar/src/columnar/merge/term_merger.rs
================================================
use std::cmp::Ordering;
use std::collections::BinaryHeap;

use sstable::TermOrdinal;

use crate::Streamer;

/// The terms of a column with the ordinal of the segment.
pub struct TermsWithSegmentOrd<'a> {
    /// Stream over the terms of the column; its current key is what the ordering of
    /// `TermsWithSegmentOrd` compares first.
    pub terms: Streamer<'a>,
    /// Ordinal of the segment the terms belong to. Used as the tie-breaker of the
    /// ordering and as the sole criterion of equality.
    pub segment_ord: usize,
}

/// Two streams are considered equal when they belong to the same segment.
impl PartialEq for TermsWithSegmentOrd<'_> {
    fn eq(&self, rhs: &Self) -> bool {
        rhs.segment_ord == self.segment_ord
    }
}

impl Eq for TermsWithSegmentOrd<'_> {}

impl PartialOrd for TermsWithSegmentOrd<'_> {
    fn partial_cmp(&self, rhs: &Self) -> Option<Ordering> {
        Some(Ord::cmp(self, rhs))
    }
}

/// Streams are ordered by (current key, segment ordinal), in REVERSE order: the
/// comparison is done from `rhs` to `self`, so that the stream with the smallest key
/// is the greatest element, i.e. the one sitting at the top of a `BinaryHeap`.
impl Ord for TermsWithSegmentOrd<'_> {
    fn cmp(&self, rhs: &Self) -> Ordering {
        rhs.terms
            .key()
            .cmp(self.terms.key())
            .then_with(|| rhs.segment_ord.cmp(&self.segment_ord))
    }
}

/// Given a list of sorted term streams,
/// returns an iterator over sorted unique terms.
///
/// The item yielded is actually a pair with
/// - the term
/// - a slice with the ordinal of the segments containing the terms.
pub struct TermMerger<'a> {
    /// Streams that have been advanced and are waiting for their current term to be
    /// emitted. The reversed ordering of `TermsWithSegmentOrd` puts the smallest key on top.
    heap: BinaryHeap<TermsWithSegmentOrd<'a>>,
    /// After a successful `advance()`: the streams positioned on the current term.
    /// Before the first `advance()`: all the input streams, not advanced yet.
    term_streams_with_segment: Vec<TermsWithSegmentOrd<'a>>,
}

impl<'a> TermMerger<'a> {
    /// Stream of merged term dictionary
    ///
    /// The streams are not advanced here; the first call to `advance()` does it.
    pub fn new(term_streams_with_segment: Vec<TermsWithSegmentOrd<'a>>) -> TermMerger<'a> {
        let heap = BinaryHeap::new();
        TermMerger {
            heap,
            term_streams_with_segment,
        }
    }

    /// Iterates over the `(segment ordinal, term ordinal)` pairs of the streams that
    /// are positioned on the current term.
    pub(crate) fn matching_segments<'b: 'a>(
        &'b self,
    ) -> impl 'b + Iterator<Item = (usize, TermOrdinal)> {
        self.term_streams_with_segment.iter().map(|current| {
            let term_ord = current.terms.term_ord();
            (current.segment_ord, term_ord)
        })
    }

    /// Advances all the streams of the current term, and pushes back into the heap
    /// those that still have a term. Exhausted streams are dropped.
    fn advance_segments(&mut self) {
        let Self {
            heap,
            term_streams_with_segment,
        } = self;
        for mut streamer in term_streams_with_segment.drain(..) {
            if !streamer.terms.advance() {
                continue;
            }
            heap.push(streamer);
        }
    }

    /// Advance the term iterator to the next term.
    /// Returns true if there is indeed another term
    /// False if there is none.
    pub fn advance(&mut self) -> bool {
        self.advance_segments();
        let Some(head) = self.heap.pop() else {
            return false;
        };
        self.term_streams_with_segment.push(head);
        // Gather all the other streams positioned on the very same term.
        while matches!(
            self.heap.peek(),
            Some(candidate)
                if candidate.terms.key() == self.term_streams_with_segment[0].terms.key()
        ) {
            if let Some(same_term_stream) = self.heap.pop() {
                self.term_streams_with_segment.push(same_term_stream);
            }
        }
        true
    }

    /// Returns the current term.
    ///
    /// This method may be called
    /// if and only if advance() has been called before
    /// and "true" was returned.
    pub fn key(&self) -> &[u8] {
        let current = &self.term_streams_with_segment[0];
        current.terms.key()
    }
}


================================================
FILE: columnar/src/columnar/merge/tests.rs
================================================
use itertools::Itertools;
use proptest::collection::vec;
use proptest::prelude::*;

use super::*;
use crate::columnar::{ColumnarReader, MergeRowOrder, StackMergeOrder, merge_columnar};
use crate::{Cardinality, ColumnarWriter, DynamicColumn, HasAssociatedColumnType, RowId};

/// Builds a columnar with a single numerical column `column_name`, holding exactly
/// one value per row: row `i` gets `vals[i]`.
fn make_columnar<T: Into<NumericalValue> + HasAssociatedColumnType + Copy>(
    column_name: &str,
    vals: &[T],
) -> ColumnarReader {
    let mut writer = ColumnarWriter::default();
    writer.record_column_type(column_name, T::column_type(), false);
    for (row_id, &val) in vals.iter().enumerate() {
        writer.record_numerical(row_id as RowId, column_name, val.into());
    }
    let num_rows = vals.len() as RowId;
    let mut serialized: Vec<u8> = Vec::new();
    writer.serialize(num_rows, &mut serialized).unwrap();
    ColumnarReader::open(serialized).unwrap()
}

/// An i64 column and a u64 column with the same name end up in one numerical group.
#[test]
fn test_column_coercion_to_u64() {
    let i64_columnar = make_columnar("numbers", &[1i64]);
    let u64_columnar = make_columnar("numbers", &[u64::MAX]);
    let groups: BTreeMap<(String, ColumnTypeCategory), GroupedColumnsHandle> =
        group_columns_for_merge(&[&i64_columnar, &u64_columnar], &[]).unwrap();
    let numbers_key = ("numbers".to_string(), ColumnTypeCategory::Numerical);
    assert_eq!(groups.len(), 1);
    assert!(groups.contains_key(&numbers_key));
}

/// A negative i64 column and a small u64 column with the same name end up in one
/// numerical group.
#[test]
fn test_column_coercion_to_i64() {
    let i64_columnar = make_columnar("numbers", &[-1i64]);
    let u64_columnar = make_columnar("numbers", &[2u64]);
    let groups: BTreeMap<(String, ColumnTypeCategory), GroupedColumnsHandle> =
        group_columns_for_merge(&[&i64_columnar, &u64_columnar], &[]).unwrap();
    let numbers_key = ("numbers".to_string(), ColumnTypeCategory::Numerical);
    assert_eq!(groups.len(), 1);
    assert!(groups.contains_key(&numbers_key));
}

//#[test]
// fn test_impossible_coercion_returns_an_error() {
// let columnar1 = make_columnar("numbers", &[u64::MAX]);
// let merge_order = StackMergeOrder::stack(&[&columnar1]).into();
// let group_error = group_columns_for_merge_iter(
//&[&columnar1],
//&[("numbers".to_string(), ColumnType::I64)],
//&merge_order,
//)
//.unwrap_err();
// assert_eq!(group_error.kind(), io::ErrorKind::InvalidInput);
//}

/// Requiring a u64 column named like existing numerical columns does not create an
/// extra group.
#[test]
fn test_group_columns_with_required_column() {
    let i64_columnar = make_columnar("numbers", &[1i64]);
    let u64_columnar = make_columnar("numbers", &[2u64]);
    let required_columns = [("numbers".to_string(), ColumnType::U64)];
    let groups: BTreeMap<(String, ColumnTypeCategory), GroupedColumnsHandle> =
        group_columns_for_merge(&[&i64_columnar, &u64_columnar], &required_columns).unwrap();
    let numbers_key = ("numbers".to_string(), ColumnTypeCategory::Numerical);
    assert_eq!(groups.len(), 1);
    assert!(groups.contains_key(&numbers_key));
}

/// A required column that no columnar holds still gets its own group, with one
/// empty slot per columnar.
#[test]
fn test_group_columns_required_column_with_no_existing_columns() {
    let first_columnar = make_columnar("numbers", &[2u64]);
    let second_columnar = make_columnar("numbers", &[2u64]);
    let required_columns = [("required_col".to_string(), ColumnType::Str)];
    let groups: BTreeMap<_, _> =
        group_columns_for_merge(&[&first_columnar, &second_columnar], &required_columns)
            .unwrap();
    assert_eq!(groups.len(), 2);
    let required_key = ("required_col".to_string(), ColumnTypeCategory::Str);
    let required_group = groups.get(&required_key).unwrap();
    assert_eq!(required_group.columns.len(), 2);
    assert!(required_group.columns.iter().all(Option::is_none));
}

/// Requiring a u64 column while all the existing columns are i64 still yields a
/// single numerical group.
#[test]
fn test_group_columns_required_column_is_above_all_columns_have_the_same_type_rule() {
    let first_columnar = make_columnar("numbers", &[2i64]);
    let second_columnar = make_columnar("numbers", &[2i64]);
    let required_columns = [("numbers".to_string(), ColumnType::U64)];
    let groups: BTreeMap<(String, ColumnTypeCategory), GroupedColumnsHandle> =
        group_columns_for_merge(&[&first_columnar, &second_columnar], &required_columns)
            .unwrap();
    let numbers_key = ("numbers".to_string(), ColumnTypeCategory::Numerical);
    assert_eq!(groups.len(), 1);
    assert!(groups.contains_key(&numbers_key));
}

/// Columns with different names go to different groups, and each group only has the
/// slot of the columnar that actually holds the column filled in.
#[test]
fn test_missing_column() {
    let numbers_columnar = make_columnar("numbers", &[-1i64]);
    let numbers2_columnar = make_columnar("numbers2", &[2u64]);
    let groups: BTreeMap<(String, ColumnTypeCategory), GroupedColumnsHandle> =
        group_columns_for_merge(&[&numbers_columnar, &numbers2_columnar], &[]).unwrap();
    assert_eq!(groups.len(), 2);

    let numbers_key = ("numbers".to_string(), ColumnTypeCategory::Numerical);
    assert!(groups.contains_key(&numbers_key));
    let numbers_slots = &groups.get(&numbers_key).unwrap().columns;
    assert!(numbers_slots[0].is_some());
    assert!(numbers_slots[1].is_none());

    let numbers2_key = ("numbers2".to_string(), ColumnTypeCategory::Numerical);
    let numbers2_slots = &groups.get(&numbers2_key).unwrap().columns;
    assert!(numbers2_slots[0].is_none());
    assert!(numbers2_slots[1].is_some());
}

/// Builds a columnar out of several numerical columns.
///
/// Each column is given as `(name, rows)`, where `rows[i]` lists the values of row `i`.
/// The number of rows of the columnar is the length of the longest column (0 if there
/// is no column).
fn make_numerical_columnar_multiple_columns(
    columns: &[(&str, &[&[NumericalValue]])],
) -> ColumnarReader {
    let mut writer = ColumnarWriter::default();
    for &(column_name, rows) in columns {
        for (row_id, row_vals) in rows.iter().enumerate() {
            for &val in row_vals.iter() {
                writer.record_numerical(row_id as u32, column_name, val);
            }
        }
    }
    let num_rows = columns
        .iter()
        .map(|(_, rows)| rows.len() as RowId)
        .max()
        .unwrap_or(0u32);
    let mut serialized: Vec<u8> = Vec::new();
    writer.serialize(num_rows, &mut serialized).unwrap();
    ColumnarReader::open(serialized).unwrap()
}

/// Builds a columnar of `num_rows` rows out of several bytes columns.
///
/// Each column is given as `(name, rows)`, where `rows[i]` lists the values of row `i`.
///
/// # Panics
/// Panics if a column does not have exactly `num_rows` rows.
#[track_caller]
fn make_byte_columnar_multiple_columns(
    columns: &[(&str, &[&[&[u8]]])],
    num_rows: u32,
) -> ColumnarReader {
    let mut writer = ColumnarWriter::default();
    for &(column_name, rows) in columns {
        assert_eq!(
            rows.len(),
            num_rows as usize,
            "All columns must have `{num_rows}` rows"
        );
        for (row_id, row_vals) in rows.iter().enumerate() {
            for &val in row_vals.iter() {
                writer.record_bytes(row_id as u32, column_name, val);
            }
        }
    }
    let mut serialized: Vec<u8> = Vec::new();
    writer.serialize(num_rows, &mut serialized).unwrap();
    ColumnarReader::open(serialized).unwrap()
}

/// Builds a columnar out of several text columns.
///
/// Each column is given as `(name, rows)`, where `rows[i]` lists the values of row `i`.
/// The number of rows of the columnar is the length of the longest column (0 if there
/// is no column).
fn make_text_columnar_multiple_columns(columns: &[(&str, &[&[&str]])]) -> ColumnarReader {
    let mut writer = ColumnarWriter::default();
    for &(column_name, rows) in columns {
        for (row_id, row_vals) in rows.iter().enumerate() {
            for &val in row_vals.iter() {
                writer.record_str(row_id as u32, column_name, val);
            }
        }
    }
    let num_rows = columns
        .iter()
        .map(|(_, rows)| rows.len() as RowId)
        .max()
        .unwrap_or(0u32);
    let mut serialized: Vec<u8> = Vec::new();
    writer.serialize(num_rows, &mut serialized).unwrap();
    ColumnarReader::open(serialized).unwrap()
}

/// Stacks a 1-row and a 2-row columnar holding the same f64 column, and checks the
/// merged column row by row.
#[test]
fn test_merge_columnar_numbers() {
    let first_columnar =
        make_numerical_columnar_multiple_columns(&[("numbers", &[&[NumericalValue::from(-1f64)]])]);
    let second_columnar = make_numerical_columnar_multiple_columns(&[(
        "numbers",
        &[&[], &[NumericalValue::from(-3f64)]],
    )]);
    let columnars: [&ColumnarReader; 2] = [&first_columnar, &second_columnar];
    let merge_row_order = MergeRowOrder::Stack(StackMergeOrder::stack(&columnars));
    let mut merged_bytes = Vec::new();
    merge_columnar(&columnars, &[], merge_row_order, &mut merged_bytes).unwrap();

    let merged_reader = ColumnarReader::open(merged_bytes).unwrap();
    assert_eq!(merged_reader.num_docs(), 3);
    assert_eq!(merged_reader.num_columns(), 1);
    let handles = merged_reader.read_columns("numbers").unwrap();
    let DynamicColumn::F64(vals) = handles[0].open().unwrap() else {
        panic!()
    };
    assert_eq!(vals.get_cardinality(), Cardinality::Optional);
    // Row 1 is the empty first row of the second columnar.
    let first_vals: Vec<Option<f64>> = (0u32..3u32).map(|row_id| vals.first(row_id)).collect();
    assert_eq!(first_vals, vec![Some(-1f64), None, Some(-3f64)]);
}

/// Stacks a 1-row and a 2-row columnar holding the same text column, and checks the
/// merged dictionary as well as the term of each row.
#[test]
fn test_merge_columnar_texts() {
    // Second columnar: its first row has no value.
    let columnar1 = make_text_columnar_multiple_columns(&[("texts", &[&["a"]])]);
    let columnar2 = make_text_columnar_multiple_columns(&[("texts", &[&[], &["b"]])]);
    let mut buffer = Vec::new();
    let columnars = &[&columnar1, &columnar2];
    let stack_merge_order = StackMergeOrder::stack(columnars);
    crate::columnar::merge_columnar(
        columnars,
        &[],
        MergeRowOrder::Stack(stack_merge_order),
        &mut buffer,
    )
    .unwrap();
    let columnar_reader = ColumnarReader::open(buffer).unwrap();
    assert_eq!(columnar_reader.num_docs(), 3);
    assert_eq!(columnar_reader.num_columns(), 1);
    let cols = columnar_reader.read_columns("texts").unwrap();
    let dynamic_column = cols[0].open().unwrap();
    let DynamicColumn::Str(vals) = dynamic_column else {
        panic!()
    };
    assert_eq!(vals.ords().get_cardinality(), Cardinality::Optional);

    // Resolves a term ordinal of the merged dictionary into its string.
    let get_str_for_ord = |ord| {
        let mut out = String::new();
        vals.ord_to_str(ord, &mut out).unwrap();
        out
    };

    // The merged dictionary holds the terms of both columnars.
    assert_eq!(vals.dictionary.num_terms(), 2);
    assert_eq!(get_str_for_ord(0), "a");
    assert_eq!(get_str_for_ord(1), "b");

    // Returns the term of a row, or an empty string if the row has no term.
    // Asserts that the row has at most one term.
    let get_str_for_row = |row_id| {
        let term_ords: Vec<u64> = vals.term_ords(row_id).collect();
        assert!(term_ords.len() <= 1);
        let mut out = String::new();
        if term_ords.len() == 1 {
            vals.ord_to_str(term_ords[0], &mut out).unwrap();
        }
        out
    };

    assert_eq!(get_str_for_row(0), "a");
    assert_eq!(get_str_for_row(1), "");
    assert_eq!(get_str_for_row(2), "b");
}

/// Stacks two 2-row columnars holding the same bytes column, and checks the merged
/// dictionary as well as the term of each row.
#[test]
fn test_merge_columnar_byte() {
    let columnar1 = make_byte_columnar_multiple_columns(&[("bytes", &[&[b"bbbb"], &[b"baaa"]])], 2);
    // Second columnar: its first row has no value.
    let columnar2 = make_byte_columnar_multiple_columns(&[("bytes", &[&[], &[b"a"]])], 2);
    let mut buffer = Vec::new();
    let columnars = &[&columnar1, &columnar2];
    let stack_merge_order = StackMergeOrder::stack(columnars);
    crate::columnar::merge_columnar(
        columnars,
        &[],
        MergeRowOrder::Stack(stack_merge_order),
        &mut buffer,
    )
    .unwrap();
    let columnar_reader = ColumnarReader::open(buffer).unwrap();
    assert_eq!(columnar_reader.num_docs(), 4);
    assert_eq!(columnar_reader.num_columns(), 1);
    let cols = columnar_reader.read_columns("bytes").unwrap();
    let dynamic_column = cols[0].open().unwrap();
    let DynamicColumn::Bytes(vals) = dynamic_column else {
        panic!()
    };
    // Resolves a term ordinal of the merged dictionary into its bytes.
    let get_bytes_for_ord = |ord| {
        let mut out = Vec::new();
        vals.ord_to_bytes(ord, &mut out).unwrap();
        out
    };

    // The expected ordinals follow the byte order of the terms, not their insertion order.
    assert_eq!(vals.dictionary.num_terms(), 3);
    assert_eq!(get_bytes_for_ord(0), b"a");
    assert_eq!(get_bytes_for_ord(1), b"baaa");
    assert_eq!(get_bytes_for_ord(2), b"bbbb");

    // Returns the term of a row, or empty bytes if the row has no term.
    // Asserts that the row has at most one term.
    let get_bytes_for_row = |row_id| {
        let term_ords: Vec<u64> = vals.term_ords(row_id).collect();
        assert!(term_ords.len() <= 1);
        let mut out = Vec::new();
        if term_ords.len() == 1 {
            vals.ord_to_bytes(term_ords[0], &mut out).unwrap();
        }
        out
    };

    assert_eq!(get_bytes_for_row(0), b"bbbb");
    assert_eq!(get_bytes_for_row(1), b"baaa");
    assert_eq!(get_bytes_for_row(2), b"");
    assert_eq!(get_bytes_for_row(3), b"a");
}

/// Stacks three columnars where the bytes column `col` is absent from the first one,
/// optional in the second one and multivalued in the third one.
#[test]
fn test_merge_columnar_byte_with_missing() {
    // 3 rows, no column at all.
    let columnar1 = make_byte_columnar_multiple_columns(&[], 3);
    let columnar2 = make_byte_columnar_multiple_columns(&[("col", &[&[b"b"], &[]])], 2);
    let columnar3 = make_byte_columnar_multiple_columns(
        &[
            ("col", &[&[], &[b"b"], &[b"a", b"b"]]),
            ("col2", &[&[b"hello"], &[], &[b"a", b"b"]]),
        ],
        3,
    );
    let mut buffer = Vec::new();
    let columnars = &[&columnar1, &columnar2, &columnar3];
    let stack_merge_order = StackMergeOrder::stack(columnars);
    crate::columnar::merge_columnar(
        columnars,
        &[],
        MergeRowOrder::Stack(stack_merge_order),
        &mut buffer,
    )
    .unwrap();
    let columnar_reader = ColumnarReader::open(buffer).unwrap();
    assert_eq!(columnar_reader.num_docs(), 3 + 2 + 3);
    // `col` and `col2`.
    assert_eq!(columnar_reader.num_columns(), 2);
    let cols = columnar_reader.read_columns("col").unwrap();
    let dynamic_column = cols[0].open().unwrap();
    let DynamicColumn::Bytes(vals) = dynamic_column else {
        panic!()
    };
    // Resolves a term ordinal of the merged dictionary into its bytes.
    let get_bytes_for_ord = |ord| {
        let mut out = Vec::new();
        vals.ord_to_bytes(ord, &mut out).unwrap();
        out
    };
    assert_eq!(vals.dictionary.num_terms(), 2);
    assert_eq!(get_bytes_for_ord(0), b"a");
    assert_eq!(get_bytes_for_ord(1), b"b");
    // Returns all the terms of a row.
    let get_bytes_for_row = |row_id| {
        let terms: Vec<Vec<u8>> = vals
            .term_ords(row_id)
            .map(|term_ord| {
                let mut out = Vec::new();
                vals.ord_to_bytes(term_ord, &mut out).unwrap();
                out
            })
            .collect();
        terms
    };
    // Rows 0..3 come from `columnar1`, which has no `col` column.
    assert!(get_bytes_for_row(0).is_empty());
    assert!(get_bytes_for_row(1).is_empty());
    assert!(get_bytes_for_row(2).is_empty());
    // Rows 3..5 come from `columnar2`.
    assert_eq!(get_bytes_for_row(3), vec![b"b".to_vec()]);
    assert!(get_bytes_for_row(4).is_empty());
    // Rows 5..8 come from `columnar3`.
    assert!(get_bytes_for_row(5).is_empty());
    assert_eq!(get_bytes_for_row(6), vec![b"b".to_vec()]);
    assert_eq!(get_bytes_for_row(7), vec![b"a".to_vec(), b"b".to_vec()]);
}

/// Stacks columnars where the column `mixed` is a text column in the first two and an
/// i64 column in the third one: the merge must produce two distinct columns.
#[test]
fn test_merge_columnar_different_types() {
    let columnar1 = make_text_columnar_multiple_columns(&[("mixed", &[&["a"]])]);
    let columnar2 = make_text_columnar_multiple_columns(&[("mixed", &[&[], &["b"]])]);
    let columnar3 = make_columnar("mixed", &[1i64]);
    let mut buffer = Vec::new();
    let columnars = &[&columnar1, &columnar2, &columnar3];
    let stack_merge_order = StackMergeOrder::stack(columnars);
    crate::columnar::merge_columnar(
        columnars,
        &[],
        MergeRowOrder::Stack(stack_merge_order),
        &mut buffer,
    )
    .unwrap();
    let columnar_reader = ColumnarReader::open(buffer).unwrap();
    assert_eq!(columnar_reader.num_docs(), 4);
    assert_eq!(columnar_reader.num_columns(), 2);
    let cols = columnar_reader.read_columns("mixed").unwrap();

    // numeric column
    let dynamic_column = cols[0].open().unwrap();
    let DynamicColumn::I64(vals) = dynamic_column else {
        panic!()
    };
    assert_eq!(vals.get_cardinality(), Cardinality::Optional);
    // Only row 3 (the single row of `columnar3`) has a numerical value.
    assert_eq!(vals.values_for_doc(0).collect_vec(), Vec::<i64>::new());
    assert_eq!(vals.values_for_doc(1).collect_vec(), Vec::<i64>::new());
    assert_eq!(vals.values_for_doc(2).collect_vec(), Vec::<i64>::new());
    assert_eq!(vals.values_for_doc(3).collect_vec(), vec![1]);
    // NOTE(review): doc 4 is past `num_docs() == 4`; this presumably checks that an
    // out-of-range doc yields no value -- confirm this is intended.
    assert_eq!(vals.values_for_doc(4).collect_vec(), Vec::<i64>::new());

    // text column
    let dynamic_column = cols[1].open().unwrap();
    let DynamicColumn::Str(vals) = dynamic_column else {
        panic!()
    };
    assert_eq!(vals.ords().get_cardinality(), Cardinality::Optional);
    // Resolves a term ordinal of the merged dictionary into its string.
    let get_str_for_ord = |ord| {
        let mut out = String::new();
        vals.ord_to_str(ord, &mut out).unwrap();
        out
    };

    assert_eq!(vals.dictionary.num_terms(), 2);
    assert_eq!(get_str_for_ord(0), "a");
    assert_eq!(get_str_for_ord(1), "b");

    // Returns all the terms of a row, as strings.
    let get_str_for_row = |row_id| {
        let term_ords: Vec<String> = vals
            .term_ords(row_id)
            .map(|el| {
                let mut out = String::new();
                vals.ord_to_str(el, &mut out).unwrap();
                out
            })
            .collect();
        term_ords
    };

    assert_eq!(get_str_for_row(0), vec!["a".to_string()]);
    assert_eq!(get_str_for_row(1), Vec::<String>::new());
    assert_eq!(get_str_for_row(2), vec!["b".to_string()]);
    assert_eq!(get_str_for_row(3), Vec::<String>::new());
}

/// Stacks a text column and an i64 column sharing the same name: each one only covers
/// part of the merged rows, hence both merged columns must be optional.
#[test]
fn test_merge_columnar_different_empty_cardinality() {
    let text_columnar = make_text_columnar_multiple_columns(&[("mixed", &[&["a"]])]);
    let i64_columnar = make_columnar("mixed", &[1i64]);
    let columnars: [&ColumnarReader; 2] = [&text_columnar, &i64_columnar];
    let merge_row_order = MergeRowOrder::Stack(StackMergeOrder::stack(&columnars));
    let mut merged_bytes = Vec::new();
    merge_columnar(&columnars, &[], merge_row_order, &mut merged_bytes).unwrap();

    let merged_reader = ColumnarReader::open(merged_bytes).unwrap();
    assert_eq!(merged_reader.num_docs(), 2);
    assert_eq!(merged_reader.num_columns(), 2);
    let handles = merged_reader.read_columns("mixed").unwrap();

    // numeric column
    let numeric_column = handles[0].open().unwrap();
    assert_eq!(numeric_column.get_cardinality(), Cardinality::Optional);

    // text column
    let text_column = handles[1].open().unwrap();
    assert_eq!(text_column.get_cardinality(), Cardinality::Optional);
}

/// Description of one bytes column, used by the property tests to build a columnar.
#[derive(Debug, Clone)]
struct ColumnSpec {
    /// Name under which the terms are recorded.
    column_name: String,
    /// (row_id, term)
    terms: Vec<(RowId, Vec<u8>)>,
}

/// Description of one columnar, as the list of its columns. Turned into an actual
/// `ColumnarReader` by `build_columnar`.
#[derive(Clone, Debug)]
struct ColumnarSpec {
    /// Columns to record. Several specs may carry the same column name.
    columns: Vec<ColumnSpec>,
}

/// Generate a random (row_id, term) pair:
///  - row_id in [0..10]
///  - term is either from POSSIBLE_TERMS or random bytes
fn rowid_and_term_strategy() -> impl Strategy<Value = (RowId, Vec<u8>)> {
    const POSSIBLE_TERMS: &[&[u8]] = &[b"a", b"b", b"allo"];

    let term_strat = prop_oneof![
        // pick from the fixed list
        (0..POSSIBLE_TERMS.len()).prop_map(|i| POSSIBLE_TERMS[i].to_vec()),
        // or random bytes (length 0..10)
        prop::collection::vec(any::<u8>(), 0..10),
    ];

    (0u32..11, term_strat)
}

/// Generates one ColumnSpec, with a random name and a random list of (row_id, term).
/// The list is sorted by row_id so that data is in ascending row order.
fn column_spec_strategy() -> impl Strategy<Value = ColumnSpec> {
    let name_strat = prop_oneof![
        Just("col".to_string()),
        Just("col2".to_string()),
        "col.*".prop_map(|generated_name| generated_name),
    ];

    // 0..8 (rowid, term) entries per column.
    let terms_strat = vec(rowid_and_term_strategy(), 0..8).prop_map(|mut entries| {
        entries.sort_by_key(|&(row_id, _)| row_id);
        entries
    });

    (name_strat, terms_strat).prop_map(|(column_name, terms)| ColumnSpec { column_name, terms })
}

/// Strategy generating a ColumnarSpec made of 0 to 2 columns.
fn columnar_strategy() -> impl Strategy<Value = ColumnarSpec> {
    let columns_strat = vec(column_spec_strategy(), 0..3);
    columns_strat.prop_map(|columns| ColumnarSpec { columns })
}

/// Strategy generating 1 to 3 ColumnarSpecs. Each of them stands for one "columnar",
/// and all of them are meant to be merged together.
fn columnars_strategy() -> impl Strategy<Value = Vec<ColumnarSpec>> {
    let one_columnar = columnar_strategy();
    vec(one_columnar, 1..4)
}

/// Builds a `ColumnarReader` from a `ColumnarSpec`.
///
/// The columnar gets `max row_id + 1` rows, i.e. a single row if the spec has no term.
fn build_columnar(spec: &ColumnarSpec) -> ColumnarReader {
    let mut writer = ColumnarWriter::default();
    for column_spec in &spec.columns {
        for (row_id, term) in &column_spec.terms {
            writer.record_bytes(*row_id, &column_spec.column_name, term);
        }
    }
    let max_row_id = spec
        .columns
        .iter()
        .flat_map(|column_spec| column_spec.terms.iter().map(|&(row_id, _)| row_id))
        .max()
        .unwrap_or(0);

    let mut serialized = Vec::new();
    writer.serialize(max_row_id + 1, &mut serialized).unwrap();
    ColumnarReader::open(serialized).unwrap()
}

proptest! {
    // We just test that the merge_columnar function doesn't crash.
    // Two merges are chained: the output of the first one is fed, along with freshly
    // built columnars, into a second one. No assertion is made on the merged content.
    #![proptest_config(ProptestConfig::with_cases(256))]
    #[test]
    fn test_merge_columnar_bytes_no_crash(columnars in columnars_strategy(), second_merge_columnars in columnars_strategy()) {
        // First merge: stack the first set of generated columnars.
        let columnars: Vec<ColumnarReader> = columnars.iter()
            .map(build_columnar)
            .collect();

        let mut out = Vec::new();
        let columnar_refs: Vec<&ColumnarReader> = columnars.iter().collect();
        let stack_merge_order = StackMergeOrder::stack(&columnar_refs);
        merge_columnar(
            &columnar_refs,
            &[],
            MergeRowOrder::Stack(stack_merge_order),
            &mut out,
        ).unwrap();

        // The output of the first merge must be readable.
        let merged_reader = ColumnarReader::open(out).unwrap();

        // Merge the second set of columnars with the result of the first merge
        let mut columnars: Vec<ColumnarReader> = second_merge_columnars.iter()
            .map(build_columnar)
            .collect();
        columnars.push(merged_reader);
        let mut out = Vec::new();
        let columnar_refs: Vec<&ColumnarReader> = columnars.iter().collect();
        let stack_merge_order = StackMergeOrder::stack(&columnar_refs);
        merge_columnar(
            &columnar_refs,
            &[],
            MergeRowOrder::Stack(stack_merge_order),
            &mut out,
        ).unwrap();

    }
}


================================================
FILE: columnar/src/columnar/mod.rs
================================================
mod column_type;
mod format_version;
mod merge;
mod reader;
mod writer;

pub use column_type::{ColumnType, HasAssociatedColumnType};
pub use format_version::{CURRENT_VERSION, Version};
#[cfg(test)]
pub(crate) use merge::ColumnTypeCategory;
pub use merge::{MergeRowOrder, ShuffleMergeOrder, StackMergeOrder, merge_columnar};
pub use reader::ColumnarReader;
pub use writer::ColumnarWriter;


================================================
FILE: columnar/src/columnar/reader/mod.rs
================================================
use std::{fmt, io, mem};

use common::BinarySerializable;
use common::file_slice::FileSlice;
use common::json_path_writer::JSON_PATH_SEGMENT_SEP;
use sstable::{Dictionary, RangeSSTable};

use crate::columnar::{ColumnType, format_version};
use crate::dynamic_column::DynamicColumnHandle;
use crate::{RowId, Version};

/// Wraps `msg` into an [`io::Error`] of kind [`io::ErrorKind::InvalidData`].
fn io_invalid_data(msg: String) -> io::Error {
    let kind = io::ErrorKind::InvalidData;
    io::Error::new(kind, msg)
}

/// The ColumnarReader makes it possible to access a set of columns
/// associated to field names.
///
/// It is built from a single file slice (see `ColumnarReader::open`) that holds the
/// column payloads, a dictionary of column keys, and a fixed-size footer.
#[derive(Clone)]
pub struct ColumnarReader {
    // Dictionary of column keys. The value attached to each key is the byte range
    // of that column within `column_data`.
    column_dictionary: Dictionary<RangeSSTable>,
    // Bytes of all the columns; individual columns are sliced out of it on demand.
    column_data: FileSlice,
    // Number of rows, as read from the footer.
    num_docs: RowId,
    // Format version parsed from the footer; handed over to every column handle.
    format_version: Version,
}

impl fmt::Debug for ColumnarReader {
    /// Renders a bounded summary of the columnar: the number of rows, the number of
    /// columns, and the content of at most the first five columns (a column holding
    /// more than 10 values is abbreviated as `".."`).
    ///
    /// Errors returned by `list_columns()` or by opening a column are rendered as
    /// fields of the debug output instead of being unwrapped: debug-printing a
    /// reader should not abort the program because of an I/O error.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        // Only the first few columns are rendered, to keep the output short.
        const MAX_DISPLAYED_COLUMNS: usize = 5;

        let num_rows = self.num_docs();
        let mut debug_struct = f.debug_struct("Columnar");
        debug_struct.field("num_rows", &num_rows);
        let columns = match self.list_columns() {
            Ok(columns) => columns,
            Err(err) => {
                // The column list is unavailable: report why and stop here.
                return debug_struct.field("list_columns_error", &err).finish();
            }
        };
        let num_cols = columns.len();
        debug_struct.field("num_cols", &num_cols);
        for (col_name, dynamic_column_handle) in columns.into_iter().take(MAX_DISPLAYED_COLUMNS) {
            match dynamic_column_handle.open() {
                Ok(col) if col.num_values() > 10 => {
                    debug_struct.field(&col_name, &"..");
                }
                Ok(col) => {
                    debug_struct.field(&col_name, &col);
                }
                Err(err) => {
                    // Show the failure in place of the column content.
                    debug_struct.field(&col_name, &err);
                }
            }
        }
        if num_cols > MAX_DISPLAYED_COLUMNS {
            // Signal that some columns were left out.
            debug_struct.finish_non_exhaustive()
        } else {
            debug_struct.finish()
        }
    }
}

/// Helper shared by the sync and async column-listing code paths.
///
/// Consumes a stream over the column sstable and returns one
/// [`DynamicColumnHandle`] per entry, in stream order.
///
/// The last byte of each key is interpreted as the column type code, and the
/// value attached to the key is the byte range of the column within `column_data`.
///
/// # Errors
/// Returns an `InvalidData` error if a key is empty or if its type code is unknown.
fn read_all_columns_in_stream(
    mut stream: sstable::Streamer<'_, RangeSSTable>,
    column_data: &FileSlice,
    format_version: Version,
) -> io::Result<Vec<DynamicColumnHandle>> {
    let mut handles = Vec::new();
    while stream.advance() {
        let column_code = stream
            .key()
            .last()
            .copied()
            .ok_or_else(|| io_invalid_data("Empty column name.".to_string()))?;
        let column_type = match ColumnType::try_from_code(column_code) {
            Ok(column_type) => column_type,
            Err(_) => {
                return Err(io_invalid_data(format!(
                    "Unknown column code `{column_code}`"
                )));
            }
        };
        let byte_range = stream.value();
        let start = byte_range.start as usize;
        let end = byte_range.end as usize;
        handles.push(DynamicColumnHandle {
            file_slice: column_data.slice(start..end),
            column_type,
            format_version,
        });
    }
    Ok(handles)
}

/// Builds the dictionary key prefix shared by all the columns named `column_name`.
fn column_dictionary_prefix_for_column_name(column_name: &str) -> String {
    // A `column_key` has the form `column_name\0column_header`.
    //
    // All the columns registered under `column_name` are therefore exactly the
    // keys starting with `column_name\0`.
    let mut prefix = String::with_capacity(column_name.len() + 1);
    prefix.push_str(column_name);
    prefix.push('\0');
    prefix
}

/// Builds the dictionary key prefix `root_path` followed by [`JSON_PATH_SEGMENT_SEP`],
/// i.e. the prefix of the keys whose column name continues below `root_path`.
fn column_dictionary_prefix_for_subpath(root_path: &str) -> String {
    let mut prefix = String::from(root_path);
    prefix.push(JSON_PATH_SEGMENT_SEP as char);
    prefix
}

impl ColumnarReader {
    /// Opens a columnar from anything that converts into a [`FileSlice`].
    pub fn open<F>(file_slice: F) -> io::Result<ColumnarReader>
    where FileSlice: From<F> {
        let file_slice: FileSlice = file_slice.into();
        Self::open_inner(file_slice)
    }

    /// Parses the footer and splits the file into column data and column dictionary.
    ///
    /// The footer is read from the end of the file and is made of:
    /// the sstable length (`u64`), the number of rows (`u32`) and the version footer.
    fn open_inner(file_slice: FileSlice) -> io::Result<ColumnarReader> {
        let footer_len = mem::size_of::<u64>() + 4 + format_version::VERSION_FOOTER_NUM_BYTES;
        let (body, footer) = file_slice.split_from_end(footer_len);
        let footer_bytes = footer.read_bytes()?;
        let sstable_len = u64::deserialize(&mut &footer_bytes[0..8])?;
        let num_docs = u32::deserialize(&mut &footer_bytes[8..12])?;
        let version_footer: [u8; format_version::VERSION_FOOTER_NUM_BYTES] =
            footer_bytes[12..].try_into().unwrap();
        let format_version = format_version::parse_footer(version_footer)?;
        // The sstable sits right before the footer; everything before it is column data.
        let (column_data, sstable) = body.split_from_end(sstable_len as usize);
        let column_dictionary = Dictionary::open(sstable)?;
        Ok(ColumnarReader {
            column_dictionary,
            column_data,
            num_docs,
            format_version,
        })
    }

    /// Returns the number of rows stored in the footer of the columnar.
    pub fn num_docs(&self) -> RowId {
        self.num_docs
    }

    /// Iterates over `(column name, column handle)` pairs, in the order of the
    /// column dictionary stream.
    ///
    /// # Panics
    /// The returned iterator panics if a dictionary key is shorter than two bytes
    /// or ends with an unknown column type code.
    pub fn iter_columns(
        &self,
    ) -> io::Result<impl Iterator<Item = (String, DynamicColumnHandle)> + '_> {
        let mut stream = self.column_dictionary.stream()?;
        let next_column = move || {
            if !stream.advance() {
                return None;
            }
            let key_bytes: &[u8] = stream.key();
            let column_code: u8 = key_bytes.last().cloned().unwrap();
            // TODO Error Handling. Surfacing the error here makes the API quite ugly;
            // an alternative would be to validate the first N columns upfront.
            let column_type: ColumnType = ColumnType::try_from_code(column_code)
                .map_err(|_| io_invalid_data(format!("Unknown column code `{column_code}`")))
                .unwrap();
            let range = stream.value().clone();
            // A key ends with the 0u8 separator followed by the column type code:
            // stripping these two bytes leaves the column name.
            let name_len = key_bytes.len() - 2;
            let column_name = String::from_utf8_lossy(&key_bytes[..name_len]).to_string();
            let start = range.start as usize;
            let end = range.end as usize;
            let column_handle = DynamicColumnHandle {
                file_slice: self.column_data.slice(start..end),
                column_type,
                format_version: self.format_version,
            };
            Some((column_name, column_handle))
        };
        Ok(std::iter::from_fn(next_column))
    }

    // TODO Add unit tests
    /// Collects the output of [`Self::iter_columns`] into a `Vec`.
    pub fn list_columns(&self) -> io::Result<Vec<(String, DynamicColumnHandle)>> {
        let columns: Vec<(String, DynamicColumnHandle)> = self.iter_columns()?.collect();
        Ok(columns)
    }

    /// Async counterpart of [`Self::read_columns`].
    pub async fn read_columns_async(
        &self,
        column_name: &str,
    ) -> io::Result<Vec<DynamicColumnHandle>> {
        let prefix = column_dictionary_prefix_for_column_name(column_name);
        let stream_builder = self.column_dictionary.prefix_range(prefix);
        let stream = stream_builder.into_stream_async().await?;
        read_all_columns_in_stream(stream, &self.column_data, self.format_version)
    }

    /// Get all columns for the given column name.
    ///
    /// Several columns can share the same column name, as long as their types differ.
    pub fn read_columns(&self, column_name: &str) -> io::Result<Vec<DynamicColumnHandle>> {
        let prefix = column_dictionary_prefix_for_column_name(column_name);
        let stream_builder = self.column_dictionary.prefix_range(prefix);
        let stream = stream_builder.into_stream()?;
        read_all_columns_in_stream(stream, &self.column_data, self.format_version)
    }

    /// Async counterpart of [`Self::read_subpath_columns`].
    pub async fn read_subpath_columns_async(
        &self,
        root_path: &str,
    ) -> io::Result<Vec<DynamicColumnHandle>> {
        let prefix = column_dictionary_prefix_for_subpath(root_path);
        let stream_builder = self.column_dictionary.prefix_range(prefix);
        let stream = stream_builder.into_stream_async().await?;
        read_all_columns_in_stream(stream, &self.column_data, self.format_version)
    }

    /// Get all inner columns for a given JSON prefix, i.e. the columns whose name is
    /// `root_path` immediately followed by [`JSON_PATH_SEGMENT_SEP`].
    ///
    /// Several columns can be attached to each path within the JSON structure,
    /// as long as their types differ.
    pub fn read_subpath_columns(&self, root_path: &str) -> io::Result<Vec<DynamicColumnHandle>> {
        let prefix = column_dictionary_prefix_for_subpath(root_path);
        let stream_builder = self.column_dictionary.prefix_range(prefix.as_bytes());
        let stream = stream_builder.into_stream()?;
        read_all_columns_in_stream(stream, &self.column_data, self.format_version)
    }

    /// Return the number of columns in the columnar
    /// (the number of terms of the column dictionary).
    pub fn num_columns(&self) -> usize {
        self.column_dictionary.num_terms()
    }
}

// Unit tests for `ColumnarReader`: each test serializes a small columnar with
// `ColumnarWriter` into an in-memory buffer and reads it back.
#[cfg(test)]
mod tests {
    use common::json_path_writer::JSON_PATH_SEGMENT_SEP;

    use crate::{ColumnType, ColumnarReader, ColumnarWriter};

    // Columns that were only declared through `record_column_type` are listed,
    // in name order, with their declared type.
    #[test]
    fn test_list_columns() {
        let mut columnar_writer = ColumnarWriter::default();
        columnar_writer.record_column_type("col1", ColumnType::Str, false);
        columnar_writer.record_column_type("col2", ColumnType::U64, false);
        let mut buffer = Vec::new();
        columnar_writer.serialize(1, &mut buffer).unwrap();
        let columnar = ColumnarReader::open(buffer).unwrap();
        let columns = columnar.list_columns().unwrap();
        assert_eq!(columns.len(), 2);
        assert_eq!(&columns[0].0, "col1");
        assert_eq!(columns[0].1.column_type(), ColumnType::Str);
        assert_eq!(&columns[1].0, "col2");
        assert_eq!(columns[1].1.column_type(), ColumnType::U64);
    }

    // A column declared as U64 stays a U64 column after recording a u64 value.
    #[test]
    fn test_list_columns_strict_typing_prevents_coercion() {
        let mut columnar_writer = ColumnarWriter::default();
        columnar_writer.record_column_type("count", ColumnType::U64, false);
        columnar_writer.record_numerical(1, "count", 1u64);
        let mut buffer = Vec::new();
        columnar_writer.serialize(2, &mut buffer).unwrap();
        let columnar = ColumnarReader::open(buffer).unwrap();
        let columns = columnar.list_columns().unwrap();
        assert_eq!(columns.len(), 1);
        assert_eq!(&columns[0].0, "count");
        assert_eq!(columns[0].1.column_type(), ColumnType::U64);
    }

    // `read_columns` returns the columns of an existing name, and nothing for an
    // unknown name.
    #[test]
    fn test_read_columns() {
        let mut columnar_writer = ColumnarWriter::default();
        columnar_writer.record_column_type("col", ColumnType::U64, false);
        columnar_writer.record_numerical(1, "col", 1u64);
        let mut buffer = Vec::new();
        columnar_writer.serialize(2, &mut buffer).unwrap();
        let columnar = ColumnarReader::open(buffer).unwrap();
        {
            let columns = columnar.read_columns("col").unwrap();
            assert_eq!(columns.len(), 1);
            assert_eq!(columns[0].column_type(), ColumnType::U64);
        }
        {
            let columns = columnar.read_columns("other").unwrap();
            assert_eq!(columns.len(), 0);
        }
    }

    // `read_subpath_columns` only returns the columns nested under the given root
    // path: the column named exactly like the root and unrelated columns are excluded.
    #[test]
    fn test_read_subpath_columns() {
        let mut columnar_writer = ColumnarWriter::default();
        columnar_writer.record_str(
            0,
            &format!("col1{}subcol1", JSON_PATH_SEGMENT_SEP as char),
            "hello",
        );
        columnar_writer.record_numerical(
            0,
            &format!("col1{}subcol2", JSON_PATH_SEGMENT_SEP as char),
            1i64,
        );
        columnar_writer.record_str(1, "col1", "hello");
        columnar_writer.record_str(0, "col2", "hello");
        let mut buffer = Vec::new();
        columnar_writer.serialize(2, &mut buffer).unwrap();

        let columnar = ColumnarReader::open(buffer).unwrap();
        {
            // Both sub-columns of `col1` are found, but not `col1` itself.
            let columns = columnar.read_subpath_columns("col1").unwrap();
            assert_eq!(columns.len(), 2);
            assert_eq!(columns[0].column_type(), ColumnType::Str);
            assert_eq!(columns[1].column_type(), ColumnType::I64);
        }
        {
            // Note that this path is spelled with a `.`, not with `JSON_PATH_SEGMENT_SEP`.
            let columns = columnar.read_subpath_columns("col1.subcol1").unwrap();
            assert_eq!(columns.len(), 0);
        }
        {
            let columns = columnar.read_subpath_columns("col2").unwrap();
            assert_eq!(columns.len(), 0);
        }
        {
            let columns = columnar.read_subpath_columns("other").unwrap();
            assert_eq!(columns.len(), 0);
        }
    }

    // Recording an i64 into a column declared as U64 must panic with the
    // "Input type forbidden" message.
    #[test]
    #[should_panic(expected = "Input type forbidden")]
    fn test_list_columns_strict_typing_panics_on_wrong_types() {
        let mut columnar_writer = ColumnarWriter::default();
        columnar_writer.record_column_type("count", ColumnType::U64, false);
        columnar_writer.record_numerical(1, "count", 1i64);
    }
}


================================================
FILE: columnar/src/columnar/writer/column_operation.rs
================================================
use std::net::Ipv6Addr;

use crate::dictionary::UnorderedId;
use crate::utils::{place_bits, pop_first_byte, select_bits};
use crate::value::NumericalValue;
use crate::{InvalidData, NumericalType, RowId};

/// When we build a columnar dataframe, we first just group
/// all mutations per column, and append them to an append-only buffer
/// in the stacker.
///
/// These `ColumnOperation<T>` are therefore serialized/deserialized
/// in memory.
///
/// We represent all of these operations as `ColumnOperation`.
#[derive(Eq, PartialEq, Debug, Clone, Copy)]
pub(super) enum ColumnOperation<T> {
    // Marker carrying a row id. `ColumnWriter::record` emits it before the first
    // value of a row that differs from the last recorded row.
    NewDoc(RowId),
    // A value of the column.
    Value(T),
}

// Header of a serialized `ColumnOperation`.
//
// It is packed into a single byte by `to_code`, which combines
// `place_bits::<0, 6>(len)` and `place_bits::<6, 8>(op_type code)`.
#[derive(Copy, Clone, Eq, PartialEq, Debug)]
struct ColumnOperationMetadata {
    // Kind of operation.
    op_type: ColumnOperationType,
    // Number of payload bytes following the metadata byte.
    len: u8,
}

impl ColumnOperationMetadata {
    /// Packs the metadata into a single byte: the length goes through
    /// `place_bits::<0, 6>` and the operation type code through `place_bits::<6, 8>`.
    fn to_code(self) -> u8 {
        let len_bits = place_bits::<0, 6>(self.len);
        let op_type_bits = place_bits::<6, 8>(self.op_type.to_code());
        len_bits | op_type_bits
    }

    /// Inverse of [`Self::to_code`].
    ///
    /// Returns `InvalidData` if the operation type code is unknown.
    fn try_from_code(code: u8) -> Result<Self, InvalidData> {
        let len = select_bits::<0, 6>(code);
        let op_type_code = select_bits::<6, 8>(code);
        ColumnOperationType::try_from_code(op_type_code)
            .map(|op_type| ColumnOperationMetadata { op_type, len })
    }
}

// Discriminant of a serialized `ColumnOperation`.
// The explicit values are the codes returned by `to_code`.
#[derive(Copy, Clone, Eq, PartialEq, Debug)]
#[repr(u8)]
enum ColumnOperationType {
    // Serialized form of `ColumnOperation::NewDoc`.
    NewDoc = 0u8,
    // Serialized form of `ColumnOperation::Value`.
    AddValue = 1u8,
}

impl ColumnOperationType {
    /// Returns the numerical code of the operation type (its `u8` discriminant).
    pub fn to_code(self) -> u8 {
        self as u8
    }

    /// Looks up the operation type whose code is `code`.
    ///
    /// Returns `InvalidData` if no operation type uses this code.
    pub fn try_from_code(code: u8) -> Result<Self, InvalidData> {
        [Self::NewDoc, Self::AddValue]
            .into_iter()
            .find(|op_type| op_type.to_code() == code)
            .ok_or(InvalidData)
    }
}

impl<V: SymbolValue> ColumnOperation<V> {
    /// Serializes the operation as one metadata byte followed by its payload.
    pub(super) fn serialize(self) -> impl AsRef<[u8]> {
        let mut minibuf = MiniBuffer::default();
        // Byte 0 is reserved for the metadata: the payload starts at byte 1.
        let payload = &mut minibuf.bytes[1..];
        let (op_type, len) = match self {
            ColumnOperation::NewDoc(new_doc) => {
                (ColumnOperationType::NewDoc, new_doc.serialize(payload))
            }
            ColumnOperation::Value(val) => (ColumnOperationType::AddValue, val.serialize(payload)),
        };
        let metadata = ColumnOperationMetadata { op_type, len };
        minibuf.bytes[0] = metadata.to_code();
        // +1 to account for the metadata byte.
        minibuf.len = 1 + len;
        minibuf
    }

    /// Deserializes one column operation and advances `bytes` past it.
    /// Returns None if the buffer is empty.
    ///
    /// Panics if the payload is invalid:
    /// this method is only meant to read back data serialized in memory.
    pub(super) fn deserialize(bytes: &mut &[u8]) -> Option<Self> {
        let metadata_byte = pop_first_byte(bytes)?;
        let ColumnOperationMetadata { op_type, len } =
            ColumnOperationMetadata::try_from_code(metadata_byte)
                .expect("Invalid op metadata byte");
        let (symbol_bytes, remaining) = bytes.split_at(len as usize);
        *bytes = remaining;
        let column_operation = match op_type {
            ColumnOperationType::NewDoc => ColumnOperation::NewDoc(u32::deserialize(symbol_bytes)),
            ColumnOperationType::AddValue => ColumnOperation::Value(V::deserialize(symbol_bytes)),
        };
        Some(column_operation)
    }
}

impl<T> From<T> for ColumnOperation<T> {
    fn from(value: T) -> Self {
        ColumnOperation::Value(value)
    }
}

// Serialization trait very local to the writer.
// As we write fast fields, we accumulate them in memory.
// In order to limit memory usage, and in order
// to benefit from the stacker, we do this by serializing our data
// as "Symbols".
pub(super) trait SymbolValue: Clone + Copy {
    // Serializes the symbol into the given buffer.
    // Returns the number of bytes written into the buffer.
    /// # Panics
    /// Implementations index into `buffer` directly and panic if it is too small.
    /// The serialized form may not exceed 16 bytes: `ColumnOperation::serialize`
    /// hands out the 16 bytes that follow the metadata byte of a 17-byte `MiniBuffer`,
    /// and the `Ipv6Addr` implementation uses all of them.
    fn serialize(self, buffer: &mut [u8]) -> u8;
    // Rebuilds a symbol from the bytes written by `serialize`.
    // Panics if invalid
    fn deserialize(bytes: &[u8]) -> Self;
}

/// A bool is serialized as a single byte: 1 for `true`, 0 for `false`.
impl SymbolValue for bool {
    fn serialize(self, buffer: &mut [u8]) -> u8 {
        buffer[0] = if self { 1u8 } else { 0u8 };
        1u8
    }

    fn deserialize(bytes: &[u8]) -> Self {
        // Only the byte 1 decodes to `true`.
        matches!(bytes[0], 1u8)
    }
}

/// An IPv6 address is serialized as its 16 octets.
impl SymbolValue for Ipv6Addr {
    fn serialize(self, buffer: &mut [u8]) -> u8 {
        let octets: [u8; 16] = self.octets();
        buffer[0..16].copy_from_slice(&octets);
        16
    }

    fn deserialize(bytes: &[u8]) -> Self {
        let mut octets = [0u8; 16];
        octets.copy_from_slice(&bytes[0..16]);
        Ipv6Addr::from(octets)
    }
}

// Small fixed-capacity byte buffer returned by `ColumnOperation::serialize`.
// Only the first `len` bytes of `bytes` are meaningful.
#[derive(Default)]
struct MiniBuffer {
    pub bytes: [u8; 17],
    pub len: u8,
}

impl AsRef<[u8]> for MiniBuffer {
    // Exposes the filled part of the buffer.
    fn as_ref(&self) -> &[u8] {
        let filled_len = usize::from(self.len);
        &self.bytes[..filled_len]
    }
}

impl SymbolValue for NumericalValue {
    /// Reads back a value written by `serialize`: a type code byte followed by
    /// up to 8 little-endian payload bytes.
    fn deserialize(mut bytes: &[u8]) -> Self {
        let type_code = pop_first_byte(&mut bytes).unwrap();
        let numerical_type = NumericalType::try_from_code(type_code).unwrap();
        // The high-order zero bytes were not stored: pad the payload back to 8 bytes.
        let mut padded: [u8; 8] = [0u8; 8];
        padded[..bytes.len()].copy_from_slice(bytes);
        let raw: u64 = u64::from_le_bytes(padded);
        match numerical_type {
            NumericalType::U64 => NumericalValue::U64(raw),
            NumericalType::I64 => NumericalValue::I64(decode_zig_zag(raw)),
            NumericalType::F64 => {
                debug_assert_eq!(bytes.len(), 8);
                NumericalValue::F64(f64::from_bits(raw))
            }
        }
    }

    /// F64: type code followed by the 8 bytes of the float (9 bytes in total)
    /// U64: type code followed by the value without its high-order zero bytes
    /// I64: same as U64, applied to the ZigZag encoding of the value
    fn serialize(self, output: &mut [u8]) -> u8 {
        // For each variant: the type, the 8-byte little-endian payload (as a u64)
        // and the number of payload bytes that are part of the serialized form.
        let (numerical_type, payload, payload_len) = match self {
            NumericalValue::F64(val) => (NumericalType::F64, val.to_bits(), 8u8),
            NumericalValue::U64(val) => {
                let len = compute_num_bytes_for_u64(val) as u8;
                (NumericalType::U64, val, len)
            }
            NumericalValue::I64(val) => {
                let zig_zag_encoded = encode_zig_zag(val);
                let len = compute_num_bytes_for_u64(zig_zag_encoded) as u8;
                (NumericalType::I64, zig_zag_encoded, len)
            }
        };
        output[0] = numerical_type as u8;
        // All 8 bytes are written; only the first `payload_len` are reported as used.
        output[1..9].copy_from_slice(&payload.to_le_bytes());
        payload_len + 1u8
    }
}

/// A u32 is serialized in little-endian order without its high-order zero bytes
/// (0 is therefore serialized as an empty payload).
impl SymbolValue for u32 {
    fn serialize(self, output: &mut [u8]) -> u8 {
        let le_bytes = self.to_le_bytes();
        // The 4 bytes are always written; the returned length tells how many matter.
        output[0..4].copy_from_slice(&le_bytes);
        compute_num_bytes_for_u64(self as u64) as u8
    }

    fn deserialize(bytes: &[u8]) -> Self {
        // Missing high-order bytes are zeroes.
        let mut padded: [u8; 4] = [0u8; 4];
        padded[..bytes.len()].copy_from_slice(bytes);
        u32::from_le_bytes(padded)
    }
}

impl SymbolValue for UnorderedId {
    fn serialize(self, output: &mut [u8]) -> u8 {
        self.0.serialize(output)
    }

    fn deserialize(bytes: &[u8]) -> Self {
        UnorderedId(u32::deserialize(bytes))
    }
}

/// Returns the number of bytes needed to store `val` once its high-order zero
/// bytes are dropped (0 for `val == 0`, 8 for `u64::MAX`).
fn compute_num_bytes_for_u64(val: u64) -> usize {
    // Each full group of 8 leading zero bits is one byte that can be dropped.
    let droppable_bytes = val.leading_zeros() / 8;
    (8 - droppable_bytes) as usize
}

/// ZigZag-encodes `n`: 0, -1, 1, -2, ... map to 0, 1, 2, 3, ...
/// so that integers with a small absolute value get a small encoding.
fn encode_zig_zag(n: i64) -> u64 {
    let doubled = (n as u64) << 1;
    // All ones if `n` is negative, all zeroes otherwise.
    let sign_mask = (n >> 63) as u64;
    doubled ^ sign_mask
}

/// Decodes a ZigZag-encoded integer: even inputs map to non-negative values,
/// odd inputs to negative ones.
fn decode_zig_zag(n: u64) -> i64 {
    let half = (n >> 1) as i64;
    if n & 1 == 0 {
        half
    } else {
        // XOR with an all-ones mask is a bitwise negation.
        !half
    }
}

// Unit tests for the in-memory serialization of column operations.
#[cfg(test)]
mod tests {
    use super::*;

    // Checks that `val` survives a ZigZag round trip and that its encoding is at
    // most twice its absolute value (whenever the absolute value fits in an i64).
    #[track_caller]
    fn test_zig_zag_aux(val: i64) {
        let encoded = super::encode_zig_zag(val);
        assert_eq!(decode_zig_zag(encoded), val);
        if let Some(abs_val) = val.checked_abs() {
            let abs_val = abs_val as u64;
            assert!(encoded <= abs_val * 2);
        }
    }

    #[test]
    fn test_zig_zag() {
        assert_eq!(encode_zig_zag(0i64), 0u64);
        assert_eq!(encode_zig_zag(-1i64), 1u64);
        assert_eq!(encode_zig_zag(1i64), 2u64);
        test_zig_zag_aux(0i64);
        test_zig_zag_aux(i64::MIN);
        test_zig_zag_aux(i64::MAX);
    }

    use proptest::prelude::any;
    use proptest::proptest;

    // Same round-trip check, on arbitrary i64 values.
    proptest! {
        #[test]
        fn test_proptest_zig_zag(val in any::<i64>()) {
            test_zig_zag_aux(val);
        }
    }

    // The metadata byte round-trips for both operation types and lengths 0..=15.
    #[test]
    fn test_column_op_metadata_byte_serialization() {
        for len in 0..=15 {
            for op_type in [ColumnOperationType::AddValue, ColumnOperationType::NewDoc] {
                let column_op_metadata = ColumnOperationMetadata { op_type, len };
                let column_op_metadata_code = column_op_metadata.to_code();
                let serdeser_metadata =
                    ColumnOperationMetadata::try_from_code(column_op_metadata_code).unwrap();
                assert_eq!(column_op_metadata, serdeser_metadata);
            }
        }
    }

    // Serializes `column_op`, appends unrelated trailing bytes, and checks that
    // deserialization returns the same operation and consumes exactly the
    // serialized bytes.
    #[track_caller]
    fn ser_deser_symbol(column_op: ColumnOperation<NumericalValue>) {
        let buf = column_op.serialize();
        let mut buffer = buf.as_ref().to_vec();
        buffer.extend_from_slice(b"234234");
        let mut bytes = &buffer[..];
        let serdeser_symbol = ColumnOperation::deserialize(&mut bytes).unwrap();
        assert_eq!(bytes.len() + buf.as_ref().len(), buffer.len());
        assert_eq!(column_op, serdeser_symbol);
    }

    #[test]
    fn test_compute_num_bytes_for_u64() {
        assert_eq!(compute_num_bytes_for_u64(0), 0);
        assert_eq!(compute_num_bytes_for_u64(1), 1);
        assert_eq!(compute_num_bytes_for_u64(255), 1);
        assert_eq!(compute_num_bytes_for_u64(256), 2);
        assert_eq!(compute_num_bytes_for_u64((1 << 16) - 1), 2);
        assert_eq!(compute_num_bytes_for_u64(1 << 16), 3);
    }

    #[test]
    fn test_symbol_serialization() {
        ser_deser_symbol(ColumnOperation::NewDoc(0));
        ser_deser_symbol(ColumnOperation::NewDoc(3));
        ser_deser_symbol(ColumnOperation::Value(NumericalValue::I64(0i64)));
        ser_deser_symbol(ColumnOperation::Value(NumericalValue::I64(1i64)));
        ser_deser_symbol(ColumnOperation::Value(NumericalValue::U64(257u64)));
        ser_deser_symbol(ColumnOperation::Value(NumericalValue::I64(-257i64)));
        ser_deser_symbol(ColumnOperation::Value(NumericalValue::I64(i64::MIN)));
        ser_deser_symbol(ColumnOperation::Value(NumericalValue::U64(0u64)));
        ser_deser_symbol(ColumnOperation::Value(NumericalValue::U64(u64::MIN)));
        ser_deser_symbol(ColumnOperation::Value(NumericalValue::U64(u64::MAX)));
    }

    // Round-trips an `UnorderedId` value and checks that its serialized form
    // (metadata byte included) is exactly `expected_len` bytes long.
    fn test_column_operation_unordered_aux(val: u32, expected_len: usize) {
        let column_op = ColumnOperation::Value(UnorderedId(val));
        let minibuf = column_op.serialize();
        assert_eq!({ minibuf.as_ref().len() }, expected_len);
        let mut buf = minibuf.as_ref().to_vec();
        buf.extend_from_slice(&[2, 2, 2, 2, 2, 2]);
        let mut cursor = &buf[..];
        let column_op_serdeser: ColumnOperation<UnorderedId> =
            ColumnOperation::deserialize(&mut cursor).unwrap();
        assert_eq!(column_op_serdeser, ColumnOperation::Value(UnorderedId(val)));
        assert_eq!(cursor.len() + expected_len, buf.len());
    }

    // Expected lengths: 1 metadata byte + the number of significant bytes of the id.
    #[test]
    fn test_column_operation_unordered() {
        test_column_operation_unordered_aux(300u32, 3);
        test_column_operation_unordered_aux(1u32, 2);
        test_column_operation_unordered_aux(0u32, 1);
    }
}


================================================
FILE: columnar/src/columnar/writer/column_writers.rs
================================================
use std::cmp::Ordering;

use stacker::{ExpUnrolledLinkedList, MemoryArena};

use crate::columnar::writer::column_operation::{ColumnOperation, SymbolValue};
use crate::dictionary::{DictionaryBuilder, UnorderedId};
use crate::{Cardinality, NumericalType, NumericalValue, RowId};

/// Position of a document relative to the last document recorded in a column.
#[derive(Copy, Clone, Debug, Eq, PartialEq)]
#[repr(u8)]
enum DocumentStep {
    /// The document comes before the expected next document
    /// (typically, it is the last recorded document again).
    Same = 0,
    /// The document is exactly the expected next document.
    Next = 1,
    /// At least one document was skipped before this one.
    Skipped = 2,
}

/// Compares `doc` with the document expected right after `last_doc_opt`.
///
/// The expected next document is `last_doc + 1`, or `0` if no document has been
/// recorded yet (`last_doc_opt == None`).
///
/// The comparison is done on `u64` so that `last_doc + 1` cannot overflow when
/// `last_doc == u32::MAX`: with `u32` arithmetic this would panic in debug builds
/// and wrap around to `0` in release builds, reporting a wrong step.
#[inline(always)]
fn delta_with_last_doc(last_doc_opt: Option<u32>, doc: u32) -> DocumentStep {
    let expected_next_doc: u64 = last_doc_opt.map_or(0u64, |last_doc| u64::from(last_doc) + 1);
    match u64::from(doc).cmp(&expected_next_doc) {
        Ordering::Less => DocumentStep::Same,
        Ordering::Equal => DocumentStep::Next,
        Ordering::Greater => DocumentStep::Skipped,
    }
}

/// Accumulates the operations recorded for a single column.
///
/// Operations are appended in serialized form to `values`; the writer also
/// tracks the cardinality implied by the sequence of documents seen so far.
#[derive(Copy, Clone, Default)]
pub struct ColumnWriter {
    // Detected cardinality of the column so far.
    cardinality: Cardinality,
    // Last document inserted.
    // None if no doc has been added yet.
    last_doc_opt: Option<u32>,
    // Buffer containing the serialized operations (`NewDoc` markers and values).
    values: ExpUnrolledLinkedList,
}

impl ColumnWriter {
    /// Returns an iterator over the operations that have been recorded
    /// for this column.
    ///
    /// `buffer` is cleared, filled with the serialized operations, and then
    /// borrowed by the returned iterator.
    pub(super) fn operation_iterator<'a, V: SymbolValue>(
        &self,
        arena: &MemoryArena,
        buffer: &'a mut Vec<u8>,
    ) -> impl Iterator<Item = ColumnOperation<V>> + 'a + use<'a, V> {
        buffer.clear();
        self.values.read_to_end(arena, buffer);
        let mut remaining: &[u8] = buffer.as_slice();
        std::iter::from_fn(move || ColumnOperation::<V>::deserialize(&mut remaining))
    }

    /// Records `value` for the document `doc`.
    ///
    /// A `NewDoc` operation is emitted first whenever `doc` is not the last
    /// recorded document, and the cardinality of the column is updated
    /// if necessary.
    pub(super) fn record<S: SymbolValue>(&mut self, doc: RowId, value: S, arena: &mut MemoryArena) {
        let step = delta_with_last_doc(self.last_doc_opt, doc);
        if step == DocumentStep::Same {
            // Another value for the last encountered document.
            self.cardinality = Cardinality::Multivalued;
        } else {
            if step == DocumentStep::Skipped {
                // Some documents have no value at all.
                self.cardinality = self.cardinality.max(Cardinality::Optional);
            }
            self.last_doc_opt = Some(doc);
            self.write_symbol::<S>(ColumnOperation::NewDoc(doc), arena);
        }
        self.write_symbol(ColumnOperation::Value(value), arena);
    }

    // Get the cardinality.
    // The overall number of docs in the column is required to handle the case
    // where every doc holds one value, except for some documents
    // at the end of the column.
    pub(crate) fn get_cardinality(&self, num_docs: RowId) -> Cardinality {
        let has_trailing_docs_without_value =
            delta_with_last_doc(self.last_doc_opt, num_docs) == DocumentStep::Skipped;
        if has_trailing_docs_without_value {
            self.cardinality.max(Cardinality::Optional)
        } else {
            self.cardinality
        }
    }

    /// Appends the serialized form of `column_operation` to the column buffer.
    fn write_symbol<V: SymbolValue>(
        &mut self,
        column_operation: ColumnOperation<V>,
        arena: &mut MemoryArena,
    ) {
        let serialized = column_operation.serialize();
        let mut writer = self.values.writer(arena);
        writer.extend_from_slice(serialized.as_ref());
    }
}

// Column writer for numerical values.
// On top of the recorded operations, it tracks which numerical types are still
// able to represent every value seen so far.
#[derive(Clone, Copy, Default)]
pub(crate) struct NumericalColumnWriter {
    // Numerical types still compatible with the recorded values,
    // or the type the column has been forced to.
    compatible_numerical_types: CompatibleNumericalTypes,
    // Underlying writer holding the serialized operations.
    column_writer: ColumnWriter,
}

impl NumericalColumnWriter {
    /// Forces the column to `numerical_type`: from then on, only values of that
    /// exact type are accepted.
    ///
    /// # Panics
    /// Panics if `numerical_type` is not compatible with the values recorded so far.
    pub fn force_numerical_type(&mut self, numerical_type: NumericalType) {
        assert!(
            self.compatible_numerical_types
                .is_type_accepted(numerical_type)
        );
        let forced_type = CompatibleNumericalTypes::StaticType(numerical_type);
        self.compatible_numerical_types = forced_type;
    }
}

/// State used to store what types are still acceptable
/// after having seen a set of numerical values.
#[derive(Clone, Copy)]
pub(crate) enum CompatibleNumericalTypes {
    // The type is inferred from the values: each flag stays true as long as
    // every value seen so far can be represented with the matching type.
    Dynamic {
        all_values_within_i64_range: bool,
        all_values_within_u64_range: bool,
    },
    // The type has been fixed: values of any other type are refused.
    StaticType(NumericalType),
}

impl Default for CompatibleNumericalTypes {
    fn default() -> CompatibleNumericalTypes {
        CompatibleNumericalTypes::Dynamic {
            all_values_within_i64_range: true,
            all_values_within_u64_range: true,
        }
    }
}

impl CompatibleNumericalTypes {
    /// Returns true if `numerical_type` can represent all the values accepted so far.
    ///
    /// In the `Dynamic` state, `F64` is always accepted. In the `StaticType` state,
    /// only the forced type is accepted.
    pub fn is_type_accepted(&self, numerical_type: NumericalType) -> bool {
        match self {
            CompatibleNumericalTypes::Dynamic {
                all_values_within_i64_range,
                all_values_within_u64_range,
            } => match numerical_type {
                NumericalType::I64 => *all_values_within_i64_range,
                NumericalType::U64 => *all_values_within_u64_range,
                NumericalType::F64 => true,
            },
            CompatibleNumericalTypes::StaticType(static_numerical_type) => {
                *static_numerical_type == numerical_type
            }
        }
    }

    /// Takes `numerical_value` into account, narrowing down the set of
    /// compatible types if necessary.
    ///
    /// # Panics
    /// In the `StaticType` state, panics if the value is not of the forced type.
    pub fn accept_value(&mut self, numerical_value: NumericalValue) {
        match self {
            CompatibleNumericalTypes::Dynamic {
                all_values_within_i64_range,
                all_values_within_u64_range,
            } => match numerical_value {
                NumericalValue::I64(val_i64) => {
                    let value_within_u64_range = val_i64 >= 0i64;
                    *all_values_within_u64_range &= value_within_u64_range;
                }
                NumericalValue::U64(val_u64) => {
                    // The bound is inclusive: `i64::MAX` itself fits in an i64.
                    let value_within_i64_range = val_u64 <= i64::MAX as u64;
                    *all_values_within_i64_range &= value_within_i64_range;
                }
                NumericalValue::F64(_) => {
                    // A float rules out both integer types.
                    *all_values_within_i64_range = false;
                    *all_values_within_u64_range = false;
                }
            },
            CompatibleNumericalTypes::StaticType(typ) => {
                assert_eq!(
                    numerical_value.numerical_type(),
                    *typ,
                    "Input type forbidden. This column has been forced to type {typ:?}, received \
                     {numerical_value:?}"
                );
            }
        }
    }

    /// Picks the numerical type of the column: `I64` if accepted, else `U64`
    /// if accepted, else `F64`.
    pub fn to_numerical_type(self) -> NumericalType {
        for numerical_type in [NumericalType::I64, NumericalType::U64] {
            if self.is_type_accepted(numerical_type) {
                return numerical_type;
            }
        }
        NumericalType::F64
    }
}

impl NumericalColumnWriter {
    /// Numerical type selected for the column, given the values seen so far.
    pub fn numerical_type(&self) -> NumericalType {
        let compatible_types = self.compatible_numerical_types;
        compatible_types.to_numerical_type()
    }

    /// Cardinality of the column, given the total number of docs `num_docs`.
    pub fn cardinality(&self, num_docs: RowId) -> Cardinality {
        let Self { column_writer, .. } = self;
        column_writer.get_cardinality(num_docs)
    }

    /// Records `value` for the document `doc`, after updating the set of
    /// compatible numerical types.
    pub fn record_numerical_value(
        &mut self,
        doc: RowId,
        value: NumericalValue,
        arena: &mut MemoryArena,
    ) {
        let Self {
            compatible_numerical_types,
            column_writer,
        } = self;
        compatible_numerical_types.accept_value(value);
        column_writer.record(doc, value, arena);
    }

    /// Iterates over the recorded operations, using `buffer` as scratch space.
    pub(super) fn operation_iterator<'a>(
        self,
        arena: &MemoryArena,
        buffer: &'a mut Vec<u8>,
    ) -> impl Iterator<Item = ColumnOperation<NumericalValue>> + 'a + use<'a> {
        let Self { column_writer, .. } = self;
        column_writer.operation_iterator(arena, buffer)
    }
}

// Column writer for str or bytes values.
// Values are not stored directly: each one is replaced by the id allocated for
// it in a dictionary (see `record_bytes`).
#[derive(Copy, Clone)]
pub(crate) struct StrOrBytesColumnWriter {
    // Index, in the slice of dictionaries handed to `record_bytes`,
    // of the dictionary used by this column.
    pub(crate) dictionary_id: u32,
    // Underlying writer holding the serialized operations.
    pub(crate) column_writer: ColumnWriter,
    // If true, when facing a multivalued cardinality,
    // values associated to a given document will be sorted.
    //
    // This is useful for facets.
    //
    // If false, the order of appearance in the document will be
    // observed.
    pub(crate) sort_values_within_row: bool,
}

impl StrOrBytesColumnWriter {
    /// Creates a writer bound to the dictionary at index `dictionary_id`, with a default
    /// column writer and `sort_values_within_row` disabled.
    pub(crate) fn with_dictionary_id(dictionary_id: u32) -> StrOrBytesColumnWriter {
        StrOrBytesColumnWriter {
            dictionary_id,
            column_writer: Default::default(),
            sort_values_within_row: false,
        }
    }

    /// Records `bytes` as a value of the row `doc`.
    ///
    /// The bytes are looked up (or inserted) in this column's dictionary,
    /// `dictionaries[self.dictionary_id]`, and the resulting unordered id is what is
    /// recorded in the column writer.
    ///
    /// # Panics
    ///
    /// Panics if `self.dictionary_id` is out of bounds for `dictionaries`.
    pub(crate) fn record_bytes(
        &mut self,
        doc: RowId,
        bytes: &[u8],
        dictionaries: &mut [DictionaryBuilder],
        arena: &mut MemoryArena,
    ) {
        let unordered_id =
            dictionaries[self.dictionary_id as usize].get_or_allocate_id(bytes, arena);
        self.column_writer.record(doc, unordered_id, arena);
    }

    /// Returns the iterator over the column operations produced by the underlying column
    /// writer; the values are unordered dictionary ids.
    ///
    /// The returned iterator is tied to the lifetime of `byte_buffer` only (`use<'a>`).
    pub(super) fn operation_iterator<'a>(
        &self,
        arena: &MemoryArena,
        byte_buffer: &'a mut Vec<u8>,
    ) -> impl Iterator<Item = ColumnOperation<UnorderedId>> + 'a + use<'a> {
        self.column_writer.operation_iterator(arena, byte_buffer)
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Checks the classification of a doc id relative to the previously recorded one.
    #[test]
    fn test_delta_with_last_doc() {
        assert_eq!(delta_with_last_doc(None, 0u32), DocumentStep::Next);
        assert_eq!(delta_with_last_doc(None, 1u32), DocumentStep::Skipped);
        assert_eq!(delta_with_last_doc(None, 2u32), DocumentStep::Skipped);
        assert_eq!(delta_with_last_doc(Some(0u32), 0u32), DocumentStep::Same);
        assert_eq!(delta_with_last_doc(Some(1u32), 1u32), DocumentStep::Same);
        assert_eq!(delta_with_last_doc(Some(1u32), 2u32), DocumentStep::Next);
        assert_eq!(delta_with_last_doc(Some(1u32), 3u32), DocumentStep::Skipped);
        assert_eq!(delta_with_last_doc(Some(1u32), 4u32), DocumentStep::Skipped);
    }

    /// Feeds `values` to a fresh `CompatibleNumericalTypes` and checks the resolved type.
    #[track_caller]
    fn test_column_writer_coercion_iter_aux(
        values: impl Iterator<Item = NumericalValue>,
        expected_numerical_type: NumericalType,
    ) {
        let mut compatible_numerical_types = CompatibleNumericalTypes::default();
        for value in values {
            compatible_numerical_types.accept_value(value);
        }
        assert_eq!(
            compatible_numerical_types.to_numerical_type(),
            expected_numerical_type
        );
    }

    /// Runs the coercion check in both insertion orders: the resolved type must not depend
    /// on the order in which values are accepted.
    #[track_caller]
    fn test_column_writer_coercion_aux(
        values: &[NumericalValue],
        expected_numerical_type: NumericalType,
    ) {
        test_column_writer_coercion_iter_aux(values.iter().copied(), expected_numerical_type);
        test_column_writer_coercion_iter_aux(values.iter().rev().copied(), expected_numerical_type);
    }

    #[test]
    fn test_column_writer_coercion() {
        test_column_writer_coercion_aux(&[], NumericalType::I64);
        test_column_writer_coercion_aux(&[1i64.into()], NumericalType::I64);
        test_column_writer_coercion_aux(&[1u64.into()], NumericalType::I64);
        // We don't detect exact integer at the moment. We could!
        test_column_writer_coercion_aux(&[1f64.into()], NumericalType::F64);
        test_column_writer_coercion_aux(&[u64::MAX.into()], NumericalType::U64);
        test_column_writer_coercion_aux(&[(i64::MAX as u64).into()], NumericalType::U64);
        test_column_writer_coercion_aux(&[(1u64 << 63).into()], NumericalType::U64);
        test_column_writer_coercion_aux(&[1i64.into(), 1u64.into()], NumericalType::I64);
        test_column_writer_coercion_aux(&[u64::MAX.into(), (-1i64).into()], NumericalType::F64);
    }

    /// A column forced to `U64` must reject an `I64` value, even one that would fit.
    ///
    /// The expected message is pinned so that the test cannot pass because of an unrelated
    /// panic.
    #[test]
    #[should_panic(expected = "Input type forbidden")]
    fn test_compatible_numerical_types_static_incompatible_type() {
        let mut compatible_numerical_types =
            CompatibleNumericalTypes::StaticType(NumericalType::U64);
        compatible_numerical_types.accept_value(NumericalValue::I64(1i64));
    }

    /// Counterpart of the test above: despite its name, this checks the accepted case, i.e.
    /// that a value of the forced type goes through without panicking.
    #[test]
    fn test_compatible_numerical_types_static_different_type_forbidden() {
        let mut compatible_numerical_types =
            CompatibleNumericalTypes::StaticType(NumericalType::U64);
        compatible_numerical_types.accept_value(NumericalValue::U64(u64::MAX));
    }

    /// A static type always resolves to itself, for each of the three numerical types.
    #[test]
    fn test_compatible_numerical_types_static() {
        for typ in [NumericalType::I64, NumericalType::U64, NumericalType::F64] {
            let compatible_numerical_types = CompatibleNumericalTypes::StaticType(typ);
            assert_eq!(compatible_numerical_types.to_numerical_type(), typ);
        }
    }
}


================================================
FILE: columnar/src/columnar/writer/mod.rs
================================================
mod column_operation;
mod column_writers;
mod serializer;
mod value_index;

use std::io;
use std::net::Ipv6Addr;

use column_operation::ColumnOperation;
pub(crate) use column_writers::CompatibleNumericalTypes;
use common::CountingWriter;
use common::json_path_writer::JSON_END_OF_PATH;
pub(crate) use serializer::ColumnarSerializer;
use stacker::{Addr, ArenaHashMap, MemoryArena};

use crate::column_index::{SerializableColumnIndex, SerializableOptionalIndex};
use crate::column_values::{MonotonicallyMappableToU64, MonotonicallyMappableToU128};
use crate::columnar::column_type::ColumnType;
use crate::columnar::writer::column_writers::{
    ColumnWriter, NumericalColumnWriter, StrOrBytesColumnWriter,
};
use crate::columnar::writer::value_index::{IndexBuilder, PreallocatedIndexBuilders};
use crate::dictionary::{DictionaryBuilder, TermIdMapping, UnorderedId};
use crate::value::{Coerce, NumericalType, NumericalValue};
use crate::{Cardinality, RowId};

/// This is a set of buffers that are used to temporarily write the values into before passing them
/// to the fast field codecs.
///
/// The buffers are owned by the `ColumnarWriter` and handed to the `serialize_*_column`
/// helpers, which reuse them from one column to the next.
#[derive(Default)]
struct SpareBuffers {
    // Index builders used to build the column index (required / optional / multivalued).
    value_index_builders: PreallocatedIndexBuilders,
    // Values buffer for all columns that are serialized as `u64`.
    u64_values: Vec<u64>,
    // Values buffer for IP address columns.
    ip_addr_values: Vec<Ipv6Addr>,
}

/// Makes it possible to create a new columnar.
///
/// ```rust
/// use tantivy_columnar::ColumnarWriter;
///
/// let mut columnar_writer = ColumnarWriter::default();
/// columnar_writer.record_str(0u32 /* doc id */, "product_name", "Red backpack");
/// columnar_writer.record_numerical(0u32 /* doc id */, "price", 10u64);
/// columnar_writer.record_str(1u32 /* doc id */, "product_name", "Apple");
/// columnar_writer.record_numerical(0u32 /* doc id */, "price", 10.5f64); //< uh oh we ended up mixing integer and floats.
/// let mut wrt: Vec<u8> =  Vec::new();
/// columnar_writer.serialize(2u32, &mut wrt).unwrap();
/// ```
#[derive(Default)]
pub struct ColumnarWriter {
    // One hash map per family of column types. Keys are the column name bytes; values are
    // the per-column writers (`NumericalColumnWriter`, `ColumnWriter` or
    // `StrOrBytesColumnWriter` depending on the map).
    numerical_field_hash_map: ArenaHashMap,
    datetime_field_hash_map: ArenaHashMap,
    bool_field_hash_map: ArenaHashMap,
    ip_addr_field_hash_map: ArenaHashMap,
    bytes_field_hash_map: ArenaHashMap,
    str_field_hash_map: ArenaHashMap,
    // Arena passed to the column writers and dictionaries when recording values.
    arena: MemoryArena,
    // Dictionaries used to store dictionary-encoded values.
    // Each `Str` / `Bytes` column owns one entry, designated by its `dictionary_id`.
    dictionaries: Vec<DictionaryBuilder>,
    // Scratch buffers reused across columns during serialization.
    buffers: SpareBuffers,
}

impl ColumnarWriter {
    /// Returns the memory usage reported by the writer's internal structures.
    ///
    /// This is the sum of the `mem_usage()` of the arena, of each of the six per-type
    /// column hash maps, and of every dictionary builder.
    pub fn mem_usage(&self) -> usize {
        let hash_maps_mem_usage: usize = [
            &self.numerical_field_hash_map,
            &self.bool_field_hash_map,
            &self.bytes_field_hash_map,
            &self.str_field_hash_map,
            &self.ip_addr_field_hash_map,
            &self.datetime_field_hash_map,
        ]
        .into_iter()
        .map(|hash_map| hash_map.mem_usage())
        .sum();
        let dictionaries_mem_usage: usize = self
            .dictionaries
            .iter()
            .map(|dictionary| dictionary.mem_usage())
            .sum();
        self.arena.mem_usage() + hash_maps_mem_usage + dictionaries_mem_usage
    }

    /// Registers a column of type `column_type` under `column_name`.
    ///
    /// This is useful to bypass the numerical coercion process, to make sure that an empty
    /// column is present in the resulting columnar, or to set `sort_values_within_row`.
    ///
    /// `sort_values_within_row` is only allowed for `Bytes` or `Str` columns.
    ///
    /// # Panics
    ///
    /// Panics if `sort_values_within_row` is `true` while `column_type` is neither `Bytes`
    /// nor `Str`.
    pub fn record_column_type(
        &mut self,
        column_name: &str,
        column_type: ColumnType,
        sort_values_within_row: bool,
    ) {
        let is_str_or_bytes = matches!(column_type, ColumnType::Bytes | ColumnType::Str);
        assert!(
            is_str_or_bytes || !sort_values_within_row,
            "sort_values_within_row is only allowed for Bytes and Str columns",
        );
        let key = column_name.as_bytes();
        match column_type {
            ColumnType::Str | ColumnType::Bytes => {
                let dictionaries = &mut self.dictionaries;
                let hash_map = match column_type {
                    ColumnType::Str => &mut self.str_field_hash_map,
                    _ => &mut self.bytes_field_hash_map,
                };
                hash_map.mutate_or_create(key, |column_opt: Option<StrOrBytesColumnWriter>| {
                    let mut column_writer = column_opt.unwrap_or_else(|| {
                        // A column seen for the first time gets a dictionary of its own.
                        let dictionary_id = dictionaries.len() as u32;
                        dictionaries.push(DictionaryBuilder::default());
                        StrOrBytesColumnWriter::with_dictionary_id(dictionary_id)
                    });
                    column_writer.sort_values_within_row = sort_values_within_row;
                    column_writer
                });
            }
            // These three types share the plain `ColumnWriter`; only the target map differs.
            ColumnType::Bool | ColumnType::DateTime | ColumnType::IpAddr => {
                let hash_map = match column_type {
                    ColumnType::Bool => &mut self.bool_field_hash_map,
                    ColumnType::DateTime => &mut self.datetime_field_hash_map,
                    _ => &mut self.ip_addr_field_hash_map,
                };
                hash_map.mutate_or_create(key, |column_opt: Option<ColumnWriter>| {
                    column_opt.unwrap_or_default()
                });
            }
            ColumnType::I64 | ColumnType::F64 | ColumnType::U64 => {
                let numerical_type = column_type.numerical_type().unwrap();
                // NOTE(review): `force_numerical_type` is defined outside this view;
                // presumably it can panic if incompatible values were already recorded.
                self.numerical_field_hash_map.mutate_or_create(
                    key,
                    |column_opt: Option<NumericalColumnWriter>| {
                        let mut column = column_opt.unwrap_or_default();
                        column.force_numerical_type(numerical_type);
                        column
                    },
                );
            }
        }
    }

    pub fn record_numerical<T: Into<NumericalValue> + Copy>(
        &mut self,
        doc: RowId,
        column_name: &str,
        numerical_value: T,
    ) {
        let (hash_map, arena) = (&mut self.numerical_field_hash_map, &mut self.arena);
        hash_map.mutate_or_create(
            column_name.as_bytes(),
            |column_opt: Option<NumericalColumnWriter>| {
                let mut column: NumericalColumnWriter = column_opt.unwrap_or_default();
                column.record_numerical_value(doc, numerical_value.into(), arena);
                column
            },
        );
    }

    pub fn record_ip_addr(&mut self, doc: RowId, column_name: &str, ip_addr: Ipv6Addr) {
        let (hash_map, arena) = (&mut self.ip_addr_field_hash_map, &mut self.arena);
        hash_map.mutate_or_create(
            column_name.as_bytes(),
            |column_opt: Option<ColumnWriter>| {
                let mut column: ColumnWriter = column_opt.unwrap_or_default();
                column.record(doc, ip_addr, arena);
                column
            },
        );
    }

    pub fn record_bool(&mut self, doc: RowId, column_name: &str, val: bool) {
        let (hash_map, arena) = (&mut self.bool_field_hash_map, &mut self.arena);
        hash_map.mutate_or_create(
            column_name.as_bytes(),
            |column_opt: Option<ColumnWriter>| {
                let mut column: ColumnWriter = column_opt.unwrap_or_default();
                column.record(doc, val, arena);
                column
            },
        );
    }

    pub fn record_datetime(&mut self, doc: RowId, column_name: &str, datetime: common::DateTime) {
        let (hash_map, arena) = (&mut self.datetime_field_hash_map, &mut self.arena);
        hash_map.mutate_or_create(
            column_name.as_bytes(),
            |column_opt: Option<ColumnWriter>| {
                let mut column: ColumnWriter = column_opt.unwrap_or_default();
                column.record(
                    doc,
                    NumericalValue::I64(datetime.into_timestamp_nanos()),
                    arena,
                );
                column
            },
        );
    }

    pub fn record_str(&mut self, doc: RowId, column_name: &str, value: &str) {
        let (hash_map, arena, dictionaries) = (
            &mut self.str_field_hash_map,
            &mut self.arena,
            &mut self.dictionaries,
        );
        hash_map.mutate_or_create(
            column_name.as_bytes(),
            |column_opt: Option<StrOrBytesColumnWriter>| {
                let mut column: StrOrBytesColumnWriter = column_opt.unwrap_or_else(|| {
                    // Each column has its own dictionary
                    let dictionary_id = dictionaries.len() as u32;
                    dictionaries.push(DictionaryBuilder::default());
                    StrOrBytesColumnWriter::with_dictionary_id(dictionary_id)
                });
                column.record_bytes(doc, value.as_bytes(), dictionaries, arena);
                column
            },
        );
    }

    pub fn record_bytes(&mut self, doc: RowId, column_name: &str, value: &[u8]) {
        let (hash_map, arena, dictionaries) = (
            &mut self.bytes_field_hash_map,
            &mut self.arena,
            &mut self.dictionaries,
        );
        hash_map.mutate_or_create(
            column_name.as_bytes(),
            |column_opt: Option<StrOrBytesColumnWriter>| {
                let mut column: StrOrBytesColumnWriter = column_opt.unwrap_or_else(|| {
                    // Each column has its own dictionary
                    let dictionary_id = dictionaries.len() as u32;
                    dictionaries.push(DictionaryBuilder::default());
                    StrOrBytesColumnWriter::with_dictionary_id(dictionary_id)
                });
                column.record_bytes(doc, value, dictionaries, arena);
                column
            },
        );
    }
    /// Serializes all the recorded columns into `wrt`.
    ///
    /// The columns of every per-type hash map are gathered, sorted by
    /// `(column name, column type)` and serialized in that order. Columns whose name
    /// contains `JSON_END_OF_PATH` are skipped. `num_docs` is used to compute the
    /// cardinality of each column and is passed to the serializer when finalizing.
    ///
    /// # Errors
    ///
    /// Returns the first `io::Error` raised while serializing a column or finalizing the
    /// serializer.
    pub fn serialize(&mut self, num_docs: RowId, wrt: &mut dyn io::Write) -> io::Result<()> {
        let mut serializer = ColumnarSerializer::new(wrt);

        // Numerical columns: the concrete column type (I64 / U64 / F64) is resolved here,
        // from the writer's `numerical_type()`.
        let mut columns: Vec<(&[u8], ColumnType, Addr)> = self
            .numerical_field_hash_map
            .iter()
            .map(|(column_name, addr)| {
                let numerical_column_writer: NumericalColumnWriter =
                    self.numerical_field_hash_map.read(addr);
                let column_type = numerical_column_writer.numerical_type().into();
                (column_name, column_type, addr)
            })
            .collect();
        // For every other map, the column type is fixed by the map itself.
        columns.extend(
            self.bytes_field_hash_map
                .iter()
                .map(|(column_name, addr)| (column_name, ColumnType::Bytes, addr)),
        );
        columns.extend(
            self.str_field_hash_map
                .iter()
                .map(|(column_name, addr)| (column_name, ColumnType::Str, addr)),
        );
        columns.extend(
            self.bool_field_hash_map
                .iter()
                .map(|(column_name, addr)| (column_name, ColumnType::Bool, addr)),
        );
        columns.extend(
            self.ip_addr_field_hash_map
                .iter()
                .map(|(column_name, addr)| (column_name, ColumnType::IpAddr, addr)),
        );
        columns.extend(
            self.datetime_field_hash_map
                .iter()
                .map(|(column_name, addr)| (column_name, ColumnType::DateTime, addr)),
        );
        // Columns are written in (name, type) order.
        columns.sort_unstable_by_key(|(column_name, col_type, _)| (*column_name, *col_type));
        let (arena, buffers, dictionaries) = (&self.arena, &mut self.buffers, &self.dictionaries);
        // Scratch buffer handed to every `operation_iterator` call.
        let mut symbol_byte_buffer: Vec<u8> = Vec::new();
        for (column_name, column_type, addr) in columns {
            if column_name.contains(&JSON_END_OF_PATH) {
                // Tantivy uses `JSON_END_OF_PATH` as a separator for nested fields in JSON.
                // Column names containing that byte are simply ignored by the columnar (and
                // the inverted index).
                continue;
            }
            match column_type {
                ColumnType::Bool => {
                    let column_writer: ColumnWriter = self.bool_field_hash_map.read(addr);
                    let cardinality = column_writer.get_cardinality(num_docs);
                    let mut column_serializer =
                        serializer.start_serialize_column(column_name, column_type);
                    serialize_bool_column(
                        cardinality,
                        num_docs,
                        column_writer.operation_iterator(arena, &mut symbol_byte_buffer),
                        buffers,
                        &mut column_serializer,
                    )?;
                    column_serializer.finalize()?;
                }
                ColumnType::IpAddr => {
                    let column_writer: ColumnWriter = self.ip_addr_field_hash_map.read(addr);
                    let cardinality = column_writer.get_cardinality(num_docs);
                    let mut column_serializer =
                        serializer.start_serialize_column(column_name, ColumnType::IpAddr);
                    serialize_ip_addr_column(
                        cardinality,
                        num_docs,
                        column_writer.operation_iterator(arena, &mut symbol_byte_buffer),
                        buffers,
                        &mut column_serializer,
                    )?;
                    column_serializer.finalize()?;
                }
                ColumnType::Bytes | ColumnType::Str => {
                    // The address must be read from the map the column was gathered from.
                    let str_or_bytes_column_writer: StrOrBytesColumnWriter =
                        if column_type == ColumnType::Bytes {
                            self.bytes_field_hash_map.read(addr)
                        } else {
                            self.str_field_hash_map.read(addr)
                        };
                    let dictionary_builder =
                        &dictionaries[str_or_bytes_column_writer.dictionary_id as usize];
                    let cardinality = str_or_bytes_column_writer
                        .column_writer
                        .get_cardinality(num_docs);
                    let mut column_serializer =
                        serializer.start_serialize_column(column_name, column_type);
                    serialize_bytes_or_str_column(
                        cardinality,
                        num_docs,
                        str_or_bytes_column_writer.sort_values_within_row,
                        dictionary_builder,
                        str_or_bytes_column_writer
                            .operation_iterator(arena, &mut symbol_byte_buffer),
                        buffers,
                        &self.arena,
                        &mut column_serializer,
                    )?;
                    column_serializer.finalize()?;
                }
                ColumnType::F64 | ColumnType::I64 | ColumnType::U64 => {
                    let numerical_column_writer: NumericalColumnWriter =
                        self.numerical_field_hash_map.read(addr);
                    let cardinality = numerical_column_writer.cardinality(num_docs);
                    let mut column_serializer =
                        serializer.start_serialize_column(column_name, column_type);
                    // Cannot fail: `column_type` is one of the three numerical column types.
                    let numerical_type = column_type.numerical_type().unwrap();
                    serialize_numerical_column(
                        cardinality,
                        num_docs,
                        numerical_type,
                        numerical_column_writer.operation_iterator(arena, &mut symbol_byte_buffer),
                        buffers,
                        &mut column_serializer,
                    )?;
                    column_serializer.finalize()?;
                }
                ColumnType::DateTime => {
                    let column_writer: ColumnWriter = self.datetime_field_hash_map.read(addr);
                    let cardinality = column_writer.get_cardinality(num_docs);
                    let mut column_serializer =
                        serializer.start_serialize_column(column_name, ColumnType::DateTime);
                    // Datetimes are recorded as `I64` numerical values (see `record_datetime`).
                    serialize_numerical_column(
                        cardinality,
                        num_docs,
                        NumericalType::I64,
                        column_writer.operation_iterator(arena, &mut symbol_byte_buffer),
                        buffers,
                        &mut column_serializer,
                    )?;
                    column_serializer.finalize()?;
                }
            };
        }
        serializer.finalize(num_docs)?;
        Ok(())
    }
}

// Serialize [Dictionary, Column, dictionary num bytes U32::LE]
// Column: [Column Index, Column Values, column index num bytes U32::LE]
//
// The dictionary is written first; the unordered ids recorded in the column are then
// remapped to ordered ids using the mapping returned by the dictionary serialization,
// and the column is serialized as a `u64` column. The 4-byte little-endian dictionary
// length comes last.
//
// Returns an `io::Error` of kind `InvalidData` if the serialized dictionary does not fit
// in the 4-byte length footer, instead of silently writing a truncated length.
#[expect(clippy::too_many_arguments)]
fn serialize_bytes_or_str_column(
    cardinality: Cardinality,
    num_docs: RowId,
    sort_values_within_row: bool,
    dictionary_builder: &DictionaryBuilder,
    operation_it: impl Iterator<Item = ColumnOperation<UnorderedId>>,
    buffers: &mut SpareBuffers,
    arena: &MemoryArena,
    wrt: impl io::Write,
) -> io::Result<()> {
    let SpareBuffers {
        value_index_builders,
        u64_values,
        ..
    } = buffers;
    let mut counting_writer = CountingWriter::wrap(wrt);
    let term_id_mapping: TermIdMapping =
        dictionary_builder.serialize(arena, &mut counting_writer)?;
    // The footer only has room for a `u32`: a plain `as u32` cast would wrap around for a
    // dictionary of 4 GiB or more and produce an unreadable column.
    let dictionary_num_bytes: u32 =
        u32::try_from(counting_writer.written_bytes()).map_err(|_| {
            io::Error::new(
                io::ErrorKind::InvalidData,
                "dictionary is too large: its length in bytes does not fit in a u32",
            )
        })?;
    let mut wrt = counting_writer.finish();
    let operation_iterator = operation_it.map(|symbol: ColumnOperation<UnorderedId>| {
        // We map unordered ids to ordered ids.
        match symbol {
            ColumnOperation::Value(unordered_id) => {
                let ordered_id = term_id_mapping.to_ord(unordered_id);
                ColumnOperation::Value(ordered_id.0 as u64)
            }
            ColumnOperation::NewDoc(doc) => ColumnOperation::NewDoc(doc),
        }
    });
    send_to_serialize_column_mappable_to_u64(
        operation_iterator,
        cardinality,
        num_docs,
        sort_values_within_row,
        value_index_builders,
        u64_values,
        &mut wrt,
    )?;
    wrt.write_all(&dictionary_num_bytes.to_le_bytes()[..])?;
    Ok(())
}

fn serialize_numerical_column(
    cardinality: Cardinality,
    num_docs: RowId,
    numerical_type: NumericalType,
    op_iterator: impl Iterator<Item = ColumnOperation<NumericalValue>>,
    buffers: &mut SpareBuffers,
    wrt: &mut impl io::Write,
) -> io::Result<()> {
    let SpareBuffers {
        value_index_builders,
        u64_values,
        ..
    } = buffers;
    match numerical_type {
        NumericalType::I64 => {
            send_to_serialize_column_mappable_to_u64(
                coerce_numerical_symbol::<i64>(op_iterator),
                cardinality,
                num_docs,
                false,
                value_index_builders,
                u64_values,
                wrt,
            )?;
        }
        NumericalType::U64 => {
            send_to_serialize_column_mappable_to_u64(
                coerce_numerical_symbol::<u64>(op_iterator),
                cardinality,
                num_docs,
                false,
                value_index_builders,
                u64_values,
                wrt,
            )?;
        }
        NumericalType::F64 => {
            send_to_serialize_column_mappable_to_u64(
                coerce_numerical_symbol::<f64>(op_iterator),
                cardinality,
                num_docs,
                false,
                value_index_builders,
                u64_values,
                wrt,
            )?;
        }
    };
    Ok(())
}

/// Serializes a boolean column as a `u64` column, mapping every boolean through `to_u64`.
///
/// Values within a row are never sorted.
fn serialize_bool_column(
    cardinality: Cardinality,
    num_docs: RowId,
    column_operations_it: impl Iterator<Item = ColumnOperation<bool>>,
    buffers: &mut SpareBuffers,
    wrt: &mut impl io::Write,
) -> io::Result<()> {
    let u64_operations = column_operations_it.map(|operation| match operation {
        ColumnOperation::Value(bool_val) => ColumnOperation::Value(bool_val.to_u64()),
        ColumnOperation::NewDoc(doc) => ColumnOperation::NewDoc(doc),
    });
    send_to_serialize_column_mappable_to_u64(
        u64_operations,
        cardinality,
        num_docs,
        false,
        &mut buffers.value_index_builders,
        &mut buffers.u64_values,
        wrt,
    )
}

/// Serializes an IP address column through the `u128` serialization path, using the
/// dedicated `ip_addr_values` scratch buffer.
fn serialize_ip_addr_column(
    cardinality: Cardinality,
    num_docs: RowId,
    column_operations_it: impl Iterator<Item = ColumnOperation<Ipv6Addr>>,
    buffers: &mut SpareBuffers,
    wrt: &mut impl io::Write,
) -> io::Result<()> {
    send_to_serialize_column_mappable_to_u128(
        column_operations_it,
        cardinality,
        num_docs,
        &mut buffers.value_index_builders,
        &mut buffers.ip_addr_values,
        wrt,
    )
}

/// Drains `op_iterator` into `values` while building the column index matching
/// `cardinality`, then serializes both through the `u128` column serializer.
///
/// `values` is cleared first: it is a scratch buffer reused from one column to the next.
fn send_to_serialize_column_mappable_to_u128<
    T: Copy + Ord + std::fmt::Debug + Send + Sync + MonotonicallyMappableToU128 + PartialOrd,
>(
    op_iterator: impl Iterator<Item = ColumnOperation<T>>,
    cardinality: Cardinality,
    num_rows: RowId,
    value_index_builders: &mut PreallocatedIndexBuilders,
    values: &mut Vec<T>,
    mut wrt: impl io::Write,
) -> io::Result<()> {
    values.clear();
    // TODO: split index and values
    let column_index = match cardinality {
        Cardinality::Full => {
            // Every row holds exactly one value: no index needs to be materialized.
            let required_builder = value_index_builders.borrow_required_index_builder();
            consume_operation_iterator(op_iterator, required_builder, values);
            SerializableColumnIndex::Full
        }
        Cardinality::Optional => {
            let optional_builder = value_index_builders.borrow_optional_index_builder();
            consume_operation_iterator(op_iterator, optional_builder, values);
            let optional_index = optional_builder.finish(num_rows);
            SerializableColumnIndex::Optional(SerializableOptionalIndex {
                num_rows,
                non_null_row_ids: Box::new(optional_index),
            })
        }
        Cardinality::Multivalued => {
            let multivalued_builder = value_index_builders.borrow_multivalued_index_builder();
            consume_operation_iterator(op_iterator, multivalued_builder, values);
            SerializableColumnIndex::Multivalued(multivalued_builder.finish(num_rows))
        }
    };
    crate::column::serialize_column_mappable_to_u128(column_index, &&values[..], &mut wrt)?;
    Ok(())
}

/// Drains `op_iterator` into `values` while building the column index matching
/// `cardinality`, then serializes both through the `u64` column serializer.
///
/// `values` is cleared first: it is a scratch buffer reused from one column to the next.
/// `sort_values_within_row` only has an effect on multivalued columns, where the values
/// of each row are then sorted in place before serialization.
fn send_to_serialize_column_mappable_to_u64(
    op_iterator: impl Iterator<Item = ColumnOperation<u64>>,
    cardinality: Cardinality,
    num_rows: RowId,
    sort_values_within_row: bool,
    value_index_builders: &mut PreallocatedIndexBuilders,
    values: &mut Vec<u64>,
    mut wrt: impl io::Write,
) -> io::Result<()> {
    values.clear();
    let column_index = match cardinality {
        Cardinality::Full => {
            // Every row holds exactly one value: no index needs to be materialized.
            let required_builder = value_index_builders.borrow_required_index_builder();
            consume_operation_iterator(op_iterator, required_builder, values);
            SerializableColumnIndex::Full
        }
        Cardinality::Optional => {
            let optional_builder = value_index_builders.borrow_optional_index_builder();
            consume_operation_iterator(op_iterator, optional_builder, values);
            let optional_index = optional_builder.finish(num_rows);
            SerializableColumnIndex::Optional(SerializableOptionalIndex {
                non_null_row_ids: Box::new(optional_index),
                num_rows,
            })
        }
        Cardinality::Multivalued => {
            let multivalued_builder = value_index_builders.borrow_multivalued_index_builder();
            consume_operation_iterator(op_iterator, multivalued_builder, values);
            let multivalued_index = multivalued_builder.finish(num_rows);
            if sort_values_within_row {
                // The start offsets delimit the rows within `values`.
                sort_values_within_row_in_place(
                    multivalued_index.start_offsets.boxed_iter(),
                    values,
                );
            }
            SerializableColumnIndex::Multivalued(multivalued_index)
        }
    };
    crate::column::serialize_column_mappable_to_u64(column_index, &&values[..], &mut wrt)?;
    Ok(())
}

/// Sorts, in place, each run of `values` delimited by two consecutive offsets.
///
/// `multivalued_index` yields offsets into `values`. The first run starts at 0 and every
/// offset both closes the current run and opens the next one. Values located after the
/// last offset are left untouched.
///
/// # Panics
///
/// Panics if an offset is greater than `values.len()` or smaller than the previous one.
fn sort_values_within_row_in_place(
    multivalued_index: impl Iterator<Item = RowId>,
    values: &mut [u64],
) {
    let _last_row_end = multivalued_index.fold(0usize, |row_start, offset| {
        let row_end = offset as usize;
        values[row_start..row_end].sort_unstable();
        row_end
    });
}

/// Adapts an iterator of numerical operations into an iterator of `u64` operations.
///
/// `NewDoc` operations are forwarded unchanged. Each value is coerced to `T` and then
/// mapped to its `u64` representation.
fn coerce_numerical_symbol<T>(
    operation_iterator: impl Iterator<Item = ColumnOperation<NumericalValue>>,
) -> impl Iterator<Item = ColumnOperation<u64>>
where T: Coerce + MonotonicallyMappableToU64 {
    operation_iterator.map(|operation| {
        let numerical_value = match operation {
            ColumnOperation::Value(numerical_value) => numerical_value,
            ColumnOperation::NewDoc(doc) => return ColumnOperation::NewDoc(doc),
        };
        let coerced: T = T::coerce(numerical_value);
        ColumnOperation::Value(coerced.to_u64())
    })
}

/// Drains `operation_iterator`, feeding the index builder and collecting the values.
///
/// * `NewDoc` operations are reported to `index_builder` through `record_row`.
/// * `Value` operations are reported through `record_value`, and the value itself is
///   appended to `values` in the order it was encountered.
fn consume_operation_iterator<T: Ord, TIndexBuilder: IndexBuilder>(
    operation_iterator: impl Iterator<Item = ColumnOperation<T>>,
    index_builder: &mut TIndexBuilder,
    values: &mut Vec<T>,
) {
    operation_iterator.for_each(|operation| match operation {
        ColumnOperation::Value(value) => {
            index_builder.record_value();
            values.push(value);
        }
        ColumnOperation::NewDoc(row_id) => index_builder.record_row(row_id),
    });
}

#[cfg(test)]
mod tests {
    use stacker::MemoryArena;

    use crate::columnar::writer::column_operation::ColumnOperation;
    use crate::{Cardinality, NumericalValue};

    /// One value in each of the three rows: full cardinality, and every value is
    /// preceded by its `NewDoc` marker.
    #[test]
    fn test_column_writer_required_simple() {
        let mut arena = MemoryArena::default();
        let mut column_writer = super::ColumnWriter::default();
        for (row_id, value) in [(0u32, 14i64), (1u32, 15i64), (2u32, -16i64)] {
            column_writer.record(row_id, NumericalValue::from(value), &mut arena);
        }
        assert_eq!(column_writer.get_cardinality(3), Cardinality::Full);
        let mut buffer = Vec::new();
        let symbols: Vec<ColumnOperation<NumericalValue>> = column_writer
            .operation_iterator(&arena, &mut buffer)
            .collect();
        assert_eq!(symbols.len(), 6);
        assert!(matches!(
            symbols.as_slice(),
            [
                ColumnOperation::NewDoc(0u32),
                ColumnOperation::Value(NumericalValue::I64(14i64)),
                ColumnOperation::NewDoc(1u32),
                ColumnOperation::Value(NumericalValue::I64(15i64)),
                ColumnOperation::NewDoc(2u32),
                ColumnOperation::Value(NumericalValue::I64(-16i64)),
            ]
        ));
    }

    /// Row 0 has no value: the column is optional.
    #[test]
    fn test_column_writer_optional_cardinality_missing_first() {
        let mut arena = MemoryArena::default();
        let mut column_writer = super::ColumnWriter::default();
        for (row_id, value) in [(1u32, 15i64), (2u32, -16i64)] {
            column_writer.record(row_id, NumericalValue::from(value), &mut arena);
        }
        assert_eq!(column_writer.get_cardinality(3), Cardinality::Optional);
        let mut buffer = Vec::new();
        let symbols: Vec<ColumnOperation<NumericalValue>> = column_writer
            .operation_iterator(&arena, &mut buffer)
            .collect();
        assert_eq!(symbols.len(), 4);
        assert!(matches!(
            symbols.as_slice(),
            [
                ColumnOperation::NewDoc(1u32),
                ColumnOperation::Value(NumericalValue::I64(15i64)),
                ColumnOperation::NewDoc(2u32),
                ColumnOperation::Value(NumericalValue::I64(-16i64)),
            ]
        ));
    }

    /// The last row has no value: the column is optional.
    #[test]
    fn test_column_writer_optional_cardinality_missing_last() {
        let mut arena = MemoryArena::default();
        let mut column_writer = super::ColumnWriter::default();
        column_writer.record(0u32, NumericalValue::from(15i64), &mut arena);
        assert_eq!(column_writer.get_cardinality(2), Cardinality::Optional);
        let mut buffer = Vec::new();
        let symbols: Vec<ColumnOperation<NumericalValue>> = column_writer
            .operation_iterator(&arena, &mut buffer)
            .collect();
        assert_eq!(symbols.len(), 2);
        assert!(matches!(
            symbols.as_slice(),
            [
                ColumnOperation::NewDoc(0u32),
                ColumnOperation::Value(NumericalValue::I64(15i64)),
            ]
        ));
    }

    /// Two values in the same row: the column is multivalued and a single `NewDoc`
    /// marker precedes both values.
    #[test]
    fn test_column_writer_multivalued() {
        let mut arena = MemoryArena::default();
        let mut column_writer = super::ColumnWriter::default();
        for value in [16i64, 17i64] {
            column_writer.record(0u32, NumericalValue::from(value), &mut arena);
        }
        assert_eq!(column_writer.get_cardinality(1), Cardinality::Multivalued);
        let mut buffer = Vec::new();
        let symbols: Vec<ColumnOperation<NumericalValue>> = column_writer
            .operation_iterator(&arena, &mut buffer)
            .collect();
        assert_eq!(symbols.len(), 3);
        assert!(matches!(
            symbols.as_slice(),
            [
                ColumnOperation::NewDoc(0u32),
                ColumnOperation::Value(NumericalValue::I64(16i64)),
                ColumnOperation::Value(NumericalValue::I64(17i64)),
            ]
        ));
    }
}


================================================
FILE: columnar/src/columnar/writer/serializer.rs
================================================
use std::io;
use std::io::Write;

use common::json_path_writer::JSON_END_OF_PATH;
use common::{BinarySerializable, CountingWriter};
use sstable::RangeSSTable;
use sstable::value::RangeValueWriter;

use crate::RowId;
use crate::columnar::ColumnType;

/// Serializer writing column payloads to an underlying writer, while recording in an
/// in-memory sstable the byte range occupied by each column.
pub struct ColumnarSerializer<W: io::Write> {
    // Output writer. It counts the bytes written, which is how column byte ranges
    // are computed.
    wrt: CountingWriter<W>,
    // In-memory sstable associating each prepared column key with its byte range.
    // It is appended to the output by `finalize`.
    sstable_range: sstable::Writer<Vec<u8>, RangeValueWriter>,
    // Scratch buffer holding the key of the column currently being serialized.
    prepare_key_buffer: Vec<u8>,
}

/// Fills `buffer` with the sstable key of a column.
///
/// The key is the concatenation of `key`, the `JSON_END_OF_PATH` byte and the code of
/// `column_type`. Any previous content of `buffer` is discarded.
fn prepare_key(key: &[u8], column_type: ColumnType, buffer: &mut Vec<u8>) {
    let suffix = [JSON_END_OF_PATH, column_type.to_code()];
    buffer.clear();
    buffer.extend_from_slice(key);
    buffer.extend_from_slice(&suffix);
}

impl<W: io::Write> ColumnarSerializer<W> {
    /// Wraps `wrt` into a serializer with an empty column-range sstable.
    pub(crate) fn new(wrt: W) -> ColumnarSerializer<W> {
        let range_buffer: Vec<u8> = Vec::with_capacity(100_000);
        let sstable_range: sstable::Writer<Vec<u8>, RangeValueWriter> =
            sstable::Dictionary::<RangeSSTable>::builder(range_buffer).unwrap();
        Self {
            wrt: CountingWriter::wrap(wrt),
            sstable_range,
            prepare_key_buffer: Vec::new(),
        }
    }

    /// Starts the serialization of a column and returns its `ColumnSerializer`.
    ///
    /// The column key is prepared right away; the current write position is remembered
    /// as the start of the column's byte range.
    pub fn start_serialize_column<'a>(
        &'a mut self,
        column_name: &[u8],
        column_type: ColumnType,
    ) -> ColumnSerializer<'a, W> {
        prepare_key(column_name, column_type, &mut self.prepare_key_buffer);
        let start_offset = self.wrt.written_bytes();
        ColumnSerializer {
            start_offset,
            columnar_serializer: self,
        }
    }

    /// Writes the trailing section of the file and flushes the writer.
    ///
    /// The trailer consists, in this order, of: the column-range sstable, its length in
    /// bytes as a little-endian `u64`, the serialized number of rows, and the format
    /// version footer.
    pub(crate) fn finalize(mut self, num_rows: RowId) -> io::Result<()> {
        let sstable_bytes: Vec<u8> = self.sstable_range.finish()?;
        let sstable_len_bytes = (sstable_bytes.len() as u64).to_le_bytes();
        self.wrt.write_all(&sstable_bytes)?;
        self.wrt.write_all(&sstable_len_bytes[..])?;
        num_rows.serialize(&mut self.wrt)?;
        self.wrt
            .write_all(&super::super::format_version::footer())?;
        self.wrt.flush()
    }
}

/// Writer for the payload of a single column.
///
/// Bytes written through it are forwarded to the parent `ColumnarSerializer`. Calling
/// `finalize` registers the byte range of the column.
pub struct ColumnSerializer<'a, W: io::Write> {
    // Parent serializer, borrowed exclusively while the column is being written.
    columnar_serializer: &'a mut ColumnarSerializer<W>,
    // Number of bytes the parent had written when this column was started.
    start_offset: u64,
}

impl<W: io::Write> ColumnSerializer<'_, W> {
    /// Registers the byte range written for this column under the prepared key, then
    /// clears the key buffer.
    pub fn finalize(self) -> io::Result<()> {
        let Self {
            columnar_serializer,
            start_offset,
        } = self;
        let byte_range = start_offset..columnar_serializer.wrt.written_bytes();
        columnar_serializer
            .sstable_range
            .insert(&columnar_serializer.prepare_key_buffer[..], &byte_range)?;
        columnar_serializer.prepare_key_buffer.clear();
        Ok(())
    }
}

/// All write operations are delegated to the counting writer of the parent serializer.
impl<W: io::Write> io::Write for ColumnSerializer<'_, W> {
    fn write(&mut self, buf: &[u8]) -> io::Result<usize> {
        let inner = &mut self.columnar_serializer.wrt;
        inner.write(buf)
    }

    fn flush(&mut self) -> io::Result<()> {
        let inner = &mut self.columnar_serializer.wrt;
        inner.flush()
    }

    fn write_all(&mut self, buf: &[u8]) -> io::Result<()> {
        let inner = &mut self.columnar_serializer.wrt;
        inner.write_all(buf)
    }
}


================================================
FILE: columnar/src/columnar/writer/value_index.rs
================================================
use crate::RowId;
use crate::column_index::{SerializableMultivalueIndex, SerializableOptionalIndex};
use crate::iterable::Iterable;

/// The `IndexBuilder` interprets a sequence of
/// calls of the form:
/// (record_row,record_value+)*
/// and can then serialize the results into an index to associate docids with their value[s].
///
/// It has different implementation depending on whether the
/// cardinality is full, optional, or multivalued.
pub(crate) trait IndexBuilder {
    /// Signals that the values recorded next belong to the row `doc`.
    fn record_row(&mut self, doc: RowId);
    /// Signals that one value was recorded for the current row.
    ///
    /// The default implementation does nothing.
    #[inline]
    fn record_value(&mut self) {}
}

/// The FullIndexBuilder does nothing.
///
/// It holds no state: `record_row` is empty and `record_value` keeps the empty default
/// implementation of the trait.
#[derive(Default)]
pub struct FullIndexBuilder;

impl IndexBuilder for FullIndexBuilder {
    // Intentionally empty: this builder stores no per-row information.
    #[inline(always)]
    fn record_row(&mut self, _doc: RowId) {}
}

/// Index builder collecting the ids of the rows passed to `record_row`.
#[derive(Default)]
pub struct OptionalIndexBuilder {
    // Recorded row ids. Debug builds assert that they are strictly increasing.
    docs: Vec<RowId>,
}

impl OptionalIndexBuilder {
    /// Returns the row ids recorded so far.
    ///
    /// In debug builds, checks that the last recorded row id is smaller than `num_rows`.
    pub fn finish(&mut self, num_rows: RowId) -> impl Iterable<RowId> + '_ {
        if let Some(&last_doc) = self.docs.last() {
            debug_assert!(last_doc < num_rows);
        }
        self.docs.as_slice()
    }

    /// Forgets all recorded rows, keeping the allocated capacity.
    fn reset(&mut self) {
        self.docs.clear();
    }
}

impl IndexBuilder for OptionalIndexBuilder {
    /// Appends `doc` to the recorded rows.
    ///
    /// In debug builds, checks that `doc` is greater than the previously recorded row.
    #[inline(always)]
    fn record_row(&mut self, doc: RowId) {
        if let Some(&prev_doc) = self.docs.last() {
            debug_assert!(doc > prev_doc);
        }
        self.docs.push(doc);
    }
}

/// Index builder for rows that may hold several values.
///
/// It tracks which rows received at least one value, and the offset at which the values
/// of each of these rows start.
#[derive(Default)]
pub struct MultivaluedIndexBuilder {
    // Ids of the rows for which at least one value was recorded.
    doc_with_values: Vec<RowId>,
    // For each entry of `doc_with_values`, the number of values recorded before the
    // first value of that row. `finish` appends the total number of values.
    start_offsets: Vec<u32>,
    // Total number of values recorded so far.
    total_num_vals_seen: u32,
    // Row passed to the latest `record_row` call.
    current_row: RowId,
    // Whether a value was already recorded for `current_row`.
    current_row_has_value: bool,
}

impl MultivaluedIndexBuilder {
    pub fn finish(&mut self, num_docs: RowId) -> SerializableMultivalueIndex<'_> {
        self.start_offsets.push(self.total_num_vals_seen);
        let non_null_row_ids: Box<dyn Iterable<RowId>> = Box::new(&self.doc_with_values[..]);
        SerializableMultivalueIndex {
            doc_ids_with_values: SerializableOptionalIndex {
                non_null_row_ids,
                num_rows: num_docs,
            },
            start_offsets: Box::new(&self.start_offsets[..]),
        }
    }

    fn reset(&mut self) {
        self.doc_with_values.clear();
        self.start_offsets.clear();
        self.total_num_vals_seen = 0;
        self.current_row = 0;
        self.current_row_has_value = false;
    }
}

impl IndexBuilder for MultivaluedIndexBuilder {
    /// Makes `row_id` the current row. Nothing is stored until it receives a value.
    fn record_row(&mut self, row_id: RowId) {
        self.current_row_has_value = false;
        self.current_row = row_id;
    }

    /// Counts one more value for the current row.
    ///
    /// On the first value of a row, the row id and the offset of that value are stored.
    fn record_value(&mut self) {
        let row_already_had_value = std::mem::replace(&mut self.current_row_has_value, true);
        if !row_already_had_value {
            self.doc_with_values.push(self.current_row);
            self.start_offsets.push(self.total_num_vals_seen);
        }
        self.total_num_vals_seen += 1;
    }
}

/// The `PreallocatedIndexBuilders` is there to avoid allocating a
/// new index builder for every single column.
///
/// It holds one builder per cardinality. The optional and multivalued builders are
/// reset each time they are borrowed.
#[derive(Default)]
pub struct PreallocatedIndexBuilders {
    required_index_builder: FullIndexBuilder,
    optional_index_builder: OptionalIndexBuilder,
    multivalued_index_builder: MultivaluedIndexBuilder,
}

impl PreallocatedIndexBuilders {
    /// Returns the builder for full columns. It is stateless, so no reset is needed.
    pub fn borrow_required_index_builder(&mut self) -> &mut FullIndexBuilder {
        &mut self.required_index_builder
    }

    /// Returns the builder for optional columns, reset to its initial state.
    pub fn borrow_optional_index_builder(&mut self) -> &mut OptionalIndexBuilder {
        let builder = &mut self.optional_index_builder;
        builder.reset();
        builder
    }

    /// Returns the builder for multivalued columns, reset to its initial state.
    pub fn borrow_multivalued_index_builder(&mut self) -> &mut MultivaluedIndexBuilder {
        let builder = &mut self.multivalued_index_builder;
        builder.reset();
        builder
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Collects the start offsets exposed by a finished multivalued index.
    fn collect_start_offsets(index: &SerializableMultivalueIndex<'_>) -> Vec<u32> {
        index.start_offsets.boxed_iter().collect()
    }

    /// Records one row holding two values.
    fn record_single_row_with_two_values(builder: &mut MultivaluedIndexBuilder) {
        builder.record_row(0u32);
        builder.record_value();
        builder.record_value();
    }

    /// The optional builder reports the recorded rows, and starts afresh after a reset.
    #[test]
    fn test_optional_value_index_builder() {
        let mut opt_value_index_builder = OptionalIndexBuilder::default();

        opt_value_index_builder.record_row(0u32);
        opt_value_index_builder.record_value();
        let row_ids: Vec<u32> = opt_value_index_builder
            .finish(1u32)
            .boxed_iter()
            .collect();
        assert_eq!(row_ids, vec![0u32]);

        opt_value_index_builder.reset();
        opt_value_index_builder.record_row(1u32);
        opt_value_index_builder.record_value();
        let row_ids: Vec<u32> = opt_value_index_builder
            .finish(2u32)
            .boxed_iter()
            .collect();
        assert_eq!(row_ids, vec![1u32]);
    }

    /// The same sequence of calls yields the same offsets before and after a reset.
    #[test]
    fn test_multivalued_value_index_builder_simple() {
        let mut multivalued_value_index_builder = MultivaluedIndexBuilder::default();

        record_single_row_with_two_values(&mut multivalued_value_index_builder);
        let start_offsets = collect_start_offsets(&multivalued_value_index_builder.finish(1u32));
        assert_eq!(start_offsets, vec![0u32, 2u32]);

        multivalued_value_index_builder.reset();
        record_single_row_with_two_values(&mut multivalued_value_index_builder);
        let start_offsets = collect_start_offsets(&multivalued_value_index_builder.finish(1u32));
        assert_eq!(start_offsets, vec![0u32, 2u32]);
    }

    /// Rows without values (0 and 3 here) do not appear in the row ids with values.
    #[test]
    fn test_multivalued_value_index_builder() {
        let mut multivalued_value_index_builder = MultivaluedIndexBuilder::default();
        multivalued_value_index_builder.record_row(1u32);
        multivalued_value_index_builder.record_value();
        multivalued_value_index_builder.record_value();
        multivalued_value_index_builder.record_row(2u32);
        multivalued_value_index_builder.record_value();

        let SerializableMultivalueIndex {
            doc_ids_with_values,
            start_offsets,
        } = multivalued_value_index_builder.finish(4u32);

        assert_eq!(doc_ids_with_values.num_rows, 4u32);
        let rows_with_values: Vec<u32> =
            doc_ids_with_values.non_null_row_ids.boxed_iter().collect();
        assert_eq!(rows_with_values, vec![1u32, 2u32]);
        let start_offsets: Vec<u32> = start_offsets.boxed_iter().collect();
        assert_eq!(start_offsets, vec![0u32, 2u32, 3u32]);
    }
}


================================================
FILE: columnar/src/compat_tests.rs
================================================
use std::path::PathBuf;

use itertools::Itertools;

use crate::{
    CURRENT_VERSION, Cardinality, Column, ColumnarReader, DynamicColumn, StackMergeOrder,
    merge_columnar,
};

// Number of rows of the columnars generated by these tests (65_535).
const NUM_DOCS: u32 = u16::MAX as u32;

/// Builds a serialized columnar with `num_docs` rows and four numerical columns.
///
/// The value recorded for row `i` is always `value_offset + i`:
/// * `sparse` has a value every 100 rows,
/// * `dense` has a value every 5 rows,
/// * `full` has one value in every row,
/// * `multi` has the same value twice in every row.
fn generate_columnar(num_docs: u32, value_offset: u64) -> Vec<u8> {
    use crate::ColumnarWriter;

    let mut columnar_writer = ColumnarWriter::default();

    for row_id in 0..num_docs {
        let value = value_offset + row_id as u64;
        if row_id % 100 == 0 {
            columnar_writer.record_numerical(row_id, "sparse", value);
        }
        if row_id % 5 == 0 {
            columnar_writer.record_numerical(row_id, "dense", value);
        }
        columnar_writer.record_numerical(row_id, "full", value);
        for _ in 0..2 {
            columnar_writer.record_numerical(row_id, "multi", value);
        }
    }

    let mut serialized: Vec<u8> = Vec::new();
    columnar_writer.serialize(num_docs, &mut serialized).unwrap();
    serialized
}

#[test]
/// Writes a columnar for the CURRENT_VERSION to disk, unless the file already exists.
fn create_format() {
    let file_path = path_for_version(&CURRENT_VERSION.to_string());
    let already_written = PathBuf::from(&file_path).exists();
    if !already_written {
        let columnar = generate_columnar(NUM_DOCS, 0);
        std::fs::write(file_path, columnar).unwrap();
    }
}

/// Returns the relative path of the compatibility fixture of the given format version.
fn path_for_version(version: &str) -> String {
    format!("./compat_tests_data/{version}.columnar")
}

#[test]
/// Checks that the columnar stored for format `v1` can still be read and merged.
fn test_format_v1() {
    test_format(&path_for_version("v1"));
}

#[test]
/// Checks that the columnar stored for format `v2` can still be read and merged.
fn test_format_v2() {
    test_format(&path_for_version("v2"));
}

/// Reads the columnar stored at `path` and checks its columns, then stacks it with a
/// freshly generated columnar and checks the columns of the merged result.
fn test_format(path: &str) {
    let stored_bytes = std::fs::read(path).unwrap();
    let stored_reader = ColumnarReader::open(stored_bytes).unwrap();
    check_columns(&stored_reader);

    // Test merge
    let fresh_bytes = generate_columnar(NUM_DOCS, NUM_DOCS as u64);
    let fresh_reader = ColumnarReader::open(fresh_bytes).unwrap();
    let columnar_readers = vec![&stored_reader, &fresh_reader];
    let merge_row_order = StackMergeOrder::stack(&columnar_readers[..]);
    let mut merged_bytes = Vec::new();
    merge_columnar(
        &columnar_readers,
        &[],
        merge_row_order.into(),
        &mut merged_bytes,
    )
    .unwrap();
    let merged_reader = ColumnarReader::open(merged_bytes).unwrap();
    check_columns(&merged_reader);
}

fn check_columns(reader: &ColumnarReader) {
    let column = open_column(reader, "full");
    check_column(&column, |doc_id| vec![(doc_id, doc_id as u64).into()]);
    assert_eq!(column.get_cardinality(), Cardinality::Full);

    let column = open_column(reader, "multi");
    check_column(&column, |doc_id| {
        vec![
            (doc_id * 2, doc_id as u64).into(),
            (doc_id * 2 + 1, doc_id as u64).into(),
        ]
    });
    assert_eq!(column.get_cardinality(), Cardinality::Multivalued);

    let column = open_column(reader, "sparse");
    check_column(&column, |doc_id| {
        if doc_id % 100 == 0 {
            vec![(doc_id / 100, doc_id as u64).into()]
        } else {
            vec![]
        }
    });
    assert_eq!(column.get_cardinality(), Cardinality::Optional);

    let column = open_column(reader, "dense");
    check_column(&column, |doc_id| {
        if doc_id % 5 == 0 {
            vec![(doc_id / 5, doc_id as u64).into()]
        } else {
            vec![]
        }
    });
    assert_eq!(column.get_cardinality(), Cardinality::Optional);
}

/// Expected position (`row_id`) and content (`value`) of one value of a column.
struct RowIdAndValue {
    row_id: u32,
    value: u64,
}

/// Allows writing expectations as plain `(row_id, value)` tuples.
impl From<(u32, u64)> for RowIdAndValue {
    fn from(pair: (u32, u64)) -> Self {
        let (row_id, value) = pair;
        RowIdAndValue { row_id, value }
    }
}

/// Compares `column` against the `expected` values on a handful of docs.
///
/// `expected(doc)` returns, in order, the row id and the value of every value the doc
/// is supposed to hold. It is called several times per doc, so it should be cheap and
/// deterministic.
///
/// The docs probed are `0`, the last two docs, and doc `65000`.
fn check_column<F: Fn(u32) -> Vec<RowIdAndValue>>(column: &Column<u64>, expected: F) {
    let num_docs = column.num_docs();
    let test_doc = |doc: u32| {
        // `first` must be the first expected value, or `None` for a doc without value.
        if expected(doc).is_empty() {
            assert_eq!(column.first(doc), None);
        } else {
            assert_eq!(column.first(doc), Some(expected(doc)[0].value));
        }
        let values = column.values_for_doc(doc).collect_vec();
        assert_eq!(values, expected(doc).iter().map(|x| x.value).collect_vec());
        let mut row_ids = Vec::new();
        column.row_ids_for_docs(&[doc], &mut vec![], &mut row_ids);
        assert_eq!(
            row_ids,
            expected(doc).iter().map(|x| x.row_id).collect_vec()
        );
        // NOTE(review): same check as a few lines above; presumably kept to verify that
        // the values are unchanged after `row_ids_for_docs` — confirm.
        let values = column.values_for_doc(doc).collect_vec();
        assert_eq!(values, expected(doc).iter().map(|x| x.value).collect_vec());

        // Docid rowid conversion
        let mut row_ids = Vec::new();
        // Next doc, clamped to the last doc so that it stays below `num_docs`.
        let safe_next_doc = |doc: u32| (doc + 1).min(num_docs - 1);
        column
            .index
            .docids_to_rowids(&[doc, safe_next_doc(doc)], &mut vec![], &mut row_ids);
        // Expected row ids of `doc` followed by those of the next doc. For the last doc,
        // the next doc is the doc itself, so its row ids are expected twice.
        let expected_rowids = expected(doc)
            .iter()
            .map(|x| x.row_id)
            .chain(expected(safe_next_doc(doc)).iter().map(|x| x.row_id))
            .collect_vec();
        assert_eq!(row_ids, expected_rowids);
        let rowid_range = column
            .index
            .docid_range_to_rowids(doc..safe_next_doc(doc) + 1);
        if expected_rowids.is_empty() {
            assert!(rowid_range.is_empty());
        } else {
            // The range must span from the first to the last expected row id (inclusive).
            assert_eq!(
                rowid_range,
                expected_rowids[0]..expected_rowids.last().unwrap() + 1
            );
        }
    };
    test_doc(0);
    test_doc(num_docs - 1);
    test_doc(num_docs - 2);
    test_doc(65000);
}

/// Opens the first column named `name` and coerces it to a `u64` column.
///
/// # Panics
///
/// Panics if the column cannot be read, opened or coerced to `u64`, or if no column
/// has that name.
fn open_column(reader: &ColumnarReader, name: &str) -> Column<u64> {
    let handles = reader.read_columns(name).unwrap();
    let dynamic_column = handles[0].open().unwrap();
    let coerced_column = dynamic_column
        .coerce_numerical(crate::NumericalType::U64)
        .unwrap();
    match coerced_column {
        DynamicColumn::U64(column) => column,
        _ => panic!(),
    }
}


================================================
FILE: columnar/src/dictionary.rs
================================================
use std::io;

use sstable::SSTable;
use stacker::{MemoryArena, SharedArenaHashMap};

/// Lookup table from `UnorderedId` to `OrderedId`.
pub(crate) struct TermIdMapping {
    // Indexed by the raw value of the `UnorderedId`.
    unordered_to_ord: Vec<OrderedId>,
}

impl TermIdMapping {
    /// Returns the ordered id associated with `unordered`.
    ///
    /// # Panics
    ///
    /// Panics if `unordered` is not covered by the mapping.
    pub fn to_ord(&self, unordered: UnorderedId) -> OrderedId {
        let UnorderedId(raw_id) = unordered;
        self.unordered_to_ord[raw_id as usize]
    }
}

/// Temporary identifier of a value.
///
/// The ordered id of a value cannot be known while values are still being added, so
/// values first receive an `UnorderedId`. It is mapped to an `OrderedId` upon
/// serialization.
#[derive(Clone, Copy, Debug, Hash, PartialEq, Eq)]
pub struct UnorderedId(pub u32);

/// Identifier of a value once values have been ordered.
#[derive(Clone, Copy, Hash, PartialEq, Eq, Debug)]
pub struct OrderedId(pub u32);

/// `DictionaryBuilder` for dictionary encoding.
///
/// It stores the different terms encountered and assigns them a temporary value
/// we call unordered id.
///
/// Upon serialization, we will sort the terms and hence build a `UnorderedId -> Term ordinal`
/// mapping.
#[derive(Default)]
pub(crate) struct DictionaryBuilder {
    // Maps each term to the raw value of its unordered id.
    dict: SharedArenaHashMap,
}

impl DictionaryBuilder {
    /// Get or allocate an unordered id.
    /// (This ID is simply an auto-incremented id.)
    pub fn get_or_allocate_id(&mut self, term: &[u8], arena: &mut MemoryArena) -> UnorderedId {
        let next_id = self.dict.len() as u32;
        let unordered_id = self
            .dict
            .mutate_or_create(term, arena, |unordered_id: Option<u32>| {
                if let Some(unordered_id) = unordered_id {
                    unordered_id
                } else {
                    next_id
                }
            });
        UnorderedId(unordered_id)
    }

    /// Serialize the dictionary into an fst, and returns the
    /// `UnorderedId -> TermOrdinal` map.
    pub fn serialize<'a, W: io::Write + 'a>(
        &self,
        arena: &MemoryArena,
        wrt: &mut W,
    ) -> io::Result<TermIdMapping> {
        let mut terms: Vec<(&[u8], UnorderedId)> = self
            .dict
            .iter(arena)
            .map(|(k, v)| (k, arena.read(v)))
            .collect();
        terms.sort_unstable_by_key(|(key, _)| *key);
        // TODO Remove the allocation.
        let mut unordered_to_ord: Vec<OrderedId> = vec![OrderedId(0u32); terms.len()];
        let mut sstable_builder = sstable::VoidSSTable::writer(wrt);
        for (ord, (key, unordered_id)) in terms.into_iter().enumerate() {
            let ordered_id = OrderedId(ord as u32);
            sstable_builder.insert(key, &())?;
            unordered_to_ord[unordered_id.0 as usize] = ordered_id;
        }
        sstable_builder.finish()?;
        Ok(TermIdMapping { unordered_to_ord })
    }

    pub(crate) fn mem_usage(&self) -> usize {
        self.dict.mem_usage()
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Terms inserted as "hello", "happy", "tax" sort as "happy" < "hello" < "tax".
    #[test]
    fn test_dictionary_builder() {
        let mut arena = MemoryArena::default();
        let mut dictionary_builder = DictionaryBuilder::default();
        let hello_uid = dictionary_builder.get_or_allocate_id(b"hello", &mut arena);
        let happy_uid = dictionary_builder.get_or_allocate_id(b"happy", &mut arena);
        let tax_uid = dictionary_builder.get_or_allocate_id(b"tax", &mut arena);

        let mut buffer = Vec::new();
        let id_mapping = dictionary_builder.serialize(&arena, &mut buffer).unwrap();

        let ordinals = [hello_uid, happy_uid, tax_uid].map(|uid| id_mapping.to_ord(uid));
        assert_eq!(ordinals, [OrderedId(1), OrderedId(0), OrderedId(2)]);
    }
}


================================================
FILE: columnar/src/dynamic_column.rs
================================================
use std::net::Ipv6Addr;
use std::sync::Arc;
use std::{fmt, io};

use common::file_slice::FileSlice;
use common::{ByteCount, DateTime, OwnedBytes};
use serde::{Deserialize, Serialize};

use crate::column::{BytesColumn, Column, StrColumn};
use crate::column_values::{StrictlyMonotonicFn, monotonic_map_column};
use crate::columnar::ColumnType;
use crate::{Cardinality, ColumnIndex, ColumnValues, NumericalType, Version};

/// A column whose value type is only known at runtime.
///
/// There is one variant per supported column type, each wrapping the matching typed
/// column.
#[derive(Clone)]
pub enum DynamicColumn {
    Bool(Column<bool>),
    I64(Column<i64>),
    U64(Column<u64>),
    F64(Column<f64>),
    IpAddr(Column<Ipv6Addr>),
    DateTime(Column<DateTime>),
    Bytes(BytesColumn),
    Str(StrColumn),
}

impl fmt::Debug for DynamicColumn {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "[{} {} |", self.get_cardinality(), self.column_type())?;
        match self {
            DynamicColumn::Bool(col) => write!(f, " {col:?}")?,
            DynamicColumn::I64(col) => write!(f, " {col:?}")?,
            DynamicColumn::U64(col) => write!(f, " {col:?}")?,
            DynamicColumn::F64(col) => write!(f, "{col:?}")?,
            DynamicColumn::IpAddr(col) => write!(f, "{col:?}")?,
            DynamicColumn::DateTime(col) => write!(f, "{col:?}")?,
            DynamicColumn::Bytes(col) => write!(f, "{col:?}")?,
            DynamicColumn::Str(col) => write!(f, "{col:?}")?,
        }
        write!(f, "]")
    }
}

impl DynamicColumn {
    /// Returns the index of the column. For `Bytes` and `Str`, this is the index of the
    /// ordinal column.
    pub fn column_index(&self) -> &ColumnIndex {
        match self {
            Self::Bool(column) => &column.index,
            Self::I64(column) => &column.index,
            Self::U64(column) => &column.index,
            Self::F64(column) => &column.index,
            Self::IpAddr(column) => &column.index,
            Self::DateTime(column) => &column.index,
            Self::Bytes(column) => &column.ords().index,
            Self::Str(column) => &column.ords().index,
        }
    }

    /// Returns the cardinality reported by the column index.
    pub fn get_cardinality(&self) -> Cardinality {
        let column_index = self.column_index();
        column_index.get_cardinality()
    }

    /// Returns the number of values of the column. For `Bytes` and `Str`, this is the
    /// number of values of the ordinal column.
    pub fn num_values(&self) -> u32 {
        match self {
            Self::Bool(column) => column.values.num_vals(),
            Self::I64(column) => column.values.num_vals(),
            Self::U64(column) => column.values.num_vals(),
            Self::F64(column) => column.values.num_vals(),
            Self::IpAddr(column) => column.values.num_vals(),
            Self::DateTime(column) => column.values.num_vals(),
            Self::Bytes(column) => column.ords().values.num_vals(),
            Self::Str(column) => column.ords().values.num_vals(),
        }
    }

    /// Returns the `ColumnType` matching the variant.
    pub fn column_type(&self) -> ColumnType {
        match self {
            Self::Bool(_) => ColumnType::Bool,
            Self::I64(_) => ColumnType::I64,
            Self::U64(_) => ColumnType::U64,
            Self::F64(_) => ColumnType::F64,
            Self::IpAddr(_) => ColumnType::IpAddr,
            Self::DateTime(_) => ColumnType::DateTime,
            Self::Bytes(_) => ColumnType::Bytes,
            Self::Str(_) => ColumnType::Str,
        }
    }

    /// Converts the column to the requested numerical type.
    ///
    /// Returns `None` if the column is not numerical, or if the conversion is refused:
    /// an `i64` column with a negative minimum cannot become `u64`, a `u64` column whose
    /// maximum exceeds `i64::MAX` cannot become `i64`, and an `f64` column cannot become
    /// an integer column.
    pub fn coerce_numerical(self, target_numerical_type: NumericalType) -> Option<Self> {
        match target_numerical_type {
            NumericalType::F64 => self.coerce_to_f64(),
            NumericalType::I64 => self.coerce_to_i64(),
            NumericalType::U64 => self.coerce_to_u64(),
        }
    }

    /// Returns true if the column type has a numerical type.
    pub fn is_numerical(&self) -> bool {
        let numerical_type = self.column_type().numerical_type();
        numerical_type.is_some()
    }

    /// Returns true if the numerical type of the column is `F64`.
    pub fn is_f64(&self) -> bool {
        let numerical_type = self.column_type().numerical_type();
        numerical_type == Some(NumericalType::F64)
    }

    /// Returns true if the numerical type of the column is `I64`.
    pub fn is_i64(&self) -> bool {
        let numerical_type = self.column_type().numerical_type();
        numerical_type == Some(NumericalType::I64)
    }

    /// Returns true if the numerical type of the column is `U64`.
    pub fn is_u64(&self) -> bool {
        let numerical_type = self.column_type().numerical_type();
        numerical_type == Some(NumericalType::U64)
    }

    /// Integer columns are wrapped into an `f64` view; `f64` columns are returned as is.
    fn coerce_to_f64(self) -> Option<DynamicColumn> {
        let coerced = match self {
            Self::F64(_) => self,
            Self::I64(Column { index, values }) => Self::F64(Column {
                index,
                values: Arc::new(monotonic_map_column(values, MapI64ToF64)),
            }),
            Self::U64(Column { index, values }) => Self::F64(Column {
                index,
                values: Arc::new(monotonic_map_column(values, MapU64ToF64)),
            }),
            _ => return None,
        };
        Some(coerced)
    }

    /// `u64` columns are accepted only if all their values fit in an `i64`.
    fn coerce_to_i64(self) -> Option<DynamicColumn> {
        match self {
            Self::I64(_) => Some(self),
            Self::U64(column) if column.max_value() <= i64::MAX as u64 => {
                let Column { index, values } = column;
                Some(Self::I64(Column {
                    index,
                    values: Arc::new(monotonic_map_column(values, MapU64ToI64)),
                }))
            }
            _ => None,
        }
    }

    /// `i64` columns are accepted only if they hold no negative value.
    fn coerce_to_u64(self) -> Option<DynamicColumn> {
        match self {
            Self::U64(_) => Some(self),
            Self::I64(column) if column.min_value() >= 0 => {
                let Column { index, values } = column;
                Some(Self::U64(Column {
                    index,
                    values: Arc::new(monotonic_map_column(values, MapI64ToU64)),
                }))
            }
            _ => None,
        }
    }
}

/// Mapping between `i64` and `f64` based on `as` casts.
struct MapI64ToF64;
impl StrictlyMonotonicFn<i64, f64> for MapI64ToF64 {
    // NOTE(review): an `f64` cannot represent every `i64` exactly, so very large
    // magnitudes are rounded by this cast — confirm this is acceptable for callers.
    #[inline(always)]
    fn mapping(&self, inp: i64) -> f64 {
        inp as f64
    }
    // Float to integer `as` casts truncate toward zero, saturate at the bounds of the
    // integer type and turn NaN into 0.
    #[inline(always)]
    fn inverse(&self, out: f64) -> i64 {
        out as i64
    }
}

/// Mapping between `u64` and `f64` based on `as` casts.
struct MapU64ToF64;
impl StrictlyMonotonicFn<u64, f64> for MapU64ToF64 {
    // NOTE(review): an `f64` cannot represent every `u64` exactly, so very large values
    // are rounded by this cast — confirm this is acceptable for callers.
    #[inline(always)]
    fn mapping(&self, inp: u64) -> f64 {
        inp as f64
    }
    // Float to integer `as` casts truncate toward zero, saturate at the bounds of the
    // integer type (negative inputs become 0) and turn NaN into 0.
    #[inline(always)]
    fn inverse(&self, out: f64) -> u64 {
        out as u64
    }
}

/// Mapping between `u64` and `i64` based on `as` casts.
///
/// These casts reinterpret the bits, so values above `i64::MAX` would wrap to negative
/// numbers. `coerce_to_i64` only uses this mapping after checking the column maximum.
struct MapU64ToI64;
impl StrictlyMonotonicFn<u64, i64> for MapU64ToI64 {
    #[inline(always)]
    fn mapping(&self, inp: u64) -> i64 {
        inp as i64
    }
    #[inline(always)]
    fn inverse(&self, out: i64) -> u64 {
        out as u64
    }
}

/// Mapping between `i64` and `u64` based on `as` casts.
///
/// These casts reinterpret the bits, so negative values would wrap to large positive
/// numbers. `coerce_to_u64` only uses this mapping after checking the column minimum.
struct MapI64ToU64;
impl StrictlyMonotonicFn<i64, u64> for MapI64ToU64 {
    #[inline(always)]
    fn mapping(&self, inp: i64) -> u64 {
        inp as u64
    }
    #[inline(always)]
    fn inverse(&self, out: u64) -> i64 {
        out as i64
    }
}

// Generates the conversions between a typed column `$typ` and the `DynamicColumn`
// variant `$enum_name` wrapping it:
// - `From<DynamicColumn> for Option<$typ>`, which yields `None` when the dynamic column
//   holds another variant;
// - `From<$typ> for DynamicColumn`, which wraps the typed column in the variant.
macro_rules! static_dynamic_conversions {
    ($typ:ty, $enum_name:ident) => {
        impl From<DynamicColumn> for Option<$typ> {
            fn from(dynamic_column: DynamicColumn) -> Option<$typ> {
                if let DynamicColumn::$enum_name(col) = dynamic_column {
                    Some(col)
                } else {
                    None
                }
            }
        }

        impl From<$typ> for DynamicColumn {
            fn from(typed_column: $typ) -> Self {
                DynamicColumn::$enum_name(typed_column)
            }
        }
    };
}

// One invocation per `DynamicColumn` variant.
static_dynamic_conversions!(Column<bool>, Bool);
static_dynamic_conversions!(Column<u64>, U64);
static_dynamic_conversions!(Column<i64>, I64);
static_dynamic_conversions!(Column<f64>, F64);
static_dynamic_conversions!(Column<DateTime>, DateTime);
static_dynamic_conversions!(StrColumn, Str);
static_dynamic_conversions!(BytesColumn, Bytes);
static_dynamic_conversions!(Column<Ipv6Addr>, IpAddr);

/// Handle to a column that has not been loaded yet.
///
/// The bytes of the column are only read when the column is opened.
#[derive(Clone, Debug)]
pub struct DynamicColumnHandle {
    // Slice of the file holding the bytes of the column.
    pub(crate) file_slice: FileSlice,
    // Type of the column; it selects how the bytes are decoded.
    pub(crate) column_type: ColumnType,
    // Format version passed to the column opening functions.
    pub(crate) format_version: Version,
}

impl DynamicColumnHandle {
    // TODO rename load
    /// Reads the whole file slice and decodes it into the [`DynamicColumn`] variant matching
    /// this handle's column type.
    pub fn open(&self) -> io::Result<DynamicColumn> {
        let column_bytes: OwnedBytes = self.file_slice.read_bytes()?;
        self.open_internal(column_bytes)
    }

    #[doc(hidden)]
    pub fn file_slice(&self) -> &FileSlice {
        &self.file_slice
    }

    /// Returns the `u64` fast field reader associated with a column of type
    /// Str, Bytes, u64, i64, f64, bool, ip, or datetime.
    ///
    /// For Str and Bytes columns, the returned column is the term ordinal column.
    ///
    /// For IpAddr, the fast field reader returns the compact u64 representation of the
    /// IpAddr.
    /// In order to convert back to u128, cast to `CompactSpaceU64Accessor` and call
    /// `compact_to_u128`.
    ///
    /// For all other types, the fast field reader returns the u64-value associated with the
    /// original FastValue.
    pub fn open_u64_lenient(&self) -> io::Result<Option<Column<u64>>> {
        let version = self.format_version;
        let column_bytes = self.file_slice.read_bytes()?;
        let u64_column: Column<u64> = match self.column_type {
            ColumnType::Str | ColumnType::Bytes => {
                let bytes_column: BytesColumn =
                    crate::column::open_column_bytes(column_bytes, version)?;
                bytes_column.term_ord_column
            }
            ColumnType::IpAddr => {
                crate::column::open_column_u128_as_compact_u64(column_bytes, version)?
            }
            ColumnType::Bool
            | ColumnType::I64
            | ColumnType::U64
            | ColumnType::F64
            | ColumnType::DateTime => {
                crate::column::open_column_u64::<u64>(column_bytes, version)?
            }
        };
        Ok(Some(u64_column))
    }

    /// Decodes already loaded column bytes according to the handle's column type.
    fn open_internal(&self, column_bytes: OwnedBytes) -> io::Result<DynamicColumn> {
        let version = self.format_version;
        Ok(match self.column_type {
            ColumnType::Bytes => crate::column::open_column_bytes(column_bytes, version)?.into(),
            ColumnType::Str => crate::column::open_column_str(column_bytes, version)?.into(),
            ColumnType::I64 => {
                crate::column::open_column_u64::<i64>(column_bytes, version)?.into()
            }
            ColumnType::U64 => {
                crate::column::open_column_u64::<u64>(column_bytes, version)?.into()
            }
            ColumnType::F64 => {
                crate::column::open_column_u64::<f64>(column_bytes, version)?.into()
            }
            ColumnType::Bool => {
                crate::column::open_column_u64::<bool>(column_bytes, version)?.into()
            }
            ColumnType::IpAddr => {
                crate::column::open_column_u128::<Ipv6Addr>(column_bytes, version)?.into()
            }
            ColumnType::DateTime => {
                crate::column::open_column_u64::<DateTime>(column_bytes, version)?.into()
            }
        })
    }

    /// Returns the number of bytes of the underlying file slice.
    pub fn num_bytes(&self) -> ByteCount {
        self.file_slice.num_bytes()
    }

    /// Legacy helper returning the column space usage.
    ///
    /// Simply forwards to [`DynamicColumnHandle::space_usage`].
    pub fn column_and_dictionary_num_bytes(&self) -> io::Result<ColumnSpaceUsage> {
        self.space_usage()
    }

    /// Return the space usage of the column, optionally broken down by dictionary and column
    /// values.
    ///
    /// For dictionary encoded columns (strings and bytes), this splits the total footprint into
    /// the dictionary and the remaining column data (including index and values).
    /// For all other column types, the dictionary size is `None` and the column size
    /// equals the total bytes.
    ///
    /// The column is opened in order to measure its dictionary, so opening errors are
    /// returned to the caller.
    ///
    /// # Panics
    ///
    /// Panics if the dictionary reports more bytes than the whole column.
    pub fn space_usage(&self) -> io::Result<ColumnSpaceUsage> {
        let total_num_bytes = self.num_bytes();
        let dynamic_column = self.open()?;
        let dictionary_num_bytes = match &dynamic_column {
            DynamicColumn::Str(str_column) => str_column.dictionary().num_bytes(),
            DynamicColumn::Bytes(bytes_column) => bytes_column.dictionary().num_bytes(),
            // Not dictionary encoded: everything is attributed to the column itself.
            _ => return Ok(ColumnSpaceUsage::new(total_num_bytes, None)),
        };
        assert!(dictionary_num_bytes <= total_num_bytes);
        let remaining_bytes = total_num_bytes.get_bytes() - dictionary_num_bytes.get_bytes();
        Ok(ColumnSpaceUsage::new(
            ByteCount::from(remaining_bytes),
            Some(dictionary_num_bytes),
        ))
    }

    /// Returns the type of the column behind this handle.
    pub fn column_type(&self) -> ColumnType {
        self.column_type
    }
}

/// Represents space usage of a column.
///
/// `column_num_bytes` tracks the column payload (index, values and footer).
/// For dictionary encoded columns, `dictionary_num_bytes` captures the dictionary footprint.
/// [`ColumnSpaceUsage::total_num_bytes`] returns the sum of both parts.
#[derive(Clone, Debug, Serialize, Deserialize)]
pub struct ColumnSpaceUsage {
    /// Bytes attributed to the column itself, dictionary excluded.
    column_num_bytes: ByteCount,
    /// Bytes attributed to the dictionary; `None` when no dictionary size was recorded.
    dictionary_num_bytes: Option<ByteCount>,
}

impl ColumnSpaceUsage {
    pub(crate) fn new(
        column_num_bytes: ByteCount,
        dictionary_num_bytes: Option<ByteCount>,
    ) -> Self {
        ColumnSpaceUsage {
            column_num_bytes,
            dictionary_num_bytes,
        }
    }

    pub fn column_num_bytes(&self) -> ByteCount {
        self.column_num_bytes
    }

    pub fn dictionary_num_bytes(&self) -> Option<ByteCount> {
        self.dictionary_num_bytes
    }

    pub fn total_num_bytes(&self) -> ByteCount {
        self.column_num_bytes + self.dictionary_num_bytes.unwrap_or_default()
    }

    /// Merge two space usage values by summing their components.
    pub fn merge(&self, other: &ColumnSpaceUsage) -> ColumnSpaceUsage {
        let dictionary_num_bytes = match (self.dictionary_num_bytes, other.dictionary_num_bytes) {
            (Some(lhs), Some(rhs)) => Some(lhs + rhs),
            (Some(val), None) | (None, Some(val)) => Some(val),
            (None, None) => None,
        };
        ColumnSpaceUsage {
            column_num_bytes: self.column_num_bytes + other.column_num_bytes,
            dictionary_num_bytes,
        }
    }
}


================================================
FILE: columnar/src/iterable.rs
================================================
use std::ops::Range;
use std::sync::Arc;

use crate::{ColumnValues, RowId};

/// A collection that can hand out a boxed iterator over its items, any number of times.
///
/// The item type `T` defaults to `u64`.
pub trait Iterable<T = u64> {
    /// Returns a boxed iterator over the items; the iterator may borrow from `self`.
    fn boxed_iter(&self) -> Box<dyn Iterator<Item = T> + '_>;
}

impl<T: Copy> Iterable<T> for &[T] {
    /// Iterates over copies of the slice elements, in order.
    fn boxed_iter(&self) -> Box<dyn Iterator<Item = T> + '_> {
        let items: &[T] = self;
        Box::new(items.iter().copied())
    }
}

impl<T: Copy> Iterable<T> for Range<T>
where Range<T>: Iterator<Item = T>
{
    /// Iterates over a clone of the range, leaving the range itself untouched.
    fn boxed_iter(&self) -> Box<dyn Iterator<Item = T> + '_> {
        let range_copy: Range<T> = Range::clone(self);
        Box::new(range_copy)
    }
}

impl Iterable for Arc<dyn crate::ColumnValues<RowId>> {
    /// Iterates over the row ids of the column values, widened to `u64`.
    fn boxed_iter(&self) -> Box<dyn Iterator<Item = u64> + '_> {
        let widened = self.iter().map(u64::from);
        Box::new(widened)
    }
}


================================================
FILE: columnar/src/lib.rs
================================================
//! # Tantivy-Columnar
//!
//! `tantivy-columnar` provides a columnar storage for tantivy.
//! The crate allows for efficient read operations on specific columns rather than entire records.
//!
//! ## Overview
//!
//! - **columnar**: Reading, writing, and merging multiple columns:
//!   - **[ColumnarWriter]**: Makes it possible to create a new columnar.
//!   - **[ColumnarReader]**: The ColumnarReader makes it possible to access a set of columns
//!     associated to field names.
//!   - **[merge_columnar]**: Contains the functionalities to merge multiple ColumnarReader or
//!     segments into a single one.
//!
//! - **column**: A single column, which contains
//!     - [column_index]: Resolves the rows for a document id. Manages the cardinality of the
//!       column.
//!     - [column_values]: Stores the values of a column in a dense format.

#[cfg(test)]
#[macro_use]
extern crate more_asserts;

use std::fmt::Display;
use std::io;

mod block_accessor;
mod column;
pub mod column_index;
pub mod column_values;
mod columnar;
mod dictionary;
mod dynamic_column;
mod iterable;
pub(crate) mod utils;
mod value;

pub use block_accessor::ColumnBlockAccessor;
pub use column::{BytesColumn, Column, StrColumn};
pub use column_index::ColumnIndex;
pub use column_values::{
    ColumnValues, EmptyColumnValues, MonotonicallyMappableToU64, MonotonicallyMappableToU128,
};
pub use columnar::{
    CURRENT_VERSION, ColumnType, ColumnarReader, ColumnarWriter, HasAssociatedColumnType,
    MergeRowOrder, ShuffleMergeOrder, StackMergeOrder, Version, merge_columnar,
};
use sstable::VoidSSTable;
pub use value::{NumericalType, NumericalValue};

pub use self::dynamic_column::{ColumnSpaceUsage, DynamicColumn, DynamicColumnHandle};

/// Row identifier, represented as a `u32`.
pub type RowId = u32;
/// Document identifier, represented as a `u32`.
pub type DocId = u32;

/// Address of a row: a segment ordinal together with a row id.
// NOTE(review): presumably `row_id` is local to the segment designated by `segment_ord` —
// confirm against the merge code.
#[derive(Clone, Copy, Debug)]
pub struct RowAddr {
    /// Ordinal of the segment.
    pub segment_ord: u32,
    /// Id of the row.
    pub row_id: RowId,
}

pub use sstable::{Dictionary, TermOrdHit};
/// `sstable::Streamer` specialized to `VoidSSTable`.
pub type Streamer<'a> = sstable::Streamer<'a, VoidSSTable>;

pub use common::DateTime;

/// Marker error signalling that some data could not be decoded.
///
/// It converts into an [`io::Error`] of kind [`io::ErrorKind::InvalidData`].
#[derive(Copy, Clone, Debug)]
pub struct InvalidData;

impl From<InvalidData> for io::Error {
    fn from(_invalid_data: InvalidData) -> Self {
        let kind = io::ErrorKind::InvalidData;
        io::Error::new(kind, "Invalid data")
    }
}

/// Enum describing the number of values that can exist per document
/// (or per row if you will).
///
/// The cardinality must fit on 2 bits.
#[derive(Clone, Copy, Hash, Default, Debug, PartialEq, Eq, PartialOrd, Ord)]
#[repr(u8)]
pub enum Cardinality {
    /// All documents contain exactly one value.
    /// `Full` is the default for auto-detecting the Cardinality, since it is the most strict.
    #[default]
    Full = 0,
    /// All documents contain at most one value.
    Optional = 1,
    /// All documents may contain any number of values.
    Multivalued = 2,
}

impl Display for Cardinality {
    /// Writes the short name of the cardinality (`full`, `opt` or `mult`).
    ///
    /// The name goes through `Formatter::pad`, so width, fill and alignment flags
    /// (e.g. `{:>6}`) are honored like they are for a plain `&str`.
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        let short_str = match self {
            Cardinality::Full => "full",
            Cardinality::Optional => "opt",
            Cardinality::Multivalued => "mult",
        };
        f.pad(short_str)
    }
}

impl Cardinality {
    /// Returns true for [`Cardinality::Optional`].
    pub fn is_optional(&self) -> bool {
        matches!(self, Cardinality::Optional)
    }
    /// Returns true for [`Cardinality::Multivalued`].
    pub fn is_multivalue(&self) -> bool {
        matches!(self, Cardinality::Multivalued)
    }
    /// Returns true for [`Cardinality::Full`].
    pub fn is_full(&self) -> bool {
        matches!(self, Cardinality::Full)
    }
    /// Returns the numeric code of the cardinality, i.e. its `u8` discriminant.
    pub(crate) fn to_code(self) -> u8 {
        self as u8
    }
    /// Decodes a cardinality from its numeric code.
    ///
    /// Returns `InvalidData` for any code other than 0, 1 or 2.
    pub(crate) fn try_from_code(code: u8) -> Result<Cardinality, InvalidData> {
        match code {
            0 => Ok(Cardinality::Full),
            1 => Ok(Cardinality::Optional),
            2 => Ok(Cardinality::Multivalued),
            _ => Err(InvalidData),
        }
    }
}

#[cfg(test)]
mod tests;

#[cfg(test)]
mod compat_tests;


================================================
FILE: columnar/src/tests.rs
================================================
use std::collections::HashMap;
use std::fmt::Debug;
use std::net::Ipv6Addr;

use common::DateTime;
use proptest::prelude::*;
use proptest::sample::subsequence;

use crate::column_values::MonotonicallyMappableToU128;
use crate::columnar::{ColumnType, ColumnTypeCategory};
use crate::dynamic_column::{DynamicColumn, DynamicColumnHandle};
use crate::value::{Coerce, NumericalValue};
use crate::{
    BytesColumn, Cardinality, Column, ColumnarReader, ColumnarWriter, RowAddr, RowId,
    ShuffleMergeOrder, StackMergeOrder,
};

// Writes two strings into a 5-row columnar and checks the column count and serialized size.
#[test]
fn test_dataframe_writer_str() {
    let mut writer = ColumnarWriter::default();
    for (doc, text) in [(1u32, "hello"), (3u32, "helloeee")] {
        writer.record_str(doc, "my_string", text);
    }
    let mut serialized: Vec<u8> = Vec::new();
    writer.serialize(5, &mut serialized).unwrap();
    let reader = ColumnarReader::open(serialized).unwrap();
    assert_eq!(reader.num_columns(), 1);
    let handles: Vec<DynamicColumnHandle> = reader.read_columns("my_string").unwrap();
    assert_eq!(handles.len(), 1);
    assert_eq!(handles[0].num_bytes(), 73);
}

// Writes two byte strings into a 5-row columnar and checks the column count and serialized
// size.
#[test]
fn test_dataframe_writer_bytes() {
    let mut writer = ColumnarWriter::default();
    writer.record_bytes(1u32, "my_string", b"hello");
    writer.record_bytes(3u32, "my_string", b"helloeee");
    let mut serialized: Vec<u8> = Vec::new();
    writer.serialize(5, &mut serialized).unwrap();
    let reader = ColumnarReader::open(serialized).unwrap();
    assert_eq!(reader.num_columns(), 1);
    let handles: Vec<DynamicColumnHandle> = reader.read_columns("my_string").unwrap();
    assert_eq!(handles.len(), 1);
    assert_eq!(handles[0].num_bytes(), 73);
}

// Writes two booleans into a 5-row columnar and reads them back through a bool column.
#[test]
fn test_dataframe_writer_bool() {
    let mut writer = ColumnarWriter::default();
    for (doc, flag) in [(1u32, false), (3u32, true)] {
        writer.record_bool(doc, "bool.value", flag);
    }
    let mut serialized: Vec<u8> = Vec::new();
    writer.serialize(5, &mut serialized).unwrap();
    let reader = ColumnarReader::open(serialized).unwrap();
    assert_eq!(reader.num_columns(), 1);
    let handles: Vec<DynamicColumnHandle> = reader.read_columns("bool.value").unwrap();
    assert_eq!(handles.len(), 1);
    let handle = &handles[0];
    assert_eq!(handle.num_bytes(), 22);
    assert_eq!(handle.column_type(), ColumnType::Bool);
    let DynamicColumn::Bool(bool_col) = handle.open().unwrap() else {
        panic!();
    };
    let first_vals: Vec<Option<bool>> = (0..5).map(|doc_id| bool_col.first(doc_id)).collect();
    assert_eq!(&first_vals, &[None, Some(false), None, Some(true), None,]);
}

// Records u64 divisors (two of them for doc 6) and checks that the resulting column is
// multivalued and opens as an i64 column.
#[test]
fn test_dataframe_writer_u64_multivalued() {
    let mut writer = ColumnarWriter::default();
    let doc_divisor_pairs = [
        (2u32, 2u64),
        (3u32, 3u64),
        (4u32, 2u64),
        (5u32, 5u64),
        (6u32, 2u64),
        (6u32, 3u64),
    ];
    for (doc, divisor) in doc_divisor_pairs {
        writer.record_numerical(doc, "divisor", divisor);
    }
    let mut serialized: Vec<u8> = Vec::new();
    writer.serialize(7, &mut serialized).unwrap();
    let reader = ColumnarReader::open(serialized).unwrap();
    assert_eq!(reader.num_columns(), 1);
    let handles: Vec<DynamicColumnHandle> = reader.read_columns("divisor").unwrap();
    assert_eq!(handles.len(), 1);
    assert_eq!(handles[0].num_bytes(), 50);
    let DynamicColumn::I64(divisor_col) = handles[0].open().unwrap() else {
        panic!();
    };
    assert_eq!(divisor_col.get_cardinality(), Cardinality::Multivalued);
    assert_eq!(divisor_col.num_docs(), 7);
}

// Writes two IP addresses into a 5-row columnar and reads them back through an IP column.
#[test]
fn test_dataframe_writer_ip_addr() {
    let first_ip = Ipv6Addr::from_u128(1001);
    let second_ip = Ipv6Addr::from_u128(1050);
    let mut writer = ColumnarWriter::default();
    writer.record_ip_addr(1, "ip_addr", first_ip);
    writer.record_ip_addr(3, "ip_addr", second_ip);
    let mut serialized: Vec<u8> = Vec::new();
    writer.serialize(5, &mut serialized).unwrap();
    let reader = ColumnarReader::open(serialized).unwrap();
    assert_eq!(reader.num_columns(), 1);
    let handles: Vec<DynamicColumnHandle> = reader.read_columns("ip_addr").unwrap();
    assert_eq!(handles.len(), 1);
    let handle = &handles[0];
    assert_eq!(handle.num_bytes(), 42);
    assert_eq!(handle.column_type(), ColumnType::IpAddr);
    let DynamicColumn::IpAddr(ip_col) = handle.open().unwrap() else {
        panic!();
    };
    let first_vals: Vec<Option<Ipv6Addr>> = (0..5).map(|doc_id| ip_col.first(doc_id)).collect();
    assert_eq!(
        &first_vals,
        &[None, Some(first_ip), None, Some(second_ip), None,]
    );
}

// Writes three u64 values into a 6-row columnar and reads them back as an optional i64 column.
#[test]
fn test_dataframe_writer_numerical() {
    let mut writer = ColumnarWriter::default();
    for (doc, val) in [(1u32, 12u64), (2u32, 13u64), (4u32, 15u64)] {
        writer.record_numerical(doc, "srical.value", NumericalValue::U64(val));
    }
    let mut serialized: Vec<u8> = Vec::new();
    writer.serialize(6, &mut serialized).unwrap();
    let reader = ColumnarReader::open(serialized).unwrap();
    assert_eq!(reader.num_columns(), 1);
    let handles: Vec<DynamicColumnHandle> = reader.read_columns("srical.value").unwrap();
    assert_eq!(handles.len(), 1);
    // The serialized column currently takes 33 bytes.
    //
    // NOTE(review): an earlier breakdown listed here (header 14 bytes, vals 8 bytes -- due to
    // padding? could have been 1 byte? --, null footer 6 bytes) claimed 31 bytes and only sums
    // to 28; re-derive the breakdown before relying on it.
    assert_eq!(handles[0].num_bytes(), 33);
    let DynamicColumn::I64(column_i64) = handles[0].open().unwrap() else {
        panic!();
    };
    assert_eq!(column_i64.index.get_cardinality(), Cardinality::Optional);
    // Doc 6 is past the 6 serialized rows (we can change the spec for that one).
    let expected_firsts = [None, Some(12i64), Some(13i64), None, Some(15i64), None, None];
    for (doc, expected_first) in (0u32..).zip(expected_firsts) {
        assert_eq!(column_i64.first(doc), expected_first);
    }
}

// Checks that a dictionary encoded string column exposes sorted term ordinals and resolves
// them back to the recorded strings.
#[test]
fn test_dictionary_encoded_str() {
    let mut writer = ColumnarWriter::default();
    writer.record_str(1, "my.column", "a");
    writer.record_str(3, "my.column", "c");
    writer.record_str(3, "my.column2", "different_column!");
    writer.record_str(4, "my.column", "b");
    let mut serialized = Vec::new();
    writer.serialize(5, &mut serialized).unwrap();
    let reader = ColumnarReader::open(serialized).unwrap();
    assert_eq!(reader.num_columns(), 2);
    let handles = reader.read_columns("my.column").unwrap();
    assert_eq!(handles.len(), 1);
    let DynamicColumn::Str(str_col) = handles[0].open().unwrap() else {
        panic!();
    };
    let first_ords: Vec<Option<u64>> =
        (0..5).map(|doc_id| str_col.ords().first(doc_id)).collect();
    assert_eq!(first_ords, &[None, Some(0), None, Some(2), Some(1)]);
    assert_eq!(str_col.num_rows(), 5);

    // Terms indexed by their expected ordinal.
    let terms_by_ord = ["a", "b", "c"];
    let expected_ords = [None, Some(0u64), None, Some(2u64), Some(1u64)];
    let mut term_buffer = String::new();
    let term_ords = str_col.ords();
    for (doc, expected_ord) in (0u32..).zip(expected_ords) {
        assert_eq!(term_ords.first(doc), expected_ord);
        if let Some(ord) = expected_ord {
            str_col.ord_to_str(ord, &mut term_buffer).unwrap();
            assert_eq!(term_buffer, terms_by_ord[ord as usize]);
        }
    }
}

// Checks that a dictionary encoded bytes column exposes sorted term ordinals and resolves
// them back to the recorded byte strings.
#[test]
fn test_dictionary_encoded_bytes() {
    let mut writer = ColumnarWriter::default();
    writer.record_bytes(1, "my.column", b"a");
    writer.record_bytes(3, "my.column", b"c");
    writer.record_bytes(3, "my.column2", b"different_column!");
    writer.record_bytes(4, "my.column", b"b");
    let mut serialized = Vec::new();
    writer.serialize(5, &mut serialized).unwrap();
    let reader = ColumnarReader::open(serialized).unwrap();
    assert_eq!(reader.num_columns(), 2);
    let handles = reader.read_columns("my.column").unwrap();
    assert_eq!(handles.len(), 1);
    let DynamicColumn::Bytes(bytes_col) = handles[0].open().unwrap() else {
        panic!();
    };
    let first_ords: Vec<Option<u64>> = (0..5)
        .map(|doc_id| bytes_col.ords().first(doc_id))
        .collect();
    assert_eq!(first_ords, &[None, Some(0), None, Some(2), Some(1)]);
    assert_eq!(bytes_col.num_rows(), 5);

    // Terms indexed by their expected ordinal.
    let terms_by_ord: [&[u8]; 3] = [b"a", b"b", b"c"];
    let expected_ords = [None, Some(0u64), None, Some(2u64), Some(1u64)];
    let mut term_buffer = Vec::new();
    let term_ords = bytes_col.ords();
    for (doc, expected_ord) in (0u32..).zip(expected_ords) {
        assert_eq!(term_ords.first(doc), expected_ord);
        if let Some(ord) = expected_ord {
            bytes_col
                .dictionary
                .ord_to_term(ord, &mut term_buffer)
                .unwrap();
            assert_eq!(term_buffer, terms_by_ord[ord as usize]);
        }
    }
}

// Strategy producing numerical values.
//
// Fixed boundary-like values (0, u64::MAX, i64::MIN, i64::MAX, 1.2) each get weight 3, while
// arbitrary f64, u64 and i64 values each get weight 1.
fn num_strategy() -> impl Strategy<Value = NumericalValue> {
    prop_oneof![
        3 => Just(NumericalValue::U64(0u64)),
        3 => Just(NumericalValue::U64(u64::MAX)),
        3 => Just(NumericalValue::I64(0i64)),
        3 => Just(NumericalValue::I64(i64::MIN)),
        3 => Just(NumericalValue::I64(i64::MAX)),
        3 => Just(NumericalValue::F64(1.2f64)),
        1 => any::<f64>().prop_map(NumericalValue::from),
        1 => any::<u64>().prop_map(NumericalValue::from),
        1 => any::<i64>().prop_map(NumericalValue::from),
    ]
}

// A single value recorded into a test columnar; one variant per kind of value the tests write.
#[derive(Debug, Clone, Copy)]
enum ColumnValue {
    Str(&'static str),
    Bytes(&'static [u8]),
    Numerical(NumericalValue),
    IpAddr(Ipv6Addr),
    Bool(bool),
    DateTime(DateTime),
}

// Anything convertible into a `NumericalValue` becomes a `ColumnValue::Numerical`.
impl<T: Into<NumericalValue>> From<T> for ColumnValue {
    fn from(val: T) -> ColumnValue {
        let numerical: NumericalValue = val.into();
        ColumnValue::Numerical(numerical)
    }
}

impl ColumnValue {
    // Returns the column type category matching the variant of this value.
    pub(crate) fn column_type_category(&self) -> ColumnTypeCategory {
        match *self {
            ColumnValue::Bool(_) => ColumnTypeCategory::Bool,
            ColumnValue::Bytes(_) => ColumnTypeCategory::Bytes,
            ColumnValue::DateTime(_) => ColumnTypeCategory::DateTime,
            ColumnValue::IpAddr(_) => ColumnTypeCategory::IpAddr,
            ColumnValue::Numerical(_) => ColumnTypeCategory::Numerical,
            ColumnValue::Str(_) => ColumnTypeCategory::Str,
        }
    }
}

// Strategy picking one of the two column names used by the proptests ("c1" or "c2").
fn column_name_strategy() -> impl Strategy<Value = &'static str> {
    prop_oneof![Just("c1"), Just("c2")]
}

// Strategy picking one of two string values ("a" or "b").
fn string_strategy() -> impl Strategy<Value = &'static str> {
    prop_oneof![Just("a"), Just("b")]
}

// Strategy picking one of two single-byte values ([0] or [1]).
fn bytes_strategy() -> impl Strategy<Value = &'static [u8]> {
    prop_oneof![Just(&[0u8][..]), Just(&[1u8][..])]
}

// A random column value.
//
// Numerical values (weight 40) and strings (weight 10) dominate; bytes, IP addresses, booleans
// and datetimes each get weight 1. IP addresses only vary in their last segment (1 or 2) and
// datetimes are built from a timestamp in seconds taken from a fixed range.
fn column_value_strategy() -> impl Strategy<Value = ColumnValue> {
    prop_oneof![
        10 => string_strategy().prop_map(ColumnValue::Str),
        1 => bytes_strategy().prop_map(ColumnValue::Bytes),
        40 => num_strategy().prop_map(ColumnValue::Numerical),
        1 => (1u16..3u16).prop_map(|ip_addr_byte| ColumnValue::IpAddr(Ipv6Addr::new(
            127,
            0,
            0,
            0,
            0,
            0,
            0,
            ip_addr_byte
        ))),
        1 => any::<bool>().prop_map(ColumnValue::Bool),
        1 => (679_723_993i64..1_679_723_995i64)
            .prop_map(|val| { ColumnValue::DateTime(DateTime::from_timestamp_secs(val)) })
    ]
}

// A document contains up to 4 values (possibly none), each paired with the name of the column
// it is recorded in.
fn doc_strategy() -> impl Strategy<Value = Vec<(&'static str, ColumnValue)>> {
    proptest::collection::vec((column_name_strategy(), column_value_strategy()), 0..=4)
}

// Strategy for the number of documents in a columnar: between 0 and 12, with the two ranges
// below being equally weighted.
fn num_docs_strategy() -> impl Strategy<Value = usize> {
    prop_oneof!(
        // We focus heavily on the 0..=3 case as we assume it is sufficient to cover all edge
        // cases.
        0usize..=3usize,
        // We leave 50% of the effort exploring more defensively.
        3usize..=12usize
    )
}

// A columnar contains as many docs as drawn from `num_docs_strategy`, each doc being drawn
// from `doc_strategy`.
fn columnar_docs_strategy() -> impl Strategy<Value = Vec<Vec<(&'static str, ColumnValue)>>> {
    num_docs_strategy()
        .prop_flat_map(|num_docs| proptest::collection::vec(doc_strategy(), num_docs))
}

// Strategy producing a shuffled subset of the indices `0..n`; the subset may hold anywhere
// from 0 to `n` indices.
fn permutation_and_subset_strategy(n: usize) -> impl Strategy<Value = Vec<usize>> {
    let vals: Vec<usize> = (0..n).collect();
    subsequence(vals, 0..=n).prop_shuffle()
}

// Records every value of every doc into a fresh writer (the doc's position in `docs` is its
// row id), serializes the writer and opens the result as a `ColumnarReader`.
fn build_columnar_with_mapping(docs: &[Vec<(&'static str, ColumnValue)>]) -> ColumnarReader {
    let mut writer = ColumnarWriter::default();
    for (doc_id, doc_vals) in docs.iter().enumerate() {
        let row_id = doc_id as u32;
        for &(column_name, column_value) in doc_vals {
            match column_value {
                ColumnValue::Str(str_val) => {
                    writer.record_str(row_id, column_name, str_val);
                }
                ColumnValue::Bytes(bytes) => writer.record_bytes(row_id, column_name, bytes),
                ColumnValue::Numerical(num) => {
                    writer.record_numerical(row_id, column_name, num);
                }
                ColumnValue::IpAddr(ip_addr) => {
                    writer.record_ip_addr(row_id, column_name, ip_addr);
                }
                ColumnValue::Bool(bool_val) => {
                    writer.record_bool(row_id, column_name, bool_val);
                }
                ColumnValue::DateTime(date_time) => {
                    writer.record_datetime(row_id, column_name, date_time);
                }
            }
        }
    }
    let mut serialized = Vec::new();
    writer.serialize(docs.len() as u32, &mut serialized).unwrap();

    ColumnarReader::open(serialized).unwrap()
}

// Builds a `ColumnarReader` from per-document values; delegates to
// `build_columnar_with_mapping`.
fn build_columnar(docs: &[Vec<(&'static str, ColumnValue)>]) -> ColumnarReader {
    build_columnar_with_mapping(docs)
}

// Asserts that two columnars are equal, without leniency on numerical column types.
fn assert_columnar_eq_strict(left: &ColumnarReader, right: &ColumnarReader) {
    assert_columnar_eq(left, right, false);
}

// Asserts that two columnars have the same number of docs and the same columns (name and
// content), compared pairwise in listing order.
//
// `lenient_on_numerical_value` is forwarded to `assert_dyn_column_eq`.
fn assert_columnar_eq(
    left: &ColumnarReader,
    right: &ColumnarReader,
    lenient_on_numerical_value: bool,
) {
    assert_eq!(left.num_docs(), right.num_docs());
    let left_columns = left.list_columns().unwrap();
    let right_columns = right.list_columns().unwrap();
    assert_eq!(left_columns.len(), right_columns.len());
    for (left_entry, right_entry) in left_columns.iter().zip(right_columns.iter()) {
        assert_eq!(left_entry.0, right_entry.0);
        let left_column = left_entry.1.open().unwrap();
        let right_column = right_entry.1.open().unwrap();
        assert_dyn_column_eq(&left_column, &right_column, lenient_on_numerical_value);
    }
}

// Asserts that two typed columns are identical: same cardinality, same number of docs, same
// row ids for every doc and same values at every value index.
#[track_caller]
fn assert_column_eq<T: Copy + PartialOrd + Debug + Send + Sync + 'static>(
    left: &Column<T>,
    right: &Column<T>,
) {
    assert_eq!(left.get_cardinality(), right.get_cardinality());
    assert_eq!(left.num_docs(), right.num_docs());
    for doc in 0..left.num_docs() {
        let left_row_ids = left.index.value_row_ids(doc);
        let right_row_ids = right.index.value_row_ids(doc);
        assert_eq!(left_row_ids, right_row_ids);
    }
    assert_eq!(left.values.num_vals(), right.values.num_vals());
    for value_idx in 0..left.values.num_vals() {
        let left_val = left.values.get_val(value_idx);
        let right_val = right.values.get_val(value_idx);
        assert_eq!(left_val, right_val);
    }
}

// Asserts that two bytes columns are identical: same term ordinal column and same dictionary
// terms, compared in streaming order.
fn assert_bytes_column_eq(left: &BytesColumn, right: &BytesColumn) {
    let left_ords = &left.term_ord_column;
    let right_ords = &right.term_ord_column;
    assert_eq!(left_ords.get_cardinality(), right_ords.get_cardinality());
    assert_eq!(left.num_rows(), right.num_rows());
    assert_column_eq(left_ords, right_ords);

    assert_eq!(left.dictionary.num_terms(), right.dictionary.num_terms());
    let term_count = left.dictionary.num_terms();
    let mut left_stream = left.dictionary.stream().unwrap();
    let mut right_stream = right.dictionary.stream().unwrap();
    for _ in 0..term_count {
        assert!(left_stream.advance());
        assert!(right_stream.advance());
        assert_eq!(left_stream.key(), right_stream.key());
    }
    // Both streams must be exhausted once all terms have been compared.
    assert!(!left_stream.advance());
    assert!(!right_stream.advance());
}

// Asserts that two dynamic columns are equal.
//
// Columns of the same variant are compared in depth. Columns of different variants panic,
// unless `lenient_on_numerical_value` is set, in which case only their column type categories
// have to match.
fn assert_dyn_column_eq(
    left_dyn_column: &DynamicColumn,
    right_dyn_column: &DynamicColumn,
    lenient_on_numerical_value: bool,
) {
    assert_eq!(
        &left_dyn_column.get_cardinality(),
        &right_dyn_column.get_cardinality()
    );
    match (left_dyn_column, right_dyn_column) {
        (DynamicColumn::Bool(lhs), DynamicColumn::Bool(rhs)) => assert_column_eq(lhs, rhs),
        (DynamicColumn::I64(lhs), DynamicColumn::I64(rhs)) => assert_column_eq(lhs, rhs),
        (DynamicColumn::U64(lhs), DynamicColumn::U64(rhs)) => assert_column_eq(lhs, rhs),
        (DynamicColumn::F64(lhs), DynamicColumn::F64(rhs)) => assert_column_eq(lhs, rhs),
        (DynamicColumn::DateTime(lhs), DynamicColumn::DateTime(rhs)) => {
            assert_column_eq(lhs, rhs)
        }
        (DynamicColumn::IpAddr(lhs), DynamicColumn::IpAddr(rhs)) => assert_column_eq(lhs, rhs),
        (DynamicColumn::Bytes(lhs), DynamicColumn::Bytes(rhs)) => {
            assert_bytes_column_eq(lhs, rhs)
        }
        (DynamicColumn::Str(lhs), DynamicColumn::Str(rhs)) => assert_bytes_column_eq(lhs, rhs),
        (lhs, rhs) => {
            if !lenient_on_numerical_value {
                panic!(
                    "Column type are not the same: {:?} vs {:?}",
                    lhs.column_type(),
                    rhs.column_type()
                );
            }
            assert_eq!(
                ColumnTypeCategory::from(lhs.column_type()),
                ColumnTypeCategory::from(rhs.column_type())
            );
        }
    }
}

// Implemented by the value types read back from a column, so that they can be checked against
// the `ColumnValue` that was recorded.
trait AssertEqualToColumnValue {
    // Panics unless `column_value` holds a value equal to `self`.
    fn assert_equal_to_column_value(&self, column_value: &ColumnValue);
}

impl AssertEqualToColumnValue for bool {
    // Panics unless `column_value` is a `ColumnValue::Bool` holding the same boolean.
    fn assert_equal_to_column_value(&self, column_value: &ColumnValue) {
        match column_value {
            ColumnValue::Bool(expected) => assert_eq!(self, expected),
            _ => panic!(),
        }
    }
}

impl AssertEqualToColumnValue for Ipv6Addr {
    // Panics unless `column_value` is a `ColumnValue::IpAddr` holding the same address.
    fn assert_equal_to_column_value(&self, column_value: &ColumnValue) {
        match column_value {
            ColumnValue::IpAddr(expected) => assert_eq!(self, expected),
            _ => panic!(),
        }
    }
}

impl<T: Coerce + PartialEq + Debug + Into<NumericalValue>> AssertEqualToColumnValue for T {
    // Panics unless `column_value` is a `ColumnValue::Numerical` whose value, once coerced to
    // `T`, equals `self`.
    fn assert_equal_to_column_value(&self, column_value: &ColumnValue) {
        match column_value {
            ColumnValue::Numerical(num) => {
                let coerced = T::coerce(*num);
                assert_eq!(self, &coerced);
            }
            _ => panic!(),
        }
    }
}

impl AssertEqualToColumnValue for DateTime {
    // Panics unless `column_value` is a `ColumnValue::DateTime` holding the same datetime.
    fn assert_equal_to_column_value(&self, column_value: &ColumnValue) {
        match column_value {
            ColumnValue::DateTime(expected) => assert_eq!(self, expected),
            _ => panic!(),
        }
    }
}

// Checks a typed column against the expected values, keyed by doc.
//
// Every doc holding at least one value must be present in `expected` with the same values in
// the same order, and `expected` must not contain any additional doc.
fn assert_column_values<
    T: AssertEqualToColumnValue + PartialEq + Copy + PartialOrd + Debug + Send + Sync + 'static,
>(
    col: &Column<T>,
    expected: &HashMap<u32, Vec<&ColumnValue>>,
) {
    let mut non_empty_row_count = 0;
    for doc in 0..col.num_docs() {
        let actual_vals: Vec<T> = col.values_for_doc(doc).collect();
        if !actual_vals.is_empty() {
            non_empty_row_count += 1;
            let expected_vals = expected.get(&doc).unwrap();
            assert_eq!(actual_vals.len(), expected_vals.len());
            for (actual_val, &expected_val) in actual_vals.iter().zip(expected_vals.iter()) {
                actual_val.assert_equal_to_column_value(expected_val)
            }
        }
    }
    assert_eq!(non_empty_row_count, expected.len());
}

/// Checks that every non-empty row of the bytes/str column `col` resolves to the
/// terms listed for that row in `expected`, and that `expected` has no extra rows.
///
/// `is_str` states whether the expected values must be `ColumnValue::Str`
/// (`true`) or `ColumnValue::Bytes` (`false`).
fn assert_bytes_column_values(
    col: &BytesColumn,
    expected: &HashMap<u32, Vec<&ColumnValue>>,
    is_str: bool,
) {
    let mut non_empty_row_count = 0;
    let mut term_buffer = Vec::new();
    for row_id in 0..col.term_ord_column.num_docs() {
        let term_ords: Vec<u64> = col.term_ords(row_id).collect();
        if term_ords.is_empty() {
            continue;
        }
        let expected_vals = expected.get(&row_id).unwrap();
        assert_eq!(term_ords.len(), expected_vals.len());
        let pairs = expected_vals.iter().copied().zip(term_ords.iter().copied());
        for (expected_val, term_ord) in pairs {
            // Resolve the ordinal back into its term before comparing.
            col.ord_to_bytes(term_ord, &mut term_buffer).unwrap();
            match expected_val {
                ColumnValue::Str(str_val) => {
                    assert!(is_str);
                    assert_eq!(str_val.as_bytes(), &term_buffer);
                }
                ColumnValue::Bytes(bytes_val) => {
                    assert!(!is_str);
                    assert_eq!(bytes_val, &term_buffer);
                }
                _ => {
                    panic!();
                }
            }
        }
        non_empty_row_count += 1;
    }
    assert_eq!(non_empty_row_count, expected.len());
}

// This proptest attempts to create a tiny columnar from up to 3 rows, and checks that the
// resulting columnar matches the row data.
proptest! {
    #![proptest_config(ProptestConfig::with_cases(500))]
    #[test]
    fn test_single_columnar_builder_proptest(docs in columnar_docs_strategy()) {
        let columnar = build_columnar(&docs[..]);
        assert_eq!(columnar.num_docs() as usize, docs.len());
        // Group the input values by (column name, type category), then by row id.
        let mut expected_columns: HashMap<(&str, ColumnTypeCategory), HashMap<u32, Vec<&ColumnValue>> > = Default::default();
        for (doc_id, doc_vals) in docs.iter().enumerate() {
            for (col_name, col_val) in doc_vals {
                expected_columns
                    .entry((col_name, col_val.column_type_category()))
                    .or_default()
                    .entry(doc_id as u32)
                    .or_default()
                    .push(col_val);
            }
        }
        let column_list = columnar.list_columns().unwrap();
        // One column is expected per distinct (name, category) pair.
        assert_eq!(expected_columns.len(), column_list.len());
        for (column_name, column) in column_list {
            let dynamic_column = column.open().unwrap();
            let col_category: ColumnTypeCategory = dynamic_column.column_type().into();
            let expected_col_values: &HashMap<u32, Vec<&ColumnValue>> = expected_columns.get(&(column_name.as_str(), col_category)).unwrap();
            // Dispatch on the concrete column type to compare the stored values.
            match &dynamic_column {
                DynamicColumn::Bool(col) =>
                    assert_column_values(col, expected_col_values),
                DynamicColumn::I64(col) =>
                    assert_column_values(col, expected_col_values),
                DynamicColumn::U64(col) =>
                    assert_column_values(col, expected_col_values),
                DynamicColumn::F64(col) =>
                    assert_column_values(col, expected_col_values),
                DynamicColumn::IpAddr(col) =>
                    assert_column_values(col, expected_col_values),
                DynamicColumn::DateTime(col) =>
                    assert_column_values(col, expected_col_values),
                DynamicColumn::Bytes(col) =>
                    assert_bytes_column_values(col, expected_col_values, false),
                DynamicColumn::Str(col) =>
                    assert_bytes_column_values(col, expected_col_values, true),
            }
        }
    }
}

// This test creates 2 or 3 random small columnars and attempts to merge them.
// It compares the resulting merged dataframe with what would have been obtained by building the
// dataframe from the concatenated rows to begin with.
proptest! {
    #![proptest_config(ProptestConfig::with_cases(1000))]
    #[test]
    fn test_columnar_merge_proptest(columnar_docs in proptest::collection::vec(columnar_docs_strategy(), 2..=3)) {
        // Build one columnar per generated set of rows.
        let columnar_readers: Vec<ColumnarReader> = columnar_docs.iter()
            .map(|docs| build_columnar(&docs[..]))
            .collect::<Vec<_>>();
        let columnar_readers_arr: Vec<&ColumnarReader> = columnar_readers.iter().collect();
        let mut output: Vec<u8> = Vec::new();
        let stack_merge_order = StackMergeOrder::stack(&columnar_readers_arr[..]).into();
        crate::merge_columnar(&columnar_readers_arr[..], &[], stack_merge_order, &mut output).unwrap();
        let merged_columnar = ColumnarReader::open(output).unwrap();
        // Reference result: a single columnar built from all rows, in order.
        let concat_rows: Vec<Vec<(&'static str, ColumnValue)>> = columnar_docs.iter().flatten().cloned().collect();
        let expected_merged_columnar = build_columnar(&concat_rows[..]);
        assert_columnar_eq_strict(&merged_columnar, &expected_merged_columnar);
    }
}

#[test]
fn test_columnar_merging_empty_columnar() {
    // The first input has no rows at all; the second has a single row with a str value.
    let segments_rows: Vec<Vec<Vec<(&str, ColumnValue)>>> =
        vec![vec![], vec![vec![("c1", ColumnValue::Str("a"))]]];
    let readers: Vec<ColumnarReader> = segments_rows
        .iter()
        .map(|rows| build_columnar(&rows[..]))
        .collect();
    let reader_refs: Vec<&ColumnarReader> = readers.iter().collect();
    let merge_order = crate::MergeRowOrder::Stack(StackMergeOrder::stack(&reader_refs[..]));
    let mut merged_bytes: Vec<u8> = Vec::new();
    crate::merge_columnar(&reader_refs[..], &[], merge_order, &mut merged_bytes).unwrap();
    let merged_columnar = ColumnarReader::open(merged_bytes).unwrap();

    // The merge must match a columnar built from all rows in one go.
    let all_rows: Vec<Vec<(&'static str, ColumnValue)>> =
        segments_rows.iter().flatten().cloned().collect();
    let expected_merged_columnar = build_columnar(&all_rows[..]);
    assert_columnar_eq_strict(&merged_columnar, &expected_merged_columnar);
}

#[test]
fn test_columnar_merging_number_columns() {
    // The first input writes `c2` with an i64 value, the second with u64 values
    // (including `u64::MAX`).
    let first_segment = vec![vec![("c2", ColumnValue::Numerical(0i64.into()))]];
    let second_segment = vec![
        vec![("c2", ColumnValue::Numerical(0u64.into()))],
        vec![("c2", ColumnValue::Numerical(u64::MAX.into()))],
    ];
    let segments_rows: Vec<Vec<Vec<(&str, ColumnValue)>>> = vec![first_segment, second_segment];
    let readers: Vec<ColumnarReader> = segments_rows
        .iter()
        .map(|rows| build_columnar(&rows[..]))
        .collect();
    let reader_refs: Vec<&ColumnarReader> = readers.iter().collect();
    let merge_order = crate::MergeRowOrder::Stack(StackMergeOrder::stack(&reader_refs[..]));
    let mut merged_bytes: Vec<u8> = Vec::new();
    crate::merge_columnar(&reader_refs[..], &[], merge_order, &mut merged_bytes).unwrap();
    let merged_columnar = ColumnarReader::open(merged_bytes).unwrap();

    // The merge must match a columnar built from all rows in one go.
    let all_rows: Vec<Vec<(&'static str, ColumnValue)>> =
        segments_rows.iter().flatten().cloned().collect();
    let expected_merged_columnar = build_columnar(&all_rows[..]);
    assert_columnar_eq_strict(&merged_columnar, &expected_merged_columnar);
}

// TODO add non trivial remap and merge
// TODO test required_columns
// TODO document edge case: required_columns incompatible with values.

/// Strategy producing the rows of 2 or 3 columnars together with a list of row
/// addresses selected by `permutation_and_subset_strategy` among all their rows.
#[allow(clippy::type_complexity)]
fn columnar_docs_and_remap()
-> impl Strategy<Value = (Vec<Vec<Vec<(&'static str, ColumnValue)>>>, Vec<RowAddr>)> {
    proptest::collection::vec(columnar_docs_strategy(), 2..=3).prop_flat_map(
        |segments_rows: Vec<Vec<Vec<(&str, ColumnValue)>>>| {
            // Enumerate the address of every row, segment after segment.
            let mut all_row_addrs: Vec<RowAddr> = Vec::new();
            for (segment_ord, segment_rows) in segments_rows.iter().enumerate() {
                for row_id in 0u32..segment_rows.len() as u32 {
                    all_row_addrs.push(RowAddr {
                        segment_ord: segment_ord as u32,
                        row_id,
                    });
                }
            }
            permutation_and_subset_strategy(all_row_addrs.len()).prop_map(move |picked_ords| {
                let picked_row_addrs: Vec<RowAddr> = picked_ords
                    .iter()
                    .map(|&ord| all_row_addrs[ord])
                    .collect();
                (segments_rows.clone(), picked_row_addrs)
            })
        },
    )
}

// Merges randomly generated columnars following a randomly generated row order, and
// delegates the comparison to `test_columnar_merge_and_remap`.
proptest! {
    #![proptest_config(ProptestConfig::with_cases(1000))]
    #[test]
    fn test_columnar_merge_and_remap_proptest((columnar_docs, shuffle_merge_order) in
columnar_docs_and_remap()) {
        test_columnar_merge_and_remap(columnar_docs, shuffle_merge_order);
    }
}

/// Merges the columnars built from `columnar_docs` following `shuffle_merge_order`
/// and compares the result with a columnar built directly from the rows picked in
/// that order.
fn test_columnar_merge_and_remap(
    columnar_docs: Vec<Vec<Vec<(&'static str, ColumnValue)>>>,
    shuffle_merge_order: Vec<RowAddr>,
) {
    // Reference result: the selected rows, in the requested order.
    let mut expected_rows: Vec<Vec<(&'static str, ColumnValue)>> =
        Vec::with_capacity(shuffle_merge_order.len());
    for addr in &shuffle_merge_order {
        let row = &columnar_docs[addr.segment_ord as usize][addr.row_id as usize];
        expected_rows.push(row.clone());
    }
    let expected_merged_columnar = build_columnar(&expected_rows[..]);

    let readers: Vec<ColumnarReader> = columnar_docs
        .iter()
        .map(|rows| build_columnar(&rows[..]))
        .collect();
    let reader_refs: Vec<&ColumnarReader> = readers.iter().collect();
    let rows_per_segment: Vec<RowId> = columnar_docs
        .iter()
        .map(|rows| rows.len() as RowId)
        .collect();
    let merge_order = ShuffleMergeOrder::for_test(&rows_per_segment, shuffle_merge_order);

    let mut merged_bytes: Vec<u8> = Vec::new();
    crate::merge_columnar(&reader_refs[..], &[], merge_order.into(), &mut merged_bytes).unwrap();
    let merged_columnar = ColumnarReader::open(merged_bytes).unwrap();
    assert_columnar_eq(&merged_columnar, &expected_merged_columnar, true);
}

#[test]
fn test_columnar_merge_and_remap_bug_1() {
    // A single columnar: row 0 holds the same value twice for `c1`, row 1 is empty.
    let repeated_value = ("c1", ColumnValue::Numerical(NumericalValue::U64(0)));
    let columnar_docs = vec![vec![
        vec![repeated_value.clone(), repeated_value],
        vec![],
    ]];
    // Swap the two rows.
    let shuffle_merge_order: Vec<RowAddr> = [1u32, 0u32]
        .into_iter()
        .map(|row_id| RowAddr {
            segment_ord: 0,
            row_id,
        })
        .collect();

    test_columnar_merge_and_remap(columnar_docs, shuffle_merge_order);
}

#[test]
fn test_columnar_merge_empty() {
    let empty_reader = build_columnar(&[]);
    let single_row: &[Vec<_>] = &[vec![("c1", ColumnValue::Str("a"))]][..];
    let single_row_reader = build_columnar(single_row);
    // No row is kept by the merge order.
    let rows_per_segment: Vec<RowId> = vec![0, 0];
    let merge_order = ShuffleMergeOrder::for_test(&rows_per_segment, vec![]);
    let mut merged_bytes: Vec<u8> = Vec::new();
    crate::merge_columnar(
        &[&empty_reader, &single_row_reader],
        &[],
        merge_order.into(),
        &mut merged_bytes,
    )
    .unwrap();
    let merged_columnar = ColumnarReader::open(merged_bytes).unwrap();
    assert_eq!(merged_columnar.num_docs(), 0);
    assert_eq!(merged_columnar.num_columns(), 0);
}

#[test]
fn test_columnar_merge_single_str_column() {
    let empty_reader = build_columnar(&[]);
    let single_row: &[Vec<_>] = &[vec![("c1", ColumnValue::Str("a"))]][..];
    let single_row_reader = build_columnar(single_row);
    // Keep the only row of the second columnar.
    let kept_rows = vec![RowAddr {
        segment_ord: 1u32,
        row_id: 0u32,
    }];
    let rows_per_segment: Vec<RowId> = vec![0, 1];
    let merge_order = ShuffleMergeOrder::for_test(&rows_per_segment, kept_rows);
    let mut merged_bytes: Vec<u8> = Vec::new();
    crate::merge_columnar(
        &[&empty_reader, &single_row_reader],
        &[],
        merge_order.into(),
        &mut merged_bytes,
    )
    .unwrap();
    let merged_columnar = ColumnarReader::open(merged_bytes).unwrap();
    assert_eq!(merged_columnar.num_docs(), 1);
    assert_eq!(merged_columnar.num_columns(), 1);
}

#[test]
fn test_delete_decrease_cardinality() {
    let empty_reader = build_columnar(&[]);
    // `c` is multivalued here: the first row carries two values.
    let rows: &[Vec<_>] = &[
        vec![
            ("c", ColumnValue::from(0i64)),
            ("c", ColumnValue::from(0i64)),
        ],
        vec![("c", ColumnValue::from(0i64))],
    ][..];
    let multivalued_reader = build_columnar(rows);
    // Only the single-valued second row is kept by the merge.
    let kept_rows = vec![RowAddr {
        segment_ord: 1u32,
        row_id: 1u32,
    }];
    let merge_order = ShuffleMergeOrder::for_test(&[0, 2], kept_rows);
    let mut merged_bytes: Vec<u8> = Vec::new();
    crate::merge_columnar(
        &[&empty_reader, &multivalued_reader],
        &[],
        merge_order.into(),
        &mut merged_bytes,
    )
    .unwrap();
    let merged_columnar = ColumnarReader::open(merged_bytes).unwrap();
    assert_eq!(merged_columnar.num_docs(), 1);
    assert_eq!(merged_columnar.num_columns(), 1);
    let c_columns = merged_columnar.read_columns("c").unwrap();
    assert_eq!(c_columns.len(), 1);
    let c_column = &c_columns[0];
    assert_eq!(c_column.column_type(), ColumnType::I64);
    assert_eq!(c_column.open().unwrap().get_cardinality(), Cardinality::Full);
}


================================================
FILE: columnar/src/utils.rs
================================================
/// Returns a mask with the `num_bits` lowest bits set.
///
/// `num_bits == 8` is handled separately because `1u8 << 8` would overflow.
const fn compute_mask(num_bits: u8) -> u8 {
    match num_bits {
        8 => u8::MAX,
        partial_width => (1u8 << partial_width) - 1,
    }
}

/// Extracts the bits `[START, END)` of `code` and returns them shifted down to
/// bit 0.
///
/// # Panics
/// Panics if `START > END` or `END > 8`.
#[inline(always)]
#[must_use]
pub(crate) fn select_bits<const START: u8, const END: u8>(code: u8) -> u8 {
    assert!(START <= END);
    assert!(END <= 8);
    let shifted = code >> START;
    shifted & compute_mask(END - START)
}

/// Shifts `code` up so that it occupies the bits `[START, END)` of the result.
///
/// # Panics
/// Panics if `START > END`, if `END > 8`, or if `code` does not fit in
/// `END - START` bits.
#[inline(always)]
#[must_use]
pub(crate) fn place_bits<const START: u8, const END: u8>(code: u8) -> u8 {
    assert!(START <= END);
    assert!(END <= 8);
    let largest_code: u8 = compute_mask(END - START);
    assert!(code <= largest_code);
    code << START
}

/// Removes the first byte of the slice and returns it.
///
/// On success `bytes` is advanced by one byte. Returns `None`, leaving `bytes`
/// untouched, if the slice is empty.
#[inline(always)]
pub fn pop_first_byte(bytes: &mut &[u8]) -> Option<u8> {
    let (&head, tail) = bytes.split_first()?;
    *bytes = tail;
    Some(head)
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_select_bits() {
        // Full width keeps the byte untouched, an empty range yields zero.
        assert_eq!(select_bits::<0, 8>(255u8), 255u8);
        assert_eq!(select_bits::<0, 0>(255u8), 0u8);
        // 8 == 0b1000: the set bit is bit 3.
        assert_eq!(select_bits::<0, 4>(8u8), 8u8);
        assert_eq!(select_bits::<1, 4>(8u8), 4u8);
        assert_eq!(select_bits::<1, 3>(8u8), 0u8);
    }

    #[test]
    fn test_place_bits() {
        assert_eq!(place_bits::<0, 8>(255u8), 255u8);
        assert_eq!(place_bits::<2, 3>(1u8), 4u8);
        assert_eq!(place_bits::<2, 2>(0u8), 0u8);
    }

    #[test]
    #[should_panic]
    fn test_place_bits_overflows() {
        // 8 needs four bits but only three are available.
        let _ = place_bits::<1, 4>(8u8);
    }

    #[test]
    fn test_pop_first_byte() {
        let mut cursor: &[u8] = &b"abcd"[..];
        for expected_byte in [b'a', b'b', b'c', b'd'] {
            assert_eq!(pop_first_byte(&mut cursor), Some(expected_byte));
        }
        assert_eq!(pop_first_byte(&mut cursor), None);
    }
}


================================================
FILE: columnar/src/value.rs
================================================
use std::str::FromStr;

use common::DateTime;

use crate::InvalidData;

/// A numerical value tagged with the primitive type it is stored as.
#[derive(Copy, Clone, PartialEq, Debug)]
pub enum NumericalValue {
    /// Signed 64-bit integer.
    I64(i64),
    /// Unsigned 64-bit integer.
    U64(u64),
    /// 64-bit floating point number.
    F64(f64),
}

impl FromStr for NumericalValue {
    type Err = ();

    /// Parses `s` as an `i64`, then as a `u64`, and finally as an `f64` (which is
    /// then normalized). Returns `Err(())` if none of them succeeds.
    fn from_str(s: &str) -> Result<Self, ()> {
        s.parse::<i64>()
            .map(NumericalValue::from)
            .or_else(|_| s.parse::<u64>().map(NumericalValue::from))
            .or_else(|_| {
                s.parse::<f64>()
                    .map(|val_f64| NumericalValue::from(val_f64).normalize())
            })
            .map_err(|_| ())
    }
}

impl NumericalValue {
    /// Returns the [`NumericalType`] matching the variant of this value.
    pub fn numerical_type(&self) -> NumericalType {
        match self {
            NumericalValue::I64(_) => NumericalType::I64,
            NumericalValue::U64(_) => NumericalType::U64,
            NumericalValue::F64(_) => NumericalType::F64,
        }
    }

    /// Tries to normalize the numerical value in the following priorities:
    /// i64, u64, f64
    ///
    /// The numerical value itself is never changed: a value is only moved to
    /// another variant if that variant can represent it exactly.
    pub fn normalize(self) -> Self {
        match self {
            NumericalValue::U64(val) => {
                if val <= i64::MAX as u64 {
                    NumericalValue::I64(val as i64)
                } else {
                    NumericalValue::U64(val)
                }
            }
            NumericalValue::I64(val) => NumericalValue::I64(val),
            NumericalValue::F64(val) => {
                let is_integral = val.fract() == 0.0;
                // `i64::MAX as f64` rounds up to 2^63 and `u64::MAX as f64` rounds up
                // to 2^64. Both are one past the largest representable integer, so the
                // upper bounds have to be exclusive: with an inclusive bound the
                // saturating `as` cast would silently turn 2^63 into `i64::MAX` (and
                // 2^64 into `u64::MAX`).
                if is_integral && val >= i64::MIN as f64 && val < i64::MAX as f64 {
                    NumericalValue::I64(val as i64)
                } else if is_integral && val >= u64::MIN as f64 && val < u64::MAX as f64 {
                    NumericalValue::U64(val as u64)
                } else {
                    NumericalValue::F64(val)
                }
            }
        }
    }
}

impl From<u64> for NumericalValue {
    fn from(val: u64) -> NumericalValue {
        NumericalValue::U64(val)
    }
}

impl From<i64> for NumericalValue {
    fn from(val: i64) -> Self {
        NumericalValue::I64(val)
    }
}

impl From<f64> for NumericalValue {
    fn from(val: f64) -> Self {
        NumericalValue::F64(val)
    }
}

/// The primitive type of a numerical value.
///
/// The discriminant of each variant is the code returned by `to_code`.
#[derive(Clone, Copy, Debug, Default, Hash, Eq, PartialEq)]
#[repr(u8)]
pub enum NumericalType {
    /// Signed 64-bit integer (the default).
    #[default]
    I64 = 0,
    /// Unsigned 64-bit integer.
    U64 = 1,
    /// 64-bit floating point number.
    F64 = 2,
}

impl NumericalType {
    /// Returns the one-byte code identifying this type.
    pub fn to_code(self) -> u8 {
        match self {
            NumericalType::I64 => 0,
            NumericalType::U64 => 1,
            NumericalType::F64 => 2,
        }
    }

    /// Returns the type identified by `code`, or `InvalidData` if no type uses
    /// that code.
    pub fn try_from_code(code: u8) -> Result<NumericalType, InvalidData> {
        [NumericalType::I64, NumericalType::U64, NumericalType::F64]
            .into_iter()
            .find(|numerical_type| numerical_type.to_code() == code)
            .ok_or(InvalidData)
    }
}

/// Converts a [`NumericalValue`] into a concrete type.
///
/// We voluntarily avoid using `Into` here to keep this
/// implementation quirk as private as possible.
///
/// # Panics
/// This coercion trait actually panics if it is used
/// to convert a looser type into a stricter type: in the implementations of
/// this file, coercing an `F64` value into `i64` or `u64` hits `unreachable!()`.
/// `I64` and `U64` values are converted into each other with a plain `as` cast.
///
/// The level of strictness is somewhat arbitrary.
/// - i64
/// - u64
/// - f64.
pub(crate) trait Coerce {
    /// Converts `numerical_value` into `Self`.
    fn coerce(numerical_value: NumericalValue) -> Self;
}

impl Coerce for i64 {
    /// Returns the integer as an `i64`; `U64` values go through an `as` cast.
    ///
    /// # Panics
    /// Panics (`unreachable!`) if `value` is an `F64`.
    fn coerce(value: NumericalValue) -> Self {
        match value {
            NumericalValue::F64(_) => unreachable!(),
            NumericalValue::U64(unsigned) => unsigned as i64,
            NumericalValue::I64(signed) => signed,
        }
    }
}

impl Coerce for u64 {
    /// Returns the integer as a `u64`; `I64` values go through an `as` cast.
    ///
    /// # Panics
    /// Panics (`unreachable!`) if `value` is an `F64`.
    fn coerce(value: NumericalValue) -> Self {
        match value {
            NumericalValue::F64(_) => unreachable!(),
            NumericalValue::I64(signed) => signed as u64,
            NumericalValue::U64(unsigned) => unsigned,
        }
    }
}

impl Coerce for f64 {
    /// Returns the value as an `f64`; integers go through an `as` cast.
    fn coerce(value: NumericalValue) -> Self {
        match value {
            NumericalValue::F64(float) => float,
            NumericalValue::I64(signed) => signed as f64,
            NumericalValue::U64(unsigned) => unsigned as f64,
        }
    }
}

impl Coerce for DateTime {
    /// Coerces the value into an `i64` and hands it to
    /// `DateTime::from_timestamp_nanos`.
    fn coerce(value: NumericalValue) -> Self {
        let timestamp_nanos: i64 = i64::coerce(value);
        DateTime::from_timestamp_nanos(timestamp_nanos)
    }
}

#[cfg(test)]
mod tests {
    use super::NumericalType;
    use crate::NumericalValue;

    #[test]
    fn test_numerical_type_code() {
        // Every code that decodes must encode back to itself, and exactly three
        // codes are valid.
        let decoded: Vec<(u8, NumericalType)> = (u8::MIN..=u8::MAX)
            .filter_map(|code| {
                NumericalType::try_from_code(code)
                    .ok()
                    .map(|numerical_type| (code, numerical_type))
            })
            .collect();
        for (code, numerical_type) in &decoded {
            assert_eq!(numerical_type.to_code(), *code);
        }
        assert_eq!(decoded.len(), 3);
    }

    #[test]
    fn test_parse_numerical() {
        let cases = [
            ("123", NumericalValue::I64(123)),
            (
                "18446744073709551615",
                NumericalValue::U64(18446744073709551615u64),
            ),
            ("1.0", NumericalValue::I64(1i64)),
            ("1.1", NumericalValue::F64(1.1f64)),
            ("-1.0", NumericalValue::I64(-1i64)),
        ];
        for (input, expected) in cases {
            assert_eq!(input.parse::<NumericalValue>().unwrap(), expected);
        }
    }

    #[test]
    fn test_normalize_numerical() {
        let limit_val = i64::MAX as u64 + 1u64;
        let large_float = 2.0f64.powf(70.0f64);
        let cases = [
            (NumericalValue::from(1u64), NumericalValue::I64(1i64)),
            (NumericalValue::from(limit_val), NumericalValue::U64(limit_val)),
            (NumericalValue::from(-1i64), NumericalValue::I64(-1i64)),
            (NumericalValue::from(-2.0f64), NumericalValue::I64(-2i64)),
            (NumericalValue::from(-2.1f64), NumericalValue::F64(-2.1f64)),
            (
                NumericalValue::from(large_float),
                NumericalValue::F64(large_float),
            ),
        ];
        for (input, expected) in cases {
            assert_eq!(input.normalize(), expected);
        }
    }
}


================================================
FILE: common/Cargo.toml
================================================
[package]
name = "tantivy-common"
version = "0.10.0"
authors = ["Paul Masurel <paul@quickwit.io>", "Pascal Seitz <pascal@quickwit.io>"]
license = "MIT"
edition = "2024"
description = "common traits and utility functions used by multiple tantivy subcrates"
documentation = "https://docs.rs/tantivy_common/"
homepage = "https://github.com/quickwit-oss/tantivy"
repository = "https://github.com/quickwit-oss/tantivy"

# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html

[dependencies]
byteorder = "1.4.3"
ownedbytes = { version= "0.9", path="../ownedbytes" }
async-trait = "0.1"
time = { version = "0.3.47", features = ["serde-well-known"] }
serde = { version = "1.0.136", features = ["derive"] }

[dev-dependencies]
binggan = "0.14.0"
proptest = "1.0.0"
rand = "0.9"


================================================
FILE: common/benches/bench.rs
================================================
use binggan::{BenchRunner, black_box};
use rand::rng;
use rand::seq::IteratorRandom;
use tantivy_common::{BitSet, TinySet, serialize_vint_u32};

/// Benchmarks `serialize_vint_u32`, once on consecutive values and once on the
/// values returned by `choose_multiple`.
fn bench_vint() {
    /// Serializes every value and sums the first byte of each encoding, so that
    /// the serialization has an observable result.
    fn first_byte_sum(vals: &[u32]) -> u64 {
        vals.iter()
            .copied()
            .map(|val| {
                let mut buf = [0u8; 8];
                serialize_vint_u32(val, &mut buf);
                u64::from(buf[0])
            })
            .sum()
    }

    let mut runner = BenchRunner::new();

    let sequential_vals: Vec<u32> = (0..20_000).collect();
    runner.bench_function("bench_vint", move |_| {
        black_box(first_byte_sum(&sequential_vals));
    });

    let sampled_vals: Vec<u32> = (0..20_000).choose_multiple(&mut rng(), 100_000);
    runner.bench_function("bench_vint_rand", move |_| {
        black_box(first_byte_sum(&sampled_vals));
    });
}

/// Benchmarks a few `TinySet` operations and the creation of a large `BitSet`.
fn bench_bitset() {
    let mut runner = BenchRunner::new();

    runner.bench_function("bench_tinyset_pop", move |_| {
        let mut single_el_set = TinySet::singleton(black_box(31u32));
        // Pop six times: only the first pop finds an element.
        for _ in 0..6 {
            single_el_set.pop_lowest();
        }
        black_box(single_el_set);
    });

    let three_el_set = TinySet::empty().insert(10u32).insert(14u32).insert(21u32);
    runner.bench_function("bench_tinyset_sum", move |_| {
        assert_eq!(black_box(three_el_set).into_iter().sum::<u32>(), 45u32);
    });

    // Same elements in a plain array, as a baseline.
    let three_el_arr = [10u32, 14u32, 21u32];
    runner.bench_function("bench_tinyarr_sum", move |_| {
        black_box(three_el_arr.iter().copied().sum::<u32>());
    });

    runner.bench_function("bench_bitset_initialize", move |_| {
        black_box(BitSet::with_max_value(1_000_000));
    });
}

/// Runs the vint benchmarks followed by the bitset benchmarks.
fn main() {
    bench_vint();
    bench_bitset();
}


================================================
FILE: common/src/bitset.rs
================================================
use std::io::Write;
use std::{fmt, io};

use ownedbytes::OwnedBytes;

use crate::ByteCount;

/// A set of integers within `[0, 64)`, stored as the bits of a single `u64`:
/// bit `el` is set iff `el` belongs to the set.
#[derive(Clone, Copy, Eq, PartialEq)]
pub struct TinySet(u64);

impl fmt::Debug for TinySet {
    /// Formats the set as the list of its elements, in increasing order.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_list().entries(self.into_iter()).finish()
    }
}

/// Iterator over the elements of a `TinySet`.
///
/// Holds its own copy of the set and consumes it by popping the lowest
/// remaining element on each call to `next`.
pub struct TinySetIterator(TinySet);
impl Iterator for TinySetIterator {
    type Item = u32;

    /// Returns the lowest remaining element, or `None` once the set is empty.
    #[inline]
    fn next(&mut self) -> Option<Self::Item> {
        self.0.pop_lowest()
    }
}

impl IntoIterator for TinySet {
    type Item = u32;
    type IntoIter = TinySetIterator;
    /// Wraps the set into a `TinySetIterator` yielding its elements.
    fn into_iter(self) -> Self::IntoIter {
        TinySetIterator(self)
    }
}

impl TinySet {
    pub fn serialize<T: Write>(&self, writer: &mut T) -> io::Result<()> {
        writer.write_all(self.0.to_le_bytes().as_ref())
    }

    pub fn into_bytes(self) -> [u8; 8] {
        self.0.to_le_bytes()
    }

    #[inline]
    pub fn deserialize(data: [u8; 8]) -> Self {
        let val: u64 = u64::from_le_bytes(data);
        TinySet(val)
    }

    /// Returns an empty `TinySet`.
    #[inline]
    pub fn empty() -> TinySet {
        TinySet(0u64)
    }

    /// Returns a full `TinySet`.
    #[inline]
    pub fn full() -> TinySet {
        TinySet::empty().complement()
    }

    pub fn clear(&mut self) {
        self.0 = 0u64;
    }

    /// Returns the complement of the set in `[0, 64[`.
    ///
    /// Careful on making this function public, as it will break the padding handling in the last
    /// bucket.
    #[inline]
    fn complement(self) -> TinySet {
        TinySet(!self.0)
    }

    /// Returns true iff the `TinySet` contains the element `el`.
    #[inline]
    pub fn contains(self, el: u32) -> bool {
        !self.intersect(TinySet::singleton(el)).is_empty()
    }

    /// Returns the number of elements in the TinySet.
    #[inline]
    pub fn len(self) -> u32 {
        self.0.count_ones()
    }

    /// Returns the intersection of `self` and `other`
    #[inline]
    #[must_use]
    pub fn intersect(self, other: TinySet) -> TinySet {
        TinySet(self.0 & other.0)
    }

    /// Creates a new `TinySet` containing only one element
    /// within `[0; 64[`
    #[inline]
    pub fn singleton(el: u32) -> TinySet {
        TinySet(1u64 << u64::from(el))
    }

    /// Insert a new element within [0..64)
    #[inline]
    #[must_use]
    pub fn insert(self, el: u32) -> TinySet {
        self.union(TinySet::singleton(el))
    }

    /// Removes an element within [0..64)
    #[inline]
    #[must_use]
    pub fn remove(self, el: u32) -> TinySet {
        self.intersect(TinySet::singleton(el).complement())
    }

    /// Insert a new element within [0..64)
    ///
    /// returns true if the set changed
    #[inline]
    pub fn insert_mut(&mut self, el: u32) -> bool {
        let old = *self;
        *self = old.insert(el);
        old != *self
    }

    /// Remove a element within [0..64)
    ///
    /// returns true if the set changed
    #[inline]
    pub fn remove_mut(&mut self, el: u32) -> bool {
        let old = *self;
        *self = old.remove(el);
        old != *self
    }

    /// Returns the union of two tinysets
    #[inline]
    #[must_use]
    pub fn union(self, other: TinySet) -> TinySet {
        TinySet(self.0 | other.0)
    }

    /// Returns true iff the `TinySet` is empty.
    #[inline]
    pub fn is_empty(self) -> bool {
        self.0 == 0u64
    }

    /// Returns the lowest element in the `TinySet`
    /// and removes it.
    #[inline]
    pub fn pop_lowest(&mut self) -> Option<u32> {
        if self.is_empty() {
            None
        } else {
            let lowest = self.0.trailing_zeros();
            self.0 ^= TinySet::singleton(lowest).0;
            Some(lowest)
        }
    }

    /// Returns a `TinySet` than contains all values up
    /// to limit excluded.
    ///
    /// The limit is assumed to be strictly lower than 64.
    pub fn range_lower(upper_bound: u32) -> TinySet {
        TinySet((1u64 << u64::from(upper_bound % 64u32)) - 1u64)
    }

    /// Returns a `TinySet` that contains all values greater
    /// or equal to the given limit, included. (and up to 63)
    ///
    /// The limit is assumed to be strictly lower than 64.
    pub fn range_greater_or_equal(from_included: u32) -> TinySet {
        TinySet::range_lower(from_included).complement()
    }
}

/// A set of `u32` values within `[0, max_value)`, stored as consecutive buckets
/// of 64 values.
#[derive(Clone)]
pub struct BitSet {
    // Bucket `i` holds the values within `[i * 64, (i + 1) * 64)`.
    tinysets: Box<[TinySet]>,
    // Number of elements in the set, maintained by the mutating methods.
    len: u64,
    // Exclusive upper bound of the values, as given at construction.
    max_value: u32,
}
impl std::fmt::Debug for BitSet {
    /// Prints only `len` and `max_value`; the buckets themselves are left out.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.debug_struct("BitSet")
            .field("len", &self.len)
            .field("max_value", &self.max_value)
            .finish()
    }
}

/// Returns the number of 64-value buckets needed to cover `[0, max_val)`.
fn num_buckets(max_val: u32) -> u32 {
    let full_buckets = max_val / 64u32;
    let has_partial_bucket = max_val % 64u32 != 0;
    full_buckets + u32::from(has_partial_bucket)
}

impl BitSet {
    /// Serializes the `BitSet`.
    ///
    /// Writes `max_value` as 4 little-endian bytes, followed by the 8 bytes of
    /// each bucket, and then flushes `writer`.
    pub fn serialize<T: Write>(&self, writer: &mut T) -> io::Result<()> {
        writer.write_all(self.max_value.to_le_bytes().as_ref())?;
        for tinyset in self.tinysets.iter().copied() {
            writer.write_all(&tinyset.into_bytes())?;
        }
        writer.flush()?;
        Ok(())
    }

    /// Create a new, empty `BitSet` that may contain elements
    /// within `[0, max_value)`.
    pub fn with_max_value(max_value: u32) -> BitSet {
        let num_buckets = num_buckets(max_value);
        let tinybitsets = vec![TinySet::empty(); num_buckets as usize].into_boxed_slice();
        BitSet {
            tinysets: tinybitsets,
            len: 0,
            max_value,
        }
    }

    /// Create a new `BitSet` that may contain elements within `[0, max_value)`.
    /// Initially all values are set.
    pub fn with_max_value_and_full(max_value: u32) -> BitSet {
        let num_buckets = num_buckets(max_value);
        let mut tinybitsets = vec![TinySet::full(); num_buckets as usize].into_boxed_slice();

        // Fix padding: when `max_value` is not a multiple of 64, the last bucket
        // must only contain the values below `max_value`.
        let lower = max_value % 64u32;
        if lower != 0 {
            tinybitsets[tinybitsets.len() - 1] = TinySet::range_lower(lower);
        }
        BitSet {
            tinysets: tinybitsets,
            len: max_value as u64,
            max_value,
        }
    }

    /// Removes all elements from the `BitSet`.
    pub fn clear(&mut self) {
        for tinyset in self.tinysets.iter_mut() {
            *tinyset = TinySet::empty();
        }
        // Keep the cached element count consistent with the now-empty buckets.
        self.len = 0;
    }

    /// Intersect with serialized bitset
    pub fn intersect_update(&mut self, other: &ReadOnlyBitSet) {
        self.intersect_update_with_iter(other.iter_tinysets());
    }

    /// Intersect with tinysets, bucket by bucket, and recompute `len`.
    ///
    /// `zip` stops at the shorter side: buckets of `self` beyond the end of
    /// `other` are left untouched and are not counted in `len`.
    fn intersect_update_with_iter(&mut self, other: impl Iterator<Item = TinySet>) {
        self.len = 0;
        for (left, right) in self.tinysets.iter_mut().zip(other) {
            *left = left.intersect(right);
            self.len += left.len() as u64;
        }
    }

    /// Returns the number of elements in the `BitSet`.
    #[inline]
    pub fn len(&self) -> usize {
        self.len as usize
    }

    /// Inserts an element in the `BitSet`
    ///
    /// # Panics
    /// Panics if `el` falls outside of the allocated buckets.
    #[inline]
    pub fn insert(&mut self, el: u32) {
        // we do not check saturated els.
        let higher = el / 64u32;
        let lower = el % 64u32;
        self.len += u64::from(self.tinysets[higher as usize].insert_mut(lower));
    }

    /// Removes an element from the `BitSet`
    ///
    /// # Panics
    /// Panics if `el` falls outside of the allocated buckets.
    #[inline]
    pub fn remove(&mut self, el: u32) {
        // we do not check saturated els.
        let higher = el / 64u32;
        let lower = el % 64u32;
        self.len -= u64::from(self.tinysets[higher as usize].remove_mut(lower));
    }

    /// Returns true iff the elements is in the `BitSet`.
    ///
    /// # Panics
    /// Panics if `el` falls outside of the allocated buckets.
    #[inline]
    pub fn contains(&self, el: u32) -> bool {
        self.tinyset(el / 64u32).contains(el % 64)
    }

    /// Returns the index of the first non-empty bucket at or after `bucket`,
    /// or `None` if all of these buckets are empty.
    ///
    /// Reminder: the tiny set with the bucket `bucket`, represents the
    /// elements from `bucket * 64` to `(bucket+1) * 64`.
    ///
    /// # Panics
    /// Panics if `bucket` is greater than the number of buckets.
    pub fn first_non_empty_bucket(&self, bucket: u32) -> Option<u32> {
        self.tinysets[bucket as usize..]
            .iter()
            .copied()
            .position(|tinyset| !tinyset.is_empty())
            .map(|delta_bucket| bucket + delta_bucket as u32)
    }

    /// Returns the exclusive upper bound given when the `BitSet` was created.
    #[inline]
    pub fn max_value(&self) -> u32 {
        self.max_value
    }

    /// Returns the tiny bitset representing the
    /// the set restricted to the number range from
    /// `bucket * 64` to `(bucket + 1) * 64`.
    ///
    /// # Panics
    /// Panics if `bucket` is not a valid bucket index.
    pub fn tinyset(&self, bucket: u32) -> TinySet {
        self.tinysets[bucket as usize]
    }
}

/// Serialized BitSet.
///
/// Read-only view over the serialized bytes; tinysets are decoded on the fly.
#[derive(Clone)]
pub struct ReadOnlyBitSet {
    // Serialized tinysets, 8 bytes each (the 4-byte header is stripped by `open`).
    data: OwnedBytes,
    // Value read from the 4-byte little-endian header.
    max_value: u32,
}

/// Computes the intersection of two serialized bitsets into a new
/// `ReadOnlyBitSet`.
///
/// # Panics
///
/// Panics if the two bitsets do not have the same `max_value` or the same
/// data length.
pub fn intersect_bitsets(left: &ReadOnlyBitSet, other: &ReadOnlyBitSet) -> ReadOnlyBitSet {
    assert_eq!(left.max_value(), other.max_value());
    assert_eq!(left.data.len(), other.data.len());
    let mut output_dataset: Vec<u8> = Vec::with_capacity(left.data.len());
    let tinyset_pairs = left.iter_tinysets().zip(other.iter_tinysets());
    for (left_tinyset, right_tinyset) in tinyset_pairs {
        let common = left_tinyset.intersect(right_tinyset);
        output_dataset.extend_from_slice(&common.into_bytes());
    }
    let data = OwnedBytes::new(output_dataset);
    let max_value = left.max_value();
    ReadOnlyBitSet { data, max_value }
}

impl ReadOnlyBitSet {
    pub fn open(data: OwnedBytes) -> Self {
        let (max_value_data, data) = data.split(4);
        assert_eq!(data.len() % 8, 0);
        let max_value: u32 = u32::from_le_bytes(max_value_data.as_ref().try_into().unwrap());
        ReadOnlyBitSet { data, max_value }
    }

    /// Number of elements in the bitset.
    #[inline]
    pub fn len(&self) -> usize {
        self.iter_tinysets()
            .map(|tinyset| tinyset.len() as usize)
            .sum()
    }

    /// Iterate the tinyset on the fly from serialized data.
    #[inline]
    fn iter_tinysets(&self) -> impl Iterator<Item = TinySet> + '_ {
        self.data.chunks_exact(8).map(move |chunk| {
            let tinyset: TinySet = TinySet::deserialize(chunk.try_into().unwrap());
            tinyset
        })
    }

    /// Iterate over the positions of the elements.
    #[inline]
    pub fn iter(&self) -> impl Iterator<Item = u32> + '_ {
        self.iter_tinysets()
            .enumerate()
            .flat_map(move |(chunk_num, tinyset)| {
                let chunk_base_val = chunk_num as u32 * 64;
                tinyset
                    .into_iter()
                    .map(move |val| val + chunk_base_val)
                    .take_while(move |doc| *doc < self.max_value)
            })
    }

    /// Returns true iff the elements is in the `BitSet`.
    #[inline]
    pub fn contains(&self, el: u32) -> bool {
        let byte_offset = el / 8u32;
        let b: u8 = self.data[byte_offset as usize];
        let shift = (el % 8) as u8;
        b & (1u8 << shift) != 0
    }

    /// Maximum value the bitset may contain.
    /// (Note this is not the maximum value contained in the set.)
    ///
    /// A bitset has an intrinsic capacity.
    /// It only stores elements within [0..max_value).
    #[inline]
    pub fn max_value(&self) -> u32 {
        self.max_value
    }

    /// Number of bytes used in the bitset representation.
    pub fn num_bytes(&self) -> ByteCount {
        self.data.len().into()
    }
}

impl From<&BitSet> for ReadOnlyBitSet {
    /// Serializes `bitset` into an in-memory buffer and opens that buffer as
    /// a `ReadOnlyBitSet`.
    fn from(bitset: &BitSet) -> ReadOnlyBitSet {
        // 4 header bytes plus 8 bytes per tinyset.
        let capacity = 4 + 8 * bitset.tinysets.len();
        let mut serialized = Vec::with_capacity(capacity);
        bitset
            .serialize(&mut serialized)
            .expect("serializing into a buffer should never fail");
        let bytes = OwnedBytes::new(serialized);
        ReadOnlyBitSet::open(bytes)
    }
}

#[cfg(test)]
mod tests {

    use std::collections::HashSet;

    use ownedbytes::OwnedBytes;
    use rand::distr::Bernoulli;
    use rand::rngs::StdRng;
    use rand::{Rng, SeedableRng};

    use super::{BitSet, ReadOnlyBitSet, TinySet};

    // A full bitset of any capacity in 0..1000 must report that capacity as its
    // length after a serialize / open round trip.
    #[test]
    fn test_read_serialized_bitset_full_multi() {
        for i in 0..1000 {
            let bitset = BitSet::with_max_value_and_full(i);
            let mut out = vec![];
            bitset.serialize(&mut out).unwrap();

            let bitset = ReadOnlyBitSet::open(OwnedBytes::new(out));
            assert_eq!(bitset.len(), i as usize);
        }
    }

    // Same round trip for a capacity of exactly one bucket (64 elements).
    #[test]
    fn test_read_serialized_bitset_full_block() {
        let bitset = BitSet::with_max_value_and_full(64);
        let mut out = vec![];
        bitset.serialize(&mut out).unwrap();

        let bitset = ReadOnlyBitSet::open(OwnedBytes::new(out));
        assert_eq!(bitset.len(), 64);
    }

    // Removing one element from a full bitset is reflected after the round trip.
    #[test]
    fn test_read_serialized_bitset_full() {
        let mut bitset = BitSet::with_max_value_and_full(5);
        bitset.remove(3);
        let mut out = vec![];
        bitset.serialize(&mut out).unwrap();

        let bitset = ReadOnlyBitSet::open(OwnedBytes::new(out));
        assert_eq!(bitset.len(), 4);
    }

    // Intersection against a serialized bitset, then against raw tinyset iterators.
    #[test]
    fn test_bitset_intersect() {
        let bitset_serialized = {
            let mut bitset = BitSet::with_max_value_and_full(5);
            bitset.remove(1);
            bitset.remove(3);
            let mut out = vec![];
            bitset.serialize(&mut out).unwrap();

            ReadOnlyBitSet::open(OwnedBytes::new(out))
        };

        let mut bitset = BitSet::with_max_value_and_full(5);
        bitset.remove(1);
        bitset.intersect_update(&bitset_serialized);

        assert!(bitset.contains(0));
        assert!(!bitset.contains(1));
        assert!(bitset.contains(2));
        assert!(!bitset.contains(3));
        assert!(bitset.contains(4));

        bitset.intersect_update_with_iter(vec![TinySet::singleton(0)].into_iter());

        assert!(bitset.contains(0));
        assert!(!bitset.contains(1));
        assert!(!bitset.contains(2));
        assert!(!bitset.contains(3));
        assert!(!bitset.contains(4));
        assert_eq!(bitset.len(), 1);

        bitset.intersect_update_with_iter(vec![TinySet::singleton(1)].into_iter());
        assert!(!bitset.contains(0));
        assert!(!bitset.contains(1));
        assert!(!bitset.contains(2));
        assert!(!bitset.contains(3));
        assert!(!bitset.contains(4));
        assert_eq!(bitset.len(), 0);
    }

    // Round trip of a bitset with a single element, then of an empty bitset.
    #[test]
    fn test_read_serialized_bitset_empty() {
        let mut bitset = BitSet::with_max_value(5);
        bitset.insert(3);
        let mut out = vec![];
        bitset.serialize(&mut out).unwrap();

        let bitset = ReadOnlyBitSet::open(OwnedBytes::new(out));
        assert_eq!(bitset.len(), 1);

        {
            let bitset = BitSet::with_max_value(5);
            let mut out = vec![];
            bitset.serialize(&mut out).unwrap();
            let bitset = ReadOnlyBitSet::open(OwnedBytes::new(out));
            assert_eq!(bitset.len(), 0);
        }
    }

    // `TinySet::remove` combined with `pop_lowest`, including removing an
    // element that is absent.
    #[test]
    fn test_tiny_set_remove() {
        {
            let mut u = TinySet::empty().insert(63u32).insert(5).remove(63u32);
            assert_eq!(u.pop_lowest(), Some(5u32));
            assert!(u.pop_lowest().is_none());
        }
        {
            let mut u = TinySet::empty()
                .insert(63u32)
                .insert(1)
                .insert(5)
                .remove(63u32);
            assert_eq!(u.pop_lowest(), Some(1u32));
            assert_eq!(u.pop_lowest(), Some(5u32));
            assert!(u.pop_lowest().is_none());
        }
        {
            let mut u = TinySet::empty().insert(1).remove(63u32);
            assert_eq!(u.pop_lowest(), Some(1u32));
            assert!(u.pop_lowest().is_none());
        }
        {
            let mut u = TinySet::empty().insert(1).remove(1u32);
            assert!(u.pop_lowest().is_none());
        }
    }
    // Insertion, duplicate insertion, `pop_lowest` ordering and the
    // `into_bytes` / `deserialize` round trip of `TinySet`.
    #[test]
    fn test_tiny_set() {
        assert!(TinySet::empty().is_empty());
        {
            let mut u = TinySet::empty().insert(1u32);
            assert_eq!(u.pop_lowest(), Some(1u32));
            assert!(u.pop_lowest().is_none())
        }
        {
            let mut u = TinySet::empty().insert(1u32).insert(1u32);
            assert_eq!(u.pop_lowest(), Some(1u32));
            assert!(u.pop_lowest().is_none())
        }
        {
            let mut u = TinySet::empty().insert(2u32);
            assert_eq!(u.pop_lowest(), Some(2u32));
            u.insert_mut(1u32);
            assert_eq!(u.pop_lowest(), Some(1u32));
            assert!(u.pop_lowest().is_none());
        }
        {
            let mut u = TinySet::empty().insert(63u32);
            assert_eq!(u.pop_lowest(), Some(63u32));
            assert!(u.pop_lowest().is_none());
        }
        {
            let mut u = TinySet::empty().insert(63u32).insert(5);
            assert_eq!(u.pop_lowest(), Some(5u32));
            assert_eq!(u.pop_lowest(), Some(63u32));
            assert!(u.pop_lowest().is_none());
        }
        {
            let original = TinySet::empty().insert(63u32).insert(5);
            let after_serialize_deserialize = TinySet::deserialize(original.into_bytes());
            assert_eq!(original, after_serialize_deserialize);
        }
    }

    // Compares `BitSet` and its serialized `ReadOnlyBitSet` form against a
    // `HashSet` holding the same elements.
    #[test]
    fn test_bitset() {
        let test_against_hashset = |els: &[u32], max_value: u32| {
            let mut hashset: HashSet<u32> = HashSet::new();
            let mut bitset = BitSet::with_max_value(max_value);
            for &el in els {
                assert!(el < max_value);
                hashset.insert(el);
                bitset.insert(el);
            }
            for el in 0..max_value {
                assert_eq!(hashset.contains(&el), bitset.contains(el));
            }
            assert_eq!(bitset.max_value(), max_value);

            // test deser
            let mut data = vec![];
            bitset.serialize(&mut data).unwrap();
            let ro_bitset = ReadOnlyBitSet::open(OwnedBytes::new(data));
            for el in 0..max_value {
                assert_eq!(hashset.contains(&el), ro_bitset.contains(el));
            }
            assert_eq!(ro_bitset.max_value(), max_value);
            assert_eq!(ro_bitset.len(), els.len());
        };

        test_against_hashset(&[], 0);
        test_against_hashset(&[], 1);
        test_against_hashset(&[0u32], 1);
        test_against_hashset(&[0u32], 100);
        test_against_hashset(&[1u32, 2u32], 4);
        test_against_hashset(&[99u32], 100);
        test_against_hashset(&[63u32], 64);
        test_against_hashset(&[62u32, 63u32], 64);
    }

    // Bucket count around the 64-element bucket boundaries.
    #[test]
    fn test_bitset_num_buckets() {
        use super::num_buckets;
        assert_eq!(num_buckets(0u32), 0);
        assert_eq!(num_buckets(1u32), 1);
        assert_eq!(num_buckets(64u32), 1);
        assert_eq!(num_buckets(65u32), 2);
        assert_eq!(num_buckets(128u32), 2);
        assert_eq!(num_buckets(129u32), 3);
    }

    // `range_lower(n)` yields `0..n`; `range_greater_or_equal(n)` yields `n..64`.
    #[test]
    fn test_tinyset_range() {
        assert_eq!(
            TinySet::range_lower(3).into_iter().collect::<Vec<u32>>(),
            [0, 1, 2]
        );
        assert!(TinySet::range_lower(0).is_empty());
        assert_eq!(
            TinySet::range_lower(63).into_iter().collect::<Vec<u32>>(),
            (0u32..63u32).collect::<Vec<_>>()
        );
        assert_eq!(
            TinySet::range_lower(1).into_iter().collect::<Vec<u32>>(),
            [0]
        );
        assert_eq!(
            TinySet::range_lower(2).into_iter().collect::<Vec<u32>>(),
            [0, 1]
        );
        assert_eq!(
            TinySet::range_greater_or_equal(3)
                .into_iter()
                .collect::<Vec<u32>>(),
            (3u32..64u32).collect::<Vec<_>>()
        );
    }

    // `len` must only change when an insert / remove actually changes the set.
    #[test]
    fn test_bitset_len() {
        let mut bitset = BitSet::with_max_value(1_000);
        assert_eq!(bitset.len(), 0);
        bitset.insert(3u32);
        assert_eq!(bitset.len(), 1);
        bitset.insert(103u32);
        assert_eq!(bitset.len(), 2);
        bitset.insert(3u32);
        assert_eq!(bitset.len(), 2);
        bitset.insert(103u32);
        assert_eq!(bitset.len(), 2);
        bitset.insert(104u32);
        assert_eq!(bitset.len(), 3);
        bitset.remove(105u32);
        assert_eq!(bitset.len(), 3);
        bitset.remove(104u32);
        assert_eq!(bitset.len(), 2);
        bitset.remove(3u32);
        assert_eq!(bitset.len(), 1);
        bitset.remove(103u32);
        assert_eq!(bitset.len(), 0);
    }

    // Draws `n` Bernoulli(`ratio`) samples from a seeded RNG and returns the
    // indices of the draws that came out true.
    pub fn sample_with_seed(n: u32, ratio: f64, seed_val: u8) -> Vec<u32> {
        StdRng::from_seed([seed_val; 32])
            .sample_iter(&Bernoulli::new(ratio).unwrap())
            .take(n as usize)
            .enumerate()
            .filter_map(|(val, keep)| if keep { Some(val as u32) } else { None })
            .collect()
    }

    // Same as `sample_with_seed`, with the seed byte fixed to 4.
    pub fn sample(n: u32, ratio: f64) -> Vec<u32> {
        sample_with_seed(n, ratio, 4)
    }

    // After `clear`, no element in the capacity range may remain.
    #[test]
    fn test_bitset_clear() {
        let mut bitset = BitSet::with_max_value(1_000);
        let els = sample(1_000, 0.01f64);
        for &el in &els {
            bitset.insert(el);
        }
        assert!(els.iter().all(|el| bitset.contains(*el)));
        bitset.clear();
        for el in 0u32..1000u32 {
            assert!(!bitset.contains(el));
        }
    }
}


================================================
FILE: common/src/bounds.rs
================================================
use std::io;
use std::ops::Bound;

/// A pair of lower and upper `Bound`s over values of type `T`.
#[derive(Clone, Debug)]
pub struct BoundsRange<T> {
    /// Lower bound of the range.
    pub lower_bound: Bound<T>,
    /// Upper bound of the range.
    pub upper_bound: Bound<T>,
}
impl<T> BoundsRange<T> {
    /// Builds a range from its lower and upper bounds.
    pub fn new(lower_bound: Bound<T>, upper_bound: Bound<T>) -> Self {
        Self {
            lower_bound,
            upper_bound,
        }
    }

    /// Returns true iff both bounds are `Bound::Unbounded`.
    pub fn is_unbounded(&self) -> bool {
        matches!(
            (&self.lower_bound, &self.upper_bound),
            (Bound::Unbounded, Bound::Unbounded)
        )
    }

    /// Applies `transform` to the inner value of each bound, keeping the
    /// bound variants unchanged.
    pub fn map_bound<TTo>(&self, transform: impl Fn(&T) -> TTo) -> BoundsRange<TTo> {
        let lower_bound = map_bound(&self.lower_bound, &transform);
        let upper_bound = map_bound(&self.upper_bound, &transform);
        BoundsRange {
            lower_bound,
            upper_bound,
        }
    }

    /// Fallible variant of [`Self::map_bound`]: the first error returned by
    /// `transform` is propagated. The lower bound is processed first.
    pub fn map_bound_res<TTo, Err>(
        &self,
        transform: impl Fn(&T) -> Result<TTo, Err>,
    ) -> Result<BoundsRange<TTo>, Err> {
        let lower_bound = map_bound_res(&self.lower_bound, &transform)?;
        let upper_bound = map_bound_res(&self.upper_bound, &transform)?;
        Ok(BoundsRange {
            lower_bound,
            upper_bound,
        })
    }

    /// Transforms each bound with its own closure. A closure may either
    /// supply a new inner value or replace the bound altogether, see
    /// [`TransformBound`].
    pub fn transform_inner<TTo>(
        &self,
        transform_lower: impl Fn(&T) -> TransformBound<TTo>,
        transform_upper: impl Fn(&T) -> TransformBound<TTo>,
    ) -> BoundsRange<TTo> {
        let lower_bound = transform_bound_inner(&self.lower_bound, &transform_lower);
        let upper_bound = transform_bound_inner(&self.upper_bound, &transform_upper);
        BoundsRange {
            lower_bound,
            upper_bound,
        }
    }

    /// Returns the inner value of the lower bound if it has one, otherwise
    /// the inner value of the upper bound, otherwise `None`.
    pub fn get_inner(&self) -> Option<&T> {
        inner_bound(&self.lower_bound).or_else(|| inner_bound(&self.upper_bound))
    }
}

/// Outcome of transforming the inner value of a `Bound`.
pub enum TransformBound<T> {
    /// Overwrite the bounds
    NewBound(Bound<T>),
    /// Use Existing bounds with new value
    Existing(T),
}

/// Fallible transformation of the inner value of a bound.
///
/// `transform` is called on the inner value of an `Included` / `Excluded`
/// bound. It may keep the bound variant and supply a new value
/// (`TransformBound::Existing`) or replace the whole bound
/// (`TransformBound::NewBound`). `Unbounded` is returned as is, without
/// calling `transform`. Errors from `transform` are propagated.
pub fn transform_bound_inner_res<TFrom, TTo>(
    bound: &Bound<TFrom>,
    transform: impl Fn(&TFrom) -> io::Result<TransformBound<TTo>>,
) -> io::Result<Bound<TTo>> {
    let (from_val, is_included) = match bound {
        Bound::Included(from_val) => (from_val, true),
        Bound::Excluded(from_val) => (from_val, false),
        Bound::Unbounded => return Ok(Bound::Unbounded),
    };
    let transformed = match transform(from_val)? {
        TransformBound::NewBound(new_bound) => new_bound,
        TransformBound::Existing(new_val) if is_included => Bound::Included(new_val),
        TransformBound::Existing(new_val) => Bound::Excluded(new_val),
    };
    Ok(transformed)
}

/// Transforms the inner value of a bound.
///
/// `transform` is called on the inner value of an `Included` / `Excluded`
/// bound. It may keep the bound variant and supply a new value
/// (`TransformBound::Existing`) or replace the whole bound
/// (`TransformBound::NewBound`). `Unbounded` is returned as is, without
/// calling `transform`.
pub fn transform_bound_inner<TFrom, TTo>(
    bound: &Bound<TFrom>,
    transform: impl Fn(&TFrom) -> TransformBound<TTo>,
) -> Bound<TTo> {
    let (from_val, is_included) = match bound {
        Bound::Included(from_val) => (from_val, true),
        Bound::Excluded(from_val) => (from_val, false),
        Bound::Unbounded => return Bound::Unbounded,
    };
    match transform(from_val) {
        TransformBound::NewBound(new_bound) => new_bound,
        TransformBound::Existing(new_val) if is_included => Bound::Included(new_val),
        TransformBound::Existing(new_val) => Bound::Excluded(new_val),
    }
}

/// Returns a reference to the value held by an `Included` or `Excluded`
/// bound, or `None` for `Unbounded`.
pub fn inner_bound<T>(val: &Bound<T>) -> Option<&T> {
    if let Bound::Included(inner) | Bound::Excluded(inner) = val {
        Some(inner)
    } else {
        None
    }
}

/// Applies `transform` to the inner value of `bound`, keeping its variant.
///
/// `Unbounded` maps to `Unbounded` without calling `transform`.
pub fn map_bound<TFrom, TTo>(
    bound: &Bound<TFrom>,
    transform: impl Fn(&TFrom) -> TTo,
) -> Bound<TTo> {
    match bound {
        Bound::Unbounded => Bound::Unbounded,
        Bound::Included(inner) => Bound::Included(transform(inner)),
        Bound::Excluded(inner) => Bound::Excluded(transform(inner)),
    }
}

/// Fallible variant of [`map_bound`]: applies `transform` to the inner value
/// of `bound`, keeping its variant, and propagates the error if `transform`
/// fails.
///
/// `Unbounded` maps to `Ok(Unbounded)` without calling `transform`.
pub fn map_bound_res<TFrom, TTo, Err>(
    bound: &Bound<TFrom>,
    transform: impl Fn(&TFrom) -> Result<TTo, Err>,
) -> Result<Bound<TTo>, Err> {
    let mapped = match bound {
        Bound::Unbounded => Bound::Unbounded,
        Bound::Included(inner) => Bound::Included(transform(inner)?),
        Bound::Excluded(inner) => Bound::Excluded(transform(inner)?),
    };
    Ok(mapped)
}


================================================
FILE: common/src/byte_count.rs
================================================
use std::iter::Sum;
use std::ops::{Add, AddAssign};

use serde::{Deserialize, Serialize};

/// Indicates space usage in bytes
///
/// Thin wrapper around a `u64` number of bytes.
#[derive(Copy, Clone, Default, PartialEq, Eq, PartialOrd, Ord, Serialize, Deserialize)]
pub struct ByteCount(u64);

impl std::fmt::Debug for ByteCount {
    /// Writes the human readable form, see [`ByteCount::human_readable`].
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let rendered = self.human_readable();
        f.write_str(rendered.as_str())
    }
}

impl std::fmt::Display for ByteCount {
    /// Writes the human readable form, see [`ByteCount::human_readable`].
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let rendered = self.human_readable();
        f.write_str(rendered.as_str())
    }
}

/// Unit suffixes paired with the number of bytes in one such unit
/// (decimal, powers of 1000), sorted from the smallest to the largest unit.
const SUFFIX_AND_THRESHOLD: [(&str, u64); 5] = [
    ("KB", 1_000),
    ("MB", 1_000_000),
    ("GB", 1_000_000_000),
    ("TB", 1_000_000_000_000),
    ("PB", 1_000_000_000_000_000),
];

impl ByteCount {
    /// Returns the number of bytes.
    #[inline]
    pub fn get_bytes(&self) -> u64 {
        self.0
    }

    /// Formats the byte count using the largest unit of
    /// `SUFFIX_AND_THRESHOLD` that it reaches, with two decimals
    /// (e.g. `1.50 MB`). Counts below 1 KB are printed as plain bytes
    /// (e.g. `300 B`).
    pub fn human_readable(&self) -> String {
        let bytes = self.get_bytes();
        let largest_unit_reached = SUFFIX_AND_THRESHOLD
            .iter()
            .rev()
            .find(|(_, threshold)| bytes >= *threshold);
        match largest_unit_reached {
            Some((suffix, threshold)) => {
                let unit_num = bytes as f64 / *threshold as f64;
                format!("{unit_num:.2} {suffix}")
            }
            // The precision has no effect on an integer: this prints e.g. `300 B`.
            None => format!("{:.2} B", bytes),
        }
    }
}

impl From<u64> for ByteCount {
    fn from(value: u64) -> Self {
        ByteCount(value)
    }
}
impl From<usize> for ByteCount {
    /// Wraps a number of bytes given as a `usize`, converted with an `as u64` cast.
    fn from(value: usize) -> Self {
        ByteCount(value as u64)
    }
}

impl Sum for ByteCount {
    /// Adds up all the byte counts, starting from the default (zero) count.
    #[inline]
    fn sum<I: Iterator<Item = Self>>(iter: I) -> Self {
        let mut total = ByteCount::default();
        for byte_count in iter {
            total = total + byte_count;
        }
        total
    }
}

impl PartialEq<u64> for ByteCount {
    /// Compares the wrapped number of bytes with a raw `u64`.
    #[inline]
    fn eq(&self, other: &u64) -> bool {
        self.0 == *other
    }
}

impl PartialOrd<u64> for ByteCount {
    /// Orders the wrapped number of bytes against a raw `u64`.
    #[inline]
    fn partial_cmp(&self, other: &u64) -> Option<std::cmp::Ordering> {
        // `u64` is totally ordered, so the comparison always yields `Some`.
        Some(self.0.cmp(other))
    }
}

impl Add for ByteCount {
    type Output = Self;

    #[inline]
    fn add(self, other: Self) -> Self {
        Self(self.get_bytes() + other.get_bytes())
    }
}

impl AddAssign for ByteCount {
    #[inline]
    fn add_assign(&mut self, other: Self) {
        *self = Self(self.get_bytes() + other.get_bytes());
    }
}

#[cfg(test)]
mod test {
    use crate::ByteCount;

    // Checks the human readable rendering for plain bytes and for the
    // MB, GB and TB units.
    #[test]
    fn test_bytes() {
        assert_eq!(ByteCount::from(0u64).human_readable(), "0 B");
        assert_eq!(ByteCount::from(300u64).human_readable(), "300 B");
        assert_eq!(ByteCount::from(1_000_000u64).human_readable(), "1.00 MB");
        assert_eq!(ByteCount::from(1_500_000u64).human_readable(), "1.50 MB");
        assert_eq!(
            ByteCount::from(1_500_000_000u64).human_readable(),
            "1.50 GB"
        );
        assert_eq!(
            ByteCount::from(3_213_000_000_000u64).human_readable(),
            "3.21 TB"
        );
    }
}


================================================
FILE: common/src/datetime.rs
================================================
use std::fmt;
use std::io::{Read, Write};

use serde::{Deserialize, Serialize};
use time::format_description::well_known::Rfc3339;
use time::{OffsetDateTime, PrimitiveDateTime, UtcOffset};

use crate::BinarySerializable;

/// Precision with which datetimes are truncated when stored in fast fields. This setting is only
/// relevant for fast fields. In the docstore, datetimes are always saved with nanosecond precision.
///
/// The default precision is [`DateTimePrecision::Seconds`]. With serde, the variants are
/// (de)serialized under their lowercase names.
#[derive(
    Clone, Copy, Debug, Hash, PartialEq, Eq, PartialOrd, Ord, Serialize, Deserialize, Default,
)]
#[serde(rename_all = "lowercase")]
pub enum DateTimePrecision {
    /// Second precision.
    #[default]
    Seconds,
    /// Millisecond precision.
    Milliseconds,
    /// Microsecond precision.
    Microseconds,
    /// Nanosecond precision.
    Nanoseconds,
}

/// A date/time value with nanoseconds precision.
///
/// This timestamp does not carry any explicit time zone information.
/// Users are responsible for applying the provided conversion
/// functions consistently. Internally the time zone is assumed
/// to be UTC, which is also used implicitly for JSON serialization.
///
/// All constructors and conversions are provided as explicit
/// functions and not by implementing any `From`/`Into` traits
/// to prevent unintended usage.
#[derive(Clone, Default, Copy, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
pub struct DateTime {
    // UNIX timestamp in nanoseconds.
    pub(crate) timestamp_nanos: i64,
}

impl DateTime {
    /// Minimum possible `DateTime` value.
    pub const MIN: DateTime = Self::from_timestamp_nanos(i64::MIN);

    /// Maximum possible `DateTime` value.
    pub const MAX: DateTime = Self::from_timestamp_nanos(i64::MAX);

    /// Create new from UNIX timestamp in seconds
    pub const fn from_timestamp_secs(seconds: i64) -> Self {
        Self::from_timestamp_nanos(seconds * 1_000_000_000)
    }

    /// Create new from UNIX timestamp in milliseconds
    pub const fn from_timestamp_millis(milliseconds: i64) -> Self {
        Self::from_timestamp_nanos(milliseconds * 1_000_000)
    }

    /// Create new from UNIX timestamp in microseconds.
    pub const fn from_timestamp_micros(microseconds: i64) -> Self {
        Self::from_timestamp_nanos(microseconds * 1_000)
    }

    /// Create new from UNIX timestamp in nanoseconds.
    pub const fn from_timestamp_nanos(nanoseconds: i64) -> Self {
        Self {
            timestamp_nanos: nanoseconds,
        }
    }

    /// Create new from `OffsetDateTime`
    ///
    /// The given date/time is converted to UTC and the actual
    /// time zone is discarded.
    pub fn from_utc(dt: OffsetDateTime) -> Self {
        // The `i128` nanosecond timestamp is narrowed with an `as` cast.
        Self::from_timestamp_nanos(dt.unix_timestamp_nanos() as i64)
    }

    /// Create new from `PrimitiveDateTime`
    ///
    /// Implicitly assumes that the given date/time is in UTC!
    /// Otherwise the original value must only be reobtained with
    /// [`Self::into_primitive()`].
    pub fn from_primitive(dt: PrimitiveDateTime) -> Self {
        let utc_datetime = dt.assume_utc();
        Self::from_utc(utc_datetime)
    }

    /// Convert to UNIX timestamp in seconds.
    pub const fn into_timestamp_secs(self) -> i64 {
        let Self { timestamp_nanos } = self;
        timestamp_nanos / 1_000_000_000
    }

    /// Convert to UNIX timestamp in milliseconds.
    pub const fn into_timestamp_millis(self) -> i64 {
        let Self { timestamp_nanos } = self;
        timestamp_nanos / 1_000_000
    }

    /// Convert to UNIX timestamp in microseconds.
    pub const fn into_timestamp_micros(self) -> i64 {
        let Self { timestamp_nanos } = self;
        timestamp_nanos / 1_000
    }

    /// Convert to UNIX timestamp in nanoseconds.
    pub const fn into_timestamp_nanos(self) -> i64 {
        let Self { timestamp_nanos } = self;
        timestamp_nanos
    }

    /// Convert to UTC `OffsetDateTime`
    pub fn into_utc(self) -> OffsetDateTime {
        let nanos = i128::from(self.timestamp_nanos);
        let utc_datetime =
            OffsetDateTime::from_unix_timestamp_nanos(nanos).expect("valid UNIX timestamp");
        debug_assert_eq!(UtcOffset::UTC, utc_datetime.offset());
        utc_datetime
    }

    /// Convert to `OffsetDateTime` with the given time zone
    pub fn into_offset(self, offset: UtcOffset) -> OffsetDateTime {
        let utc_datetime = self.into_utc();
        utc_datetime.to_offset(offset)
    }

    /// Convert to `PrimitiveDateTime` without any time zone
    ///
    /// The value should have been constructed with [`Self::from_primitive()`].
    /// Otherwise the time zone is implicitly assumed to be UTC.
    pub fn into_primitive(self) -> PrimitiveDateTime {
        let utc_datetime = self.into_utc();
        // Discard the UTC time zone offset
        debug_assert_eq!(UtcOffset::UTC, utc_datetime.offset());
        let date = utc_datetime.date();
        let time = utc_datetime.time();
        PrimitiveDateTime::new(date, time)
    }

    /// Truncates the nanosecond timestamp to the corresponding precision.
    ///
    /// The truncation is done with an integer division, which rounds
    /// towards zero.
    pub fn truncate(self, precision: DateTimePrecision) -> Self {
        let nanos_per_unit: i64 = match precision {
            DateTimePrecision::Seconds => 1_000_000_000,
            DateTimePrecision::Milliseconds => 1_000_000,
            DateTimePrecision::Microseconds => 1_000,
            DateTimePrecision::Nanoseconds => 1,
        };
        let truncated_timestamp_nanos = (self.timestamp_nanos / nanos_per_unit) * nanos_per_unit;
        Self::from_timestamp_nanos(truncated_timestamp_nanos)
    }
}

impl fmt::Debug for DateTime {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let utc_rfc3339 = self.into_utc().format(&Rfc3339).map_err(|_| fmt::Error)?;
        f.write_str(&utc_rfc3339)
    }
}

impl BinarySerializable for DateTime {
    /// Writes the timestamp as an `i64` number of microseconds.
    ///
    /// The value goes through `into_timestamp_micros`, so the
    /// sub-microsecond part of the timestamp is not written.
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> std::io::Result<()> {
        let timestamp_micros = self.into_timestamp_micros();
        <i64 as BinarySerializable>::serialize(&timestamp_micros, writer)
    }

    /// Reads an `i64` number of microseconds and builds the `DateTime` from it.
    fn deserialize<R: Read>(reader: &mut R) -> std::io::Result<Self> {
        let timestamp_micros = <i64 as BinarySerializable>::deserialize(reader)?;
        Ok(Self::from_timestamp_micros(timestamp_micros))
    }
}


================================================
FILE: common/src/file_slice.rs
================================================
use std::fs::File;
use std::ops::{Deref, Range, RangeBounds};
use std::path::Path;
use std::sync::Arc;
use std::{fmt, io};

use async_trait::async_trait;
use ownedbytes::{OwnedBytes, StableDeref};

use crate::{ByteCount, HasLen};

/// Objects that represent file sections in tantivy.
///
/// By contract, whatever happens to the directory file, as long as a FileHandle
/// is alive, the data associated with it cannot be altered or destroyed.
///
/// The underlying behavior is therefore specific to the `Directory` that
/// created it. Despite its name, a [`FileSlice`] may or may not directly map to an actual file
/// on the filesystem.
#[async_trait]
pub trait FileHandle: 'static + Send + Sync + HasLen + fmt::Debug {
    /// Reads a slice of bytes.
    ///
    /// This method may panic if the range requested is invalid.
    fn read_bytes(&self, range: Range<usize>) -> io::Result<OwnedBytes>;

    // Default implementation: async reads are reported as unsupported.
    #[doc(hidden)]
    async fn read_bytes_async(&self, _byte_range: Range<usize>) -> io::Result<OwnedBytes> {
        Err(io::Error::new(
            io::ErrorKind::Unsupported,
            "Async read is not supported.",
        ))
    }
}

#[derive(Debug)]
/// A File with its length included.
pub struct WrapFile {
    // Underlying file the bytes are read from.
    file: File,
    // Length of the file in bytes, as stored by `WrapFile::new`.
    len: usize,
}
impl WrapFile {
    /// Creates a new WrapFile and stores its length.
    pub fn new(file: File) -> io::Result<Self> {
        let len = file.metadata()?.len() as usize;
        Ok(WrapFile { file, len })
    }
}

#[async_trait]
impl FileHandle for WrapFile {
    /// Reads the bytes of `range` from the file into a freshly allocated buffer.
    ///
    /// The end of the range is clamped to the stored file length.
    ///
    /// # Errors
    ///
    /// Returns an `InvalidInput` error if, after clamping, the range start is
    /// not strictly before its end, and propagates any I/O error of the read.
    // NOTE(review): an empty range (`start == end`) is rejected as invalid as well;
    // confirm this is intended for zero-length reads.
    fn read_bytes(&self, range: Range<usize>) -> io::Result<OwnedBytes> {
        let file_len = self.len();

        // Calculate the actual range to read, ensuring it stays within file boundaries
        let start = range.start;
        let end = range.end.min(file_len);

        // Ensure the start is before the end of the range
        if start >= end {
            return Err(io::Error::new(io::ErrorKind::InvalidInput, "Invalid range"));
        }

        let mut buffer = vec![0; end - start];

        // On unix, read at the given offset directly through `&self.file`.
        #[cfg(unix)]
        {
            use std::os::unix::prelude::FileExt;
            self.file.read_exact_at(&mut buffer, start as u64)?;
        }

        // Elsewhere, seek and read on a cloned handle.
        #[cfg(not(unix))]
        {
            use std::io::{Read, Seek};
            let mut file = self.file.try_clone()?; // Clone the file to read from it separately
            // Seek to the start position in the file
            file.seek(io::SeekFrom::Start(start as u64))?;
            // Read the data into the buffer
            file.read_exact(&mut buffer)?;
        }

        Ok(OwnedBytes::new(buffer))
    }
    // todo implement async
}
impl HasLen for WrapFile {
    /// Returns the stored `len` field; the file is not queried again.
    fn len(&self) -> usize {
        self.len
    }
}

#[async_trait]
impl FileHandle for &'static [u8] {
    /// Returns the requested sub-slice of the static byte slice.
    ///
    /// # Panics
    ///
    /// Panics if `range` is not a valid range of the slice.
    fn read_bytes(&self, range: Range<usize>) -> io::Result<OwnedBytes> {
        let requested: &'static [u8] = &self[range];
        Ok(OwnedBytes::new(requested))
    }

    /// Async variant; simply delegates to the synchronous `read_bytes`.
    async fn read_bytes_async(&self, byte_range: Range<usize>) -> io::Result<OwnedBytes> {
        self.read_bytes(byte_range)
    }
}

/// Builds a `FileSlice` over in-memory bytes: the bytes are wrapped in an
/// `OwnedBytes`, which is then used as the file handle.
impl<B> From<B> for FileSlice
where B: StableDeref + Deref<Target = [u8]> + 'static + Send + Sync
{
    fn from(bytes: B) -> FileSlice {
        FileSlice::new(Arc::new(OwnedBytes::new(bytes)))
    }
}

/// Logical slice of read only file in tantivy.
///
/// It can be cloned and sliced cheaply.
#[derive(Clone)]
pub struct FileSlice {
    // Shared handle used to read the bytes.
    data: Arc<dyn FileHandle>,
    // Byte range of the handle's data covered by this slice.
    range: Range<usize>,
}

impl fmt::Debug for FileSlice {
    /// Prints the underlying file handle followed by the byte range of the slice.
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let handle = &self.data;
        let byte_range = &self.range;
        write!(f, "FileSlice({:?}, {:?})", handle, byte_range)
    }
}

impl FileSlice {
    /// Returns chunks of 1MB of data from the FileHandle.
    ///
    /// The slice is read in consecutive chunks of at most 1MB, the last one
    /// being possibly shorter. Each item is the result of one `read_bytes`
    /// call on the underlying handle; after a failed read, the iterator
    /// moves on to the next chunk.
    pub fn stream_file_chunks(&self) -> impl Iterator<Item = io::Result<OwnedBytes>> + '_ {
        /// Maximum number of bytes requested per chunk.
        const CHUNK_SIZE: usize = 1024 * 1024; // 1MB

        let slice_end = self.range.end;
        let mut cursor = self.range.start;
        std::iter::from_fn(move || {
            if cursor >= slice_end {
                return None;
            }
            let chunk_end = (cursor + CHUNK_SIZE).min(slice_end);
            let chunk = self.data.read_bytes(cursor..chunk_end);
            cursor += CHUNK_SIZE;
            Some(chunk)
        })
    }
}

/// Applies a relative `RangeBounds` object to an original `Range` and
/// returns the resulting absolute `Range`.
///
/// The bounds of `rel_range` are interpreted as offsets from
/// `orig_range.start`; an unbounded side maps to the corresponding side of
/// `orig_range`.
///
/// For instance, combine_ranges(`[2..11)`, `[5..7]`) returns `[7..10)`:
/// the sub-range starts at offset 5 of `[2..11)` and ends at offset 7
/// included.
///
/// This function panics, if the result would suggest something outside
/// of the bounds of the original range.
fn combine_ranges<R: RangeBounds<usize>>(orig_range: Range<usize>, rel_range: R) -> Range<usize> {
    use std::ops::Bound;

    let start_offset: usize = match rel_range.start_bound() {
        Bound::Unbounded => 0,
        Bound::Included(&rel_start) => rel_start,
        Bound::Excluded(&rel_start) => rel_start + 1,
    };
    let start: usize = orig_range.start + start_offset;
    assert!(start <= orig_range.end);
    let end: usize = match rel_range.end_bound() {
        Bound::Unbounded => orig_range.end,
        Bound::Included(&rel_end) => orig_range.start + rel_end + 1,
        Bound::Excluded(&rel_end) => orig_range.start + rel_end,
    };
    assert!(end >= start);
    assert!(end <= orig_range.end);
    start..end
}

impl FileSlice {
    /// Creates a `FileSlice` covering the whole file located at `path`.
    ///
    /// # Errors
    ///
    /// Returns an error if the file cannot be opened or if wrapping it in a
    /// `WrapFile` fails.
    pub fn open(path: &Path) -> io::Result<FileSlice> {
        let wrap_file = WrapFile::new(File::open(path)?)?;
        Ok(FileSlice::new(Arc::new(wrap_file)))
    }

    /// Wraps a `FileHandle` into a `FileSlice` spanning the full length
    /// reported by the handle.
    pub fn new(file_handle: Arc<dyn FileHandle>) -> Self {
        let num_bytes = file_handle.len();
        FileSlice::new_with_num_bytes(file_handle, num_bytes)
    }

    /// Wraps a `FileHandle`, using `num_bytes` as the length of the slice
    /// instead of asking the handle for it.
    #[doc(hidden)]
    #[must_use]
    pub fn new_with_num_bytes(file_handle: Arc<dyn FileHandle>, num_bytes: usize) -> Self {
        FileSlice {
            data: file_handle,
            range: 0..num_bytes,
        }
    }

    /// Creates a fileslice that is just a view over a slice of the data.
    ///
    /// `byte_range` is relative to the start of this `FileSlice`.
    ///
    /// # Panics
    ///
    /// Panics if `byte_range` is not contained in `0..self.len()`.
    #[must_use]
    #[inline]
    pub fn slice<R: RangeBounds<usize>>(&self, byte_range: R) -> FileSlice {
        FileSlice {
            data: self.data.clone(),
            range: combine_ranges(self.range.clone(), byte_range),
        }
    }

    /// Creates an empty FileSlice
    pub fn empty() -> FileSlice {
        const EMPTY_SLICE: &[u8] = &[];
        FileSlice::from(EMPTY_SLICE)
    }

    /// Returns a `OwnedBytes` with all of the data in the `FileSlice`.
    ///
    /// The behavior is strongly dependent on the implementation of the underlying
    /// `Directory` and the `FileHandle` it creates.
    /// In particular, it is up to the `Directory` implementation
    /// to handle caching if needed.
    pub fn read_bytes(&self) -> io::Result<OwnedBytes> {
        self.data.read_bytes(self.range.clone())
    }

    /// Async counterpart of [`FileSlice::read_bytes`].
    #[doc(hidden)]
    pub async fn read_bytes_async(&self) -> io::Result<OwnedBytes> {
        self.data.read_bytes_async(self.range.clone()).await
    }

    /// Reads a specific slice of data.
    ///
    /// `range` is relative to the start of this `FileSlice`.
    /// This is equivalent to running `file_slice.slice(range).read_bytes()`.
    ///
    /// # Panics
    ///
    /// Panics if `range.end` exceeds the length of the `FileSlice`.
    pub fn read_bytes_slice(&self, range: Range<usize>) -> io::Result<OwnedBytes> {
        assert!(
            range.end <= self.len(),
            "end of requested range exceeds the fileslice length ({} > {})",
            range.end,
            self.len()
        );
        self.data
            .read_bytes(self.range.start + range.start..self.range.start + range.end)
    }

    /// Async counterpart of [`FileSlice::read_bytes_slice`].
    ///
    /// # Panics
    ///
    /// Panics if `byte_range.end` exceeds the length of the `FileSlice`.
    #[doc(hidden)]
    pub async fn read_bytes_slice_async(&self, byte_range: Range<usize>) -> io::Result<OwnedBytes> {
        // Same check (and same message) as the synchronous variant. Comparing
        // against `self.len()` avoids the `self.range.start + byte_range.end`
        // addition, which could overflow before the comparison took place.
        assert!(
            byte_range.end <= self.len(),
            "end of requested range exceeds the fileslice length ({} > {})",
            byte_range.end,
            self.len()
        );
        self.data
            .read_bytes_async(
                self.range.start + byte_range.start..self.range.start + byte_range.end,
            )
            .await
    }

    /// Splits the FileSlice at the given offset and return two file slices.
    /// `file_slice[..left_len]` and `file_slice[left_len..]`.
    ///
    /// This operation is cheap and must not copy any underlying data.
    ///
    /// # Panics
    ///
    /// Panics if `left_len` exceeds the length of the `FileSlice`.
    pub fn split(self, left_len: usize) -> (FileSlice, FileSlice) {
        let left = self.slice_to(left_len);
        let right = self.slice_from(left_len);
        (left, right)
    }

    /// Splits the file slice so that the right part holds the last
    /// `right_len` bytes. Returns
    /// `file_slice[..self.len() - right_len]` and `file_slice[self.len() - right_len..]`.
    ///
    /// # Panics
    ///
    /// Panics if `right_len` exceeds the length of the `FileSlice`.
    pub fn split_from_end(self, right_len: usize) -> (FileSlice, FileSlice) {
        let len = self.len();
        assert!(
            right_len <= len,
            "right length exceeds the fileslice length ({} > {})",
            right_len,
            len
        );
        self.split(len - right_len)
    }

    /// Like `.slice(...)` but enforcing only the `from`
    /// boundary.
    ///
    /// Equivalent to `.slice(from_offset..)`
    #[must_use]
    pub fn slice_from(&self, from_offset: usize) -> FileSlice {
        self.slice(from_offset..self.len())
    }

    /// Returns a slice holding the last `from_offset` bytes.
    ///
    /// Equivalent to `.slice(self.len() - from_offset..)`
    ///
    /// # Panics
    ///
    /// Panics if `from_offset` exceeds the length of the `FileSlice`.
    #[must_use]
    pub fn slice_from_end(&self, from_offset: usize) -> FileSlice {
        let len = self.len();
        // Without this check, `len - from_offset` wraps around in release
        // builds and the resulting view could start before this slice.
        assert!(
            from_offset <= len,
            "offset from end exceeds the fileslice length ({} > {})",
            from_offset,
            len
        );
        self.slice(len - from_offset..len)
    }

    /// Like `.slice(...)` but enforcing only the `to`
    /// boundary.
    ///
    /// Equivalent to `.slice(..to_offset)`
    #[must_use]
    pub fn slice_to(&self, to_offset: usize) -> FileSlice {
        self.slice(0..to_offset)
    }

    /// Returns the byte count of the FileSlice.
    pub fn num_bytes(&self) -> ByteCount {
        self.range.len().into()
    }
}

#[async_trait]
impl FileHandle for FileSlice {
    fn read_bytes(&self, range: Range<usize>) -> io::Result<OwnedBytes> {
        self.read_bytes_slice(range)
    }

    async fn read_bytes_async(&self, byte_range: Range<usize>) -> io::Result<OwnedBytes> {
        self.read_bytes_slice_async(byte_range).await
    }
}

impl HasLen for FileSlice {
    /// Number of bytes covered by the slice.
    fn len(&self) -> usize {
        ExactSizeIterator::len(&self.range)
    }
}

#[async_trait]
impl FileHandle for OwnedBytes {
    fn read_bytes(&self, range: Range<usize>) -> io::Result<OwnedBytes> {
        Ok(self.slice(range))
    }

    async fn read_bytes_async(&self, range: Range<usize>) -> io::Result<OwnedBytes> {
        self.read_bytes(range)
    }
}

#[cfg(test)]
mod tests {
    use std::io;
    use std::ops::Bound;
    use std::sync::Arc;

    use super::{FileHandle, FileSlice};
    use crate::HasLen;
    use crate::file_slice::combine_ranges;

    // Exercises `slice_from`, `slice_to`, `split` and `split_from_end` on a
    // 6-byte slice, including the degenerate splits at offset 0.
    #[test]
    fn test_file_slice() -> io::Result<()> {
        let file_slice = FileSlice::new(Arc::new(b"abcdef".as_ref()));
        assert_eq!(file_slice.len(), 6);
        assert_eq!(file_slice.slice_from(2).read_bytes()?.as_slice(), b"cdef");
        assert_eq!(file_slice.slice_to(2).read_bytes()?.as_slice(), b"ab");
        // Offsets of a nested slice are relative to the parent slice.
        assert_eq!(
            file_slice
                .slice_from(1)
                .slice_to(2)
                .read_bytes()?
                .as_slice(),
            b"bc"
        );
        {
            let (left, right) = file_slice.clone().split(0);
            assert_eq!(left.read_bytes()?.as_slice(), b"");
            assert_eq!(right.read_bytes()?.as_slice(), b"abcdef");
        }
        {
            let (left, right) = file_slice.clone().split(2);
            assert_eq!(left.read_bytes()?.as_slice(), b"ab");
            assert_eq!(right.read_bytes()?.as_slice(), b"cdef");
        }
        {
            let (left, right) = file_slice.clone().split_from_end(0);
            assert_eq!(left.read_bytes()?.as_slice(), b"abcdef");
            assert_eq!(right.read_bytes()?.as_slice(), b"");
        }
        {
            let (left, right) = file_slice.split_from_end(2);
            assert_eq!(left.read_bytes()?.as_slice(), b"abcd");
            assert_eq!(right.read_bytes()?.as_slice(), b"ef");
        }
        Ok(())
    }

    // A static byte slice can be used as a `FileHandle` trait object and
    // reports its length.
    #[test]
    fn test_file_slice_trait_slice_len() {
        let blop: &'static [u8] = b"abc";
        let owned_bytes: Box<dyn FileHandle> = Box::new(blop);
        assert_eq!(owned_bytes.len(), 3);
    }

    // Reading the whole slice and reading a sub-slice obtained via `slice`.
    #[test]
    fn test_slice_simple_read() -> io::Result<()> {
        let slice = FileSlice::new(Arc::new(&b"abcdef"[..]));
        assert_eq!(slice.len(), 6);
        assert_eq!(slice.read_bytes()?.as_ref(), b"abcdef");
        assert_eq!(slice.slice(1..4).read_bytes()?.as_ref(), b"bcd");
        Ok(())
    }

    // `read_bytes_slice` reads a relative range without building a sub-slice.
    #[test]
    fn test_slice_read_slice() -> io::Result<()> {
        let slice_deref = FileSlice::new(Arc::new(&b"abcdef"[..]));
        assert_eq!(slice_deref.read_bytes_slice(1..4)?.as_ref(), b"bcd");
        Ok(())
    }

    // Requesting a range ending past the slice must panic with a message
    // reporting both the requested end and the slice length. The comparison
    // against `b"bcd"` is never reached.
    #[test]
    #[should_panic(expected = "end of requested range exceeds the fileslice length (10 > 6)")]
    fn test_slice_read_slice_invalid_range_exceeds() {
        let slice_deref = FileSlice::new(Arc::new(&b"abcdef"[..]));
        assert_eq!(
            slice_deref.read_bytes_slice(0..10).unwrap().as_ref(),
            b"bcd"
        );
    }

    // Covers every kind of bound accepted by `combine_ranges`: half-open,
    // unbounded on either side, inclusive end and exclusive start.
    #[test]
    fn test_combine_range() {
        assert_eq!(combine_ranges(1..3, 0..1), 1..2);
        assert_eq!(combine_ranges(1..3, 1..), 2..3);
        assert_eq!(combine_ranges(1..4, ..2), 1..3);
        assert_eq!(combine_ranges(3..10, 2..5), 5..8);
        assert_eq!(combine_ranges(2..11, 5..=7), 7..10);
        assert_eq!(
            combine_ranges(2..11, (Bound::Excluded(5), Bound::Unbounded)),
            8..11
        );
    }

    // The relative range `1..4` does not fit in the 2-element range `3..5`.
    #[test]
    #[should_panic]
    fn test_combine_range_panics() {
        let _ = combine_ranges(3..5, 1..4);
    }
}


================================================
FILE: common/src/group_by.rs
================================================
use std::cell::RefCell;
use std::iter::Peekable;
use std::rc::Rc;

/// Extension trait adding [`group_by`](GroupByIteratorExtended::group_by) to every `Iterator`.
pub trait GroupByIteratorExtended: Iterator {
    /// Return an `Iterator` that groups iterator elements. Consecutive elements that map to the
    /// same key are assigned to the same group.
    ///
    /// The returned Iterator item is `(K, impl Iterator)`, where Iterator are the items of the
    /// group.
    ///
    /// The groups share the underlying iterator with the returned iterator: a group should be
    /// fully consumed before the next group is requested, otherwise the next group starts at the
    /// first element that was left unconsumed.
    ///
    /// ```
    /// use tantivy_common::GroupByIteratorExtended;
    ///
    /// // group data into runs of non-negative and negative values.
    /// let data: Vec<i32> = vec![1, 3, -2, -2, 1, 0, 1, 2];
    /// // groups:               |---->|------>|--------->|
    ///
    /// let mut data_grouped = Vec::new();
    /// // Note: group is an iterator
    /// for (key, group) in data.into_iter().group_by(|val| *val >= 0) {
    ///     data_grouped.push((key, group.collect()));
    /// }
    /// assert_eq!(data_grouped, vec![(true, vec![1, 3]), (false, vec![-2, -2]), (true, vec![1, 0, 1, 2])]);
    /// ```
    fn group_by<K, F>(self, key: F) -> GroupByIterator<Self, F, K>
    where
        Self: Sized,
        F: FnMut(&Self::Item) -> K,
        K: PartialEq + Clone,
        Self::Item: Clone,
    {
        GroupByIterator::new(self, key)
    }
}
// Blanket implementation: `group_by` is available on every `Iterator`.
impl<I: Iterator> GroupByIteratorExtended for I {}

/// Iterator over groups of consecutive elements sharing the same key.
///
/// Each item is the key of the group together with a [`GroupIterator`] yielding the
/// elements of that group.
pub struct GroupByIterator<I, F, K: Clone>
where
    I: Iterator,
    F: FnMut(&I::Item) -> K,
{
    // I really would like to avoid the Rc<RefCell>, but the Iterator is shared between
    // `GroupByIterator` and `GroupIterator`. In practice they are used consecutively and
    // the `GroupIterator` is finished before calling next on `GroupByIterator`. I'm not sure
    // there is a solution with lifetimes for that, because we would need to enforce it in the
    // usage somehow.
    //
    // One potential solution would be to replace the iterator approach with something similar.
    inner: Rc<RefCell<GroupByShared<I, F, K>>>,
}

/// State shared between a `GroupByIterator` and the `GroupIterator`s it hands out.
struct GroupByShared<I, F, K: Clone>
where
    I: Iterator,
    F: FnMut(&I::Item) -> K,
{
    // Underlying iterator. It is peekable so that the key of the next element can be
    // computed without consuming that element.
    iter: Peekable<I>,
    // Maps an element to the key of its group.
    group_by_fn: F,
}

impl<I, F, K> GroupByIterator<I, F, K>
where
    I: Iterator,
    F: FnMut(&I::Item) -> K,
    K: Clone,
{
    fn new(inner: I, group_by_fn: F) -> Self {
        let inner = GroupByShared {
            iter: inner.peekable(),
            group_by_fn,
        };

        Self {
            inner: Rc::new(RefCell::new(inner)),
        }
    }
}

impl<I, F, K> Iterator for GroupByIterator<I, F, K>
where
    I: Iterator,
    I::Item: Clone,
    F: FnMut(&I::Item) -> K,
    K: Clone,
{
    type Item = (K, GroupIterator<I, F, K>);

    /// Returns the key of the next pending element together with an iterator over
    /// the consecutive elements sharing that key, or `None` once the underlying
    /// iterator is exhausted.
    ///
    /// No element is consumed here: elements are only consumed through the returned
    /// `GroupIterator`.
    fn next(&mut self) -> Option<Self::Item> {
        let mut guard = self.inner.borrow_mut();
        // Reborrowing the guard as a plain `&mut` lets the borrow checker see that
        // `iter` and `group_by_fn` are disjoint fields, so the peeked element can be
        // handed to the key function by reference instead of being cloned.
        let shared = &mut *guard;
        let key = (shared.group_by_fn)(shared.iter.peek()?);

        let group_iter = GroupIterator {
            inner: Rc::clone(&self.inner),
            group_key: key.clone(),
        };
        Some((key, group_iter))
    }
}

/// Iterator over the elements of a single group produced by `GroupByIterator`.
pub struct GroupIterator<I, F, K: Clone>
where
    I: Iterator,
    F: FnMut(&I::Item) -> K,
{
    // State shared with the `GroupByIterator` that created this group.
    inner: Rc<RefCell<GroupByShared<I, F, K>>>,
    // Key of this group: iteration stops at the first element mapping to another key.
    group_key: K,
}

impl<I, F, K: PartialEq + Clone> Iterator for GroupIterator<I, F, K>
where
    I: Iterator,
    I::Item: Clone,
    F: FnMut(&I::Item) -> K,
{
    type Item = I::Item;

    /// Returns the next element if it belongs to this group.
    ///
    /// Returns `None` without consuming anything when the underlying iterator is
    /// exhausted or when its next element maps to a different key.
    fn next(&mut self) -> Option<Self::Item> {
        let mut guard = self.inner.borrow_mut();
        // Reborrow as a plain `&mut` so that `iter` and `group_by_fn` can be borrowed
        // independently: the key is computed from the peeked reference, which avoids
        // cloning every element of the group.
        let shared = &mut *guard;
        let upcoming_key = (shared.group_by_fn)(shared.iter.peek()?);
        if upcoming_key == self.group_key {
            shared.iter.next()
        } else {
            None
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    // Groups the values by their tens digit (`val / 10`) and materializes every
    // group into a `Vec`, consuming each group before requesting the next one.
    fn group_by_collect<I: Iterator<Item = u32>>(iter: I) -> Vec<(I::Item, Vec<I::Item>)> {
        iter.group_by(|val| val / 10)
            .map(|(el, iter)| (el, iter.collect::<Vec<_>>()))
            .collect::<Vec<_>>()
    }

    #[test]
    fn group_by_two_groups() {
        let vals = vec![1u32, 4, 15];
        let grouped_vals = group_by_collect(vals.into_iter());
        assert_eq!(grouped_vals, vec![(0, vec![1, 4]), (1, vec![15])]);
    }

    #[test]
    fn group_by_test_empty() {
        let vals = vec![];
        let grouped_vals = group_by_collect(vals.into_iter());
        assert_eq!(grouped_vals, vec![]);
    }

    // Only consecutive elements are grouped: the key `0` appears twice because
    // its elements are separated by an element with another key.
    #[test]
    fn group_by_three_groups() {
        let vals = vec![1u32, 4, 15, 1];
        let grouped_vals = group_by_collect(vals.into_iter());
        assert_eq!(
            grouped_vals,
            vec![(0, vec![1, 4]), (1, vec![15]), (0, vec![1])]
        );
    }
}


================================================
FILE: common/src/json_path_writer.rs
================================================
use crate::replace_in_place;

/// Separates the different segments of a json path.
pub const JSON_PATH_SEGMENT_SEP: u8 = 1u8;
/// [`JSON_PATH_SEGMENT_SEP`] as a one-character string.
///
/// The conversion is validated at compile time: compilation fails if the
/// separator is ever changed to a byte that is not valid UTF-8 on its own.
pub const JSON_PATH_SEGMENT_SEP_STR: &str = match std::str::from_utf8(&[JSON_PATH_SEGMENT_SEP]) {
    Ok(separator) => separator,
    Err(_) => panic!("JSON_PATH_SEGMENT_SEP must be a valid single-byte UTF-8 sequence"),
};

/// Separates the json path and the value in
/// a JSON term binary representation.
pub const JSON_END_OF_PATH: u8 = 0u8;
/// [`JSON_END_OF_PATH`] as a one-character string.
///
/// The conversion is validated at compile time: compilation fails if the
/// marker is ever changed to a byte that is not valid UTF-8 on its own.
pub const JSON_END_OF_PATH_STR: &str = match std::str::from_utf8(&[JSON_END_OF_PATH]) {
    Ok(marker) => marker,
    Err(_) => panic!("JSON_END_OF_PATH must be a valid single-byte UTF-8 sequence"),
};

/// Builds flattened json paths for tantivy, one segment at a time.
///
/// Segments are joined with `JSON_PATH_SEGMENT_SEP`.
#[derive(Clone, Debug, Default)]
pub struct JsonPathWriter {
    // The flattened path built so far.
    path: String,
    // For each pushed segment, the byte length of `path` right before the push.
    // Used by `pop` to truncate `path` back to its previous state.
    indices: Vec<usize>,
    // Whether dots within a pushed segment are turned into segment separators.
    expand_dots: bool,
}

impl JsonPathWriter {
    /// Creates an empty writer with the given `expand_dots` setting.
    pub fn with_expand_dots(expand_dots: bool) -> Self {
        Self {
            path: String::new(),
            indices: Vec::new(),
            expand_dots,
        }
    }

    /// Creates an empty writer with `expand_dots` disabled.
    pub fn new() -> Self {
        Self::with_expand_dots(false)
    }

    /// Enables or disables dot expansion for the segments pushed from now on.
    ///
    /// When `expand_dots` is enabled, a json object like
    /// `{"k8s.node.id": 5}` is processed as if it was
    /// `{"k8s": {"node": {"id": 5}}}`.
    /// This makes it possible to write queries like `k8s.node.id:5`,
    /// at the cost of possible ambiguity.
    #[inline]
    pub fn set_expand_dots(&mut self, expand_dots: bool) {
        self.expand_dots = expand_dots;
    }

    /// Appends a new segment to the path.
    #[inline]
    pub fn push(&mut self, segment: &str) {
        let segment_start = self.path.len();
        // A separator is only required if a segment was already pushed before.
        let needs_separator = !self.indices.is_empty();
        self.indices.push(segment_start);
        if needs_separator {
            self.path.push(char::from(JSON_PATH_SEGMENT_SEP));
        }
        self.path.push_str(segment);
        if !self.expand_dots {
            return;
        }
        // The appended part may start with the separator byte. This is fine, as
        // the separator is not a dot.
        let appended = &mut self.path[segment_start..];
        // SAFETY: both b'.' and JSON_PATH_SEGMENT_SEP are valid single-byte utf-8
        // strings. By utf-8 design, they cannot be part of another codepoint, so
        // swapping one for the other keeps the string valid utf-8.
        unsafe {
            replace_in_place(b'.', JSON_PATH_SEGMENT_SEP, appended.as_bytes_mut());
        }
    }

    /// Appends the end of JSON path marker.
    #[inline]
    pub fn set_end(&mut self) {
        self.path.push_str(JSON_END_OF_PATH_STR);
    }

    /// Removes the last pushed segment. Does nothing if no segment is left.
    #[inline]
    pub fn pop(&mut self) {
        // Without a recorded segment, truncating to the current length is a no-op.
        let previous_len = self.indices.pop().unwrap_or(self.path.len());
        self.path.truncate(previous_len);
    }

    /// Resets the writer to an empty path.
    #[inline]
    pub fn clear(&mut self) {
        self.indices.clear();
        self.path.clear();
    }

    /// Returns the path built so far.
    #[inline]
    pub fn as_str(&self) -> &str {
        self.path.as_str()
    }
}

impl From<JsonPathWriter> for String {
    #[inline]
    fn from(value: JsonPathWriter) -> Self {
        value.path
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    // Pushes and pops segments, first with dot expansion disabled (dots are
    // kept verbatim), then enabled (dots become segment separators).
    #[test]
    fn json_path_writer_test() {
        let mut writer = JsonPathWriter::new();
        writer.set_expand_dots(false);

        writer.push("root");
        assert_eq!(writer.as_str(), "root");

        writer.push("child");
        assert_eq!(writer.as_str(), "root\u{1}child");

        writer.pop();
        assert_eq!(writer.as_str(), "root");

        writer.push("k8s.node.id");
        assert_eq!(writer.as_str(), "root\u{1}k8s.node.id");

        writer.set_expand_dots(true);
        writer.pop();
        writer.push("k8s.node.id");
        assert_eq!(writer.as_str(), "root\u{1}k8s\u{1}node\u{1}id");
    }

    // A segment expanded into several sub-segments is removed by a single `pop`.
    #[test]
    fn test_json_path_expand_dots_enabled_pop_segment() {
        let mut json_writer = JsonPathWriter::with_expand_dots(true);
        json_writer.push("hello");
        assert_eq!(json_writer.as_str(), "hello");
        json_writer.push("color.hue");
        assert_eq!(json_writer.as_str(), "hello\x01color\x01hue");
        json_writer.pop();
        assert_eq!(json_writer.as_str(), "hello");
    }
}


================================================
FILE: common/src/lib.rs
================================================
#![allow(clippy::len_without_is_empty)]

use std::ops::Deref;

pub use byteorder::LittleEndian as Endianness;

mod bitset;
pub mod bounds;
mod byte_count;
mod datetime;
pub mod file_slice;
mod group_by;
pub mod json_path_writer;
mod serialize;
mod vint;
mod writer;
pub use bitset::*;
pub use byte_count::ByteCount;
pub use datetime::{DateTime, DateTimePrecision};
pub use group_by::GroupByIteratorExtended;
pub use json_path_writer::JsonPathWriter;
pub use ownedbytes::{OwnedBytes, StableDeref};
pub use serialize::{BinarySerializable, DeserializeFrom, FixedSize};
pub use vint::{
    VInt, VIntU128, read_u32_vint, read_u32_vint_no_advance, serialize_vint_u32, write_u32_vint,
};
pub use writer::{AntiCallToken, CountingWriter, TerminatingWrite};

/// Trait for objects that have a length.
pub trait HasLen {
    /// Returns the length of the object.
    fn len(&self) -> usize;

    /// Returns true iff the length is 0.
    fn is_empty(&self) -> bool {
        self.len() == 0
    }
}

/// Anything dereferencing to a byte slice reports the length of that slice.
impl<T: Deref<Target = [u8]>> HasLen for T {
    fn len(&self) -> usize {
        let bytes: &[u8] = self.deref();
        bytes.len()
    }
}

/// Mask selecting the most significant bit of a 64-bit word.
const HIGHEST_BIT: u64 = 1 << (u64::BITS - 1);

/// Maps a `i64` to `u64`
///
/// Tantivy internally handles `i64` values as `u64`, using the
/// order-preserving mapping defined by this function:
/// `-2^63 .. 2^63-1` is mapped to `0 .. 2^64-1`, in that order.
///
/// This is better suited to bitpacking than a plain cast (`val as u64`).
/// Take a list of `i64` ranging from -10 to 10: a cast projects the
/// negative values above 2^63, and every value ends up requiring 64 bits.
///
/// # See also
/// The reverse mapping is [`u64_to_i64()`].
#[inline]
pub fn i64_to_u64(val: i64) -> u64 {
    // Flipping the sign bit of the two's complement representation moves the
    // negative values below the positive ones.
    let raw_bits = val as u64;
    raw_bits ^ HIGHEST_BIT
}

/// Maps a `u64` back to the `i64` it was obtained from through [`i64_to_u64()`].
#[inline]
pub fn u64_to_i64(val: u64) -> i64 {
    // Flipping the highest bit again restores the two's complement bits.
    let raw_bits = val ^ HIGHEST_BIT;
    raw_bits as i64
}

/// Maps a `f64` to `u64`
///
/// For simplicity, tantivy internally handles `f64` as `u64`.
/// The mapping is defined by this function.
///
/// Maps `f64` to `u64` in a monotonic manner, so that bytes lexical order is preserved.
///
/// This is more suited than simply casting (`val as u64`)
/// which would truncate the result
///
/// # Reference
///
/// Daniel Lemire's [blog post](https://lemire.me/blog/2020/12/14/converting-floating-point-numbers-to-integers-while-preserving-order/)
/// explains the mapping in a clear manner.
///
/// # See also
/// The reverse mapping is [`u64_to_f64()`].
#[inline]
pub fn f64_to_u64(val: f64) -> u64 {
    let bits = val.to_bits();
    if val.is_sign_positive() {
        bits ^ HIGHEST_BIT
    } else {
        !bits
    }
}

/// Maps a `u64` back to the `f64` it was obtained from through [`f64_to_u64()`].
#[inline]
pub fn u64_to_f64(val: u64) -> f64 {
    let bits = if val & HIGHEST_BIT == 0 {
        // Highest bit unset: all the bits are flipped back.
        !val
    } else {
        // Highest bit set: only that bit is cleared.
        val & !HIGHEST_BIT
    };
    f64::from_bits(bits)
}

/// Replaces every occurrence of `needle` in `bytes` with `replacement`.
///
/// The needle is expected to be rarely present in `bytes`: a fast path
/// returns right away when it is absent.
#[inline]
pub fn replace_in_place(needle: u8, replacement: u8, bytes: &mut [u8]) {
    if bytes.contains(&needle) {
        bytes
            .iter_mut()
            .filter(|byte| **byte == needle)
            .for_each(|byte| *byte = replacement);
    }
}

#[cfg(test)]
pub(crate) mod test {

    use proptest::prelude::*;

    use super::{f64_to_u64, i64_to_u64, u64_to_f64, u64_to_i64};

    // Checks that mapping an `i64` to `u64` and back yields the original value.
    fn test_i64_converter_helper(val: i64) {
        assert_eq!(u64_to_i64(i64_to_u64(val)), val);
    }

    // Checks that mapping an `f64` to `u64` and back yields the original value.
    fn test_f64_converter_helper(val: f64) {
        assert_eq!(u64_to_f64(f64_to_u64(val)), val);
    }

    proptest! {
        // The mapping preserves the strict order of any two normal floats.
        #[test]
        fn test_f64_converter_monotonicity_proptest((left, right) in (proptest::num::f64::NORMAL, proptest::num::f64::NORMAL)) {
            let left_u64 = f64_to_u64(left);
            let right_u64 = f64_to_u64(right);
            assert_eq!(left_u64 < right_u64,  left < right);
        }
    }

    // The extreme `i64` values map to the extreme `u64` values, and the
    // mapping round-trips.
    #[test]
    fn test_i64_converter() {
        assert_eq!(i64_to_u64(i64::MIN), u64::MIN);
        assert_eq!(i64_to_u64(i64::MAX), u64::MAX);
        test_i64_converter_helper(0i64);
        test_i64_converter_helper(i64::MIN);
        test_i64_converter_helper(i64::MAX);
        for i in -1000i64..1000i64 {
            test_i64_converter_helper(i);
        }
    }

    // Round-trips infinities, both zeros and +/-1.
    #[test]
    fn test_f64_converter() {
        test_f64_converter_helper(f64::INFINITY);
        test_f64_converter_helper(f64::NEG_INFINITY);
        test_f64_converter_helper(0.0);
        test_f64_converter_helper(-0.0);
        test_f64_converter_helper(1.0);
        test_f64_converter_helper(-1.0);
    }

    // Spot checks of the ordering of mapped values.
    #[test]
    fn test_f64_order() {
        assert!(
            !(f64_to_u64(f64::NEG_INFINITY)..f64_to_u64(f64::INFINITY))
                .contains(&f64_to_u64(f64::NAN))
        ); // nan is not a number
        assert!(f64_to_u64(1.5) > f64_to_u64(1.0)); // same exponent, different mantissa
        assert!(f64_to_u64(2.0) > f64_to_u64(1.0)); // same mantissa, different exponent
        assert!(f64_to_u64(2.0) > f64_to_u64(1.5)); // different exponent and mantissa
        assert!(f64_to_u64(1.0) > f64_to_u64(-1.0)); // pos > neg
        assert!(f64_to_u64(-1.5) < f64_to_u64(-1.0));
        assert!(f64_to_u64(-2.0) < f64_to_u64(1.0));
        assert!(f64_to_u64(-2.0) < f64_to_u64(-1.5));
    }

    // Replaces `b'b'` with `b'c'` at every position, including inputs without
    // any occurrence and the empty input.
    #[test]
    fn test_replace_in_place() {
        let test_aux = |before_replacement: &[u8], expected: &[u8]| {
            let mut bytes: Vec<u8> = before_replacement.to_vec();
            super::replace_in_place(b'b', b'c', &mut bytes);
            assert_eq!(&bytes[..], expected);
        };
        test_aux(b"", b"");
        test_aux(b"b", b"c");
        test_aux(b"baaa", b"caaa");
        test_aux(b"aaab", b"aaac");
        test_aux(b"aaabaa", b"aaacaa");
        test_aux(b"aaaaaa", b"aaaaaa");
        test_aux(b"bbbb", b"cccc");
    }
}


================================================
FILE: common/src/serialize.rs
================================================
use std::borrow::Cow;
use std::io::{Read, Write};
use std::{fmt, io};

use byteorder::{ReadBytesExt, WriteBytesExt};

use crate::{Endianness, VInt};

/// Writer that discards the data it receives and only keeps track of the
/// number of bytes written to it.
#[derive(Default)]
struct Counter(u64);

impl io::Write for Counter {
    /// Accounts for the whole buffer and reports it as entirely written.
    fn write(&mut self, buf: &[u8]) -> io::Result<usize> {
        let num_bytes = buf.len();
        self.0 += num_bytes as u64;
        Ok(num_bytes)
    }

    /// Accounts for the whole buffer; never fails.
    fn write_all(&mut self, buf: &[u8]) -> io::Result<()> {
        let num_bytes = buf.len() as u64;
        self.0 += num_bytes;
        Ok(())
    }

    /// Nothing is buffered, so there is nothing to flush.
    fn flush(&mut self) -> io::Result<()> {
        Ok(())
    }
}

/// Trait for a simple binary serialization.
pub trait BinarySerializable: fmt::Debug + Sized {
    /// Serializes `self` into `writer`.
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()>;
    /// Deserializes a value from `reader`.
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self>;

    /// Returns the number of bytes of the serialized representation.
    ///
    /// The default implementation serializes `self` into a writer that only
    /// counts bytes, and panics if `serialize` returns an error.
    fn num_bytes(&self) -> u64 {
        let mut counter = Counter::default();
        self.serialize(&mut counter).unwrap();
        counter.0
    }
}

/// Trait for sources from which a `BinarySerializable` value of type `T` can be read.
pub trait DeserializeFrom<T: BinarySerializable> {
    /// Reads a value of type `T` from `self`.
    fn deserialize(&mut self) -> io::Result<T>;
}

/// Lets any `BinarySerializable` type be deserialized straight from a `&[u8]`.
///
/// `TryFrom` would actually be preferable, but it is not possible because of
/// the orphan rules (not completely sure if this could be resolved).
impl<T: BinarySerializable> DeserializeFrom<T> for &[u8] {
    fn deserialize(&mut self) -> io::Result<T> {
        <T as BinarySerializable>::deserialize(self)
    }
}

/// `FixedSize` marks a `BinarySerializable` as
/// always serializing to the same size.
pub trait FixedSize: BinarySerializable {
    /// Number of bytes of the serialized representation.
    const SIZE_IN_BYTES: usize;
}

/// The unit type serializes to nothing: no byte is written nor read.
impl BinarySerializable for () {
    fn serialize<W: Write + ?Sized>(&self, _: &mut W) -> io::Result<()> {
        Ok(())
    }
    fn deserialize<R: Read>(_: &mut R) -> io::Result<Self> {
        Ok(())
    }
}

impl FixedSize for () {
    // Matches the `BinarySerializable` implementation, which writes no byte.
    const SIZE_IN_BYTES: usize = 0;
}

/// A `Vec<T>` is serialized as its number of items (`VInt`), followed by the
/// serialization of each item.
impl<T: BinarySerializable> BinarySerializable for Vec<T> {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        BinarySerializable::serialize(&VInt(self.len() as u64), writer)?;
        for it in self {
            it.serialize(writer)?;
        }
        Ok(())
    }
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Vec<T>> {
        // Upper bound on the memory reserved upfront. The number of items is read
        // from the input: with corrupted data it can be arbitrarily large, and
        // reserving that much would panic or abort before any item is even read.
        // Larger vectors simply grow as their items are deserialized.
        const MAX_PREALLOCATED_BYTES: usize = 1 << 20;

        let num_items = <VInt as BinarySerializable>::deserialize(reader)?.val();
        let max_preallocated_items = MAX_PREALLOCATED_BYTES / std::mem::size_of::<T>().max(1);
        let capacity = usize::try_from(num_items)
            .unwrap_or(usize::MAX)
            .min(max_preallocated_items);
        let mut items: Vec<T> = Vec::with_capacity(capacity);
        for _ in 0..num_items {
            let item = T::deserialize(reader)?;
            items.push(item);
        }
        Ok(items)
    }
}

/// A pair is serialized as its first element followed by its second element.
impl<Left: BinarySerializable, Right: BinarySerializable> BinarySerializable for (Left, Right) {
    fn serialize<W: Write + ?Sized>(&self, write: &mut W) -> io::Result<()> {
        let (left, right) = self;
        left.serialize(write)?;
        right.serialize(write)
    }
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        // The elements are read in the order in which they were written.
        let left = Left::deserialize(reader)?;
        let right = Right::deserialize(reader)?;
        Ok((left, right))
    }
}
impl<Left: BinarySerializable + FixedSize, Right: BinarySerializable + FixedSize> FixedSize
    for (Left, Right)
{
    // Both elements are serialized back to back.
    const SIZE_IN_BYTES: usize = Left::SIZE_IN_BYTES + Right::SIZE_IN_BYTES;
}

/// A `u32` is serialized in the byte order given by `Endianness`.
impl BinarySerializable for u32 {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        writer.write_u32::<Endianness>(*self)
    }

    fn deserialize<R: Read>(reader: &mut R) -> io::Result<u32> {
        reader.read_u32::<Endianness>()
    }
}

impl FixedSize for u32 {
    // Width of a `u32` in bytes.
    const SIZE_IN_BYTES: usize = 4;
}

/// A `u16` is serialized in the byte order given by `Endianness`.
impl BinarySerializable for u16 {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        writer.write_u16::<Endianness>(*self)
    }

    fn deserialize<R: Read>(reader: &mut R) -> io::Result<u16> {
        reader.read_u16::<Endianness>()
    }
}

impl FixedSize for u16 {
    // Width of a `u16` in bytes.
    const SIZE_IN_BYTES: usize = 2;
}

/// A `u64` is serialized in the byte order given by `Endianness`.
impl BinarySerializable for u64 {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        writer.write_u64::<Endianness>(*self)
    }
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        reader.read_u64::<Endianness>()
    }
}

impl FixedSize for u64 {
    // Width of a `u64` in bytes.
    const SIZE_IN_BYTES: usize = 8;
}

/// A `u128` is serialized in the byte order given by `Endianness`.
impl BinarySerializable for u128 {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        writer.write_u128::<Endianness>(*self)
    }
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        reader.read_u128::<Endianness>()
    }
}

impl FixedSize for u128 {
    // Width of a `u128` in bytes.
    const SIZE_IN_BYTES: usize = 16;
}

/// A `f32` is serialized in the byte order given by `Endianness`.
impl BinarySerializable for f32 {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        writer.write_f32::<Endianness>(*self)
    }
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        reader.read_f32::<Endianness>()
    }
}

impl FixedSize for f32 {
    // Width of a `f32` in bytes.
    const SIZE_IN_BYTES: usize = 4;
}

/// A `i64` is serialized in the byte order given by `Endianness`.
impl BinarySerializable for i64 {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        writer.write_i64::<Endianness>(*self)
    }
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        reader.read_i64::<Endianness>()
    }
}

impl FixedSize for i64 {
    // Width of a `i64` in bytes.
    const SIZE_IN_BYTES: usize = 8;
}

/// A `f64` is serialized in the byte order given by `Endianness`.
impl BinarySerializable for f64 {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        writer.write_f64::<Endianness>(*self)
    }
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        reader.read_f64::<Endianness>()
    }
}

impl FixedSize for f64 {
    // Width of a `f64` in bytes.
    const SIZE_IN_BYTES: usize = 8;
}

/// A `u8` is serialized as a single byte.
impl BinarySerializable for u8 {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        writer.write_u8(*self)
    }
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<u8> {
        reader.read_u8()
    }
}

impl FixedSize for u8 {
    // Width of a `u8` in bytes.
    const SIZE_IN_BYTES: usize = 1;
}

/// A `bool` is serialized as a single byte: `0` for `false`, `1` for `true`.
impl BinarySerializable for bool {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        let byte = u8::from(*self);
        writer.write_u8(byte)
    }
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<bool> {
        // Any byte other than 0 or 1 cannot have been produced by `serialize`.
        match reader.read_u8()? {
            0 => Ok(false),
            1 => Ok(true),
            _ => {
                let corrupted = io::Error::new(
                    io::ErrorKind::InvalidData,
                    "invalid bool value on deserialization, data corrupted",
                );
                Err(corrupted)
            }
        }
    }
}

impl FixedSize for bool {
    // A `bool` is serialized as a single byte.
    const SIZE_IN_BYTES: usize = 1;
}

impl BinarySerializable for String {
    /// Writes the UTF-8 byte length as a `VInt`, followed by the raw UTF-8 bytes.
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        let data: &[u8] = self.as_bytes();
        BinarySerializable::serialize(&VInt(data.len() as u64), writer)?;
        writer.write_all(data)
    }

    /// Reads a `VInt` length prefix, then exactly that many bytes of UTF-8.
    ///
    /// # Errors
    ///
    /// - `io::ErrorKind::UnexpectedEof` if the reader ends before the announced number of
    ///   bytes could be read.
    /// - Whatever `read_to_string` reports, e.g. when the payload is not valid UTF-8.
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<String> {
        // The length prefix comes straight from the (possibly corrupted) input, so it must
        // not drive an unbounded up-front allocation. Larger strings simply grow on demand.
        const MAX_PREALLOCATED_BYTES: u64 = 1 << 20;

        let string_length = <VInt as BinarySerializable>::deserialize(reader)?.val();
        let mut result = String::with_capacity(string_length.min(MAX_PREALLOCATED_BYTES) as usize);
        let num_bytes_read = reader.take(string_length).read_to_string(&mut result)?;
        // `take` stops silently at end of input: a short read means the data is truncated.
        if num_bytes_read as u64 != string_length {
            return Err(io::Error::new(
                io::ErrorKind::UnexpectedEof,
                "Reached end of input while reading a string payload",
            ));
        }
        Ok(result)
    }
}

impl<'a> BinarySerializable for Cow<'a, str> {
    /// Writes the UTF-8 byte length as a `VInt`, followed by the raw UTF-8 bytes.
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        let data: &[u8] = self.as_bytes();
        BinarySerializable::serialize(&VInt(data.len() as u64), writer)?;
        writer.write_all(data)
    }

    /// Reads a `VInt` length prefix, then exactly that many bytes of UTF-8, and returns
    /// them as a `Cow::Owned`.
    ///
    /// # Errors
    ///
    /// - `io::ErrorKind::UnexpectedEof` if the reader ends before the announced number of
    ///   bytes could be read.
    /// - Whatever `read_to_string` reports, e.g. when the payload is not valid UTF-8.
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Cow<'a, str>> {
        // The length prefix comes straight from the (possibly corrupted) input, so it must
        // not drive an unbounded up-front allocation. Larger strings simply grow on demand.
        const MAX_PREALLOCATED_BYTES: u64 = 1 << 20;

        let string_length = <VInt as BinarySerializable>::deserialize(reader)?.val();
        let mut result = String::with_capacity(string_length.min(MAX_PREALLOCATED_BYTES) as usize);
        let num_bytes_read = reader.take(string_length).read_to_string(&mut result)?;
        // `take` stops silently at end of input: a short read means the data is truncated.
        if num_bytes_read as u64 != string_length {
            return Err(io::Error::new(
                io::ErrorKind::UnexpectedEof,
                "Reached end of input while reading a string payload",
            ));
        }
        Ok(Cow::Owned(result))
    }
}

impl<'a> BinarySerializable for Cow<'a, [u8]> {
    /// Writes the number of bytes as a `VInt`, followed by the bytes themselves.
    ///
    /// The payload is written with a single `write_all` call; the produced bytes are the
    /// same as writing each `u8` individually.
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        let bytes: &[u8] = self;
        BinarySerializable::serialize(&VInt(bytes.len() as u64), writer)?;
        writer.write_all(bytes)
    }

    /// Reads a `VInt` length prefix, then exactly that many bytes, and returns them as a
    /// `Cow::Owned`.
    ///
    /// # Errors
    ///
    /// `io::ErrorKind::UnexpectedEof` if the reader ends before the announced number of
    /// bytes could be read.
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Cow<'a, [u8]>> {
        // The length prefix comes straight from the (possibly corrupted) input, so it must
        // not drive an unbounded up-front allocation. Larger payloads simply grow on demand.
        const MAX_PREALLOCATED_BYTES: u64 = 1 << 20;

        let num_items = <VInt as BinarySerializable>::deserialize(reader)?.val();
        let mut items: Vec<u8> = Vec::with_capacity(num_items.min(MAX_PREALLOCATED_BYTES) as usize);
        let num_bytes_read = reader.take(num_items).read_to_end(&mut items)?;
        // `take` stops silently at end of input: a short read means the data is truncated.
        if num_bytes_read as u64 != num_items {
            return Err(io::Error::new(
                io::ErrorKind::UnexpectedEof,
                "Reached end of input while reading a bytes payload",
            ));
        }
        Ok(Cow::Owned(items))
    }
}

#[cfg(test)]
pub mod test {

    use super::*;
    /// Serializes `O::default()` into an empty buffer and asserts that the number of
    /// bytes written equals `O::SIZE_IN_BYTES`.
    pub fn fixed_size_test<O: BinarySerializable + FixedSize + Default>() {
        let mut buffer = Vec::new();
        O::default().serialize(&mut buffer).unwrap();
        assert_eq!(buffer.len(), O::SIZE_IN_BYTES);
    }

    /// Round-trips `v` through `serialize` / `deserialize`, asserts that the decoded value
    /// equals `v`, and returns the number of bytes the serialized form took.
    fn serialize_test<T: BinarySerializable + Eq>(v: T) -> usize {
        let mut buffer: Vec<u8> = Vec::new();
        v.serialize(&mut buffer).unwrap();
        let num_bytes = buffer.len();
        let mut cursor = &buffer[..];
        let deser = T::deserialize(&mut cursor).unwrap();
        assert_eq!(deser, v);
        num_bytes
    }

    #[test]
    fn test_serialize_u8() {
        fixed_size_test::<u8>();
    }

    #[test]
    fn test_serialize_u32() {
        fixed_size_test::<u32>();
        assert_eq!(4, serialize_test(3u32));
        assert_eq!(4, serialize_test(5u32));
        assert_eq!(4, serialize_test(u32::MAX));
    }

    #[test]
    fn test_serialize_i64() {
        fixed_size_test::<i64>();
    }

    #[test]
    fn test_serialize_f64() {
        fixed_size_test::<f64>();
    }

    #[test]
    fn test_serialize_u64() {
        fixed_size_test::<u64>();
    }

    #[test]
    fn test_serialize_bool() {
        fixed_size_test::<bool>();
    }

    // Strings take one length byte (a vint, for these short lengths) plus their UTF-8
    // bytes; each character used below is 3 bytes long in UTF-8.
    #[test]
    fn test_serialize_string() {
        assert_eq!(serialize_test(String::from("")), 1);
        assert_eq!(serialize_test(String::from("ぽよぽよ")), 1 + 3 * 4);
        assert_eq!(serialize_test(String::from("富士さん見える。")), 1 + 3 * 8);
    }

    #[test]
    fn test_serialize_vec() {
        assert_eq!(serialize_test(Vec::<u8>::new()), 1);
        assert_eq!(serialize_test(vec![1u32, 3u32]), 1 + 4 * 2);
    }

    // The encoded length grows by one byte for every additional 7 bits of payload.
    #[test]
    fn test_serialize_vint() {
        for i in 0..10_000 {
            serialize_test(VInt(i as u64));
        }
        assert_eq!(serialize_test(VInt(7u64)), 1);
        assert_eq!(serialize_test(VInt(127u64)), 1);
        assert_eq!(serialize_test(VInt(128u64)), 2);
        assert_eq!(serialize_test(VInt(129u64)), 2);
        assert_eq!(serialize_test(VInt(1234u64)), 2);
        assert_eq!(serialize_test(VInt(16_383u64)), 2);
        assert_eq!(serialize_test(VInt(16_384u64)), 3);
        assert_eq!(serialize_test(VInt(u64::MAX)), 10);
    }
}


================================================
FILE: common/src/vint.rs
================================================
use std::io;
use std::io::{Read, Write};

use super::BinarySerializable;

/// Appends the variable-length (vint) encoding of a `u128` to `output`.
///
/// The value is emitted 7 bits at a time, least significant group first. Only the last
/// byte has `STOP_BIT` set.
pub fn serialize_vint_u128(mut val: u128, output: &mut Vec<u8>) {
    // Every group that is followed by more payload is written without the stop bit.
    while val >= 128u128 {
        output.push((val & 127u128) as u8);
        val >>= 7;
    }
    // What remains fits in 7 bits: it is the final byte.
    output.push(val as u8 | STOP_BIT);
}

///   Wrapper over a `u128` that serializes as a variable int.
#[derive(Clone, Copy, Debug, Eq, PartialEq)]
pub struct VIntU128(pub u128);

impl BinarySerializable for VIntU128 {
    /// Writes the vint encoding produced by `serialize_vint_u128`.
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        let mut buffer = vec![];
        serialize_vint_u128(self.0, &mut buffer);
        writer.write_all(&buffer)
    }

    /// Reads bytes one at a time, accumulating 7 bits of payload per byte, until a byte
    /// with the stop bit set is found.
    ///
    /// # Errors
    ///
    /// Returns `io::ErrorKind::InvalidData` if the reader ends (or fails) before the stop
    /// bit is found, or if the encoding carries more 7-bit groups than a `u128` can hold.
    #[allow(clippy::unbuffered_bytes)]
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        #[allow(clippy::unbuffered_bytes)]
        let mut bytes = reader.bytes();
        let mut result = 0u128;
        let mut shift = 0u32;
        loop {
            match bytes.next() {
                Some(Ok(b)) => {
                    // Without this guard, corrupted input lacking a stop bit would make
                    // `shift` exceed the integer width: a panic in debug builds and a
                    // silently wrong value in release builds.
                    if shift >= u128::BITS {
                        return Err(io::Error::new(
                            io::ErrorKind::InvalidData,
                            "Corrupted data. VInt payload does not fit in a u128",
                        ));
                    }
                    result |= u128::from(b % 128u8) << shift;
                    if b >= STOP_BIT {
                        return Ok(VIntU128(result));
                    }
                    shift += 7;
                }
                _ => {
                    return Err(io::Error::new(
                        io::ErrorKind::InvalidData,
                        "Reach end of buffer while reading VInt",
                    ));
                }
            }
        }
    }
}

///   Wrapper over a `u64` that serializes as a variable int.
#[derive(Clone, Copy, Debug, Eq, PartialEq)]
pub struct VInt(pub u64);

/// High bit of a vint byte. The serializers in this file OR it into the last byte of an
/// encoded value, and the readers stop at the first byte that is `>= STOP_BIT`.
const STOP_BIT: u8 = 128;

/// Encodes `val` as a vint into `buf` and returns the sub-slice holding the encoding.
///
/// Each encoded byte carries 7 bits of payload, least significant group first, and the
/// last byte has its high bit (the stop bit) set. The encoding takes 1 to 5 bytes.
/// All 8 bytes of `buf` are overwritten; the bytes past the returned slice are zero.
#[inline]
pub fn serialize_vint_u32(val: u32, buf: &mut [u8; 8]) -> &[u8] {
    const PAYLOAD_MASK: u64 = 0x7F;
    const STOP_BIT: u64 = 0x80;

    let value = u64::from(val);
    // Moves the `group`-th 7-bit group of `value` into the `group`-th byte of a `u64`.
    let spread = |group: u32| ((value >> (7 * group)) & PAYLOAD_MASK) << (8 * group);

    let (payload, num_bytes): (u64, usize) = match value {
        0..=0x7F => (spread(0), 1),
        0x80..=0x3FFF => (spread(0) | spread(1), 2),
        0x4000..=0x1F_FFFF => (spread(0) | spread(1) | spread(2), 3),
        0x20_0000..=0xFFF_FFFF => (spread(0) | spread(1) | spread(2) | spread(3), 4),
        _ => (
            spread(0) | spread(1) | spread(2) | spread(3) | spread(4),
            5,
        ),
    };
    // The stop bit marks the last byte of the encoding.
    let encoded = payload | (STOP_BIT << (8 * (num_bytes - 1)));
    *buf = encoded.to_le_bytes();
    &buf[..num_bytes]
}

/// Returns the length in bytes of the serialized vint `u32` found at the start of `data`.
///
/// Only the first 5 bytes of `data` are inspected, looking for the byte that carries the
/// stop bit, i.e. the final byte of the vint.
///
/// # Panics
///
/// If none of the inspected bytes carries the stop bit, which means `data` does not
/// start with a valid vint.
fn vint_len(data: &[u8]) -> usize {
    match data.iter().take(5).position(|&byte| byte >= STOP_BIT) {
        Some(last_idx) => last_idx + 1,
        None => panic!("Corrupted data. Invalid VInt 32"),
    }
}

/// Decodes the vint `u32` found at the start of `data` and advances `data` past it.
///
/// # Panics
///
/// If `data` does not start with a valid vint payload.
pub fn read_u32_vint(data: &mut &[u8]) -> u32 {
    let (value, num_bytes) = read_u32_vint_no_advance(data);
    // Drop the bytes that were just decoded.
    let (_, remaining) = data.split_at(num_bytes);
    *data = remaining;
    value
}

/// Decodes the vint `u32` found at the start of `data` without consuming it.
///
/// Returns the decoded value together with the number of bytes its encoding occupies.
///
/// # Panics
///
/// If `data` does not start with a valid vint payload (see `vint_len`).
pub fn read_u32_vint_no_advance(data: &[u8]) -> (u32, usize) {
    let num_bytes = vint_len(data);
    // The i-th byte contributes its 7 low bits at bit offset `7 * i`.
    let value = data[..num_bytes]
        .iter()
        .enumerate()
        .fold(0u32, |acc, (idx, &byte)| acc | (u32::from(byte & 127u8) << (7 * idx)));
    (value, num_bytes)
}
/// Writes `val` to `writer` in its vint encoding.
///
/// The value is first encoded into a stack buffer by `serialize_vint_u32`, then written
/// with a single `write_all` call.
pub fn write_u32_vint<W: io::Write + ?Sized>(val: u32, writer: &mut W) -> io::Result<()> {
    let mut scratch = [0u8; 8];
    let encoded = serialize_vint_u32(val, &mut scratch);
    writer.write_all(encoded)
}

impl VInt {
    pub fn val(&self) -> u64 {
        self.0
    }

    pub fn deserialize_u64<R: Read>(reader: &mut R) -> io::Result<u64> {
        VInt::deserialize(reader).map(|vint| vint.0)
    }

    pub fn serialize_into_vec(&self, output: &mut Vec<u8>) {
        let mut buffer = [0u8; 10];
        let num_bytes = self.serialize_into(&mut buffer);
        output.extend(&buffer[0..num_bytes]);
    }

    pub fn serialize_into(&self, buffer: &mut [u8; 10]) -> usize {
        let mut remaining = self.0;
        for (i, b) in buffer.iter_mut().enumerate() {
            let next_byte: u8 = (remaining % 128u64) as u8;
            remaining /= 128u64;
            if remaining == 0u64 {
                *b = next_byte | STOP_BIT;
                return i + 1;
            } else {
                *b = next_byte;
            }
        }
        unreachable!();
    }
}

impl BinarySerializable for VInt {
    /// Writes the vint encoding of the wrapped value, as produced by `serialize_into`.
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        let mut buffer = [0u8; 10];
        let num_bytes = self.serialize_into(&mut buffer);
        writer.write_all(&buffer[0..num_bytes])
    }

    /// Reads bytes one at a time, accumulating 7 bits of payload per byte, until a byte
    /// with the stop bit set is found.
    ///
    /// # Errors
    ///
    /// Returns `io::ErrorKind::InvalidData` if the reader ends (or fails) before the stop
    /// bit is found, or if the encoding carries more 7-bit groups than a `u64` can hold.
    #[allow(clippy::unbuffered_bytes)]
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        #[allow(clippy::unbuffered_bytes)]
        let mut bytes = reader.bytes();
        let mut result = 0u64;
        let mut shift = 0u32;
        loop {
            match bytes.next() {
                Some(Ok(b)) => {
                    // Without this guard, corrupted input lacking a stop bit would make
                    // `shift` exceed the integer width: a panic in debug builds and a
                    // silently wrong value in release builds.
                    if shift >= u64::BITS {
                        return Err(io::Error::new(
                            io::ErrorKind::InvalidData,
                            "Corrupted data. VInt payload does not fit in a u64",
                        ));
                    }
                    result |= u64::from(b % 128u8) << shift;
                    if b >= STOP_BIT {
                        return Ok(VInt(result));
                    }
                    shift += 7;
                }
                _ => {
                    return Err(io::Error::new(
                        io::ErrorKind::InvalidData,
                        "Reach end of buffer while reading VInt",
                    ));
                }
            }
        }
    }
}

#[cfg(test)]
mod tests {

    use super::{BinarySerializable, VInt, serialize_vint_u32};

    /// Serializes `val` into a buffer pre-filled with a sentinel byte and checks that:
    /// - the bytes past the encoding are left untouched,
    /// - the encoding length is consistent with the magnitude of `val`,
    /// - deserializing the buffer yields `val` back.
    fn aux_test_vint(val: u64) {
        let mut v = [14u8; 10];
        let num_bytes = VInt(val).serialize_into(&mut v);
        for el in &v[num_bytes..10] {
            assert_eq!(el, &14u8);
        }
        assert!(num_bytes > 0);
        if num_bytes < 10 {
            assert!(1u64 << (7 * num_bytes) > val);
        }
        if num_bytes > 1 {
            assert!(1u64 << (7 * (num_bytes - 1)) <= val);
        }
        let serdeser_val = VInt::deserialize(&mut &v[..]).unwrap();
        assert_eq!(val, serdeser_val.0);
    }

    #[test]
    fn test_vint() {
        aux_test_vint(0);
        aux_test_vint(1);
        aux_test_vint(5);
        aux_test_vint(u64::MAX);
        // Values around each power of 128 sit on an encoding-length boundary.
        for i in 1..9 {
            let power_of_128 = 1u64 << (7 * i);
            aux_test_vint(power_of_128 - 1u64);
            aux_test_vint(power_of_128);
            aux_test_vint(power_of_128 + 1u64);
        }
        aux_test_vint(10);
    }

    /// Checks that `serialize_vint_u32` produces the same bytes as `VInt::serialize_into`
    /// for `val`.
    fn aux_test_serialize_vint_u32(val: u32) {
        let mut buffer = [0u8; 10];
        let mut buffer2 = [0u8; 8];
        let len_vint = VInt(val as u64).serialize_into(&mut buffer);
        let res2 = serialize_vint_u32(val, &mut buffer2);
        assert_eq!(&buffer[..len_vint], res2, "array wrong for {val}");
    }

    #[test]
    fn test_vint_u32() {
        aux_test_serialize_vint_u32(0);
        aux_test_serialize_vint_u32(1);
        aux_test_serialize_vint_u32(5);
        for i in 1..3 {
            let power_of_128 = 1u32 << (7 * i);
            aux_test_serialize_vint_u32(power_of_128 - 1u32);
            aux_test_serialize_vint_u32(power_of_128);
            aux_test_serialize_vint_u32(power_of_128 + 1u32);
        }
        aux_test_serialize_vint_u32(u32::MAX);
    }
}


================================================
FILE: common/src/writer.rs
================================================
use std::io::{self, BufWriter, Write};

/// Writer adapter that keeps a running total of the bytes accepted by the writer it wraps.
pub struct CountingWriter<W> {
    underlying: W,
    written_bytes: u64,
}

impl<W: Write> CountingWriter<W> {
    /// Wraps `underlying`, with the byte count starting at zero.
    pub fn wrap(underlying: W) -> CountingWriter<W> {
        Self {
            written_bytes: 0u64,
            underlying,
        }
    }

    /// Number of bytes successfully written through this wrapper so far.
    #[inline]
    pub fn written_bytes(&self) -> u64 {
        self.written_bytes
    }

    /// Consumes the wrapper and hands back the wrapped writer.
    /// No flush is performed by this method.
    #[inline]
    pub fn finish(self) -> W {
        let CountingWriter { underlying, .. } = self;
        underlying
    }
}

impl<W: Write> Write for CountingWriter<W> {
    /// Forwards to the wrapped writer and counts only the bytes it reports as written.
    #[inline]
    fn write(&mut self, buf: &[u8]) -> io::Result<usize> {
        self.underlying.write(buf).map(|num_written| {
            self.written_bytes += num_written as u64;
            num_written
        })
    }

    /// Forwards to the wrapped writer; on success the whole of `buf` is counted.
    #[inline]
    fn write_all(&mut self, buf: &[u8]) -> io::Result<()> {
        let num_bytes = buf.len() as u64;
        self.underlying.write_all(buf).map(|()| {
            self.written_bytes += num_bytes;
        })
    }

    /// Flushes the wrapped writer; the byte count is unaffected.
    #[inline]
    fn flush(&mut self) -> io::Result<()> {
        self.underlying.flush()
    }
}

/// Terminating a `CountingWriter` terminates the writer it wraps.
impl<W: TerminatingWrite> TerminatingWrite for CountingWriter<W> {
    #[inline]
    fn terminate_ref(&mut self, token: AntiCallToken) -> io::Result<()> {
        self.underlying.terminate_ref(token)
    }
}

/// Token used to prevent code outside of this module from calling
/// [`terminate_ref`](TerminatingWrite::terminate_ref) directly.
///
/// The type itself is public, but its only field is private, so a value can only be
/// built from within this module.
pub struct AntiCallToken(());

/// Trait used to indicate that no more writes will be done on a writer.
///
/// Thread-safety is enforced at the call sites that require it.
pub trait TerminatingWrite: Write {
    /// Indicates that the writer will no longer be used. Consumes the writer and calls
    /// `terminate_ref` with a freshly built `AntiCallToken`.
    fn terminate(mut self) -> io::Result<()>
    where Self: Sized {
        self.terminate_ref(AntiCallToken(()))
    }

    /// You should implement this function to define custom behavior.
    /// This function should flush any buffer it may hold.
    fn terminate_ref(&mut self, _: AntiCallToken) -> io::Result<()>;
}

/// A boxed writer terminates by forwarding the call to the writer inside the box.
impl<W: TerminatingWrite + ?Sized> TerminatingWrite for Box<W> {
    fn terminate_ref(&mut self, token: AntiCallToken) -> io::Result<()> {
        self.as_mut().terminate_ref(token)
    }
}

/// A `BufWriter` terminates by flushing its buffer, then terminating the inner writer.
impl<W: TerminatingWrite> TerminatingWrite for BufWriter<W> {
    fn terminate_ref(&mut self, a: AntiCallToken) -> io::Result<()> {
        // Flush first so the inner writer has received every byte before it terminates.
        self.flush()?;
        self.get_mut().terminate_ref(a)
    }
}

/// Terminating an in-memory `Vec<u8>` target only calls `flush`.
impl TerminatingWrite for &mut Vec<u8> {
    fn terminate_ref(&mut self, _a: AntiCallToken) -> io::Result<()> {
        self.flush()
    }
}

#[cfg(test)]
mod test {

    use std::io::Write;

    use super::CountingWriter;

    /// Writes 10 bytes through a `CountingWriter` wrapping a `Vec<u8>` and checks that
    /// both the reported count and the recovered buffer have length 10.
    #[test]
    fn test_counting_writer() {
        let buffer: Vec<u8> = vec![];
        let mut counting_writer = CountingWriter::wrap(buffer);
        let bytes = (0u8..10u8).collect::<Vec<u8>>();
        counting_writer.write_all(&bytes).unwrap();
        let len = counting_writer.written_bytes();
        let buffer_restituted: Vec<u8> = counting_writer.finish();
        assert_eq!(len, 10u64);
        assert_eq!(buffer_restituted.len(), 10);
    }
}


================================================
FILE: doc/.gitignore
================================================
book


================================================
FILE: doc/book.toml
================================================
[book]
authors = ["Paul Masurel"]
multilingual = false
src = "src"
title = "Tantivy, the user guide"


================================================
FILE: doc/src/SUMMARY.md
================================================
# Summary

[Avant Propos](./avant-propos.md)

- [Segments](./basis.md)
- [Defining your schema](./schema.md)
- [Facetting](./facetting.md)
- [Index Sorting](./index_sorting.md)
- [Innerworkings](./innerworkings.md)
  - [Inverted index](./inverted_index.md)
- [Best practise](./inverted_index.md)

[Frequently Asked Questions](./faq.md)
[Examples](./examples.md)


================================================
FILE: doc/src/avant-propos.md
================================================
# Foreword, what is the scope of tantivy?

> Tantivy is a **search** engine **library** for Rust.

If you are familiar with Lucene, it's an excellent approximation to consider tantivy as Lucene for Rust. Tantivy is heavily inspired by Lucene's design and
they both have the same scope and targeted use cases.

If you are not familiar with Lucene, let's break down our little tagline.

- **Search** here means full-text search : fundamentally, tantivy is here to help you
identify efficiently what are the documents matching a given query in your corpus.
But modern search UI are so much more : text processing, facetting, autocomplete, fuzzy search, good
relevancy, collapsing, highlighting, spatial search.

  While some of these features are not available in tantivy yet, all of these are relevant
  feature requests. Tantivy's objective is to offer a solid toolbox to create the best search
  experience. But keep in mind this is just a toolbox.
  Which brings us to the second keyword...

- **Library** means that you will have to write code. Tantivy is not an *all-in-one* server solution like Elasticsearch for instance.

  Sometimes a functionality will not be available in tantivy because it is too
  specific to your use case. By design, tantivy should make it possible to extend
  the available set of features using the existing rock-solid datastructures.

  Most frequently this will mean writing your own `Collector`, your own `Scorer` or your own
  `TokenFilter`... Some of your requirements may also be related to
  something closer to architecture or operations. For instance, you may
  want to build a large corpus on Hadoop, fine-tune the merge policy to keep your
  index sharded in a time-wise fashion, or you may want to convert an existing
  index from a different format.

  Tantivy exposes a lot of low level API to do all of these things.
  

================================================
FILE: doc/src/basis.md
================================================
# Anatomy of an index

## Straight from disk

Tantivy accesses its data using an abstracting trait called `Directory`.
In theory, one can come and override the data access logic. In practise, the
trait somewhat assumes that your data can be mapped to memory, and tantivy
seems deeply married to using `mmap` for its io [^1], and the only persisting
directory shipped with tantivy is the `MmapDirectory`.

While this design has some downsides, this greatly simplifies the source code of
tantivy. Caching is also entirely delegated to the OS.

Tantivy works entirely (or almost) by directly reading the datastructures as they are laid on disk. As a result, the act of opening an index does not involve loading different datastructures from the disk into random access memory : starting a process, opening an index, and performing your first query can typically be done in a matter of milliseconds.

This is an interesting property for a command line search engine, or for some multi-tenant log search engine : spawning a new process for each new query can be a perfectly sensible solution in some use case.

In later chapters, we will discuss tantivy's inverted index data layout.
One key take away is that to achieve great performance, search indexes are extremely compact.
Of course this is crucial to reduce IO, and ensure that as much of our index can sit in RAM.

Also, whenever possible its data is accessed sequentially. Of course, this is an amazing property when tantivy needs to access the data from your spinning hard disk, but this is also
critical for performance, if your data is read from an `SSD` or even already in your pagecache.

## Segments, and the log method

That kind of compact layout comes at one cost: it prevents our datastructures from being dynamic.
In fact, the `Directory` trait does not even allow you to modify part of a file.

To allow the addition / deletion of documents, and create the illusion that
your index is dynamic (i.e.: adding and deleting documents), tantivy uses a common database trick sometimes referred to as the *log method*.

Let's forget about deletes for a moment.

As you add documents, these documents are processed and stored in a dedicated datastructure, in a `RAM` buffer. This datastructure is not ready for search, but it is useful to receive your data and rearrange it very rapidly.

As you add documents, this buffer will reach its capacity and tantivy will transparently stop adding documents to it and start converting this datastructure to its final read-only format on disk. Once written, a brand new empty buffer is available to resume adding documents.

The resulting chunk of index obtained after this serialization is called a `Segment`.

> A segment is a self-contained atomic piece of index. It is identified with a UUID, and all of its files are identified using the naming scheme : `<UUID>.*`.

Which brings us to the nature of a tantivy `Index`.

> A tantivy `Index` is a collection of `Segments`.

Physically, this really just means an index is a bunch of segment files in a given `Directory`,
linked together by a `meta.json` file. This transparency can become extremely handy
to get tantivy to fit your use case:

*Example 1* You could for instance use hadoop to build a very large search index in a timely manner, copy all of the resulting segment files in the same directory and edit the `meta.json` to get a functional index.[^2]

*Example 2* You could also disable your merge policy and enforce daily segments. Removing data after one week can then be done very efficiently by just editing the `meta.json` and deleting the files associated with segment `D-7`.

## Merging

As you index more and more data, your index will accumulate more and more segments.
Having a lot of small segments is not really optimal. There is a bit of redundancy in having
all these term dictionaries. Also when searching, we will need to do term lookups as many times as we have segments.  It can hurt search performance a bit.

That's where merging or compacting comes into place. Tantivy will continuously consider merge
opportunities and start merging segments in the background.

## Indexing throughput, number of indexing threads

[^1]: This may eventually change.

[^2]: Be careful however. By default these files will not be considered as *managed* by tantivy. This means they will never be garbage collected by tantivy, regardless of whether they become obsolete or not.


================================================
FILE: doc/src/best_practise.md.rs
================================================


================================================
FILE: doc/src/examples.md
================================================
# Examples

- [Basic search](/examples/basic_search.html)


================================================
FILE: doc/src/facetting.md
================================================
# Facetting

wewew

## weeewe


================================================
FILE: doc/src/faq.md
================================================


================================================
FILE: doc/src/index_sorting.md
================================================

- [Index Sorting](#index-sorting)
  - [Why Sorting](#why-sorting)
    - [Compression](#compression)
    - [Top-N Optimization](#top-n-optimization)
    - [Pruning](#pruning)
    - [Other](#other)
  - [Usage](#usage)

# Index Sorting has been removed!
More infos here:

https://github.com/quickwit-oss/tantivy/issues/2352

# Index Sorting

Tantivy allows you to sort the index according to a property.

## Why Sorting

Presorting an index has several advantages:

### Compression

When data is sorted it is easier to compress the data. E.g. the numbers sequence [5, 2, 3, 1, 4] would be sorted to [1, 2, 3, 4, 5].
If we apply delta encoding, the unsorted list becomes [5, -3, 1, -2, 3], whereas the sorted list becomes [1, 1, 1, 1, 1].
Compression ratio is mainly affected on the fast field of the sorted property, every thing else is likely unaffected.

### Top-N Optimization

When data is presorted by a field and search queries request sorting by the same field, we can leverage the natural order of the documents.
E.g. if the data is sorted by timestamp and we want the top n newest docs containing a term, we can simply leverage the order of the docids.

Note: tantivy 0.16 does not do this optimization yet.

### Pruning

Let's say we want all documents and want to apply the filter `>= 2010-08-11`. When the data is sorted, we could make a lookup in the fast field to find the docid range and use this as the filter.

Note: tantivy 0.16 does not do this optimization yet.

### Other?

In principle there are many algorithms possible that exploit the monotonically increasing nature. (aggregations maybe?)

## Usage

The index sorting can be configured setting [`sort_by_field`](https://github.com/quickwit-oss/tantivy/blob/000d76b11a139a84b16b9b95060a1c93e8b9851c/src/core/index_meta.rs#L238) on `IndexSettings` and passing it to a `IndexBuilder`. As of tantivy 0.16 only fast fields are allowed to be used.

```rust
let settings = IndexSettings {
    sort_by_field: Some(IndexSortByField {
        field: "intval".to_string(),
        order: Order::Desc,
    }),
    ..Default::default()
};
let mut index_builder = Index::builder().schema(schema);
index_builder = index_builder.settings(settings);
let index = index_builder.create_in_ram().unwrap();
```

## Implementation details

Sorting an index is applied in the serialization step. In general there are two serialization steps: [Finishing a single segment](https://github.com/quickwit-oss/tantivy/blob/000d76b11a139a84b16b9b95060a1c93e8b9851c/src/indexer/segment_writer.rs#L338) and [merging multiple segments](https://github.com/quickwit-oss/tantivy/blob/000d76b11a139a84b16b9b95060a1c93e8b9851c/src/indexer/merger.rs#L1073).

In both cases we generate a docid mapping reflecting the sort. This mapping is used when serializing the different components (doc store, fastfields, posting list, normfield, facets).


================================================
FILE: doc/src/innerworkings.md
================================================
# Innerworkings


================================================
FILE: doc/src/inverted_index.md
================================================
# Inverted index


================================================
FILE: doc/src/json.md
================================================
# Json

As of tantivy 0.17, tantivy supports a json object type.
This type can be used to allow for a schema-less search index.

When indexing a json object, we "flatten" the JSON. This operation emits terms that represent a triplet `(json_path, value_type, value)`

For instance,  if user is a json field, the following document:

```json
{
    "user": {
        "name": "Paul Masurel",
        "address": {
            "city": "Tokyo",
            "country": "Japan"
        },
        "created_at": "2018-11-12T23:20:50.52Z"
    }
}
```

emits the following tokens:

- ("name", Text, "Paul")
- ("name", Text, "Masurel")
- ("address.city", Text, "Tokyo")
- ("address.country", Text, "Japan")
- ("created_at", Date, 15420648505)

## Bytes-encoding and lexicographical sort

Like any other terms, these triplets are encoded into a binary format as follows.

- `json_path`: the json path is a sequence of "segments". In the example above, `address.city`
is just a debug representation of the json path `["address", "city"]`.
Its representation is done by separating segments by a unicode char `\x01`, and ending the path by `\x00`.
- `value type`: One byte represents the `Value` type.
- `value`: The value representation is just the regular Value representation.

This representation is designed to align the natural sort of Terms with the lexicographical sort
of their binary representation (tantivy's dictionary (whether fst or sstable) is sorted and does prefix encoding).

In the example above, the terms will be sorted as

- ("address.city", Text, "Tokyo")
- ("address.country", Text, "Japan")
- ("name", Text, "Masurel")
- ("name", Text, "Paul")
- ("created_at", Date, 15420648505)

As seen in "pitfalls", we may end up having to search for a value for a same path in several different fields. Putting the field code after the path maximizes compression opportunities but also increases the chances for the two terms to end up in the actual same term dictionary block.

## Pitfalls, limitation and corner cases

Json gives very little information about the type of the literals it stores.
All numeric types end up mapped as a "Number" and there are no types for dates.

At indexing, tantivy will try to interpret number and strings as different type with a
priority order.

Numbers will be interpreted as u64, i64 and f64 in that order.
Strings will be interpreted as rfc3339 dates or simple strings.

The first working type is picked and is the only term that is emitted for indexing.
Note this interpretation happens on a per-document basis, and there is no effort to try to sniff
a consistent field type at the scale of a segment.

On the query parser side on the other hand, we may end up emitting more than one type.
For instance, we do not even know if the type is a number or string based.

So the query

```rust
my_path.my_segment:233
```

Will be interpreted as

```rust
(my_path.my_segment, String, 233) or (my_path.my_segment, u64, 233)
```

Likewise, we need to emit two tokens if the query contains an rfc3339 date.
Indeed the date could have been actually a single token inside the text of a document at ingestion time. Generally speaking, we will always at least emit a string token in query parsing, and sometimes more.

If one more json field is defined, things get even more complicated.

## Default json field

If the schema contains a text field called "text" and a json field that is set as a default field:
`text:hello` could be reasonably interpreted as targeting the text field or as targeting the json field called `json_dynamic` with the json_path "text".

If there is such an ambiguity, we decide to only search in the "text" field: `text:hello`.

In other words, the parser will not search in default json fields if there is a schema hit.
This is a product decision.

The user can still target the JSON field by specifying its name explicitly:
`json_dynamic.text:hello`.

## Range queries are not supported

Json fields do not support range queries.

## Arrays do not work like nested object

If json object contains an array, a search query might return more documents
than what might be expected.

Let's take an example.

```json
{
    "cart_id": 3234234 ,
    "cart": [
        {"product_type": "sneakers", "attributes": {"color": "white"} },
        {"product_type": "t-shirt", "attributes": {"color": "red"}},
    ]
}
```

Despite the array structure, a document in tantivy is a bag of terms.
The query:

```rust
cart.product_type:sneakers AND cart.attributes.color:red
```

Actually matches the document above.


================================================
FILE: doc/src/schema.md
================================================
# Defining your schema


================================================
FILE: examples/aggregation.rs
================================================
// # Aggregation example
//
// This example shows how you can use built-in aggregations.
// We will use nested aggregations with buckets and metrics:
// - Range buckets and compute the average in each bucket.
// - Term aggregation and compute the min price in each bucket
// ---

use serde_json::{Deserializer, Value};
use tantivy::aggregation::agg_req::Aggregations;
use tantivy::aggregation::agg_result::AggregationResults;
use tantivy::aggregation::AggregationCollector;
use tantivy::query::AllQuery;
use tantivy::schema::{self, IndexRecordOption, Schema, TextFieldIndexing, FAST};
use tantivy::{Index, IndexWriter, TantivyDocument};

fn main() -> tantivy::Result<()> {
    // # Create Schema
    //
    // Let's create a schema for a footwear shop. The fields registered below are
    // category, stock and price; all three are fast fields, as that's the requirement
    // for aggregation queries.
    //
    // NOTE(review): the sample documents below also carry a `name` key (and one of them an
    // `offer` key), but no such fields are added to this schema.

    let mut schema_builder = Schema::builder();
    // In preparation of the `TermsAggregation`, the category field is configured with:
    // - `set_fast`
    // - `raw` tokenizer
    //
    // The tokenizer is set to "raw", because the fast field uses the same dictionary as the
    // inverted index. (This behaviour will change in tantivy 0.20, where the fast field will
    // always be raw tokenized independent from the regular tokenizing)
    //
    let text_fieldtype = schema::TextOptions::default()
        .set_indexing_options(
            TextFieldIndexing::default()
                .set_index_option(IndexRecordOption::WithFreqs)
                .set_tokenizer("raw"),
        )
        .set_fast(None)
        .set_stored();
    schema_builder.add_text_field("category", text_fieldtype);
    schema_builder.add_f64_field("stock", FAST);
    schema_builder.add_f64_field("price", FAST);

    let schema = schema_builder.build();

    // # Indexing documents
    //
    // Let's index a bunch of documents for this example.
    let index = Index::create_in_ram(schema.clone());

    // The sample data is a sequence of concatenated JSON objects (not a JSON array);
    // it is consumed below through a streaming deserializer, one object at a time.
    let data = r#"{
        "name": "Almond Toe Court Shoes, Patent Black",
        "category": "Womens Footwear",
        "price": 99.00,
        "stock": 5
    }
    {
        "name": "Suede Shoes, Blue",
        "category": "Womens Footwear",
        "price": 42.00,
        "stock": 4
    }
    {
        "name": "Leather Driver Saddle Loafers, Tan",
        "category": "Mens Footwear",
        "price": 34.00,
        "stock": 12
    }
    {
        "name": "Flip Flops, Red",
        "category": "Mens Footwear",
        "price": 19.00,
        "stock": 6
    }
    {
        "name": "Flip Flops, Blue",
        "category": "Mens Footwear",
        "price": 19.00,
        "stock": 0
    }
    {
        "name": "Gold Button Cardigan, Black",
        "category": "Womens Casualwear",
        "price": 167.00,
        "stock": 6
    }
    {
        "name": "Cotton Shorts, Medium Red",
        "category": "Womens Casualwear",
        "price": 30.00,
        "stock": 5
    }
    {
        "name": "Fine Stripe Short Sleeve￼Shirt, Grey",
        "category": "Mens Casualwear",
        "price": 49.99,
        "stock": 9
    }
    {
        "name": "Fine Stripe Short Sleeve￼Shirt, Green",
        "category": "Mens Casualwear",
        "price": 49.99,
        "offer": 39.99,
        "stock": 9
    }
    {
        "name": "Sharkskin Waistcoat, Charcoal",
        "category": "Mens Formalwear",
        "price": 75.00,
        "stock": 2
    }
    {
        "name": "Lightweight Patch Pocket￼Blazer, Deer",
        "category": "Mens Formalwear",
        "price": 175.50,
        "stock": 1
    }
    {
        "name": "Bird Print Dress, Black",
        "category": "Womens Formalwear",
        "price": 270.00,
        "stock": 10
    }
    {
        "name": "Mid Twist Cut-Out Dress, Pink",
        "category": "Womens Formalwear",
        "price": 540.00,
        "stock": 5
    }"#;

    let stream = Deserializer::from_str(data).into_iter::<Value>();

    let mut index_writer: IndexWriter = index.writer(50_000_000)?;
    let mut num_indexed = 0;
    for value in stream {
        // Each streamed value is re-serialized to a string so that it can be parsed
        // against the schema.
        let doc = TantivyDocument::parse_json(&schema, &serde_json::to_string(&value.unwrap())?)?;
        index_writer.add_document(doc)?;
        num_indexed += 1;
        if num_indexed > 4 {
            // Writing the first segment
            //
            // NOTE(review): this condition holds for every document from the fifth one on, so
            // `commit()` is called after each of those documents, not just once. If exactly two
            // segments are intended, this presumably should be an equality check — confirm.
            index_writer.commit()?;
        }
    }

    // Writing the second segment
    index_writer.commit()?;

    // The intent is to have more than one segment at this point (see the note on the commit
    // condition above). The `AggregationCollector` will run the aggregation on each
    // segment and then merge the results into an `IntermediateAggregationResult`.

    let reader = index.reader()?;
    let searcher = reader.searcher();
    // ---
    // # Aggregation Query
    //
    //
    // We can construct the query by building the request structure or by deserializing from JSON.
    // The JSON API is more stable and therefore recommended.
    //
    // ## Request 1

    let agg_req_str = r#"
    {
      "group_by_stock": {
        "aggs": {
          "average_price": { "avg": { "field": "price" } }
        },
        "range": {
          "field": "stock",
          "ranges": [
            { "key": "few", "to": 1.0 },
            { "key": "some", "from": 1.0, "to": 10.0 },
            { "key": "many", "from": 10.0 }
          ]
        }
      }
    } "#;

    // In this Aggregation we want to get the average price for different groups, depending on how
    // many items are in stock. We define custom ranges `few`, `some`, `many` via the
    // range aggregation.
    // For every bucket we want the average price, so we create a nested metric aggregation on the
    // range bucket aggregation. Only buckets support nested aggregations.
    // ### Request JSON API
    //

    let agg_req: Aggregations = serde_json::from_str(agg_req_str)?;
    let collector = AggregationCollector::from_aggs(agg_req, Default::default());

    // We use the `AllQuery` which will pass all documents to the AggregationCollector.
    let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();
    let res: Value = serde_json::to_value(agg_res)?;

    // ### Aggregation Result
    //
    // The resulting structure serializes to the same JSON format as Elasticsearch.
    //
    let expected_res = r#"
    {
        "group_by_stock":{
            "buckets":[
                {"average_price":{"value":19.0},"doc_count":1,"key":"few","to":1.0},
                {"average_price":{"value":124.748},"doc_count":10,"from":1.0,"key":"some","to":10.0},
                {"average_price":{"value":152.0},"doc_count":2,"from":10.0,"key":"many"}
            ]
        }
    }
    "#;
    let expected_json: Value = serde_json::from_str(expected_res)?;
    assert_eq!(expected_json, res);

    // ### Request 2
    //
    // Now we are interested in the minimum price per category, so we create a bucket per
    // category via `TermsAggregation`. We are interested in the highest minimum prices, and set the
    // order of the buckets `"order": { "min_price": "desc" }` to be sorted by the metric of
    // the sub aggregation. (awesome)
    //
    let agg_req_str = r#"
    {
      "min_price_per_category": {
        "aggs": {
          "min_price": { "min": { "field": "price" } }
        },
        "terms": {
          "field": "category",
          "min_doc_count": 1,
          "order": { "min_price": "desc" }
        }
      }
    } "#;

    let agg_req: Aggregations = serde_json::from_str(agg_req_str)?;

    let collector = AggregationCollector::from_aggs(agg_req, Default::default());

    let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();
    let res: Value = serde_json::to_value(agg_res)?;

    // Minimum price per category, sorted by minimum price descending
    //
    // As you can see, the starting prices for `Formalwear` are higher than `Casualwear`.
    //
    let expected_res = r#"
    {
      "min_price_per_category": {
        "buckets": [
          { "doc_count": 2, "key": "Womens Formalwear", "min_price": { "value": 270.0 } },
          { "doc_count": 2, "key": "Mens Formalwear", "min_price": { "value": 75.0 } },
          { "doc_count": 2, "key": "Mens Casualwear", "min_price": { "value": 49.99 } },
          { "doc_count": 2, "key": "Womens Footwear", "min_price": { "value": 42.0 } },
          { "doc_count": 2, "key": "Womens Casualwear", "min_price": { "value": 30.0 } },
          { "doc_count": 3, "key": "Mens Footwear", "min_price": { "value": 19.0 } }
        ],
        "sum_other_doc_count": 0
      }
    }
    "#;
    let expected_json: Value = serde_json::from_str(expected_res)?;

    assert_eq!(expected_json, res);

    Ok(())
}


================================================
FILE: examples/basic_search.rs
================================================
// # Basic Example
//
// This example covers the basic functionalities of
// tantivy.
//
// We will :
// - define our schema
// - create an index in a directory
// - index a few documents into our index
// - search for the best document matching a basic query
// - retrieve the best document's original content.

// ---
// Importing tantivy...
use tantivy::collector::TopDocs;
use tantivy::query::QueryParser;
use tantivy::schema::*;
use tantivy::{doc, Index, IndexWriter, ReloadPolicy};
use tempfile::TempDir;

fn main() -> tantivy::Result<()> {
    // Let's create a temporary directory for the
    // sake of this example
    let index_path = TempDir::new()?;

    // # Defining the schema
    //
    // The Tantivy index requires a very strict schema.
    // The schema declares which fields are in the index,
    // and for each field, its type and "the way it should
    // be indexed".

    // First we need to define a schema ...
    let mut schema_builder = Schema::builder();

    // Our first field is title.
    // We want full-text search for it, and we also want
    // to be able to retrieve the document after the search.
    //
    // `TEXT | STORED` is some syntactic sugar to describe
    // that.
    //
    // `TEXT` means the field should be tokenized and indexed,
    // along with its term frequency and term positions.
    //
    // `STORED` means that the field will also be saved
    // in a compressed, row-oriented key-value store.
    // This store is useful for reconstructing the
    // documents that were selected during the search phase.
    schema_builder.add_text_field("title", TEXT | STORED);

    // Our second field is body.
    // We want full-text search for it, but we do not
    // need to be able to retrieve it
    // for our application.
    //
    // We can make our index lighter by omitting the `STORED` flag.
    schema_builder.add_text_field("body", TEXT);

    let schema = schema_builder.build();

    // # Indexing documents
    //
    // Let's create a brand new index.
    //
    // This will actually just save a meta.json
    // with our schema in the directory.
    let index = Index::create_in_dir(&index_path, schema.clone())?;

    // To insert a document we will need an index writer.
    // There must be only one writer at a time.
    // This single `IndexWriter` is already
    // multithreaded.
    //
    // Here we give tantivy a budget of `50MB`.
    // Using a bigger memory_arena for the indexer may increase
    // throughput, but 50 MB is already plenty.
    let mut index_writer: IndexWriter = index.writer(50_000_000)?;

    // Let's index our documents!
    // We first need a handle on the title and the body field.

    // ### Adding documents
    //
    // We can create a document manually, by setting the fields
    // one by one in a Document object.
    let title = schema.get_field("title").unwrap();
    let body = schema.get_field("body").unwrap();

    let mut old_man_doc = TantivyDocument::default();
    old_man_doc.add_text(title, "The Old Man and the Sea");
    old_man_doc.add_text(
        body,
        "He was an old man who fished alone in a skiff in the Gulf Stream and he had gone \
         eighty-four days now without taking a fish.",
    );

    // ... and add it to the `IndexWriter`.
    index_writer.add_document(old_man_doc)?;

    // For convenience, tantivy also comes with a macro to
    // reduce the boilerplate above.
    index_writer.add_document(doc!(
    title => "Of Mice and Men",
    body => "A few miles south of Soledad, the Salinas River drops in close to the hillside \
            bank and runs deep and green. The water is warm too, for it has slipped twinkling \
            over the yellow sands in the sunlight before reaching the narrow pool. On one \
            side of the river the golden foothill slopes curve up to the strong and rocky \
            Gabilan Mountains, but on the valley side the water is lined with trees—willows \
            fresh and green with every spring, carrying in their lower leaf junctures the \
            debris of the winter’s flooding; and sycamores with mottled, white, recumbent \
            limbs and branches that arch over the pool"
    ))?;

    // A multivalued field just needs to be repeated.
    index_writer.add_document(doc!(
    title => "Frankenstein",
    title => "The Modern Prometheus",
    body => "You will rejoice to hear that no disaster has accompanied the commencement of an \
             enterprise which you have regarded with such evil forebodings.  I arrived here \
             yesterday, and my first task is to assure my dear sister of my welfare and \
             increasing confidence in the success of my undertaking."
    ))?;

    // This is an example, so we will only index 3 documents
    // here. You can check out tantivy's tutorial to index
    // the English wikipedia. Tantivy's indexing is rather fast.
    // Indexing 5 million articles of the English wikipedia takes
    // around 3 minutes on my computer!

    // ### Committing
    //
    // At this point our documents are not searchable.
    //
    //
    // We need to call `.commit()` explicitly to force the
    // `index_writer` to finish processing the documents in the queue,
    // flush the current index to the disk, and advertise
    // the existence of new documents.
    //
    // This call is blocking.
    index_writer.commit()?;

    // If `.commit()` returns correctly, then all of the
    // documents that have been added are guaranteed to be
    // persistently indexed.
    //
    // In the scenario of a crash or a power failure,
    // tantivy behaves as if it has rolled back to its last
    // commit.

    // # Searching
    //
    // ### Searcher
    //
    // A reader is required first in order to search an index.
    // It acts as a `Searcher` pool that reloads itself,
    // depending on a `ReloadPolicy`.
    //
    // For a search server you will typically create one reader for the entire lifetime of your
    // program, and acquire a new searcher for every single request.
    //
    // In the code below, we rely on the `OnCommitWithDelay` policy: the reader
    // will reload the index automatically after each commit
    // (presumably with some delay, as the variant name suggests — see the `ReloadPolicy` docs).
    let reader = index
        .reader_builder()
        .reload_policy(ReloadPolicy::OnCommitWithDelay)
        .try_into()?;

    // We now need to acquire a searcher.
    //
    // A searcher points to a snapshotted, immutable version of the index.
    //
    // Some search experience might require more than
    // one query. Using the same searcher ensures that all of these queries will run on the
    // same version of the index.
    //
    // Acquiring a `searcher` is very cheap.
    //
    // You should acquire a searcher every time you start processing a request
    // and release it right after your query is finished.
    let searcher = reader.searcher();

    // ### Query

    // The query parser can interpret human queries.
    // Here, if the user does not specify which
    // field they want to search, tantivy will search
    // in both title and body.
    let query_parser = QueryParser::for_index(&index, vec![title, body]);

    // `QueryParser` may fail if the query is not in the right
    // format. For user facing applications, this can be a problem.
    // A ticket has been opened regarding this problem.
    let query = query_parser.parse_query("sea whale")?;

    // A query defines a set of documents, as
    // well as the way they should be scored.
    //
    // A query created by the query parser is scored according
    // to a metric called Tf-Idf, and will consider
    // any document matching at least one of our terms.

    // ### Collectors
    //
    // We are not interested in all of the documents but
    // only in the top 10. Keeping track of our top 10 best documents
    // is the role of the `TopDocs` collector.

    // We can now perform our query.
    let top_docs = searcher.search(&query, &TopDocs::with_limit(10).order_by_score())?;

    // The actual documents still need to be
    // retrieved from Tantivy's store.
    //
    // Since the body field was not configured as stored,
    // the document returned will only contain
    // a title.
    for (_score, doc_address) in top_docs {
        let retrieved_doc: TantivyDocument = searcher.doc(doc_address)?;
        println!("{}", retrieved_doc.to_json(&schema));
    }

    // We can also get an explanation to understand
    // how a found document got its score.
    let query = query_parser.parse_query("title:sea^20 body:whale^70")?;

    // Only the best hit is needed here; the `unwrap()` panics if the query matches nothing.
    let (_score, doc_address) = searcher
        .search(&query, &TopDocs::with_limit(1).order_by_score())?
        .into_iter()
        .next()
        .unwrap();

    let explanation = query.explain(&searcher, doc_address)?;

    println!("{}", explanation.to_pretty_json());

    Ok(())
}


================================================
FILE: examples/custom_collector.rs
================================================
// # Custom collector example
//
// This example shows how you can implement your own
// collector. As an example, we will compute a collector
// that computes the standard deviation of a given fast field.
//
// Of course, you can have a look at the tantivy's built-in collectors
// such as the `CountCollector` for more examples.

use columnar::Column;
// ---
// Importing tantivy...
use tantivy::collector::{Collector, SegmentCollector};
use tantivy::index::SegmentReader;
use tantivy::query::QueryParser;
use tantivy::schema::{Schema, FAST, INDEXED, TEXT};
use tantivy::{doc, Index, IndexWriter, Score};

/// Running aggregates from which count, mean and standard deviation are derived.
///
/// Only the number of values, their sum and the sum of their squares are kept,
/// so two `Stats` can be combined by adding their fields pairwise.
#[derive(Default)]
struct Stats {
    /// Number of values accumulated so far.
    count: usize,
    /// Sum of the accumulated values.
    sum: f64,
    /// Sum of the squares of the accumulated values.
    squared_sum: f64,
}

impl Stats {
    /// Returns the number of accumulated values.
    pub fn count(&self) -> usize {
        self.count
    }

    /// Returns the arithmetic mean of the accumulated values.
    ///
    /// The result is not a meaningful number when `count` is zero
    /// (the division by zero yields NaN or an infinity).
    pub fn mean(&self) -> f64 {
        self.sum / (self.count as f64)
    }

    /// Returns the mean of the squared values.
    fn square_mean(&self) -> f64 {
        self.squared_sum / (self.count as f64)
    }

    /// Returns the (population) standard deviation, computed as
    /// `sqrt(E[x^2] - E[x]^2)`.
    ///
    /// Floating-point rounding can make `E[x^2] - E[x]^2` come out slightly
    /// negative when the values are (almost) identical; taking the square root
    /// of that would yield NaN, so a negative variance is treated as zero.
    /// An empty accumulator still yields NaN, as `mean()` does.
    pub fn standard_deviation(&self) -> f64 {
        let mean = self.mean();
        let variance = self.square_mean() - mean * mean;
        // `NaN < 0.0` is false, so a NaN variance is deliberately propagated.
        if variance < 0.0 {
            0.0
        } else {
            variance.sqrt()
        }
    }

    /// Returns `Some(self)` if at least one value was accumulated, `None` otherwise.
    fn non_zero_count(self) -> Option<Stats> {
        if self.count == 0 {
            None
        } else {
            Some(self)
        }
    }
}

/// Collector parameterised by the name of the field it works on.
struct StatsCollector {
    /// Name of the targeted field.
    field: String,
}

impl StatsCollector {
    /// Creates a collector targeting the field called `field`.
    fn with_field(field: String) -> StatsCollector {
        let collector = Self { field };
        collector
    }
}

impl Collector for StatsCollector {
    // The overall result: the merged statistics, or `None` when nothing was collected.
    type Fruit = Option<Stats>;

    // Per-segment worker type.
    type Child = StatsSegmentCollector;

    // Opens the `u64` fast field column named `self.field` on the given segment and
    // pairs it with an empty accumulator.
    fn for_segment(
        &self,
        _segment_local_id: u32,
        segment_reader: &SegmentReader,
    ) -> tantivy::Result<StatsSegmentCollector> {
        let column = segment_reader.fast_fields().u64(&self.field)?;
        let segment_collector = StatsSegmentCollector {
            fast_field_reader: column,
            stats: Stats::default(),
        };
        Ok(segment_collector)
    }

    fn requires_scoring(&self) -> bool {
        // Scores are never looked at by this collector.
        false
    }

    // Adds up the per-segment partial results (segments without any value are skipped)
    // and reports `None` if the total count is still zero.
    fn merge_fruits(&self, segment_stats: Vec<Option<Stats>>) -> tantivy::Result<Option<Stats>> {
        let combined = segment_stats
            .into_iter()
            .flatten()
            .fold(Stats::default(), |mut acc, partial| {
                acc.count += partial.count;
                acc.sum += partial.sum;
                acc.squared_sum += partial.squared_sum;
                acc
            });
        Ok(combined.non_zero_count())
    }
}

/// Per-segment worker: reads values from a column and accumulates them into `stats`.
struct StatsSegmentCollector {
    fast_field_reader: Column,
    stats: Stats,
}

impl SegmentCollector for StatsSegmentCollector {
    type Fruit = Option<Stats>;

    // Folds every value the column holds for `doc` into the running statistics.
    fn collect(&mut self, doc: u32, _score: Score) {
        // Since we know the field is single-valued, `first_or_default_col` on the column
        // could be used instead to fetch one value per document.
        let stats = &mut self.stats;
        for raw in self.fast_field_reader.values_for_doc(doc) {
            let sample = raw as f64;
            stats.count += 1;
            stats.sum += sample;
            stats.squared_sum += sample * sample;
        }
    }

    // Hands back the accumulated statistics, or `None` if no value was seen.
    fn harvest(self) -> <Self as SegmentCollector>::Fruit {
        let StatsSegmentCollector { stats, .. } = self;
        stats.non_zero_count()
    }
}

fn main() -> tantivy::Result<()> {
    // # Defining the schema
    //
    // The Tantivy index requires a very strict schema.
    // The schema declares which fields are in the index,
    // and for each field, its type and "the way it should
    // be indexed".

    // First we need to define a schema ...
    let mut schema_builder = Schema::builder();

    // We'll assume a fictional index containing
    // products, and with a name, a description, and a price.
    //
    // The price is declared `FAST` because the `StatsCollector` reads it
    // through the segment's fast fields.
    let product_name = schema_builder.add_text_field("name", TEXT);
    let product_description = schema_builder.add_text_field("description", TEXT);
    let price = schema_builder.add_u64_field("price", INDEXED | FAST);
    let schema = schema_builder.build();

    // # Indexing documents
    //
    // Let's index a bunch of fake documents for the sake of
    // this example.
    let index = Index::create_in_ram(schema);

    let mut index_writer: IndexWriter = index.writer(50_000_000)?;
    index_writer.add_document(doc!(
        product_name => "Super Broom 2000",
        product_description => "While it is ok for short distance travel, this broom \
        was designed quiditch. It will up your game.",
        price => 30_200u64
    ))?;
    index_writer.add_document(doc!(
        product_name => "Turbulobroom",
        product_description => "You might have heard of this broom before : it is the sponsor of the Wales team.\
            You'll enjoy its sharp turns, and rapid acceleration",
        price => 29_240u64
    ))?;
    index_writer.add_document(doc!(
        product_name => "Broomio",
        product_description => "Great value for the price. This broom is a market favorite",
        price => 21_240u64
    ))?;
    index_writer.add_document(doc!(
        product_name => "Whack a Mole",
        product_description => "Prime quality bat.",
        price => 5_200u64
    ))?;
    index_writer.commit()?;

    let reader = index.reader()?;
    let searcher = reader.searcher();
    // Queries without an explicit field target both the name and the description.
    let query_parser = QueryParser::for_index(&index, vec![product_name, product_description]);

    // Here we want to search for `broom` and use `StatsCollector` on the hits.
    // The collector returns `None` when no value was collected, in which case
    // nothing is printed.
    let query = query_parser.parse_query("broom")?;
    if let Some(stats) =
        searcher.search(&query, &StatsCollector::with_field("price".to_string()))?
    {
        println!("count: {}", stats.count());
        println!("mean: {}", stats.mean());
        println!("standard deviation: {}", stats.standard_deviation());
    }

    Ok(())
}


================================================
FILE: examples/custom_tokenizer.rs
================================================
// # Defining a tokenizer pipeline
//
// In this example, we'll see how to define a tokenizer
// by creating a custom `NgramTokenizer`.
use tantivy::collector::TopDocs;
use tantivy::query::QueryParser;
use tantivy::schema::*;
use tantivy::tokenizer::NgramTokenizer;
use tantivy::{doc, Index, IndexWriter};

fn main() -> tantivy::Result<()> {
    // # Defining the schema
    //
    // The Tantivy index requires a very strict schema.
    // The schema declares which fields are in the index,
    // and for each field, its type and "the way it should
    // be indexed".

    // First we need to define a schema ...
    let mut schema_builder = Schema::builder();

    // Our first field is title.
    // In this example we want to use NGram searching.
    // We will set that to 3 characters, so any three
    // consecutive characters in the title should be findable.
    //
    // The field only refers to the tokenizer by name ("ngram3"); the tokenizer
    // itself is registered on the index further below.
    let text_field_indexing = TextFieldIndexing::default()
        .set_tokenizer("ngram3")
        .set_index_option(IndexRecordOption::WithFreqsAndPositions);
    let text_options = TextOptions::default()
        .set_indexing_options(text_field_indexing)
        .set_stored();
    let title = schema_builder.add_text_field("title", text_options);

    // Our second field is body.
    // We want full-text search for it, but we do not
    // need to be able to retrieve it
    // for our application.
    //
    // We can make our index lighter by omitting the `STORED` flag.
    let body = schema_builder.add_text_field("body", TEXT);

    let schema = schema_builder.build();

    // # Indexing documents
    //
    // Let's create a brand new index.
    // To simplify we will work entirely in RAM.
    // This is not what you want in reality, but it is very useful
    // for your unit tests... Or this example.
    let index = Index::create_in_ram(schema.clone());

    // Here we are registering our custom tokenizer under the name used in the schema.
    // This will store tokens of 3 characters each.
    index
        .tokenizers()
        .register("ngram3", NgramTokenizer::new(3, 3, false).unwrap());

    // To insert documents we need an index writer.
    // There must be only one writer at a time.
    // This single `IndexWriter` is already
    // multithreaded.
    //
    // Here we give the writer a memory budget of 50MB. Using a bigger
    // memory arena for the indexer can increase its throughput.
    let mut index_writer: IndexWriter = index.writer(50_000_000)?;
    index_writer.add_document(doc!(
    title => "The Old Man and the Sea",
    body => "He was an old man who fished alone in a skiff in the Gulf Stream and \
     he had gone eighty-four days now without taking a fish."
    ))?;
    index_writer.add_document(doc!(
    title => "Of Mice and Men",
       body => r#"A few miles south of Soledad, the Salinas River drops in close to the hillside
                bank and runs deep and green. The water is warm too, for it has slipped twinkling
                over the yellow sands in the sunlight before reaching the narrow pool. On one
                side of the river the golden foothill slopes curve up to the strong and rocky
                Gabilan Mountains, but on the valley side the water is lined with trees—willows
                fresh and green with every spring, carrying in their lower leaf junctures the
                debris of the winter’s flooding; and sycamores with mottled, white, recumbent
                limbs and branches that arch over the pool"#
    ))?;
    index_writer.add_document(doc!(
    title => "Frankenstein",
        body => r#"You will rejoice to hear that no disaster has accompanied the commencement of an
                enterprise which you have regarded with such evil forebodings.  I arrived here
                yesterday, and my first task is to assure my dear sister of my welfare and
                increasing confidence in the success of my undertaking."#
    ))?;
    index_writer.commit()?;

    let reader = index.reader()?;
    let searcher = reader.searcher();

    // The query parser can interpret human queries.
    // Here, if the user does not specify which
    // field they want to search, tantivy will search
    // in both title and body.
    let query_parser = QueryParser::for_index(&index, vec![title, body]);

    // Here we want to get a hit on the 'ken' in Frankenstein.
    let query = query_parser.parse_query("ken")?;

    let top_docs = searcher.search(&query, &TopDocs::with_limit(10).order_by_score())?;

    // Print each hit as JSON; only the title is stored, so only it can be shown.
    for (_, doc_address) in top_docs {
        let retrieved_doc: TantivyDocument = searcher.doc(doc_address)?;
        println!("{}", retrieved_doc.to_json(&schema));
    }

    Ok(())
}


================================================
FILE: examples/date_time_field.rs
================================================
// # DateTime field example
//
// This example shows how the DateTime field can be used

use tantivy::collector::TopDocs;
use tantivy::query::QueryParser;
use tantivy::schema::{DateOptions, Document, Schema, Value, INDEXED, STORED, STRING};
use tantivy::{Index, IndexWriter, TantivyDocument};

fn main() -> tantivy::Result<()> {
    // # Defining the schema
    let mut schema_builder = Schema::builder();
    // The date field is indexed, stored and fast, with its precision set to seconds.
    let opts = DateOptions::from(INDEXED)
        .set_stored()
        .set_fast()
        .set_precision(tantivy::schema::DateTimePrecision::Seconds);
    // Add `occurred_at` date field type
    let occurred_at = schema_builder.add_date_field("occurred_at", opts);
    let event_type = schema_builder.add_text_field("event", STRING | STORED);
    let schema = schema_builder.build();

    // # Indexing documents
    let index = Index::create_in_ram(schema.clone());

    let mut index_writer: IndexWriter = index.writer(50_000_000)?;
    // The dates are passed as strings in the RFC3339 format
    let doc = TantivyDocument::parse_json(
        &schema,
        r#"{
        "occurred_at": "2022-06-22T12:53:50.53Z",
        "event": "pull-request"
    }"#,
    )?;
    index_writer.add_document(doc)?;
    let doc = TantivyDocument::parse_json(
        &schema,
        r#"{
        "occurred_at": "2022-06-22T13:00:00.22Z",
        "event": "comment"
    }"#,
    )?;
    index_writer.add_document(doc)?;
    index_writer.commit()?;

    let reader = index.reader()?;
    let searcher = reader.searcher();

    // # Search
    //
    // `event` is the default field; the queries below target `occurred_at` explicitly.
    let query_parser = QueryParser::for_index(&index, vec![event_type]);
    {
        // Simple exact search on the date: exactly one document is expected to match.
        let query = query_parser.parse_query("occurred_at:\"2022-06-22T12:53:50.53Z\"")?;
        let count_docs = searcher.search(&*query, &TopDocs::with_limit(5).order_by_score())?;
        assert_eq!(count_docs.len(), 1);
    }
    {
        // Range query on the date field: only the "comment" event is expected to match.
        let query = query_parser
            .parse_query(r#"occurred_at:[2022-06-22T12:58:00Z TO 2022-06-23T00:00:00Z}"#)?;
        let count_docs = searcher.search(&*query, &TopDocs::with_limit(4).order_by_score())?;
        assert_eq!(count_docs.len(), 1);
        for (_score, doc_address) in count_docs {
            let retrieved_doc = searcher.doc::<TantivyDocument>(doc_address)?;
            // The stored value must come back as a datetime.
            assert!(retrieved_doc
                .get_first(occurred_at)
                .unwrap()
                .as_value()
                .as_datetime()
                .is_some(),);
            // The JSON rendering of the stored document is expected to keep the
            // sub-second part of the original timestamp.
            assert_eq!(
                retrieved_doc.to_json(&schema),
                r#"{"event":["comment"],"occurred_at":["2022-06-22T13:00:00.22Z"]}"#
            );
        }
    }
    Ok(())
}


================================================
FILE: examples/deleting_updating_documents.rs
================================================
// # Deleting and Updating (?) documents
//
// This example explains how to delete and update documents.
// In fact there is actually no such thing as an update in tantivy.
//
// To update a document, you need to delete a document and then reinsert
// its new version.
//
// ---
// Importing tantivy...
use tantivy::collector::TopDocs;
use tantivy::query::TermQuery;
use tantivy::schema::*;
use tantivy::{doc, Index, IndexReader, IndexWriter};

// Helper used to check our work: looks up a single document by its id term.
//
// Returns `Ok(Some(doc))` for the top hit matching `isbn_term`,
// and `Ok(None)` when no document matches.
fn extract_doc_given_isbn(
    reader: &IndexReader,
    isbn_term: &Term,
) -> tantivy::Result<Option<TantivyDocument>> {
    let searcher = reader.searcher();

    // A term query is the simplest query there is:
    // it matches every document containing one specific term.
    //
    // `IndexRecordOption::Basic` states that neither positions
    // nor term frequencies need to be decoded.
    let term_query = TermQuery::new(isbn_term.clone(), IndexRecordOption::Basic);

    // A single hit is enough.
    let collector = TopDocs::with_limit(1).order_by_score();
    let hits = searcher.search(&term_query, &collector)?;

    match hits.first() {
        // No doc matching this ID.
        None => Ok(None),
        Some((_score, doc_address)) => {
            let found = searcher.doc(*doc_address)?;
            Ok(Some(found))
        }
    }
}

// Indexes three books, then fixes a typo in one of them by deleting the document
// (by its `isbn` term) and re-inserting the corrected version, checking the stored
// content before and after the update.
fn main() -> tantivy::Result<()> {
    // # Defining the schema
    //
    // Check out the *basic_search* example if this makes
    // little sense to you.
    let mut schema_builder = Schema::builder();

    // Tantivy does not really have a notion of primary id.
    // This may change in the future.
    //
    // Still, we can create an `isbn` field and use it as an id. This
    // field can be `u64` or a `text`, depending on your use case.
    // It just needs to be indexed.
    //
    // If it is `text`, let's make sure to keep it `raw` and let's avoid
    // running any text processing on it.
    // This is done by associating this field to the tokenizer named `raw`.
    // Rather than building our
    // [`TextOptions`](//docs.rs/tantivy/~0/tantivy/schema/struct.TextOptions.html) manually, we
    // use the `STRING` shortcut. `STRING` stands for indexed (without term frequency or positions)
    // and untokenized.
    //
    // Because we also want to be able to see this `id` in our returned documents,
    // we also mark the field as stored.
    let isbn = schema_builder.add_text_field("isbn", STRING | STORED);
    let title = schema_builder.add_text_field("title", TEXT | STORED);
    let schema = schema_builder.build();

    let index = Index::create_in_ram(schema.clone());

    let mut index_writer: IndexWriter = index.writer(50_000_000)?;

    // Let's add a couple of documents, for the sake of the example.
    index_writer.add_document(doc!(
        isbn => "978-0099908401",
        title => "The Old Man and the Sea"
    ))?;
    index_writer.add_document(doc!(
        isbn => "978-0140177398",
        title => "Of Mice and Men",
    ))?;
    index_writer.add_document(doc!(
       title => "Frankentein", //< Oops there is a typo here.
       isbn => "978-9176370711",
    ))?;
    index_writer.commit()?;
    let reader = index.reader()?;

    let frankenstein_isbn = Term::from_field_text(isbn, "978-9176370711");

    // Oops our frankenstein doc seems misspelled
    let frankenstein_doc_misspelled = extract_doc_given_isbn(&reader, &frankenstein_isbn)?.unwrap();
    assert_eq!(
        frankenstein_doc_misspelled.to_json(&schema),
        r#"{"isbn":["978-9176370711"],"title":["Frankentein"]}"#,
    );

    // # Update = Delete + Insert
    //
    // Here we will want to update the typo in the `Frankenstein` book.
    //
    // Tantivy does not handle updates directly, we need to delete
    // and reinsert the document.
    //
    // This can be complicated as it means you need to have access
    // to the entire document. It is good practice to integrate tantivy
    // with a key value store for this reason.
    //
    // To remove one of the documents, we just call `delete_term`
    // on its id.
    //
    // Note that `tantivy` does nothing to enforce the idea that
    // there is only one document associated with this id.
    //
    // Also you might have noticed that we apply the delete before
    // having committed. This does not matter really...
    index_writer.delete_term(frankenstein_isbn.clone());

    // We now need to reinsert our document without the typo.
    index_writer.add_document(doc!(
       title => "Frankenstein",
       isbn => "978-9176370711",
    ))?;

    // You are guaranteed that your clients will only observe your index in
    // the state it was in after a commit.
    // In this example, your search engine will at no point be missing the *Frankenstein* document.
    // Everything happened as if the document was updated.
    index_writer.commit()?;
    // We reload our searcher to make our change available to clients.
    reader.reload()?;

    // No more typo!
    let frankenstein_new_doc = extract_doc_given_isbn(&reader, &frankenstein_isbn)?.unwrap();
    assert_eq!(
        frankenstein_new_doc.to_json(&schema),
        r#"{"isbn":["978-9176370711"],"title":["Frankenstein"]}"#,
    );

    Ok(())
}


================================================
FILE: examples/faceted_search.rs
================================================
// # Faceted Search
//
// This example covers the faceted search functionalities of
// tantivy.
//
// We will :
// - define a text field "name" in our schema
// - define a facet field "classification" in our schema
// - create an index in memory
// - index few documents with respective facets in our index
// - search and count the number of documents whose classification starts with the facet
//   "/Felidae"
// - Search the facet "/Felidae/Pantherinae" and count the number of documents that the
//   classifications include the facet.
//
// ---
// Importing tantivy...
use tantivy::collector::FacetCollector;
use tantivy::query::{AllQuery, TermQuery};
use tantivy::schema::*;
use tantivy::{doc, Index, IndexWriter};

// Builds an in-memory index of animals tagged with a hierarchical facet, then
// counts documents per sub-facet, first over all documents and then over the
// documents matching a facet term query.
fn main() -> tantivy::Result<()> {
    // Let's define the schema: a stored text field and a facet field.
    let mut schema_builder = Schema::builder();

    let name = schema_builder.add_text_field("name", TEXT | STORED);
    // this is our faceted field: its scientific classification
    let classification = schema_builder.add_facet_field("classification", FacetOptions::default());

    let schema = schema_builder.build();
    let index = Index::create_in_ram(schema);

    let mut index_writer: IndexWriter = index.writer(30_000_000)?;

    // Each document is built with the `doc!` macro from `field => value` pairs:
    // a name and the facet path of its classification.
    index_writer.add_document(doc!(
        name => "Cat",
        classification => Facet::from("/Felidae/Felinae/Felis")
    ))?;
    index_writer.add_document(doc!(
        name => "Canada lynx",
        classification => Facet::from("/Felidae/Felinae/Lynx")
    ))?;
    index_writer.add_document(doc!(
        name => "Cheetah",
        classification => Facet::from("/Felidae/Felinae/Acinonyx")
    ))?;
    index_writer.add_document(doc!(
        name => "Tiger",
        classification => Facet::from("/Felidae/Pantherinae/Panthera")
    ))?;
    index_writer.add_document(doc!(
        name => "Lion",
        classification => Facet::from("/Felidae/Pantherinae/Panthera")
    ))?;
    index_writer.add_document(doc!(
        name => "Jaguar",
        classification => Facet::from("/Felidae/Pantherinae/Panthera")
    ))?;
    index_writer.add_document(doc!(
        name => "Sunda clouded leopard",
        classification => Facet::from("/Felidae/Pantherinae/Neofelis")
    ))?;
    index_writer.add_document(doc!(
        name => "Fossa",
        classification => Facet::from("/Eupleridae/Cryptoprocta")
    ))?;
    index_writer.commit()?;

    let reader = index.reader()?;
    let searcher = reader.searcher();
    {
        // Count facets over every document (`AllQuery`), registering "/Felidae"
        // as the facet we want counts for.
        let mut facet_collector = FacetCollector::for_field("classification");
        facet_collector.add_facet("/Felidae");
        let facet_counts = searcher.search(&AllQuery, &facet_collector)?;
        // This lists all of the facet counts, right below "/Felidae".
        let facets: Vec<(&Facet, u64)> = facet_counts.get("/Felidae").collect();
        assert_eq!(
            facets,
            vec![
                (&Facet::from("/Felidae/Felinae"), 3),
                (&Facet::from("/Felidae/Pantherinae"), 4),
            ]
        );
    }

    // Facets are also searchable.
    //
    // For instance a common UI pattern is to allow the user to click on a facet link
    // (e.g: `Pantherinae`) to drill down and filter the current result set with this subfacet.
    //
    // The search would then look as follows.

    // Check the reference doc for different ways to create a `Facet` object.
    {
        // Restrict the search to documents carrying the "/Felidae/Pantherinae" facet
        // term, and count the facets right below it among those documents.
        let facet = Facet::from("/Felidae/Pantherinae");
        let facet_term = Term::from_facet(classification, &facet);
        let facet_term_query = TermQuery::new(facet_term, IndexRecordOption::Basic);
        let mut facet_collector = FacetCollector::for_field("classification");
        facet_collector.add_facet("/Felidae/Pantherinae");
        let facet_counts = searcher.search(&facet_term_query, &facet_collector)?;
        let facets: Vec<(&Facet, u64)> = facet_counts.get("/Felidae/Pantherinae").collect();
        assert_eq!(
            facets,
            vec![
                (&Facet::from("/Felidae/Pantherinae/Neofelis"), 1),
                (&Facet::from("/Felidae/Pantherinae/Panthera"), 3),
            ]
        );
    }

    Ok(())
}


================================================
FILE: examples/faceted_search_with_tweaked_score.rs
================================================
// # Faceted Search With Tweaked Score
//
// This example covers the faceted search functionalities of
// tantivy, combined with a custom (tweaked) score.
//
// We will :
// - define a text field "title" in our schema
// - define a facet field "ingredient" in our schema

use std::collections::HashSet;

use tantivy::collector::TopDocs;
use tantivy::query::BooleanQuery;
use tantivy::schema::*;
use tantivy::{doc, DocId, Index, IndexWriter, Score, SegmentReader};

// Indexes three recipes tagged with ingredient facets, searches for recipes
// containing any of a set of ingredients, and ranks them with a score that is
// reduced for every ingredient of the recipe that was not asked for.
fn main() -> tantivy::Result<()> {
    let mut schema_builder = Schema::builder();

    // The title is only stored (not indexed); the search goes through the facets.
    let title = schema_builder.add_text_field("title", STORED);
    let ingredient = schema_builder.add_facet_field("ingredient", FacetOptions::default());

    let schema = schema_builder.build();
    let index = Index::create_in_ram(schema);

    let mut index_writer: IndexWriter = index.writer(30_000_000)?;

    // A document may carry several values for the same facet field.
    index_writer.add_document(doc!(
        title => "Fried egg",
        ingredient => Facet::from("/ingredient/egg"),
        ingredient => Facet::from("/ingredient/oil"),
    ))?;
    index_writer.add_document(doc!(
        title => "Scrambled egg",
        ingredient => Facet::from("/ingredient/egg"),
        ingredient => Facet::from("/ingredient/butter"),
        ingredient => Facet::from("/ingredient/milk"),
        ingredient => Facet::from("/ingredient/salt"),
    ))?;
    index_writer.add_document(doc!(
        title => "Egg rolls",
        ingredient => Facet::from("/ingredient/egg"),
        ingredient => Facet::from("/ingredient/garlic"),
        ingredient => Facet::from("/ingredient/salt"),
        ingredient => Facet::from("/ingredient/oil"),
        ingredient => Facet::from("/ingredient/tortilla-wrap"),
        ingredient => Facet::from("/ingredient/mushroom"),
    ))?;
    index_writer.commit()?;

    let reader = index.reader()?;
    let searcher = reader.searcher();
    {
        // The ingredients we are searching for.
        let facets = [
            Facet::from("/ingredient/egg"),
            Facet::from("/ingredient/oil"),
            Facet::from("/ingredient/garlic"),
            Facet::from("/ingredient/mushroom"),
        ];
        // One term per requested ingredient, combined into a single multi-term query.
        let query = BooleanQuery::new_multiterms_query(
            facets
                .iter()
                .map(|key| Term::from_facet(ingredient, key))
                .collect(),
        );
        let top_docs_by_custom_score =
            // Call TopDocs with a custom tweak score
            //
            // The outer closure runs with a `SegmentReader` and returns the inner
            // closure, which computes the tweaked score of each document.
            TopDocs::with_limit(2).tweak_score(move |segment_reader: &SegmentReader| {
                let ingredient_reader = segment_reader.facet_reader("ingredient").unwrap();
                let facet_dict = ingredient_reader.facet_dict();

                // Term ordinals of the requested ingredients in this segment's facet
                // dictionary. Facets for which `term_ord` yields `None` are skipped.
                let query_ords: HashSet<u64> = facets
                    .iter()
                    .filter_map(|key| facet_dict.term_ord(key.encoded_str()).unwrap())
                    .collect();

                move |doc: DocId, original_score: Score| {
                    // Update the original score with a tweaked score
                    //
                    // Count the document's ingredients that were not requested...
                    let missing_ingredients = ingredient_reader
                        .facet_ords(doc)
                        .filter(|ord| !query_ords.contains(ord))
                        .count();
                    // ... and divide the score by 4 for each of them.
                    let tweak = 1.0 / 4_f32.powi(missing_ingredients as i32);

                    original_score * tweak
                }
            });
        let top_docs = searcher.search(&query, &top_docs_by_custom_score)?;

        // Fetch the stored title of each of the (at most 2) hits.
        let titles: Vec<String> = top_docs
            .iter()
            .map(|(_, doc_id)| {
                searcher
                    .doc::<TantivyDocument>(*doc_id)
                    .unwrap()
                    .get_first(title)
                    .and_then(|v| v.as_str().map(|el| el.to_string()))
                    .unwrap()
            })
            .collect();
        assert_eq!(titles, vec!["Fried egg", "Egg rolls"]);
    }
    Ok(())
}


================================================
FILE: examples/filter_aggregation.rs
================================================
// # Filter Aggregation Example
//
// This example demonstrates filter aggregations - creating buckets of documents
// matching specific queries, with nested aggregations computed on each bucket.
//
// Filter aggregations are useful for computing metrics on different subsets of
// your data in a single query, like "average price overall + average price for
// electronics + count of in-stock items".

use serde_json::json;
use tantivy::aggregation::agg_req::Aggregations;
use tantivy::aggregation::AggregationCollector;
use tantivy::query::AllQuery;
use tantivy::schema::{Schema, FAST, INDEXED, TEXT};
use tantivy::{doc, Index};

// Indexes four products in memory and runs four filter aggregation requests
// against them, asserting the exact JSON result of each and printing it.
fn main() -> tantivy::Result<()> {
    // Create a simple product schema.
    //
    // We keep the `Field` handle returned for each field, so documents can be
    // built without looking the fields up by name again.
    let mut schema_builder = Schema::builder();
    let category = schema_builder.add_text_field("category", TEXT | FAST);
    let brand = schema_builder.add_text_field("brand", TEXT | FAST);
    let price = schema_builder.add_u64_field("price", FAST);
    let rating = schema_builder.add_f64_field("rating", FAST);
    let in_stock = schema_builder.add_bool_field("in_stock", FAST | INDEXED);
    let schema = schema_builder.build();

    // Create index and add sample products
    let index = Index::create_in_ram(schema);
    let mut writer = index.writer(50_000_000)?;

    writer.add_document(doc!(
        category => "electronics",
        brand => "apple",
        price => 999u64,
        rating => 4.5f64,
        in_stock => true
    ))?;
    writer.add_document(doc!(
        category => "electronics",
        brand => "samsung",
        price => 799u64,
        rating => 4.2f64,
        in_stock => true
    ))?;
    writer.add_document(doc!(
        category => "clothing",
        brand => "nike",
        price => 120u64,
        rating => 4.1f64,
        in_stock => false
    ))?;
    writer.add_document(doc!(
        category => "books",
        brand => "penguin",
        price => 25u64,
        rating => 4.8f64,
        in_stock => true
    ))?;

    writer.commit()?;

    let reader = index.reader()?;
    let searcher = reader.searcher();

    // Example 1: Basic filter with metric aggregation
    println!("=== Example 1: Electronics average price ===");
    let agg_req = json!({
        "electronics": {
            "filter": "category:electronics",
            "aggs": {
                "avg_price": { "avg": { "field": "price" } }
            }
        }
    });

    let agg: Aggregations = serde_json::from_value(agg_req)?;
    let collector = AggregationCollector::from_aggs(agg, Default::default());
    let result = searcher.search(&AllQuery, &collector)?;

    let expected = json!({
        "electronics": {
            "doc_count": 2,
            "avg_price": { "value": 899.0 }
        }
    });
    assert_eq!(serde_json::to_value(&result)?, expected);
    println!("{}\n", serde_json::to_string_pretty(&result)?);

    // Example 2: Multiple independent filters
    println!("=== Example 2: Multiple filters in one query ===");
    let agg_req = json!({
        "electronics": {
            "filter": "category:electronics",
            "aggs": { "avg_price": { "avg": { "field": "price" } } }
        },
        "in_stock": {
            "filter": "in_stock:true",
            "aggs": { "count": { "value_count": { "field": "brand" } } }
        },
        "high_rated": {
            "filter": "rating:[4.5 TO *]",
            "aggs": { "count": { "value_count": { "field": "brand" } } }
        }
    });

    let agg: Aggregations = serde_json::from_value(agg_req)?;
    let collector = AggregationCollector::from_aggs(agg, Default::default());
    let result = searcher.search(&AllQuery, &collector)?;

    let expected = json!({
        "electronics": {
            "doc_count": 2,
            "avg_price": { "value": 899.0 }
        },
        "in_stock": {
            "doc_count": 3,
            "count": { "value": 3.0 }
        },
        "high_rated": {
            "doc_count": 2,
            "count": { "value": 2.0 }
        }
    });
    assert_eq!(serde_json::to_value(&result)?, expected);
    println!("{}\n", serde_json::to_string_pretty(&result)?);

    // Example 3: Nested filters - progressive refinement
    println!("=== Example 3: Nested filters ===");
    let agg_req = json!({
        "in_stock": {
            "filter": "in_stock:true",
            "aggs": {
                "electronics": {
                    "filter": "category:electronics",
                    "aggs": {
                        "expensive": {
                            "filter": "price:[800 TO *]",
                            "aggs": {
                                "avg_rating": { "avg": { "field": "rating" } }
                            }
                        }
                    }
                }
            }
        }
    });

    let agg: Aggregations = serde_json::from_value(agg_req)?;
    let collector = AggregationCollector::from_aggs(agg, Default::default());
    let result = searcher.search(&AllQuery, &collector)?;

    let expected = json!({
        "in_stock": {
            "doc_count": 3,  // apple, samsung, penguin
            "electronics": {
                "doc_count": 2,  // apple, samsung
                "expensive": {
                    "doc_count": 1,  // only apple (999)
                    "avg_rating": { "value": 4.5 }
                }
            }
        }
    });
    assert_eq!(serde_json::to_value(&result)?, expected);
    println!("{}\n", serde_json::to_string_pretty(&result)?);

    // Example 4: Filter with sub-aggregation (terms)
    println!("=== Example 4: Filter with terms sub-aggregation ===");
    let agg_req = json!({
        "electronics": {
            "filter": "category:electronics",
            "aggs": {
                "by_brand": {
                    "terms": { "field": "brand" },
                    "aggs": {
                        "avg_price": { "avg": { "field": "price" } }
                    }
                }
            }
        }
    });

    let agg: Aggregations = serde_json::from_value(agg_req)?;
    let collector = AggregationCollector::from_aggs(agg, Default::default());
    let result = searcher.search(&AllQuery, &collector)?;

    let expected = json!({
        "electronics": {
            "doc_count": 2,
            "by_brand": {
                "buckets": [
                    {
                        "key": "samsung",
                        "doc_count": 1,
                        "avg_price": { "value": 799.0 }
                    },
                    {
                        "key": "apple",
                        "doc_count": 1,
                        "avg_price": { "value": 999.0 }
                    }
                ],
                "sum_other_doc_count": 0,
                "doc_count_error_upper_bound": 0
            }
        }
    });
    assert_eq!(serde_json::to_value(&result)?, expected);
    println!("{}", serde_json::to_string_pretty(&result)?);

    Ok(())
}


================================================
FILE: examples/fuzzy_search.rs
================================================
// # Fuzzy Search Example
//
// This example covers the fuzzy search functionality of
// tantivy.
//
// We will :
// - define our schema
// - create an index in a directory
// - index a few documents into our index
// - search for the documents containing a term close to a given term, using a `FuzzyTermQuery`
// - retrieve the matching documents' original content.
// ---
// Importing tantivy...
use tantivy::collector::{Count, TopDocs};
use tantivy::query::FuzzyTermQuery;
use tantivy::schema::*;
use tantivy::{doc, Index, IndexWriter, ReloadPolicy};
use tempfile::TempDir;

// Indexes four titles in a temporary directory, then runs a `FuzzyTermQuery`
// for "Diary" and checks that three documents match, printing each hit.
fn main() -> tantivy::Result<()> {
    // Let's create a temporary directory for the
    // sake of this example
    let index_path = TempDir::new()?;

    // # Defining the schema
    //
    // The Tantivy index requires a very strict schema.
    // The schema declares which fields are in the index,
    // and for each field, its type and "the way it should
    // be indexed".

    // First we need to define a schema ...
    let mut schema_builder = Schema::builder();

    // Our only field is title.
    // We want full-text search for it, and we also want
    // to be able to retrieve the document after the search.
    //
    // `TEXT | STORED` is some syntactic sugar to describe
    // that.
    //
    // `TEXT` means the field should be tokenized and indexed,
    // along with its term frequency and term positions.
    //
    // `STORED` means that the field will also be saved
    // in a compressed, row-oriented key-value store.
    // This store is useful for reconstructing the
    // documents that were selected during the search phase.
    let title = schema_builder.add_text_field("title", TEXT | STORED);

    let schema = schema_builder.build();

    // # Indexing documents
    //
    // Let's create a brand new index.
    //
    // This will actually just save a meta.json
    // with our schema in the directory.
    let index = Index::create_in_dir(&index_path, schema.clone())?;

    // To insert a document we will need an index writer.
    // There must be only one writer at a time.
    // This single `IndexWriter` is already
    // multithreaded.
    //
    // Here we give tantivy a budget of `50MB`.
    // Using a bigger memory_arena for the indexer may increase
    // throughput, but 50 MB is already plenty.
    let mut index_writer: IndexWriter = index.writer(50_000_000)?;

    // Let's index our documents!
    // The `title` field handle obtained above is all we need.

    // ### Adding documents
    //
    index_writer.add_document(doc!(
        title => "The Name of the Wind",
    ))?;
    index_writer.add_document(doc!(
        title => "The Diary of Muadib",
    ))?;
    index_writer.add_document(doc!(
        title => "A Dairy Cow",
    ))?;
    index_writer.add_document(doc!(
        title => "The Diary of a Young Girl",
    ))?;

    // ### Committing
    //
    // At this point our documents are not searchable.
    //
    //
    // We need to call `.commit()` explicitly to force the
    // `index_writer` to finish processing the documents in the queue,
    // flush the current index to the disk, and advertise
    // the existence of new documents.
    //
    // This call is blocking.
    index_writer.commit()?;

    // If `.commit()` returns correctly, then all of the
    // documents that have been added are guaranteed to be
    // persistently indexed.
    //
    // In the scenario of a crash or a power failure,
    // tantivy behaves as if it has rolled back to its last
    // commit.

    // # Searching
    //
    // ### Searcher
    //
    // A reader is required first in order to search an index.
    // It acts as a `Searcher` pool that reloads itself,
    // depending on a `ReloadPolicy`.
    //
    // For a search server you will typically create one reader for the entire lifetime of your
    // program, and acquire a new searcher for every single request.
    //
    // In the code below, we rely on the 'ON_COMMIT' policy: the reader
    // will reload the index automatically after each commit.
    let reader = index
        .reader_builder()
        .reload_policy(ReloadPolicy::OnCommitWithDelay)
        .try_into()?;

    // We now need to acquire a searcher.
    //
    // A searcher points to a snapshotted, immutable version of the index.
    //
    // Some search experience might require more than
    // one query. Using the same searcher ensures that all of these queries will run on the
    // same version of the index.
    //
    // Acquiring a `searcher` is very cheap.
    //
    // You should acquire a searcher every time you start processing a request
    // and release it right after your query is finished.
    let searcher = reader.searcher();

    // ### FuzzyTermQuery
    {
        let term = Term::from_field_text(title, "Diary");
        let query = FuzzyTermQuery::new(term, 2, true);

        // Collect the top hits and the total number of matches in a single pass.
        // A failing search is reported to the caller like every other error here.
        let (top_docs, count) =
            searcher.search(&query, &(TopDocs::with_limit(5).order_by_score(), Count))?;
        assert_eq!(count, 3);
        assert_eq!(top_docs.len(), 3);
        for (score, doc_address) in top_docs {
            // Note that the score is not lower for the fuzzy hit.
            // There's an issue open for that: https://github.com/quickwit-oss/tantivy/issues/563
            let retrieved_doc: TantivyDocument = searcher.doc(doc_address)?;
            println!("score {score:?} doc {}", retrieved_doc.to_json(&schema));
            // score 1.0 doc {"title":["The Diary of Muadib"]}
            //
            // score 1.0 doc {"title":["The Diary of a Young Girl"]}
            //
            // score 1.0 doc {"title":["A Dairy Cow"]}
        }
    }

    Ok(())
}


================================================
FILE: examples/index_from_multiple_threads.rs
================================================
// # Indexing from different threads.
//
// It is fairly common to have to index from different threads.
// Tantivy forbids to create more than one `IndexWriter` at a time.
//
// This `IndexWriter` itself has its own multithreaded layer, so managing your own
// indexing threads will not help. However, it can still be useful for some applications.
//
// For instance, if preparing documents to send to tantivy before indexing is the bottleneck of
// your application, it is reasonable to have multiple threads.
//
// Another very common reason to want to index from multiple threads, is implementing a webserver
// with CRUD capabilities. The server framework will most likely handle requests from
// different threads.
//
// The recommended way to address both of these use cases is to wrap your `IndexWriter` into an
// `Arc<RwLock<IndexWriter>>`.
//
// While this is counterintuitive, adding and deleting documents do not require mutability
// over the `IndexWriter`, so several threads will be able to do this operation concurrently.
//
// The example below does not represent an actual real-life use case (who would spawn a thread to
// index a single document?), but aims at demonstrating the mechanism that makes indexing
// from several threads possible.

// ---
// Importing tantivy...
use std::sync::{Arc, RwLock};
use std::thread;
use std::time::Duration;

use tantivy::schema::{Schema, STORED, TEXT};
use tantivy::{doc, Index, IndexWriter, Opstamp, TantivyError};

// Shares one `IndexWriter` between two indexing threads and the main thread:
// the spawned threads add documents under a read lock while the main thread
// commits under a write lock. Errors and panics from the indexing threads are
// reported once the commit loop is done.
fn main() -> tantivy::Result<()> {
    // # Defining the schema
    let mut schema_builder = Schema::builder();
    let title = schema_builder.add_text_field("title", TEXT | STORED);
    let body = schema_builder.add_text_field("body", TEXT);
    let schema = schema_builder.build();

    let index = Index::create_in_ram(schema);
    let index_writer: Arc<RwLock<IndexWriter>> = Arc::new(RwLock::new(index.writer(50_000_000)?));

    // # First indexing thread.
    let index_writer_clone_1 = index_writer.clone();
    let indexing_thread_1 = thread::spawn(move || {
        // we index 100 times the document... for the sake of the example.
        for i in 0..100 {
            let opstamp = index_writer_clone_1
                .read().unwrap() //< A read lock is sufficient here.
                .add_document(
                    doc!(
                        title => "Of Mice and Men",
                        body => "A few miles south of Soledad, the Salinas River drops in close to the hillside \
                        bank and runs deep and green. The water is warm too, for it has slipped twinkling \
                        over the yellow sands in the sunlight before reaching the narrow pool. On one \
                        side of the river the golden foothill slopes curve up to the strong and rocky \
                        Gabilan Mountains, but on the valley side the water is lined with trees—willows \
                        fresh and green with every spring, carrying in their lower leaf junctures the \
                        debris of the winter’s flooding; and sycamores with mottled, white, recumbent \
                        limbs and branches that arch over the pool"
                    ))?;
            println!("add doc {i} from thread 1 - opstamp {opstamp}");
            thread::sleep(Duration::from_millis(20));
        }
        Result::<(), TantivyError>::Ok(())
    });

    // # Second indexing thread.
    let index_writer_clone_2 = index_writer.clone();
    let indexing_thread_2 = thread::spawn(move || {
        // we index 100 times the document... for the sake of the example.
        for i in 0..100 {
            // A read lock is sufficient here.
            // The guard is scoped so that the lock is released before sleeping.
            let opstamp = {
                let index_writer_rlock = index_writer_clone_2.read().unwrap();
                index_writer_rlock.add_document(doc!(
                    title => "Manufacturing consent",
                    body => "Some great book description..."
                ))?
            };
            println!("add doc {i} from thread 2 - opstamp {opstamp}");
            thread::sleep(Duration::from_millis(10));
        }
        Result::<(), TantivyError>::Ok(())
    });

    // # In the main thread, we commit 10 times, once every 500ms.
    for _ in 0..10 {
        let opstamp: Opstamp = {
            // Committing or rollbacking on the other hand requires write lock. This will block
            // other threads.
            let mut index_writer_wlock = index_writer.write().unwrap();
            index_writer_wlock.commit()?
        };
        println!("committed with opstamp {opstamp}");
        thread::sleep(Duration::from_millis(500));
    }

    // # Waiting for the indexing threads.
    //
    // Dropping the join handles would silently discard whatever the threads
    // returned. Joining them lets us report an indexing error (or a panic)
    // instead of pretending that everything went fine.
    for indexing_thread in [indexing_thread_1, indexing_thread_2] {
        indexing_thread
            .join()
            .expect("an indexing thread panicked")?;
    }

    Ok(())
}


================================================
FILE: examples/index_with_json.rs
================================================
use tantivy::schema::*;

// # Document from json
//
// For convenience, `Document` can be parsed directly from json.
fn main() -> tantivy::Result<()> {
    // A schema is required to interpret the json payloads.
    // Check out the basic example if schema definition is unfamiliar.
    let schema = {
        let mut builder = Schema::builder();
        builder.add_text_field("title", TEXT | STORED);
        builder.add_text_field("body", TEXT);
        builder.add_u64_field("year", INDEXED);
        builder.build()
    };

    // A json-serialized document in which every field holds a single value.
    let mice_and_men_doc_json = r#"{
       "title": "Of Mice and Men",
       "year": 1937
    }"#;

    // Multi-valued fields are allowed as well: they are expressed in JSON
    // by an array. This document has two titles.
    let frankenstein_json = r#"{
       "title": ["Frankenstein", "The Modern Prometheus"],
       "year": 1818
    }"#;

    // Parse each payload against the schema; a parsing failure is
    // propagated to the caller through `?`.
    for json_payload in [mice_and_men_doc_json, frankenstein_json] {
        let _parsed_doc = TantivyDocument::parse_json(&schema, json_payload)?;
    }

    // Note that the schema is saved in your index directory.
    //
    // As a result, indexes are aware of their schema: after opening an existing
    // `Index`, documents can be parsed the same way using `index.schema()`,
    // i.e. `TantivyDocument::parse_json(&index.schema(), json)`.
    Ok(())
}


================================================
FILE: examples/integer_range_search.rs
================================================
use std::ops::Bound;

// # Searching a range on an indexed int field.
//
// Below is an example of creating an indexed integer field in your schema.
// You can use `RangeQuery` to get a count of all occurrences in a given range.
use tantivy::collector::Count;
use tantivy::query::RangeQuery;
use tantivy::schema::{Schema, INDEXED};
use tantivy::{doc, Index, IndexWriter, Result, Term};

fn main() -> Result<()> {
    // To keep things simple the schema holds a single field.
    // `INDEXED` is a short-hand to indicate that the field should be "searchable".
    let mut schema_builder = Schema::builder();
    let year_field = schema_builder.add_u64_field("year", INDEXED);
    let index = Index::create_in_ram(schema_builder.build());
    let reader = index.reader()?;

    // Index one document per year of the range 1950..2019, commit, and
    // release the writer before searching.
    let mut index_writer: IndexWriter = index.writer_with_num_threads(1, 6_000_000)?;
    for year in 1950u64..2019u64 {
        index_writer.add_document(doc!(year_field => year))?;
    }
    index_writer.commit()?;
    drop(index_writer);

    // The reader was created before the commit: reload it so that the
    // searcher sees the freshly committed documents.
    reader.reload()?;
    let searcher = reader.searcher();

    // The upper bound is excluded, i.e. the query covers 1960 up to 1969.
    let sixties_start = Bound::Included(Term::from_field_u64(year_field, 1960));
    let sixties_end = Bound::Excluded(Term::from_field_u64(year_field, 1970));
    let docs_in_the_sixties = RangeQuery::new(sixties_start, sixties_end);

    // The `Count` collector sums the number of docs falling in the range.
    let num_60s_books = searcher.search(&docs_in_the_sixties, &Count)?;
    assert_eq!(num_60s_books, 10);
    Ok(())
}


================================================
FILE: examples/ip_field.rs
================================================
// # IP Address example
//
// This example shows how the ip field can be used
// with IpV6 and IpV4.

use tantivy::collector::{Count, TopDocs};
use tantivy::query::QueryParser;
use tantivy::schema::{Schema, FAST, INDEXED, STORED, STRING};
use tantivy::{Index, IndexWriter, TantivyDocument};

fn main() -> tantivy::Result<()> {
    // # Defining the schema
    // The IP field is `INDEXED` so that it can be searched, and `FAST` so that a
    // fast field is created; the fast field will be used to execute search queries.
    // `FAST` is not a requirement for range queries: they can also be executed on
    // the inverted index which is created by `INDEXED`.
    let mut schema_builder = Schema::builder();
    let event_type = schema_builder.add_text_field("event_type", STRING | STORED);
    let ip = schema_builder.add_ip_addr_field("ip", STORED | INDEXED | FAST);
    let schema = schema_builder.build();

    // # Indexing documents
    let index = Index::create_in_ram(schema.clone());
    let mut index_writer: IndexWriter = index.writer(50_000_000)?;

    // The IP addresses are passed as strings. Since the field is of type ip,
    // the address is parsed from the string and stored internally as IPv6.
    // The first two documents carry an IPv4 address, the last one an IPv6 address.
    let json_docs = [
        r#"{
            "ip": "192.168.0.33",
            "event_type": "login"
        }"#,
        r#"{
            "ip": "192.168.0.80",
            "event_type": "checkout"
        }"#,
        r#"{
            "ip": "2001:0db8:85a3:0000:0000:8a2e:0370:7334",
            "event_type": "checkout"
        }"#,
    ];
    for json_doc in json_docs {
        let parsed_doc = TantivyDocument::parse_json(&schema, json_doc)?;
        index_writer.add_document(parsed_doc)?;
    }
    // Commit will create a segment containing our documents.
    index_writer.commit()?;

    let reader = index.reader()?;
    let searcher = reader.searcher();
    let query_parser = QueryParser::for_index(&index, vec![event_type, ip]);

    // Number of hits returned by a top-`limit` search (ordered by score) for `query_str`.
    let num_top_hits = |query_str: &str, limit: usize| -> tantivy::Result<usize> {
        let query = query_parser.parse_query(query_str)?;
        let hits = searcher.search(&*query, &TopDocs::with_limit(limit).order_by_score())?;
        Ok(hits.len())
    };
    // Total number of documents matching `query_str`.
    let num_matches = |query_str: &str| -> tantivy::Result<usize> {
        let query = query_parser.parse_query(query_str)?;
        searcher.search(&*query, &Count)
    };

    // # Search
    // ### Range Queries
    // Range queries on IPv4. Since we created a fast field, the fast field will
    // be used to execute the search.

    // Inclusive range query.
    assert_eq!(num_top_hits("ip:[192.168.0.80 TO 192.168.0.100]", 5)?, 1);
    // Range query with an exclusive lower bound.
    assert_eq!(num_top_hits("ip:{192.168.0.80 TO 192.168.1.100]", 2)?, 0);
    // Docs with an IP address smaller than or equal to 192.168.1.100.
    assert_eq!(num_top_hits("ip:[* TO 192.168.1.100]", 2)?, 2);
    // Docs with an IP address strictly smaller than 192.168.1.100.
    assert_eq!(num_top_hits("ip:[* TO 192.168.1.100}", 2)?, 2);

    // ### Exact Queries
    // Exact search on IPv4.
    assert_eq!(num_matches("ip:192.168.0.80")?, 1);
    // Exact search on IPv6.
    // IPv6 addresses need to be quoted because they contain `:`.
    assert_eq!(
        num_matches("ip:\"2001:0db8:85a3:0000:0000:8a2e:0370:7334\"")?,
        1
    );

    Ok(())
}


================================================
FILE: examples/iterating_docs_and_positions.rs
================================================
// # Iterating docs and positions.
//
// At its core, tantivy relies on a data structure
// called an inverted index.
//
// This example shows how to manually iterate through
// the list of documents containing a term, getting
// its term frequency, and accessing its positions.

use tantivy::postings::Postings;
// ---
// Importing tantivy...
use tantivy::schema::*;
use tantivy::{doc, DocSet, Index, IndexWriter, TERMINATED};

fn main() -> tantivy::Result<()> {
    // We first create a schema for the sake of the
    // example. Check the `basic_search` example for more information.
    let mut schema_builder = Schema::builder();

    // For this example, we need to make sure to index positions for our title
    // field. `TEXT` precisely does this.
    let title = schema_builder.add_text_field("title", TEXT | STORED);
    let schema = schema_builder.build();

    let index = Index::create_in_ram(schema);

    let mut index_writer: IndexWriter = index.writer_with_num_threads(1, 50_000_000)?;
    index_writer.add_document(doc!(title => "The Old Man and the Sea"))?;
    index_writer.add_document(doc!(title => "Of Mice and Men"))?;
    index_writer.add_document(doc!(title => "The modern Prometheus"))?;
    index_writer.commit()?;

    let reader = index.reader()?;

    let searcher = reader.searcher();

    // A `Term` is a text token associated with a field.
    // Both passes below go through all docs containing the term `title:the`.
    // The term does not depend on the segment, so it is built only once.
    let term_the = Term::from_field_text(title, "the");

    // A tantivy index is actually a collection of segments.
    // Similarly, a searcher just wraps a list `segment_reader`.
    //
    // (Because we indexed a very small number of documents over one thread
    // there is actually only one segment here, but let's iterate through the list
    // anyway)
    for segment_reader in searcher.segment_readers() {
        // A segment contains different data structure.
        // Inverted index stands for the combination of
        // - the term dictionary
        // - the inverted lists associated with each terms and their positions
        let inverted_index = segment_reader.inverted_index(title)?;

        // This segment posting object is like a cursor over the documents matching the term.
        // The `IndexRecordOption` arguments tells tantivy we will be interested in both term
        // frequencies and positions.
        //
        // If you don't need all this information, you may get better performance by decompressing
        // less information.
        if let Some(mut segment_postings) =
            inverted_index.read_postings(&term_the, IndexRecordOption::WithFreqsAndPositions)?
        {
            // this buffer will be used to request for positions
            let mut positions: Vec<u32> = Vec::with_capacity(100);
            let mut doc_id = segment_postings.doc();
            while doc_id != TERMINATED {
                // This MAY contains deleted documents as well.
                if segment_reader.is_deleted(doc_id) {
                    doc_id = segment_postings.advance();
                    continue;
                }

                // the number of time the term appears in the document.
                let term_freq: u32 = segment_postings.term_freq();
                // accessing positions is slightly expensive and lazy, do not request
                // for them if you don't need them for some documents.
                segment_postings.positions(&mut positions);

                // By definition we should have `term_freq` positions.
                assert_eq!(positions.len(), term_freq as usize);

                // This prints:
                // ```
                // Doc 0: TermFreq 2: [0, 4]
                // Doc 2: TermFreq 1: [0]
                // ```
                println!("Doc {doc_id}: TermFreq {term_freq}: {positions:?}");
                doc_id = segment_postings.advance();
            }
        }
    }

    // Some other powerful operations (especially `.seek`) may be useful to consume these
    // posting lists rapidly.
    // You can check for them in the [`DocSet`](https://docs.rs/tantivy/~0/tantivy/trait.DocSet.html) trait
    // and the [`Postings`](https://docs.rs/tantivy/~0/tantivy/postings/trait.Postings.html) trait

    // Also, for some VERY specific high performance use case like an OLAP analysis of logs,
    // you can get better performance by accessing directly the blocks of doc ids.
    for segment_reader in searcher.segment_readers() {
        // Same inverted index as in the first pass (term dictionary + inverted lists).
        let inverted_index = segment_reader.inverted_index(title)?;

        // This time the postings are consumed one block of doc ids at a time.
        // Only the doc ids are of interest here, so `IndexRecordOption::Basic`
        // is requested instead of frequencies and positions.
        if let Some(mut block_segment_postings) =
            inverted_index.read_block_postings(&term_the, IndexRecordOption::Basic)?
        {
            loop {
                // Once again these docs MAY contains deleted documents as well.
                let docs = block_segment_postings.docs();
                // An empty block signals that the posting list is exhausted.
                if docs.is_empty() {
                    break;
                }
                // Prints `Docs [0, 2]`
                println!("Docs {docs:?}");
                block_segment_postings.advance();
            }
        }
    }

    Ok(())
}


================================================
FILE: examples/json_field.rs
================================================
// # Json field example
//
// This example shows how the json field can be used
// to make tantivy partially schemaless by setting it as
// default query parser field.

use tantivy::collector::{Count, TopDocs};
use tantivy::query::QueryParser;
use tantivy::schema::{Schema, FAST, STORED, STRING, TEXT};
use tantivy::{Index, IndexWriter, TantivyDocument};

fn main() -> tantivy::Result<()> {
    // # Defining the schema
    let mut schema_builder = Schema::builder();
    schema_builder.add_date_field("timestamp", FAST | STORED);
    let event_type = schema_builder.add_text_field("event_type", STRING | STORED);
    let attributes = schema_builder.add_json_field("attributes", STORED | TEXT);
    let schema = schema_builder.build();

    // # Indexing documents
    let index = Index::create_in_ram(schema.clone());
    let mut index_writer: IndexWriter = index.writer(50_000_000)?;

    // Two click events. The second one also carries an `event_type` key inside
    // its json `attributes`, colliding with the name of the schema field.
    let event_payloads = [
        r#"{
        "timestamp": "2022-02-22T23:20:50.53Z",
        "event_type": "click",
        "attributes": {
            "target": "submit-button",
            "cart": {"product_id": 103},
            "description": "the best vacuum cleaner ever"
        }
    }"#,
        r#"{
        "timestamp": "2022-02-22T23:20:51.53Z",
        "event_type": "click",
        "attributes": {
            "target": "submit-button",
            "cart": {"product_id": 133},
            "description": "das keyboard",
            "event_type": "holiday-sale"
        }
    }"#,
    ];
    for payload in event_payloads {
        let event_doc = TantivyDocument::parse_json(&schema, payload)?;
        index_writer.add_document(event_doc)?;
    }
    index_writer.commit()?;

    let reader = index.reader()?;
    let searcher = reader.searcher();

    // # Default fields: event_type and attributes
    // By setting attributes as a default field it allows omitting attributes itself, e.g. "target",
    // instead of "attributes.target"
    let query_parser = QueryParser::for_index(&index, vec![event_type, attributes]);

    // Number of hits returned by a top-2 search (ordered by score) for `query_str`.
    let num_top_hits = |query_str: &str| -> tantivy::Result<usize> {
        let query = query_parser.parse_query(query_str)?;
        let hits = searcher.search(&*query, &TopDocs::with_limit(2).order_by_score())?;
        Ok(hits.len())
    };
    // Total number of documents matching `query_str`.
    let num_matches = |query_str: &str| -> tantivy::Result<usize> {
        let query = query_parser.parse_query(query_str)?;
        searcher.search(&*query, &Count)
    };

    assert_eq!(num_top_hits("target:submit-button")?, 2);
    assert_eq!(num_top_hits("target:submit")?, 2);
    assert_eq!(num_matches("cart.product_id:103")?, 1);
    assert_eq!(num_top_hits("click AND cart.product_id:133")?, 1);

    // The sub-fields in the json field marked as default field still need to be
    // explicitly addressed.
    assert_eq!(num_top_hits("click AND 133")?, 0);

    // Default json fields are ignored if they collide with the schema.
    assert_eq!(num_top_hits("event_type:holiday-sale")?, 0);

    // # Query via full attribute path
    // This only searches in our schema's `event_type` field.
    assert_eq!(num_top_hits("event_type:click")?, 2);

    // Default json fields can still be accessed by full path.
    assert_eq!(num_top_hits("attributes.event_type:holiday-sale")?, 1);

    Ok(())
}


================================================
FILE: examples/phrase_prefix_search.rs
================================================
use tantivy::collector::TopDocs;
use tantivy::query::QueryParser;
use tantivy::schema::*;
use tantivy::{doc, Index, IndexWriter, ReloadPolicy, Result};
use tempfile::TempDir;

fn main() -> Result<()> {
    // The index lives in a temporary directory for the duration of the example.
    let index_path = TempDir::new()?;

    // `add_text_field` hands back the `Field` handle of the field it declares.
    let mut schema_builder = Schema::builder();
    let title = schema_builder.add_text_field("title", TEXT | STORED);
    let body = schema_builder.add_text_field("body", TEXT);
    let schema = schema_builder.build();

    let index = Index::create_in_dir(&index_path, schema)?;

    let mut index_writer: IndexWriter = index.writer(50_000_000)?;

    let old_man_doc = doc!(
    title => "The Old Man and the Sea",
    body => "He was an old man who fished alone in a skiff in the Gulf Stream and he had gone \
            eighty-four days now without taking a fish.",
    );
    index_writer.add_document(old_man_doc)?;

    let mice_and_men_doc = doc!(
    title => "Of Mice and Men",
    body => "A few miles south of Soledad, the Salinas River drops in close to the hillside \
            bank and runs deep and green. The water is warm too, for it has slipped twinkling \
            over the yellow sands in the sunlight before reaching the narrow pool. On one \
            side of the river the golden foothill slopes curve up to the strong and rocky \
            Gabilan Mountains, but on the valley side the water is lined with trees—willows \
            fresh and green with every spring, carrying in their lower leaf junctures the \
            debris of the winter’s flooding; and sycamores with mottled, white, recumbent \
            limbs and branches that arch over the pool"
    );
    index_writer.add_document(mice_and_men_doc)?;

    // A multivalued field just needs to be repeated.
    let frankenstein_doc = doc!(
    title => "Frankenstein",
    title => "The Modern Prometheus",
    body => "You will rejoice to hear that no disaster has accompanied the commencement of an \
             enterprise which you have regarded with such evil forebodings.  I arrived here \
             yesterday, and my first task is to assure my dear sister of my welfare and \
             increasing confidence in the success of my undertaking."
    );
    index_writer.add_document(frankenstein_doc)?;

    index_writer.commit()?;

    let reader = index
        .reader_builder()
        .reload_policy(ReloadPolicy::OnCommitWithDelay)
        .try_into()?;

    let searcher = reader.searcher();

    let query_parser = QueryParser::for_index(&index, vec![title, body]);
    // The query matches documents containing the phrase "in the" followed by
    // some word starting with "su": "in the sunlight" and "in the success"
    // both match, whereas "in the Gulf Stream" does not.
    let query = query_parser.parse_query("\"in the su\"*")?;

    let top_docs = searcher.search(&query, &TopDocs::with_limit(10).order_by_score())?;

    // Gather the first stored title of every hit.
    let mut titles = Vec::new();
    for (_score, doc_address) in top_docs {
        let hit = searcher.doc::<TantivyDocument>(doc_address)?;
        let first_title = hit.get_first(title).and_then(|v| v.as_str()).unwrap();
        titles.push(first_title.to_owned());
    }
    // Sort so that the comparison does not depend on the order of the hits.
    titles.sort_unstable();
    assert_eq!(titles, ["Frankenstein", "Of Mice and Men"]);

    Ok(())
}


================================================
FILE: examples/pre_tokenized_text.rs
================================================
// # Pre-tokenized text example
//
// This example shows how to use pre-tokenized text. Sometimes you might
// want to index and search through text which is already split into
// tokens by some external tool.
//
// In this example we will:
// - use tantivy tokenizer to create tokens and load them directly into tantivy,
// - import tokenized text straight from json,
// - perform a search on documents with pre-tokenized text

use tantivy::collector::{Count, TopDocs};
use tantivy::query::TermQuery;
use tantivy::schema::*;
use tantivy::tokenizer::{PreTokenizedString, SimpleTokenizer, Token, TokenStream, Tokenizer};
use tantivy::{doc, Index, IndexWriter, ReloadPolicy};
use tempfile::TempDir;

/// Runs `SimpleTokenizer` over `text` and returns a copy of every token
/// produced by the resulting token stream, in emission order.
fn pre_tokenize_text(text: &str) -> Vec<Token> {
    let mut simple_tokenizer = SimpleTokenizer::default();
    let mut stream = simple_tokenizer.token_stream(text);
    // `advance` returns `false` once the stream is exhausted, which ends the iterator.
    std::iter::from_fn(|| stream.advance().then(|| stream.token().clone())).collect()
}

fn main() -> tantivy::Result<()> {
    let index_path = TempDir::new()?;

    // `add_text_field` hands back the `Field` handle of the field it declares.
    let mut schema_builder = Schema::builder();
    let title = schema_builder.add_text_field("title", TEXT | STORED);
    let body = schema_builder.add_text_field("body", TEXT);
    let schema = schema_builder.build();

    let index = Index::create_in_dir(&index_path, schema.clone())?;

    let mut index_writer: IndexWriter = index.writer(50_000_000)?;

    let title_text = "The Old Man and the Sea";
    let body_text = "He was an old man who fished alone in a skiff in the Gulf Stream";

    // Content of our first document.
    // A `PreTokenizedString` holds the original text along with its vector of tokens.
    let title_tok = PreTokenizedString {
        text: title_text.to_string(),
        tokens: pre_tokenize_text(title_text),
    };

    println!(
        "Original text: \"{}\" and tokens: {:?}",
        title_tok.text, title_tok.tokens
    );

    let body_tok = PreTokenizedString {
        text: body_text.to_string(),
        tokens: pre_tokenize_text(body_text),
    };

    // Build a document out of both `PreTokenizedString`s and hand it to the IndexWriter.
    index_writer.add_document(doc!(title => title_tok, body => body_tok))?;

    // Pretokenized text can also be fed as JSON
    let short_man_json = r#"{
        "title":[{
            "text":"The Old Man",
            "tokens":[
                {"offset_from":0,"offset_to":3,"position":0,"text":"The","position_length":1},
                {"offset_from":4,"offset_to":7,"position":1,"text":"Old","position_length":1},
                {"offset_from":8,"offset_to":11,"position":2,"text":"Man","position_length":1}
            ]
        }]
    }"#;

    index_writer.add_document(TantivyDocument::parse_json(&schema, short_man_json)?)?;

    // Let's commit changes
    index_writer.commit()?;

    // ... and now is the time to query our index

    let reader = index
        .reader_builder()
        .reload_policy(ReloadPolicy::OnCommitWithDelay)
        .try_into()?;

    let searcher = reader.searcher();

    // Runs a `TermQuery` for `token` on the title field and returns both the
    // top 2 hits (ordered by score) and the total number of matching docs.
    let search_title_token = |token: &str| {
        let term_query = TermQuery::new(
            Term::from_field_text(title, token),
            IndexRecordOption::Basic,
        );
        searcher.search(
            &term_query,
            &(TopDocs::with_limit(2).order_by_score(), Count),
        )
    };

    // We want the documents holding the token "Man".
    // Using PreTokenizedString means the tokens are stored as is, avoiding stemming
    // and lowercasing, which preserves full words in their original form.
    let (top_docs, count) = search_title_token("Man")?;

    assert_eq!(count, 2);

    // Now let's print out the results.
    // Note that the tokens are not stored along with the original text
    // in the document store
    for (_score, doc_address) in top_docs {
        let retrieved_doc = searcher.doc::<TantivyDocument>(doc_address)?;
        println!("{}", retrieved_doc.to_json(&schema));
    }

    // Contrary to the previous query, searching for the "man" term should
    // yield no results, as it's not one of the indexed tokens. SimpleTokenizer
    // only splits text on whitespace / punctuation.
    let (_top_docs, count) = search_title_token("man")?;

    assert_eq!(count, 0);

    Ok(())
}


================================================
FILE: examples/snippet.rs
================================================
// # Snippet example
//
// This example shows how to return a representative snippet of
// your hit result.
// A snippet is an extract of a target document, returned in HTML format.
// The keywords searched by the user are highlighted with a `<b>` tag.

// ---
// Importing tantivy...
use tantivy::collector::TopDocs;
use tantivy::query::QueryParser;
use tantivy::schema::*;
use tantivy::snippet::{Snippet, SnippetGenerator};
use tantivy::{doc, Index, IndexWriter};
use tempfile::TempDir;

fn main() -> tantivy::Result<()> {
    // The index is stored in a temporary directory for the sake of this example.
    let index_path = TempDir::new()?;

    // # Defining the schema
    let mut schema_builder = Schema::builder();
    let title = schema_builder.add_text_field("title", TEXT | STORED);
    let body = schema_builder.add_text_field("body", TEXT | STORED);

    // # Indexing documents
    let index = Index::create_in_dir(&index_path, schema_builder.build())?;

    let mut index_writer: IndexWriter = index.writer(50_000_000)?;

    // A single document is enough for this example.
    let mice_and_men_doc = doc!(
    title => "Of Mice and Men",
    body => "A few miles south of Soledad, the Salinas River drops in close to the hillside \
            bank and runs deep and green. The water is warm too, for it has slipped twinkling \
            over the yellow sands in the sunlight before reaching the narrow pool. On one \
            side of the river the golden foothill slopes curve up to the strong and rocky \
            Gabilan Mountains, but on the valley side the water is lined with trees—willows \
            fresh and green with every spring, carrying in their lower leaf junctures the \
            debris of the winter’s flooding; and sycamores with mottled, white, recumbent \
            limbs and branches that arch over the pool"
    );
    index_writer.add_document(mice_and_men_doc)?;
    index_writer.commit()?;

    let reader = index.reader()?;
    let searcher = reader.searcher();
    let query_parser = QueryParser::for_index(&index, vec![title, body]);
    let query = query_parser.parse_query("sycamore spring")?;

    let top_docs = searcher.search(&query, &TopDocs::with_limit(10).order_by_score())?;

    // The generator builds snippets of the `body` field for the parsed query.
    let snippet_generator = SnippetGenerator::create(&searcher, &*query, body)?;

    for (score, doc_address) in top_docs {
        let hit = searcher.doc::<TantivyDocument>(doc_address)?;
        let snippet = snippet_generator.snippet_from_doc(&hit);
        println!("Document score {score}:");
        let title_text = hit.get_first(title).unwrap().as_str().unwrap();
        println!("title: {}", title_text);
        // Built-in HTML rendering first, then our own markers.
        println!("snippet: {}", snippet.to_html());
        println!("custom highlighting: {}", highlight(snippet));
    }

    Ok(())
}

/// Renders the fragment of `snippet` with every highlighted range wrapped
/// between `" --> "` and `" <-- "` markers.
fn highlight(snippet: Snippet) -> String {
    let fragment = snippet.fragment();
    let mut rendered = String::new();
    // Offset in `fragment` of the first byte not yet copied to `rendered`.
    let mut cursor = 0;

    for range in snippet.highlighted() {
        // Text sitting between the previous highlight and this one.
        rendered.push_str(&fragment[cursor..range.start]);
        rendered.push_str(" --> ");
        rendered.push_str(&fragment[range.start..range.end]);
        rendered.push_str(" <-- ");
        cursor = range.end;
    }

    // Whatever remains after the last highlighted range.
    rendered.push_str(&fragment[cursor..]);
    rendered
}


================================================
FILE: examples/stop_words.rs
================================================
// # Stop Words Example
//
// This example covers the basic usage of stop words
// with tantivy
//
// We will :
// - define our schema
// - create an index in a directory
// - add a few stop words
// - index a few documents in our index

// ---
// Importing tantivy...
use tantivy::collector::TopDocs;
use tantivy::query::QueryParser;
use tantivy::schema::*;
use tantivy::tokenizer::*;
use tantivy::{doc, Index, IndexWriter};

fn main() -> tantivy::Result<()> {
    // this example assumes you understand the content in `basic_search`
    let mut schema_builder = Schema::builder();

    // Custom options describing how tantivy stores and processes the content
    // of a field in the index. The key point is that the tokenizer is set to
    // `stoppy`, which is defined and registered below.
    let stoppy_text_options = || {
        let indexing = TextFieldIndexing::default()
            .set_tokenizer("stoppy")
            .set_index_option(IndexRecordOption::WithFreqsAndPositions);
        TextOptions::default()
            .set_indexing_options(indexing)
            .set_stored()
    };

    // Both fields, title and body, use the same options.
    let title = schema_builder.add_text_field("title", stoppy_text_options());
    let body = schema_builder.add_text_field("body", stoppy_text_options());

    let schema = schema_builder.build();

    let index = Index::create_in_ram(schema.clone());

    // This tokenizer lowers all of the text (to help with stop word matching)
    // then removes all instances of `the` and `and` from the corpus
    let stop_words = vec![String::from("the"), String::from("and")];
    let stoppy_analyzer = TextAnalyzer::builder(SimpleTokenizer::default())
        .filter(LowerCaser)
        .filter(StopWordFilter::remove(stop_words))
        .build();

    index.tokenizers().register("stoppy", stoppy_analyzer);

    let mut index_writer: IndexWriter = index.writer(50_000_000)?;

    let old_man_doc = doc!(
    title => "The Old Man and the Sea",
    body => "He was an old man who fished alone in a skiff in the Gulf Stream and \
     he had gone eighty-four days now without taking a fish."
    );
    index_writer.add_document(old_man_doc)?;

    let mice_and_men_doc = doc!(
    title => "Of Mice and Men",
    body => "A few miles south of Soledad, the Salinas River drops in close to the hillside \
            bank and runs deep and green. The water is warm too, for it has slipped twinkling \
            over the yellow sands in the sunlight before reaching the narrow pool. On one \
            side of the river the golden foothill slopes curve up to the strong and rocky \
            Gabilan Mountains, but on the valley side the water is lined with trees—willows \
            fresh and green with every spring, carrying in their lower leaf junctures the \
            debris of the winter’s flooding; and sycamores with mottled, white, recumbent \
            limbs and branches that arch over the pool"
    );
    index_writer.add_document(mice_and_men_doc)?;

    let frankenstein_doc = doc!(
    title => "Frankenstein",
    body => "You will rejoice to hear that no disaster has accompanied the commencement of an \
             enterprise which you have regarded with such evil forebodings.  I arrived here \
             yesterday, and my first task is to assure my dear sister of my welfare and \
             increasing confidence in the success of my undertaking."
    );
    index_writer.add_document(frankenstein_doc)?;

    index_writer.commit()?;

    let reader = index.reader()?;
    let searcher = reader.searcher();

    let query_parser = QueryParser::for_index(&index, vec![title, body]);

    // stop words are applied on the query as well.
    // The following will be equivalent to `title:frankenstein`
    let query = query_parser.parse_query("title:\"the Frankenstein\"")?;
    let top_docs = searcher.search(&query, &TopDocs::with_limit(10).order_by_score())?;

    // Print every hit as json, preceded by its score.
    for (score, doc_address) in top_docs {
        let retrieved_doc = searcher.doc::<TantivyDocument>(doc_address)?;
        println!("\n==\nDocument score {score}:");
        println!("{}", retrieved_doc.to_json(&schema));
    }

    Ok(())
}


================================================
FILE: examples/warmer.rs
================================================
use std::cmp::Reverse;
use std::collections::{HashMap, HashSet};
use std::sync::{Arc, RwLock, Weak};

use tantivy::collector::TopDocs;
use tantivy::index::SegmentId;
use tantivy::query::QueryParser;
use tantivy::schema::{Schema, FAST, TEXT};
use tantivy::{
    doc, DocAddress, DocId, Index, IndexWriter, Opstamp, Searcher, SearcherGeneration,
    SegmentReader, Warmer,
};

// This example shows how warmers can be used to
// load values from an external source and
// tie their lifecycle to that of the index segments
// using the Warmer API.
//
// In this example, we assume an e-commerce search engine.

/// Identifier of a product; stored in the index as the `product_id` fast field.
type ProductId = u64;

/// Price of a product, as returned by a [`PriceFetcher`].
type Price = u32;

/// Source of prices living outside of the index.
pub trait PriceFetcher: Send + Sync + 'static {
    /// Returns the prices for the given product ids.
    ///
    /// Callers in this example consume the result positionally, so the returned
    /// vector is expected to hold one price per entry of `product_ids`, in the
    /// same order.
    fn fetch_prices(&self, product_ids: &[ProductId]) -> Vec<Price>;
}

/// Cache key for a segment: its id together with its delete opstamp (if any).
type SegmentKey = (SegmentId, Option<Opstamp>);

/// A per-segment price column that is filled from a [`PriceFetcher`]
/// rather than being stored in the index.
struct DynamicPriceColumn {
    /// Name of the fast field holding the product id of each document.
    field: String,
    /// Prices per segment; each vector is indexed by doc id.
    price_cache: RwLock<HashMap<SegmentKey, Arc<Vec<Price>>>>,
    /// External source the prices are loaded from.
    price_fetcher: Box<dyn PriceFetcher>,
}

impl DynamicPriceColumn {
    pub fn with_product_id_field<T: PriceFetcher>(field: String, price_fetcher: T) -> Self {
        DynamicPriceColumn {
            field,
            price_cache: Default::default(),
            price_fetcher: Box::new(price_fetcher),
        }
    }

    pub fn price_for_segment(&self, segment_reader: &SegmentReader) -> Option<Arc<Vec<Price>>> {
        let segment_key = (segment_reader.segment_id(), segment_reader.delete_opstamp());
        self.price_cache.read().unwrap().get(&segment_key).cloned()
    }
}
impl Warmer for DynamicPriceColumn {
    /// Fetches the prices of every segment of `searcher` and stores them in
    /// the cache, one vector per segment, indexed by doc id.
    ///
    /// Only alive documents are sent to the price fetcher; deleted documents
    /// get a price of `0`.
    fn warm(&self, searcher: &Searcher) -> tantivy::Result<()> {
        for segment in searcher.segment_readers() {
            let product_id_column = segment
                .fast_fields()
                .u64(&self.field)?
                .first_or_default_col(0);
            let alive_product_ids: Vec<ProductId> = segment
                .doc_ids_alive()
                .map(|doc| product_id_column.get_val(doc))
                .collect();

            // Prices come back in the order of the alive docs; they are consumed
            // positionally below.
            let mut fetched_prices = self
                .price_fetcher
                .fetch_prices(&alive_product_ids)
                .into_iter();

            let mut prices_by_doc: Vec<Price> = Vec::new();
            for doc in 0..segment.max_doc() {
                let price = if segment.is_deleted(doc) {
                    0
                } else {
                    fetched_prices.next().unwrap()
                };
                prices_by_doc.push(price);
            }

            let segment_key: SegmentKey = (segment.segment_id(), segment.delete_opstamp());
            let mut cache = self.price_cache.write().unwrap();
            cache.insert(segment_key, Arc::new(prices_by_doc));
        }

        Ok(())
    }

    /// Evicts every cache entry whose segment key does not belong to any of
    /// the given live searcher generations.
    fn garbage_collect(&self, live_generations: &[&SearcherGeneration]) {
        let mut live_keys: HashSet<SegmentKey> = HashSet::new();
        for generation in live_generations {
            for (&segment_id, &opstamp) in generation.segments() {
                live_keys.insert((segment_id, opstamp));
            }
        }

        let mut cache = self.price_cache.write().unwrap();
        cache.retain(|key, _| live_keys.contains(key));
    }
}

// For the sake of this example, the table is just an editable HashMap behind a RwLock.
// This map represents a mapping (ProductId -> Price).
//
// In practice, it could be fetching things from an external service, like a SQL table.
/// In-memory stand-in for an external price source.
///
/// The map sits behind an `Arc`, so clones share the same underlying table.
#[derive(Default, Clone)]
pub struct ExternalPriceTable {
    /// Current price of each known product.
    prices: Arc<RwLock<HashMap<ProductId, Price>>>,
}

impl ExternalPriceTable {
    /// Sets the price of `product_id`, replacing any previous value.
    pub fn update_price(&self, product_id: ProductId, price: Price) {
        let mut table = self.prices.write().unwrap();
        table.insert(product_id, price);
    }
}

impl PriceFetcher for ExternalPriceTable {
    /// Looks up each product id in the table, in order.
    ///
    /// Products missing from the table are given a price of `0`.
    fn fetch_prices(&self, product_ids: &[ProductId]) -> Vec<Price> {
        let table = self.prices.read().unwrap();

        let mut fetched: Vec<Price> = Vec::with_capacity(product_ids.len());
        for product_id in product_ids {
            fetched.push(table.get(product_id).copied().unwrap_or(0));
        }
        fetched
    }
}

/// Indexes three products, registers the price column as a warmer, and checks
/// that a search ordered by the externally-loaded price sees price changes
/// after the reader is reloaded.
fn main() -> tantivy::Result<()> {
    // Declaring our schema.
    let mut schema_builder = Schema::builder();
    // The product id is assumed to be a primary id for our external price source.
    let product_id = schema_builder.add_u64_field("product_id", FAST);
    let text = schema_builder.add_text_field("text", TEXT);
    let schema: Schema = schema_builder.build();

    let price_table = ExternalPriceTable::default();
    // The column gets a clone of the table; both handles share the same map.
    let price_dynamic_column = Arc::new(DynamicPriceColumn::with_product_id_field(
        "product_id".to_string(),
        price_table.clone(),
    ));
    price_table.update_price(OLIVE_OIL, 12);
    price_table.update_price(GLOVES, 13);
    price_table.update_price(SNEAKERS, 80);

    // Items are visible in the whole enclosing block, which is why these
    // constants can be used above their declaration.
    const OLIVE_OIL: ProductId = 323423;
    const GLOVES: ProductId = 3966623;
    const SNEAKERS: ProductId = 23222;

    let index = Index::create_in_ram(schema);
    let mut writer: IndexWriter = index.writer_with_num_threads(1, 15_000_000)?;
    writer.add_document(doc!(product_id=>OLIVE_OIL, text=>"cooking olive oil from greece"))?;
    writer.add_document(doc!(product_id=>GLOVES, text=>"kitchen gloves, perfect for cooking"))?;
    writer.add_document(doc!(product_id=>SNEAKERS, text=>"uber sweet sneakers"))?;
    writer.commit()?;

    // Warmers are handed to the reader as weak references; the strong `Arc` is
    // kept alive by the `score_by_price` closure below.
    let warmers = vec![Arc::downgrade(&price_dynamic_column) as Weak<dyn Warmer>];
    let reader = index.reader_builder().warmers(warmers).try_into()?;

    let query_parser = QueryParser::for_index(&index, vec![text]);
    let query = query_parser.parse_query("cooking")?;

    let searcher = reader.searcher();
    // For each segment, look up its cached prices once, then score every doc
    // with `Reverse(price)`.
    let score_by_price = move |segment_reader: &SegmentReader| {
        let price = price_dynamic_column
            .price_for_segment(segment_reader)
            .unwrap();
        move |doc_id: DocId| Reverse(price[doc_id as usize])
    };

    // NOTE(review): despite the name of this binding, the assertions below show
    // the lowest price coming first (scores are wrapped in `Reverse`).
    let most_expensive_first = TopDocs::with_limit(10).order_by(score_by_price);

    let hits = searcher.search(&query, &most_expensive_first)?;
    assert_eq!(
        &hits,
        &[
            (
                Reverse(12u32),
                DocAddress {
                    segment_ord: 0,
                    doc_id: 0u32
                }
            ),
            (
                Reverse(13u32),
                DocAddress {
                    segment_ord: 0,
                    doc_id: 1u32
                }
            ),
        ]
    );

    // Olive oil just got more expensive!
    price_table.update_price(OLIVE_OIL, 15);

    // Price updates are picked up on `reload`.
    //
    // Be careful here though!...
    // You may have spotted that we are still using the same `Searcher`.
    // It sees the new prices because the cache is looked up by segment id and
    // delete opstamp, and the warmer stores the refreshed prices under that key.
    //
    // It is up to the `Warmer` implementer to decide how
    // to control this behavior.

    reader.reload()?;

    let hits_with_new_prices = searcher.search(&query, &most_expensive_first)?;
    assert_eq!(
        &hits_with_new_prices,
        &[
            (
                Reverse(13u32),
                DocAddress {
                    segment_ord: 0,
                    doc_id: 1u32
                }
            ),
            (
                Reverse(15u32),
                DocAddress {
                    segment_ord: 0,
                    doc_id: 0u32
                }
            ),
        ]
    );

    Ok(())
}


================================================
FILE: ownedbytes/Cargo.toml
================================================
[package]
authors = ["Paul Masurel <paul@quickwit.io>", "Pascal Seitz <pascal@quickwit.io>"]
name = "ownedbytes"
version = "0.9.0"
edition = "2021"
description = "Expose data as static slice"
license = "MIT"
documentation = "https://docs.rs/ownedbytes/"
homepage = "https://github.com/quickwit-oss/tantivy"
repository = "https://github.com/quickwit-oss/tantivy"

# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html

[dependencies]
stable_deref_trait = "1.2.0"


================================================
FILE: ownedbytes/src/lib.rs
================================================
use std::ops::{Deref, Range};
use std::sync::Arc;
use std::{fmt, io};

pub use stable_deref_trait::StableDeref;

/// An `OwnedBytes` simply wraps an object that owns a slice of data and exposes
/// this data as a slice.
///
/// The backing object is required to be `StableDeref`.
///
/// Cloning is cheap: it copies the slice reference and clones the `Arc`
/// holding the backing object.
#[derive(Clone)]
pub struct OwnedBytes {
    /// View over (a part of) the bytes of the backing object.
    ///
    /// The `'static` lifetime is obtained through an unchecked cast in
    /// [`OwnedBytes::new`]; the bytes are actually borrowed from
    /// `box_stable_deref`.
    data: &'static [u8],
    /// Shared handle on the backing object `data` points into.
    box_stable_deref: Arc<dyn Deref<Target = [u8]> + Sync + Send>,
}

impl OwnedBytes {
    /// Creates an empty `OwnedBytes`.
    pub fn empty() -> OwnedBytes {
        OwnedBytes::new(&[][..])
    }

    /// Creates an `OwnedBytes` instance given a `StableDeref` object.
    pub fn new<T: StableDeref + Deref<Target = [u8]> + 'static + Send + Sync>(
        data_holder: T,
    ) -> OwnedBytes {
        let box_stable_deref = Arc::new(data_holder);
        let bytes: &[u8] = box_stable_deref.deref();
        let data = unsafe { &*(bytes as *const [u8]) };
        OwnedBytes {
            data,
            box_stable_deref,
        }
    }

    /// creates a fileslice that is just a view over a slice of the data.
    #[must_use]
    #[inline]
    pub fn slice(&self, range: Range<usize>) -> Self {
        OwnedBytes {
            data: &self.data[range],
            box_stable_deref: self.box_stable_deref.clone(),
        }
    }

    /// Returns the underlying slice of data.
    /// `Deref` and `AsRef` are also available.
    #[inline]
    pub fn as_slice(&self) -> &[u8] {
        self.data
    }

    /// Returns the len of the slice.
    #[inline]
    pub fn len(&self) -> usize {
        self.data.len()
    }

    /// Returns true iff this `OwnedBytes` is empty.
    #[inline]
    pub fn is_empty(&self) -> bool {
        self.data.is_empty()
    }

    /// Splits the OwnedBytes into two OwnedBytes `(left, right)`.
    ///
    /// Left will hold `split_len` bytes.
    ///
    /// This operation is cheap and does not require to copy any memory.
    /// On the other hand, both `left` and `right` retain a handle over
    /// the entire slice of memory. In other words, the memory will only
    /// be released when both left and right are dropped.
    #[inline]
    #[must_use]
    pub fn split(self, split_len: usize) -> (OwnedBytes, OwnedBytes) {
        let (left_data, right_data) = self.data.split_at(split_len);
        let right_box_stable_deref = self.box_stable_deref.clone();
        let left = OwnedBytes {
            data: left_data,
            box_stable_deref: self.box_stable_deref,
        };
        let right = OwnedBytes {
            data: right_data,
            box_stable_deref: right_box_stable_deref,
        };
        (left, right)
    }

    /// Splits the OwnedBytes into two OwnedBytes `(left, right)`.
    ///
    /// Right will hold `split_len` bytes.
    ///
    /// This operation is cheap and does not require to copy any memory.
    /// On the other hand, both `left` and `right` retain a handle over
    /// the entire slice of memory. In other words, the memory will only
    /// be released when both left and right are dropped.
    #[inline]
    #[must_use]
    pub fn rsplit(self, split_len: usize) -> (OwnedBytes, OwnedBytes) {
        let data_len = self.data.len();
        self.split(data_len - split_len)
    }

    /// Splits the right part of the `OwnedBytes` at the given offset.
    ///
    /// `self` is truncated to `split_len`, left with the remaining bytes.
    pub fn split_off(&mut self, split_len: usize) -> OwnedBytes {
        let (left, right) = self.data.split_at(split_len);
        let right_box_stable_deref = self.box_stable_deref.clone();
        let right_piece = OwnedBytes {
            data: right,
            box_stable_deref: right_box_stable_deref,
        };
        self.data = left;
        right_piece
    }

    /// Drops the left most `advance_len` bytes.
    #[inline]
    pub fn advance(&mut self, advance_len: usize) -> &[u8] {
        let (data, rest) = self.data.split_at(advance_len);
        self.data = rest;
        data
    }

    /// Reads an `u8` from the `OwnedBytes` and advance by one byte.
    #[inline]
    pub fn read_u8(&mut self) -> u8 {
        self.advance(1)[0]
    }

    #[inline]
    fn read_n<const N: usize>(&mut self) -> [u8; N] {
        self.advance(N).try_into().unwrap()
    }

    /// Reads an `u32` encoded as little-endian from the `OwnedBytes` and advance by 4 bytes.
    #[inline]
    pub fn read_u32(&mut self) -> u32 {
        u32::from_le_bytes(self.read_n())
    }

    /// Reads an `u64` encoded as little-endian from the `OwnedBytes` and advance by 8 bytes.
    #[inline]
    pub fn read_u64(&mut self) -> u64 {
        u64::from_le_bytes(self.read_n())
    }
}

impl fmt::Debug for OwnedBytes {
    /// Prints at most the first 10 bytes, followed by the total length, so
    /// that the debug string stays short.
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        const MAX_SHOWN: usize = 10;
        let total = self.len();
        let shown = &self.as_slice()[..total.min(MAX_SHOWN)];
        write!(f, "OwnedBytes({shown:?}, len={})", total)
    }
}

impl PartialEq for OwnedBytes {
    fn eq(&self, other: &OwnedBytes) -> bool {
        self.as_slice() == other.as_slice()
    }
}

impl Eq for OwnedBytes {}

impl PartialEq<[u8]> for OwnedBytes {
    fn eq(&self, other: &[u8]) -> bool {
        self.as_slice() == other
    }
}

impl PartialEq<str> for OwnedBytes {
    fn eq(&self, other: &str) -> bool {
        self.as_slice() == other.as_bytes()
    }
}

impl<'a, T: ?Sized> PartialEq<&'a T> for OwnedBytes
where OwnedBytes: PartialEq<T>
{
    fn eq(&self, other: &&'a T) -> bool {
        *self == **other
    }
}

/// Gives access to all the read-only slice methods on the viewed bytes.
impl Deref for OwnedBytes {
    type Target = [u8];

    #[inline]
    fn deref(&self) -> &Self::Target {
        self.data
    }
}

/// Borrows the viewed bytes.
impl AsRef<[u8]> for OwnedBytes {
    #[inline]
    fn as_ref(&self) -> &[u8] {
        self.data
    }
}

/// Reading consumes the bytes from the front of the view. None of these
/// operations performs actual I/O.
impl io::Read for OwnedBytes {
    /// Copies as many bytes as fit into `buf` and returns that count.
    #[inline]
    fn read(&mut self, buf: &mut [u8]) -> io::Result<usize> {
        let available = self.data.len();
        if available < buf.len() {
            // Not enough data to fill `buf`: hand over everything that is left.
            buf[..available].copy_from_slice(self.data);
            self.data = &[];
            return Ok(available);
        }
        let wanted = buf.len();
        buf.copy_from_slice(self.advance(wanted));
        Ok(wanted)
    }

    /// Appends all the remaining bytes to `buf`, leaving `self` empty.
    #[inline]
    fn read_to_end(&mut self, buf: &mut Vec<u8>) -> io::Result<usize> {
        let drained: &'static [u8] = std::mem::take(&mut self.data);
        buf.extend_from_slice(drained);
        Ok(drained.len())
    }

    /// Fills `buf` entirely, or fails with `UnexpectedEof` if too few bytes are left.
    ///
    /// On failure the remaining bytes have still been consumed.
    #[inline]
    fn read_exact(&mut self, buf: &mut [u8]) -> io::Result<()> {
        if self.read(buf)? == buf.len() {
            Ok(())
        } else {
            Err(io::Error::new(
                io::ErrorKind::UnexpectedEof,
                "failed to fill whole buffer",
            ))
        }
    }
}

// Unit tests for `OwnedBytes`. All fixtures are static byte strings.
#[cfg(test)]
mod tests {
    use std::io::{self, Read};

    use super::OwnedBytes;

    // The debug output shows at most 10 bytes but always the full length.
    #[test]
    fn test_owned_bytes_debug() {
        let short_bytes = OwnedBytes::new(b"abcd".as_ref());
        assert_eq!(
            format!("{short_bytes:?}"),
            "OwnedBytes([97, 98, 99, 100], len=4)"
        );
        let medium_bytes = OwnedBytes::new(b"abcdefghi".as_ref());
        assert_eq!(
            format!("{medium_bytes:?}"),
            "OwnedBytes([97, 98, 99, 100, 101, 102, 103, 104, 105], len=9)"
        );
        let long_bytes = OwnedBytes::new(b"abcdefghijklmnopq".as_ref());
        assert_eq!(
            format!("{long_bytes:?}"),
            "OwnedBytes([97, 98, 99, 100, 101, 102, 103, 104, 105, 106], len=17)"
        );
    }

    // Successive `read_exact` calls consume the data from the front.
    #[test]
    fn test_owned_bytes_read() -> io::Result<()> {
        let mut bytes = OwnedBytes::new(b"abcdefghiklmnopqrstuvwxyz".as_ref());
        {
            let mut buf = [0u8; 5];
            bytes.read_exact(&mut buf[..]).unwrap();
            assert_eq!(&buf, b"abcde");
            assert_eq!(bytes.as_slice(), b"fghiklmnopqrstuvwxyz")
        }
        {
            let mut buf = [0u8; 2];
            bytes.read_exact(&mut buf[..]).unwrap();
            assert_eq!(&buf, b"fg");
            assert_eq!(bytes.as_slice(), b"hiklmnopqrstuvwxyz")
        }
        Ok(())
    }

    // Reading exactly the remaining length empties the bytes; a further read
    // returns 0 and leaves the buffer untouched.
    #[test]
    fn test_owned_bytes_read_right_at_the_end() -> io::Result<()> {
        let mut bytes = OwnedBytes::new(b"abcde".as_ref());
        let mut buf = [0u8; 5];
        assert_eq!(bytes.read(&mut buf[..]).unwrap(), 5);
        assert_eq!(&buf, b"abcde");
        assert_eq!(bytes.as_slice(), b"");
        assert_eq!(bytes.read(&mut buf[..]).unwrap(), 0);
        assert_eq!(&buf, b"abcde");
        Ok(())
    }
    // A buffer larger than the data is only partially filled.
    #[test]
    fn test_owned_bytes_read_incomplete() -> io::Result<()> {
        let mut bytes = OwnedBytes::new(b"abcde".as_ref());
        let mut buf = [0u8; 7];
        assert_eq!(bytes.read(&mut buf[..]).unwrap(), 5);
        assert_eq!(&buf[..5], b"abcde");
        assert_eq!(bytes.read(&mut buf[..]).unwrap(), 0);
        Ok(())
    }

    #[test]
    fn test_owned_bytes_read_to_end() -> io::Result<()> {
        let mut bytes = OwnedBytes::new(b"abcde".as_ref());
        let mut buf = Vec::new();
        bytes.read_to_end(&mut buf)?;
        assert_eq!(buf.as_slice(), b"abcde".as_ref());
        Ok(())
    }

    #[test]
    fn test_owned_bytes_read_u8() -> io::Result<()> {
        let mut bytes = OwnedBytes::new(b"\xFF".as_ref());
        assert_eq!(bytes.read_u8(), 255);
        assert_eq!(bytes.len(), 0);
        Ok(())
    }

    // The lowest byte comes first (little-endian), hence `u64::MAX - 255`.
    #[test]
    fn test_owned_bytes_read_u64() -> io::Result<()> {
        let mut bytes = OwnedBytes::new(b"\0\xFF\xFF\xFF\xFF\xFF\xFF\xFF".as_ref());
        assert_eq!(bytes.read_u64(), u64::MAX - 255);
        assert_eq!(bytes.len(), 0);
        Ok(())
    }

    #[test]
    fn test_owned_bytes_split() {
        let bytes = OwnedBytes::new(b"abcdefghi".as_ref());
        let (left, right) = bytes.split(3);
        assert_eq!(left.as_slice(), b"abc");
        assert_eq!(right.as_slice(), b"defghi");
    }

    // Splitting at 0 and at the full length yields one empty half.
    #[test]
    fn test_owned_bytes_split_boundary() {
        let bytes = OwnedBytes::new(b"abcdefghi".as_ref());
        {
            let (left, right) = bytes.clone().split(0);
            assert_eq!(left.as_slice(), b"");
            assert_eq!(right.as_slice(), b"abcdefghi");
        }
        {
            let (left, right) = bytes.split(9);
            assert_eq!(left.as_slice(), b"abcdefghi");
            assert_eq!(right.as_slice(), b"");
        }
    }

    // `split_off` returns the right part and keeps the left part in place.
    #[test]
    fn test_split_off() {
        let mut data = OwnedBytes::new(b"abcdef".as_ref());
        assert_eq!(data, "abcdef");
        assert_eq!(data.split_off(2), "cdef");
        assert_eq!(data, "ab");
        assert_eq!(data.split_off(1), "b");
        assert_eq!(data, "a");
    }
}


================================================
FILE: query-grammar/Cargo.toml
================================================
[package]
name = "tantivy-query-grammar"
version = "0.25.0"
authors = ["Paul Masurel <paul.masurel@gmail.com>"]
license = "MIT"
categories = ["database-implementations", "data-structures"]
description = """Search engine library"""
homepage = "https://github.com/quickwit-oss/tantivy"
repository = "https://github.com/quickwit-oss/tantivy"
readme = "README.md"
keywords = ["search", "information", "retrieval"]
edition = "2024"

[dependencies]
nom = "7"
serde = { version = "1.0.219", features = ["derive"] }
serde_json = "1.0.140"
ordered-float = "5.0.0"
fnv = "1.0.7"


================================================
FILE: query-grammar/README.md
================================================
# Tantivy Query Grammar

This crate is used by tantivy to parse queries.


================================================
FILE: query-grammar/src/infallible.rs
================================================
//! nom combinators for infallible operations

use std::convert::Infallible;

use nom::{AsChar, IResult, InputLength, InputTakeAtPosition};
use serde::Serialize;

pub(crate) type ErrorList = Vec<LenientErrorInternal>;
pub(crate) type JResult<I, O> = IResult<I, (O, ErrorList), Infallible>;

/// An error, with an end-of-string based offset.
///
/// It is turned into a public [`LenientError`] by [`LenientError::from_internal`].
#[derive(Debug)]
pub(crate) struct LenientErrorInternal {
    /// Length of the input that was still left to parse when the error was recorded.
    pub pos: usize,
    /// Human readable description of the problem.
    pub message: String,
}

/// A recoverable error and the position it happened at.
#[derive(Debug, PartialEq, Serialize)]
#[serde(rename_all = "snake_case")]
pub struct LenientError {
    /// Offset of the error, counted from the start of the query.
    pub pos: usize,
    /// Human readable description of the problem.
    pub message: String,
}

impl LenientError {
    pub(crate) fn from_internal(internal: LenientErrorInternal, str_len: usize) -> LenientError {
        LenientError {
            pos: str_len - internal.pos,
            message: internal.message,
        }
    }
}

/// Extracts the success value of the result of an infallible parser.
///
/// Callers only pass results of parsers that are not expected to fail;
/// reaching the error case is treated as a bug.
fn unwrap_infallible<T>(res: Result<T, nom::Err<Infallible>>) -> T {
    let Ok(value) = res else {
        unreachable!()
    };
    value
}

// Once rfcs#1733 (trait aliases) gets stabilized, this could make things clearer:
// trait InfallibleParser<I, O> = nom::Parser<I, (O, ErrorList), std::convert::Infallible>;

/// Infallible flavour of nom's `opt`: runs `f` and yields `Some(output)` on
/// success, or `None` with the input left untouched on failure.
///
/// No error is ever reported. It is less generic than nom's version, which
/// eases type resolution in the rest of the code.
pub(crate) fn opt_i<I: Clone, O, F>(mut f: F) -> impl FnMut(I) -> JResult<I, Option<O>>
where F: nom::Parser<I, O, nom::error::Error<I>> {
    move |input: I| {
        let untouched = input.clone();
        let (rest, output) = match f.parse(input) {
            Ok((rest, value)) => (rest, Some(value)),
            Err(_) => (untouched, None),
        };
        Ok((rest, (output, Vec::new())))
    }
}

pub(crate) fn opt_i_err<'a, I: Clone + InputLength, O, F>(
    mut f: F,
    message: impl ToString + 'a,
) -> impl FnMut(I) -> JResult<I, Option<O>> + 'a
where
    F: nom::Parser<I, O, nom::error::Error<I>> + 'a,
{
    move |input: I| {
        let i = input.clone();
        match f.parse(input) {
            Ok((i, o)) => Ok((i, (Some(o), Vec::new()))),
            Err(_) => {
                let errs = vec![LenientErrorInternal {
                    pos: i.input_len(),
                    message: message.to_string(),
                }];
                Ok((i, (None, errs)))
            }
        }
    }
}

/// Consumes zero or more whitespace characters and returns them.
pub(crate) fn space0_infallible<T>(input: T) -> JResult<T, T>
where
    T: InputTakeAtPosition + Clone,
    <T as InputTakeAtPosition>::Item: AsChar + Clone,
{
    let (rest, (spaces, errors)) = opt_i(nom::character::complete::multispace0)(input)?;
    Ok((rest, (spaces.expect("multispace0 can't fail"), errors)))
}

/// Consumes one or more whitespace characters.
///
/// If there is no whitespace at all, `None` is returned together with a
/// "missing space" error at the current position.
pub(crate) fn space1_infallible<T>(input: T) -> JResult<T, Option<T>>
where
    T: InputTakeAtPosition + Clone + InputLength,
    <T as InputTakeAtPosition>::Item: AsChar + Clone,
{
    let (rest, (spaces, mut errors)) = opt_i(nom::character::complete::multispace1)(input)?;
    if spaces.is_none() {
        errors.push(LenientErrorInternal {
            pos: rest.input_len(),
            message: "missing space".to_string(),
        });
    }
    Ok((rest, (spaces, errors)))
}

/// Adapts an infallible parser so it can be used where a regular nom parser
/// with error type `E` is expected.
///
/// The list of lenient errors produced by `f` is discarded.
pub(crate) fn fallible<I, O, E: nom::error::ParseError<I>, F>(
    mut f: F,
) -> impl FnMut(I) -> IResult<I, O, E>
where F: nom::Parser<I, (O, ErrorList), Infallible> {
    use nom::Err;
    move |input: I| match f.parse(input) {
        Ok((input, (output, _err))) => Ok((input, output)),
        Err(Err::Incomplete(needed)) => Err(Err::Incomplete(needed)),
        // old versions don't understand this is uninhabited and need the empty match to help,
        // newer versions warn because this arm is unreachable (which it is indeed).
        Err(Err::Error(val)) | Err(Err::Failure(val)) => match val {},
    }
}

/// Runs `first` then `second`, and keeps only the output of `first`.
///
/// The errors of both parsers are reported, in order.
pub(crate) fn terminated_infallible<I, O1, O2, F, G>(
    mut first: F,
    mut second: G,
) -> impl FnMut(I) -> JResult<I, O1>
where
    F: nom::Parser<I, (O1, ErrorList), Infallible>,
    G: nom::Parser<I, (O2, ErrorList), Infallible>,
{
    move |input: I| {
        let (after_first, (kept, mut errors)) = first.parse(input)?;
        let (after_second, (_, second_errors)) = second.parse(after_first)?;
        errors.extend(second_errors);
        Ok((after_second, (kept, errors)))
    }
}

/// Runs `first`, `second` and `third` in sequence, and keeps only the output
/// of `second`.
///
/// The errors of the three parsers are reported, in order.
pub(crate) fn delimited_infallible<I, O1, O2, O3, F, G, H>(
    mut first: F,
    mut second: G,
    mut third: H,
) -> impl FnMut(I) -> JResult<I, O2>
where
    F: nom::Parser<I, (O1, ErrorList), Infallible>,
    G: nom::Parser<I, (O2, ErrorList), Infallible>,
    H: nom::Parser<I, (O3, ErrorList), Infallible>,
{
    move |input: I| {
        let (after_first, (_, mut errors)) = first.parse(input)?;
        let (after_second, (kept, second_errors)) = second.parse(after_first)?;
        errors.extend(second_errors);
        let (after_third, (_, third_errors)) = third.parse(after_second)?;
        errors.extend(third_errors);
        Ok((after_third, (kept, errors)))
    }
}

// Parse nothing. Just a lazy way to not implement terminated/preceded and use delimited instead
pub(crate) fn nothing(i: &str) -> JResult<&str, ()> {
    Ok((i, ((), Vec::new())))
}

/// Helper trait implemented for tuples of infallible parsers, so that
/// [`tuple_infallible`] can run them in sequence.
pub(crate) trait TupleInfallible<I, O> {
    /// Parses the input and returns a tuple of results of each parser.
    fn parse(&mut self, input: I) -> JResult<I, O>;
}

/// A tuple of a single parser: its output is simply wrapped in a 1-tuple.
impl<Input, Output, F: nom::Parser<Input, (Output, ErrorList), Infallible>>
    TupleInfallible<Input, (Output,)> for (F,)
{
    fn parse(&mut self, input: Input) -> JResult<Input, (Output,)> {
        let (rest, (output, errors)) = self.0.parse(input)?;
        Ok((rest, ((output,), errors)))
    }
}

// These macros are heavily copied from nom, with some minor adaptations for our type.
//
// `tuple_trait!` takes a list of `ParserType OutputType` pairs and implements
// `TupleInfallible` for every prefix of that list holding at least two pairs.
// The `__impl` rules carry the prefix handled so far before the `;` and the
// pairs still to be added after it.
macro_rules! tuple_trait(
  ($name1:ident $ty1:ident, $name2: ident $ty2:ident, $($name:ident $ty:ident),*) => (
    tuple_trait!(__impl $name1 $ty1, $name2 $ty2; $($name $ty),*);
  );
  (__impl $($name:ident $ty: ident),+; $name1:ident $ty1:ident, $($name2:ident $ty2:ident),*) => (
    tuple_trait_impl!($($name $ty),+);
    tuple_trait!(__impl $($name $ty),+ , $name1 $ty1; $($name2 $ty2),*);
  );
  (__impl $($name:ident $ty: ident),+; $name1:ident $ty1:ident) => (
    tuple_trait_impl!($($name $ty),+);
    tuple_trait_impl!($($name $ty),+, $name1 $ty1);
  );
);

// Implements `TupleInfallible` for one tuple of parsers, given its list of
// `ParserType OutputType` pairs. The parsers are run in order by
// `tuple_trait_inner!`, and their errors are gathered in a single list.
macro_rules! tuple_trait_impl(
  ($($name:ident $ty: ident),+) => (
    impl<
      Input: Clone, $($ty),+ ,
      $($name: nom::Parser<Input, ($ty, ErrorList), Infallible>),+
    > TupleInfallible<Input, ( $($ty),+ )> for ( $($name),+ ) {

      fn parse(&mut self, input: Input) -> JResult<Input, ( $($ty),+ )> {
        let mut error_list = Vec::new();
        tuple_trait_inner!(0, self, input, (), error_list, $($name)+)
      }
    }
  );
);

// Recursive body of `TupleInfallible::parse` for tuples.
//
// Arguments: the index of the tuple field to run, the tuple, the current input,
// the outputs gathered so far, the error list, and the parser names left to
// process (only used to count the remaining steps).
//
// - first rule: first parser, with more to come (no output gathered yet);
// - second rule: a parser in the middle;
// - third rule: last parser, which builds the final result.
macro_rules! tuple_trait_inner(
  ($it:tt, $self:expr_2021, $input:expr_2021, (), $error_list:expr_2021, $head:ident $($id:ident)+) => ({
    let (i, (o, mut err)) = $self.$it.parse($input.clone())?;
    $error_list.append(&mut err);

    succ!($it, tuple_trait_inner!($self, i, ( o ), $error_list, $($id)+))
  });
  ($it:tt, $self:expr_2021, $input:expr_2021, ($($parsed:tt)*), $error_list:expr_2021, $head:ident $($id:ident)+) => ({
    let (i, (o, mut err)) = $self.$it.parse($input.clone())?;
    $error_list.append(&mut err);

    succ!($it, tuple_trait_inner!($self, i, ($($parsed)* , o), $error_list, $($id)+))
  });
  ($it:tt, $self:expr_2021, $input:expr_2021, ($($parsed:tt)*), $error_list:expr_2021, $head:ident) => ({
    let (i, (o, mut err)) = $self.$it.parse($input.clone())?;
    $error_list.append(&mut err);

    Ok((i, (($($parsed)* , o), $error_list)))
  });
);

// "Successor" helper: `succ!(N, mac!(args))` expands to `mac!(N + 1, args)`.
//
// Macros cannot do arithmetic on literals, so every step from 0 to 20 is
// spelled out. It is used to walk through the fields of a tuple by index.
macro_rules! succ (
  (0, $submac:ident ! ($($rest:tt)*)) => ($submac!(1, $($rest)*));
  (1, $submac:ident ! ($($rest:tt)*)) => ($submac!(2, $($rest)*));
  (2, $submac:ident ! ($($rest:tt)*)) => ($submac!(3, $($rest)*));
  (3, $submac:ident ! ($($rest:tt)*)) => ($submac!(4, $($rest)*));
  (4, $submac:ident ! ($($rest:tt)*)) => ($submac!(5, $($rest)*));
  (5, $submac:ident ! ($($rest:tt)*)) => ($submac!(6, $($rest)*));
  (6, $submac:ident ! ($($rest:tt)*)) => ($submac!(7, $($rest)*));
  (7, $submac:ident ! ($($rest:tt)*)) => ($submac!(8, $($rest)*));
  (8, $submac:ident ! ($($rest:tt)*)) => ($submac!(9, $($rest)*));
  (9, $submac:ident ! ($($rest:tt)*)) => ($submac!(10, $($rest)*));
  (10, $submac:ident ! ($($rest:tt)*)) => ($submac!(11, $($rest)*));
  (11, $submac:ident ! ($($rest:tt)*)) => ($submac!(12, $($rest)*));
  (12, $submac:ident ! ($($rest:tt)*)) => ($submac!(13, $($rest)*));
  (13, $submac:ident ! ($($rest:tt)*)) => ($submac!(14, $($rest)*));
  (14, $submac:ident ! ($($rest:tt)*)) => ($submac!(15, $($rest)*));
  (15, $submac:ident ! ($($rest:tt)*)) => ($submac!(16, $($rest)*));
  (16, $submac:ident ! ($($rest:tt)*)) => ($submac!(17, $($rest)*));
  (17, $submac:ident ! ($($rest:tt)*)) => ($submac!(18, $($rest)*));
  (18, $submac:ident ! ($($rest:tt)*)) => ($submac!(19, $($rest)*));
  (19, $submac:ident ! ($($rest:tt)*)) => ($submac!(20, $($rest)*));
  (20, $submac:ident ! ($($rest:tt)*)) => ($submac!(21, $($rest)*));
);

// Implements `TupleInfallible` for tuples of 2 up to 21 parsers.
tuple_trait!(FnA A, FnB B, FnC C, FnD D, FnE E, FnF F, FnG G, FnH H, FnI I, FnJ J, FnK K, FnL L,
  FnM M, FnN N, FnO O, FnP P, FnQ Q, FnR R, FnS S, FnT T, FnU U);

// Special case: implement `TupleInfallible` for `()`, the unit type.
// This can come up in macros which accept a variable number of arguments.
// Literally, `()` is an empty tuple, so it should simply parse nothing.
impl<I> TupleInfallible<I, ()> for () {
    fn parse(&mut self, input: I) -> JResult<I, ()> {
        Ok((input, ((), Vec::new())))
    }
}

/// Turns a tuple of infallible parsers into a single parser that runs them in
/// sequence and returns the tuple of their outputs.
pub(crate) fn tuple_infallible<I, O, List: TupleInfallible<I, O>>(
    mut l: List,
) -> impl FnMut(I) -> JResult<I, O> {
    move |input: I| <List as TupleInfallible<I, O>>::parse(&mut l, input)
}

/// Parses a list of elements (`f`) separated by `sep`.
///
/// The first element is always parsed and kept. After that, a separator
/// followed by an element is parsed repeatedly, until the element parser no
/// longer consumes any input. That last attempt is thrown away entirely: its
/// separator, its element and their errors are dropped, and the input is
/// rewound to the end of the last accepted element.
pub(crate) fn separated_list_infallible<I, O, O2, F, G>(
    mut sep: G,
    mut f: F,
) -> impl FnMut(I) -> JResult<I, Vec<O>>
where
    I: Clone + InputLength,
    F: nom::Parser<I, (O, ErrorList), Infallible>,
    G: nom::Parser<I, (O2, ErrorList), Infallible>,
{
    move |i: I| {
        let (mut remaining, (first_elem, mut errors)) = unwrap_infallible(f.parse(i.clone()));
        let mut elements: Vec<O> = vec![first_elem];

        loop {
            let (after_sep, (_, sep_errors)) = unwrap_infallible(sep.parse(remaining.clone()));
            let len_before_elem = after_sep.input_len();

            let (after_elem, (elem, elem_errors)) =
                unwrap_infallible(f.parse(after_sep.clone()));

            // Guard against infinite loops: an element which consumed nothing
            // is not an element, and marks the end of the list.
            if after_elem.input_len() == len_before_elem {
                return Ok((remaining, (elements, errors)));
            }
            elements.push(elem);
            errors.extend(sep_errors);
            errors.extend(elem_errors);
            remaining = after_elem;
        }
    }
}

/// Helper trait implemented for tuples of `(condition, parser)` pairs, used by
/// [`alt_infallible`].
pub(crate) trait Alt<I, O> {
    /// Tests each parser in the tuple and returns the result of the first one that succeeds
    ///
    /// Returns `None` if no condition matched.
    fn choice(&mut self, input: I) -> Option<JResult<I, O>>;
}

// `alt_trait!` takes a list of `ConditionType ParserType` pairs and implements
// `Alt` for every non-empty prefix of that list.
// The `__impl` rules carry the prefix handled so far before the `;` and the
// pairs still to be added after it.
macro_rules! alt_trait(
  ($first_cond:ident $first:ident, $($id_cond:ident $id: ident),+) => (
    alt_trait!(__impl $first_cond $first; $($id_cond $id),+);
  );
  (__impl $($current_cond:ident $current:ident),*; $head_cond:ident $head:ident, $($id_cond:ident $id:ident),+) => (
    alt_trait_impl!($($current_cond $current),*);

    alt_trait!(__impl $($current_cond $current,)* $head_cond $head; $($id_cond $id),+);
  );
  (__impl $($current_cond:ident $current:ident),*; $head_cond:ident $head:ident) => (
    alt_trait_impl!($($current_cond $current),*);
    alt_trait_impl!($($current_cond $current,)* $head_cond $head);
  );
);

// Implements `Alt` for one tuple of `(condition, parser)` pairs.
//
// The condition of the first pair is tried here; the following ones are tried
// by `alt_trait_inner!`. When a condition succeeds, the matching infallible
// parser is run on the input left over by that condition.
macro_rules! alt_trait_impl(
  ($($id_cond:ident $id:ident),+) => (
    impl<
      Input: Clone, Output,
      $(
          // () are to make things easier on me, but I'm not entirely sure whether we can do better
          // with rule E0207
          $id_cond: nom::Parser<Input, (), ()>,
          $id: nom::Parser<Input, (Output, ErrorList), Infallible>
      ),+
    > Alt<Input, Output> for ( $(($id_cond, $id),)+ ) {

      fn choice(&mut self, input: Input) -> Option<JResult<Input, Output>> {
        match self.0.0.parse(input.clone()) {
          Err(_) => alt_trait_inner!(1, self, input, $($id_cond $id),+),
          Ok((input_left, _)) => Some(self.0.1.parse(input_left)),
        }
      }
    }
  );
);

// Recursive part of `Alt::choice`: tries the condition of the pair at index
// `$it`, and moves on to the next index if it fails.
//
// The list of pairs is only used as a countdown: one pair is dropped at each
// step, and the recursion ends with `None` when a single pair is left.
macro_rules! alt_trait_inner(
  ($it:tt, $self:expr_2021, $input:expr_2021, $head_cond:ident $head:ident, $($id_cond:ident $id:ident),+) => (
    match $self.$it.0.parse($input.clone()) {
      Err(_) => succ!($it, alt_trait_inner!($self, $input, $($id_cond $id),+)),
      Ok((input_left, _)) => Some($self.$it.1.parse(input_left)),
    }
  );
  ($it:tt, $self:expr_2021, $input:expr_2021, $head_cond:ident $head:ident) => (
    None
  );
);

// Implements `Alt` for tuples of 1 up to 21 `(condition, parser)` pairs.
alt_trait!(A1 A, B1 B, C1 C, D1 D, E1 E, F1 F, G1 G, H1 H, I1 I, J1 J, K1 K,
           L1 L, M1 M, N1 N, O1 O, P1 P, Q1 Q, R1 R, S1 S, T1 T, U1 U);

/// An `alt()`-like combinator for infallible parsers.
///
/// `l` is a list of branches, each made of a fallible condition parser paired with an infallible
/// parser. Branches are tried in order: the first condition which succeeds commits to its
/// branch, and the paired infallible parser is then executed on the input the condition left.
///
/// In case no condition matches, the `default` parser (itself infallible) is executed on the
/// original input.
pub(crate) fn alt_infallible<I: Clone, O, F, List: Alt<I, O>>(
    mut l: List,
    mut default: F,
) -> impl FnMut(I) -> JResult<I, O>
where
    F: nom::Parser<I, (O, ErrorList), Infallible>,
{
    move |i: I| match l.choice(i.clone()) {
        // a branch committed: its result is final
        Some(branch_result) => branch_result,
        // no branch wanted this input
        None => default.parse(i),
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// A `LenientError` serializes to a flat JSON object, `pos` first then `message`.
    #[test]
    fn test_lenient_error_serialization() {
        let lenient_error = LenientError {
            pos: 42,
            message: String::from("test error message"),
        };
        let serialized = serde_json::to_string(&lenient_error).unwrap();

        assert_eq!(serialized, r#"{"pos":42,"message":"test error message"}"#);
    }
}


================================================
FILE: query-grammar/src/lib.rs
================================================
#![allow(clippy::derive_partial_eq_without_eq)]

use serde::Serialize;

mod infallible;
mod occur;
mod query_grammar;
mod user_input_ast;

pub use crate::infallible::LenientError;
pub use crate::occur::Occur;
use crate::query_grammar::{parse_to_ast, parse_to_ast_lenient};
pub use crate::user_input_ast::{
    Delimiter, UserInputAst, UserInputBound, UserInputLeaf, UserInputLiteral,
};

/// Error returned by [`parse_query`] when the query is not syntactically valid.
///
/// It carries no detail about the failure. [`parse_query_lenient`] reports positioned
/// diagnostics instead.
#[derive(Debug, Serialize)]
#[serde(rename_all = "snake_case")]
pub struct Error;

impl std::fmt::Display for Error {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        f.write_str("invalid query syntax")
    }
}

// Implementing `std::error::Error` lets callers propagate this error with `?` into
// `Box<dyn std::error::Error>` and similar error containers.
impl std::error::Error for Error {}

/// Parse a query
pub fn parse_query(query: &str) -> Result<UserInputAst, Error> {
    let (_remaining, user_input_ast) = parse_to_ast(query).map_err(|_| Error)?;
    Ok(user_input_ast)
}

/// Parse a query, trying to recover from syntax errors, and giving hints toward fixing errors.
///
/// Unlike [`parse_query`], this never fails: it returns the AST which could be built from the
/// query, along with the list of errors encountered while parsing it. Each error carries a
/// position and a message.
pub fn parse_query_lenient(query: &str) -> (UserInputAst, Vec<LenientError>) {
    parse_to_ast_lenient(query)
}

#[cfg(test)]
mod tests {
    use crate::{UserInputAst, parse_query, parse_query_lenient};

    /// Parses `query` with the strict parser and serializes the resulting AST to JSON.
    fn strict_json(query: &str) -> String {
        let ast: UserInputAst = parse_query(query).unwrap();
        serde_json::to_string(&ast).unwrap()
    }

    #[test]
    fn test_deduplication() {
        // the repeated term appears only once in the serialized AST
        assert_eq!(
            strict_json("a a"),
            r#"{"type":"bool","clauses":[[null,{"type":"literal","field_name":null,"phrase":"a","delimiter":"none","slop":0,"prefix":false}]]}"#
        );
    }

    #[test]
    fn test_parse_query_serialization() {
        assert_eq!(
            strict_json("title:hello OR title:x"),
            r#"{"type":"bool","clauses":[["should",{"type":"literal","field_name":"title","phrase":"hello","delimiter":"none","slop":0,"prefix":false}],["should",{"type":"literal","field_name":"title","phrase":"x","delimiter":"none","slop":0,"prefix":false}]]}"#
        );
    }

    #[test]
    fn test_parse_query_wrong_query() {
        let outcome = parse_query("title:");
        assert!(outcome.is_err());
    }

    #[test]
    fn test_parse_query_lenient_wrong_query() {
        let (_ast, errors) = parse_query_lenient("title:");
        assert_eq!(errors.len(), 1);
        assert_eq!(
            serde_json::to_string(&errors).unwrap(),
            r#"[{"pos":6,"message":"expected word"}]"#
        );
    }
}


================================================
FILE: query-grammar/src/occur.rs
================================================
use std::fmt;
use std::fmt::Write;

use serde::Serialize;

/// Defines whether a term in a query must be present,
/// should be present or must not be present.
///
/// Variants are serialized in snake case (`should`, `must`, `must_not`).
#[derive(Debug, Clone, Hash, Copy, Eq, PartialEq, Serialize)]
#[serde(rename_all = "snake_case")]
pub enum Occur {
    /// For a given document to be considered for scoring,
    /// at least one of the queries with the Should or the Must
    /// Occur constraint must be within the document.
    Should,
    /// Documents that do not match the query are excluded from the search.
    Must,
    /// Documents that match the query are excluded from the
    /// search.
    MustNot,
}

impl Occur {
    /// Returns the one-char prefix symbol for this `Occur`.
    /// - `Should` => '?',
    /// - `Must` => '+'
    /// - `MustNot` => '-'
    fn to_char(self) -> char {
        match self {
            Occur::MustNot => '-',
            Occur::Must => '+',
            Occur::Should => '?',
        }
    }

    /// Compose two occur values.
    ///
    /// `Should` on the left is neutral and yields `right`. Otherwise a `MustNot` on the right
    /// flips the left value (`Must` becomes `MustNot` and `MustNot` becomes `Must`), while any
    /// other right value leaves `left` unchanged.
    pub fn compose(left: Occur, right: Occur) -> Occur {
        let right_negates = right == Occur::MustNot;
        match left {
            Occur::Should => right,
            Occur::Must if right_negates => Occur::MustNot,
            Occur::Must => Occur::Must,
            Occur::MustNot if right_negates => Occur::Must,
            Occur::MustNot => Occur::MustNot,
        }
    }
}

impl fmt::Display for Occur {
    /// Writes the one-char prefix symbol of this `Occur`.
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let symbol = self.to_char();
        Write::write_char(f, symbol)
    }
}

#[cfg(test)]
mod test {
    use crate::Occur;

    /// Checks the full composition table of `Occur::compose`.
    #[test]
    fn test_occur_compose() {
        use Occur::{Must, MustNot, Should};

        // (left, right, expected)
        let table = [
            (Should, Should, Should),
            (Should, Must, Must),
            (Should, MustNot, MustNot),
            (Must, Should, Must),
            (Must, Must, Must),
            (Must, MustNot, MustNot),
            (MustNot, Should, MustNot),
            (MustNot, Must, MustNot),
            (MustNot, MustNot, Must),
        ];
        for (left, right, expected) in table {
            assert_eq!(Occur::compose(left, right), expected);
        }
    }
}


================================================
FILE: query-grammar/src/query_grammar.rs
================================================
use std::borrow::Cow;
use std::iter::once;

use fnv::FnvHashSet;
use nom::IResult;
use nom::branch::alt;
use nom::bytes::complete::tag;
use nom::character::complete::{
    anychar, char, digit1, multispace0, multispace1, none_of, one_of, satisfy, u32,
};
use nom::combinator::{eof, map, map_res, opt, peek, recognize, value, verify};
use nom::error::{Error, ErrorKind};
use nom::multi::{many0, many1, separated_list0};
use nom::sequence::{delimited, preceded, separated_pair, terminated, tuple};

use super::user_input_ast::{UserInputAst, UserInputBound, UserInputLeaf, UserInputLiteral};
use crate::Occur;
use crate::infallible::*;
use crate::user_input_ast::Delimiter;

// Characters which cannot appear in a field name unless they are escaped with a backslash.
//
// Note: '-' char is only forbidden at the beginning of a field name, would be clearer to add it to
// special characters.
const SPECIAL_CHARS: &[char] = &[
    '+', '^', '`', ':', '{', '}', '"', '\'', '[', ']', '(', ')', '!', '\\', '*', ' ',
];

/// Consumes a field name followed by a colon, along with the whitespace around that colon.
///
/// Returns the field name with its escape sequences already interpreted. An unescaped `-` is
/// not accepted as first character.
fn field_name(inp: &str) -> IResult<&str, String> {
    // a backslash followed by a special character yields that special character
    let escaped = || preceded(char('\\'), one_of(SPECIAL_CHARS));
    let leading = alt((verify(none_of(SPECIAL_CHARS), |c| *c != '-'), escaped()));
    // past the first character, a backslash which escapes nothing is kept as is
    let trailing = many0(alt((none_of(SPECIAL_CHARS), escaped(), char('\\'))));
    let separator = tuple((multispace0, char(':'), multispace0));

    map(
        terminated(tuple((leading, trailing)), separator),
        |(first, others): (char, Vec<char>)| {
            let mut name = String::with_capacity(others.len() + 1);
            name.push(first);
            name.extend(others);
            name
        },
    )(inp)
}

/// Characters which must be escaped with a backslash to appear inside of a word.
const ESCAPE_IN_WORD: &[char] = &['^', '`', ':', '{', '}', '"', '\'', '[', ']', '(', ')', '\\'];

/// Interprets the backslash escape sequences of `source`.
///
/// A backslash followed by a character which requires escaping (whitespace, `-`, or any of
/// [`ESCAPE_IN_WORD`]) is replaced by that character. Any other backslash escapes nothing and
/// is kept verbatim, including a dangling backslash at the very end of `source`.
fn interpret_escape(source: &str) -> String {
    let mut res = String::with_capacity(source.len());
    let mut in_escape = false;
    let require_escape = |c: char| c.is_whitespace() || ESCAPE_IN_WORD.contains(&c) || c == '-';

    for c in source.chars() {
        if in_escape {
            if !require_escape(c) {
                // we re-add the escape sequence
                res.push('\\');
            }
            res.push(c);
            in_escape = false;
        } else if c == '\\' {
            in_escape = true;
        } else {
            res.push(c);
        }
    }
    if in_escape {
        // The source ended right after a backslash: there is nothing to escape, so the backslash
        // is preserved like any other non-escaping backslash rather than silently dropped.
        res.push('\\');
    }
    res
}

/// Consume a word outside of any context.
// TODO should support escape sequences
fn word(inp: &str) -> IResult<&str, Cow<'_, str>> {
    map_res(
        recognize(tuple((
            alt((
                preceded(char('\\'), anychar),
                satisfy(|c| !c.is_whitespace() && !ESCAPE_IN_WORD.contains(&c) && c != '-'),
            )),
            many0(alt((
                preceded(char('\\'), anychar),
                satisfy(|c: char| !c.is_whitespace() && !ESCAPE_IN_WORD.contains(&c)),
            ))),
        ))),
        |s| match s {
            "OR" | "AND" | "NOT" | "IN" => Err(Error::new(inp, ErrorKind::Tag)),
            s if s.contains('\\') => Ok(Cow::Owned(interpret_escape(s))),
            s => Ok(Cow::Borrowed(s)),
        },
    )(inp)
}

/// Builds an infallible parser consuming a word, after skipping leading whitespace.
///
/// The word extends until a whitespace or an unescaped character of `delimiter`. When no word
/// can be read, the parser yields `None` along with an "expected word" error.
///
/// When `emit_error` is set, an error is additionally reported if the word starts with `:` or
/// contains a `:` which is not preceded by a backslash, as it possibly is a malformed
/// `field:value`.
fn word_infallible(
    delimiter: &str,
    emit_error: bool,
) -> impl Fn(&str) -> JResult<&str, Option<Cow<str>>> + '_ {
    move |inp| {
        let raw_word = preceded(
            multispace0,
            recognize(many1(alt((
                preceded(char::<&str, _>('\\'), anychar),
                satisfy(|c| !(c.is_whitespace() || delimiter.contains(c))),
            )))),
        );

        map(
            opt_i_err(raw_word, "expected word"),
            |(opt_s, mut errors)| {
                let Some(s) = opt_s else {
                    return (None, errors);
                };

                let has_unescaped_colon = || {
                    s.as_bytes()
                        .windows(2)
                        .any(|pair| pair[0] != b'\\' && pair[1] == b':')
                        || s.starts_with(':')
                };
                if emit_error && has_unescaped_colon() {
                    errors.push(LenientErrorInternal {
                        pos: inp.len(),
                        message: "parsed possible invalid field as term".to_string(),
                    });
                }

                let word = if s.contains('\\') {
                    Cow::Owned(interpret_escape(s))
                } else {
                    Cow::Borrowed(s)
                };
                (Some(word), errors)
            },
        )(inp)
    }
}

/// Consume a word inside a Range context. More characters are allowed than in a regular word, as
/// they are not ambiguous in this context.
///
/// The word stops at the first whitespace, brace, bracket, parenthesis or double quote. A
/// backtick is only rejected as first character.
fn relaxed_word(inp: &str) -> IResult<&str, &str> {
    const REJECTED_FIRST: [char; 8] = ['`', '{', '}', '"', '[', ']', '(', ')'];
    const REJECTED_AFTER: [char; 7] = ['{', '}', '"', '[', ']', '(', ')'];

    let first = satisfy(|c| !(c.is_whitespace() || REJECTED_FIRST.contains(&c)));
    let following = many0(satisfy(|c: char| {
        !(c.is_whitespace() || REJECTED_AFTER.contains(&c))
    }));
    recognize(tuple((first, following)))(inp)
}

/// Recognizes a negative decimal number: a `-`, digits, and optionally a `.` followed by more
/// digits. The matched text, sign included, is returned as is.
fn negative_number(inp: &str) -> IResult<&str, &str> {
    let fractional_part = opt(tuple((char('.'), digit1)));
    let magnitude = tuple((digit1, fractional_part));
    recognize(preceded(char('-'), magnitude))(inp)
}

/// Parses a single term: a negative number, a single- or double-quoted string, or a bare word.
///
/// Returns the kind of delimiter which surrounded the term along with the term content. Inside
/// of quotes, a backslash followed by any character yields that character.
fn simple_term(inp: &str) -> IResult<&str, (Delimiter, String)> {
    let quoted = |quote: char| {
        // `none_of` can't take an owned char, hence the `verify`
        let regular_char = verify(anychar, move |parsed| *parsed != quote);
        let content = many0(alt((preceded(char('\\'), anychar), regular_char)));
        map(delimited(char(quote), content, char(quote)), |chars| {
            chars.into_iter().collect::<String>()
        })
    };

    let number = map(negative_number, |digits| {
        (Delimiter::None, digits.to_string())
    });
    let single_quoted = map(quoted('\''), |phrase| (Delimiter::SingleQuotes, phrase));
    let double_quoted = map(quoted('"'), |phrase| (Delimiter::DoubleQuotes, phrase));
    let bare_word = map(word, |text| (Delimiter::None, text.to_string()));

    alt((number, single_quoted, double_quoted, bare_word))(inp)
}

/// Builds the infallible counterpart of `simple_term`.
///
/// The returned parser reads a single- or double-quoted string, or otherwise a bare word which
/// stops at whitespace or at any unescaped character of `delimiter`. It yields `None` when no
/// term could be read.
fn simple_term_infallible(
    delimiter: &str,
) -> impl Fn(&str) -> JResult<&str, Option<(Delimiter, String)>> + '_ {
    |inp| {
        // Parses the content of a quoted string and its closing quote. The opening quote is not
        // parsed here: it is consumed by the branch condition given to `alt_infallible` below.
        let escaped_string = |delimiter| {
            // we need this because none_of can't accept an owned array of char.
            let not_delimiter = verify(anychar, move |parsed| *parsed != delimiter);
            map(
                delimited_infallible(
                    nothing,
                    opt_i(many0(alt((preceded(char('\\'), anychar), not_delimiter)))),
                    // a missing closing quote is reported as an error
                    opt_i_err(char(delimiter), format!("missing delimiter \\{delimiter}")),
                ),
                |(res, err)| {
                    // many0 can't fail
                    (res.unwrap().into_iter().collect::<String>(), err)
                },
            )
        };

        let double_quotes = map(escaped_string('"'), |(phrase, errors)| {
            (Some((Delimiter::DoubleQuotes, phrase)), errors)
        });
        let simple_quotes = map(escaped_string('\''), |(phrase, errors)| {
            (Some((Delimiter::SingleQuotes, phrase)), errors)
        });

        alt_infallible(
            (
                // an opening quote commits to the matching quoted string parser
                (value((), char('"')), double_quotes),
                (value((), char('\'')), simple_quotes),
            ),
            // numbers are parsed with words in this case, as we allow string starting with a -
            map(word_infallible(delimiter, true), |(text, errors)| {
                (text.map(|text| (Delimiter::None, text.to_string())), errors)
            }),
        )(inp)
    }
}

/// Parses a term or a phrase, optionally followed by a prefix marker (`*`) or a slop (`~N`),
/// into a literal leaf with no field name set.
fn term_or_phrase(inp: &str) -> IResult<&str, UserInputLeaf> {
    let term_with_suffix = tuple((simple_term, fallible(slop_or_prefix_val)));
    map(
        term_with_suffix,
        |((delimiter, phrase), (slop, prefix))| {
            let literal = UserInputLiteral {
                field_name: None,
                phrase,
                delimiter,
                slop,
                prefix,
            };
            literal.into()
        },
    )(inp)
}

/// Infallible counterpart of `term_or_phrase`.
///
/// Yields `None` when no term could be read, unless a non-zero slop was parsed: a literal with
/// an empty phrase is then produced so that the slop is not lost.
fn term_or_phrase_infallible(inp: &str) -> JResult<&str, Option<UserInputLeaf>> {
    map(
        // an unquoted word stops at `)` (end of a group or of an ast tree) and at `^` (boost)
        tuple_infallible((simple_term_infallible(")^"), slop_or_prefix_val)),
        |((delimiter_phrase, (slop, prefix)), errors)| {
            let literal = match delimiter_phrase {
                Some((delimiter, phrase)) => Some(UserInputLiteral {
                    field_name: None,
                    phrase,
                    delimiter,
                    slop,
                    prefix,
                }),
                None if slop != 0 => Some(UserInputLiteral {
                    field_name: None,
                    phrase: String::new(),
                    delimiter: Delimiter::None,
                    slop,
                    prefix,
                }),
                None => None,
            };
            (literal.map(|literal| literal.into()), errors)
        },
    )(inp)
}

/// Parses a term group, i.e. a field name followed by a parenthesized sub-query such as
/// `field:(a b)`. The field name is set as default field of the sub-query.
fn term_group(inp: &str) -> IResult<&str, UserInputAst> {
    let field = terminated(field_name, multispace0);
    let group = delimited(tuple((char('('), multispace0)), ast, char(')'));

    map(tuple((field, group)), |(default_field, mut grouped)| {
        grouped.set_default_field(default_field);
        grouped
    })(inp)
}

// Precondition of term_group_infallible, which can panic if called when this precondition does
// not hold. This parser only looks ahead: it does not consume its input.
fn term_group_precond(inp: &str) -> IResult<&str, (), ()> {
    // once a field name followed by `(` has been seen, it can't be anything but a term group
    let lookahead = peek(tuple((field_name, multispace0, char('('))));
    value((), lookahead)(inp).map_err(|e| e.map(|_| ()))
}

/// Infallible counterpart of `term_group`.
///
/// # Panics
///
/// Panics if the input does not start with a field name followed by `(`. Callers must check
/// `term_group_precond` first.
fn term_group_infallible(inp: &str) -> JResult<&str, UserInputAst> {
    let mut group_start = tuple((field_name, multispace0, char('('), multispace0));
    let (group_content, (default_field, ..)) = group_start(inp).expect("precondition failed");

    let sub_query = map(ast_infallible, |(mut group, errors)| {
        group.set_default_field(default_field.clone());
        (group, errors)
    });
    // a missing closing parenthesis is reported, but still yields the group
    let group_end = opt_i_err(char(')'), "expected ')'");

    delimited_infallible(nothing, sub_query, group_end)(group_content)
}

/// Parses the `*` of an exists query (`field:*`), the field name having been parsed by the
/// caller. The returned leaf has an empty field.
///
/// The `*` must be followed by a whitespace, a character of `ESCAPE_IN_WORD`, or the end of the
/// input. That following character is only peeked at, not consumed.
fn exists(inp: &str) -> IResult<&str, UserInputLeaf> {
    let word_boundary = alt((
        value(
            "",
            satisfy(|c: char| c.is_whitespace() || ESCAPE_IN_WORD.contains(&c)),
        ),
        eof,
    ));
    let leaf = UserInputLeaf::Exists {
        field: String::new(),
    };

    value(leaf, tuple((multispace0, char('*'), peek(word_boundary))))(inp)
}

/// Precondition of `exists_infallible`: succeeds, without consuming its input, when the input
/// starts with a field name followed by a standalone `*`.
fn exists_precond(inp: &str) -> IResult<&str, (), ()> {
    // what follows the `*` must be checked to tell an exists query from a wildcard query
    let word_boundary = alt((
        value(
            "",
            satisfy(|c: char| c.is_whitespace() || ESCAPE_IN_WORD.contains(&c)),
        ),
        eof,
    ));
    let lookahead = peek(tuple((
        field_name,
        multispace0,
        char('*'),
        peek(word_boundary),
    )));

    value((), lookahead)(inp).map_err(|e| e.map(|_| ()))
}

/// Parses an exists query (`field:*`). It never reports any error.
///
/// # Panics
///
/// Panics if the input does not start with a field name followed by `*`. Callers must check
/// `exists_precond` first.
fn exists_infallible(inp: &str) -> JResult<&str, UserInputAst> {
    let mut field_then_star = tuple((field_name, multispace0, char('*')));
    let (rest, (field, ..)) = field_then_star(inp).expect("precondition failed");

    Ok((rest, (UserInputLeaf::Exists { field }.into(), Vec::new())))
}

/// Parses a literal: either a leaf (range, set, exists, regex, term or phrase) with an optional
/// field name in front of it, or a term group.
fn literal(inp: &str) -> IResult<&str, UserInputAst> {
    // `*` alone is already parsed by our caller, so when `exists` succeeds, we can be confident
    // that a field name got parsed before it
    let leaf_with_field = map(
        tuple((
            opt(field_name),
            alt((range, set, exists, regex, term_or_phrase)),
        )),
        |(field, leaf): (Option<String>, UserInputLeaf)| leaf.set_field(field).into(),
    );

    alt((leaf_with_field, term_group))(inp)
}

/// Infallible parser for any literal which is not a term group: an optional field name followed
/// by a set, a range, a regex, or a term/phrase.
///
/// Yields `None` when no leaf could be read. An unquoted `NOT` parsed as a term without field
/// name is accepted, but reported as an error.
fn literal_no_group_infallible(inp: &str) -> JResult<&str, Option<UserInputAst>> {
    map(
        tuple_infallible((
            opt_i(field_name),
            space0_infallible,
            alt_infallible(
                (
                    (
                        // `IN [` is consumed by the condition: set_infallible starts after it
                        value((), tuple((tag("IN"), multispace0, char('[')))),
                        map(set_infallible, |(set, errs)| (Some(set), errs)),
                    ),
                    (
                        // only peeked at: range_infallible needs the opening character
                        value((), peek(one_of("{[><"))),
                        map(range_infallible, |(range, errs)| (Some(range), errs)),
                    ),
                    (
                        // only peeked at: regex_infallible parses the opening `/` itself
                        value((), peek(one_of("/"))),
                        map(regex_infallible, |(regex, errs)| (Some(regex), errs)),
                    ),
                ),
                // anything else is parsed as a term or a phrase
                delimited_infallible(space0_infallible, term_or_phrase_infallible, nothing),
            ),
        )),
        |((field_name, _, leaf), mut errors)| {
            (
                leaf.map(|leaf| {
                    // a bare, unquoted `NOT` ended up being parsed as a term
                    if matches!(&leaf, UserInputLeaf::Literal(literal)
                            if literal.phrase == "NOT" && literal.delimiter == Delimiter::None)
                        && field_name.is_none()
                    {
                        errors.push(LenientErrorInternal {
                            pos: inp.len(),
                            message: "parsed keyword NOT as term. It should be quoted".to_string(),
                        });
                    }
                    leaf.set_field(field_name).into()
                }),
                errors,
            )
        },
    )(inp)
}

/// Infallible counterpart of `literal`.
///
/// Term groups and exists queries are tried first, each guarded by its precondition. Anything
/// else is handed to `literal_no_group_infallible`.
fn literal_infallible(inp: &str) -> JResult<&str, Option<UserInputAst>> {
    let group_branch = (
        term_group_precond,
        map(term_group_infallible, |(group, errs)| (Some(group), errs)),
    );
    let exists_branch = (
        exists_precond,
        map(exists_infallible, |(exists, errs)| (Some(exists), errs)),
    );

    alt_infallible((group_branch, exists_branch), literal_no_group_infallible)(inp)
}

/// Parses an optional suffix of a term: `*` (prefix marker) or `~N` (slop).
///
/// Returns `(slop, is_prefix)`: `(0, true)` for `*`, `(N, false)` for `~N`, and `(0, false)`
/// when there is no suffix.
fn slop_or_prefix_val(inp: &str) -> JResult<&str, (u32, bool)> {
    let prefix_marker = value((0, true), char('*'));
    let slop_marker = map(preceded(char('~'), u32), |slop| (slop, false));

    map(
        opt_i(alt((prefix_marker, slop_marker))),
        |(suffix, err)| (suffix.unwrap_or((0, false)), err),
    )(inp)
}

/// Function that parses a range out of a Stream
/// Supports ranges like:
/// [5 TO 10], {5 TO 10}, [* TO 10], [10 TO *], {10 TO *], >5, <=10
/// [a TO *], [a TO c], [abc TO bcd}
///
/// Square brackets denote inclusive bounds, curly braces exclusive ones, and `*` an unbounded
/// side. The returned range has no field set.
fn range(inp: &str) -> IResult<&str, UserInputLeaf> {
    // value of a bound: a negative number, a relaxed word, or `*`
    let range_term_val = || {
        map(
            alt((negative_number, relaxed_word, tag("*"))),
            ToString::to_string,
        )
    };

    // check for unbounded range in the form of <5, <=10, >5, >=5
    // (two-character operators are listed first so that `>=` is not read as `>`)
    let elastic_unbounded_range = map(
        tuple((
            preceded(multispace0, alt((tag(">="), tag("<="), tag("<"), tag(">")))),
            preceded(multispace0, range_term_val()),
        )),
        |(comparison_sign, bound)| match comparison_sign {
            ">=" => (UserInputBound::Inclusive(bound), UserInputBound::Unbounded),
            "<=" => (UserInputBound::Unbounded, UserInputBound::Inclusive(bound)),
            "<" => (UserInputBound::Unbounded, UserInputBound::Exclusive(bound)),
            ">" => (UserInputBound::Exclusive(bound), UserInputBound::Unbounded),
            // unreachable case
            _ => (UserInputBound::Unbounded, UserInputBound::Unbounded),
        },
    );

    // opening delimiter followed by the lower bound value
    let lower_bound = map(
        separated_pair(one_of("{["), multispace0, range_term_val()),
        |(boundary_char, lower_bound)| {
            if lower_bound == "*" {
                UserInputBound::Unbounded
            } else if boundary_char == '{' {
                UserInputBound::Exclusive(lower_bound)
            } else {
                UserInputBound::Inclusive(lower_bound)
            }
        },
    );

    // upper bound value followed by the closing delimiter
    let upper_bound = map(
        separated_pair(range_term_val(), multispace0, one_of("}]")),
        |(upper_bound, boundary_char)| {
            if upper_bound == "*" {
                UserInputBound::Unbounded
            } else if boundary_char == '}' {
                UserInputBound::Exclusive(upper_bound)
            } else {
                UserInputBound::Inclusive(upper_bound)
            }
        },
    );

    // the `TO` keyword must have whitespace on both sides
    let lower_to_upper = separated_pair(
        lower_bound,
        tuple((multispace1, tag("TO"), multispace1)),
        upper_bound,
    );

    map(
        alt((elastic_unbounded_range, lower_to_upper)),
        |(lower, upper)| UserInputLeaf::Range {
            field: None,
            lower,
            upper,
        },
    )(inp)
}

/// Infallible counterpart of `range`.
///
/// It handles the comparison forms (`>=`, `<=`, `>`, `<`) as well as the delimited form
/// (`[lower TO upper]`, with `{`/`}` for exclusive bounds). A missing bound value is treated as
/// unbounded. A missing `TO` keyword or a missing closing delimiter is reported as an error.
///
/// The input is expected to start with one of `{`, `[`, `>` or `<`: the delimited form panics
/// on a lower bound which was not opened by `[` or `{`.
fn range_infallible(inp: &str) -> JResult<&str, UserInputLeaf> {
    let lower_to_upper = map(
        tuple_infallible((
            // opening delimiter
            opt_i(anychar),
            space0_infallible,
            // lower bound value
            word_infallible("]}", false),
            space1_infallible,
            // `TO` must be followed by whitespace or by the end of the input
            opt_i_err(
                terminated(tag("TO"), alt((value((), multispace1), value((), eof)))),
                "missing keyword TO",
            ),
            // upper bound value
            word_infallible("]}", false),
            // closing delimiter
            opt_i_err(one_of("]}"), "missing range delimiter"),
        )),
        |(
            (lower_bound_kind, _multispace0, lower, _multispace1, to, upper, upper_bound_kind),
            errs,
        )| {
            let lower_bound = match (lower_bound_kind, lower.as_deref()) {
                (_, Some("*")) => UserInputBound::Unbounded,
                (_, None) => UserInputBound::Unbounded,
                // The lower word is literally `TO` and no `TO` keyword followed it: the lower
                // bound was omitted (e.g. `[TO 10]`) and the keyword got read as the bound.
                // When the keyword was found too, `TO` really is the bound
                // (i.e. [TO TO something]), which is handled by the arms below.
                (_, Some("TO")) if to.is_none() => UserInputBound::Unbounded,
                (Some('['), Some(bound)) => UserInputBound::Inclusive(bound.to_string()),
                (Some('{'), Some(bound)) => UserInputBound::Exclusive(bound.to_string()),
                _ => unreachable!("precondition failed, range did not start with [ or {{"),
            };
            let upper_bound = match (upper_bound_kind, upper.as_deref()) {
                (_, Some("*")) => UserInputBound::Unbounded,
                (_, None) => UserInputBound::Unbounded,
                (Some(']'), Some(bound)) => UserInputBound::Inclusive(bound.to_string()),
                (Some('}'), Some(bound)) => UserInputBound::Exclusive(bound.to_string()),
                // the end is missing, assume this is an inclusive bound
                (_, Some(bound)) => UserInputBound::Inclusive(bound.to_string()),
            };
            ((lower_bound, upper_bound), errs)
        },
    );

    map(
        alt_infallible(
            // Comparison forms. Two-character operators are tried first so that `>=` is not
            // read as `>`. The bound value is a word which stops at whitespace or `)`; when it
            // is missing, the range is unbounded on both sides.
            (
                (
                    // `>= bound`: inclusive lower bound
                    value((), tag(">=")),
                    map(word_infallible(")", false), |(bound, err)| {
                        (
                            (
                                bound
                                    .map(|bound| UserInputBound::Inclusive(bound.to_string()))
                                    .unwrap_or(UserInputBound::Unbounded),
                                UserInputBound::Unbounded,
                            ),
                            err,
                        )
                    }),
                ),
                (
                    // `<= bound`: inclusive upper bound
                    value((), tag("<=")),
                    map(word_infallible(")", false), |(bound, err)| {
                        (
                            (
                                UserInputBound::Unbounded,
                                bound
                                    .map(|bound| UserInputBound::Inclusive(bound.to_string()))
                                    .unwrap_or(UserInputBound::Unbounded),
                            ),
                            err,
                        )
                    }),
                ),
                (
                    // `> bound`: exclusive lower bound
                    value((), tag(">")),
                    map(word_infallible(")", false), |(bound, err)| {
                        (
                            (
                                bound
                                    .map(|bound| UserInputBound::Exclusive(bound.to_string()))
                                    .unwrap_or(UserInputBound::Unbounded),
                                UserInputBound::Unbounded,
                            ),
                            err,
                        )
                    }),
                ),
                (
                    // `< bound`: exclusive upper bound
                    value((), tag("<")),
                    map(word_infallible(")", false), |(bound, err)| {
                        (
                            (
                                UserInputBound::Unbounded,
                                bound
                                    .map(|bound| UserInputBound::Exclusive(bound.to_string()))
                                    .unwrap_or(UserInputBound::Unbounded),
                            ),
                            err,
                        )
                    }),
                ),
            ),
            // no comparison operator: delimited form
            lower_to_upper,
        ),
        |((lower, upper), errors)| {
            (
                UserInputLeaf::Range {
                    field: None,
                    lower,
                    upper,
                },
                errors,
            )
        },
    )(inp)
}

/// Parses a set, i.e. the `IN` keyword followed by a whitespace-separated list of terms in
/// between square brackets, such as `IN [a "b c" d]`. The returned set has no field set.
fn set(inp: &str) -> IResult<&str, UserInputLeaf> {
    let in_keyword = tuple((multispace0, tag("IN"), multispace1));
    // the delimiter around an element is not kept
    let element = map(simple_term, |(_, term)| term);
    let bracketed_elements = delimited(
        tuple((char('['), multispace0)),
        separated_list0(multispace1, element),
        char(']'),
    );

    map(preceded(in_keyword, bracketed_elements), |elements| {
        UserInputLeaf::Set {
            field: None,
            elements,
        }
    })(inp)
}

/// Infallible counterpart of `set`.
///
/// `IN [` has already been parsed when we enter: only the terms remain to be parsed, until a
/// `]` is found. Reaching the end of the input before any `]` is reported as an error.
fn set_infallible(mut inp: &str) -> JResult<&str, UserInputLeaf> {
    let mut elements = Vec::new();
    let mut errs = Vec::new();
    // no separator is required in front of the first element
    let mut expect_separator = false;

    let remaining = loop {
        let mut separator_errors = if expect_separator {
            let (after_space, (_, space_errs)) = space1_infallible(inp)?;
            inp = after_space;
            space_errs
        } else {
            Vec::new()
        };
        expect_separator = true;

        if inp.is_empty() {
            errs.push(LenientErrorInternal {
                pos: inp.len(),
                message: "missing ]".to_string(),
            });
            break inp;
        }
        if let Some(after_bracket) = inp.strip_prefix(']') {
            break after_bracket;
        }
        // a missing separator only matters when another element follows
        errs.append(&mut separator_errors);

        // This assumes simple_term_infallible always makes progress on an input which is not
        // empty and does not start with `]`. If it did not, we would end up looping forever.
        let (rest, (delim_term, mut term_errs)) = simple_term_infallible("]")(inp)?;
        errs.append(&mut term_errs);
        elements.extend(delim_term.map(|(_, term)| term));
        inp = rest;
    };

    let set = UserInputLeaf::Set {
        field: None,
        elements,
    };
    Ok((remaining, (set, errs)))
}

/// Parses a regex, i.e. a non-empty pattern in between slashes such as `/ab+c/`. Inside of the
/// pattern, `\/` stands for a literal `/`.
///
/// The closing slash must be followed by a whitespace, a `)` or the end of the input, none of
/// which is consumed. The returned regex has no field set.
fn regex(inp: &str) -> IResult<&str, UserInputLeaf> {
    let pattern_char = alt((preceded(char('\\'), char('/')), none_of("/")));
    let slashed_pattern = delimited(char('/'), many1(pattern_char), char('/'));
    let boundary = peek(alt((
        value((), multispace1),
        value((), char(')')),
        value((), eof),
    )));

    map(terminated(slashed_pattern, boundary), |chars| {
        UserInputLeaf::Regex {
            field: None,
            pattern: chars.into_iter().collect::<String>(),
        }
    })(inp)
}

/// Infallible counterpart of `regex`.
///
/// A missing slash, or an unexpected character after the closing slash, is reported as an error.
/// When no pattern could be read, the returned regex has an empty pattern.
fn regex_infallible(inp: &str) -> JResult<&str, UserInputLeaf> {
    let parsed = terminated_infallible(
        delimited_infallible(
            opt_i_err(char('/'), "missing delimiter /"),
            opt_i(many1(alt((preceded(char('\\'), char('/')), none_of("/"))))),
            opt_i_err(char('/'), "missing delimiter /"),
        ),
        opt_i_err(
            peek(alt((
                value((), multispace1),
                value((), char(')')),
                value((), eof),
            ))),
            "expected whitespace, closing parenthesis, or end of input",
        ),
    )(inp);

    let (rest, pattern, errors) = match parsed {
        Ok((rest, (pattern_chars, errors))) => {
            let pattern: String = pattern_chars
                .map(|chars| chars.into_iter().collect())
                .unwrap_or_default();
            (rest, pattern, errors)
        }
        Err(e) => {
            // nothing is consumed, the failure is turned into a lenient error
            let errors = vec![LenientErrorInternal {
                pos: inp.len(),
                message: e.to_string(),
            }];
            (inp, String::new(), errors)
        }
    };

    let regex = UserInputLeaf::Regex {
        field: None,
        pattern,
    };
    Ok((rest, (regex, errors)))
}

/// Negates `expr` by applying `Occur::MustNot` to it through `unary`.
fn negate(expr: UserInputAst) -> UserInputAst {
    expr.unary(Occur::MustNot)
}

/// Strictly parses a single leaf of the query grammar.
///
/// Alternatives are tried in this order:
/// 1. a parenthesized sub-query `( ... )`;
/// 2. a lone `*` followed by whitespace, `)` or end of input, meaning "match all";
/// 3. `NOT` followed by whitespace and another leaf, which gets negated;
/// 4. a plain literal.
fn leaf(inp: &str) -> IResult<&str, UserInputAst> {
    let parenthesized = delimited(char('('), ast, char(')'));

    // The boundary is only peeked at so that it stays available to the caller.
    let boundary = peek(alt((
        value((), multispace1),
        value((), char(')')),
        value((), eof),
    )));
    let match_all = map(terminated(char('*'), boundary), |_| {
        UserInputAst::from(UserInputLeaf::All)
    });

    let negated = map(preceded(tuple((tag("NOT"), multispace1)), leaf), negate);

    alt((parenthesized, match_all, negated, literal))(inp)
}

/// Lenient counterpart of [`leaf`], yielding an optional AST plus the errors met on the way.
///
/// Each branch handed to `alt_infallible` is a `(condition, parser)` pair, with
/// `literal_infallible` as the fallback.
/// NOTE(review): `alt_infallible` is defined elsewhere; presumably the first matching
/// condition selects its branch and the parser runs on what the condition left over.
fn leaf_infallible(inp: &str) -> JResult<&str, Option<UserInputAst>> {
    alt_infallible(
        (
            // `(` opens a nested expression; a missing `)` is reported but tolerated.
            (
                value((), char('(')),
                map(
                    delimited_infallible(
                        nothing,
                        ast_infallible,
                        opt_i_err(char(')'), "expected ')'"),
                    ),
                    |(ast, errs)| (Some(ast), errs),
                ),
            ),
            // A lone `*` (followed by whitespace, `)` or end of input) matches everything.
            (
                value(
                    (),
                    terminated(
                        char('*'),
                        peek(alt((
                            value((), multispace1),
                            value((), char(')')),
                            value((), eof),
                        ))),
                    ),
                ),
                map(nothing, |_| {
                    (Some(UserInputAst::from(UserInputLeaf::All)), Vec::new())
                }),
            ),
            // `NOT ` (with a literal space) negates the leaf that follows.
            (
                value((), tag("NOT ")),
                delimited_infallible(
                    space0_infallible,
                    map(leaf_infallible, |(res, err)| (res.map(negate), err)),
                    nothing,
                ),
            ),
        ),
        literal_infallible,
    )(inp)
}

fn positive_float_number(inp: &str) -> IResult<&str, f64> {
    map(
        recognize(tuple((digit1, opt(tuple((char('.'), digit1)))))),
        // TODO this is actually dangerous if the number is actually not representable as a f64
        // (too big for instance)
        |float_str: &str| float_str.parse::<f64>().unwrap(),
    )(inp)
}

/// Parses an optional boost suffix made of `^` followed by a positive decimal number.
fn boost(inp: &str) -> JResult<&str, Option<f64>> {
    let caret_then_factor = preceded(char('^'), positive_float_number);
    opt_i(caret_then_factor)(inp)
}

/// Strictly parses a leaf with an optional `^boost` suffix.
///
/// The leaf is wrapped in `UserInputAst::Boost` only when a boost is present and differs
/// from `1.0` by more than `f64::EPSILON`; otherwise the bare leaf is returned.
fn boosted_leaf(inp: &str) -> IResult<&str, UserInputAst> {
    tuple((leaf, fallible(boost)))(inp).map(|(rest, (inner, factor_opt))| {
        let node = match factor_opt {
            Some(factor) if (factor - 1.0).abs() > f64::EPSILON => {
                UserInputAst::Boost(Box::new(inner), factor.into())
            }
            _ => inner,
        };
        (rest, node)
    })
}

/// Lenient counterpart of [`boosted_leaf`].
///
/// When a boost is present and differs from `1.0` by more than `f64::EPSILON`, the leaf (if
/// any) is wrapped in `UserInputAst::Boost`; the collected errors are passed through as-is.
fn boosted_leaf_infallible(inp: &str) -> JResult<&str, Option<UserInputAst>> {
    map(
        tuple_infallible((leaf_infallible, boost)),
        |((leaf, boost_opt), error)| {
            let boosted = match boost_opt {
                Some(factor) if (factor - 1.0).abs() > f64::EPSILON => {
                    leaf.map(|inner| UserInputAst::Boost(Box::new(inner), factor.into()))
                }
                _ => leaf,
            };
            (boosted, error)
        },
    )(inp)
}

/// Parses an optional occur prefix: `-` maps to `Occur::MustNot`, `+` to `Occur::Must`.
fn occur_symbol(inp: &str) -> JResult<&str, Option<Occur>> {
    let must_not = value(Occur::MustNot, char('-'));
    let must = value(Occur::Must, char('+'));
    opt_i(alt((must_not, must)))(inp)
}

/// Strictly parses an optional occur prefix followed by a (possibly boosted) leaf.
fn occur_leaf(inp: &str) -> IResult<&str, (Option<Occur>, UserInputAst)> {
    let optional_occur = fallible(occur_symbol);
    tuple((optional_occur, boosted_leaf))(inp)
}

/// Leniently parses one operand: an optional `AND `/`OR ` keyword, an optional occur prefix
/// and a (possibly boosted) leaf, in that order.
#[expect(clippy::type_complexity)]
fn operand_occur_leaf_infallible(
    inp: &str,
) -> JResult<&str, (Option<BinaryOperand>, Option<Occur>, Option<UserInputAst>)> {
    // TODO maybe this should support multiple chained AND/OR, and "fuse" them?
    let leading_operand = delimited_infallible(nothing, opt_i(binary_operand), space0_infallible);
    tuple_infallible((leading_operand, occur_symbol, boosted_leaf_infallible))(inp)
}

/// Boolean keyword that can introduce an operand in a query expression.
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
enum BinaryOperand {
    /// The `OR` keyword.
    Or,
    /// The `AND` keyword.
    And,
}

/// Parses the keyword `AND ` or `OR `; the single trailing space is part of the keyword.
fn binary_operand(inp: &str) -> IResult<&str, BinaryOperand> {
    let and_keyword = value(BinaryOperand::And, tag("AND "));
    let or_keyword = value(BinaryOperand::Or, tag("OR "));
    alt((and_keyword, or_keyword))(inp)
}

/// Strict wrapper around [`aggregate_infallible_expressions`].
///
/// `left` is the first operand (which has no leading operator) and `others` are the operands
/// that follow it. Returns the aggregated AST, or the first reported error if there is one.
fn aggregate_binary_expressions(
    left: (Option<Occur>, UserInputAst),
    others: Vec<(Option<BinaryOperand>, Option<Occur>, UserInputAst)>,
) -> Result<UserInputAst, LenientErrorInternal> {
    let (left_occur, left_ast) = left;
    let following = others
        .into_iter()
        .map(|(operand, occur, ast)| (operand, occur, Some(ast)));
    let leafs: Vec<_> = std::iter::once((None, left_occur, Some(left_ast)))
        .chain(following)
        .collect();

    // The first leaf never carries a BinaryOperand, so the parameters we pass should
    // statically guarantee that no error is reported.
    let (res, errors) = aggregate_infallible_expressions(leafs);
    match errors.into_iter().next() {
        Some(first_error) => Err(first_error),
        None => Ok(res),
    }
}

fn aggregate_infallible_expressions(
    input_leafs: Vec<(Option<BinaryOperand>, Option<Occur>, Option<UserInputAst>)>,
) -> (UserInputAst, ErrorList) {
    let mut err = Vec::new();
    let mut leafs: Vec<(_, _, UserInputAst)> = input_leafs
        .into_iter()
        .filter_map(|(operand, occur, ast)| ast.map(|ast| (operand, occur, ast)))
        .collect();
    if leafs.is_empty() {
        return (UserInputAst::empty_query(), err);
    }

    let early_operand = leafs
        .iter()
        .take(1)
        .all(|(operand, _, _)| operand.is_some());

    if early_operand {
        err.push(LenientErrorInternal {
            pos: 0,
            message: "Found unexpected boolean operator before term".to_string(),
        });
    }

    let mut clauses: Vec<Vec<(Option<Occur>, UserInputAst)>> = vec![];
    for ((prev_operator, occur, ast), (next_operator, _, _)) in
        leafs.iter().zip(leafs.iter().skip(1))
    {
        match prev_operator {
            Some(BinaryOperand::And) => {
                if let Some(last) = clauses.last_mut() {
                    last.push((occur.or(Some(Occur::Must)), ast.clone()));
                } else {
                    let last = vec![(occur.or(Some(Occur::Must)), ast.clone())];
                    clauses.push(last);
                }
            }
            Some(BinaryOperand::Or) => {
                let default_op = match next_operator {
                    Some(BinaryOperand::And) => Some(Occur::Must),
                    _ => Some(Occur::Should),
                };
                if occur == &Some(Occur::MustNot) && default_op == Some(Occur::Should) {
                    // if occur is MustNot *and* operation is OR, we synthesize a ShouldNot
                    clauses.push(vec![(
                        Some(Occur::Should),
                        ast.clone().unary(Occur::MustNot),
                    )])
                } else {
                    clauses.push(vec![(occur.or(default_op), ast.clone())]);
                }
            }
            None => {
                let default_op = match next_operator {
                    Some(BinaryOperand::And) => Some(Occur::Must),
                    Some(BinaryOperand::Or) => Some(Occur::Should),
                    None => None,
                };
                if occur == &Some(Occur::MustNot) && default_op == Some(Occur::Should) {
                    // if occur is MustNot *and* operation is OR, we synthesize a ShouldNot
                    clauses.push(vec![(
                        Some(Occur::Should),
                        ast.clone().unary(Occur::MustNot),
                    )])
                } else {
                    clauses.push(vec![(occur.or(default_op), ast.clone())])
                }
            }
        }
    }

    // leaf isn't empty, so we can unwrap
    let (last_operator, last_occur, last_ast) = leafs.pop().unwrap();
    match last_operator {
        Some(BinaryOperand::And) => {
            if let Some(last) = clauses.last_mut() {
                last.push((last_occur.or(Some(Occur::Must)), last_ast));
            } else {
                let last = vec![(last_occur.or(Some(Occur::Must)), last_ast)];
                clauses.push(last);
            }
        }
        Some(BinaryOperand::Or) => {
            if last_occur == Some(Occur::MustNot) {
                // if occur is MustNot *and* operation is OR, we synthesize a ShouldNot
                clauses.push(vec![(Some(Occur::Should), last_ast.unary(Occur::MustNot))]);
            } else {
                clauses.push(vec![(last_occur.or(Some(Occur::Should)), last_ast)]);
            }
        }
        None => clauses.push(vec![(last_occur, last_ast)]),
    }

    if clauses.len() == 1 {
        let mut clause = clauses.pop().unwrap();
        if clause.len() == 1 && clause[0].0 != Some(Occur::MustNot) {
            (clause.pop().unwrap().1, err)
        } else {
            (UserInputAst::Clause(clause), err)
        }
    } else {
        let mut final_clauses: Vec<(Option<Occur>, UserInputAst)> = Vec::new();
        for mut sub_clauses in clauses {
            if sub_clauses.len() == 1 {
                final_clauses.push(sub_clauses.pop().unwrap());
            } else {
                final_clauses.push((Some(Occur::Should), UserInputAst::Clause(sub_clauses)));
            }
        }

        (UserInputAst::Clause(final_clauses), err)
    }
}

/// Strictly parses an optional `AND `/`OR ` keyword followed by an occur-prefixed leaf,
/// skipping any whitespace after each of the two parts.
fn operand_leaf(inp: &str) -> IResult<&str, (Option<BinaryOperand>, Option<Occur>, UserInputAst)> {
    let leading_operand = terminated(opt(binary_operand), multispace0);
    let leaf_with_occur = terminated(occur_leaf, multispace0);
    let mut parser = tuple((leading_operand, leaf_with_occur));

    parser(inp).map(|(rest, (operand, (occur, ast)))| (rest, (operand, occur, ast)))
}

/// Strictly parses a query expression, ignoring surrounding whitespace.
///
/// A multi-operand expression (a first leaf, whitespace, then one or more operands) is tried
/// first and aggregated with [`aggregate_binary_expressions`]. Failing that, a single leaf is
/// parsed; it is negated when prefixed with `-`, while any other prefix is dropped.
fn ast(inp: &str) -> IResult<&str, UserInputAst> {
    let boolean_expr = map_res(
        separated_pair(occur_leaf, multispace1, many1(operand_leaf)),
        |(first, following)| aggregate_binary_expressions(first, following),
    );
    let single_leaf = map(occur_leaf, |(occur, ast)| match occur {
        Some(Occur::MustNot) => ast.unary(Occur::MustNot),
        _ => ast,
    });
    let expression = alt((boolean_expr, single_leaf));
    delimited(multispace0, expression, multispace0)(inp)
}

/// Lenient counterpart of [`ast`].
fn ast_infallible(inp: &str) -> JResult<&str, UserInputAst> {
    // The strict `ast()` accepts either the keyword syntax (`term AND term OR term`) or the
    // prefix syntax (`+term term -term`). Both are locally ambiguous, and because errors are
    // tolerated here, backtracking between them is hard to allow.
    // Instead, a mix of both syntaxes is accepted and `aggregate_infallible_expressions` makes
    // sense of what the user meant. A leading operator such as `AND term` is accepted by the
    // grammar as well, which keeps things simple even though it is not very sensical.

    let expression = map(
        separated_list_infallible(space1_infallible, operand_occur_leaf_infallible),
        |(leafs, mut errors)| {
            let (res, aggregation_errors) = aggregate_infallible_expressions(leafs);
            errors.extend(aggregation_errors);
            (res, errors)
        },
    );

    delimited_infallible(space0_infallible, expression, space0_infallible)(inp)
}

/// Strictly parses a whole query string into a rewritten `UserInputAst`.
///
/// The complete input must be consumed. A query holding no expression (only whitespace, or
/// nothing at all) produces `UserInputAst::empty_query()`.
pub fn parse_to_ast(inp: &str) -> IResult<&str, UserInputAst> {
    delimited(multispace0, opt(ast), eof)(inp).map(|(rest, maybe_ast)| {
        let parsed = maybe_ast.unwrap_or_else(UserInputAst::empty_query);
        (rest, rewrite_ast(parsed))
    })
}

/// Leniently parses a query string, returning a rewritten AST along with every error met.
///
/// A blank query short-circuits to an empty clause without errors. Input left over after
/// parsing is reported as an "unparsed end of query" error.
pub fn parse_to_ast_lenient(query_str: &str) -> (UserInputAst, Vec<LenientError>) {
    if query_str.trim().is_empty() {
        return (UserInputAst::Clause(Vec::new()), Vec::new());
    }

    let (unparsed, (parsed, mut internal_errors)) = ast_infallible(query_str).unwrap();
    let has_leftover = !unparsed.trim().is_empty();
    if has_leftover {
        internal_errors.push(LenientErrorInternal {
            pos: unparsed.len(),
            message: "unparsed end of query".to_string(),
        });
    }

    // Internal positions are end-based; convert them to start-based indexes.
    let query_len = query_str.len();
    let mut errors = Vec::with_capacity(internal_errors.len());
    for internal_error in internal_errors {
        errors.push(LenientError::from_internal(internal_error, query_len));
    }

    (rewrite_ast(parsed), errors)
}

/// Simplifies an AST after parsing. Only `Clause` nodes are touched:
/// - every child is rewritten recursively;
/// - duplicate children are removed, keeping the first occurrence,
///   e.g. (+a +b) OR (+c +d) OR (+a +b)  => (+a +b) OR (+c +d);
/// - unnecessary nesting is removed through [`rewrite_ast_clause`], motivated by
///   [issue #1433](https://github.com/quickwit-oss/tantivy/issues/1433).
fn rewrite_ast(mut input: UserInputAst) -> UserInputAst {
    if let UserInputAst::Clause(children) = &mut input {
        let mut already_seen = FnvHashSet::default();
        let mut kept = Vec::with_capacity(children.len());
        for (occur, child) in children.drain(..) {
            let entry = (occur, rewrite_ast(child));
            if already_seen.insert(entry.clone()) {
                kept.push(entry);
            }
        }
        for entry in &mut kept {
            rewrite_ast_clause(entry);
        }
        *children = kept;
    }
    input
}

/// Replaces an occur-less entry that wraps a single-child clause with that child.
fn rewrite_ast_clause(input: &mut (Option<Occur>, UserInputAst)) {
    let only_child = match input {
        (None, UserInputAst::Clause(clauses)) if clauses.len() == 1 => clauses.pop(),
        _ => None,
    };
    if let Some(child) = only_child {
        *input = child;
    }
}

#[cfg(test)]
mod test {
    use super::*;

    /// Returns `true` when `a` and `b` are equal, or differ by less than 0.05% of `|a + b|`.
    pub fn nearly_equals(a: f64, b: f64) -> bool {
        // The relative bound collapses to zero when both values are zero, so exact equality
        // has to be accepted explicitly.
        a == b || (a - b).abs() < 0.0005 * (a + b).abs()
    }

    /// Panics with a descriptive message unless `val` is nearly equal to `expected`.
    fn assert_nearly_equals(expected: f64, val: f64) {
        if !nearly_equals(val, expected) {
            panic!("Got {val}, expected {expected}.");
        }
    }

    // TODO test as part of occur_leaf
    // #[test]
    // fn test_occur_symbol() -> TestParseResult {
    // assert_eq!(super::occur_symbol("-")?, ("", Occur::MustNot));
    // assert_eq!(super::occur_symbol("+")?, ("", Occur::Must));
    // Ok(())
    // }

    // Checks which inputs `positive_float_number` accepts and what it leaves unconsumed.
    #[test]
    fn test_positive_float_number() {
        fn valid_parse(float_str: &str, expected_val: f64, expected_remaining: &str) {
            let (remaining, val) = positive_float_number(float_str).unwrap();
            assert_eq!(remaining, expected_remaining);
            // `assert_nearly_equals` takes the expected value first; passing it in that order
            // keeps the failure message truthful.
            assert_nearly_equals(expected_val, val);
        }
        fn error_parse(float_str: &str) {
            assert!(positive_float_number(float_str).is_err());
        }
        valid_parse("1.0", 1.0, "");
        valid_parse("1", 1.0, "");
        valid_parse("0.234234 aaa", 0.234234f64, " aaa");
        error_parse(".3332");
        // TODO trinity-1686a: I disagree that it should fail, I think it should succeed,
        // consuming only "1", and leave "." for the next thing (which will likely fail then)
        // error_parse("1.");
        error_parse("-1.");
    }

    // `relaxed_word` must consume full RFC 3339-style timestamps, including a timezone
    // offset and fractional seconds, as a single word.
    #[test]
    fn test_date_time() {
        let (remaining, val) =
            relaxed_word("2015-08-02T18:54:42+02:30").expect("cannot parse date");
        assert_eq!(val, "2015-08-02T18:54:42+02:30");
        assert_eq!(remaining, "");
        // this isn't a valid date, but relaxed_word allows it.
        // assert!(date_time().parse("2015-08-02T18:54:42+02").is_err());

        let (remaining, val) = relaxed_word("2021-04-13T19:46:26.266051969+00:00")
            .expect("cannot parse fractional date");
        assert_eq!(val, "2021-04-13T19:46:26.266051969+00:00");
        assert_eq!(remaining, "");
    }

    /// Asserts that both the strict and the lenient parser turn `query` into an AST whose
    /// `Debug` rendering is `expected`, and that the lenient parser reports no error.
    #[track_caller]
    fn test_parse_query_to_ast_helper(query: &str, expected: &str) {
        let (_, strict_ast) = parse_to_ast(query).unwrap();
        assert_eq!(format!("{strict_ast:?}"), expected, "strict parser failed");

        let (lenient_ast, errs) = parse_to_ast_lenient(query);
        assert_eq!(format!("{lenient_ast:?}"), expected, "lenient parser failed");
        assert!(
            errs.is_empty(),
            "lenient parser returned errors on valid query: {errs:?}"
        );
    }

    /// Asserts that the strict parser rejects `query`, while the lenient parser still yields
    /// an AST rendered as `lenient_expected` and reports at least one error.
    #[track_caller]
    fn test_is_parse_err(query: &str, lenient_expected: &str) {
        let strict_result = parse_to_ast(query);
        assert!(
            strict_result.is_err(),
            "strict parser succeeded where an error was expected."
        );

        let (lenient_ast, errs) = parse_to_ast_lenient(query);
        assert_eq!(
            format!("{lenient_ast:?}"),
            lenient_expected,
            "lenient parser failed"
        );
        assert!(!errs.is_empty());
    }

    // An empty query parses successfully, to the empty clause.
    #[test]
    fn test_parse_empty_to_ast() {
        test_parse_query_to_ast_helper("", "<emptyclause>");
    }

    // Hyphens, `?` and `*` inside a word or a quoted phrase stay part of that term.
    #[test]
    fn test_parse_query_to_ast_hyphen() {
        test_parse_query_to_ast_helper("\"www-form-encoded\"", "\"www-form-encoded\"");
        test_parse_query_to_ast_helper("'www-form-encoded'", "'www-form-encoded'");
        // NOTE(review): the bare-word case is asserted twice; presumably a leftover.
        test_parse_query_to_ast_helper("www-form-encoded", "www-form-encoded");
        test_parse_query_to_ast_helper("www-form-encoded", "www-form-encoded");
        test_parse_query_to_ast_helper("mr james bo?d", "(*mr *james *bo?d)");
        test_parse_query_to_ast_helper("mr james bo*", "(*mr *james *bo*)");
        test_parse_query_to_ast_helper("mr james b*d", "(*mr *james *b*d)");
    }

    // An unterminated double-quoted phrase is a strict error, but the lenient parser still
    // recovers the phrase.
    #[test]
    fn test_parse_query_lenient_unfinished_quote() {
        test_is_parse_err("\"www-form-encoded", "\"www-form-encoded\"");
        // TODO strict parser defaults to parsing a normal term, and parses "'www-form-encoded"
        // (note the initial \')
        // test_is_parse_err("'www-form-encoded", "'www-form-encoded'");
    }

    // `NOT` only acts as an operator when followed by whitespace and an operand.
    #[test]
    fn test_parse_query_to_ast_not_op() {
        test_is_parse_err("NOT", "NOT");
        test_parse_query_to_ast_helper("NOTa", "NOTa");
        test_parse_query_to_ast_helper("NOT a", "(-a)");
    }

    // `^<number>` boosts a leaf; a boost of 1 is dropped and chained or dangling `^` is an
    // error for the strict parser.
    #[test]
    fn test_boosting() {
        test_is_parse_err("a^2^3", "(a)^2");
        test_is_parse_err("a^2^", "(a)^2");
        test_parse_query_to_ast_helper("a^3", "(a)^3");
        test_parse_query_to_ast_helper("a^3 b^2", "(*(a)^3 *(b)^2)");
        test_parse_query_to_ast_helper("a^1", "a");
    }

    // `AND` / `OR` keywords, alone and mixed with operator-less terms. `AND`-joined terms
    // group together before being combined with their neighbours.
    #[test]
    fn test_parse_query_to_ast_binary_op() {
        test_parse_query_to_ast_helper("a AND b", "(+a +b)");
        test_parse_query_to_ast_helper("a\nAND b", "(+a +b)");
        test_parse_query_to_ast_helper("a OR b", "(?a ?b)");
        test_parse_query_to_ast_helper("a OR b AND c", "(?a ?(+b +c))");
        test_parse_query_to_ast_helper("a AND b         AND c", "(+a +b +c)");
        test_parse_query_to_ast_helper("a OR b aaa", "(?a ?b *aaa)");
        test_parse_query_to_ast_helper("a AND b aaa", "(?(+a +b) *aaa)");
        test_parse_query_to_ast_helper("aaa a OR b ", "(*aaa ?a ?b)");
        test_parse_query_to_ast_helper("aaa ccc a OR b ", "(*aaa *ccc ?a ?b)");
        test_parse_query_to_ast_helper("aaa a AND b ", "(*aaa ?(+a +b))");
        test_parse_query_to_ast_helper("aaa ccc a AND b ", "(*aaa *ccc ?(+a +b))");
    }

    // Mixing `AND` / `OR` / `NOT` keywords with the `+` / `-` occur prefixes.
    #[test]
    fn test_parse_mixed_bool_occur() {
        // An explicit prefix wins over the default implied by the keyword.
        test_parse_query_to_ast_helper("+a OR +b", "(+a +b)");

        test_parse_query_to_ast_helper("a AND -b", "(+a -b)");
        test_parse_query_to_ast_helper("-a AND b", "(-a +b)");
        test_parse_query_to_ast_helper("a AND NOT b", "(+a +(-b))");
        test_parse_query_to_ast_helper("NOT a AND b", "(+(-a) +b)");

        test_parse_query_to_ast_helper("a AND NOT b AND c", "(+a +(-b) +c)");
        test_parse_query_to_ast_helper("a AND -b AND c", "(+a -b +c)");

        // With `OR`, a negated operand becomes a "should not" entry.
        test_parse_query_to_ast_helper("a OR -b", "(?a ?(-b))");
        test_parse_query_to_ast_helper("-a OR b", "(?(-a) ?b)");
        test_parse_query_to_ast_helper("a OR NOT b", "(?a ?(-b))");
        test_parse_query_to_ast_helper("NOT a OR b", "(?(-a) ?b)");

        test_parse_query_to_ast_helper("a OR NOT b OR c", "(?a ?(-b) ?c)");
        test_parse_query_to_ast_helper("a OR -b OR c", "(?a ?(-b) ?c)");

        test_parse_query_to_ast_helper("a OR b +aaa", "(?a ?b +aaa)");
        test_parse_query_to_ast_helper("a AND b -aaa", "(?(+a +b) -aaa)");
        test_parse_query_to_ast_helper("+a OR +b aaa", "(+a +b *aaa)");
        test_parse_query_to_ast_helper("-a AND -b aaa", "(?(-a -b) *aaa)");
        test_parse_query_to_ast_helper("-aaa +ccc -a OR b ", "(-aaa +ccc ?(-a) ?b)");
    }

    // Comparison-style ranges (`>`, `>=`, `<`, `<=`), with and without a field name, with
    // optional whitespace, and nested inside parentheses.
    #[test]
    fn test_parse_elastic_query_ranges() {
        test_parse_query_to_ast_helper("title: >a", "\"title\":{\"a\" TO \"*\"}");
        test_parse_query_to_ast_helper("title:>=a", "\"title\":[\"a\" TO \"*\"}");
        test_parse_query_to_ast_helper("title: <a", "\"title\":{\"*\" TO \"a\"}");
        test_parse_query_to_ast_helper("title:<=a", "\"title\":{\"*\" TO \"a\"]");
        test_parse_query_to_ast_helper("title:<=bsd", "\"title\":{\"*\" TO \"bsd\"]");

        test_parse_query_to_ast_helper("weight: >70", "\"weight\":{\"70\" TO \"*\"}");
        test_parse_query_to_ast_helper("weight:>=70", "\"weight\":[\"70\" TO \"*\"}");
        test_parse_query_to_ast_helper("weight: <70", "\"weight\":{\"*\" TO \"70\"}");
        test_parse_query_to_ast_helper("weight:<=70", "\"weight\":{\"*\" TO \"70\"]");
        test_parse_query_to_ast_helper("weight: >60.7", "\"weight\":{\"60.7\" TO \"*\"}");

        test_parse_query_to_ast_helper("weight: <= 70", "\"weight\":{\"*\" TO \"70\"]");

        test_parse_query_to_ast_helper("weight: <= 70.5", "\"weight\":{\"*\" TO \"70.5\"]");

        // Same operators without a field name.
        test_parse_query_to_ast_helper(">a", "{\"a\" TO \"*\"}");
        test_parse_query_to_ast_helper(">=a", "[\"a\" TO \"*\"}");
        test_parse_query_to_ast_helper("<a", "{\"*\" TO \"a\"}");
        test_parse_query_to_ast_helper("<=a", "{\"*\" TO \"a\"]");
        test_parse_query_to_ast_helper("<=bsd", "{\"*\" TO \"bsd\"]");

        // Ranges inside parentheses must not swallow the closing `)`.
        test_parse_query_to_ast_helper("(<=42)", "{\"*\" TO \"42\"]");
        test_parse_query_to_ast_helper("(<=42 )", "{\"*\" TO \"42\"]");
        test_parse_query_to_ast_helper("(age:>5)", "\"age\":{\"5\" TO \"*\"}");
        test_parse_query_to_ast_helper(
            "(title:bar AND age:>12)",
            "(+\"title\":bar +\"age\":{\"12\" TO \"*\"})",
        );
    }

    // `occur_leaf` splits a `+` prefix from the leaf that follows it.
    #[test]
    fn test_occur_leaf() {
        let (_, (occur, ast)) = super::occur_leaf("+abc").unwrap();
        assert_eq!(occur, Some(Occur::Must));
        assert_eq!(format!("{ast:?}"), "abc");
    }

    // `field_name` parses everything up to and including the `:` separator and returns the
    // unescaped field name together with the remaining input.
    #[test]
    fn test_field_name() {
        assert_eq!(
            super::field_name(".my.field.name:a"),
            Ok(("a", ".my.field.name".to_string()))
        );
        assert_eq!(
            super::field_name(r#"にんじん:a"#),
            Ok(("a", "にんじん".to_string()))
        );
        // A backslash before an ordinary character is kept; a doubled backslash collapses.
        assert_eq!(
            super::field_name(r#"my\field:a"#),
            Ok(("a", r#"my\field"#.to_string()))
        );
        assert_eq!(
            super::field_name(r#"my\\field:a"#),
            Ok(("a", r#"my\field"#.to_string()))
        );
        assert!(super::field_name("my field:a").is_err());
        assert_eq!(
            super::field_name("\\(1\\+1\\):2"),
            Ok(("2", "(1+1)".to_string()))
        );
        assert_eq!(
            super::field_name("my_field_name:a"),
            Ok(("a", "my_field_name".to_string()))
        );
        assert_eq!(
            super::field_name("myfield.b:hello").unwrap(),
            ("hello", "myfield.b".to_string())
        );
        // An escaped dot keeps its backslash in the returned name.
        assert_eq!(
            super::field_name(r#"myfield\.b:hello"#).unwrap(),
            ("hello", r#"myfield\.b"#.to_string())
        );
        assert!(super::field_name("my_field_name").is_err());
        assert!(super::field_name(":a").is_err());
        assert!(super::field_name("-my_field:a").is_err());
        assert_eq!(
            super::field_name("_my_field:a"),
            Ok(("a", "_my_field".to_string()))
        );
        assert_eq!(
            super::field_name("~my~field:a"),
            Ok(("a", "~my~field".to_string()))
        );
        // Whitespace around the separator is consumed as well.
        assert_eq!(
            super::field_name(".my.field.name : a"),
            Ok(("a", ".my.field.name".to_string()))
        );
        // Every special character can be used in a field name once escaped.
        for special_char in SPECIAL_CHARS.iter() {
            let query = &format!("\\{special_char}my\\{special_char}field:a");
            assert_eq!(
                super::field_name(query),
                Ok(("a", format!("{special_char}my{special_char}field")))
            );
        }
    }

    // Exercises range parsing through the strict `literal` parser: the comparison syntax and
    // the bracket syntax must produce the same `UserInputLeaf::Range`.
    #[test]
    fn test_range_parser() {
        // testing the range() parser separately
        let res = literal("title: <hello")
            .expect("Cannot parse flexible bound word")
            .1;
        let expected = UserInputLeaf::Range {
            field: Some("title".to_string()),
            lower: UserInputBound::Unbounded,
            upper: UserInputBound::Exclusive("hello".to_string()),
        }
        .into();
        let res2 = literal("title:{* TO hello}")
            .expect("Cannot parse ununbounded to word")
            .1;
        assert_eq!(res, expected);
        assert_eq!(res2, expected);

        // Float bounds
        let expected_weight = UserInputLeaf::Range {
            field: Some("weight".to_string()),
            lower: UserInputBound::Inclusive("71.2".to_string()),
            upper: UserInputBound::Unbounded,
        }
        .into();
        let res3 = literal("weight: >=71.2")
            .expect("Cannot parse flexible bound float")
            .1;
        let res4 = literal("weight:[71.2 TO *}")
            .expect("Cannot parse float to unbounded")
            .1;
        assert_eq!(res3, expected_weight);
        assert_eq!(res4, expected_weight);

        // Date bounds
        let expected_dates = UserInputLeaf::Range {
            field: Some("date_field".to_string()),
            lower: UserInputBound::Exclusive("2015-08-02T18:54:42Z".to_string()),
            upper: UserInputBound::Inclusive("2021-08-02T18:54:42+02:30".to_string()),
        }
        .into();
        let res5 = literal("date_field:{2015-08-02T18:54:42Z TO 2021-08-02T18:54:42+02:30]")
            .expect("Cannot parse date range")
            .1;
        assert_eq!(res5, expected_dates);

        let expected_flexible_dates = UserInputLeaf::Range {
            field: Some("date_field".to_string()),
            lower: UserInputBound::Unbounded,
            upper: UserInputBound::Inclusive("2021-08-02T18:54:42.12345+02:30".to_string()),
        }
        .into();

        let res6 = literal("date_field: <=2021-08-02T18:54:42.12345+02:30")
            .expect("Cannot parse date range")
            .1;
        assert_eq!(res6, expected_flexible_dates);
        // IP Range Unbounded
        let expected_weight = UserInputLeaf::Range {
            field: Some("ip".to_string()),
            lower: UserInputBound::Inclusive("::1".to_string()),
            upper: UserInputBound::Unbounded,
        }
        .into();
        let res1 = literal("ip: >=::1").expect("Cannot parse ip v6 format").1;
        let res2 = literal("ip:[::1 TO *}")
            .expect("Cannot parse ip v6 format")
            .1;
        assert_eq!(res1, expected_weight);
        assert_eq!(res2, expected_weight);

        // IP Range Bounded
        let expected_weight = UserInputLeaf::Range {
            field: Some("ip".to_string()),
            lower: UserInputBound::Inclusive("::0.0.0.50".to_string()),
            upper: UserInputBound::Exclusive("::0.0.0.52".to_string()),
        }
        .into();
        let res1 = literal("ip:[::0.0.0.50 TO ::0.0.0.52}")
            .expect("Cannot parse ip v6 format")
            .1;
        assert_eq!(res1, expected_weight);
    }

    // Same range cases as the strict test, run through `literal_infallible`, followed by
    // truncated inputs that only the lenient parser is expected to recover from.
    #[test]
    fn test_range_parser_lenient() {
        // Shadows the strict `literal` parser: keeps only the parsed AST and drops the
        // remaining input and the error list.
        let literal = |query| literal_infallible(query).unwrap().1.0.unwrap();

        // same tests as non-lenient
        let res = literal("title: <hello");
        let expected = UserInputLeaf::Range {
            field: Some("title".to_string()),
            lower: UserInputBound::Unbounded,
            upper: UserInputBound::Exclusive("hello".to_string()),
        }
        .into();
        let res2 = literal("title:{* TO hello}");
        assert_eq!(res, expected);
        assert_eq!(res2, expected);

        let expected_weight = UserInputLeaf::Range {
            field: Some("weight".to_string()),
            lower: UserInputBound::Inclusive("71.2".to_string()),
            upper: UserInputBound::Unbounded,
        }
        .into();
        let res3 = literal("weight: >=71.2");
        let res4 = literal("weight:[71.2 TO *}");
        assert_eq!(res3, expected_weight);
        assert_eq!(res4, expected_weight);

        let expected_dates = UserInputLeaf::Range {
            field: Some("date_field".to_string()),
            lower: UserInputBound::Exclusive("2015-08-02T18:54:42Z".to_string()),
            upper: UserInputBound::Inclusive("2021-08-02T18:54:42+02:30".to_string()),
        }
        .into();
        let res5 = literal("date_field:{2015-08-02T18:54:42Z TO 2021-08-02T18:54:42+02:30]");
        assert_eq!(res5, expected_dates);

        let expected_flexible_dates = UserInputLeaf::Range {
            field: Some("date_field".to_string()),
            lower: UserInputBound::Unbounded,
            upper: UserInputBound::Inclusive("2021-08-02T18:54:42.12345+02:30".to_string()),
        }
        .into();

        let res6 = literal("date_field: <=2021-08-02T18:54:42.12345+02:30");
        assert_eq!(res6, expected_flexible_dates);
        // IP Range Unbounded
        let expected_weight = UserInputLeaf::Range {
            field: Some("ip".to_string()),
            lower: UserInputBound::Inclusive("::1".to_string()),
            upper: UserInputBound::Unbounded,
        }
        .into();
        let res1 = literal("ip: >=::1");
        let res2 = literal("ip:[::1 TO *}");
        assert_eq!(res1, expected_weight);
        assert_eq!(res2, expected_weight);

        // IP Range Bounded
        let expected_weight = UserInputLeaf::Range {
            field: Some("ip".to_string()),
            lower: UserInputBound::Inclusive("::0.0.0.50".to_string()),
            upper: UserInputBound::Exclusive("::0.0.0.52".to_string()),
        }
        .into();
        let res1 = literal("ip:[::0.0.0.50 TO ::0.0.0.52}");
        assert_eq!(res1, expected_weight);

        // additional tests
        // Missing closing bracket and/or missing `TO`: the upper bound ends up inclusive.
        let expected_weight = UserInputLeaf::Range {
            field: Some("ip".to_string()),
            lower: UserInputBound::Inclusive("::0.0.0.50".to_string()),
            upper: UserInputBound::Inclusive("::0.0.0.52".to_string()),
        }
        .into();
        let res1 = literal("ip:[::0.0.0.50 TO ::0.0.0.52");
        let res2 = literal("ip:[::0.0.0.50 ::0.0.0.52");
        let res3 = literal("ip:[::0.0.0.50 ::0.0.0.52 AND ...");
        assert_eq!(res1, expected_weight);
        assert_eq!(res2, expected_weight);
        assert_eq!(res3, expected_weight);

        // Missing upper bound: it is treated as unbounded.
        let expected_weight = UserInputLeaf::Range {
            field: Some("ip".to_string()),
            lower: UserInputBound::Inclusive("::0.0.0.50".to_string()),
            upper: UserInputBound::Unbounded,
        }
        .into();
        let res1 = literal("ip:[::0.0.0.50 TO ");
        let res2 = literal("ip:[::0.0.0.50 TO");
        let res3 = literal("ip:[::0.0.0.50");
        assert_eq!(res1, expected_weight);
        assert_eq!(res2, expected_weight);
        assert_eq!(res3, expected_weight);

        // Only the opening bracket: both bounds are unbounded.
        let expected_weight = UserInputLeaf::Range {
            field: Some("ip".to_string()),
            lower: UserInputBound::Unbounded,
            upper: UserInputBound::Unbounded,
        }
        .into();
        let res1 = literal("ip:[ ");
        let res2 = literal("ip:{ ");
        let res3 = literal("ip:[");
        assert_eq!(res1, expected_weight);
        assert_eq!(res2, expected_weight);
        assert_eq!(res3, expected_weight);
        // we don't test ip: as that is not a valid range request as per precondition
    }

    // Extra whitespace around terms, operators and parentheses does not change the AST; a
    // missing closing parenthesis is an error for the strict parser only.
    #[test]
    fn test_parse_query_to_trimming_spaces() {
        test_parse_query_to_ast_helper("   abc", "abc");
        test_parse_query_to_ast_helper("abc ", "abc");
        test_parse_query_to_ast_helper("(  a OR abc)", "(?a ?abc)");
        test_parse_query_to_ast_helper("(a  OR abc)", "(?a ?abc)");
        test_parse_query_to_ast_helper("(a OR  abc)", "(?a ?abc)");
        test_parse_query_to_ast_helper("a OR abc ", "(?a ?abc)");
        test_parse_query_to_ast_helper("(a OR abc )", "(?a ?abc)");
        test_parse_query_to_ast_helper("(a OR  abc) ", "(?a ?abc)");
        test_is_parse_err("(a OR  abc ", "(?a ?abc)");
    }

    /// Checks that a field applied to a parenthesized group is attached to every
    /// term of that group in the expected AST rendering.
    #[test]
    fn test_parse_query_term_group() {
        // (query, expected AST rendering)
        let grouped_queries = [
            (r#"field:(abc)"#, r#""field":abc"#),
            (r#"field:(+a -"b c")"#, r#"(+"field":a -"field":"b c")"#),
            (r#"field:(a AND "b c")"#, r#"(+"field":a +"field":"b c")"#),
            (r#"field:(a OR "b c")"#, r#"(?"field":a ?"field":"b c")"#),
            (
                r#"field:(a OR (b AND c))"#,
                r#"(?"field":a ?(+"field":b +"field":c))"#,
            ),
            (
                r#"field:(a [b TO c])"#,
                r#"(*"field":a *"field":["b" TO "c"])"#,
            ),
        ];
        for (query, expected) in grouped_queries {
            test_parse_query_to_ast_helper(query, expected);
        }

        // Same group as above, but the closing parenthesis is missing.
        test_is_parse_err(r#"field:(+a -"b c""#, r#"(+"field":a -"field":"b c")"#);
    }

    /// A term inside a field group may name its own field (`b:cde`), which is the
    /// one expected in the AST rendering for that term.
    #[test]
    fn field_re_specification() {
        let query = r#"field:(abc AND b:cde)"#;
        let expected = r#"(+"field":abc +"b":cde)"#;
        test_parse_query_to_ast_helper(query, expected);
    }

    /// A bare term is expected to render as itself.
    #[test]
    fn test_parse_query_single_term() {
        let query = "abc";
        let expected = "abc";
        test_parse_query_to_ast_helper(query, expected);
    }

    /// Two space-separated terms are expected to render as a clause whose
    /// entries carry the `*` marker.
    #[test]
    fn test_parse_query_default_clause() {
        let query = "a b";
        let expected = "(*a *b)";
        test_parse_query_to_ast_helper(query, expected);
    }

    /// A lone `+`-prefixed group is expected to render like the group itself.
    #[test]
    fn test_parse_query_must_default_clause() {
        let query = "+(a b)";
        let expected = "(*a *b)";
        test_parse_query_to_ast_helper(query, expected);
    }

    /// A lone `+`-prefixed term is expected to render as the bare term.
    #[test]
    fn test_parse_query_must_single_term() {
        let query = "+d";
        let expected = "d";
        test_parse_query_to_ast_helper(query, expected);
    }

    /// A `field:term` query is expected to render with the field name quoted.
    #[test]
    fn test_single_term_with_field() {
        let query = "abc:toto";
        let expected = "\"abc\":toto";
        test_parse_query_to_ast_helper(query, expected);
    }

    /// Fielded phrases are expected to keep the quote style they were written with.
    #[test]
    fn test_phrase_with_field() {
        // (query, expected AST rendering)
        let fielded_phrases = [
            ("abc:\"happy tax payer\"", "\"abc\":\"happy tax payer\""),
            ("abc:'happy tax payer'", "\"abc\":'happy tax payer'"),
        ];
        for (query, expected) in fielded_phrases {
            test_parse_query_to_ast_helper(query, expected);
        }
    }

    /// Float-looking terms with plain, dotted and space-escaped field names.
    #[test]
    fn test_single_term_with_float() {
        // (query, expected AST rendering)
        let float_queries = [
            ("abc:1.1", "\"abc\":1.1"),
            ("a.b.c:1.1", "\"a.b.c\":1.1"),
            ("a\\ b\\ c:1.1", "\"a b c\":1.1"),
        ];
        for (query, expected) in float_queries {
            test_parse_query_to_ast_helper(query, expected);
        }
    }

    /// A group of `+`-prefixed terms is expected to render unchanged.
    #[test]
    fn test_must_clause() {
        let query = "(+a +b)";
        let expected = "(+a +b)";
        test_parse_query_to_ast_helper(query, expected);
    }

    /// A `+`-prefixed group followed by a `+`-prefixed term.
    #[test]
    fn test_parse_test_query_plus_a_b_plus_d() {
        let query = "+(a b) +d";
        let expected = "(+(*a *b) +d)";
        test_parse_query_to_ast_helper(query, expected);
    }

    /// `IN [...]` set queries, with and without a field, plus an unclosed set.
    #[test]
    fn test_parse_test_query_set() {
        // (query, expected AST rendering)
        let set_queries = [
            ("abc: IN [a b c]", r#""abc": IN ["a" "b" "c"]"#),
            ("abc: IN [1]", r#""abc": IN ["1"]"#),
            ("abc: IN []", r#""abc": IN []"#),
            ("IN [1 2]", r#"IN ["1" "2"]"#),
        ];
        for (query, expected) in set_queries {
            test_parse_query_to_ast_helper(query, expected);
        }

        // The closing bracket is missing here.
        test_is_parse_err("IN [1 2", r#"IN ["1" "2"]"#);

        // TODO maybe support these too?
        // test_is_parse_err("IN (1 2", r#"IN ["1" "2"]"#);
        // test_is_parse_err("IN {1 2", r#"IN ["1" "2"]"#);
    }

    /// Assorted queries: occurrence prefixes, escaped field names, ranges,
    /// `*`-decorated terms and regexes inside field groups.
    #[test]
    fn test_parse_test_query_other() {
        // (query, expected AST rendering)
        let occurrence_queries = [
            ("(+a +b) d", "(*(+a +b) *d)"),
            ("+abc:toto", "\"abc\":toto"),
            ("+a\\+b\\+c:toto", "\"a+b+c\":toto"),
            ("(+abc:toto -titi)", "(+\"abc\":toto -titi)"),
            ("-abc:toto", "(-\"abc\":toto)"),
        ];
        for (query, expected) in occurrence_queries {
            test_parse_query_to_ast_helper(query, expected);
        }

        // TODO not entirely sure about this one (it's seen as a NOT '-abc:toto')
        test_is_parse_err("--abc:toto", "(--abc:toto)");

        let field_queries = [
            ("abc:a b", "(*\"abc\":a *b)"),
            ("abc:\"a b\"", "\"abc\":\"a b\""),
            ("foo:[1 TO 5]", "\"foo\":[\"1\" TO \"5\"]"),
        ];
        for (query, expected) in field_queries {
            test_parse_query_to_ast_helper(query, expected);
        }

        // Phrase prefixed with *
        let star_queries = [
            ("foo:(*A)", "\"foo\":*A"),
            ("*A", "*A"),
            ("(*A)", "*A"),
            ("foo:(A OR B)", "(?\"foo\":A ?\"foo\":B)"),
            ("foo:(A* OR B*)", "(?\"foo\":A* ?\"foo\":B*)"),
            ("foo:(*A OR *B)", "(?\"foo\":*A ?\"foo\":*B)"),
        ];
        for (query, expected) in star_queries {
            test_parse_query_to_ast_helper(query, expected);
        }

        // Regexes between parentheses
        let regex_queries = [
            ("foo:(/A.*/)", "\"foo\":/A.*/"),
            ("foo:(/A.*/ OR /B.*/)", "(?\"foo\":/A.*/ ?\"foo\":/B.*/)"),
        ];
        for (query, expected) in regex_queries {
            test_parse_query_to_ast_helper(query, expected);
        }
    }

    /// A lone `*`, with or without parentheses, is expected to render as `*`.
    #[test]
    fn test_parse_query_all() {
        let expected = "*";
        for query in ["*", "(*)", "(* )"] {
            test_parse_query_to_ast_helper(query, expected);
        }
    }

    /// Range queries with inclusive, exclusive and `*` bounds, followed by a
    /// query ending in a dangling `+`.
    #[test]
    fn test_parse_query_with_range() {
        // (query, expected AST rendering)
        let range_queries = [
            ("[1 TO 5]", "[\"1\" TO \"5\"]"),
            ("foo:{a TO z}", "\"foo\":{\"a\" TO \"z\"}"),
            ("foo:[1 TO toto}", "\"foo\":[\"1\" TO \"toto\"}"),
            ("foo:[* TO toto}", "\"foo\":{\"*\" TO \"toto\"}"),
            ("foo:[1 TO *}", "\"foo\":[\"1\" TO \"*\"}"),
            (
                "1.2.foo.bar:[1.1 TO *}",
                "\"1.2.foo.bar\":[\"1.1\" TO \"*\"}",
            ),
        ];
        for (query, expected) in range_queries {
            test_parse_query_to_ast_helper(query, expected);
        }

        test_is_parse_err("abc +    ", "abc");
    }

    /// Slop (`~N`) handling: first the inputs passed to `test_is_parse_err`,
    /// then the inputs with an expected AST rendering.
    #[test]
    fn test_slop() {
        // (query, second argument handed to `test_is_parse_err`)
        let rejected_slops = [
            ("\"a b\"~", "(*\"a b\" *~)"),
            ("foo:\"a b\"~", "(*\"foo\":\"a b\" *~)"),
            ("\"a b\"~a", "(*\"a b\" *~a)"),
            (
                "\"a b\"~100000000000000000",
                "(*\"a b\" *~100000000000000000)",
            ),
        ];
        for (query, lenient_expected) in rejected_slops {
            test_is_parse_err(query, lenient_expected);
        }

        // (query, expected AST rendering)
        let accepted_slops = [
            ("\"a b\"^2 ~4", "(*(\"a b\")^2 *~4)"),
            ("\"a b\"~4^2", "(\"a b\"~4)^2"),
            ("\"~Document\"", "\"~Document\""),
            ("~Document", "~Document"),
            ("a~2", "a~2"),
            ("\"a b\"~0", "\"a b\""),
            ("\"a b\"~1", "\"a b\"~1"),
            ("\"a b\"~3", "\"a b\"~3"),
            ("foo:\"a b\"~300", "\"foo\":\"a b\"~300"),
            ("\"a b\"~300^2", "(\"a b\"~300)^2"),
        ];
        for (query, expected) in accepted_slops {
            test_parse_query_to_ast_helper(query, expected);
        }
    }

    /// Quoted phrases followed by `*`, with and without a field.
    #[test]
    fn test_phrase_prefix() {
        // (query, expected AST rendering)
        let prefix_queries = [
            ("\"a b\"*", "\"a b\"*"),
            ("\"a\"*", "\"a\"*"),
            ("\"\"*", "\"\"*"),
            ("foo:\"a b\"*", "\"foo\":\"a b\"*"),
            ("foo:\"a\"*", "\"foo\":\"a\"*"),
            ("foo:\"\"*", "\"foo\":\"\"*"),
        ];
        for (query, expected) in prefix_queries {
            test_parse_query_to_ast_helper(query, expected);
        }
    }

    /// `field:*` is expected to render as `$exists("field")`, whereas a `*`
    /// attached to a term stays part of that term.
    #[test]
    fn test_exist_query() {
        // (query, expected AST rendering)
        let exists_queries = [
            ("a:*", "$exists(\"a\")"),
            ("a: *", "$exists(\"a\")"),
            (
                "(hello AND toto:*) OR happy",
                "(?(+hello +$exists(\"toto\")) ?happy)",
            ),
            ("(a:*)", "$exists(\"a\")"),
        ];
        for (query, expected) in exists_queries {
            test_parse_query_to_ast_helper(query, expected);
        }

        // these are term/wildcard query (not a phrase prefix)
        let wildcard_queries = [
            ("a:b*", "\"a\":b*"),
            ("a:*b", "\"a\":*b"),
            (r#"a:*def*"#, "\"a\":*def*"),
        ];
        for (query, expected) in wildcard_queries {
            test_parse_query_to_ast_helper(query, expected);
        }
    }

    /// The `-term` and `NOT term` spellings share one expected AST rendering.
    #[test]
    fn test_not_queries_are_consistent() {
        let expected = "(*tata -toto)";
        for query in ["tata -toto", "tata NOT toto"] {
            test_parse_query_to_ast_helper(query, expected);
        }
    }

    /// Escaped quotes inside quoted phrases, and a backslash before a character
    /// that needs no escaping.
    #[test]
    fn test_escaping() {
        // (query, expected AST rendering)
        let escaped_quotes = [
            (
                r#"myfield:"hello\"happy\'tax""#,
                r#""myfield":"hello"happy'tax""#,
            ),
            (
                r#"myfield:'hello\"happy\'tax'"#,
                r#""myfield":'hello"happy'tax'"#,
            ),
        ];
        for (query, expected) in escaped_quotes {
            test_parse_query_to_ast_helper(query, expected);
        }

        // we don't process escape sequence for chars which don't require it
        let unneeded_escape = r#"abc\*"#;
        test_parse_query_to_ast_helper(unneeded_escape, r#"abc\*"#);
    }

    /// Colons inside quotes, or escaped with a backslash, are expected to end up
    /// in the term rather than acting as a field separator.
    #[test]
    fn test_queries_with_colons() {
        // (query, expected AST rendering)
        let colon_queries = [
            (r#""abc:def""#, r#""abc:def""#),
            (r#"'abc:def'"#, r#"'abc:def'"#),
            (r#"abc\:def"#, r#"abc:def"#),
            (r#""abc\:def""#, r#""abc:def""#),
            (r#"'abc\:def'"#, r#"'abc:def'"#),
        ];
        for (query, expected) in colon_queries {
            test_parse_query_to_ast_helper(query, expected);
        }
    }

    /// A field name starting with `!` is handed to `test_is_parse_err`.
    #[test]
    fn test_invalid_field() {
        let query = r#"!bc:def"#;
        let lenient_expected = "!bc:def";
        test_is_parse_err(query, lenient_expected);
    }

    /// Parses `a:/…/` queries with `parse_to_ast` and checks that the result is a
    /// regex leaf on field `a` carrying the expected pattern.
    #[test]
    fn test_regex_parser() {
        // Parses `query` and asserts it is a single regex leaf on field "a"
        // whose pattern equals `expected_pattern`.
        let assert_regex_on_field_a = |query: &str, expected_pattern: &str| {
            let r = parse_to_ast(query);
            assert!(r.is_ok(), "Failed to parse custom query: {r:?}");
            let (_, input) = r.unwrap();
            let leaf = match input {
                UserInputAst::Leaf(leaf) => leaf,
                _ => panic!("Expected a leaf"),
            };
            match leaf.as_ref() {
                UserInputLeaf::Regex { field, pattern } => {
                    assert_eq!(field, &Some("a".to_string()));
                    assert_eq!(pattern, expected_pattern);
                }
                _ => panic!("Expected a regex leaf, got {leaf:?}"),
            }
        };

        assert_regex_on_field_a(r#"a:/joh?n(ath[oa]n)/"#, "joh?n(ath[oa]n)");
        // Backslash-escaped slashes inside the regex body.
        assert_regex_on_field_a(r#"a:/\\/cgi-bin\\/luci.*/"#, "\\/cgi-bin\\/luci.*");
    }

    /// Runs `literal_infallible` on a well-formed regex and on one missing its
    /// closing `/`, checking both the produced leaf and the reported errors.
    #[test]
    fn test_regex_parser_lenient() {
        let literal = |query| literal_infallible(query).unwrap().1;

        // Well-formed regex: no error expected.
        let expected = UserInputLeaf::Regex {
            field: Some("a".to_string()),
            pattern: "joh?n(ath[oa]n)".to_string(),
        }
        .into();
        let (res, errs) = literal(r#"a:/joh?n(ath[oa]n)/"#);
        assert_eq!(res.unwrap(), expected);
        assert!(errs.is_empty(), "Expected no errors, got: {errs:?}");

        // Closing delimiter missing: the regex is still produced, with one error.
        let expected = UserInputLeaf::Regex {
            field: Some("title".to_string()),
            pattern: "joh?n(ath[oa]n)".to_string(),
        }
        .into();
        let (res, errs) = literal("title:/joh?n(ath[oa]n)");
        assert_eq!(res.unwrap(), expected);
        assert_eq!(errs.len(), 1, "Expected 1 error, got: {errs:?}");
        let first_error = &errs[0];
        assert_eq!(
            first_error.message, "missing delimiter /",
            "Unexpected error message",
        );
    }

    /// Whitespace around the `:` separating field and value.
    #[test]
    fn test_space_before_value() {
        // (query, expected AST rendering)
        let spaced_queries = [
            ("field : a", r#""field":a"#),
            ("field:    a", r#""field":a"#),
            ("field         :a", r#""field":a"#),
            (
                "field : 'happy tax payer' AND other_field  : 1",
                r#"(+"field":'happy tax payer' +"other_field":1)"#,
            ),
        ];
        for (query, expected) in spaced_queries {
            test_parse_query_to_ast_helper(query, expected);
        }
    }
}


================================================
FILE: query-grammar/src/user_input_ast.rs
================================================
use std::fmt;
use std::fmt::{Debug, Formatter};

use serde::Serialize;

use crate::Occur;

/// A leaf node of the user query AST.
///
/// Serialized as an internally tagged object: the variant name, in snake_case,
/// is stored under the `"type"` key.
#[derive(PartialEq, Eq, Hash, Clone, Serialize)]
#[serde(tag = "type")]
#[serde(rename_all = "snake_case")]
pub enum UserInputLeaf {
    /// A term or phrase, see [`UserInputLiteral`].
    Literal(UserInputLiteral),
    /// The `*` leaf.
    All,
    /// A range between two bounds, optionally restricted to a field.
    Range {
        /// Field the range applies to, if one was given.
        field: Option<String>,
        /// Lower bound of the range.
        lower: UserInputBound,
        /// Upper bound of the range.
        upper: UserInputBound,
    },
    /// An `IN [...]` set of elements, optionally restricted to a field.
    Set {
        /// Field the set applies to, if one was given.
        field: Option<String>,
        /// Elements of the set, in the order they were written.
        elements: Vec<String>,
    },
    /// An existence check on a field; the field is mandatory.
    Exists {
        /// Field whose existence is checked.
        field: String,
    },
    /// A regular expression, optionally restricted to a field.
    Regex {
        /// Field the regex applies to, if one was given.
        field: Option<String>,
        /// The pattern, without its surrounding `/` delimiters.
        pattern: String,
    },
}

impl UserInputLeaf {
    pub(crate) fn set_field(self, field: Option<String>) -> Self {
        match self {
            UserInputLeaf::Literal(mut literal) => {
                literal.field_name = field;
                UserInputLeaf::Literal(literal)
            }
            UserInputLeaf::All => UserInputLeaf::All,
            UserInputLeaf::Range {
                field: _,
                lower,
                upper,
            } => UserInputLeaf::Range {
                field,
                lower,
                upper,
            },
            UserInputLeaf::Set { field: _, elements } => UserInputLeaf::Set { field, elements },
            UserInputLeaf::Exists { field: _ } => UserInputLeaf::Exists {
                field: field.expect("Exist query without a field isn't allowed"),
            },
            UserInputLeaf::Regex { field: _, pattern } => UserInputLeaf::Regex { field, pattern },
        }
    }

    pub(crate) fn set_default_field(&mut self, default_field: String) {
        match self {
            UserInputLeaf::Literal(literal) if literal.field_name.is_none() => {
                literal.field_name = Some(default_field)
            }
            UserInputLeaf::All => {
                *self = UserInputLeaf::Exists {
                    field: default_field,
                }
            }
            UserInputLeaf::Range { field, .. } if field.is_none() => *field = Some(default_field),
            UserInputLeaf::Set { field, .. } if field.is_none() => *field = Some(default_field),
            UserInputLeaf::Regex { field, .. } if field.is_none() => *field = Some(default_field),
            _ => (), // field was already set, do nothing
        }
    }
}

impl Debug for UserInputLeaf {
    fn fmt(&self, formatter: &mut Formatter) -> Result<(), fmt::Error> {
        match self {
            UserInputLeaf::Literal(literal) => literal.fmt(formatter),
            UserInputLeaf::Range {
                field,
                lower,
                upper,
            } => {
                if let Some(field) = field {
                    // TODO properly escape field (in case of \")
                    write!(formatter, "\"{field}\":")?;
                }
                lower.display_lower(formatter)?;
                write!(formatter, " TO ")?;
                upper.display_upper(formatter)?;
                Ok(())
            }
            UserInputLeaf::Set { field, elements } => {
                if let Some(field) = field {
                    // TODO properly escape field (in case of \")
                    write!(formatter, "\"{field}\": ")?;
                }
                write!(formatter, "IN [")?;
                for (i, text) in elements.iter().enumerate() {
                    if i != 0 {
                        write!(formatter, " ")?;
                    }
                    // TODO properly escape element
                    write!(formatter, "\"{text}\"")?;
                }
                write!(formatter, "]")
            }
            UserInputLeaf::All => write!(formatter, "*"),
            UserInputLeaf::Exists { field } => {
                write!(formatter, "$exists(\"{field}\")")
            }
            UserInputLeaf::Regex { field, pattern } => {
                if let Some(field) = field {
                    // TODO properly escape field (in case of \")
                    write!(formatter, "\"{field}\":")?;
                }
                // TODO properly escape pattern (in case of \")
                write!(formatter, "/{pattern}/")
            }
        }
    }
}

/// Kind of quoting attached to a [`UserInputLiteral`] phrase.
///
/// Serialized as the snake_case variant name.
#[derive(Copy, Clone, Eq, PartialEq, Hash, Debug, Serialize)]
#[serde(rename_all = "snake_case")]
pub enum Delimiter {
    /// The phrase is rendered between single quotes (`'…'`).
    SingleQuotes,
    /// The phrase is rendered between double quotes (`"…"`).
    DoubleQuotes,
    /// The phrase is rendered without quotes.
    None,
}

/// A term or phrase of the user query, with its optional field and modifiers.
#[derive(PartialEq, Eq, Hash, Clone, Serialize)]
#[serde(rename_all = "snake_case")]
pub struct UserInputLiteral {
    /// Field the literal applies to, if any.
    pub field_name: Option<String>,
    /// Text of the term or phrase, without its delimiters.
    pub phrase: String,
    /// Quoting used when rendering the phrase.
    pub delimiter: Delimiter,
    /// Slop value; rendered as a `~slop` suffix when greater than zero.
    pub slop: u32,
    /// Prefix flag; rendered as a `*` suffix when `slop` is zero.
    pub prefix: bool,
}

impl fmt::Debug for UserInputLiteral {
    /// Writes the literal as `"field":phrase`, followed by either `~slop` (when
    /// the slop is non-zero) or `*` (when the literal is a prefix).
    ///
    /// Neither the field nor the phrase is escaped.
    fn fmt(&self, formatter: &mut fmt::Formatter) -> Result<(), fmt::Error> {
        if let Some(field) = self.field_name.as_ref() {
            // TODO properly escape field (in case of \")
            write!(formatter, "\"{field}\":")?;
        }
        match self.delimiter {
            // TODO properly escape element (in case of \')
            Delimiter::SingleQuotes => write!(formatter, "'{}'", self.phrase)?,
            // TODO properly escape element (in case of \")
            Delimiter::DoubleQuotes => write!(formatter, "\"{}\"", self.phrase)?,
            // TODO properly escape element
            Delimiter::None => write!(formatter, "{}", self.phrase)?,
        }
        // A non-zero slop takes precedence over the prefix marker.
        match (self.slop, self.prefix) {
            (0, false) => Ok(()),
            (0, true) => write!(formatter, "*"),
            _ => write!(formatter, "~{}", self.slop),
        }
    }
}

/// One end of a range in the user query.
///
/// Serialized as an adjacently tagged object: the snake_case variant name is
/// stored under `"type"` and the bound's text, if any, under `"value"`.
#[derive(PartialEq, Eq, Hash, Debug, Clone, Serialize)]
#[serde(tag = "type", content = "value")]
#[serde(rename_all = "snake_case")]
pub enum UserInputBound {
    /// The bound value itself is part of the range.
    Inclusive(String),
    /// The bound value itself is excluded from the range.
    Exclusive(String),
    /// No bound on this side of the range.
    Unbounded,
}

impl UserInputBound {
    fn display_lower(&self, formatter: &mut fmt::Formatter) -> Result<(), fmt::Error> {
        match *self {
            // TODO properly escape word if required
            UserInputBound::Inclusive(ref word) => write!(formatter, "[\"{word}\""),
            UserInputBound::Exclusive(ref word) => write!(formatter, "{{\"{word}\""),
            UserInputBound::Unbounded => write!(formatter, "{{\"*\""),
        }
    }

    fn display_upper(&self, formatter: &mut fmt::Formatter) -> Result<(), fmt::Error> {
        match *self {
            // TODO properly escape word if required
            UserInputBound::Inclusive(ref word) => write!(formatter, "\"{word}\"]"),
            UserInputBound::Exclusive(ref word) => write!(formatter, "\"{word}\"}}"),
            UserInputBound::Unbounded => write!(formatter, "\"*\"}}"),
        }
    }

    pub fn term_str(&self) -> &str {
        match *self {
            UserInputBound::Inclusive(ref contents) => contents,
            UserInputBound::Exclusive(ref contents) => contents,
            UserInputBound::Unbounded => "*",
        }
    }
}

/// The AST of a user query.
///
/// Serialization goes through `UserInputAstSerde` (see the `serde(into)` attribute).
#[derive(PartialEq, Eq, Hash, Clone, Serialize)]
#[serde(into = "UserInputAstSerde")]
pub enum UserInputAst {
    /// A list of sub-queries, each with an optional occurrence marker.
    Clause(Vec<(Option<Occur>, UserInputAst)>),
    /// A sub-query together with its boost value.
    Boost(Box<UserInputAst>, ordered_float::OrderedFloat<f64>),
    /// A single leaf.
    Leaf(Box<UserInputLeaf>),
}

/// Serialization-only mirror of [`UserInputAst`].
///
/// `Bool` and `Boost` are internally tagged under `"type"` with snake_case
/// names; `Leaf` is untagged, so a leaf serializes exactly as the wrapped
/// [`UserInputLeaf`].
#[derive(Serialize)]
#[serde(tag = "type", rename_all = "snake_case")]
enum UserInputAstSerde {
    /// Counterpart of `UserInputAst::Clause`.
    Bool {
        /// The sub-queries with their optional occurrence markers.
        clauses: Vec<(Option<Occur>, UserInputAst)>,
    },
    /// Counterpart of `UserInputAst::Boost`.
    Boost {
        /// The boosted sub-query.
        underlying: Box<UserInputAst>,
        /// The boost value as a plain `f64`.
        boost: f64,
    },
    /// Counterpart of `UserInputAst::Leaf`.
    #[serde(untagged)]
    Leaf(Box<UserInputLeaf>),
}

impl From<UserInputAst> for UserInputAstSerde {
    fn from(ast: UserInputAst) -> Self {
        match ast {
            UserInputAst::Clause(clause) => UserInputAstSerde::Bool { clauses: clause },
            UserInputAst::Boost(underlying, boost) => UserInputAstSerde::Boost {
                underlying,
                boost: boost.into_inner(),
            },
            UserInputAst::Leaf(leaf) => UserInputAstSerde::Leaf(leaf),
        }
    }
}

impl UserInputAst {
    /// Wraps `self` into a single-entry clause carrying `occur`.
    #[must_use]
    pub fn unary(self, occur: Occur) -> UserInputAst {
        let only_entry = (Some(occur), self);
        Self::Clause(vec![only_entry])
    }

    /// Combines `asts` under a common `occur`.
    ///
    /// A single AST is returned as-is; several are wrapped in a clause where
    /// each entry carries `occur`.
    ///
    /// # Panics
    ///
    /// Panics if `occur` is `Occur::MustNot` or if `asts` is empty.
    fn compose(occur: Occur, asts: Vec<UserInputAst>) -> UserInputAst {
        assert_ne!(occur, Occur::MustNot);
        assert!(!asts.is_empty());
        let mut asts = asts;
        match asts.len() {
            // Exactly one element, so `pop` cannot return `None`.
            1 => asts.pop().unwrap(),
            _ => {
                let clauses: Vec<_> = asts.into_iter().map(|ast| (Some(occur), ast)).collect();
                Self::Clause(clauses)
            }
        }
    }

    /// Returns a clause without any sub-query.
    pub fn empty_query() -> UserInputAst {
        Self::Clause(Vec::new())
    }

    /// Combines `asts` with `Occur::Must`.
    ///
    /// # Panics
    ///
    /// Panics if `asts` is empty.
    pub fn and(asts: Vec<UserInputAst>) -> UserInputAst {
        Self::compose(Occur::Must, asts)
    }

    /// Combines `asts` with `Occur::Should`.
    ///
    /// # Panics
    ///
    /// Panics if `asts` is empty.
    pub fn or(asts: Vec<UserInputAst>) -> UserInputAst {
        Self::compose(Occur::Should, asts)
    }

    /// Recursively applies `field` as the default field of every leaf reachable
    /// from this node.
    pub(crate) fn set_default_field(&mut self, field: String) {
        match self {
            Self::Leaf(leaf) => leaf.set_default_field(field),
            Self::Boost(ast, _) => ast.set_default_field(field),
            Self::Clause(clauses) => {
                for (_, ast) in clauses {
                    ast.set_default_field(field.clone());
                }
            }
        }
    }
}

impl From<UserInputLiteral> for UserInputLeaf {
    fn from(literal: UserInputLiteral) -> UserInputLeaf {
        UserInputLeaf::Literal(literal)
    }
}

impl From<UserInputLeaf> for UserInputAst {
    fn from(leaf: UserInputLeaf) -> UserInputAst {
        UserInputAst::Leaf(Box::new(leaf))
    }
}

/// Writes `ast` prefixed by its occurrence marker, or by `*` when it has none.
fn print_occur_ast(
    occur_opt: Option<Occur>,
    ast: &UserInputAst,
    formatter: &mut fmt::Formatter,
) -> fmt::Result {
    match occur_opt {
        Some(occur) => write!(formatter, "{occur}{ast:?}"),
        None => write!(formatter, "*{ast:?}"),
    }
}

impl fmt::Debug for UserInputAst {
    /// Writes the AST in a query-like textual form.
    ///
    /// Clauses are parenthesized with space-separated entries, boosts are
    /// written as `(inner)^boost`, and leaves use their own `Debug` output.
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        match self {
            // TODO this will break ast reserialization, is writing "( )" enough?
            Self::Clause(subqueries) if subqueries.is_empty() => {
                write!(formatter, "<emptyclause>")
            }
            Self::Clause(subqueries) => {
                write!(formatter, "(")?;
                for (position, subquery) in subqueries.iter().enumerate() {
                    // Entries are separated by one space, with none before the first.
                    if position > 0 {
                        write!(formatter, " ")?;
                    }
                    print_occur_ast(subquery.0, &subquery.1, formatter)?;
                }
                write!(formatter, ")")
            }
            Self::Leaf(subquery) => write!(formatter, "{subquery:?}"),
            Self::Boost(leaf, boost) => write!(formatter, "({leaf:?})^{boost}"),
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Serializes `ast` to its JSON string, panicking if serialization fails.
    fn to_json(ast: &UserInputAst) -> String {
        serde_json::to_string(ast).unwrap()
    }

    /// Builds the `All` leaf wrapped in an AST node.
    fn all_leaf() -> UserInputAst {
        UserInputAst::Leaf(Box::new(UserInputLeaf::All))
    }

    /// Builds the unquoted literal `hello` on field `title`, wrapped in an AST node.
    fn title_hello_leaf() -> UserInputAst {
        let literal = UserInputLiteral {
            field_name: Some("title".to_string()),
            phrase: "hello".to_string(),
            delimiter: Delimiter::None,
            slop: 0,
            prefix: false,
        };
        UserInputAst::Leaf(Box::new(UserInputLeaf::Literal(literal)))
    }

    /// Builds the clause `[must all, should title:hello]`.
    fn must_all_should_hello() -> UserInputAst {
        UserInputAst::Clause(vec![
            (Some(Occur::Must), all_leaf()),
            (Some(Occur::Should), title_hello_leaf()),
        ])
    }

    /// Builds a range on field `price` with an inclusive lower bound of `10`.
    fn price_range_from_10(upper: UserInputBound) -> UserInputAst {
        let range = UserInputLeaf::Range {
            field: Some("price".to_string()),
            lower: UserInputBound::Inclusive("10".to_string()),
            upper,
        };
        UserInputAst::Leaf(Box::new(range))
    }

    #[test]
    fn test_all_leaf_serialization() {
        assert_eq!(to_json(&all_leaf()), r#"{"type":"all"}"#);
    }

    #[test]
    fn test_literal_leaf_serialization() {
        assert_eq!(
            to_json(&title_hello_leaf()),
            r#"{"type":"literal","field_name":"title","phrase":"hello","delimiter":"none","slop":0,"prefix":false}"#
        );
    }

    #[test]
    fn test_range_leaf_serialization() {
        let ast = price_range_from_10(UserInputBound::Exclusive("100".to_string()));
        assert_eq!(
            to_json(&ast),
            r#"{"type":"range","field":"price","lower":{"type":"inclusive","value":"10"},"upper":{"type":"exclusive","value":"100"}}"#
        );
    }

    #[test]
    fn test_range_leaf_unbounded_serialization() {
        let ast = price_range_from_10(UserInputBound::Unbounded);
        assert_eq!(
            to_json(&ast),
            r#"{"type":"range","field":"price","lower":{"type":"inclusive","value":"10"},"upper":{"type":"unbounded"}}"#
        );
    }

    #[test]
    fn test_boost_serialization() {
        let boost_ast = UserInputAst::Boost(Box::new(all_leaf()), 2.5.into());
        assert_eq!(
            to_json(&boost_ast),
            r#"{"type":"boost","underlying":{"type":"all"},"boost":2.5}"#
        );
    }

    #[test]
    fn test_boost_serialization2() {
        let boost_ast = UserInputAst::Boost(Box::new(must_all_should_hello()), 2.5.into());
        assert_eq!(
            to_json(&boost_ast),
            r#"{"type":"boost","underlying":{"type":"bool","clauses":[["must",{"type":"all"}],["should",{"type":"literal","field_name":"title","phrase":"hello","delimiter":"none","slop":0,"prefix":false}]]},"boost":2.5}"#
        );
    }

    #[test]
    fn test_clause_serialization() {
        assert_eq!(
            to_json(&must_all_should_hello()),
            r#"{"type":"bool","clauses":[["must",{"type":"all"}],["should",{"type":"literal","field_name":"title","phrase":"hello","delimiter":"none","slop":0,"prefix":false}]]}"#
        );
    }
}


================================================
FILE: rustfmt.toml
================================================
comment_width = 120
format_strings = true
group_imports = "StdExternalCrate"
imports_granularity = "Module"
normalize_comments = true
where_single_line = true
wrap_comments = true


================================================
FILE: src/aggregation/README.md
================================================
# Contributing

When adding a new bucket aggregation, make sure to extend the "test_aggregation_flushing" test for at least 2 levels.


# Code Organization

Tantivy's aggregations have been designed to mimic the 
[aggregations of elasticsearch](https://www.elastic.co/guide/en/elasticsearch/reference/current/search-aggregations.html).

The code is organized in submodules:

## bucket
Contains all bucket aggregations, like range aggregation. These bucket aggregations group documents into buckets and can contain sub-aggregations.

## metric
Contains all metric aggregations, like average aggregation. Metric aggregations do not have sub aggregations.

#### agg_req
agg_req contains the user's aggregation request. Deserialization from JSON is compatible with Elasticsearch aggregation requests.

#### agg_data
agg_data contains the user's aggregation request enriched with fast field accessors etc., which are
used during collection.

#### segment_agg_result
segment_agg_result contains the aggregation result tree, which is used for collection of a segment.
agg_data is passed during collection.

#### intermediate_agg_result
intermediate_agg_result contains the aggregation tree for merging with other trees.

#### agg_result
agg_result contains the final aggregation tree.


================================================
FILE: src/aggregation/accessor_helpers.rs
================================================
//! This will enhance the request tree with access to the fastfield and metadata.

use std::io;

use columnar::{Column, ColumnType};

use crate::aggregation::{f64_to_fastfield_u64, Key};
use crate::index::SegmentReader;

/// Get the missing value as internal u64 representation
///
/// For `Str` columns, any string or numeric `missing` key maps to the sentinel
/// `column_max_value + 1`.
/// For columns with a numerical type, the key is converted (going through `f64`)
/// with `f64_to_fastfield_u64`, so it can be used the same way as a value
/// coming from the fast field.
///
/// # Errors
///
/// Returns `TantivyError::InvalidArgument` when `missing` is not supported for
/// `column_type`.
pub(crate) fn get_missing_val_as_u64_lenient(
    column_type: ColumnType,
    column_max_value: u64,
    missing: &Key,
    field_name: &str,
) -> crate::Result<Option<u64>> {
    let is_str_column = column_type == ColumnType::Str;
    let is_numerical_column = column_type.numerical_type().is_some();
    let missing_as_f64 = match missing {
        // Text columns: numbers are accepted as a fallback too, and every key
        // maps to the same sentinel.
        Key::Str(_) | Key::F64(_) | Key::U64(_) | Key::I64(_) if is_str_column => {
            return Ok(Some(column_max_value + 1));
        }
        Key::F64(val) if is_numerical_column => *val,
        // NOTE: We may lose precision of the passed missing value by casting i64 and u64 to f64.
        Key::I64(val) if is_numerical_column => *val as f64,
        Key::U64(val) if is_numerical_column => *val as f64,
        _ => {
            return Err(crate::TantivyError::InvalidArgument(format!(
                "Missing value {missing:?} for field {field_name} is not supported for column \
                 type {column_type:?}"
            )));
        }
    };
    Ok(f64_to_fastfield_u64(missing_as_f64, &column_type))
}

/// Returns the column types `F64`, `U64`, `I64` and `DateTime`, in that order.
pub(crate) fn get_numeric_or_date_column_types() -> &'static [ColumnType] {
    const NUMERIC_OR_DATE_TYPES: &[ColumnType] = &[
        ColumnType::F64,
        ColumnType::U64,
        ColumnType::I64,
        ColumnType::DateTime,
    ];
    NUMERIC_OR_DATE_TYPES
}

/// Get fast field reader or empty as default.
///
/// Looks up `field_name` through `u64_lenient_for_type`, restricted to
/// `allowed_column_types`. When no column is found, an empty column built from
/// `reader.num_docs()` is returned with type `ColumnType::U64`.
pub(crate) fn get_ff_reader(
    reader: &SegmentReader,
    field_name: &str,
    allowed_column_types: Option<&[ColumnType]>,
) -> crate::Result<(columnar::Column<u64>, ColumnType)> {
    let fast_fields = reader.fast_fields();
    match fast_fields.u64_lenient_for_type(allowed_column_types, field_name)? {
        Some(column_with_type) => Ok(column_with_type),
        None => {
            let empty_column = Column::build_empty_column(reader.num_docs());
            Ok((empty_column, ColumnType::U64))
        }
    }
}

/// Opens every dynamic column registered for `field_name` in this segment.
///
/// # Errors
///
/// Returns an error if the column handles cannot be listed or if opening one
/// of them fails.
///
/// # Panics
///
/// Panics if no column handle exists for `field_name`.
pub(crate) fn get_dynamic_columns(
    reader: &SegmentReader,
    field_name: &str,
) -> crate::Result<Vec<columnar::DynamicColumn>> {
    let handles = reader.fast_fields().dynamic_column_handles(field_name)?;
    // With no handle there is nothing to open, so checking first yields the same outcome.
    assert!(!handles.is_empty(), "field {field_name} not found");
    let mut columns = Vec::with_capacity(handles.len());
    for handle in handles.iter() {
        let column = handle.open().map_err(io::Error::from)?;
        columns.push(column);
    }
    Ok(columns)
}

/// Get all fast field reader or empty as default.
///
/// Is guaranteed to return at least one column: when the lookup yields none, a
/// single empty column built from `reader.num_docs()` is returned, typed with
/// `fallback_type`.
pub(crate) fn get_all_ff_reader_or_empty(
    reader: &SegmentReader,
    field_name: &str,
    allowed_column_types: Option<&[ColumnType]>,
    fallback_type: ColumnType,
) -> crate::Result<Vec<(columnar::Column<u64>, ColumnType)>> {
    let fast_fields = reader.fast_fields();
    let mut columns_with_type =
        fast_fields.u64_lenient_for_type_all(allowed_column_types, field_name)?;
    if columns_with_type.is_empty() {
        let empty_column = Column::build_empty_column(reader.num_docs());
        columns_with_type.push((empty_column, fallback_type));
    }
    Ok(columns_with_type)
}


================================================
FILE: src/aggregation/agg_data.rs
================================================
use columnar::{Column, ColumnBlockAccessor, ColumnType, StrColumn};
use common::BitSet;
use rustc_hash::FxHashSet;
use serde::Serialize;
use tantivy_fst::Regex;

use crate::aggregation::accessor_helpers::{
    get_all_ff_reader_or_empty, get_dynamic_columns, get_ff_reader, get_missing_val_as_u64_lenient,
    get_numeric_or_date_column_types,
};
use crate::aggregation::agg_req::{Aggregation, AggregationVariants, Aggregations};
use crate::aggregation::bucket::{
    build_segment_filter_collector, build_segment_range_collector, CompositeAggReqData,
    CompositeAggregation, CompositeSourceAccessors, FilterAggReqData, HistogramAggReqData,
    HistogramBounds, IncludeExcludeParam, MissingTermAggReqData, RangeAggReqData,
    SegmentHistogramCollector, TermMissingAgg, TermsAggReqData, TermsAggregation,
    TermsAggregationInternal,
};
use crate::aggregation::metric::{
    build_segment_stats_collector, AverageAggregation, CardinalityAggReqData,
    CardinalityAggregationReq, CountAggregation, ExtendedStatsAggregation, MaxAggregation,
    MetricAggReqData, MinAggregation, SegmentCardinalityCollector, SegmentExtendedStatsCollector,
    SegmentPercentilesCollector, StatsAggregation, StatsType, SumAggregation, TopHitsAggReqData,
    TopHitsSegmentCollector,
};
use crate::aggregation::segment_agg_result::{
    GenericSegmentAggregationResultsCollector, SegmentAggregationCollector,
};
use crate::aggregation::{f64_to_fastfield_u64, AggContextParams, Key};
use crate::{SegmentOrdinal, SegmentReader};

#[derive(Default)]
/// Datastructure holding all request data for executing aggregations on a segment.
/// It is passed to the collectors during collection.
pub struct AggregationsSegmentCtx {
    /// Request data for each aggregation type.
    pub per_request: PerRequestAggSegCtx,
    /// Shared aggregation parameters. Code in this file reads `limits` (memory
    /// accounting) and `tokenizers` (filter query parsing) from it.
    pub context: AggContextParams,
    /// Block accessor over `u64` column values.
    /// NOTE(review): presumably a scratch buffer reused by the segment collectors — confirm.
    pub column_block_accessor: ColumnBlockAccessor<u64>,
}

impl AggregationsSegmentCtx {
    // ---------- push: append request data and hand back its slot index ----------

    /// Stores a terms request (boxed) and returns its index in `term_req_data`.
    pub(crate) fn push_term_req_data(&mut self, data: TermsAggReqData) -> usize {
        let slots = &mut self.per_request.term_req_data;
        let idx = slots.len();
        slots.push(Some(Box::new(data)));
        idx
    }
    /// Stores a cardinality request and returns its index in `cardinality_req_data`.
    pub(crate) fn push_cardinality_req_data(&mut self, data: CardinalityAggReqData) -> usize {
        let entries = &mut self.per_request.cardinality_req_data;
        let idx = entries.len();
        entries.push(data);
        idx
    }
    /// Stores a metric request and returns its index in `stats_metric_req_data`.
    pub(crate) fn push_metric_req_data(&mut self, data: MetricAggReqData) -> usize {
        let entries = &mut self.per_request.stats_metric_req_data;
        let idx = entries.len();
        entries.push(data);
        idx
    }
    /// Stores a top_hits request and returns its index in `top_hits_req_data`.
    pub(crate) fn push_top_hits_req_data(&mut self, data: TopHitsAggReqData) -> usize {
        let entries = &mut self.per_request.top_hits_req_data;
        let idx = entries.len();
        entries.push(data);
        idx
    }
    /// Stores a missing-term request and returns its index in `missing_term_req_data`.
    pub(crate) fn push_missing_term_req_data(&mut self, data: MissingTermAggReqData) -> usize {
        let entries = &mut self.per_request.missing_term_req_data;
        let idx = entries.len();
        entries.push(data);
        idx
    }
    /// Stores a histogram request (boxed) and returns its index in `histogram_req_data`.
    pub(crate) fn push_histogram_req_data(&mut self, data: HistogramAggReqData) -> usize {
        let slots = &mut self.per_request.histogram_req_data;
        let idx = slots.len();
        slots.push(Some(Box::new(data)));
        idx
    }
    /// Stores a range request (boxed) and returns its index in `range_req_data`.
    pub(crate) fn push_range_req_data(&mut self, data: RangeAggReqData) -> usize {
        let slots = &mut self.per_request.range_req_data;
        let idx = slots.len();
        slots.push(Some(Box::new(data)));
        idx
    }
    /// Stores a filter request (boxed) and returns its index in `filter_req_data`.
    pub(crate) fn push_filter_req_data(&mut self, data: FilterAggReqData) -> usize {
        let slots = &mut self.per_request.filter_req_data;
        let idx = slots.len();
        slots.push(Some(Box::new(data)));
        idx
    }
    /// Stores a composite request (boxed) and returns its index in `composite_req_data`.
    pub(crate) fn push_composite_req_data(&mut self, data: CompositeAggReqData) -> usize {
        let slots = &mut self.per_request.composite_req_data;
        let idx = slots.len();
        slots.push(Some(Box::new(data)));
        idx
    }

    // ---------- shared getters ----------
    //
    // All getters panic when `idx` is out of bounds; getters over boxed slots also
    // panic when the slot is currently empty (its data has been taken out).

    /// Terms request data stored at `idx`.
    #[inline]
    pub(crate) fn get_term_req_data(&self, idx: usize) -> &TermsAggReqData {
        let slot = &self.per_request.term_req_data[idx];
        slot.as_deref()
            .expect("term_req_data slot is empty (taken)")
    }
    /// Cardinality request data stored at `idx`.
    #[inline]
    pub(crate) fn get_cardinality_req_data(&self, idx: usize) -> &CardinalityAggReqData {
        let entries = &self.per_request.cardinality_req_data;
        &entries[idx]
    }
    /// Metric request data stored at `idx`.
    #[inline]
    pub(crate) fn get_metric_req_data(&self, idx: usize) -> &MetricAggReqData {
        let entries = &self.per_request.stats_metric_req_data;
        &entries[idx]
    }
    /// Top-hits request data stored at `idx`.
    #[inline]
    pub(crate) fn get_top_hits_req_data(&self, idx: usize) -> &TopHitsAggReqData {
        let entries = &self.per_request.top_hits_req_data;
        &entries[idx]
    }
    /// Missing-term request data stored at `idx`.
    #[inline]
    pub(crate) fn get_missing_term_req_data(&self, idx: usize) -> &MissingTermAggReqData {
        let entries = &self.per_request.missing_term_req_data;
        &entries[idx]
    }
    /// Histogram request data stored at `idx`.
    #[inline]
    pub(crate) fn get_histogram_req_data(&self, idx: usize) -> &HistogramAggReqData {
        let slot = &self.per_request.histogram_req_data[idx];
        slot.as_deref()
            .expect("histogram_req_data slot is empty (taken)")
    }
    /// Range request data stored at `idx`.
    #[inline]
    pub(crate) fn get_range_req_data(&self, idx: usize) -> &RangeAggReqData {
        let slot = &self.per_request.range_req_data[idx];
        slot.as_deref()
            .expect("range_req_data slot is empty (taken)")
    }
    /// Composite request data stored at `idx`.
    #[inline]
    pub(crate) fn get_composite_req_data(&self, idx: usize) -> &CompositeAggReqData {
        let slot = &self.per_request.composite_req_data[idx];
        slot.as_deref()
            .expect("composite_req_data slot is empty (taken)")
    }

    // ---------- mutable getters ----------

    /// Mutable access to the metric request data stored at `idx`.
    #[inline]
    pub(crate) fn get_metric_req_data_mut(&mut self, idx: usize) -> &mut MetricAggReqData {
        let entries = &mut self.per_request.stats_metric_req_data;
        &mut entries[idx]
    }

    /// Mutable access to the cardinality request data stored at `idx`.
    #[inline]
    pub(crate) fn get_cardinality_req_data_mut(
        &mut self,
        idx: usize,
    ) -> &mut CardinalityAggReqData {
        let entries = &mut self.per_request.cardinality_req_data;
        &mut entries[idx]
    }

    /// Mutable access to the histogram request data stored at `idx`.
    #[inline]
    pub(crate) fn get_histogram_req_data_mut(&mut self, idx: usize) -> &mut HistogramAggReqData {
        let slot = &mut self.per_request.histogram_req_data[idx];
        slot.as_deref_mut()
            .expect("histogram_req_data slot is empty (taken)")
    }

    // ---------- take / put back (histogram, range, filter, composite) ----------
    //
    // `take_*` moves the boxed request data out and leaves `None` in the slot;
    // `put_back_*` restores it. Putting back into an occupied slot is only checked
    // in debug builds.

    /// Moves the boxed histogram request out of slot `idx`, leaving the slot empty.
    #[inline]
    pub(crate) fn take_histogram_req_data(&mut self, idx: usize) -> Box<HistogramAggReqData> {
        let slot = &mut self.per_request.histogram_req_data[idx];
        slot.take()
            .expect("histogram_req_data slot is empty (taken)")
    }

    /// Restores a histogram request into the empty slot `idx`.
    #[inline]
    pub(crate) fn put_back_histogram_req_data(
        &mut self,
        idx: usize,
        value: Box<HistogramAggReqData>,
    ) {
        let slot = &mut self.per_request.histogram_req_data[idx];
        debug_assert!(slot.is_none());
        *slot = Some(value);
    }

    /// Moves the boxed range request out of slot `idx`, leaving the slot empty.
    #[inline]
    pub(crate) fn take_range_req_data(&mut self, idx: usize) -> Box<RangeAggReqData> {
        let slot = &mut self.per_request.range_req_data[idx];
        slot.take().expect("range_req_data slot is empty (taken)")
    }

    /// Restores a range request into the empty slot `idx`.
    #[inline]
    pub(crate) fn put_back_range_req_data(&mut self, idx: usize, value: Box<RangeAggReqData>) {
        let slot = &mut self.per_request.range_req_data[idx];
        debug_assert!(slot.is_none());
        *slot = Some(value);
    }

    /// Moves the boxed filter request out of slot `idx`, leaving the slot empty.
    #[inline]
    pub(crate) fn take_filter_req_data(&mut self, idx: usize) -> Box<FilterAggReqData> {
        let slot = &mut self.per_request.filter_req_data[idx];
        slot.take().expect("filter_req_data slot is empty (taken)")
    }

    /// Restores a filter request into the empty slot `idx`.
    #[inline]
    pub(crate) fn put_back_filter_req_data(&mut self, idx: usize, value: Box<FilterAggReqData>) {
        let slot = &mut self.per_request.filter_req_data[idx];
        debug_assert!(slot.is_none());
        *slot = Some(value);
    }

    /// Moves the boxed composite request out of slot `idx`, leaving the slot empty.
    #[inline]
    pub(crate) fn take_composite_req_data(&mut self, idx: usize) -> Box<CompositeAggReqData> {
        let slot = &mut self.per_request.composite_req_data[idx];
        slot.take()
            .expect("composite_req_data slot is empty (taken)")
    }

    /// Restores a composite request into the empty slot `idx`.
    #[inline]
    pub(crate) fn put_back_composite_req_data(
        &mut self,
        idx: usize,
        value: Box<CompositeAggReqData>,
    ) {
        let slot = &mut self.per_request.composite_req_data[idx];
        debug_assert!(slot.is_none());
        *slot = Some(value);
    }
}

/// Each type of aggregation has its own request data struct. This struct holds
/// all request data to execute the aggregation request on a single segment.
///
/// The request tree is represented by `agg_tree`. Tree nodes contain the index
/// of their context in corresponding request data vector (e.g. `term_req_data`
/// for a node with [AggKind::Terms]).
#[derive(Default)]
pub struct PerRequestAggSegCtx {
    // Box for cheap take/put - Only necessary for bucket aggs that have sub-aggregations.
    // In the `Option<Box<_>>` vectors a `None` entry marks a slot whose data is currently
    // moved out (see the `take_*` / `put_back_*` methods on `AggregationsSegmentCtx`).
    /// TermsAggReqData contains the request data for a terms aggregation.
    pub term_req_data: Vec<Option<Box<TermsAggReqData>>>,
    /// HistogramAggReqData contains the request data for a histogram aggregation.
    /// Date histograms are stored here as well (with `is_date_histogram` set).
    pub histogram_req_data: Vec<Option<Box<HistogramAggReqData>>>,
    /// RangeAggReqData contains the request data for a range aggregation.
    pub range_req_data: Vec<Option<Box<RangeAggReqData>>>,
    /// FilterAggReqData contains the request data for a filter aggregation.
    pub filter_req_data: Vec<Option<Box<FilterAggReqData>>>,
    /// Shared by avg, min, max, sum, stats, extended_stats, count and percentiles.
    pub stats_metric_req_data: Vec<MetricAggReqData>,
    /// CardinalityAggReqData contains the request data for a cardinality aggregation.
    pub cardinality_req_data: Vec<CardinalityAggReqData>,
    /// TopHitsAggReqData contains the request data for a top_hits aggregation.
    pub top_hits_req_data: Vec<TopHitsAggReqData>,
    /// MissingTermAggReqData contains the request data for a missing term aggregation.
    pub missing_term_req_data: Vec<MissingTermAggReqData>,
    /// CompositeAggReqData contains the request data for a composite aggregation.
    pub composite_req_data: Vec<Option<Box<CompositeAggReqData>>>,

    /// Request tree used to build collectors.
    pub agg_tree: Vec<AggRefNode>,
}

impl PerRequestAggSegCtx {
    /// Estimate the memory consumption of this struct in bytes.
    fn get_memory_consumption(&self) -> usize {
        self.term_req_data
            .iter()
            .map(|b| b.as_ref().unwrap().get_memory_consumption())
            .sum::<usize>()
            + self
                .histogram_req_data
                .iter()
                .map(|b| b.as_ref().unwrap().get_memory_consumption())
                .sum::<usize>()
            + self
                .range_req_data
                .iter()
                .map(|b| b.as_ref().unwrap().get_memory_consumption())
                .sum::<usize>()
            + self
                .filter_req_data
                .iter()
                .map(|b| b.as_ref().unwrap().get_memory_consumption())
                .sum::<usize>()
            + self
                .stats_metric_req_data
                .iter()
                .map(|t| t.get_memory_consumption())
                .sum::<usize>()
            + self
                .cardinality_req_data
                .iter()
                .map(|t| t.get_memory_consumption())
                .sum::<usize>()
            + self
                .top_hits_req_data
                .iter()
                .map(|t| t.get_memory_consumption())
                .sum::<usize>()
            + self
                .missing_term_req_data
                .iter()
                .map(|t| t.get_memory_consumption())
                .sum::<usize>()
            + self
                .composite_req_data
                .iter()
                .map(|b| b.as_ref().map(|d| d.get_memory_consumption()).unwrap_or(0))
                .sum::<usize>()
            + self.agg_tree.len() * std::mem::size_of::<AggRefNode>()
    }

    pub fn get_name(&self, node: &AggRefNode) -> &str {
        let idx = node.idx_in_req_data;
        let kind = node.kind;
        match kind {
            AggKind::Terms => self.term_req_data[idx]
                .as_deref()
                .expect("term_req_data slot is empty (taken)")
                .name
                .as_str(),
            AggKind::Cardinality => &self.cardinality_req_data[idx].name,
            AggKind::StatsKind(_) => &self.stats_metric_req_data[idx].name,
            AggKind::TopHits => &self.top_hits_req_data[idx].name,
            AggKind::MissingTerm => &self.missing_term_req_data[idx].name,
            AggKind::Histogram => self.histogram_req_data[idx]
                .as_deref()
                .expect("histogram_req_data slot is empty (taken)")
                .name
                .as_str(),
            AggKind::DateHistogram => self.histogram_req_data[idx]
                .as_deref()
                .expect("histogram_req_data slot is empty (taken)")
                .name
                .as_str(),
            AggKind::Range => self.range_req_data[idx]
                .as_deref()
                .expect("range_req_data slot is empty (taken)")
                .name
                .as_str(),
            AggKind::Filter => self.filter_req_data[idx]
                .as_deref()
                .expect("filter_req_data slot is empty (taken)")
                .name
                .as_str(),
            AggKind::Composite => self.composite_req_data[idx]
                .as_deref()
                .expect("composite_req_data slot is empty (taken)")
                .name
                .as_str(),
        }
    }

    /// Convert the aggregation tree into a serializable struct representation.
    /// Each node contains: { name, kind, children }.
    #[allow(dead_code)]
    pub fn get_view_tree(&self) -> Vec<AggTreeViewNode> {
        fn node_to_view(node: &AggRefNode, pr: &PerRequestAggSegCtx) -> AggTreeViewNode {
            let mut children: Vec<AggTreeViewNode> =
                node.children.iter().map(|c| node_to_view(c, pr)).collect();
            children.sort_by_key(|v| serde_json::to_string(v).unwrap());
            AggTreeViewNode {
                name: pr.get_name(node).to_string(),
                kind: node.kind.as_str().to_string(),
                children,
            }
        }

        let mut roots: Vec<AggTreeViewNode> = self
            .agg_tree
            .iter()
            .map(|n| node_to_view(n, self))
            .collect();
        roots.sort_by_key(|v| serde_json::to_string(v).unwrap());
        roots
    }
}

/// Builds the segment collector for the whole request tree stored in
/// `req.per_request.agg_tree`.
///
/// The tree is cloned first because building the collectors needs mutable access
/// to `req` while the nodes are being read.
pub(crate) fn build_segment_agg_collectors_root(
    req: &mut AggregationsSegmentCtx,
) -> crate::Result<Box<dyn SegmentAggregationCollector>> {
    let root_nodes = req.per_request.agg_tree.clone();
    build_segment_agg_collectors_generic(req, &root_nodes)
}

/// Builds the segment collector for the given `nodes` of the request tree.
///
/// Crate-visible entry point that delegates to the shared generic builder.
pub(crate) fn build_segment_agg_collectors(
    req: &mut AggregationsSegmentCtx,
    nodes: &[AggRefNode],
) -> crate::Result<Box<dyn SegmentAggregationCollector>> {
    let collector = build_segment_agg_collectors_generic(req, nodes)?;
    Ok(collector)
}

/// Builds one collector per node, in order, and combines them.
///
/// After all collectors are built, the current memory estimate of
/// `req.per_request` is reported to the memory limits; exceeding them is returned
/// as an error. A single collector is returned as-is, any other number is wrapped
/// in a [GenericSegmentAggregationResultsCollector].
fn build_segment_agg_collectors_generic(
    req: &mut AggregationsSegmentCtx,
    nodes: &[AggRefNode],
) -> crate::Result<Box<dyn SegmentAggregationCollector>> {
    // Stops at the first node whose collector cannot be built.
    let mut collectors = nodes
        .iter()
        .map(|node| build_segment_agg_collector(req, node))
        .collect::<crate::Result<Vec<_>>>()?;

    let estimated_bytes = req.per_request.get_memory_consumption() as u64;
    req.context.limits.add_memory_consumed(estimated_bytes)?;

    if collectors.len() != 1 {
        return Ok(Box::new(GenericSegmentAggregationResultsCollector {
            aggs: collectors,
        }));
    }
    // Single collector special case: no wrapper needed.
    Ok(collectors.remove(0))
}

/// Builds the segment collector for a single node of the request tree.
///
/// The collector type is chosen by `node.kind`; the request data it needs is
/// looked up at `node.idx_in_req_data` in the matching vector of
/// `req.per_request`.
///
/// # Errors
///
/// Returns an `InternalError` for a missing-term aggregation without any field
/// accessor, and propagates errors from the individual collector constructors.
pub(crate) fn build_segment_agg_collector(
    req: &mut AggregationsSegmentCtx,
    node: &AggRefNode,
) -> crate::Result<Box<dyn SegmentAggregationCollector>> {
    let idx = node.idx_in_req_data;
    match node.kind {
        AggKind::Terms => crate::aggregation::bucket::build_segment_term_collector(req, node),
        AggKind::MissingTerm => {
            if req.get_missing_term_req_data(idx).accessors.is_empty() {
                return Err(crate::TantivyError::InternalError(
                    "MissingTerm aggregation requires at least one field accessor.".to_string(),
                ));
            }
            let collector = TermMissingAgg::new(req, node)?;
            Ok(Box::new(collector))
        }
        AggKind::Cardinality => {
            let cardinality = req.get_cardinality_req_data(idx);
            let collector = SegmentCardinalityCollector::from_req(
                cardinality.column_type,
                idx,
                cardinality.accessor.clone(),
                cardinality.missing_value_for_accessor,
            );
            Ok(Box::new(collector))
        }
        AggKind::StatsKind(StatsType::Percentiles) => {
            let metric = req.get_metric_req_data(idx);
            let collector = SegmentPercentilesCollector::from_req_and_validate(
                metric.field_type,
                metric.missing_u64,
                metric.accessor.clone(),
                idx,
            );
            Ok(Box::new(collector))
        }
        AggKind::StatsKind(StatsType::ExtendedStats(sigma)) => {
            let metric = &mut req.per_request.stats_metric_req_data[idx];
            let collector = SegmentExtendedStatsCollector::from_req(metric, sigma);
            Ok(Box::new(collector))
        }
        AggKind::StatsKind(
            StatsType::Sum
            | StatsType::Average
            | StatsType::Count
            | StatsType::Max
            | StatsType::Min
            | StatsType::Stats,
        ) => {
            let metric = &mut req.per_request.stats_metric_req_data[idx];
            build_segment_stats_collector(metric)
        }
        AggKind::TopHits => {
            let top_hits = req.get_top_hits_req_data(idx);
            let collector =
                TopHitsSegmentCollector::from_req(&top_hits.req, idx, top_hits.segment_ordinal);
            Ok(Box::new(collector))
        }
        // Plain and date histograms are served by the same collector.
        AggKind::Histogram | AggKind::DateHistogram => {
            let collector = SegmentHistogramCollector::from_req_and_validate(req, node)?;
            Ok(Box::new(collector))
        }
        AggKind::Range => {
            let collector = build_segment_range_collector(req, node)?;
            Ok(collector)
        }
        AggKind::Filter => build_segment_filter_collector(req, node),
        AggKind::Composite => {
            let collector =
                crate::aggregation::bucket::SegmentCompositeCollector::from_req_and_validate(
                    req, node,
                )?;
            Ok(Box::new(collector))
        }
    }
}

/// A node of the aggregation request tree. See [PerRequestAggSegCtx].
#[derive(Debug, Clone)]
pub struct AggRefNode {
    /// Kind of aggregation; selects which request data vector `idx_in_req_data` refers to.
    pub kind: AggKind,
    /// Index of this node's request data in the vector selected by `kind`.
    pub idx_in_req_data: usize,
    /// Nodes built from the sub-aggregations of this aggregation.
    pub children: Vec<AggRefNode>,
}
impl AggRefNode {
    /// Returns the first direct child whose aggregation name (resolved through `pr`)
    /// equals `name`, or `None` if no child matches.
    pub fn get_sub_agg(&self, name: &str, pr: &PerRequestAggSegCtx) -> Option<&AggRefNode> {
        for child in &self.children {
            if pr.get_name(child) == name {
                return Some(child);
            }
        }
        None
    }
}

/// Kind of aggregation a request tree node stands for. It determines which request
/// data vector of [PerRequestAggSegCtx] the node's index refers to.
#[derive(Copy, Clone, Debug)]
pub enum AggKind {
    Terms,
    Cardinality,
    /// One of: Average, Min, Max, Sum, Count, Stats, ExtendedStats, Percentiles
    StatsKind(StatsType),
    TopHits,
    MissingTerm,
    Histogram,
    /// Shares its request data vector with `Histogram`.
    DateHistogram,
    Range,
    Filter,
    Composite,
}

impl AggKind {
    #[cfg_attr(not(test), allow(dead_code))]
    fn as_str(&self) -> &'static str {
        match self {
            AggKind::Terms => "Terms",
            AggKind::Cardinality => "Cardinality",
            AggKind::StatsKind(_) => "Metric",
            AggKind::TopHits => "TopHits",
            AggKind::MissingTerm => "MissingTerm",
            AggKind::Histogram => "Histogram",
            AggKind::DateHistogram => "DateHistogram",
            AggKind::Range => "Range",
            AggKind::Filter => "Filter",
            AggKind::Composite => "Composite",
        }
    }
}

/// Build AggregationsData by walking the request tree.
pub(crate) fn build_aggregations_data_from_req(
    aggs: &Aggregations,
    reader: &SegmentReader,
    segment_ordinal: SegmentOrdinal,
    context: AggContextParams,
) -> crate::Result<AggregationsSegmentCtx> {
    let mut data = AggregationsSegmentCtx {
        per_request: Default::default(),
        context,
        column_block_accessor: ColumnBlockAccessor::default(),
    };

    for (name, agg) in aggs.iter() {
        let nodes = build_nodes(name, agg, reader, segment_ordinal, &mut data, true)?;
        data.per_request.agg_tree.extend(nodes);
    }
    Ok(data)
}

/// Translates one aggregation request into nodes of the request tree.
///
/// For the aggregation `req` named `agg_name` this opens the column accessors the
/// aggregation needs in this segment, stores the resulting request data in `data`
/// and then builds the nodes of the sub-aggregations as children.
///
/// The request data is always pushed *before* the children are built, so a node's
/// `idx_in_req_data` is fixed before any descendant adds its own data.
///
/// `is_top_level` is recorded in the range and filter request data and forwarded
/// to the terms/cardinality builder; children are always built with `false`.
///
/// Every arm handled directly here yields exactly one node; terms and cardinality
/// requests are delegated to `build_terms_or_cardinality_nodes`.
///
/// # Errors
///
/// Propagates errors from opening columns, validating requests (percentiles,
/// top_hits, date histogram conversion), parsing the filter query and building
/// children.
fn build_nodes(
    agg_name: &str,
    req: &Aggregation,
    reader: &SegmentReader,
    segment_ordinal: SegmentOrdinal,
    data: &mut AggregationsSegmentCtx,
    is_top_level: bool,
) -> crate::Result<Vec<AggRefNode>> {
    use AggregationVariants::*;
    match &req.agg {
        Range(range_req) => {
            let (accessor, field_type) = get_ff_reader(
                reader,
                &range_req.field,
                Some(get_numeric_or_date_column_types()),
            )?;
            let idx_in_req_data = data.push_range_req_data(RangeAggReqData {
                accessor,
                field_type,
                name: agg_name.to_string(),
                req: range_req.clone(),
                is_top_level,
            });
            let children = build_children(&req.sub_aggregation, reader, segment_ordinal, data)?;
            Ok(vec![AggRefNode {
                kind: AggKind::Range,
                idx_in_req_data,
                children,
            }])
        }
        Histogram(histo_req) => {
            let (accessor, field_type) = get_ff_reader(
                reader,
                &histo_req.field,
                Some(get_numeric_or_date_column_types()),
            )?;
            // `bounds` and `offset` start out as "unbounded" / zero placeholders.
            let idx_in_req_data = data.push_histogram_req_data(HistogramAggReqData {
                accessor,
                field_type,
                name: agg_name.to_string(),
                req: histo_req.clone(),
                is_date_histogram: false,
                bounds: HistogramBounds {
                    min: f64::MIN,
                    max: f64::MAX,
                },
                offset: 0.0,
            });
            let children = build_children(&req.sub_aggregation, reader, segment_ordinal, data)?;
            Ok(vec![AggRefNode {
                kind: AggKind::Histogram,
                idx_in_req_data,
                children,
            }])
        }
        DateHistogram(date_req) => {
            // Date histograms only accept DateTime columns.
            let (accessor, field_type) =
                get_ff_reader(reader, &date_req.field, Some(&[ColumnType::DateTime]))?;
            // Convert to histogram request, normalize to ns precision
            let mut histo_req = date_req.to_histogram_req()?;
            histo_req.normalize_date_time();
            // Stored in the same vector as plain histograms, flagged as date histogram.
            let idx_in_req_data = data.push_histogram_req_data(HistogramAggReqData {
                accessor,
                field_type,
                name: agg_name.to_string(),
                req: histo_req,
                is_date_histogram: true,
                bounds: HistogramBounds {
                    min: f64::MIN,
                    max: f64::MAX,
                },
                offset: 0.0,
            });
            let children = build_children(&req.sub_aggregation, reader, segment_ordinal, data)?;
            Ok(vec![AggRefNode {
                kind: AggKind::DateHistogram,
                idx_in_req_data,
                children,
            }])
        }
        Terms(terms_req) => build_terms_or_cardinality_nodes(
            agg_name,
            &terms_req.field,
            &terms_req.missing,
            reader,
            segment_ordinal,
            data,
            &req.sub_aggregation,
            TermsOrCardinalityRequest::Terms(terms_req.clone()),
            is_top_level,
        ),
        Cardinality(card_req) => build_terms_or_cardinality_nodes(
            agg_name,
            &card_req.field,
            &card_req.missing,
            reader,
            segment_ordinal,
            data,
            &req.sub_aggregation,
            TermsOrCardinalityRequest::Cardinality(card_req.clone()),
            is_top_level,
        ),
        Average(AverageAggregation { field, missing, .. })
        | Max(MaxAggregation { field, missing, .. })
        | Min(MinAggregation { field, missing, .. })
        | Stats(StatsAggregation { field, missing, .. })
        | ExtendedStats(ExtendedStatsAggregation { field, missing, .. })
        | Sum(SumAggregation { field, missing, .. })
        | Count(CountAggregation { field, missing, .. }) => {
            // Count accepts every listed column type; the other metrics only accept
            // numeric and date columns.
            let allowed_column_types = if matches!(&req.agg, Count(_)) {
                Some(
                    &[
                        ColumnType::I64,
                        ColumnType::U64,
                        ColumnType::F64,
                        ColumnType::Str,
                        ColumnType::DateTime,
                        ColumnType::Bool,
                        ColumnType::IpAddr,
                    ][..],
                )
            } else {
                Some(get_numeric_or_date_column_types())
            };
            let collecting_for = match &req.agg {
                Average(_) => StatsType::Average,
                Max(_) => StatsType::Max,
                Min(_) => StatsType::Min,
                Stats(_) => StatsType::Stats,
                ExtendedStats(req) => StatsType::ExtendedStats(req.sigma),
                Sum(_) => StatsType::Sum,
                Count(_) => StatsType::Count,
                // Not reachable through the outer pattern; kept as an error rather
                // than a panic.
                _ => {
                    return Err(crate::TantivyError::InvalidArgument(
                        "Internal error: unexpected aggregation type in metric aggregation \
                         handling."
                            .to_string(),
                    ))
                }
            };
            let (accessor, field_type) = get_ff_reader(reader, field, allowed_column_types)?;
            let idx_in_req_data = data.push_metric_req_data(MetricAggReqData {
                accessor,
                field_type,
                name: agg_name.to_string(),
                collecting_for,
                missing: *missing,
                // The missing value converted to the column's u64 representation, if any.
                missing_u64: (*missing).and_then(|m| f64_to_fastfield_u64(m, &field_type)),
                is_number_or_date_type: matches!(
                    field_type,
                    ColumnType::I64 | ColumnType::U64 | ColumnType::F64 | ColumnType::DateTime
                ),
            });
            let children = build_children(&req.sub_aggregation, reader, segment_ordinal, data)?;
            Ok(vec![AggRefNode {
                kind: AggKind::StatsKind(collecting_for),
                idx_in_req_data,
                children,
            }])
        }
        // Percentiles handled as Metric as well
        AggregationVariants::Percentiles(percentiles_req) => {
            percentiles_req.validate()?;
            let (accessor, field_type) = get_ff_reader(
                reader,
                percentiles_req.field_name(),
                Some(get_numeric_or_date_column_types()),
            )?;
            let idx_in_req_data = data.push_metric_req_data(MetricAggReqData {
                accessor,
                field_type,
                name: agg_name.to_string(),
                collecting_for: StatsType::Percentiles,
                missing: percentiles_req.missing,
                missing_u64: percentiles_req
                    .missing
                    .and_then(|m| f64_to_fastfield_u64(m, &field_type)),
                is_number_or_date_type: matches!(
                    field_type,
                    ColumnType::I64 | ColumnType::U64 | ColumnType::F64 | ColumnType::DateTime
                ),
            });
            let children = build_children(&req.sub_aggregation, reader, segment_ordinal, data)?;
            Ok(vec![AggRefNode {
                kind: AggKind::StatsKind(StatsType::Percentiles),
                idx_in_req_data,
                children,
            }])
        }
        AggregationVariants::TopHits(top_hits_req) => {
            // Work on an owned copy: field names are validated and resolved against
            // this segment's columnar before any accessor is opened.
            let mut top_hits = top_hits_req.clone();
            top_hits.validate_and_resolve_field_names(reader.fast_fields().columnar())?;
            let accessors: Vec<(Column<u64>, ColumnType)> = top_hits
                .field_names()
                .iter()
                .map(|field| get_ff_reader(reader, field, Some(get_numeric_or_date_column_types())))
                .collect::<crate::Result<_>>()?;

            let value_accessors = top_hits
                .value_field_names()
                .iter()
                .map(|field_name| {
                    Ok((
                        field_name.to_string(),
                        get_dynamic_columns(reader, field_name)?,
                    ))
                })
                .collect::<crate::Result<_>>()?;

            let idx_in_req_data = data.push_top_hits_req_data(TopHitsAggReqData {
                accessors,
                value_accessors,
                segment_ordinal,
                name: agg_name.to_string(),
                // `top_hits` is already an owned copy and is not used afterwards, so
                // it is moved here instead of being cloned a second time.
                req: top_hits,
            });
            let children = build_children(&req.sub_aggregation, reader, segment_ordinal, data)?;
            Ok(vec![AggRefNode {
                kind: AggKind::TopHits,
                idx_in_req_data,
                children,
            }])
        }
        AggregationVariants::Composite(composite_req) => Ok(vec![build_composite_node(
            agg_name,
            reader,
            segment_ordinal,
            data,
            &req.sub_aggregation,
            composite_req,
        )?]),
        AggregationVariants::Filter(filter_req) => {
            // Build the query and evaluator upfront
            let schema = reader.schema();
            let tokenizers = &data.context.tokenizers;
            let query = filter_req.parse_query(schema, tokenizers)?;
            let evaluator = crate::aggregation::bucket::DocumentQueryEvaluator::new(
                query,
                schema.clone(),
                reader,
            )?;

            // Pre-allocate buffer for batch filtering
            // (capacity is capped by the number of documents in the segment).
            let max_doc = reader.max_doc();
            let buffer_capacity = crate::docset::COLLECT_BLOCK_BUFFER_LEN.min(max_doc as usize);
            let matching_docs_buffer = Vec::with_capacity(buffer_capacity);

            let idx_in_req_data = data.push_filter_req_data(FilterAggReqData {
                name: agg_name.to_string(),
                req: filter_req.clone(),
                segment_reader: reader.clone(),
                evaluator,
                matching_docs_buffer,
                is_top_level,
            });
            let children = build_children(&req.sub_aggregation, reader, segment_ordinal, data)?;
            Ok(vec![AggRefNode {
                kind: AggKind::Filter,
                idx_in_req_data,
                children,
            }])
        }
    }
}

/// Builds the aggregation tree node for a composite aggregation on one segment.
///
/// One accessor set is built per source of the request. Each source is given the `after` key
/// registered under its name, if there is one. The resulting request data is registered in
/// `data` and the sub-aggregations are expanded into the children of the returned node.
///
/// # Errors
/// Propagates any error raised while building the source accessors or the child nodes.
fn build_composite_node(
    agg_name: &str,
    reader: &SegmentReader,
    segment_ordinal: SegmentOrdinal,
    data: &mut AggregationsSegmentCtx,
    sub_aggs: &Aggregations,
    req: &CompositeAggregation,
) -> crate::Result<AggRefNode> {
    let mut composite_accessors = Vec::with_capacity(req.sources.len());
    for source in &req.sources {
        // Pagination: hand over the `after` key of this source, when one was provided.
        let source_after_key_opt = req.after.get(source.name()).map(|k| &k.0);
        let source_accessor =
            CompositeSourceAccessors::build_for_source(reader, source, source_after_key_opt)?;
        composite_accessors.push(source_accessor);
    }
    let agg = CompositeAggReqData {
        name: agg_name.to_string(),
        req: req.clone(),
        composite_accessors,
    };
    // The composite request data is registered before its children are built.
    let idx = data.push_composite_req_data(agg);
    let children = build_children(sub_aggs, reader, segment_ordinal, data)?;
    Ok(AggRefNode {
        kind: AggKind::Composite,
        idx_in_req_data: idx,
        children,
    })
}

/// Expands every sub-aggregation of `aggs` into tree nodes for the given segment.
///
/// Each entry is passed to `build_nodes` flagged as not top-level, and all resulting nodes are
/// gathered into one flat list.
fn build_children(
    aggs: &Aggregations,
    reader: &SegmentReader,
    segment_ordinal: SegmentOrdinal,
    data: &mut AggregationsSegmentCtx,
) -> crate::Result<Vec<AggRefNode>> {
    // Sub-aggregations are never top-level.
    let is_top_level = false;

    let mut child_nodes = Vec::new();
    for (child_name, child_agg) in aggs {
        let expanded = build_nodes(
            child_name,
            child_agg,
            reader,
            segment_ordinal,
            data,
            is_top_level,
        )?;
        child_nodes.extend(expanded);
    }
    Ok(child_nodes)
}

/// Fetches the fast field columns of `field_name` that a terms aggregation can work on.
///
/// Only columns of the allowed types are requested. The fallback column type passed along is
/// derived from the type of the `missing` key, and is `U64` when no `missing` key is set.
fn get_term_agg_accessors(
    reader: &SegmentReader,
    field_name: &str,
    missing: &Option<Key>,
) -> crate::Result<Vec<(Column<u64>, ColumnType)>> {
    // In case the column is empty we want the shim column to match the missing type
    let fallback_type = match missing {
        Some(Key::Str(_)) => ColumnType::Str,
        Some(Key::F64(_)) => ColumnType::F64,
        Some(Key::I64(_)) => ColumnType::I64,
        Some(Key::U64(_)) => ColumnType::U64,
        None => ColumnType::U64,
    };

    let allowed_column_types = [
        ColumnType::I64,
        ColumnType::U64,
        ColumnType::F64,
        ColumnType::Str,
        ColumnType::DateTime,
        ColumnType::Bool,
        ColumnType::IpAddr,
    ];

    let accessors = get_all_ff_reader_or_empty(
        reader,
        field_name,
        Some(&allowed_column_types),
        fallback_type,
    )?;
    Ok(accessors)
}

/// Request payload accepted by `build_terms_or_cardinality_nodes`.
enum TermsOrCardinalityRequest {
    /// A terms aggregation request.
    Terms(TermsAggregation),
    /// A cardinality aggregation request.
    Cardinality(CardinalityAggregationReq),
}

impl TermsOrCardinalityRequest {
    /// Returns the wrapped terms request, or `None` for the cardinality variant.
    fn as_terms(&self) -> Option<&TermsAggregation> {
        if let Self::Terms(terms_req) = self {
            Some(terms_req)
        } else {
            None
        }
    }
}

/// Builds the tree nodes for a terms or cardinality aggregation on `field_name`.
///
/// One node is created per fast field column returned for the field. When the `missing`
/// parameter cannot be handled per column (several columns, or a string `missing` key on a
/// single non-string column), an additional `MissingTerm` node is emitted first. It carries all
/// accessors of the field so that existence can be checked across column types.
///
/// For terms requests using `include`/`exclude`, non-string columns are skipped entirely and
/// no children are built for them.
///
/// # Errors
/// Returns `InvalidArgument` if the special missing handling is required for a cardinality
/// request, or if `include`/`exclude` is requested on a string column for which no string
/// dictionary is available. Errors from accessor lookup, missing value conversion, filter
/// construction and child construction are propagated.
#[allow(clippy::too_many_arguments)]
fn build_terms_or_cardinality_nodes(
    agg_name: &str,
    field_name: &str,
    missing: &Option<Key>,
    reader: &SegmentReader,
    segment_ordinal: SegmentOrdinal,
    data: &mut AggregationsSegmentCtx,
    sub_aggs: &Aggregations,
    req: TermsOrCardinalityRequest,
    is_top_level: bool,
) -> crate::Result<Vec<AggRefNode>> {
    let mut nodes = Vec::new();

    let str_dict_column = reader.fast_fields().str(field_name)?;

    let column_and_types = get_term_agg_accessors(reader, field_name, missing)?;

    // Special handling when missing + multi column or incompatible type on text/date.
    let missing_and_more_than_one_col = column_and_types.len() > 1 && missing.is_some();
    let text_on_non_text_col = column_and_types.len() == 1
        && column_and_types[0].1 != ColumnType::Str
        && matches!(missing, Some(Key::Str(_)));

    let use_special_missing_agg = missing_and_more_than_one_col || text_on_non_text_col;

    // If special missing handling is required, build a MissingTerm node that carries all
    // accessors (across any column types) for existence checks.
    if use_special_missing_agg {
        let fallback_type = match missing {
            Some(Key::Str(_)) => ColumnType::Str,
            Some(Key::F64(_)) => ColumnType::F64,
            Some(Key::I64(_)) => ColumnType::I64,
            Some(Key::U64(_)) => ColumnType::U64,
            None => ColumnType::U64,
        };
        let all_accessors = get_all_ff_reader_or_empty(reader, field_name, None, fallback_type)?;
        // This case only happens when we have term aggregation, or we fail
        let req = req.as_terms().cloned().ok_or_else(|| {
            crate::TantivyError::InvalidArgument(
                "Cardinality aggregation with missing on non-text/number field is not supported."
                    .to_string(),
            )
        })?;

        let children = build_children(sub_aggs, reader, segment_ordinal, data)?;
        let idx_in_req_data = data.push_missing_term_req_data(MissingTermAggReqData {
            accessors: all_accessors,
            name: agg_name.to_string(),
            req,
        });
        nodes.push(AggRefNode {
            kind: AggKind::MissingTerm,
            idx_in_req_data,
            children,
        });
    }

    // Whether a terms request asks for include/exclude filtering. Loop invariant.
    let has_term_filter = matches!(
        &req,
        TermsOrCardinalityRequest::Terms(terms_req)
            if terms_req.include.is_some() || terms_req.exclude.is_some()
    );

    // Add one node per accessor
    for (accessor, column_type) in column_and_types {
        let missing_value_for_accessor = if use_special_missing_agg {
            None
        } else if let Some(m) = missing.as_ref() {
            get_missing_val_as_u64_lenient(column_type, accessor.max_value(), m, field_name)?
        } else {
            None
        };

        // Skip non-string columns entirely when filtering is requested.
        // When excluding, the behavior could be to include non-string values.
        // The check runs before the children are built, so that a skipped column does not
        // leave unreferenced child request data behind in `data`.
        if has_term_filter && column_type != ColumnType::Str {
            continue;
        }

        let children = build_children(sub_aggs, reader, segment_ordinal, data)?;
        let (idx, kind) = match &req {
            TermsOrCardinalityRequest::Terms(req) => {
                let allowed_term_ids = if has_term_filter {
                    // Report a missing dictionary as an error instead of panicking.
                    // NOTE(review): presumably reachable when the accessor is an empty
                    // fallback column typed `Str` — confirm against
                    // `get_all_ff_reader_or_empty`.
                    let str_col = str_dict_column.as_ref().ok_or_else(|| {
                        crate::TantivyError::InvalidArgument(format!(
                            "Cannot apply include/exclude on field `{}`: no string dictionary \
                             found.",
                            field_name
                        ))
                    })?;
                    build_allowed_term_ids_for_str(str_col, &req.include, &req.exclude)?
                } else {
                    None
                };
                let idx_in_req_data = data.push_term_req_data(TermsAggReqData {
                    accessor,
                    column_type,
                    str_dict_column: str_dict_column.clone(),
                    missing_value_for_accessor,
                    name: agg_name.to_string(),
                    req: TermsAggregationInternal::from_req(req),
                    sug_aggregations: sub_aggs.clone(),
                    allowed_term_ids,
                    is_top_level,
                });
                (idx_in_req_data, AggKind::Terms)
            }
            TermsOrCardinalityRequest::Cardinality(req) => {
                let idx_in_req_data = data.push_cardinality_req_data(CardinalityAggReqData {
                    accessor,
                    column_type,
                    str_dict_column: str_dict_column.clone(),
                    missing_value_for_accessor,
                    name: agg_name.to_string(),
                    req: req.clone(),
                });
                (idx_in_req_data, AggKind::Cardinality)
            }
        };
        nodes.push(AggRefNode {
            kind,
            idx_in_req_data: idx,
            children,
        });
    }

    Ok(nodes)
}

/// Computes the set of term ordinals of a string dictionary column that pass the
/// include/exclude parameters.
///
/// With `include`, the set starts empty and receives every matching ordinal. With `exclude`,
/// matching ordinals are removed, starting from the full set when there is no `include`.
/// Returns `None` when neither parameter is given.
fn build_allowed_term_ids_for_str(
    str_col: &StrColumn,
    include: &Option<IncludeExcludeParam>,
    exclude: &Option<IncludeExcludeParam>,
) -> crate::Result<Option<BitSet>> {
    let num_terms = str_col.dictionary().num_terms() as u32;

    let mut allowed = match include {
        Some(include_param) => {
            // add matches
            let mut included = BitSet::with_max_value(num_terms);
            for_each_matching_term_ord(str_col, include_param, |ord| included.insert(ord))?;
            Some(included)
        }
        None => None,
    };

    if let Some(exclude_param) = exclude {
        // Without an include filter, start with all terms allowed
        let remaining =
            allowed.get_or_insert_with(|| BitSet::with_max_value_and_full(num_terms));
        for_each_matching_term_ord(str_col, exclude_param, |ord| remaining.remove(ord))?;
    }

    Ok(allowed)
}

/// Invokes `cb` with the ordinal of every dictionary term selected by `param`.
///
/// A regex parameter is compiled and run against the dictionary. A value list is matched by
/// streaming over all terms; terms that are not valid UTF-8 are never reported.
///
/// Returns `InvalidArgument` when the regex pattern cannot be compiled.
fn for_each_matching_term_ord(
    str_col: &StrColumn,
    param: &IncludeExcludeParam,
    mut cb: impl FnMut(u32),
) -> crate::Result<()> {
    match param {
        IncludeExcludeParam::Regex(pattern) => {
            let compiled = Regex::new(pattern).map_err(|e| {
                crate::TantivyError::InvalidArgument(format!("Invalid regex `{}`: {}", pattern, e))
            })?;
            // TODO: we can handle patterns like `^prefix.*` more efficiently
            let mut matching_terms = str_col.dictionary().search(compiled).into_stream()?;
            while matching_terms.advance() {
                cb(matching_terms.term_ord() as u32);
            }
        }
        IncludeExcludeParam::Values(values) => {
            let wanted: FxHashSet<&str> = values.iter().map(|s| s.as_str()).collect();
            let mut all_terms = str_col.dictionary().stream()?;
            while all_terms.advance() {
                match std::str::from_utf8(all_terms.key()) {
                    Ok(term) if wanted.contains(term) => cb(all_terms.term_ord() as u32),
                    _ => {}
                }
            }
        }
    }
    Ok(())
}

/// A serializable, easy to read view of one node of the aggregation tree.
#[derive(Serialize, Debug, Clone, PartialEq, Eq)]
pub struct AggTreeViewNode {
    /// Name of the aggregation this node belongs to.
    pub name: String,
    /// Kind of the node as a string, e.g. `"Terms"` or `"Metric"`.
    pub kind: String,
    /// Child nodes. Left out of the serialized output when empty.
    #[serde(skip_serializing_if = "Vec::is_empty", default)]
    pub children: Vec<AggTreeViewNode>,
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::aggregation::agg_req::Aggregations;
    use crate::aggregation::tests::get_test_index_2_segments;

    // Deserializes a single aggregation from its JSON representation, panicking on invalid input.
    fn agg_from_json(val: serde_json::Value) -> crate::aggregation::agg_req::Aggregation {
        serde_json::from_value(val).unwrap()
    }

    // Checks the root nodes of the tree view built for the first segment, including the
    // expansion of a terms aggregation with a string `missing` on a numeric field into a
    // MissingTerm node plus a Terms node.
    #[test]
    fn test_tree_roots_and_expansion_terms_missing_on_numeric() -> crate::Result<()> {
        let index = get_test_index_2_segments(true)?;
        let reader = index.reader()?;
        let searcher = reader.searcher();
        let seg_reader = searcher.segment_reader(0u32);

        // Build request with:
        // 1) Terms on numeric field with missing as string => expands to MissingTerm + Terms
        // 2) Avg metric
        // 3) Terms on string with child histogram
        let terms_score_missing = agg_from_json(json!({
            "terms": {"field": "score", "missing": "NA"}
        }));
        let avg_score = agg_from_json(json!({
            "avg": {"field": "score"}
        }));
        let terms_string_with_child = agg_from_json(json!({
            "terms": {"field": "string_id"},
            "aggs": {
                "histo": {"histogram": {"field": "score", "interval": 10.0}}
            }
        }));

        let aggs: Aggregations = vec![
            ("t_score_missing_str".to_string(), terms_score_missing),
            ("avg_score".to_string(), avg_score),
            ("terms_string".to_string(), terms_string_with_child),
        ]
        .into_iter()
        .collect();

        let data = build_aggregations_data_from_req(&aggs, seg_reader, 0u32, Default::default())?;
        let printed_nodes = data.per_request.get_view_tree();
        let printed = serde_json::to_value(&printed_nodes).unwrap();

        // The numeric terms aggregation shows up twice under the same name: once as
        // MissingTerm and once as Terms. Nodes without children serialize no `children` key.
        let expected = json!([
            {"name": "avg_score", "kind": "Metric"},
            {"name": "t_score_missing_str", "kind": "MissingTerm"},
            {"name": "t_score_missing_str", "kind": "Terms"},
            {"name": "terms_string", "kind": "Terms", "children": [
                {"name": "histo", "kind": "Histogram"}
            ]}
        ]);
        assert_eq!(
            printed,
            expected,
            "tree json:\n{}",
            serde_json::to_string_pretty(&printed).unwrap()
        );

        Ok(())
    }
}


================================================
FILE: src/aggregation/agg_limits.rs
================================================
use std::collections::HashMap;
use std::sync::atomic::{AtomicU64, Ordering};
use std::sync::Arc;

use common::ByteCount;

use super::collector::DEFAULT_MEMORY_LIMIT;
use super::{AggregationError, DEFAULT_BUCKET_LIMIT};

/// Estimates how much memory a value occupies.
///
/// The estimate is not recursive: memory owned by nested values is not followed.
pub trait MemoryConsumption {
    /// Returns the estimated memory consumption in bytes.
    fn memory_consumption(&self) -> usize;
}

impl<K, V, S> MemoryConsumption for HashMap<K, V, S> {
    /// Estimate based on the capacity of the map: the size of a key plus the size of a value
    /// plus one extra byte, for each slot of capacity.
    fn memory_consumption(&self) -> usize {
        let bytes_per_slot = std::mem::size_of::<K>() + std::mem::size_of::<V>() + 1;
        bytes_per_slot * self.capacity()
    }
}

/// Aggregation memory limit after which the request fails. Defaults to DEFAULT_MEMORY_LIMIT
/// (500MB). The limit is shared by all SegmentCollectors
///
/// The memory limit is also a guard, which tracks how much it allocated and releases its memory
/// on the shared counter. Cloning will create a new guard, which shares the counter but starts
/// with no memory tracked.
pub struct AggregationLimitsGuard {
    /// The counter which is shared between the aggregations for one request.
    memory_consumption: Arc<AtomicU64>,
    /// The memory_limit in bytes
    memory_limit: ByteCount,
    /// The maximum number of buckets _returned_
    /// This is not counting intermediate buckets.
    bucket_limit: u32,
    /// Allocated memory with this guard.
    allocated_with_the_guard: u64,
}

impl Clone for AggregationLimitsGuard {
    /// Creates a new guard on the same shared counter and with the same limits.
    /// The new guard starts with no memory tracked.
    fn clone(&self) -> Self {
        let shared_counter = Arc::clone(&self.memory_consumption);
        Self {
            allocated_with_the_guard: 0,
            bucket_limit: self.bucket_limit,
            memory_limit: self.memory_limit,
            memory_consumption: shared_counter,
        }
    }
}

impl Drop for AggregationLimitsGuard {
    /// Gives back to the shared counter everything that was allocated through this _instance_.
    /// This clears the segment specific memory consumption all at once.
    fn drop(&mut self) {
        let released_bytes = self.allocated_with_the_guard;
        self.memory_consumption
            .fetch_sub(released_bytes, Ordering::Relaxed);
    }
}

impl Default for AggregationLimitsGuard {
    fn default() -> Self {
        Self {
            memory_consumption: Default::default(),
            memory_limit: DEFAULT_MEMORY_LIMIT.into(),
            bucket_limit: DEFAULT_BUCKET_LIMIT,
            allocated_with_the_guard: 0,
        }
    }
}

impl AggregationLimitsGuard {
    /// Creates a new guard with its own memory counter.
    ///
    /// *memory_limit*
    /// The limit in bytes. The aggregation fails once its estimated memory consumption is
    /// higher than memory_limit. Defaults to `DEFAULT_MEMORY_LIMIT` (500MB).
    ///
    /// *bucket_limit*
    /// The maximum number of buckets returned from an aggregation request.
    /// Defaults to `DEFAULT_BUCKET_LIMIT` (65000).
    ///
    /// Note: The returned instance contains an Arc shared counter to track memory consumption.
    pub fn new(memory_limit: Option<u64>, bucket_limit: Option<u32>) -> Self {
        let memory_limit_bytes = memory_limit.unwrap_or(DEFAULT_MEMORY_LIMIT);
        let max_buckets = bucket_limit.unwrap_or(DEFAULT_BUCKET_LIMIT);
        Self {
            memory_consumption: Default::default(),
            memory_limit: memory_limit_bytes.into(),
            bucket_limit: max_buckets,
            allocated_with_the_guard: 0,
        }
    }

    /// Adds `add_num_bytes` to the shared counter and to the amount tracked by this guard,
    /// then fails if the new shared total is higher than the memory limit.
    pub(crate) fn add_memory_consumed(&mut self, add_num_bytes: u64) -> crate::Result<()> {
        let consumed_before = self
            .memory_consumption
            .fetch_add(add_num_bytes, Ordering::Relaxed);
        // Tracked before validating, so the bytes are released on drop even on failure.
        self.allocated_with_the_guard += add_num_bytes;
        let consumed_now = consumed_before + add_num_bytes;
        validate_memory_consumption(consumed_now, self.memory_limit)?;
        Ok(())
    }

    /// Returns the maximum number of buckets an aggregation request may return.
    pub(crate) fn get_bucket_limit(&self) -> u32 {
        self.bucket_limit
    }
}

/// Checks the estimated memory consumed by the aggregations against the limit.
///
/// Returns `AggregationError::MemoryExceeded` when `memory_consumption` is strictly higher
/// than `memory_limit`.
fn validate_memory_consumption(
    memory_consumption: u64,
    memory_limit: ByteCount,
) -> Result<(), AggregationError> {
    let memory_consumed: ByteCount = memory_consumption.into();
    if memory_consumed > memory_limit {
        Err(AggregationError::MemoryExceeded {
            limit: memory_limit,
            current: memory_consumed,
        })
    } else {
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use crate::aggregation::tests::exec_request_with_query;

    // https://github.com/quickwit-oss/quickwit/issues/3837
    //
    // Terms aggregation with `min_doc_count: 0` and a date_histogram sub-aggregation using
    // extended bounds, on an index where only one of the two documents has a date. The query
    // `text:bbb` is expected to yield a single `bbb` bucket with one document and ten daily
    // histogram buckets.
    #[test]
    fn test_agg_limits_with_empty_merge() {
        use crate::aggregation::agg_req::Aggregations;
        use crate::aggregation::bucket::tests::get_test_index_from_docs;

        let docs = vec![
            vec![r#"{ "date": "2015-01-02T00:00:00Z", "text": "bbb", "text2": "bbb" }"#],
            vec![r#"{ "text": "aaa", "text2": "bbb" }"#],
        ];
        let index = get_test_index_from_docs(false, &docs).unwrap();

        {
            let elasticsearch_compatible_json = json!(
                {
                    "1": {
                        "terms": {"field": "text2", "min_doc_count": 0},
                        "aggs": {
                            "2":{
                                "date_histogram": {
                                    "field": "date",
                                    "fixed_interval": "1d",
                                    "extended_bounds": {
                                        "min": "2015-01-01T00:00:00Z",
                                        "max": "2015-01-10T00:00:00Z"
                                    }
                                }
                            }
                        }
                    }
                }
            );

            let agg_req: Aggregations = serde_json::from_str(
                &serde_json::to_string(&elasticsearch_compatible_json).unwrap(),
            )
            .unwrap();
            let res = exec_request_with_query(agg_req, &index, Some(("text", "bbb"))).unwrap();
            // Only the 2015-01-02 bucket holds a document; the other days come from the
            // extended bounds.
            let expected_res = json!({
             "1": {
                "buckets": [
                  {
                    "2": {
                      "buckets": [
                        { "doc_count": 0, "key": 1420070400000.0, "key_as_string": "2015-01-01T00:00:00Z" },
                        { "doc_count": 1, "key": 1420156800000.0, "key_as_string": "2015-01-02T00:00:00Z" },
                        { "doc_count": 0, "key": 1420243200000.0, "key_as_string": "2015-01-03T00:00:00Z" },
                        { "doc_count": 0, "key": 1420329600000.0, "key_as_string": "2015-01-04T00:00:00Z" },
                        { "doc_count": 0, "key": 1420416000000.0, "key_as_string": "2015-01-05T00:00:00Z" },
                        { "doc_count": 0, "key": 1420502400000.0, "key_as_string": "2015-01-06T00:00:00Z" },
                        { "doc_count": 0, "key": 1420588800000.0, "key_as_string": "2015-01-07T00:00:00Z" },
                        { "doc_count": 0, "key": 1420675200000.0, "key_as_string": "2015-01-08T00:00:00Z" },
                        { "doc_count": 0, "key": 1420761600000.0, "key_as_string": "2015-01-09T00:00:00Z" },
                        { "doc_count": 0, "key": 1420848000000.0, "key_as_string": "2015-01-10T00:00:00Z" }
                      ]
                    },
                    "doc_count": 1,
                    "key": "bbb"
                  }
                ],
                "doc_count_error_upper_bound": 0,
                "sum_other_doc_count": 0
              }
            });
            assert_eq!(res, expected_res);
        }
    }

    // https://github.com/quickwit-oss/quickwit/issues/3837
    //
    // Same request as above on an index whose only document has no date and whose `text`
    // is not `bbb`. The `bbb` bucket is still expected, with a doc count of zero and ten
    // empty daily histogram buckets.
    #[test]
    fn test_agg_limits_with_empty_data() {
        use crate::aggregation::agg_req::Aggregations;
        use crate::aggregation::bucket::tests::get_test_index_from_docs;

        let docs = vec![vec![r#"{ "text": "aaa", "text2": "bbb" }"#]];
        let index = get_test_index_from_docs(false, &docs).unwrap();

        {
            // Empty result since there is no doc with dates
            let elasticsearch_compatible_json = json!(
                {
                    "1": {
                        "terms": {"field": "text2", "min_doc_count": 0},
                        "aggs": {
                            "2":{
                                "date_histogram": {
                                    "field": "date",
                                    "fixed_interval": "1d",
                                    "extended_bounds": {
                                        "min": "2015-01-01T00:00:00Z",
                                        "max": "2015-01-10T00:00:00Z"
                                    }
                                }
                            }
                        }
                    }
                }
            );

            let agg_req: Aggregations = serde_json::from_str(
                &serde_json::to_string(&elasticsearch_compatible_json).unwrap(),
            )
            .unwrap();
            let res = exec_request_with_query(agg_req, &index, Some(("text", "bbb"))).unwrap();
            let expected_res = json!({
             "1": {
                "buckets": [
                  {
                    "2": {
                      "buckets": [
                        { "doc_count": 0, "key": 1420070400000.0, "key_as_string": "2015-01-01T00:00:00Z" },
                        { "doc_count": 0, "key": 1420156800000.0, "key_as_string": "2015-01-02T00:00:00Z" },
                        { "doc_count": 0, "key": 1420243200000.0, "key_as_string": "2015-01-03T00:00:00Z" },
                        { "doc_count": 0, "key": 1420329600000.0, "key_as_string": "2015-01-04T00:00:00Z" },
                        { "doc_count": 0, "key": 1420416000000.0, "key_as_string": "2015-01-05T00:00:00Z" },
                        { "doc_count": 0, "key": 1420502400000.0, "key_as_string": "2015-01-06T00:00:00Z" },
                        { "doc_count": 0, "key": 1420588800000.0, "key_as_string": "2015-01-07T00:00:00Z" },
                        { "doc_count": 0, "key": 1420675200000.0, "key_as_string": "2015-01-08T00:00:00Z" },
                        { "doc_count": 0, "key": 1420761600000.0, "key_as_string": "2015-01-09T00:00:00Z" },
                        { "doc_count": 0, "key": 1420848000000.0, "key_as_string": "2015-01-10T00:00:00Z" }
                      ]
                    },
                    "doc_count": 0,
                    "key": "bbb"
                  }
                ],
                "doc_count_error_upper_bound": 0,
                "sum_other_doc_count": 0
              }
            });
            assert_eq!(res, expected_res);
        }
    }
}


================================================
FILE: src/aggregation/agg_req.rs
================================================
//! Contains the aggregation request tree. Used to build an
//! [`AggregationCollector`](super::AggregationCollector).
//!
//! [`Aggregations`] is the top level entry point to create a request, which is a `HashMap<String,
//! Aggregation>`.
//!
//! Requests are compatible with the json format of elasticsearch.
//!
//! # Example
//!
//! ```
//! use tantivy::aggregation::agg_req::Aggregations;
//!
//! let elasticsearch_compatible_json_req = r#"
//! {
//!   "range": {
//!     "range": {
//!       "field": "score",
//!       "ranges": [
//!         { "from": 3.0, "to": 7.0 },
//!         { "from": 7.0, "to": 20.0 }
//!       ]
//!     }
//!   }
//! }"#;
//! let _agg_req: Aggregations = serde_json::from_str(elasticsearch_compatible_json_req).unwrap();
//! ```

use std::collections::HashSet;

use rustc_hash::FxHashMap;
use serde::{Deserialize, Serialize};

use super::bucket::{
    CompositeAggregation, DateHistogramAggregationReq, FilterAggregation, HistogramAggregation,
    RangeAggregation, TermsAggregation,
};
use super::metric::{
    AverageAggregation, CardinalityAggregationReq, CountAggregation, ExtendedStatsAggregation,
    MaxAggregation, MinAggregation, PercentilesAggregationReq, StatsAggregation, SumAggregation,
    TopHitsAggregationReq,
};

/// The top-level aggregation request structure, which contains [`Aggregation`]s and their
/// user-defined names. It is also used in bucket aggregations to define sub-aggregations.
///
/// The key is the user-defined name of the aggregation.
pub type Aggregations = FxHashMap<String, Aggregation>;

/// Aggregation request.
///
/// An aggregation is either a bucket or a metric.
///
/// Deserialization goes through the intermediary `AggregationForDeserialization` struct.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(try_from = "AggregationForDeserialization")]
pub struct Aggregation {
    /// The aggregation variant, which can be either a bucket or a metric.
    #[serde(flatten)]
    pub agg: AggregationVariants,
    /// The sub-aggregations, which are computed on the document set in the bucket.
    /// Serialized under the `aggs` key, and left out when empty.
    #[serde(rename = "aggs")]
    #[serde(skip_serializing_if = "Aggregations::is_empty")]
    pub sub_aggregation: Aggregations,
}

/// In order to display proper error messages, we cannot rely on flattening
/// the json enum. Instead we introduce an intermediary struct to separate
/// the aggregation from the sub-aggregations.
#[derive(Deserialize)]
struct AggregationForDeserialization {
    /// Everything except the `aggs` key, kept as raw json until it is parsed into an
    /// `AggregationVariants`.
    #[serde(flatten)]
    pub aggs_remaining_json: serde_json::Value,
    /// The sub-aggregations read from the `aggs` key. Empty when the key is absent.
    #[serde(rename = "aggs")]
    #[serde(default)]
    pub sub_aggregation: Aggregations,
}

impl TryFrom<AggregationForDeserialization> for Aggregation {
    type Error = serde_json::Error;

    /// Parses the raw json left over next to `aggs` into an [`AggregationVariants`] and
    /// combines it with the already deserialized sub-aggregations.
    fn try_from(value: AggregationForDeserialization) -> serde_json::Result<Self> {
        let agg: AggregationVariants = serde_json::from_value(value.aggs_remaining_json)?;
        Ok(Self {
            agg,
            sub_aggregation: value.sub_aggregation,
        })
    }
}

impl Aggregation {
    pub(crate) fn sub_aggregation(&self) -> &Aggregations {
        &self.sub_aggregation
    }

    fn get_fast_field_names(&self, fast_field_names: &mut HashSet<String>) {
        fast_field_names.extend(
            self.agg
                .get_fast_field_names()
                .iter()
                .map(|s| s.to_string()),
        );
        fast_field_names.extend(get_fast_field_names(&self.sub_aggregation));
    }
}

/// Collects the names of all fast fields used anywhere in the aggregation tree.
pub fn get_fast_field_names(aggs: &Aggregations) -> HashSet<String> {
    let mut collected_names = HashSet::new();
    aggs.values()
        .for_each(|agg| agg.get_fast_field_names(&mut collected_names));
    collected_names
}

#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
/// All aggregation types.
///
/// Each variant is (de)serialized under the lowercase key given by its `serde(rename)`.
pub enum AggregationVariants {
    // Bucket aggregation types
    /// Put data into buckets of user-defined ranges.
    #[serde(rename = "range")]
    Range(RangeAggregation),
    /// Put data into a histogram.
    #[serde(rename = "histogram")]
    Histogram(HistogramAggregation),
    /// Put data into a date histogram.
    #[serde(rename = "date_histogram")]
    DateHistogram(DateHistogramAggregationReq),
    /// Put data into buckets of terms.
    #[serde(rename = "terms")]
    Terms(TermsAggregation),
    /// Filter documents into a single bucket.
    #[serde(rename = "filter")]
    Filter(FilterAggregation),
    /// Multi-dimensional, paginable bucket aggregation.
    #[serde(rename = "composite")]
    Composite(CompositeAggregation),

    // Metric aggregation types
    /// Computes the average of the extracted values.
    #[serde(rename = "avg")]
    Average(AverageAggregation),
    /// Counts the number of extracted values.
    #[serde(rename = "value_count")]
    Count(CountAggregation),
    /// Finds the maximum value.
    #[serde(rename = "max")]
    Max(MaxAggregation),
    /// Finds the minimum value.
    #[serde(rename = "min")]
    Min(MinAggregation),
    /// Computes a collection of statistics (`min`, `max`, `sum`, `count`, and `avg`) over the
    /// extracted values.
    #[serde(rename = "stats")]
    Stats(StatsAggregation),
    /// Computes a collection of extended statistics (`min`, `max`, `sum`, `count`, `avg`,
    /// `sum_of_squares`, `variance`, `variance_sampling`, `std_deviation`,
    /// `std_deviation_sampling`) over the extracted values.
    #[serde(rename = "extended_stats")]
    ExtendedStats(ExtendedStatsAggregation),
    /// Computes the sum of the extracted values.
    #[serde(rename = "sum")]
    Sum(SumAggregation),
    /// Computes percentiles of the extracted values.
    #[serde(rename = "percentiles")]
    Percentiles(PercentilesAggregationReq),
    /// Finds the top k values matching some order
    #[serde(rename = "top_hits")]
    TopHits(TopHitsAggregationReq),
    /// Computes an estimate of the number of unique values
    #[serde(rename = "cardinality")]
    Cardinality(CardinalityAggregationReq),
}

impl AggregationVariants {
    /// Returns the name of the fields used by the aggregation.
    pub fn get_fast_field_names(&self) -> Vec<&str> {
        match self {
            AggregationVariants::Terms(terms) => vec![terms.field.as_str()],
            AggregationVariants::Range(range) => vec![range.field.as_str()],
            AggregationVariants::Histogram(histogram) => vec![histogram.field.as_str()],
            AggregationVariants::DateHistogram(histogram) => vec![histogram.field.as_str()],
            AggregationVariants::Filter(filter) => filter.get_fast_field_names(),
            AggregationVariants::Composite(composite) => composite
                .sources
                .iter()
                .map(|source| source.field())
                .collect(),
            AggregationVariants::Average(avg) => vec![avg.field_name()],
            AggregationVariants::Count(count) => vec![count.field_name()],
            AggregationVariants::Max(max) => vec![max.field_name()],
            AggregationVariants::Min(min) => vec![min.field_name()],
            AggregationVariants::Stats(stats) => vec![stats.field_name()],
            AggregationVariants::ExtendedStats(extended_stats) => vec![extended_stats.field_name()],
            AggregationVariants::Sum(sum) => vec![sum.field_name()],
            AggregationVariants::Percentiles(per) => vec![per.field_name()],
            AggregationVariants::TopHits(top_hits) => top_hits.field_names(),
            AggregationVariants::Cardinality(per) => vec![per.field_name()],
        }
    }

    pub(crate) fn as_range(&self) -> Option<&RangeAggregation> {
        match &self {
            AggregationVariants::Range(range) => Some(range),
            _ => None,
        }
    }
    pub(crate) fn as_histogram(&self) -> crate::Result<Option<HistogramAggregation>> {
        match &self {
            AggregationVariants::Histogram(histogram) => Ok(Some(histogram.clone())),
            AggregationVariants::DateHistogram(histogram) => {
                Ok(Some(histogram.to_histogram_req()?))
            }
            _ => Ok(None),
        }
    }
    pub(crate) fn as_term(&self) -> Option<&TermsAggregation> {
        match &self {
            AggregationVariants::Terms(terms) => Some(terms),
            _ => None,
        }
    }
    pub(crate) fn as_composite(&self) -> Option<&CompositeAggregation> {
        match &self {
            AggregationVariants::Composite(composite) => Some(composite),
            _ => None,
        }
    }
    pub(crate) fn as_percentile(&self) -> Option<&PercentilesAggregationReq> {
        match &self {
            AggregationVariants::Percentiles(percentile_req) => Some(percentile_req),
            _ => None,
        }
    }
}

#[cfg(test)]
mod tests {

    use super::*;

    /// A flat request consisting only of metric aggregations must deserialize.
    #[test]
    fn deser_json_test() {
        let metrics_json = r#"{
            "price_avg": { "avg": { "field": "price" } },
            "price_count": { "value_count": { "field": "price" } },
            "price_max": { "max": { "field": "price" } },
            "price_min": { "min": { "field": "price" } },
            "price_stats": { "stats": { "field": "price" } },
            "price_sum": { "sum": { "field": "price" } }
        }"#;
        let _parsed = serde_json::from_str::<Aggregations>(metrics_json).unwrap();
    }

    /// Bucket aggregations carrying nested `aggs` must deserialize.
    #[test]
    fn deser_json_test_bucket() {
        let buckets_json = r#"
    {
        "termagg": {
            "terms": {
                "field": "json.mixed_type",
                "order": { "min_price": "desc" }
            },
            "aggs": {
                "min_price": { "min": { "field": "json.mixed_type" } }
            }
        },
        "rangeagg": {
            "range": {
                "field": "json.mixed_type",
                "ranges": [
                    { "to": 3.0 },
                    { "from": 19.0, "to": 20.0 },
                    { "from": 20.0 }
                ]
            },
            "aggs": {
                "average_in_range": { "avg": { "field": "json.mixed_type" } }
            }
        }
    } "#;

        let _parsed = serde_json::from_str::<Aggregations>(buckets_json).unwrap();
    }

    /// Each metric keyword must map to the matching variant and keep its field name.
    #[test]
    fn test_metric_aggregations_deser() {
        let metrics_json = r#"{
            "price_avg": { "avg": { "field": "price" } },
            "price_count": { "value_count": { "field": "price" } },
            "price_max": { "max": { "field": "price" } },
            "price_min": { "min": { "field": "price" } },
            "price_stats": { "stats": { "field": "price" } },
            "price_sum": { "sum": { "field": "price" } }
        }"#;
        let parsed: Aggregations = serde_json::from_str(metrics_json).unwrap();

        let avg_agg = &parsed.get("price_avg").unwrap().agg;
        assert!(matches!(avg_agg, AggregationVariants::Average(avg) if avg.field == "price"));

        let count_agg = &parsed.get("price_count").unwrap().agg;
        assert!(matches!(count_agg, AggregationVariants::Count(count) if count.field == "price"));

        let max_agg = &parsed.get("price_max").unwrap().agg;
        assert!(matches!(max_agg, AggregationVariants::Max(max) if max.field == "price"));

        let min_agg = &parsed.get("price_min").unwrap().agg;
        assert!(matches!(min_agg, AggregationVariants::Min(min) if min.field == "price"));

        let stats_agg = &parsed.get("price_stats").unwrap().agg;
        assert!(matches!(stats_agg, AggregationVariants::Stats(stats) if stats.field == "price"));

        let sum_agg = &parsed.get("price_sum").unwrap().agg;
        assert!(matches!(sum_agg, AggregationVariants::Sum(sum) if sum.field == "price"));
    }

    /// Deserializing and pretty-printing a request must reproduce the input text exactly.
    #[test]
    fn serialize_to_json_test() {
        let elasticsearch_compatible_json_req = r#"{
  "range": {
    "range": {
      "field": "score",
      "ranges": [
        {
          "to": 3.0
        },
        {
          "from": 3.0,
          "to": 7.0
        },
        {
          "from": 7.0,
          "to": 20.0
        },
        {
          "from": 20.0
        }
      ],
      "keyed": true
    }
  }
}"#;

        let parsed: Aggregations = serde_json::from_str(elasticsearch_compatible_json_req).unwrap();
        let round_tripped: String = serde_json::to_string_pretty(&parsed).unwrap();

        assert_eq!(round_tripped, elasticsearch_compatible_json_req);
    }

    /// Field names must be collected from top-level aggregations and from nested `aggs`.
    #[test]
    fn test_get_fast_field_names() {
        // A standalone aggregation, embedded into the request below as "range1".
        let score_ranges: Aggregation = serde_json::from_value(json!({
            "range": {
                "field": "score",
                "ranges": [
                    { "to": 3.0 },
                    { "from": 3.0, "to": 7.0 },
                    { "from": 7.0, "to": 20.0 },
                    { "from": 20.0 }
                ],
            }

        }))
        .unwrap();

        let requests: Aggregations = serde_json::from_value(json!({
            "range1": score_ranges,
            "range2":{
                "range": {
                    "field": "score2",
                    "ranges": [
                        { "to": 3.0 },
                        { "from": 3.0, "to": 7.0 },
                        { "from": 7.0, "to": 20.0 },
                        { "from": 20.0 }
                    ],
                },
                "aggs": {
                    "metric": {
                        "avg": {
                            "field": "field123"
                        }
                    }
                }
            }
        }))
        .unwrap();

        assert_eq!(
            get_fast_field_names(&requests),
            ["score", "score2", "field123"]
                .iter()
                .map(|name| name.to_string())
                .collect()
        )
    }
}


================================================
FILE: src/aggregation/agg_result.rs
================================================
//! Contains the final aggregation tree.
//!
//! This tree can be converted via the `into()` method from `IntermediateAggregationResults`.
//! This conversion computes the final result. For example: The intermediate result contains
//! intermediate average results, which is the sum and the number of values. The actual average is
//! calculated on the step from intermediate to final aggregation result tree.

use rustc_hash::FxHashMap;
use serde::{Deserialize, Serialize};

use super::bucket::GetDocCount;
use super::intermediate_agg_result::CompositeIntermediateKey;
use super::metric::{
    ExtendedStats, PercentilesMetricResult, SingleMetricResult, Stats, TopHitsMetricResult,
};
use super::{AggregationError, Key};
use crate::aggregation::bucket::AfterKey;
use crate::TantivyError;

#[derive(Clone, Default, Debug, PartialEq, Serialize, Deserialize)]
/// The final aggregation result.
///
/// Wraps a map from aggregation name to the final result of that aggregation. The same type
/// also holds the sub-aggregation results nested inside bucket entries.
pub struct AggregationResults(pub FxHashMap<String, AggregationResult>);

impl AggregationResults {
    /// Sums the bucket counts of all aggregations held in this result map.
    pub(crate) fn get_bucket_count(&self) -> u64 {
        let per_aggregation = self.0.values().map(|result| result.get_bucket_count());
        per_aggregation.sum::<u64>()
    }

    /// Looks up the aggregation called `name` and extracts the value of `agg_property` from it.
    ///
    /// # Errors
    /// Returns an `InternalError` if no aggregation is registered under `name`, and forwards
    /// any error raised while extracting the value.
    pub(crate) fn get_value_from_aggregation(
        &self,
        name: &str,
        agg_property: &str,
    ) -> crate::Result<Option<f64>> {
        match self.0.get(name) {
            Some(found) => found.get_value_from_aggregation(name, agg_property),
            // Validation is done during request parsing, so we can't reach this state.
            None => Err(TantivyError::InternalError(format!(
                "Can't find aggregation {name:?} in sub-aggregations"
            ))),
        }
    }
}

#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(untagged)]
/// An aggregation is either a bucket or a metric.
///
/// The enum is marked `untagged`, so the serialized form is the inner result itself without a
/// wrapper naming the variant.
pub enum AggregationResult {
    /// Bucket result variant.
    BucketResult(BucketResult),
    /// Metric result variant.
    MetricResult(MetricResult),
}

impl AggregationResult {
    /// Number of buckets contributed by this aggregation; metric results contribute none.
    pub(crate) fn get_bucket_count(&self) -> u64 {
        match self {
            Self::MetricResult(_) => 0,
            Self::BucketResult(bucket_result) => bucket_result.get_bucket_count(),
        }
    }

    /// Extracts the value of `agg_property` from a metric result.
    ///
    /// # Errors
    /// Bucket results carry no single value, so asking one for a value is reported as an
    /// `InternalError`. Errors from the metric result itself are forwarded.
    pub(crate) fn get_value_from_aggregation(
        &self,
        _name: &str,
        agg_property: &str,
    ) -> crate::Result<Option<f64>> {
        let metric_result = match self {
            Self::MetricResult(metric_result) => metric_result,
            Self::BucketResult(_) => {
                return Err(TantivyError::InternalError(
                    "Tried to retrieve value from bucket aggregation. This is not supported and \
                     should not happen during collection phase, but should be caught during \
                     validation"
                        .to_string(),
                ));
            }
        };
        metric_result.get_value(agg_property)
    }
}

#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(untagged)]
/// The final result of a metric aggregation.
///
/// The enum is marked `untagged`, so the serialized form is the payload itself.
/// NOTE(review): several variants share the `SingleMetricResult` payload, so the variant
/// presumably cannot be recovered when deserializing — confirm before relying on it.
pub enum MetricResult {
    /// Average metric result.
    Average(SingleMetricResult),
    /// Count metric result.
    Count(SingleMetricResult),
    /// Max metric result.
    Max(SingleMetricResult),
    /// Min metric result.
    Min(SingleMetricResult),
    /// Stats metric result.
    Stats(Stats),
    /// ExtendedStats metric result (boxed).
    ExtendedStats(Box<ExtendedStats>),
    /// Sum metric result.
    Sum(SingleMetricResult),
    /// Percentiles metric result.
    Percentiles(PercentilesMetricResult),
    /// Top hits metric result
    TopHits(TopHitsMetricResult),
    /// Cardinality metric result
    Cardinality(SingleMetricResult),
}

impl MetricResult {
    /// Extracts a single numeric value from this metric result.
    ///
    /// Single-value metrics return their value and ignore `agg_property`. `stats` and
    /// `extended_stats` resolve `agg_property` themselves.
    ///
    /// # Errors
    /// `percentiles` and `top_hits` are rejected with an `InvalidRequest` aggregation error.
    fn get_value(&self, agg_property: &str) -> crate::Result<Option<f64>> {
        match self {
            // Every variant backed by a single value behaves the same way.
            Self::Average(single)
            | Self::Count(single)
            | Self::Max(single)
            | Self::Min(single)
            | Self::Sum(single)
            | Self::Cardinality(single) => Ok(single.value),
            Self::Stats(stats) => stats.get_value(agg_property),
            Self::ExtendedStats(extended_stats) => extended_stats.get_value(agg_property),
            Self::Percentiles(_) => {
                let reason = "percentiles can't be used to order".to_string();
                Err(TantivyError::AggregationError(
                    AggregationError::InvalidRequest(reason),
                ))
            }
            Self::TopHits(_) => {
                let reason = "top_hits can't be used to order".to_string();
                Err(TantivyError::AggregationError(
                    AggregationError::InvalidRequest(reason),
                ))
            }
        }
    }
}

/// BucketResult holds the final result of a bucket aggregation, one variant per bucket
/// aggregation type.
///
/// The enum is marked `untagged`, so the serialized form is the content of the variant itself.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(untagged)]
pub enum BucketResult {
    /// This is the range result. Each entry contains a key, count, from, to, and optionally
    /// sub-aggregations.
    Range {
        /// The range buckets sorted by range.
        buckets: BucketEntries<RangeBucketEntry>,
    },
    /// This is the histogram result. Each entry contains a key, count, and optionally
    /// sub-aggregations.
    Histogram {
        /// The buckets.
        ///
        /// Whether there are holes depends on the request: if min_doc_count is 0, then there
        /// are no holes between the first and last bucket.
        /// See [`HistogramAggregation`](super::bucket::HistogramAggregation)
        buckets: BucketEntries<BucketEntry>,
    },
    /// This is the term result
    Terms {
        /// The buckets.
        ///
        /// See [`TermsAggregation`](super::bucket::TermsAggregation)
        buckets: Vec<BucketEntry>,
        /// The number of documents that didn't make it into the TOP N due to shard_size or size
        sum_other_doc_count: u64,
        #[serde(skip_serializing_if = "Option::is_none")]
        /// The upper bound error for the doc count of each term. Omitted from the serialized
        /// output when `None`.
        doc_count_error_upper_bound: Option<u64>,
    },
    /// This is the filter result - a single bucket with sub-aggregations
    Filter(FilterBucketResult),
    /// This is the composite result
    Composite {
        /// The buckets
        buckets: Vec<CompositeBucketEntry>,
        /// The key to start after when paginating. Omitted from the serialized output when
        /// empty.
        #[serde(skip_serializing_if = "FxHashMap::is_empty")]
        after_key: FxHashMap<String, AfterKey>,
    },
}

impl BucketResult {
    pub(crate) fn get_bucket_count(&self) -> u64 {
        match self {
            BucketResult::Range { buckets } => {
                buckets.iter().map(|bucket| bucket.get_bucket_count()).sum()
            }
            BucketResult::Histogram { buckets } => {
                buckets.iter().map(|bucket| bucket.get_bucket_count()).sum()
            }
            BucketResult::Terms {
                buckets,
                sum_other_doc_count: _,
                doc_count_error_upper_bound: _,
            } => buckets.iter().map(|bucket| bucket.get_bucket_count()).sum(),
            BucketResult::Filter(filter_result) => {
                // Filter doesn't add to bucket count - it's not a user-facing bucket
                // Only count sub-aggregation buckets
                filter_result.sub_aggregations.get_bucket_count()
            }
            BucketResult::Composite { buckets, .. } => {
                buckets.iter().map(|bucket| bucket.get_bucket_count()).sum()
            }
        }
    }
}

/// This is the wrapper of bucket entries, which can be a vector or a hashmap
/// depending on whether the result is keyed or not.
///
/// The enum is marked `untagged`, so it serializes as the inner collection itself.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(untagged)]
pub enum BucketEntries<T> {
    /// Vector format bucket entries
    Vec(Vec<T>),
    /// HashMap format bucket entries, indexed by a string key
    HashMap(FxHashMap<String, T>),
}

impl<T> BucketEntries<T> {
    fn iter<'a>(&'a self) -> Box<dyn Iterator<Item = &'a T> + 'a> {
        match self {
            BucketEntries::Vec(vec) => Box::new(vec.iter()),
            BucketEntries::HashMap(map) => Box::new(map.values()),
        }
    }
}

/// This is the default entry for a bucket, which contains a key, count, and optionally
/// sub-aggregations.
///
/// Sub-aggregation results are flattened into the entry, so they appear next to `key` and
/// `doc_count` in the serialized form.
///
/// # JSON Format
/// ```json
/// {
///   ...
///     "my_histogram": {
///       "buckets": [
///         {
///           "key": 2.0,
///           "doc_count": 5
///         },
///         {
///           "key": 4.0,
///           "doc_count": 2
///         },
///         {
///           "key": 6.0,
///           "doc_count": 3
///         }
///       ]
///    }
///    ...
/// }
/// ```
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct BucketEntry {
    #[serde(skip_serializing_if = "Option::is_none")]
    /// The string representation of the bucket. Omitted from the serialized output when `None`.
    pub key_as_string: Option<String>,
    /// The identifier of the bucket.
    pub key: Key,
    /// Number of documents in the bucket.
    pub doc_count: u64,
    #[serde(flatten)]
    /// Sub-aggregations in this bucket.
    pub sub_aggregation: AggregationResults,
}
impl BucketEntry {
    /// Counts this bucket plus every bucket nested in its sub-aggregations.
    pub(crate) fn get_bucket_count(&self) -> u64 {
        let nested_buckets = self.sub_aggregation.get_bucket_count();
        nested_buckets + 1
    }
}
// Implemented for references as well, so a borrowed entry can be used where `GetDocCount` is
// required.
impl GetDocCount for &BucketEntry {
    /// Number of documents in the referenced bucket.
    fn doc_count(&self) -> u64 {
        self.doc_count
    }
}
impl GetDocCount for BucketEntry {
    /// Number of documents in the bucket.
    fn doc_count(&self) -> u64 {
        self.doc_count
    }
}

/// This is the range entry for a bucket, which contains a key, count, the optional range
/// bounds, and optionally sub-aggregations.
///
/// Sub-aggregation results are flattened into the entry. The bounds and their string
/// representations are omitted from the serialized output when `None`.
///
/// # JSON Format
/// ```json
/// {
///   ...
///     "my_ranges": {
///       "buckets": [
///         {
///           "key": "*-10",
///           "to": 10,
///           "doc_count": 5
///         },
///         {
///           "key": "10-20",
///           "from": 10,
///           "to": 20,
///           "doc_count": 2
///         },
///         {
///           "key": "20-*",
///           "from": 20,
///           "doc_count": 3
///         }
///       ]
///    }
///    ...
/// }
/// ```
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct RangeBucketEntry {
    /// The identifier of the bucket.
    pub key: Key,
    /// Number of documents in the bucket.
    pub doc_count: u64,
    #[serde(flatten)]
    /// Sub-aggregations in this bucket.
    pub sub_aggregation: AggregationResults,
    /// The from range of the bucket. Equals `f64::MIN` when `None`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub from: Option<f64>,
    /// The to range of the bucket. Equals `f64::MAX` when `None`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub to: Option<f64>,
    /// The optional string representation for the `from` range.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub from_as_string: Option<String>,
    /// The optional string representation for the `to` range.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub to_as_string: Option<String>,
}
impl RangeBucketEntry {
    /// Counts this bucket plus every bucket nested in its sub-aggregations.
    pub(crate) fn get_bucket_count(&self) -> u64 {
        let nested_buckets = self.sub_aggregation.get_bucket_count();
        nested_buckets + 1
    }
}

/// This is the filter bucket result, which contains the document count and sub-aggregations.
///
/// Sub-aggregation results are flattened into the result, so they appear next to `doc_count`
/// in the serialized form.
///
/// # JSON Format
/// ```json
/// {
///   "electronics_only": {
///     "doc_count": 2,
///     "avg_price": {
///       "value": 150.0
///     }
///   }
/// }
/// ```
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct FilterBucketResult {
    /// Number of documents in the filter bucket
    pub doc_count: u64,
    /// Sub-aggregation results
    #[serde(flatten)]
    pub sub_aggregations: AggregationResults,
}

/// The value of one component of a composite bucket key.
///
/// Note the type information loss compared to `CompositeIntermediateKey`.
/// Pagination is performed using `AfterKey`, which encodes type information.
///
/// The enum is marked `untagged`, so a key serializes as the bare value. `PartialEq` and
/// `Hash` are implemented by hand rather than derived, because of the `f64` payload.
#[derive(Clone, Debug, Serialize, Deserialize)]
#[serde(untagged)]
pub enum CompositeKey {
    /// Boolean key
    Bool(bool),
    /// String key
    Str(String),
    /// `i64` key
    I64(i64),
    /// `u64` key
    U64(u64),
    /// `f64` key
    F64(f64),
    /// Null key
    Null,
}
// `Eq` is sound here even with an `f64` payload: the hand-written `PartialEq` compares floats
// by bit pattern, so every value (NaN included) is equal to itself.
impl Eq for CompositeKey {}
impl std::hash::Hash for CompositeKey {
    /// Hashes the variant discriminant followed by the payload.
    ///
    /// Floats are hashed through their bit pattern, which matches the bitwise comparison used
    /// by the `PartialEq` implementation. The trait method is called through its fully
    /// qualified path, so this impl does not depend on `Hash` being imported.
    fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
        // The discriminant keeps equal payloads of different variants apart.
        std::hash::Hash::hash(&core::mem::discriminant(self), state);
        match self {
            Self::Bool(flag) => std::hash::Hash::hash(flag, state),
            Self::Str(text) => std::hash::Hash::hash(text, state),
            Self::F64(float) => std::hash::Hash::hash(&float.to_bits(), state),
            Self::U64(unsigned) => std::hash::Hash::hash(unsigned, state),
            Self::I64(signed) => std::hash::Hash::hash(signed, state),
            // No payload to hash.
            Self::Null => {}
        }
    }
}
impl PartialEq for CompositeKey {
    /// Two keys are equal when they are the same variant with equal payloads.
    ///
    /// Floats are compared by bit pattern rather than numerically, which keeps equality
    /// reflexive and consistent with the `Hash` implementation.
    fn eq(&self, other: &Self) -> bool {
        match self {
            Self::Bool(lhs) => matches!(other, Self::Bool(rhs) if lhs == rhs),
            Self::Str(lhs) => matches!(other, Self::Str(rhs) if lhs == rhs),
            Self::F64(lhs) => matches!(other, Self::F64(rhs) if lhs.to_bits() == rhs.to_bits()),
            Self::I64(lhs) => matches!(other, Self::I64(rhs) if lhs == rhs),
            Self::U64(lhs) => matches!(other, Self::U64(rhs) if lhs == rhs),
            Self::Null => matches!(other, Self::Null),
        }
    }
}
impl From<CompositeIntermediateKey> for CompositeKey {
    /// Converts an intermediate composite key into its final form.
    ///
    /// IP addresses become strings, using the IPv4 form when `to_ipv4_mapped` yields one.
    /// Date-times are divided by 1_000_000 to go from nanoseconds to milliseconds. All other
    /// variants map one-to-one.
    fn from(value: CompositeIntermediateKey) -> Self {
        match value {
            CompositeIntermediateKey::Null => Self::Null,
            CompositeIntermediateKey::Bool(flag) => Self::Bool(flag),
            CompositeIntermediateKey::Str(text) => Self::Str(text),
            CompositeIntermediateKey::I64(signed) => Self::I64(signed),
            CompositeIntermediateKey::U64(unsigned) => Self::U64(unsigned),
            CompositeIntermediateKey::F64(float) => Self::F64(float),
            CompositeIntermediateKey::DateTime(nanos) => {
                // ns to ms
                let millis = nanos / 1_000_000;
                Self::I64(millis)
            }
            CompositeIntermediateKey::IpAddr(addr) => {
                let rendered = match addr.to_ipv4_mapped() {
                    Some(ipv4) => ipv4.to_string(),
                    None => addr.to_string(),
                };
                Self::Str(rendered)
            }
        }
    }
}

/// Composite bucket entry with a multi-dimensional key.
///
/// Sub-aggregation results are flattened into the entry, so they appear next to `key` and
/// `doc_count` in the serialized form.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct CompositeBucketEntry {
    /// The identifier of the bucket: a map from string name to key value.
    pub key: FxHashMap<String, CompositeKey>,
    /// Number of documents in the bucket.
    pub doc_count: u64,
    #[serde(flatten)]
    /// Sub-aggregations in this bucket.
    pub sub_aggregation: AggregationResults,
}

impl CompositeBucketEntry {
    /// Counts this bucket plus every bucket nested in its sub-aggregations.
    pub(crate) fn get_bucket_count(&self) -> u64 {
        let nested_buckets = self.sub_aggregation.get_bucket_count();
        nested_buckets + 1
    }
}


================================================
FILE: src/aggregation/agg_tests.rs
================================================
use serde_json::Value;

use crate::aggregation::agg_req::{Aggregation, Aggregations};
use crate::aggregation::agg_result::AggregationResults;
use crate::aggregation::collector::AggregationCollector;
use crate::aggregation::intermediate_agg_result::IntermediateAggregationResults;
use crate::aggregation::tests::{get_test_index_2_segments, get_test_index_from_values_and_terms};
use crate::aggregation::DistributedAggregationCollector;
use crate::docset::COLLECT_BLOCK_BUFFER_LEN;
use crate::query::{AllQuery, TermQuery};
use crate::schema::{IndexRecordOption, Schema, FAST};
use crate::{Index, IndexWriter, Term};

// The following tests ensure that each bucket aggregation type correctly functions as a
// sub-aggregation of another bucket aggregation in two scenarios:
// 1) The parent has more buckets than the child sub-aggregation
// 2) The child sub-aggregation has more buckets than the parent
//
// These scenarios exercise the bucket id mapping and sub-aggregation routing logic.

/// Runs a `terms` aggregation as a sub-aggregation, once under a parent with more buckets
/// than the child (a `range` parent) and once under a parent with fewer buckets than the
/// child (a single-bucket `histogram` parent), and checks the exact JSON output.
#[test]
fn test_terms_as_subagg_parent_more_vs_child_more() -> crate::Result<()> {
    let index = get_test_index_2_segments(false)?;

    // Case A: parent has more buckets than child
    // Parent: range with 4 buckets
    // Child: terms on text -> at most 2 buckets (cool/nohit) per parent bucket
    let agg_parent_more: Aggregations = serde_json::from_value(json!({
        "parent_range": {
            "range": {
                "field": "score",
                "ranges": [
                    {"to": 3.0},
                    {"from": 3.0, "to": 7.0},
                    {"from": 7.0, "to": 20.0},
                    {"from": 20.0}
                ]
            },
            "aggs": {
                "child_terms": {"terms": {"field": "text", "order": {"_key": "asc"}}}
            }
        }
    }))
    .unwrap();

    let res = crate::aggregation::tests::exec_request(agg_parent_more, &index)?;
    // Exact expected structure and counts
    assert_eq!(
        res["parent_range"]["buckets"],
        json!([
            {
                "key": "*-3",
                "doc_count": 1,
                "to": 3.0,
                "child_terms": {
                    "buckets": [
                        {"doc_count": 1, "key": "cool"}
                    ],
                    "sum_other_doc_count": 0
                }
            },
            {
                "key": "3-7",
                "doc_count": 3,
                "from": 3.0,
                "to": 7.0,
                "child_terms": {
                    "buckets": [
                        {"doc_count": 2, "key": "cool"},
                        {"doc_count": 1, "key": "nohit"}
                    ],
                    "sum_other_doc_count": 0
                }
            },
            {
                "key": "7-20",
                "doc_count": 3,
                "from": 7.0,
                "to": 20.0,
                "child_terms": {
                    "buckets": [
                        {"doc_count": 3, "key": "cool"}
                    ],
                    "sum_other_doc_count": 0
                }
            },
            {
                "key": "20-*",
                "doc_count": 2,
                "from": 20.0,
                "child_terms": {
                    "buckets": [
                        {"doc_count": 1, "key": "cool"},
                        {"doc_count": 1, "key": "nohit"}
                    ],
                    "sum_other_doc_count": 0
                }
            }
        ])
    );

    // Case B: child has more buckets than parent
    // Parent: histogram on score with large interval -> 1 bucket
    // Child: terms on text -> 2 buckets (cool/nohit)
    let agg_child_more: Aggregations = serde_json::from_value(json!({
        "parent_hist": {
            "histogram": {"field": "score", "interval": 100.0},
            "aggs": {
                "child_terms": {"terms": {"field": "text", "order": {"_key": "asc"}}}
            }
        }
    }))
    .unwrap();

    let res = crate::aggregation::tests::exec_request(agg_child_more, &index)?;
    // The single parent bucket holds all 9 documents, split 7/2 between the two terms.
    assert_eq!(
        res["parent_hist"],
        json!({
            "buckets": [
                {
                    "key": 0.0,
                    "doc_count": 9,
                    "child_terms": {
                        "buckets": [
                            {"doc_count": 7, "key": "cool"},
                            {"doc_count": 2, "key": "nohit"}
                        ],
                        "sum_other_doc_count": 0
                    }
                }
            ]
        })
    );

    Ok(())
}

/// Runs a `range` aggregation as a sub-aggregation, once under a parent with more buckets
/// than the child (a finer `range` parent) and once under a parent with fewer buckets than
/// the child (a two-bucket `terms` parent), and checks the exact JSON output.
#[test]
fn test_range_as_subagg_parent_more_vs_child_more() -> crate::Result<()> {
    let index = get_test_index_2_segments(false)?;

    // Case A: parent has more buckets than child
    // Parent: range with 5 buckets
    // Child: coarse range with 3 buckets (two declared ranges; the expected result below
    // also contains an open-ended "20-*" bucket)
    let agg_parent_more: Aggregations = serde_json::from_value(json!({
        "parent_range": {
            "range": {
                "field": "score",
                "ranges": [
                    {"to": 3.0},
                    {"from": 3.0, "to": 7.0},
                    {"from": 7.0, "to": 11.0},
                    {"from": 11.0, "to": 20.0},
                    {"from": 20.0}
                ]
            },
            "aggs": {
                "child_range": {
                    "range": {
                        "field": "score",
                        "ranges": [
                            {"to": 3.0},
                            {"from": 3.0, "to": 20.0}
                        ]
                    }
                }
            }
        }
    }))
    .unwrap();
    let res = crate::aggregation::tests::exec_request(agg_parent_more, &index)?;
    // Every parent bucket lists all three child buckets, including those with a zero count.
    assert_eq!(
        res["parent_range"]["buckets"],
        json!([
            {"key": "*-3", "doc_count": 1, "to": 3.0,
                "child_range": {"buckets": [
                    {"key": "*-3", "doc_count": 1, "to": 3.0},
                    {"key": "3-20", "doc_count": 0, "from": 3.0, "to": 20.0},
                    {"key": "20-*", "doc_count": 0, "from": 20.0}
                ]}
            },
            {"key": "3-7", "doc_count": 3, "from": 3.0, "to": 7.0,
                "child_range": {"buckets": [
                    {"key": "*-3", "doc_count": 0, "to": 3.0},
                    {"key": "3-20", "doc_count": 3, "from": 3.0, "to": 20.0},
                    {"key": "20-*", "doc_count": 0, "from": 20.0}
                ]}
            },
            {"key": "7-11", "doc_count": 1, "from": 7.0, "to": 11.0,
                "child_range": {"buckets": [
                    {"key": "*-3", "doc_count": 0, "to": 3.0},
                    {"key": "3-20", "doc_count": 1, "from": 3.0, "to": 20.0},
                    {"key": "20-*", "doc_count": 0, "from": 20.0}
                ]}
            },
            {"key": "11-20", "doc_count": 2, "from": 11.0, "to": 20.0,
                "child_range": {"buckets": [
                    {"key": "*-3", "doc_count": 0, "to": 3.0},
                    {"key": "3-20", "doc_count": 2, "from": 3.0, "to": 20.0},
                    {"key": "20-*", "doc_count": 0, "from": 20.0}
                ]}
            },
            {"key": "20-*", "doc_count": 2, "from": 20.0,
                "child_range": {"buckets": [
                    {"key": "*-3", "doc_count": 0, "to": 3.0},
                    {"key": "3-20", "doc_count": 0, "from": 3.0, "to": 20.0},
                    {"key": "20-*", "doc_count": 2, "from": 20.0}
                ]}
            }
        ])
    );

    // Case B: child has more buckets than parent
    // Parent: terms on text (2 buckets)
    // Child: range with 4 buckets (three declared ranges; the expected result below also
    // contains an open-ended "20-*" bucket)
    let agg_child_more: Aggregations = serde_json::from_value(json!({
        "parent_terms": {
            "terms": {"field": "text"},
            "aggs": {
                "child_range": {
                    "range": {
                        "field": "score",
                        "ranges": [
                            {"to": 3.0},
                            {"from": 3.0, "to": 7.0},
                            {"from": 7.0, "to": 20.0}
                        ]
                    }
                }
            }
        }
    }))
    .unwrap();
    let res = crate::aggregation::tests::exec_request(agg_child_more, &index)?;

    assert_eq!(
        res["parent_terms"],
        json!({
            "buckets": [
                {
                    "key": "cool",
                    "doc_count": 7,
                    "child_range": {
                        "buckets": [
                            {"key": "*-3", "doc_count": 1, "to": 3.0},
                            {"key": "3-7", "doc_count": 2, "from": 3.0, "to": 7.0},
                            {"key": "7-20", "doc_count": 3, "from": 7.0, "to": 20.0},
                            {"key": "20-*", "doc_count": 1, "from": 20.0}
                        ]
                    }
                },
                {
                    "key": "nohit",
                    "doc_count": 2,
                    "child_range": {
                        "buckets": [
                            {"key": "*-3", "doc_count": 0, "to": 3.0},
                            {"key": "3-7", "doc_count": 1, "from": 3.0, "to": 7.0},
                            {"key": "7-20", "doc_count": 0, "from": 7.0, "to": 20.0},
                            {"key": "20-*", "doc_count": 1, "from": 20.0}
                        ]
                    }
                }
            ],
            "doc_count_error_upper_bound": 0,
            "sum_other_doc_count": 0
        })
    );

    Ok(())
}

/// Exercises a histogram sub-aggregation in two shapes: under a range parent that has more
/// buckets than the child, and under a terms parent that has fewer buckets than the child.
#[test]
fn test_histogram_as_subagg_parent_more_vs_child_more() -> crate::Result<()> {
    let index = get_test_index_2_segments(false)?;

    // Scenario A: five parent range buckets; with an interval of 100 the child histogram
    // is expected to return a single bucket (key 0.0) per parent bucket.
    let range_parent_req: Aggregations = serde_json::from_value(json!({
        "parent_range": {
            "range": {
                "field": "score",
                "ranges": [
                    {"to": 3.0},
                    {"from": 3.0, "to": 7.0},
                    {"from": 7.0, "to": 11.0},
                    {"from": 11.0, "to": 20.0},
                    {"from": 20.0}
                ]
            },
            "aggs": {
                "child_hist": {
                    "histogram": {"field": "score", "interval": 100.0}
                }
            }
        }
    }))
    .unwrap();
    let range_parent_res = crate::aggregation::tests::exec_request(range_parent_req, &index)?;

    // Every child result has the same shape, only the document count varies.
    let single_hist_bucket =
        |doc_count: u64| json!({"buckets": [{"key": 0.0, "doc_count": doc_count}]});
    let expected_range_buckets = json!([
        {"key": "*-3", "doc_count": 1, "to": 3.0, "child_hist": single_hist_bucket(1)},
        {"key": "3-7", "doc_count": 3, "from": 3.0, "to": 7.0, "child_hist": single_hist_bucket(3)},
        {"key": "7-11", "doc_count": 1, "from": 7.0, "to": 11.0, "child_hist": single_hist_bucket(1)},
        {"key": "11-20", "doc_count": 2, "from": 11.0, "to": 20.0, "child_hist": single_hist_bucket(2)},
        {"key": "20-*", "doc_count": 2, "from": 20.0, "child_hist": single_hist_bucket(2)}
    ]);
    assert_eq!(
        range_parent_res["parent_range"]["buckets"],
        expected_range_buckets
    );

    // Scenario B: two parent term buckets; with an interval of 10 the child histogram
    // returns several buckets per parent, including empty ones.
    let terms_parent_req: Aggregations = serde_json::from_value(json!({
        "parent_terms": {
            "terms": {"field": "text"},
            "aggs": {
                "child_hist": {
                    "histogram": {"field": "score", "interval": 10.0}
                }
            }
        }
    }))
    .unwrap();
    let terms_parent_res = crate::aggregation::tests::exec_request(terms_parent_req, &index)?;

    let expected_terms = json!({
        "buckets": [
            {
                "key": "cool",
                "doc_count": 7,
                "child_hist": {
                    "buckets": [
                        {"key": 0.0, "doc_count": 4},
                        {"key": 10.0, "doc_count": 2},
                        {"key": 20.0, "doc_count": 0},
                        {"key": 30.0, "doc_count": 0},
                        {"key": 40.0, "doc_count": 1}
                    ]
                }
            },
            {
                "key": "nohit",
                "doc_count": 2,
                "child_hist": {
                    "buckets": [
                        {"key": 0.0, "doc_count": 1},
                        {"key": 10.0, "doc_count": 0},
                        {"key": 20.0, "doc_count": 0},
                        {"key": 30.0, "doc_count": 0},
                        {"key": 40.0, "doc_count": 1}
                    ]
                }
            }
        ],
        "doc_count_error_upper_bound": 0,
        "sum_other_doc_count": 0
    });
    assert_eq!(terms_parent_res["parent_terms"], expected_terms);

    Ok(())
}

/// Exercises a date_histogram sub-aggregation both under a range parent (more parent
/// buckets than child buckets) and under a terms parent (more child buckets than parent
/// buckets).
#[test]
fn test_date_histogram_as_subagg_parent_more_vs_child_more() -> crate::Result<()> {
    let index = get_test_index_2_segments(false)?;

    // Scenario A: range parent with five ranges and a 30d child interval.
    let range_parent_req: Aggregations = serde_json::from_value(json!({
        "parent_range": {
            "range": {
                "field": "score",
                "ranges": [
                    {"to": 3.0},
                    {"from": 3.0, "to": 7.0},
                    {"from": 7.0, "to": 11.0},
                    {"from": 11.0, "to": 20.0},
                    {"from": 20.0}
                ]
            },
            "aggs": {
                "child_date_hist": {
                    "date_histogram": {"field": "date", "fixed_interval": "30d"}
                }
            }
        }
    }))
    .unwrap();
    let range_parent_res = crate::aggregation::tests::exec_request(range_parent_req, &index)?;
    // Each parent bucket must hold exactly one date bucket carrying the parent's doc_count.
    for parent_bucket in range_parent_res["parent_range"]["buckets"]
        .as_array()
        .unwrap()
    {
        let expected_count = parent_bucket["doc_count"].as_u64().unwrap();
        let date_buckets = parent_bucket["child_date_hist"]["buckets"]
            .as_array()
            .unwrap();
        assert_eq!(date_buckets.len(), 1);
        assert_eq!(date_buckets[0]["doc_count"], expected_count);
    }

    // Scenario B: terms parent (two buckets) and a 1d child interval, which produces
    // several date buckets per term.
    let terms_parent_req: Aggregations = serde_json::from_value(json!({
        "parent_terms": {
            "terms": {"field": "text"},
            "aggs": {
                "child_date_hist": {
                    "date_histogram": {"field": "date", "fixed_interval": "1d"}
                }
            }
        }
    }))
    .unwrap();
    let terms_parent_res = crate::aggregation::tests::exec_request(terms_parent_req, &index)?;
    let term_buckets = terms_parent_res["parent_terms"]["buckets"]
        .as_array()
        .unwrap();

    // "cool": three consecutive daily buckets.
    assert_eq!(term_buckets[0]["key"], "cool");
    let cool_counts: Vec<u64> = term_buckets[0]["child_date_hist"]["buckets"]
        .as_array()
        .unwrap()
        .iter()
        .map(|date_bucket| date_bucket["doc_count"].as_u64().unwrap())
        .collect();
    assert_eq!(cool_counts, vec![1, 4, 2]);

    // "nohit": two daily buckets.
    assert_eq!(term_buckets[1]["key"], "nohit");
    let nohit_counts: Vec<u64> = term_buckets[1]["child_date_hist"]["buckets"]
        .as_array()
        .unwrap()
        .iter()
        .map(|date_bucket| date_bucket["doc_count"].as_u64().unwrap())
        .collect();
    assert_eq!(nohit_counts, vec![1, 1]);

    Ok(())
}

/// Builds an `avg` aggregation request targeting `field_name`.
///
/// Panics if the generated JSON cannot be deserialized into an [`Aggregation`].
fn get_avg_req(field_name: &str) -> Aggregation {
    let request = json!({ "avg": { "field": field_name } });
    serde_json::from_value(request).unwrap()
}

/// Creates an [`AggregationCollector`] for `agg_req`, passing the default value for the
/// second argument of `from_aggs`.
fn get_collector(agg_req: Aggregations) -> AggregationCollector {
    let default_params = Default::default();
    AggregationCollector::from_aggs(agg_req, default_params)
}

// *** EVERY BUCKET-TYPE SHOULD BE TESTED HERE ***
// Note: The flushing part of these tests is outdated, since the buffering changed after
// converting the collection into one collector per request instead of one per bucket.
//
// However, they are still useful as they exercise complex aggregation requests.
/// Runs a request mixing range, terms, histogram, top_hits and cardinality aggregations
/// over 80 documents and checks the range, terms and cardinality results.
///
/// `merge_segments` is forwarded to the index builder; `use_distributed_collector` switches
/// to the distributed collector, whose intermediate result is additionally round-tripped
/// through postcard before being finalized.
fn test_aggregation_flushing(
    merge_segments: bool,
    use_distributed_collector: bool,
) -> crate::Result<()> {
    // One (score, term) pair per document: scores 0..80, all "terma" except the last one.
    let mut values_and_terms: Vec<_> = (0..80)
        .map(|score| vec![(score as f64, "terma".to_string())])
        .collect();
    values_and_terms.last_mut().unwrap()[0].1 = "termb".to_string();
    let index = get_test_index_from_values_and_terms(merge_segments, &values_and_terms)?;

    let reader = index.reader()?;
    let searcher = reader.searcher();

    // The bucket boundaries below were chosen relative to a block buffer of 64 documents:
    // the first level was meant to see one full block plus leftover docs (range 3-70),
    // the second level only leftover docs, and the last first-level bucket a block that
    // never fills up.
    assert_eq!(COLLECT_BLOCK_BUFFER_LEN, 64);

    let request_json = json!(
    {
    "bucketsL1": {
        "range": {
            "field": "score",
            "ranges": [ { "to": 3.0f64 }, { "from": 3.0f64, "to": 70.0f64 }, { "from": 70.0f64 } ]
        },
        "aggs": {
            "bucketsL2": {
                "range": {
                    "field": "score",
                    "ranges": [ { "to": 30.0f64 }, { "from": 30.0f64, "to": 70.0f64 }, { "from": 70.0f64 } ]
                }
            }
        }
    },
    "top_hits_test":{
        "terms": {
            "field": "string_id"
        },
        "aggs": {
            "bucketsL2": {
                "top_hits": {
                    "size": 2,
                    "sort": [
                        { "score": "asc" }
                    ],
                    "docvalue_fields": ["score"]
                }
            }
        }
    },
    "histogram_test":{
        "histogram": {
            "field": "score",
            "interval":  70.0,
            "offset": 3.0
        },
        "aggs": {
            "bucketsL2": {
                "histogram": {
                    "field": "score",
                    "interval":  70.0
                }
            }
        }
    },
    "term_agg_test":{
        "terms": {
            "field": "string_id"
        },
        "aggs": {
            "bucketsL2": {
                "histogram": {
                    "field": "score",
                    "interval":  70.0
                }
            }
        }
    },
    "cardinality_string_id":{
        "cardinality": {
            "field": "string_id"
        }
    },
    "cardinality_score":{
        "cardinality": {
            "field": "score"
        }
    }
    });

    // Go through the textual JSON representation, like an external request would.
    let request_text = serde_json::to_string(&request_json).unwrap();
    let agg_req: Aggregations = serde_json::from_str(&request_text).unwrap();

    let agg_res: AggregationResults = if use_distributed_collector {
        let distributed_collector =
            DistributedAggregationCollector::from_aggs(agg_req.clone(), Default::default());
        let intermediate = searcher
            .search(&AllQuery, &distributed_collector)
            .unwrap();

        // The intermediate result has to survive a postcard round trip.
        let encoded = postcard::to_allocvec(&intermediate).expect(
            "Postcard Serialization failed, flatten etc. is not supported in the intermediate \
             result",
        );
        let decoded: IntermediateAggregationResults =
            postcard::from_bytes(&encoded).expect("Post deserialization failed");

        decoded
            .into_final_result(agg_req, Default::default())
            .unwrap()
    } else {
        searcher
            .search(&AllQuery, &get_collector(agg_req))
            .unwrap()
    };

    let res: Value = serde_json::from_str(&serde_json::to_string(&agg_res)?)?;

    // Two-level range aggregation.
    let l1_buckets = &res["bucketsL1"]["buckets"];
    assert_eq!(l1_buckets[0]["doc_count"], 3);
    assert_eq!(l1_buckets[0]["bucketsL2"]["buckets"][0]["doc_count"], 3);

    assert_eq!(l1_buckets[1]["key"], "3-70");
    assert_eq!(l1_buckets[1]["doc_count"], 70 - 3);
    let l2_of_middle = &l1_buckets[1]["bucketsL2"]["buckets"];
    assert_eq!(l2_of_middle[0]["doc_count"], 27);
    assert_eq!(l2_of_middle[1]["doc_count"], 40);
    assert_eq!(l2_of_middle[2]["doc_count"], 0);

    assert_eq!(
        l1_buckets[2]["bucketsL2"]["buckets"][2]["doc_count"],
        80 - 70
    );
    assert_eq!(l1_buckets[2]["doc_count"], 80 - 70);

    // Terms aggregation with a histogram child.
    let expected_term_agg = json!(
    {
        "buckets": [
          {
            "bucketsL2": {
              "buckets": [
                {
                  "doc_count": 70,
                  "key": 0.0
                },
                {
                  "doc_count": 9,
                  "key": 70.0
                }
              ]
            },
            "doc_count": 79,
            "key": "terma"
          },
          {
            "bucketsL2": {
              "buckets": [
                {
                  "doc_count": 1,
                  "key": 70.0
                }
              ]
            },
            "doc_count": 1,
            "key": "termb"
          }
        ],
        "doc_count_error_upper_bound": 0,
        "sum_other_doc_count": 0
    });
    assert_eq!(res["term_agg_test"], expected_term_agg);

    // Cardinality metrics.
    assert_eq!(res["cardinality_string_id"]["value"], 2.0);
    assert_eq!(res["cardinality_score"]["value"], 80.0);

    Ok(())
}

/// Runs `test_aggregation_flushing` for every combination of its two flags.
#[test]
fn test_aggregation_flushing_variants() {
    for merge_segments in [false, true] {
        for use_distributed_collector in [false, true] {
            test_aggregation_flushing(merge_segments, use_distributed_collector).unwrap();
        }
    }
}

/// Runs one `avg` and one `range` aggregation on `score` for documents matching the term
/// "cool" and checks both results.
#[test]
fn test_aggregation_level1_simple() -> crate::Result<()> {
    let index = get_test_index_2_segments(true)?;

    let reader = index.reader()?;
    let searcher = reader.searcher();
    let text_field = searcher.schema().get_field("text").unwrap();

    let cool_query = TermQuery::new(
        Term::from_field_text(text_field, "cool"),
        IndexRecordOption::Basic,
    );

    // Only two ranges are requested; the expected result below also contains the open-ended
    // buckets "*-3" and "20-*".
    let range_on = |field_name: &str| -> Aggregation {
        let request = json!({
            "range": {
                "field": field_name,
                "ranges": [ { "from": 3.0f64, "to": 7.0f64 }, { "from": 7.0f64, "to": 20.0f64 } ]
            }
        });
        serde_json::from_value(request).unwrap()
    };

    let named_aggs = vec![
        ("average".to_string(), get_avg_req("score")),
        ("range".to_string(), range_on("score")),
    ];
    let agg_req: Aggregations = named_aggs.into_iter().collect();

    let agg_res: AggregationResults = searcher
        .search(&cool_query, &get_collector(agg_req))
        .unwrap();

    let res: Value = serde_json::from_str(&serde_json::to_string(&agg_res)?)?;
    assert_eq!(res["average"]["value"], 12.142857142857142);

    let expected_buckets = json!([
        { "key": "*-3", "doc_count": 1, "to": 3.0 },
        { "key": "3-7", "doc_count": 2, "from": 3.0, "to": 7.0 },
        { "key": "7-20", "doc_count": 3, "from": 7.0, "to": 20.0 },
        { "key": "20-*", "doc_count": 1, "from": 20.0 }
    ]);
    assert_eq!(res["range"]["buckets"], expected_buckets);

    Ok(())
}

/// Runs `avg` and `range` aggregations on the `score`, `score_f64` and `score_i64` fields
/// for documents matching the term "cool", then checks the three averages and the range
/// buckets computed on `score`.
#[test]
fn test_aggregation_level1() -> crate::Result<()> {
    let index = get_test_index_2_segments(true)?;

    let reader = index.reader()?;
    let searcher = reader.searcher();
    let text_field = searcher.schema().get_field("text").unwrap();

    let cool_query = TermQuery::new(
        Term::from_field_text(text_field, "cool"),
        IndexRecordOption::Basic,
    );

    // Same two ranges for every field.
    let range_on = |field_name: &str| -> Aggregation {
        let request = json!({
            "range": {
                "field": field_name,
                "ranges": [ { "from": 3.0f64, "to": 7.0f64 }, { "from": 7.0f64, "to": 20.0f64 } ]
            }
        });
        serde_json::from_value(request).unwrap()
    };

    let named_aggs = vec![
        ("average_i64".to_string(), get_avg_req("score_i64")),
        ("average_f64".to_string(), get_avg_req("score_f64")),
        ("average".to_string(), get_avg_req("score")),
        ("range".to_string(), range_on("score")),
        ("rangef64".to_string(), range_on("score_f64")),
        ("rangei64".to_string(), range_on("score_i64")),
    ];
    let agg_req: Aggregations = named_aggs.into_iter().collect();

    let agg_res: AggregationResults = searcher
        .search(&cool_query, &get_collector(agg_req))
        .unwrap();

    let res: Value = serde_json::from_str(&serde_json::to_string(&agg_res)?)?;
    assert_eq!(res["average"]["value"], 12.142857142857142);
    assert_eq!(res["average_f64"]["value"], 12.214285714285714);
    assert_eq!(res["average_i64"]["value"], 12.142857142857142);

    let expected_buckets = json!([
        { "key": "*-3", "doc_count": 1, "to": 3.0 },
        { "key": "3-7", "doc_count": 2, "from": 3.0, "to": 7.0 },
        { "key": "7-20", "doc_count": 3, "from": 7.0, "to": 20.0 },
        { "key": "20-*", "doc_count": 1, "from": 20.0 }
    ]);
    assert_eq!(res["range"]["buckets"], expected_buckets);

    Ok(())
}

/// Runs a two-level request (range buckets with `avg` and `terms` children) on the
/// `score`, `score_f64` and `score_i64` fields for documents matching the term "cool", and
/// checks that the three field types produce consistent results.
///
/// `merge_segments` is forwarded to the index builder. When `use_distributed_collector` is
/// set, the request goes through `DistributedAggregationCollector` and the intermediate
/// result is converted with `into_final_result`; otherwise the regular collector is used.
/// Finally the same request is executed with a query matching no document, which only has
/// to succeed.
fn test_aggregation_level2(
    merge_segments: bool,
    use_distributed_collector: bool,
) -> crate::Result<()> {
    let index = get_test_index_2_segments(merge_segments)?;

    let reader = index.reader()?;
    let text_field = reader.searcher().schema().get_field("text").unwrap();

    let term_query = TermQuery::new(
        Term::from_field_text(text_field, "cool"),
        IndexRecordOption::Basic,
    );

    let query_with_no_hits = TermQuery::new(
        Term::from_field_text(text_field, "thistermdoesnotexist"),
        IndexRecordOption::Basic,
    );

    let elasticsearch_compatible_json_req = r#"
{
  "rangef64": {
    "range": {
      "field": "score_f64",
      "ranges": [
        { "to": 3.0 },
        { "from": 3.0, "to": 7.0 },
        { "from": 7.0, "to": 19.0 },
        { "from": 19.0, "to": 20.0 },
        { "from": 20.0 }
      ]
    },
    "aggs": {
      "average_in_range": { "avg": { "field": "score" } },
      "term_agg": { "terms": { "field": "text" } }
    }
  },
  "rangei64": {
    "range": {
      "field": "score_i64",
      "ranges": [
        { "to": 3.0 },
        { "from": 3.0, "to": 7.0 },
        { "from": 7.0, "to": 19.0 },
        { "from": 19.0, "to": 20.0 },
        { "from": 20.0 }
      ]
    },
    "aggs": {
      "average_in_range": { "avg": { "field": "score" } },
      "term_agg": { "terms": { "field": "text" } }
    }
  },
  "average": {
    "avg": { "field": "score" }
  },
  "range": {
    "range": {
      "field": "score",
      "ranges": [
        { "to": 3.0 },
        { "from": 3.0, "to": 7.0 },
        { "from": 7.0, "to": 19.0 },
        { "from": 19.0, "to": 20.0 },
        { "from": 20.0 }
      ]
    },
    "aggs": {
      "average_in_range": { "avg": { "field": "score" } },
      "term_agg": { "terms": { "field": "text" } }
    }
  }
}
"#;
    let agg_req: Aggregations = serde_json::from_str(elasticsearch_compatible_json_req).unwrap();

    let agg_res: AggregationResults = if use_distributed_collector {
        let collector =
            DistributedAggregationCollector::from_aggs(agg_req.clone(), Default::default());

        let searcher = reader.searcher();
        let res = searcher.search(&term_query, &collector).unwrap();
        res.into_final_result(agg_req.clone(), Default::default())
            .unwrap()
    } else {
        let collector = get_collector(agg_req.clone());

        let searcher = reader.searcher();
        searcher.search(&term_query, &collector).unwrap()
    };

    let res: Value = serde_json::from_str(&serde_json::to_string(&agg_res)?)?;

    // Bucket 1: "3-7".
    assert_eq!(res["range"]["buckets"][1]["key"], "3-7");
    assert_eq!(res["range"]["buckets"][1]["doc_count"], 2u64);
    assert_eq!(res["rangef64"]["buckets"][1]["doc_count"], 2u64);
    assert_eq!(res["rangei64"]["buckets"][1]["doc_count"], 2u64);

    // Bucket 2: "7-19".
    assert_eq!(res["average"]["value"], 12.142857142857142f64);
    assert_eq!(res["range"]["buckets"][2]["key"], "7-19");
    assert_eq!(res["range"]["buckets"][2]["doc_count"], 3u64);
    assert_eq!(res["rangef64"]["buckets"][2]["doc_count"], 3u64);
    assert_eq!(res["rangei64"]["buckets"][2]["doc_count"], 3u64);
    // Five ranges were requested, so there is no sixth bucket.
    assert_eq!(res["rangei64"]["buckets"][5], serde_json::Value::Null);

    // Bucket 4: "20-*".
    assert_eq!(res["range"]["buckets"][4]["key"], "20-*");
    assert_eq!(res["range"]["buckets"][4]["doc_count"], 1u64);
    assert_eq!(res["rangef64"]["buckets"][4]["doc_count"], 1u64);
    assert_eq!(res["rangei64"]["buckets"][4]["doc_count"], 1u64);

    // Bucket 3: "19-20" is empty.
    assert_eq!(res["range"]["buckets"][3]["key"], "19-20");
    assert_eq!(res["range"]["buckets"][3]["doc_count"], 0u64);
    assert_eq!(res["rangef64"]["buckets"][3]["doc_count"], 0u64);
    assert_eq!(res["rangei64"]["buckets"][3]["doc_count"], 0u64);

    // An average over an empty bucket is serialized as null.
    assert_eq!(
        res["range"]["buckets"][3]["average_in_range"]["value"],
        serde_json::Value::Null
    );

    assert_eq!(
        res["range"]["buckets"][4]["average_in_range"]["value"],
        44.0f64
    );
    assert_eq!(
        res["rangef64"]["buckets"][4]["average_in_range"]["value"],
        44.0f64
    );
    assert_eq!(
        res["rangei64"]["buckets"][4]["average_in_range"]["value"],
        44.0f64
    );

    // The "7-19" bucket must yield the same average regardless of the field type used for
    // bucketing. Buckets live in the `buckets` array (index 2 is "7-19", see above);
    // indexing the aggregation object by the bucket key would return `Null` on both sides
    // and make the comparison vacuous, hence the explicit `is_number` guard.
    let avg_7_19 = &res["range"]["buckets"][2]["average_in_range"]["value"];
    assert!(
        avg_7_19.is_number(),
        "expected a numeric average for bucket 7-19, got {avg_7_19:?}"
    );
    assert_eq!(
        avg_7_19,
        &res["rangef64"]["buckets"][2]["average_in_range"]["value"]
    );
    assert_eq!(
        avg_7_19,
        &res["rangei64"]["buckets"][2]["average_in_range"]["value"]
    );

    // Test empty result set
    let collector = get_collector(agg_req);
    let searcher = reader.searcher();
    searcher.search(&query_with_no_hits, &collector).unwrap();

    Ok(())
}

/// Two-level aggregation without segment merging, using the regular collector.
#[test]
fn test_aggregation_level2_multi_segments() -> crate::Result<()> {
    let (merge_segments, use_distributed_collector) = (false, false);
    test_aggregation_level2(merge_segments, use_distributed_collector)
}

/// Two-level aggregation with segment merging, using the regular collector.
#[test]
fn test_aggregation_level2_single_segment() -> crate::Result<()> {
    let (merge_segments, use_distributed_collector) = (true, false);
    test_aggregation_level2(merge_segments, use_distributed_collector)
}

/// Two-level aggregation without segment merging, using the distributed collector.
#[test]
fn test_aggregation_level2_multi_segments_distributed_collector() -> crate::Result<()> {
    let (merge_segments, use_distributed_collector) = (false, true);
    test_aggregation_level2(merge_segments, use_distributed_collector)
}

/// Two-level aggregation with segment merging, using the distributed collector.
#[test]
fn test_aggregation_level2_single_segment_distributed_collector() -> crate::Result<()> {
    let (merge_segments, use_distributed_collector) = (true, true);
    test_aggregation_level2(merge_segments, use_distributed_collector)
}

/// Checks the errors reported for invalid requests: an `avg` on a field that is not a fast
/// field, a request with a misspelled `field` key, and an unknown aggregation type.
#[test]
fn test_aggregation_invalid_requests() -> crate::Result<()> {
    let index = get_test_index_2_segments(false)?;

    let reader = index.reader()?;

    // Runs an `avg` aggregation on the given field over all documents and hands back the
    // raw search result so the caller can inspect the error.
    let search_avg_on = |field_name: &str| {
        let avg_req: Aggregations = serde_json::from_value(json!({
            "average": {
                "avg": {
                    "field": field_name
                }
            }
        }))
        .unwrap();

        reader
            .searcher()
            .search(&AllQuery, &get_collector(avg_req))
    };

    // Field exists but is not a fast field.
    let not_fast_err = search_avg_on("dummy_text").unwrap_err();
    assert_eq!(
        format!("{not_fast_err:?}"),
        r#"InvalidArgument("Field \"dummy_text\" is not configured as fast field")"#
    );

    // Misspelled "field" key: rejected at deserialization time.
    let misspelled_key: Result<Aggregations, serde_json::Error> = serde_json::from_value(json!({
        "average": {
            "avg": {
                "fieldd": "a"
            }
        }
    }));
    assert!(misspelled_key.is_err());
    assert_eq!(
        misspelled_key.unwrap_err().to_string(),
        "missing field `field`"
    );

    // Unknown aggregation type: rejected at deserialization time.
    let unknown_agg: Result<Aggregations, serde_json::Error> = serde_json::from_value(json!({
        "average": {
            "doesnotmatchanyagg": {
                "field": "a"
            }
        }
    }));
    assert!(unknown_agg.is_err());
    // TODO: This should list valid values
    let unknown_agg_msg = unknown_agg.unwrap_err().to_string();
    assert!(unknown_agg_msg.contains("unknown variant `doesnotmatchanyagg`, expected one of"));

    // TODO: This should return an error
    // let agg_res = avg_on_field("not_exist_field").unwrap_err();
    // assert_eq!(
    // format!("{:?}", agg_res),
    // r#"InvalidArgument("No fast field found for field: not_exist_field")"#
    //);

    // TODO: This should return an error
    // let agg_res = avg_on_field("ip_addr").unwrap_err();
    // assert_eq!(
    // format!("{:?}", agg_res),
    // r#"InvalidArgument("No fast field found for field: ip_addr")"#
    //);

    Ok(())
}

/// Runs a terms aggregation on a key (`json.color`) of a fast JSON field and checks the
/// resulting buckets.
#[test]
fn test_aggregation_on_json_object() {
    let mut schema_builder = Schema::builder();
    let json = schema_builder.add_json_field("json", FAST);
    let index = Index::create_in_ram(schema_builder.build());

    let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
    // Two "red" documents and one "blue" document in a single commit.
    for color in ["red", "red", "blue"] {
        index_writer
            .add_document(doc!(json => json!({"color": color})))
            .unwrap();
    }
    index_writer.commit().unwrap();

    let searcher = index.reader().unwrap().searcher();

    let color_terms_req: Aggregations = serde_json::from_value(json!({
        "jsonagg": {
            "terms": {
                "field": "json.color"
            }
        }
    }))
    .unwrap();

    let agg_results = searcher
        .search(&AllQuery, &get_collector(color_terms_req))
        .unwrap();
    let actual = serde_json::to_value(agg_results).unwrap();

    let expected = json!({
        "jsonagg": {
            "buckets": [
                {"doc_count": 2, "key": "red"},
                {"doc_count": 1, "key": "blue"}
            ],
            "doc_count_error_upper_bound": 0,
            "sum_other_doc_count": 0
        }
    });
    assert_eq!(actual, expected);
}

/// Runs terms aggregations on a JSON field whose own name contains a dot (`json.blub`),
/// once on a key containing a dot (`color.dot`) and once on a nested path (`color.nested`).
/// Literal dots are escaped with a backslash in the requested field paths.
#[test]
fn test_aggregation_on_nested_json_object() {
    let mut schema_builder = Schema::builder();
    let json = schema_builder.add_json_field("json.blub", FAST);
    let index = Index::create_in_ram(schema_builder.build());

    let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
    // Each document stores the same colour under the dotted key and under the nested path.
    for color in ["red", "blue", "blue"] {
        index_writer
            .add_document(doc!(json => json!({"color.dot": color, "color": {"nested": color}})))
            .unwrap();
    }
    index_writer.commit().unwrap();

    let searcher = index.reader().unwrap().searcher();

    let nested_terms_req: Aggregations = serde_json::from_value(json!({
        "jsonagg1": {
            "terms": {
                "field": "json\\.blub.color\\.dot"
            }
        },
        "jsonagg2": {
            "terms": {
                "field": "json\\.blub.color.nested"
            }
        }
    }))
    .unwrap();

    let agg_results = searcher
        .search(&AllQuery, &get_collector(nested_terms_req))
        .unwrap();
    let actual = serde_json::to_value(agg_results).unwrap();

    let expected = json!({
        "jsonagg1": {
            "buckets": [
                {"doc_count": 2, "key": "blue"},
                {"doc_count": 1, "key": "red"}
            ],
            "doc_count_error_upper_bound": 0,
            "sum_other_doc_count": 0
        },
        "jsonagg2": {
            "buckets": [
                {"doc_count": 2, "key": "blue"},
                {"doc_count": 1, "key": "red"}
            ],
            "doc_count_error_upper_bound": 0,
            "sum_other_doc_count": 0
        }
    });
    assert_eq!(actual, expected);
}

/// Runs terms aggregations on a fast JSON field across three commits, two of which lack one
/// of the accessed keys (`color` or `price`): first a plain terms aggregation, then a terms
/// aggregation ordered by a `min` sub-aggregation.
#[test]
fn test_aggregation_on_json_object_empty_columns() {
    let mut schema_builder = Schema::builder();
    let json = schema_builder.add_json_field("json", FAST);
    let index = Index::create_in_ram(schema_builder.build());
    let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();

    // First commit: no "color" key, so accessing color yields an empty column.
    index_writer
        .add_document(doc!(json => json!({"price": 10.0})))
        .unwrap();
    index_writer.commit().unwrap();

    // Second commit: no "price" key, so accessing price yields an empty column.
    index_writer
        .add_document(doc!(json => json!({"color": "blue"})))
        .unwrap();
    index_writer.commit().unwrap();

    // Third commit: both keys present (2x red at 10.0, 3x green at 20.0).
    for _ in 0..2 {
        index_writer
            .add_document(doc!(json => json!({"color": "red", "price": 10.0})))
            .unwrap();
    }
    for _ in 0..3 {
        index_writer
            .add_document(doc!(json => json!({"color": "green", "price": 20.0})))
            .unwrap();
    }
    index_writer.commit().unwrap();

    let searcher = index.reader().unwrap().searcher();

    // Plain terms aggregation on the colour.
    let color_terms_req: Aggregations = serde_json::from_value(json!({
        "jsonagg": {
            "terms": {
                "field": "json.color"
            }
        }
    }))
    .unwrap();
    let color_terms_res = searcher
        .search(&AllQuery, &get_collector(color_terms_req))
        .unwrap();
    let expected_color_terms = json!({
        "jsonagg": {
            "buckets": [
                {"doc_count": 3, "key": "green"},
                {"doc_count": 2, "key": "red"},
                {"doc_count": 1, "key": "blue"}
            ],
            "doc_count_error_upper_bound": 0,
            "sum_other_doc_count": 0
        }
    });
    assert_eq!(
        serde_json::to_value(color_terms_res).unwrap(),
        expected_color_terms
    );

    // Terms aggregation ordered by the minimum price, descending.
    let agg_req_str = r#"
    {
      "jsonagg": {
        "aggs": {
          "min_price": { "min": { "field": "json.price" } }
        },
        "terms": {
          "field": "json.color",
          "order": { "min_price": "desc" }
        }
      }
    } "#;
    let ordered_terms_req: Aggregations = serde_json::from_str(agg_req_str).unwrap();
    let ordered_terms_res = searcher
        .search(&AllQuery, &get_collector(ordered_terms_req))
        .unwrap();
    // "blue" has no price at all, hence a null minimum; the expected response carries no
    // "doc_count_error_upper_bound" entry in this case.
    let expected_ordered_terms = json!({
        "jsonagg": {
            "buckets": [
                {
                    "key": "green",
                    "doc_count": 3,
                    "min_price": { "value": 20.0 }
                },
                {
                    "key": "red",
                    "doc_count": 2,
                    "min_price": { "value": 10.0 }
                },
                {
                    "key": "blue",
                    "doc_count": 1,
                    "min_price": { "value": null }
                }
            ],
            "sum_other_doc_count": 0
        }
    });
    assert_eq!(
        serde_json::to_value(ordered_terms_res).unwrap(),
        expected_ordered_terms
    );
}

#[test]
fn test_aggregation_on_json_object_mixed_types() {
    use pretty_assertions::assert_eq;

    let mut schema_builder = Schema::builder();
    let json_field = schema_builder.add_json_field("json", FAST);
    let index = Index::create_in_ram(schema_builder.build());
    let mut writer: IndexWriter = index.writer_for_tests().unwrap();

    // Segment 1: `mixed_type` is numeric in its only document.
    writer
        .add_document(doc!(json_field => json!({"mixed_type": 10.0, "mixed_price": 10.0})))
        .unwrap();
    writer.commit().unwrap();

    // Segment 2: `mixed_type` is text in all three documents.
    for _ in 0..3 {
        writer
            .add_document(doc!(json_field => json!({"mixed_type": "blue", "mixed_price": 5.0})))
            .unwrap();
    }
    writer.commit().unwrap();

    // Segment 3: `mixed_type` is boolean and `mixed_price` is text.
    writer
        .add_document(doc!(json_field => json!({"mixed_type": true, "mixed_price": "no_price"})))
        .unwrap();
    writer.commit().unwrap();

    // Segment 4: text, numeric and boolean values side by side.
    for _ in 0..2 {
        writer
            .add_document(doc!(json_field => json!({"mixed_type": "red", "mixed_price": 1.0})))
            .unwrap();
    }
    writer
        .add_document(doc!(json_field => json!({"mixed_type": -20.5, "mixed_price": -20.5})))
        .unwrap();
    writer
        .add_document(doc!(json_field => json!({"mixed_type": true, "mixed_price": "no_price"})))
        .unwrap();
    writer.commit().unwrap();

    // A terms aggregation ordered by a sub-metric, plus a range aggregation
    // with an average sub-metric, both over the mixed-type field.
    let agg_req_str = r#"
    {
        "termagg": {
            "terms": {
                "field": "json.mixed_type",
                "order": { "min_price": "desc" }
            },
            "aggs": {
                "min_price": { "min": { "field": "json.mixed_price" } }
            }
        },
        "rangeagg": {
            "range": {
                "field": "json.mixed_type",
                "ranges": [
                    { "to": 3.0 },
                    { "from": 19.0, "to": 20.0 },
                    { "from": 20.0 }
                ]
            },
            "aggs": {
                "average_in_range": { "avg": { "field": "json.mixed_type" } }
            }
        }
    } "#;
    let request: Aggregations = serde_json::from_str(agg_req_str).unwrap();
    let collector = get_collector(request);
    let searcher = index.reader().unwrap().searcher();

    let results = searcher.search(&AllQuery, &collector).unwrap();
    let actual_json = serde_json::to_value(results).unwrap();
    let expected_json = serde_json::json!({
          "rangeagg": {
            "buckets": [
              { "average_in_range": { "value": -20.5 }, "doc_count": 1, "key": "*-3", "to": 3.0 },
              { "average_in_range": { "value": 10.0 }, "doc_count": 1, "from": 3.0, "key": "3-19", "to": 19.0 },
              { "average_in_range": { "value": null }, "doc_count": 0, "from": 19.0, "key": "19-20", "to": 20.0 },
              { "average_in_range": { "value": null }, "doc_count": 0, "from": 20.0, "key": "20-*" }
            ]
          },
          "termagg": {
            "buckets": [
              { "doc_count": 1, "key": 10, "min_price": { "value": 10.0 } },
              { "doc_count": 3, "key": "blue", "min_price": { "value": 5.0 } },
              { "doc_count": 2, "key": "red", "min_price": { "value": 1.0 } },
              { "doc_count": 1, "key": -20.5, "min_price": { "value": -20.5 } },
              { "doc_count": 2, "key": 1, "key_as_string": "true", "min_price": { "value": null } },
            ],
            "sum_other_doc_count": 0
          }
        }
    );
    assert_eq!(&actual_json, &expected_json);
}

/// Checks that a terms aggregation merges buckets correctly when the same
/// JSON path holds numeric values in different segments: the same logical
/// value `10` appears in both segments and must end up in a single bucket.
#[test]
fn test_aggregation_on_json_object_mixed_numerical_segments() {
    let mut schema_builder = Schema::builder();
    let json = schema_builder.add_json_field("json", FAST);
    let schema = schema_builder.build();
    let index = Index::create_in_ram(schema);
    let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
    // => Segment with all values f64 numeric
    index_writer
        .add_document(doc!(json => json!({"mixed_price": 10.5})))
        .unwrap();
    // Gets converted to f64!
    index_writer
        .add_document(doc!(json => json!({"mixed_price": 10})))
        .unwrap();
    index_writer.commit().unwrap();
    // => Segment with all values i64 numeric
    index_writer
        .add_document(doc!(json => json!({"mixed_price": 10})))
        .unwrap();
    // A single commit is enough here: no document is added afterwards.
    index_writer.commit().unwrap();

    // Terms aggregation on the numeric field
    let agg_req_str = r#"
    {
        "termagg": {
            "terms": {
                "field": "json.mixed_price"
            }
        }
    } "#;
    let agg: Aggregations = serde_json::from_str(agg_req_str).unwrap();
    let aggregation_collector = get_collector(agg);
    let reader = index.reader().unwrap();
    let searcher = reader.searcher();

    let aggregation_results = searcher.search(&AllQuery, &aggregation_collector).unwrap();
    let aggregation_res_json = serde_json::to_value(aggregation_results).unwrap();
    use pretty_assertions::assert_eq;
    assert_eq!(
        &aggregation_res_json,
        &serde_json::json!({
          "termagg": {
            "buckets": [
              { "doc_count": 2, "key": 10},
              { "doc_count": 1, "key": 10.5},
            ],
            "doc_count_error_upper_bound": 0,
            "sum_other_doc_count": 0
          }
        }
        )
    );
}


================================================
FILE: src/aggregation/bucket/composite/accessors.rs
================================================
use std::net::Ipv6Addr;

use columnar::column_values::{CompactHit, CompactSpaceU64Accessor};
use columnar::{Column, ColumnType, MonotonicallyMappableToU64, StrColumn, TermOrdHit};

use crate::aggregation::accessor_helpers::get_numeric_or_date_column_types;
use crate::aggregation::bucket::composite::numeric_types::num_proj;
use crate::aggregation::bucket::composite::numeric_types::num_proj::ProjectedNumber;
use crate::aggregation::bucket::composite::ToTypePaginationOrder;
use crate::aggregation::bucket::{
    parse_into_milliseconds, CalendarInterval, CompositeAggregation, CompositeAggregationSource,
    MissingOrder, Order,
};
use crate::aggregation::intermediate_agg_result::CompositeIntermediateKey;
use crate::{SegmentReader, TantivyError};

/// Contains all information required by the SegmentCompositeCollector to perform the
/// composite aggregation on a segment.
pub struct CompositeAggReqData {
    /// The name of the aggregation.
    pub name: String,
    /// The composite aggregation request.
    pub req: CompositeAggregation,
    /// Accessors for each source, each source can have multiple accessors (columns).
    pub composite_accessors: Vec<CompositeSourceAccessors>,
}

impl CompositeAggReqData {
    /// Returns a rough estimate, in bytes, of the memory held by this struct.
    ///
    /// Only the struct itself and one `CompositeSourceAccessors` per source
    /// are accounted for; data owned by the individual accessors is not.
    pub fn get_memory_consumption(&self) -> usize {
        let own_size = std::mem::size_of::<Self>();
        let per_source_size = std::mem::size_of::<CompositeSourceAccessors>();
        let source_count = self.composite_accessors.len();
        own_size + source_count * per_source_size
    }
}

/// Accessors for a single column in a composite source.
///
/// A source field can be backed by several columns (one per column type), in
/// which case one `CompositeAccessor` is created for each of them.
pub struct CompositeAccessor {
    /// The fast field column
    pub column: Column<u64>,
    /// The column type
    pub column_type: ColumnType,
    /// Term dictionary if the column type is Str
    ///
    /// Only used by term sources (histogram and date histogram sources always
    /// set it to `None`).
    pub str_dict_column: Option<StrColumn>,
    /// Parsed date interval for date histogram sources
    /// (`PrecomputedDateInterval::NotApplicable` for the other source kinds).
    pub date_histogram_interval: PrecomputedDateInterval,
}

/// Accessors to all the columns that belong to the field of a composite source.
pub struct CompositeSourceAccessors {
    /// The accessors for this source
    pub accessors: Vec<CompositeAccessor>,
    /// The key after which to start collecting results, projected into the
    /// column space of the accessor at `after_key_accessor_idx`.
    pub after_key: PrecomputedAfterKey,

    /// The column index the after_key applies to. The after_key only applies to
    /// one column. Columns before should be skipped. Columns after should be
    /// kept without comparison to the after_key.
    pub after_key_accessor_idx: usize,

    /// Whether to skip missing values because of the after_key. Skipping only
    /// applies if the value for previous columns were exactly equal to the
    /// corresponding after keys (is_on_after_key).
    pub skip_missing: bool,

    /// The after key was set to null to indicate that the last collected key
    /// was a missing value.
    pub is_after_key_explicit_missing: bool,
}

impl CompositeSourceAccessors {
    /// Creates a new set of accessors for the composite source.
    ///
    /// Precomputes some values to make collection faster.
    ///
    /// # Errors
    ///
    /// Returns `TantivyError::InvalidArgument` when:
    /// - the after key for this source is `null` but the source does not
    ///   enable `missing_bucket`,
    /// - the after key type does not match a histogram / date histogram source,
    /// - a date histogram source does not define exactly one interval kind.
    ///
    /// Errors raised while opening the fast field columns or projecting the
    /// after key are propagated as is.
    pub fn build_for_source(
        reader: &SegmentReader,
        source: &CompositeAggregationSource,
        // `None` when no after key was set in the query,
        // `Some(CompositeIntermediateKey::Null)` when the after key was set but
        // its value for this source was set to `null`
        source_after_key_opt: Option<&CompositeIntermediateKey>,
    ) -> crate::Result<Self> {
        let is_after_key_explicit_missing = source_after_key_opt
            .map(|after_key| matches!(after_key, CompositeIntermediateKey::Null))
            .unwrap_or(false);
        let mut skip_missing = false;
        if let Some(CompositeIntermediateKey::Null) = source_after_key_opt {
            // A null after key can only have been produced by a missing bucket.
            if !source.missing_bucket() {
                return Err(TantivyError::InvalidArgument(
                    "the 'after' key for a source cannot be null when 'missing_bucket' is false"
                        .to_string(),
                ));
            }
        } else if source_after_key_opt.is_some() {
            // if missing buckets come first and we have a non null after key, we skip missing
            if MissingOrder::First == source.missing_order() {
                skip_missing = true;
            }
            if MissingOrder::Default == source.missing_order() && Order::Asc == source.order() {
                skip_missing = true;
            }
        };

        match source {
            CompositeAggregationSource::Terms(source) => {
                let allowed_column_types = [
                    ColumnType::I64,
                    ColumnType::U64,
                    ColumnType::F64,
                    ColumnType::Str,
                    ColumnType::DateTime,
                    ColumnType::Bool,
                    ColumnType::IpAddr,
                    // ColumnType::Bytes Unsupported
                ];
                let mut columns_and_types = reader
                    .fast_fields()
                    .u64_lenient_for_type_all(Some(&allowed_column_types), &source.field)?;

                // Sort columns by their pagination order and determine which to skip
                columns_and_types.sort_by_key(|(_, col_type): &(Column, ColumnType)| {
                    col_type.column_pagination_order()
                });
                if source.order == Order::Desc {
                    columns_and_types.reverse();
                }
                let after_key_accessor_idx = find_first_column_to_collect(
                    &columns_and_types,
                    source_after_key_opt,
                    source.missing_order,
                    source.order,
                )?;

                // NOTE(review): the term dictionary is looked up once per column,
                // whatever the column type is — confirm whether it could be
                // fetched only for `ColumnType::Str` columns.
                let source_collectors: Vec<CompositeAccessor> = columns_and_types
                    .into_iter()
                    .map(|(column, column_type)| {
                        Ok(CompositeAccessor {
                            column,
                            column_type,
                            str_dict_column: reader.fast_fields().str(&source.field)?,
                            date_histogram_interval: PrecomputedDateInterval::NotApplicable,
                        })
                    })
                    .collect::<crate::Result<_>>()?;

                // The after key is projected into the column space of the first
                // column that still has to be collected.
                let after_key = if let Some(first_col) =
                    source_collectors.get(after_key_accessor_idx)
                {
                    match source_after_key_opt {
                        Some(after_key) => PrecomputedAfterKey::precompute(
                            first_col,
                            after_key,
                            &source.field,
                            source.missing_order,
                            source.order,
                        )?,
                        None => {
                            precompute_missing_after_key(false, source.missing_order, source.order)
                        }
                    }
                } else {
                    // if no columns, we don't care about the after_key
                    PrecomputedAfterKey::Next(0)
                };

                Ok(CompositeSourceAccessors {
                    accessors: source_collectors,
                    is_after_key_explicit_missing,
                    skip_missing,
                    after_key,
                    after_key_accessor_idx,
                })
            }
            CompositeAggregationSource::Histogram(source) => {
                let column_and_types: Vec<(Column, ColumnType)> =
                    reader.fast_fields().u64_lenient_for_type_all(
                        Some(get_numeric_or_date_column_types()),
                        &source.field,
                    )?;
                let source_collectors: Vec<CompositeAccessor> = column_and_types
                    .into_iter()
                    .map(|(column, column_type)| {
                        Ok(CompositeAccessor {
                            column,
                            column_type,
                            str_dict_column: None,
                            date_histogram_interval: PrecomputedDateInterval::NotApplicable,
                        })
                    })
                    .collect::<crate::Result<_>>()?;
                let after_key = match source_after_key_opt {
                    Some(CompositeIntermediateKey::F64(key)) => {
                        // The after key is divided by the interval before being
                        // projected to an i64.
                        let normalized_key = *key / source.interval;
                        num_proj::f64_to_i64(normalized_key).into()
                    }
                    Some(CompositeIntermediateKey::Null) => {
                        precompute_missing_after_key(true, source.missing_order, source.order)
                    }
                    // NOTE(review): the terms source passes `false` when no after
                    // key is set, this branch passes `true` — confirm the
                    // difference is intended.
                    None => precompute_missing_after_key(true, source.missing_order, source.order),
                    _ => {
                        return Err(crate::TantivyError::InvalidArgument(
                            "After key type invalid for interval composite source".to_string(),
                        ));
                    }
                };
                Ok(CompositeSourceAccessors {
                    accessors: source_collectors,
                    is_after_key_explicit_missing,
                    skip_missing,
                    after_key,
                    after_key_accessor_idx: 0,
                })
            }
            CompositeAggregationSource::DateHistogram(source) => {
                let column_and_types = reader
                    .fast_fields()
                    .u64_lenient_for_type_all(Some(&[ColumnType::DateTime]), &source.field)?;
                // Validates that exactly one of the two interval kinds is set.
                let date_histogram_interval =
                    PrecomputedDateInterval::from_date_histogram_source_intervals(
                        &source.fixed_interval,
                        source.calendar_interval,
                    )?;
                let source_collectors: Vec<CompositeAccessor> = column_and_types
                    .into_iter()
                    .map(|(column, column_type)| {
                        Ok(CompositeAccessor {
                            column,
                            column_type,
                            str_dict_column: None,
                            date_histogram_interval,
                        })
                    })
                    .collect::<crate::Result<_>>()?;
                let after_key = match source_after_key_opt {
                    Some(CompositeIntermediateKey::DateTime(key)) => {
                        PrecomputedAfterKey::Exact(key.to_u64())
                    }
                    Some(CompositeIntermediateKey::Null) => {
                        precompute_missing_after_key(true, source.missing_order, source.order)
                    }
                    // NOTE(review): same `true` flag as for an explicit null after
                    // key, unlike the terms source — confirm this is intended.
                    None => precompute_missing_after_key(true, source.missing_order, source.order),
                    _ => {
                        return Err(crate::TantivyError::InvalidArgument(
                            "After key type invalid for interval composite source".to_string(),
                        ));
                    }
                };
                Ok(CompositeSourceAccessors {
                    accessors: source_collectors,
                    is_after_key_explicit_missing,
                    skip_missing,
                    after_key,
                    after_key_accessor_idx: 0,
                })
            }
        }
    }
}

/// Returns the index of the first column that still has to be collected when
/// resuming the pagination from the after key.
///
/// `sorted_columns` must already be sorted in the pagination order of the
/// source. The returned index equals `sorted_columns.len()` when no column is
/// left to collect.
fn find_first_column_to_collect<T>(
    sorted_columns: &[(T, ColumnType)],
    after_key_opt: Option<&CompositeIntermediateKey>,
    missing_order: MissingOrder,
    order: Order,
) -> crate::Result<usize> {
    let column_count = sorted_columns.len();

    // Without an after key there is no pagination: collect every column.
    let Some(after_key) = after_key_opt else {
        return Ok(0);
    };

    // A null after key means the previous page stopped on a missing value.
    if let CompositeIntermediateKey::Null = after_key {
        let missing_comes_first = matches!(
            (missing_order, order),
            (MissingOrder::First, _) | (MissingOrder::Default, Order::Asc)
        );
        // Missing first: every column is still ahead. Missing last: all
        // columns have already been returned.
        return Ok(if missing_comes_first { 0 } else { column_count });
    }

    // Otherwise resume at the first column whose type is at, or past, the type
    // of the after key in the pagination sequence.
    let after_key_rank = after_key.column_pagination_order();
    let first_idx = sorted_columns
        .iter()
        .position(|(_, column_type)| {
            let column_rank = column_type.column_pagination_order();
            match order {
                Order::Asc => column_rank >= after_key_rank,
                Order::Desc => column_rank <= after_key_rank,
            }
        })
        // Every column precedes the after key: nothing left to collect.
        .unwrap_or(column_count);
    Ok(first_idx)
}

/// Computes the after key to use when there is no concrete after key value
/// to project into the column space.
///
/// The result is `PrecomputedAfterKey::Next(0)` for an ascending order and
/// `PrecomputedAfterKey::AfterLast` for a descending order, except when the
/// after key is an explicit missing value and missing values are ordered
/// last, in which case the two results are swapped.
fn precompute_missing_after_key(
    is_after_key_explicit_missing: bool,
    missing_order: MissingOrder,
    order: Order,
) -> PrecomputedAfterKey {
    let ascending = match order {
        Order::Asc => true,
        Order::Desc => false,
    };
    let swapped = is_after_key_explicit_missing && matches!(missing_order, MissingOrder::Last);
    if ascending != swapped {
        PrecomputedAfterKey::Next(0)
    } else {
        PrecomputedAfterKey::AfterLast
    }
}

/// A parsed representation of the date interval for date histogram sources
#[derive(Clone, Copy, Debug)]
pub enum PrecomputedDateInterval {
    /// This is not a date histogram source
    NotApplicable,
    /// Source was configured with a fixed interval, expressed here in
    /// nanoseconds
    FixedNanoseconds(i64),
    /// Source was configured with a calendar interval
    Calendar(CalendarInterval),
}

impl PrecomputedDateInterval {
    /// Validates the date histogram source interval fields and parses a date interval from them.
    ///
    /// Exactly one of `fixed_interval` and `calendar_interval` must be set.
    ///
    /// # Errors
    ///
    /// Returns `TantivyError::InvalidArgument` when both or none of the
    /// intervals are set, or when the fixed interval does not fit in an `i64`
    /// once converted to nanoseconds. Parsing errors of the fixed interval are
    /// propagated.
    pub fn from_date_histogram_source_intervals(
        fixed_interval: &Option<String>,
        calendar_interval: Option<CalendarInterval>,
    ) -> crate::Result<Self> {
        match (fixed_interval, calendar_interval) {
            (Some(_), Some(_)) | (None, None) => Err(TantivyError::InvalidArgument(
                "date histogram source must one and only one of fixed_interval or \
                 calendar_interval set"
                    .to_string(),
            )),
            (Some(fixed_interval), None) => {
                let fixed_interval_ms = parse_into_milliseconds(fixed_interval)?;
                // The interval comes from the request: reject values that would
                // overflow instead of panicking (debug) or wrapping (release).
                let fixed_interval_ns =
                    fixed_interval_ms.checked_mul(1_000_000).ok_or_else(|| {
                        TantivyError::InvalidArgument(format!(
                            "fixed_interval '{fixed_interval}' is too large to be expressed in \
                             nanoseconds"
                        ))
                    })?;
                Ok(PrecomputedDateInterval::FixedNanoseconds(fixed_interval_ns))
            }
            (None, Some(calendar_interval)) => {
                Ok(PrecomputedDateInterval::Calendar(calendar_interval))
            }
        }
    }
}

/// The after key projected to the u64 column space
///
/// Some column types (term, IP) might not have an exact representation of the
/// specified after key
#[derive(Debug)]
pub enum PrecomputedAfterKey {
    /// The after key could be exactly represented in the column space.
    Exact(u64),
    /// The after key could not be exactly represented in the column space, so
    /// this is the next closest one.
    Next(u64),
    /// The after key could not be represented in the column space, it is
    /// greater than all values
    AfterLast,
}

/// Maps a compact space lookup result onto the matching after key variant,
/// widening the compact value to `u64`.
impl From<CompactHit> for PrecomputedAfterKey {
    fn from(hit: CompactHit) -> Self {
        match hit {
            CompactHit::AfterLast => Self::AfterLast,
            CompactHit::Next(compact) => Self::Next(compact as u64),
            CompactHit::Exact(compact) => Self::Exact(compact as u64),
        }
    }
}

/// Maps a term dictionary lookup result onto the matching after key variant.
impl From<TermOrdHit> for PrecomputedAfterKey {
    fn from(hit: TermOrdHit) -> Self {
        match hit {
            // A term past the end of the dictionary is reported by TermOrdHit
            // as Next(u64::MAX); it is forwarded unchanged rather than being
            // turned into AfterLast.
            TermOrdHit::Next(term_ord) => Self::Next(term_ord),
            TermOrdHit::Exact(term_ord) => Self::Exact(term_ord),
        }
    }
}

/// Maps a projected number onto the matching after key variant, converting
/// the number to its u64 column representation.
impl<T: MonotonicallyMappableToU64> From<ProjectedNumber<T>> for PrecomputedAfterKey {
    fn from(num: ProjectedNumber<T>) -> Self {
        match num {
            ProjectedNumber::AfterLast => Self::AfterLast,
            ProjectedNumber::Next(value) => Self::Next(value.to_u64()),
            ProjectedNumber::Exact(value) => Self::Exact(value.to_u64()),
        }
    }
}

// /!\ These operators only makes sense if both values are in the same column space
impl PrecomputedAfterKey {
    pub fn equals(&self, column_value: u64) -> bool {
        match self {
            PrecomputedAfterKey::Exact(v) => *v == column_value,
            PrecomputedAfterKey::Next(_) => false,
            PrecomputedAfterKey::AfterLast => false,
        }
    }

    pub fn gt(&self, column_value: u64) -> bool {
        match self {
            PrecomputedAfterKey::Exact(v) => *v > column_value,
            PrecomputedAfterKey::Next(v) => *v > column_value,
            PrecomputedAfterKey::AfterLast => true,
        }
    }

    pub fn lt(&self, column_value: u64) -> bool {
        match self {
            PrecomputedAfterKey::Exact(v) => *v < column_value,
            // a value equal to the next is greater than the after key
            PrecomputedAfterKey::Next(v) => *v <= column_value,
            PrecomputedAfterKey::AfterLast => false,
        }
    }

    fn precompute_ip_addr(column: &Column<u64>, key: &Ipv6Addr) -> crate::Result<Self> {
        let compact_space_accessor = column
            .values
            .clone()
            .downcast_arc::<CompactSpaceU64Accessor>()
            .map_err(|_| {
                TantivyError::AggregationError(crate::aggregation::AggregationError::InternalError(
                    "type mismatch: could not downcast to CompactSpaceU64Accessor".to_string(),
                ))
            })?;
        let ip_u128 = key.to_bits();
        let ip_next_compact = compact_space_accessor.u128_to_next_compact(ip_u128);
        Ok(ip_next_compact.into())
    }

    fn precompute_term_ord(
        str_dict_column: &Option<StrColumn>,
        key: &str,
        field: &str,
    ) -> crate::Result<Self> {
        let dict = str_dict_column
            .as_ref()
            .expect("dictionary missing for str accessor")
            .dictionary();
        let next_ord = dict.term_ord_or_next(key).map_err(|_| {
            TantivyError::InvalidArgument(format!(
                "failed to lookup after_key '{}' for field '{}'",
                key, field
            ))
        })?;
        Ok(next_ord.into())
    }

    /// Projects the after key into the column space of the given accessor.
    ///
    /// The computed after key will not take care of skipping entire columns
    /// when the after key type is ordered after the accessor's type, that
    /// should be performed earlier.
    pub fn precompute(
        composite_accessor: &CompositeAccessor,
        source_after_key: &CompositeIntermediateKey,
        field: &str,
        missing_order: MissingOrder,
        order: Order,
    ) -> crate::Result<Self> {
        use CompositeIntermediateKey as CIKey;
        let precomputed_key = match (composite_accessor.column_type, source_after_key) {
            (ColumnType::Bytes, _) => panic!("unsupported"),
            // null after key
            (_, CIKey::Null) => precompute_missing_after_key(false, missing_order, order),
            // numerical
            (ColumnType::I64, CIKey::I64(k)) => PrecomputedAfterKey::Exact(k.to_u64()),
            (ColumnType::I64, CIKey::U64(k)) => num_proj::u64_to_i64(*k).into(),
            (ColumnType::I64, CIKey::F64(k)) => num_proj::f64_to_i64(*k).into(),
            (ColumnType::U64, CIKey::I64(k)) => num_proj::i64_to_u64(*k).into(),
            (ColumnType::U64, CIKey::U64(k)) => PrecomputedAfterKey::Exact(*k),
            (ColumnType::U64, CIKey::F64(k)) => num_proj::f64_to_u64(*k).into(),
            (ColumnType::F64, CIKey::I64(k)) => num_proj::i64_to_f64(*k).into(),
            (ColumnType::F64, CIKey::U64(k)) => num_proj::u64_to_f64(*k).into(),
            (ColumnType::F64, CIKey::F64(k)) => PrecomputedAfterKey::Exact(k.to_u64()),
            // boolean
            (ColumnType::Bool, CIKey::Bool(key)) => PrecomputedAfterKey::Exact(key.to_u64()),
            // string
            (ColumnType::Str, CIKey::Str(key)) => PrecomputedAfterKey::precompute_term_ord(
                &composite_accessor.str_dict_column,
                key,
                field,
            )?,
            // date time
            (ColumnType::DateTime, CIKey::DateTime(key)) => {
                PrecomputedAfterKey::Exact(key.to_u64())
            }
            // ip address
            (ColumnType::IpAddr, CIKey::IpAddr(key)) => {
                PrecomputedAfterKey::precompute_ip_addr(&composite_accessor.column, key)?
            }
            // assume the column's type is ordered after the after_key's type
            _ => PrecomputedAfterKey::keep_all(order),
        };
        Ok(precomputed_key)
    }

    fn keep_all(order: Order) -> Self {
        match order {
            Order::Asc => PrecomputedAfterKey::Next(0),
            Order::Desc => PrecomputedAfterKey::Next(u64::MAX),
        }
    }
}


================================================
FILE: src/aggregation/bucket/composite/calendar_interval.rs
================================================
use time::convert::{Day, Nanosecond};
use time::{Time, UtcDateTime};

/// Number of nanoseconds in one day.
const NS_IN_DAY: i64 = Nanosecond::per_t::<i128>(Day) as i64;

/// Returns the timestamp, in nanoseconds, of the start of the year that
/// contains `timestamp_ns` (January 1st at midnight UTC).
///
/// Failures of the underlying date computation are reported as
/// `TantivyError::InvalidArgument`.
pub(super) fn try_year_bucket(timestamp_ns: i64) -> crate::Result<i64> {
    match year_bucket_using_time_crate(timestamp_ns) {
        Ok(year_start_ns) => Ok(year_start_ns),
        Err(e) => Err(crate::TantivyError::InvalidArgument(format!(
            "Failed to compute year bucket for timestamp {}: {e}",
            timestamp_ns
        ))),
    }
}

/// Returns the timestamp, in nanoseconds, of the start of the month that
/// contains `timestamp_ns` (1st of the month at midnight UTC).
///
/// Failures of the underlying date computation are reported as
/// `TantivyError::InvalidArgument`.
pub(super) fn try_month_bucket(timestamp_ns: i64) -> crate::Result<i64> {
    match month_bucket_using_time_crate(timestamp_ns) {
        Ok(month_start_ns) => Ok(month_start_ns),
        Err(e) => Err(crate::TantivyError::InvalidArgument(format!(
            "Failed to compute month bucket for timestamp {}: {e}",
            timestamp_ns
        ))),
    }
}

/// Computes the timestamp in nanoseconds corresponding to the beginning of the
/// week (Monday at midnight UTC).
///
/// Timestamps before the epoch are supported. For timestamps so close to
/// `i64::MIN` that the Monday of their week cannot be represented, the result
/// saturates to `i64::MIN` instead of overflowing.
pub(super) fn week_bucket(timestamp_ns: i64) -> i64 {
    // Euclidean division rounds towards negative infinity, which keeps the
    // day index correct for timestamps before the epoch.
    let days_since_epoch = timestamp_ns.div_euclid(NS_IN_DAY);
    // Find the weekday: 0=Monday, ..., 6=Sunday.
    // 1970-01-01 (day 0) was a Thursday, i.e. weekday 3, hence the offset.
    let weekday = (days_since_epoch + 3).rem_euclid(7);
    let monday_days_since_epoch = days_since_epoch - weekday;
    // The Monday of the very first representable week lies before i64::MIN
    // nanoseconds, so a plain multiplication would overflow there.
    monday_days_since_epoch.saturating_mul(NS_IN_DAY)
}

fn year_bucket_using_time_crate(timestamp_ns: i64) -> Result<i64, time::Error> {
    let timestamp_ns = UtcDateTime::from_unix_timestamp_nanos(timestamp_ns as i128)?
        .replace_ordinal(1)?
        .replace_time(Time::MIDNIGHT)
        .unix_timestamp_nanos();
    Ok(timestamp_ns as i64)
}

fn month_bucket_using_time_crate(timestamp_ns: i64) -> Result<i64, time::Error> {
    let timestamp_ns = UtcDateTime::from_unix_timestamp_nanos(timestamp_ns as i128)?
        .replace_day(1)?
        .replace_time(Time::MIDNIGHT)
        .unix_timestamp_nanos();
    Ok(timestamp_ns as i64)
}

#[cfg(test)]
mod tests {
    use time::format_description::well_known::Iso8601;
    use time::UtcDateTime;

    use super::*;

    /// Parses an ISO 8601 date time into nanoseconds since the epoch.
    fn ts_ns(iso: &str) -> i64 {
        UtcDateTime::parse(iso, &Iso8601::DEFAULT)
            .unwrap()
            .unix_timestamp_nanos() as i64
    }

    #[test]
    fn test_year_bucket() {
        let ts = ts_ns("1970-01-01T00:00:00Z");
        let res = try_year_bucket(ts).unwrap();
        assert_eq!(res, ts_ns("1970-01-01T00:00:00Z"));

        let ts = ts_ns("1970-06-01T10:00:01.010Z");
        let res = try_year_bucket(ts).unwrap();
        assert_eq!(res, ts_ns("1970-01-01T00:00:00Z"));

        let ts = ts_ns("2008-12-31T23:59:59.999999999Z"); // leap year
        let res = try_year_bucket(ts).unwrap();
        assert_eq!(res, ts_ns("2008-01-01T00:00:00Z"));

        let ts = ts_ns("2008-01-01T00:00:00Z"); // leap year
        let res = try_year_bucket(ts).unwrap();
        assert_eq!(res, ts_ns("2008-01-01T00:00:00Z"));

        let ts = ts_ns("2010-12-31T23:59:59.999999999Z");
        let res = try_year_bucket(ts).unwrap();
        assert_eq!(res, ts_ns("2010-01-01T00:00:00Z"));

        let ts = ts_ns("1972-06-01T00:10:00Z");
        let res = try_year_bucket(ts).unwrap();
        assert_eq!(res, ts_ns("1972-01-01T00:00:00Z"));

        let ts = ts_ns("1969-06-15T00:00:00Z"); // before the epoch
        let res = try_year_bucket(ts).unwrap();
        assert_eq!(res, ts_ns("1969-01-01T00:00:00Z"));
    }

    #[test]
    fn test_month_bucket() {
        let ts = ts_ns("1970-01-15T00:00:00Z");
        let res = try_month_bucket(ts).unwrap();
        assert_eq!(res, ts_ns("1970-01-01T00:00:00Z"));

        let ts = ts_ns("1970-02-01T00:00:00Z");
        let res = try_month_bucket(ts).unwrap();
        assert_eq!(res, ts_ns("1970-02-01T00:00:00Z"));

        let ts = ts_ns("2000-01-31T23:59:59.999999999Z");
        let res = try_month_bucket(ts).unwrap();
        assert_eq!(res, ts_ns("2000-01-01T00:00:00Z"));

        let ts = ts_ns("2008-02-29T12:00:00Z"); // leap day
        let res = try_month_bucket(ts).unwrap();
        assert_eq!(res, ts_ns("2008-02-01T00:00:00Z"));

        let ts = ts_ns("1969-12-31T23:59:59.999999999Z"); // before the epoch
        let res = try_month_bucket(ts).unwrap();
        assert_eq!(res, ts_ns("1969-12-01T00:00:00Z"));
    }

    #[test]
    fn test_week_bucket() {
        let ts = ts_ns("1970-01-05T00:00:00Z"); // Monday
        let res = week_bucket(ts);
        assert_eq!(res, ts_ns("1970-01-05T00:00:00Z"));

        let ts = ts_ns("1970-01-05T23:59:59Z"); // Monday
        let res = week_bucket(ts);
        assert_eq!(res, ts_ns("1970-01-05T00:00:00Z"));

        let ts = ts_ns("1970-01-07T01:13:00Z"); // Wednesday
        let res = week_bucket(ts);
        assert_eq!(res, ts_ns("1970-01-05T00:00:00Z"));

        let ts = ts_ns("1970-01-11T23:59:59.999999999Z"); // Sunday
        let res = week_bucket(ts);
        assert_eq!(res, ts_ns("1970-01-05T00:00:00Z"));

        let ts = ts_ns("2025-10-16T10:41:59.010Z"); // Thursday
        let res = week_bucket(ts);
        assert_eq!(res, ts_ns("2025-10-13T00:00:00Z"));

        let ts = ts_ns("1970-01-01T00:00:00Z"); // Thursday
        let res = week_bucket(ts);
        assert_eq!(res, ts_ns("1969-12-29T00:00:00Z")); // Negative

        let ts = ts_ns("1969-12-31T23:59:59Z"); // Wednesday, before the epoch
        let res = week_bucket(ts);
        assert_eq!(res, ts_ns("1969-12-29T00:00:00Z"));
    }
}


================================================
FILE: src/aggregation/bucket/composite/collector.rs
================================================
use std::fmt::Debug;
use std::mem;
use std::net::Ipv6Addr;

use columnar::column_values::CompactSpaceU64Accessor;
use columnar::{
    Column, ColumnType, Dictionary, MonotonicallyMappableToU128, MonotonicallyMappableToU64,
    NumericalValue, StrColumn,
};
use rustc_hash::FxHashMap;
use smallvec::SmallVec;

use crate::aggregation::agg_data::{
    build_segment_agg_collectors, AggRefNode, AggregationsSegmentCtx,
};
use crate::aggregation::bucket::composite::accessors::{
    CompositeAccessor, CompositeAggReqData, PrecomputedDateInterval,
};
use crate::aggregation::bucket::composite::calendar_interval;
use crate::aggregation::bucket::composite::map::{DynArrayHeapMap, MAX_DYN_ARRAY_SIZE};
use crate::aggregation::bucket::{
    CalendarInterval, CompositeAggregationSource, MissingOrder, Order,
};
use crate::aggregation::cached_sub_aggs::{CachedSubAggs, HighCardSubAggCache};
use crate::aggregation::intermediate_agg_result::{
    CompositeIntermediateKey, IntermediateAggregationResult, IntermediateAggregationResults,
    IntermediateBucketResult, IntermediateCompositeBucketEntry, IntermediateCompositeBucketResult,
};
use crate::aggregation::segment_agg_result::{BucketIdProvider, SegmentAggregationCollector};
use crate::aggregation::BucketId;
use crate::TantivyError;

/// State kept for a single composite bucket (one composite key) while collecting a segment.
#[derive(Clone, Debug)]
struct CompositeBucketCollector {
    /// Number of documents recorded in this bucket; reported as the bucket's `doc_count`.
    count: u32,
    /// Id under which the documents of this bucket are pushed to the sub-aggregations.
    bucket_id: BucketId,
}

/// Compact sortable representation of a single source value within a composite key.
///
/// The struct encodes both the column identity and the fast field value in a way
/// that preserves the desired sort order via the derived `Ord` implementation
/// (fields are compared top-to-bottom: `sort_key` first, then `encoded_value`).
/// Because of that, the declaration order of the fields must not be changed.
///
/// ## `sort_key` encoding
/// - `0` — missing value, sorted first
/// - `1..=254` — present value; the original accessor index is `sort_key - 1`
/// - `u8::MAX` (255) — missing value, sorted last
///
/// ## `encoded_value` encoding
/// - `0` when the field is missing
/// - The raw u64 fast-field representation when order is ascending
/// - Bitwise NOT of the raw u64 when order is descending (so that a larger raw value compares as
///   smaller)
#[derive(Clone, Copy, Debug, PartialEq, Eq, PartialOrd, Ord, Default, Hash)]
struct InternalValueRepr {
    /// Column index biased by +1 (so 0 and u8::MAX are reserved for missing sentinels).
    sort_key: u8,
    /// Fast field value, possibly bit-flipped for descending order.
    encoded_value: u64,
}

impl InternalValueRepr {
    /// Maps a raw value to its order-aware encoding and back.
    ///
    /// Ascending order keeps the value as is, descending order flips every bit.
    /// Applying the function twice with the same order yields the input again,
    /// which is why it serves both for encoding and decoding.
    #[inline]
    fn apply_order(value: u64, order: Order) -> u64 {
        match order {
            Order::Asc => value,
            Order::Desc => !value,
        }
    }

    /// Builds the representation of a present term value read from the accessor
    /// at position `accessor_idx`.
    #[inline]
    fn new_term(raw: u64, accessor_idx: u8, order: Order) -> Self {
        Self {
            sort_key: accessor_idx + 1,
            encoded_value: Self::apply_order(raw, order),
        }
    }

    /// Builds the representation of a present histogram bucket value.
    ///
    /// For histogram sources the column index is irrelevant (always 1).
    #[inline]
    fn new_histogram(raw: u64, order: Order) -> Self {
        Self {
            sort_key: 1,
            encoded_value: Self::apply_order(raw, order),
        }
    }

    /// Builds the representation of a missing value.
    ///
    /// The sentinel is `0` (sorted first) or `u8::MAX` (sorted last). An explicit
    /// `missing_order` wins; the default places missing values first for ascending
    /// order and last for descending order.
    #[inline]
    fn new_missing(order: Order, missing_order: MissingOrder) -> Self {
        let sort_key = match missing_order {
            MissingOrder::First => 0,
            MissingOrder::Last => u8::MAX,
            MissingOrder::Default => match order {
                Order::Asc => 0,
                Order::Desc => u8::MAX,
            },
        };
        Self {
            sort_key,
            encoded_value: 0,
        }
    }

    /// Decode back to `(accessor_idx, raw_value)`.
    /// Returns `None` when the value represents a missing field.
    #[inline]
    fn decode(self, order: Order) -> Option<(u8, u64)> {
        let is_missing = matches!(self.sort_key, 0 | u8::MAX);
        if is_missing {
            return None;
        }
        let accessor_idx = self.sort_key - 1;
        let raw = Self::apply_order(self.encoded_value, order);
        Some((accessor_idx, raw))
    }
}

/// The collector puts values from the fast field into the correct buckets and
/// does a conversion to the correct datatype.
///
/// Buckets are kept per parent bucket and keyed by the segment-local
/// [`InternalValueRepr`] encoding of each source value; the keys are resolved to
/// their intermediate form when the intermediate result is built.
#[derive(Debug)]
pub struct SegmentCompositeCollector {
    /// One DynArrayHeapMap per parent bucket.
    parent_buckets: Vec<DynArrayHeapMap<InternalValueRepr, CompositeBucketCollector>>,
    /// Index used to look up this aggregation's composite request data in the
    /// `AggregationsSegmentCtx`.
    accessor_idx: usize,
    /// Sub-aggregation collectors, `None` when the aggregation has no children.
    sub_agg: Option<CachedSubAggs<HighCardSubAggCache>>,
    /// Provides the bucket id assigned to each newly created composite bucket.
    bucket_id_provider: BucketIdProvider,
    /// Number of sources, needed when creating new DynArrayHeapMaps.
    num_sources: usize,
}

impl SegmentAggregationCollector for SegmentCompositeCollector {
    /// Drains the buckets collected for `parent_bucket_id` and pushes them into
    /// `results` under the name of this composite aggregation.
    fn add_intermediate_aggregation_result(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
        results: &mut IntermediateAggregationResults,
        parent_bucket_id: BucketId,
    ) -> crate::Result<()> {
        let name = agg_data
            .get_composite_req_data(self.accessor_idx)
            .name
            .clone();

        let buckets = self.add_intermediate_bucket_result(agg_data, parent_bucket_id)?;
        results.push(
            name,
            IntermediateAggregationResult::Bucket(IntermediateBucketResult::Composite { buckets }),
        )?;

        Ok(())
    }

    /// Records every document of `docs` in the composite buckets of `parent_bucket_id`.
    ///
    /// # Errors
    /// Returns the first error raised while visiting a document, while flushing the
    /// sub-aggregation cache, or while accounting the additional memory.
    fn collect(
        &mut self,
        parent_bucket_id: BucketId,
        docs: &[crate::DocId],
        agg_data: &mut AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        let mem_pre = self.get_memory_consumption();
        let composite_agg_data = agg_data.take_composite_req_data(self.accessor_idx);

        let visit_result = docs.iter().try_for_each(|doc| {
            let mut visitor = CompositeKeyVisitor {
                doc_id: *doc,
                composite_agg_data: &composite_agg_data,
                buckets: &mut self.parent_buckets[parent_bucket_id as usize],
                sub_agg: &mut self.sub_agg,
                bucket_id_provider: &mut self.bucket_id_provider,
                sub_level_values: SmallVec::new(),
            };
            visitor.visit(0, true)
        });
        // Hand the request data back before propagating any error, so that the
        // context is never left without it.
        agg_data.put_back_composite_req_data(self.accessor_idx, composite_agg_data);
        visit_result?;

        if let Some(sub_agg) = &mut self.sub_agg {
            sub_agg.check_flush_local(agg_data)?;
        }

        // Only growth is reported; saturating keeps the unsigned subtraction from
        // underflowing should the reported consumption ever shrink.
        let mem_delta = self.get_memory_consumption().saturating_sub(mem_pre);
        if mem_delta > 0 {
            agg_data.context.limits.add_memory_consumed(mem_delta)?;
        }

        Ok(())
    }

    /// Flushes the documents cached for the sub-aggregations, if there are any.
    fn flush(&mut self, agg_data: &mut AggregationsSegmentCtx) -> crate::Result<()> {
        if let Some(sub_agg) = &mut self.sub_agg {
            sub_agg.flush(agg_data)?;
        }
        Ok(())
    }

    /// Makes sure a bucket map exists for every parent bucket id up to and
    /// including `max_bucket`.
    fn prepare_max_bucket(
        &mut self,
        max_bucket: BucketId,
        _agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        let required_len = max_bucket as usize + 1;
        while self.parent_buckets.len() < required_len {
            let map = DynArrayHeapMap::try_new(self.num_sources)?;
            self.parent_buckets.push(map);
        }
        Ok(())
    }
}

impl SegmentCompositeCollector {
    fn get_memory_consumption(&self) -> u64 {
        self.parent_buckets
            .iter()
            .map(|m| m.memory_consumption())
            .sum()
    }

    pub(crate) fn from_req_and_validate(
        req_data: &mut AggregationsSegmentCtx,
        node: &AggRefNode,
    ) -> crate::Result<Self> {
        validate_req(req_data, node.idx_in_req_data)?;

        let has_sub_aggregations = !node.children.is_empty();
        let sub_agg = if has_sub_aggregations {
            let sub_agg_collector = build_segment_agg_collectors(req_data, &node.children)?;
            Some(CachedSubAggs::new(sub_agg_collector))
        } else {
            None
        };

        let composite_req_data = req_data.get_composite_req_data(node.idx_in_req_data);
        let num_sources = composite_req_data.req.sources.len();

        Ok(SegmentCompositeCollector {
            parent_buckets: vec![DynArrayHeapMap::try_new(num_sources)?],
            accessor_idx: node.idx_in_req_data,
            sub_agg,
            bucket_id_provider: BucketIdProvider::default(),
            num_sources,
        })
    }

    #[inline]
    fn add_intermediate_bucket_result(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
        parent_bucket_id: BucketId,
    ) -> crate::Result<IntermediateCompositeBucketResult> {
        let empty_map = DynArrayHeapMap::try_new(self.num_sources)?;
        let heap_map = mem::replace(
            &mut self.parent_buckets[parent_bucket_id as usize],
            empty_map,
        );

        let mut dict: FxHashMap<Vec<CompositeIntermediateKey>, IntermediateCompositeBucketEntry> =
            Default::default();
        dict.reserve(heap_map.size());
        let composite_data = agg_data.get_composite_req_data(self.accessor_idx);
        for (key_internal_repr, agg) in heap_map.into_iter() {
            let key = resolve_key(&key_internal_repr, composite_data)?;
            let mut sub_aggregation_res = IntermediateAggregationResults::default();
            if let Some(sub_agg) = &mut self.sub_agg {
                sub_agg
                    .get_sub_agg_collector()
                    .add_intermediate_aggregation_result(
                        agg_data,
                        &mut sub_aggregation_res,
                        agg.bucket_id,
                    )?;
            }

            dict.insert(
                key,
                IntermediateCompositeBucketEntry {
                    doc_count: agg.count,
                    sub_aggregation: sub_aggregation_res,
                },
            );
        }

        Ok(IntermediateCompositeBucketResult {
            entries: dict,
            target_size: composite_data.req.size,
            orders: composite_data
                .req
                .sources
                .iter()
                .map(|source| match source {
                    CompositeAggregationSource::Terms(t) => (t.order, t.missing_order),
                    CompositeAggregationSource::Histogram(h) => (h.order, h.missing_order),
                    CompositeAggregationSource::DateHistogram(d) => (d.order, d.missing_order),
                })
                .collect(),
        })
    }
}

/// Checks that the composite request at `accessor_idx` can be collected.
///
/// Returns `TantivyError::InvalidArgument` when the request has no source, a `size`
/// of zero, more than `MAX_DYN_ARRAY_SIZE` sources, or a source backed by a `bytes`
/// column.
fn validate_req(req_data: &mut AggregationsSegmentCtx, accessor_idx: usize) -> crate::Result<()> {
    let composite_data = req_data.get_composite_req_data(accessor_idx);

    if composite_data.req.sources.is_empty() {
        let message = "composite aggregation must have at least one source".to_string();
        return Err(TantivyError::InvalidArgument(message));
    }

    if composite_data.req.size == 0 {
        let message = "composite aggregation 'size' must be > 0".to_string();
        return Err(TantivyError::InvalidArgument(message));
    }

    let num_sources = composite_data.composite_accessors.len();
    if num_sources > MAX_DYN_ARRAY_SIZE {
        let message =
            format!("composite aggregation source supports maximum {MAX_DYN_ARRAY_SIZE} sources",);
        return Err(TantivyError::InvalidArgument(message));
    }

    let uses_bytes_column = composite_data
        .composite_accessors
        .iter()
        .flat_map(|source_accessors| source_accessors.accessors.iter())
        .any(|accessor| accessor.column_type == ColumnType::Bytes);
    if uses_bytes_column {
        let message = "composite aggregation does not support 'bytes' field type".to_string();
        return Err(TantivyError::InvalidArgument(message));
    }

    Ok(())
}

/// Records `doc_id` in the bucket identified by `key`, keeping at most
/// `limit_num_buckets` buckets in `buckets`.
///
/// When the map is full, a document for an unknown key is only recorded if the key
/// is lower than the current highest key; that highest bucket is then evicted to
/// make room. Otherwise the document is dropped.
fn collect_bucket_with_limit(
    doc_id: crate::DocId,
    limit_num_buckets: usize,
    buckets: &mut DynArrayHeapMap<InternalValueRepr, CompositeBucketCollector>,
    key: &[InternalValueRepr],
    sub_agg: &mut Option<CachedSubAggs<HighCardSubAggCache>>,
    bucket_id_provider: &mut BucketIdProvider,
) {
    // Counts the document and forwards it to the sub-aggregations of the bucket.
    let mut count_doc = |target: &mut CompositeBucketCollector| {
        target.count += 1;
        if let Some(cache) = sub_agg.as_mut() {
            cache.push(target.bucket_id, doc_id);
        }
    };

    let is_full = buckets.size() >= limit_num_buckets;
    if is_full {
        // A bucket that already exists can always be updated in place.
        if let Some(existing) = buckets.get_mut(key) {
            count_doc(existing);
            return;
        }

        // A new key only enters the top-k if it sorts before the current highest key.
        let enters_top_k = matches!(buckets.peek_highest(), Some(highest) if key < highest);
        if !enters_top_k {
            return;
        }
        buckets.evict_highest();
    }

    // Either there was room left or room has just been made by the eviction.
    let bucket = buckets.get_or_insert_with(key, || CompositeBucketCollector {
        count: 0,
        bucket_id: bucket_id_provider.next_bucket_id(),
    });
    count_doc(bucket);
}

/// Translates a composite key from its segment-specific internal representation
/// into its intermediate form.
///
/// The value at position `idx` of `internal_key` is resolved with the source and
/// the accessors found at the same position in `agg_data`. The first value that
/// fails to resolve aborts the conversion with its error.
fn resolve_key(
    internal_key: &[InternalValueRepr],
    agg_data: &CompositeAggReqData,
) -> crate::Result<Vec<CompositeIntermediateKey>> {
    let mut resolved = Vec::with_capacity(internal_key.len());
    for (idx, value) in internal_key.iter().copied().enumerate() {
        let source = &agg_data.req.sources[idx];
        let accessors = &agg_data.composite_accessors[idx].accessors;
        resolved.push(resolve_internal_value_repr(value, source, accessors)?);
    }
    Ok(resolved)
}

/// Resolves a single internal value into the intermediate key of its source.
///
/// Missing values become `CompositeIntermediateKey::Null`. Term values are resolved
/// through the accessor they were read from, histogram values are multiplied by the
/// source interval, and date histogram values are returned as `DateTime` keys.
fn resolve_internal_value_repr(
    internal_value_repr: InternalValueRepr,
    source: &CompositeAggregationSource,
    composite_accessors: &[CompositeAccessor],
) -> crate::Result<CompositeIntermediateKey> {
    // The order is needed to undo the bit flip applied for descending sources.
    let order = match source {
        CompositeAggregationSource::Terms(terms) => terms.order,
        CompositeAggregationSource::Histogram(histogram) => histogram.order,
        CompositeAggregationSource::DateHistogram(date_histogram) => date_histogram.order,
    };

    let (accessor_idx, raw) = match internal_value_repr.decode(order) {
        Some(decoded) => decoded,
        None => return Ok(CompositeIntermediateKey::Null),
    };

    match source {
        CompositeAggregationSource::Terms(_) => {
            let accessor = &composite_accessors[accessor_idx as usize];
            resolve_term(
                raw,
                &accessor.column_type,
                &accessor.str_dict_column,
                &accessor.column,
            )
        }
        CompositeAggregationSource::Histogram(histogram) => {
            let bucket_index = i64::from_u64(raw);
            Ok(CompositeIntermediateKey::F64(
                bucket_index as f64 * histogram.interval,
            ))
        }
        CompositeAggregationSource::DateHistogram(_) => {
            Ok(CompositeIntermediateKey::DateTime(i64::from_u64(raw)))
        }
    }
}

fn resolve_term(
    val: u64,
    column_type: &ColumnType,
    str_dict_column: &Option<StrColumn>,
    column: &Column,
) -> crate::Result<CompositeIntermediateKey> {
    let key = if *column_type == ColumnType::Str {
        let fallback_dict = Dictionary::empty();
        let term_dict = str_dict_column
            .as_ref()
            .map(|el| el.dictionary())
            .unwrap_or_else(|| &fallback_dict);

        let mut buffer = Vec::new();
        term_dict.ord_to_term(val, &mut buffer)?;
        CompositeIntermediateKey::Str(
            String::from_utf8(buffer.to_vec()).expect("could not convert to String"),
        )
    } else if *column_type == ColumnType::DateTime {
        let val = i64::from_u64(val);
        CompositeIntermediateKey::DateTime(val)
    } else if *column_type == ColumnType::Bool {
        let val = bool::from_u64(val);
        CompositeIntermediateKey::Bool(val)
    } else if *column_type == ColumnType::IpAddr {
        let compact_space_accessor = column
            .values
            .clone()
            .downcast_arc::<CompactSpaceU64Accessor>()
            .map_err(|_| {
                TantivyError::AggregationError(crate::aggregation::AggregationError::InternalError(
                    "Type mismatch: Could not downcast to CompactSpaceU64Accessor".to_string(),
                ))
            })?;
        let val: u128 = compact_space_accessor.compact_to_u128(val as u32);
        let val = Ipv6Addr::from_u128(val);
        CompositeIntermediateKey::IpAddr(val)
    } else if *column_type == ColumnType::U64 {
        CompositeIntermediateKey::U64(val)
    } else if *column_type == ColumnType::I64 {
        CompositeIntermediateKey::I64(i64::from_u64(val))
    } else {
        let val = f64::from_u64(val);
        let val: NumericalValue = val.into();

        match val.normalize() {
            NumericalValue::U64(val) => CompositeIntermediateKey::U64(val),
            NumericalValue::I64(val) => CompositeIntermediateKey::I64(val),
            NumericalValue::F64(val) => CompositeIntermediateKey::F64(val),
        }
    };
    Ok(key)
}

/// Walks through the Cartesian product of the values a document has for each of the
/// composite key sources.
///
/// Every resulting key tuple that is not pruned by the after key is passed to
/// `collect_bucket_with_limit`.
struct CompositeKeyVisitor<'a> {
    /// Document whose composite keys are being enumerated.
    doc_id: crate::DocId,
    /// Request data of the composite aggregation (sources, accessors, after key).
    composite_agg_data: &'a CompositeAggReqData,
    /// Bucket map of the parent bucket the document is collected into.
    buckets: &'a mut DynArrayHeapMap<InternalValueRepr, CompositeBucketCollector>,
    /// Sub-aggregation cache that receives the document for each bucket it lands in.
    sub_agg: &'a mut Option<CachedSubAggs<HighCardSubAggCache>>,
    /// Source of bucket ids for newly created buckets.
    bucket_id_provider: &'a mut BucketIdProvider,
    /// Key prefix built so far: one value per source level already visited.
    sub_level_values: SmallVec<[InternalValueRepr; MAX_DYN_ARRAY_SIZE]>,
}

impl CompositeKeyVisitor<'_> {
    /// Depth-first walk of the accessors to build the composite key combinations
    /// and update the buckets.
    ///
    /// `source_idx` is the current source index in the recursion.
    /// `is_on_after_key` tracks whether we still need to consider the after_key
    /// for pruning at this level and below.
    ///
    /// # Errors
    /// Propagates the errors of the calendar interval bucketing.
    ///
    /// # Panics
    /// Panics when a histogram or date histogram source is backed by a column of an
    /// unexpected type, or when the date histogram interval has not been precomputed.
    fn visit(&mut self, source_idx: usize, is_on_after_key: bool) -> crate::Result<()> {
        if source_idx == self.composite_agg_data.req.sources.len() {
            // A full key has been built. A key that still matches the after_key on
            // every level is not collected.
            if !is_on_after_key {
                collect_bucket_with_limit(
                    self.doc_id,
                    self.composite_agg_data.req.size as usize,
                    self.buckets,
                    &self.sub_level_values,
                    self.sub_agg,
                    self.bucket_id_provider,
                );
            }
            return Ok(());
        }

        let current_level_accessors = &self.composite_agg_data.composite_accessors[source_idx];
        let current_level_source = &self.composite_agg_data.req.sources[source_idx];
        // Stays true only if no accessor yields a value for this document.
        let mut missing = true;
        for (accessor_idx, accessor) in current_level_accessors.accessors.iter().enumerate() {
            let values = accessor.column.values_for_doc(self.doc_id);
            for value in values {
                missing = false;
                match current_level_source {
                    CompositeAggregationSource::Terms(_) => {
                        let precedes_after_key_type =
                            accessor_idx < current_level_accessors.after_key_accessor_idx;
                        if is_on_after_key && precedes_after_key_type {
                            // Values of this accessor sort before the after_key's
                            // accessor: skip its remaining values.
                            break;
                        }
                        let matches_after_key_type =
                            accessor_idx == current_level_accessors.after_key_accessor_idx;

                        if matches_after_key_type && is_on_after_key {
                            let should_skip = match current_level_source.order() {
                                Order::Asc => current_level_accessors.after_key.gt(value),
                                Order::Desc => current_level_accessors.after_key.lt(value),
                            };
                            if should_skip {
                                continue;
                            }
                        }
                        self.sub_level_values.push(InternalValueRepr::new_term(
                            value,
                            accessor_idx as u8,
                            current_level_source.order(),
                        ));
                        let still_on_after_key = matches_after_key_type
                            && current_level_accessors.after_key.equals(value);
                        self.visit(source_idx + 1, is_on_after_key && still_on_after_key)?;
                        self.sub_level_values.pop();
                    }
                    CompositeAggregationSource::Histogram(source) => {
                        let float_value = match accessor.column_type {
                            ColumnType::U64 => value as f64,
                            ColumnType::I64 => i64::from_u64(value) as f64,
                            ColumnType::DateTime => i64::from_u64(value) as f64 / 1_000_000.,
                            ColumnType::F64 => f64::from_u64(value),
                            _ => {
                                panic!(
                                    "unexpected type {:?}. This should not happen",
                                    accessor.column_type
                                )
                            }
                        };
                        let bucket_index = (float_value / source.interval).floor() as i64;
                        let bucket_value = i64::to_u64(bucket_index);
                        if is_on_after_key {
                            let should_skip = match current_level_source.order() {
                                Order::Asc => current_level_accessors.after_key.gt(bucket_value),
                                Order::Desc => current_level_accessors.after_key.lt(bucket_value),
                            };
                            if should_skip {
                                continue;
                            }
                        }
                        self.sub_level_values.push(InternalValueRepr::new_histogram(
                            bucket_value,
                            current_level_source.order(),
                        ));
                        let still_on_after_key =
                            current_level_accessors.after_key.equals(bucket_value);
                        self.visit(source_idx + 1, is_on_after_key && still_on_after_key)?;
                        self.sub_level_values.pop();
                    }
                    CompositeAggregationSource::DateHistogram(_) => {
                        let value_ns = match accessor.column_type {
                            ColumnType::DateTime => i64::from_u64(value),
                            _ => {
                                panic!(
                                    "unexpected type {:?}. This should not happen",
                                    accessor.column_type
                                )
                            }
                        };
                        let bucket_index = match accessor.date_histogram_interval {
                            PrecomputedDateInterval::FixedNanoseconds(fixed_interval_ns) => {
                                // Round down to the start of the interval. Truncating
                                // division rounds toward zero, which would put
                                // timestamps before the epoch into the bucket *after*
                                // the one that contains them. The subtraction saturates
                                // for timestamps within one interval of `i64::MIN`.
                                value_ns.saturating_sub(value_ns.rem_euclid(fixed_interval_ns))
                            }
                            PrecomputedDateInterval::Calendar(CalendarInterval::Year) => {
                                calendar_interval::try_year_bucket(value_ns)?
                            }
                            PrecomputedDateInterval::Calendar(CalendarInterval::Month) => {
                                calendar_interval::try_month_bucket(value_ns)?
                            }
                            PrecomputedDateInterval::Calendar(CalendarInterval::Week) => {
                                calendar_interval::week_bucket(value_ns)
                            }
                            PrecomputedDateInterval::NotApplicable => {
                                panic!("interval not precomputed for date histogram source")
                            }
                        };
                        let bucket_value = i64::to_u64(bucket_index);
                        if is_on_after_key {
                            let should_skip = match current_level_source.order() {
                                Order::Asc => current_level_accessors.after_key.gt(bucket_value),
                                Order::Desc => current_level_accessors.after_key.lt(bucket_value),
                            };
                            if should_skip {
                                continue;
                            }
                        }
                        self.sub_level_values.push(InternalValueRepr::new_histogram(
                            bucket_value,
                            current_level_source.order(),
                        ));
                        let still_on_after_key =
                            current_level_accessors.after_key.equals(bucket_value);
                        self.visit(source_idx + 1, is_on_after_key && still_on_after_key)?;
                        self.sub_level_values.pop();
                    }
                };
            }
        }
        // The document has no value for this source: it only contributes a key when
        // the source asks for a missing bucket.
        if missing && current_level_source.missing_bucket() {
            if is_on_after_key && current_level_accessors.skip_missing {
                return Ok(());
            }
            self.sub_level_values.push(InternalValueRepr::new_missing(
                current_level_source.order(),
                current_level_source.missing_order(),
            ));
            self.visit(
                source_idx + 1,
                is_on_after_key && current_level_accessors.is_after_key_explicit_missing,
            )?;
            self.sub_level_values.pop();
        }
        Ok(())
    }
}


================================================
FILE: src/aggregation/bucket/composite/map.rs
================================================
use std::collections::BinaryHeap;
use std::fmt::Debug;
use std::hash::Hash;

use rustc_hash::FxHashMap;
use smallvec::SmallVec;

use crate::TantivyError;

/// Map backed by a hash map for fast access and a binary heap to track the
/// highest key. The key is an array of fixed size S.
///
/// Both containers are kept in sync: a key is pushed onto the heap when it is first
/// inserted into the map, and evicting the highest key removes it from both.
#[derive(Clone, Debug)]
struct ArrayHeapMap<K: Ord, V, const S: usize> {
    /// Values indexed by their key.
    pub(crate) buckets: FxHashMap<[K; S], V>,
    /// Max-heap of the keys stored in `buckets`; its top is the next key to evict.
    pub(crate) heap: BinaryHeap<[K; S]>,
}

impl<K: Ord, V, const S: usize> Default for ArrayHeapMap<K, V, S> {
    /// Creates an empty map: no bucket and no key tracked by the heap.
    fn default() -> Self {
        let buckets = FxHashMap::default();
        let heap = BinaryHeap::default();
        Self { buckets, heap }
    }
}

impl<K: Eq + Hash + Clone + Ord, V, const S: usize> ArrayHeapMap<K, V, S> {
    /// Returns the value stored for `key`, inserting the result of `f` first if the
    /// key is new. A new key is also registered in the heap.
    ///
    /// Panics if the length of `key` is not S.
    fn get_or_insert_with<F: FnOnce() -> V>(&mut self, key: &[K], f: F) -> &mut V {
        let key_array: &[K; S] = key.try_into().expect("Key length mismatch");
        match self.buckets.entry(key_array.clone()) {
            std::collections::hash_map::Entry::Occupied(slot) => slot.into_mut(),
            std::collections::hash_map::Entry::Vacant(slot) => {
                // Track the key in the heap before building the value.
                self.heap.push(key_array.clone());
                slot.insert(f())
            }
        }
    }

    /// Returns the value stored for `key`, if any.
    ///
    /// Panics if the length of `key` is not S.
    fn get_mut(&mut self, key: &[K]) -> Option<&mut V> {
        let lookup_key: &[K; S] = key.try_into().expect("Key length mismatch");
        self.buckets.get_mut(lookup_key)
    }

    /// Returns the highest key currently tracked, or `None` if there is none.
    fn peek_highest(&self) -> Option<&[K]> {
        let top = self.heap.peek()?;
        Some(top.as_slice())
    }

    /// Removes the highest key and its value. Does nothing when the heap is empty.
    fn evict_highest(&mut self) {
        let Some(evicted_key) = self.heap.pop() else {
            return;
        };
        self.buckets.remove(&evicted_key);
    }

    /// Estimates the memory used, in bytes, from the capacities of the map and of
    /// the heap and the sizes of the key and value types.
    fn memory_consumption(&self) -> u64 {
        let key_bytes = std::mem::size_of::<[K; S]>();
        let value_bytes = std::mem::size_of::<V>();
        let map_bytes = (key_bytes + value_bytes) * self.buckets.capacity();
        let heap_bytes = key_bytes * self.heap.capacity();
        (map_bytes + heap_bytes) as u64
    }
}

impl<K: Copy + Ord + Clone + 'static, V: 'static, const S: usize> ArrayHeapMap<K, V, S> {
    /// Consumes the map and yields every `(key, value)` pair, the fixed-size key
    /// being copied into a `SmallVec`. The pairs come in the iteration order of the
    /// underlying hash map.
    fn into_iter(self) -> Box<dyn Iterator<Item = (SmallVec<[K; MAX_DYN_ARRAY_SIZE]>, V)>> {
        let entries = self
            .buckets
            .into_iter()
            .map(|(key_array, value)| (SmallVec::from_slice(key_array.as_slice()), value));
        Box::new(entries)
    }
}

/// Largest key size supported by [`DynArrayHeapMap`]; also the inline capacity of the
/// `SmallVec` keys yielded when iterating over a map.
pub(super) const MAX_DYN_ARRAY_SIZE: usize = 16;
// NOTE(review): not referenced in the visible part of this file; presumably used to
// reject key dimensions above the maximum — confirm against the rest of the file.
const MAX_DYN_ARRAY_SIZE_PLUS_ONE: usize = MAX_DYN_ARRAY_SIZE + 1;

/// A map optimized for memory footprint, fast access and efficient eviction of
/// the highest key.
///
/// Keys are inlined arrays of size 1 to [MAX_DYN_ARRAY_SIZE], but for a given
/// instance the key size is fixed. This avoids heap allocations for the keys.
///
/// The key size is chosen at construction time (see `try_new`); the wrapped enum
/// dispatches to the `ArrayHeapMap` of the matching size.
#[derive(Clone, Debug)]
pub(super) struct DynArrayHeapMap<K: Ord, V>(DynArrayHeapMapInner<K, V>);

/// Wrapper around ArrayHeapMap to dynamically dispatch on the array size.
///
/// There is one variant per supported key size, from 1 up to 16
/// (`MAX_DYN_ARRAY_SIZE`); `DimN` holds a map whose keys are arrays of length `N`.
#[derive(Clone, Debug)]
enum DynArrayHeapMapInner<K: Ord, V> {
    Dim1(ArrayHeapMap<K, V, 1>),
    Dim2(ArrayHeapMap<K, V, 2>),
    Dim3(ArrayHeapMap<K, V, 3>),
    Dim4(ArrayHeapMap<K, V, 4>),
    Dim5(ArrayHeapMap<K, V, 5>),
    Dim6(ArrayHeapMap<K, V, 6>),
    Dim7(ArrayHeapMap<K, V, 7>),
    Dim8(ArrayHeapMap<K, V, 8>),
    Dim9(ArrayHeapMap<K, V, 9>),
    Dim10(ArrayHeapMap<K, V, 10>),
    Dim11(ArrayHeapMap<K, V, 11>),
    Dim12(ArrayHeapMap<K, V, 12>),
    Dim13(ArrayHeapMap<K, V, 13>),
    Dim14(ArrayHeapMap<K, V, 14>),
    Dim15(ArrayHeapMap<K, V, 15>),
    Dim16(ArrayHeapMap<K, V, 16>),
}

impl<K: Ord, V> DynArrayHeapMap<K, V> {
    /// Creates a new heap map with dynamic array keys of size `key_dimension`.
    pub(super) fn try_new(key_dimension: usize) -> crate::Result<Self> {
        let inner = match key_dimension {
            0 => {
                return Err(TantivyError::InvalidArgument(
                    "DynArrayHeapMap dimension must be at least 1".to_string(),
                ))
            }
            1 => DynArrayHeapMapInner::Dim1(ArrayHeapMap::default()),
            2 => DynArrayHeapMapInner::Dim2(ArrayHeapMap::default()),
            3 => DynArrayHeapMapInner::Dim3(ArrayHeapMap::default()),
            4 => DynArrayHeapMapInner::Dim4(ArrayHeapMap::default()),
            5 => DynArrayHeapMapInner::Dim5(ArrayHeapMap::default()),
            6 => DynArrayHeapMapInner::Dim6(ArrayHeapMap::default()),
            7 => DynArrayHeapMapInner::Dim7(ArrayHeapMap::default()),
            8 => DynArrayHeapMapInner::Dim8(ArrayHeapMap::default()),
            9 => DynArrayHeapMapInner::Dim9(ArrayHeapMap::default()),
            10 => DynArrayHeapMapInner::Dim10(ArrayHeapMap::default()),
            11 => DynArrayHeapMapInner::Dim11(ArrayHeapMap::default()),
            12 => DynArrayHeapMapInner::Dim12(ArrayHeapMap::default()),
            13 => DynArrayHeapMapInner::Dim13(ArrayHeapMap::default()),
            14 => DynArrayHeapMapInner::Dim14(ArrayHeapMap::default()),
            15 => DynArrayHeapMapInner::Dim15(ArrayHeapMap::default()),
            16 => DynArrayHeapMapInner::Dim16(ArrayHeapMap::default()),
            MAX_DYN_ARRAY_SIZE_PLUS_ONE.. => {
                return Err(TantivyError::InvalidArgument(format!(
                    "DynArrayHeapMap supports maximum {MAX_DYN_ARRAY_SIZE} dimensions, got \
                     {key_dimension}",
                )))
            }
        };
        Ok(DynArrayHeapMap(inner))
    }

    /// Number of elements in the map. This is not the dimension of the keys.
    pub(super) fn size(&self) -> usize {
        match &self.0 {
            DynArrayHeapMapInner::Dim1(map) => map.buckets.len(),
            DynArrayHeapMapInner::Dim2(map) => map.buckets.len(),
            DynArrayHeapMapInner::Dim3(map) => map.buckets.len(),
            DynArrayHeapMapInner::Dim4(map) => map.buckets.len(),
            DynArrayHeapMapInner::Dim5(map) => map.buckets.len(),
            DynArrayHeapMapInner::Dim6(map) => map.buckets.len(),
            DynArrayHeapMapInner::Dim7(map) => map.buckets.len(),
            DynArrayHeapMapInner::Dim8(map) => map.buckets.len(),
            DynArrayHeapMapInner::Dim9(map) => map.buckets.len(),
            DynArrayHeapMapInner::Dim10(map) => map.buckets.len(),
            DynArrayHeapMapInner::Dim11(map) => map.buckets.len(),
            DynArrayHeapMapInner::Dim12(map) => map.buckets.len(),
            DynArrayHeapMapInner::Dim13(map) => map.buckets.len(),
            DynArrayHeapMapInner::Dim14(map) => map.buckets.len(),
            DynArrayHeapMapInner::Dim15(map) => map.buckets.len(),
            DynArrayHeapMapInner::Dim16(map) => map.buckets.len(),
        }
    }
}

impl<K: Ord + Hash + Clone, V> DynArrayHeapMap<K, V> {
    /// Get a mutable reference to the value corresponding to `key` or inserts a new
    /// value created by calling `f`.
    ///
    /// Panics if the length of `key` does not match the key dimension of the map.
    pub(super) fn get_or_insert_with<F: FnOnce() -> V>(&mut self, key: &[K], f: F) -> &mut V {
        match &mut self.0 {
            DynArrayHeapMapInner::Dim1(map) => map.get_or_insert_with(key, f),
            DynArrayHeapMapInner::Dim2(map) => map.get_or_insert_with(key, f),
            DynArrayHeapMapInner::Dim3(map) => map.get_or_insert_with(key, f),
            DynArrayHeapMapInner::Dim4(map) => map.get_or_insert_with(key, f),
            DynArrayHeapMapInner::Dim5(map) => map.get_or_insert_with(key, f),
            DynArrayHeapMapInner::Dim6(map) => map.get_or_insert_with(key, f),
            DynArrayHeapMapInner::Dim7(map) => map.get_or_insert_with(key, f),
            DynArrayHeapMapInner::Dim8(map) => map.get_or_insert_with(key, f),
            DynArrayHeapMapInner::Dim9(map) => map.get_or_insert_with(key, f),
            DynArrayHeapMapInner::Dim10(map) => map.get_or_insert_with(key, f),
            DynArrayHeapMapInner::Dim11(map) => map.get_or_insert_with(key, f),
            DynArrayHeapMapInner::Dim12(map) => map.get_or_insert_with(key, f),
            DynArrayHeapMapInner::Dim13(map) => map.get_or_insert_with(key, f),
            DynArrayHeapMapInner::Dim14(map) => map.get_or_insert_with(key, f),
            DynArrayHeapMapInner::Dim15(map) => map.get_or_insert_with(key, f),
            DynArrayHeapMapInner::Dim16(map) => map.get_or_insert_with(key, f),
        }
    }

    /// Returns a mutable reference to the value corresponding to `key`.
    ///
    /// Panics if the length of `key` does not match the key dimension of the map.
    pub fn get_mut(&mut self, key: &[K]) -> Option<&mut V> {
        match &mut self.0 {
            DynArrayHeapMapInner::Dim1(map) => map.get_mut(key),
            DynArrayHeapMapInner::Dim2(map) => map.get_mut(key),
            DynArrayHeapMapInner::Dim3(map) => map.get_mut(key),
            DynArrayHeapMapInner::Dim4(map) => map.get_mut(key),
            DynArrayHeapMapInner::Dim5(map) => map.get_mut(key),
            DynArrayHeapMapInner::Dim6(map) => map.get_mut(key),
            DynArrayHeapMapInner::Dim7(map) => map.get_mut(key),
            DynArrayHeapMapInner::Dim8(map) => map.get_mut(key),
            DynArrayHeapMapInner::Dim9(map) => map.get_mut(key),
            DynArrayHeapMapInner::Dim10(map) => map.get_mut(key),
            DynArrayHeapMapInner::Dim11(map) => map.get_mut(key),
            DynArrayHeapMapInner::Dim12(map) => map.get_mut(key),
            DynArrayHeapMapInner::Dim13(map) => map.get_mut(key),
            DynArrayHeapMapInner::Dim14(map) => map.get_mut(key),
            DynArrayHeapMapInner::Dim15(map) => map.get_mut(key),
            DynArrayHeapMapInner::Dim16(map) => map.get_mut(key),
        }
    }

    /// Returns a reference to the highest key in the map.
    pub(super) fn peek_highest(&self) -> Option<&[K]> {
        match &self.0 {
            DynArrayHeapMapInner::Dim1(map) => map.peek_highest(),
            DynArrayHeapMapInner::Dim2(map) => map.peek_highest(),
            DynArrayHeapMapInner::Dim3(map) => map.peek_highest(),
            DynArrayHeapMapInner::Dim4(map) => map.peek_highest(),
            DynArrayHeapMapInner::Dim5(map) => map.peek_highest(),
            DynArrayHeapMapInner::Dim6(map) => map.peek_highest(),
            DynArrayHeapMapInner::Dim7(map) => map.peek_highest(),
            DynArrayHeapMapInner::Dim8(map) => map.peek_highest(),
            DynArrayHeapMapInner::Dim9(map) => map.peek_highest(),
            DynArrayHeapMapInner::Dim10(map) => map.peek_highest(),
            DynArrayHeapMapInner::Dim11(map) => map.peek_highest(),
            DynArrayHeapMapInner::Dim12(map) => map.peek_highest(),
            DynArrayHeapMapInner::Dim13(map) => map.peek_highest(),
            DynArrayHeapMapInner::Dim14(map) => map.peek_highest(),
            DynArrayHeapMapInner::Dim15(map) => map.peek_highest(),
            DynArrayHeapMapInner::Dim16(map) => map.peek_highest(),
        }
    }

    /// Removes the entry with the highest key from the map.
    pub(super) fn evict_highest(&mut self) {
        match &mut self.0 {
            DynArrayHeapMapInner::Dim1(map) => map.evict_highest(),
            DynArrayHeapMapInner::Dim2(map) => map.evict_highest(),
            DynArrayHeapMapInner::Dim3(map) => map.evict_highest(),
            DynArrayHeapMapInner::Dim4(map) => map.evict_highest(),
            DynArrayHeapMapInner::Dim5(map) => map.evict_highest(),
            DynArrayHeapMapInner::Dim6(map) => map.evict_highest(),
            DynArrayHeapMapInner::Dim7(map) => map.evict_highest(),
            DynArrayHeapMapInner::Dim8(map) => map.evict_highest(),
            DynArrayHeapMapInner::Dim9(map) => map.evict_highest(),
            DynArrayHeapMapInner::Dim10(map) => map.evict_highest(),
            DynArrayHeapMapInner::Dim11(map) => map.evict_highest(),
            DynArrayHeapMapInner::Dim12(map) => map.evict_highest(),
            DynArrayHeapMapInner::Dim13(map) => map.evict_highest(),
            DynArrayHeapMapInner::Dim14(map) => map.evict_highest(),
            DynArrayHeapMapInner::Dim15(map) => map.evict_highest(),
            DynArrayHeapMapInner::Dim16(map) => map.evict_highest(),
        }
    }

    pub(crate) fn memory_consumption(&self) -> u64 {
        match &self.0 {
            DynArrayHeapMapInner::Dim1(map) => map.memory_consumption(),
            DynArrayHeapMapInner::Dim2(map) => map.memory_consumption(),
            DynArrayHeapMapInner::Dim3(map) => map.memory_consumption(),
            DynArrayHeapMapInner::Dim4(map) => map.memory_consumption(),
            DynArrayHeapMapInner::Dim5(map) => map.memory_consumption(),
            DynArrayHeapMapInner::Dim6(map) => map.memory_consumption(),
            DynArrayHeapMapInner::Dim7(map) => map.memory_consumption(),
            DynArrayHeapMapInner::Dim8(map) => map.memory_consumption(),
            DynArrayHeapMapInner::Dim9(map) => map.memory_consumption(),
            DynArrayHeapMapInner::Dim10(map) => map.memory_consumption(),
            DynArrayHeapMapInner::Dim11(map) => map.memory_consumption(),
            DynArrayHeapMapInner::Dim12(map) => map.memory_consumption(),
            DynArrayHeapMapInner::Dim13(map) => map.memory_consumption(),
            DynArrayHeapMapInner::Dim14(map) => map.memory_consumption(),
            DynArrayHeapMapInner::Dim15(map) => map.memory_consumption(),
            DynArrayHeapMapInner::Dim16(map) => map.memory_consumption(),
        }
    }
}

impl<K: Ord + Clone + Copy + 'static, V: 'static> DynArrayHeapMap<K, V> {
    /// Turns this map into an iterator over key-value pairs.
    pub fn into_iter(self) -> impl Iterator<Item = (SmallVec<[K; MAX_DYN_ARRAY_SIZE]>, V)> {
        match self.0 {
            DynArrayHeapMapInner::Dim1(map) => map.into_iter(),
            DynArrayHeapMapInner::Dim2(map) => map.into_iter(),
            DynArrayHeapMapInner::Dim3(map) => map.into_iter(),
            DynArrayHeapMapInner::Dim4(map) => map.into_iter(),
            DynArrayHeapMapInner::Dim5(map) => map.into_iter(),
            DynArrayHeapMapInner::Dim6(map) => map.into_iter(),
            DynArrayHeapMapInner::Dim7(map) => map.into_iter(),
            DynArrayHeapMapInner::Dim8(map) => map.into_iter(),
            DynArrayHeapMapInner::Dim9(map) => map.into_iter(),
            DynArrayHeapMapInner::Dim10(map) => map.into_iter(),
            DynArrayHeapMapInner::Dim11(map) => map.into_iter(),
            DynArrayHeapMapInner::Dim12(map) => map.into_iter(),
            DynArrayHeapMapInner::Dim13(map) => map.into_iter(),
            DynArrayHeapMapInner::Dim14(map) => map.into_iter(),
            DynArrayHeapMapInner::Dim15(map) => map.into_iter(),
            DynArrayHeapMapInner::Dim16(map) => map.into_iter(),
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Exercises insertion, highest-key eviction and consumption of a
    /// two-dimensional map.
    #[test]
    fn test_dyn_array_heap_map() {
        let low_key = [1u32, 2u32];
        let high_key = [2u32, 1u32];
        let mut heap_map = DynArrayHeapMap::<u32, &str>::try_new(2).unwrap();

        // Two distinct keys yield two entries.
        heap_map.get_or_insert_with(&low_key, || "a");
        heap_map.get_or_insert_with(&high_key, || "b");
        assert_eq!(heap_map.size(), 2);

        // `[2, 1]` compares greater than `[1, 2]`, so it is evicted first.
        assert_eq!(heap_map.peek_highest(), Some(high_key.as_slice()));
        heap_map.evict_highest();
        assert_eq!(heap_map.size(), 1);
        assert_eq!(heap_map.peek_highest(), Some(low_key.as_slice()));

        // Only the surviving entry is left once the map is consumed.
        let mut remaining = heap_map.into_iter();
        let (key, value) = remaining.next().unwrap();
        assert_eq!(key.as_slice(), &low_key);
        assert_eq!(value, "a");
        assert_eq!(remaining.next(), None);
    }
}


================================================
FILE: src/aggregation/bucket/composite/mod.rs
================================================
mod accessors;
mod calendar_interval;
mod collector;
mod map;
mod numeric_types;

use core::panic;
use std::cmp::Ordering;
use std::fmt::Debug;
use std::net::{AddrParseError, IpAddr};
use std::str::FromStr;

use columnar::ColumnType;
use rustc_hash::FxHashMap;
use serde::{Deserialize, Serialize};

use crate::aggregation::agg_result::CompositeKey;
pub use crate::aggregation::bucket::composite::accessors::{
    CompositeAccessor, CompositeAggReqData, CompositeSourceAccessors, PrecomputedDateInterval,
};
pub use crate::aggregation::bucket::composite::collector::SegmentCompositeCollector;
use crate::aggregation::bucket::composite::numeric_types::num_cmp::{
    cmp_i64_f64, cmp_i64_u64, cmp_u64_f64,
};
use crate::aggregation::bucket::Order;
use crate::aggregation::deserialize_f64;
use crate::aggregation::intermediate_agg_result::CompositeIntermediateKey;
use crate::schema::IntoIpv6Addr;
use crate::TantivyError;

/// Position of missing keys in the ordering.
///
/// Serialized in lowercase (`"default"`, `"first"`, `"last"`).
#[derive(Clone, Copy, Debug, PartialEq, Serialize, Deserialize, Default)]
#[serde(rename_all = "lowercase")]
pub enum MissingOrder {
    /// Missing keys appear first in ascending order, last in descending order.
    #[default]
    Default,
    /// Missing keys should appear first.
    First,
    /// Missing keys should appear last.
    Last,
}

/// Serde default for the `order` field of the composite sources: ascending.
fn agg_source_default_order() -> Order {
    Order::Asc
}

/// Term source for a composite aggregation.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct TermCompositeAggregationSource {
    /// The name used to refer to this source in the composite key.
    ///
    /// Skipped by serde: when a `CompositeAggregation` is deserialized, the
    /// name is taken from the key of the map entry wrapping this source.
    #[serde(skip)]
    pub name: String,
    /// The field to aggregate on.
    pub field: String,
    /// The order for this source. Defaults to ascending.
    #[serde(default = "agg_source_default_order")]
    pub order: Order,
    /// Whether to create a `null` bucket for documents without value for this
    /// field. By default documents without a value are ignored.
    #[serde(default)]
    pub missing_bucket: bool,
    /// Whether missing keys should appear first or last.
    #[serde(default)]
    pub missing_order: MissingOrder,
}

/// Histogram source for a composite aggregation.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct HistogramCompositeAggregationSource {
    /// The name used to refer to this source in the composite key.
    ///
    /// Skipped by serde: when a `CompositeAggregation` is deserialized, the
    /// name is taken from the key of the map entry wrapping this source.
    #[serde(skip)]
    pub name: String,
    /// The field to aggregate on.
    pub field: String,
    /// The interval for the histogram. For datetime fields, this is expressed
    /// in milliseconds.
    #[serde(deserialize_with = "deserialize_f64")]
    pub interval: f64,
    /// The order for this source. Defaults to ascending.
    #[serde(default = "agg_source_default_order")]
    pub order: Order,
    /// Whether to create a `null` bucket for documents without value for this
    /// field. By default documents without a value are ignored.
    #[serde(default)]
    pub missing_bucket: bool,
    /// Whether missing keys should appear first or last.
    #[serde(default)]
    pub missing_order: MissingOrder,
}

/// Calendar intervals supported for date histogram sources.
///
/// Serialized in lowercase (`"year"`, `"month"`, `"week"`).
#[derive(Clone, Copy, Debug, PartialEq, Serialize, Deserialize)]
#[serde(rename_all = "lowercase")]
pub enum CalendarInterval {
    /// A year between Jan 1st and Dec 31st, taking into account leap years.
    Year,
    /// A month between the 1st and the last day of the month.
    Month,
    /// A week between Monday and Sunday.
    Week,
}

/// Date histogram source for a composite aggregation.
///
/// Time zones are not supported yet. Every interval is aligned on UTC.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct DateHistogramCompositeAggregationSource {
    /// The name used to refer to this source in the composite key.
    ///
    /// Skipped by serde: when a `CompositeAggregation` is deserialized, the
    /// name is taken from the key of the map entry wrapping this source.
    #[serde(skip)]
    pub name: String,
    /// The field to aggregate on.
    pub field: String,
    /// The fixed interval for the histogram. Either this or
    /// `calendar_interval` must be set.
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub fixed_interval: Option<String>,
    /// The calendar adjusted interval for the histogram. Either this or
    /// `fixed_interval` must be set.
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub calendar_interval: Option<CalendarInterval>,
    /// The order for this source. Defaults to ascending.
    #[serde(default = "agg_source_default_order")]
    pub order: Order,
    /// Whether to create a `null` bucket for documents without value for this
    /// field. By default documents without a value are ignored. Not supported
    /// in Elasticsearch.
    #[serde(default)]
    pub missing_bucket: bool,
    /// Whether missing keys should appear first or last.
    #[serde(default)]
    pub missing_order: MissingOrder,
}

/// Source for the composite aggregation. A composite aggregation can have
/// multiple sources.
///
/// Variants are tagged in snake case when serialized (`terms`, `histogram`,
/// `date_histogram`).
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum CompositeAggregationSource {
    /// Terms source.
    Terms(TermCompositeAggregationSource),
    /// Histogram source.
    Histogram(HistogramCompositeAggregationSource),
    /// Date histogram source.
    DateHistogram(DateHistogramCompositeAggregationSource),
}

impl CompositeAggregationSource {
    pub(crate) fn field(&self) -> &str {
        match self {
            CompositeAggregationSource::Terms(source) => &source.field,
            CompositeAggregationSource::Histogram(source) => &source.field,
            CompositeAggregationSource::DateHistogram(source) => &source.field,
        }
    }

    pub(crate) fn name(&self) -> &str {
        match self {
            CompositeAggregationSource::Terms(source) => &source.name,
            CompositeAggregationSource::Histogram(source) => &source.name,
            CompositeAggregationSource::DateHistogram(source) => &source.name,
        }
    }

    pub(crate) fn order(&self) -> Order {
        match self {
            CompositeAggregationSource::Terms(source) => source.order,
            CompositeAggregationSource::Histogram(source) => source.order,
            CompositeAggregationSource::DateHistogram(source) => source.order,
        }
    }

    pub(crate) fn missing_order(&self) -> MissingOrder {
        match self {
            CompositeAggregationSource::Terms(source) => source.missing_order,
            CompositeAggregationSource::Histogram(source) => source.missing_order,
            CompositeAggregationSource::DateHistogram(source) => source.missing_order,
        }
    }

    pub(crate) fn missing_bucket(&self) -> bool {
        match self {
            CompositeAggregationSource::Terms(source) => source.missing_bucket,
            CompositeAggregationSource::Histogram(source) => source.missing_bucket,
            CompositeAggregationSource::DateHistogram(source) => source.missing_bucket,
        }
    }
}

/// A paginable aggregation that performs on multiple dimensions (sources),
/// potentially mixing term and range queries.
///
/// Pagination is made possible because the buckets are ordered by the composite
/// key, so the next page can be fetched "efficiently" by filtering using range
/// queries on the key dimensions.
///
/// Serialization and deserialization go through `CompositeAggregationSerde`.
#[derive(Clone, Debug, Default, PartialEq, Serialize, Deserialize)]
#[serde(
    try_from = "CompositeAggregationSerde",
    into = "CompositeAggregationSerde"
)]
pub struct CompositeAggregation {
    /// The fields and bucketing strategies.
    pub sources: Vec<CompositeAggregationSource>,
    /// Number of buckets to return (page size).
    pub size: u32,
    /// The key of the previous page's last bucket, indexed by source name.
    /// Empty when requesting the first page.
    pub after: FxHashMap<String, AfterKey>,
}

/// Serde-facing representation of `CompositeAggregation`.
///
/// Each element of `sources` is a map from the source name to the source
/// definition. Conversion into `CompositeAggregation` requires every such map
/// to hold exactly one entry.
#[derive(Serialize, Deserialize)]
struct CompositeAggregationSerde {
    sources: Vec<FxHashMap<String, CompositeAggregationSource>>,
    size: u32,
    // Omitted from the serialized form when empty; defaults to empty when absent.
    #[serde(default, skip_serializing_if = "FxHashMap::is_empty")]
    after: FxHashMap<String, AfterKey>,
}

impl TryFrom<CompositeAggregationSerde> for CompositeAggregation {
    type Error = TantivyError;

    fn try_from(value: CompositeAggregationSerde) -> Result<Self, Self::Error> {
        let mut sources = Vec::with_capacity(value.sources.len());
        for map in value.sources {
            if map.len() != 1 {
                return Err(TantivyError::InvalidArgument(
                    "each composite source must have exactly one named entry".to_string(),
                ));
            }
            let (name, mut source) = map.into_iter().next().unwrap();
            match &mut source {
                CompositeAggregationSource::Terms(source) => {
                    source.name = name;
                }
                CompositeAggregationSource::Histogram(source) => {
                    source.name = name;
                }
                CompositeAggregationSource::DateHistogram(source) => {
                    source.name = name;
                }
            }
            sources.push(source);
        }
        Ok(CompositeAggregation {
            sources,
            size: value.size,
            after: value.after,
        })
    }
}

impl From<CompositeAggregation> for CompositeAggregationSerde {
    /// Wraps every source in a single-entry map keyed by the source name, which
    /// is the shape used by the serialized form.
    fn from(value: CompositeAggregation) -> Self {
        let sources = value
            .sources
            .into_iter()
            .map(|source| {
                // The `name` field is `#[serde(skip)]`, so it is not serialized
                // inside the value; it is carried by the map key instead.
                let name = source.name().to_string();
                let mut named_source = FxHashMap::default();
                named_source.insert(name, source);
                named_source
            })
            .collect();

        CompositeAggregationSerde {
            sources,
            size: value.size,
            after: value.after,
        }
    }
}

/// Key used to decide the order in which multi-type terms should be paginated.
///
/// The derived ordering follows the declaration order:
/// `Bool < Str < Numeric < IpAddr < DateTime`.
#[derive(Ord, PartialOrd, PartialEq, Eq)]
enum ColumnPaginationOrder {
    Bool = 1,
    Str = 2,
    Numeric = 3,
    IpAddr = 4,
    DateTime = 5,
}

/// Maps a typed value (or a column type) to the `ColumnPaginationOrder` of its
/// type.
trait ToTypePaginationOrder {
    /// Returns the pagination order key for the current type related variant.
    ///
    /// Panics if called on a variant representing null. Null values must be
    /// handled separately.
    fn column_pagination_order(&self) -> ColumnPaginationOrder;
}

impl ToTypePaginationOrder for ColumnType {
    fn column_pagination_order(&self) -> ColumnPaginationOrder {
        match self {
            ColumnType::Bool => ColumnPaginationOrder::Bool,
            ColumnType::Str => ColumnPaginationOrder::Str,
            ColumnType::F64 | ColumnType::I64 | ColumnType::U64 => ColumnPaginationOrder::Numeric,
            ColumnType::IpAddr => ColumnPaginationOrder::IpAddr,
            ColumnType::DateTime => ColumnPaginationOrder::DateTime,
            ColumnType::Bytes => panic!("unsupported"),
        }
    }
}

impl ToTypePaginationOrder for CompositeIntermediateKey {
    fn column_pagination_order(&self) -> ColumnPaginationOrder {
        match self {
            CompositeIntermediateKey::Bool(_) => ColumnPaginationOrder::Bool,
            CompositeIntermediateKey::Str(_) => ColumnPaginationOrder::Str,
            CompositeIntermediateKey::F64(_)
            | CompositeIntermediateKey::I64(_)
            | CompositeIntermediateKey::U64(_) => ColumnPaginationOrder::Numeric,
            CompositeIntermediateKey::IpAddr(_) => ColumnPaginationOrder::IpAddr,
            CompositeIntermediateKey::DateTime(_) => ColumnPaginationOrder::DateTime,
            CompositeIntermediateKey::Null => panic!("null must be handled separately"),
        }
    }
}

impl ToTypePaginationOrder for CompositeKey {
    fn column_pagination_order(&self) -> ColumnPaginationOrder {
        match self {
            CompositeKey::Bool(_) => ColumnPaginationOrder::Bool,
            CompositeKey::Str(_) => ColumnPaginationOrder::Str,
            CompositeKey::F64(_) | CompositeKey::I64(_) | CompositeKey::U64(_) => {
                ColumnPaginationOrder::Numeric
            }
            CompositeKey::Null => panic!("null must be handled separately"),
        }
    }
}

/// Wrapper around [`CompositeIntermediateKey`] used for the `after`
/// (pagination) key of a composite aggregation.
///
/// It serializes to, and deserializes from, a string of the form
/// `"<type>:<value>"`, where `<type>` is one of `bool`, `str`, `i64`, `u64`,
/// `f64`, `ip`, `dt` or `null`.
#[derive(Clone, Debug, PartialEq)]
pub struct AfterKey(pub CompositeIntermediateKey);

impl Serialize for AfterKey {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: serde::Serializer {
        let s = match &self.0 {
            CompositeIntermediateKey::Bool(b) => format!("bool:{}", b),
            CompositeIntermediateKey::Str(s) => format!("str:{}", s),
            CompositeIntermediateKey::I64(i) => format!("i64:{}", i),
            CompositeIntermediateKey::U64(u) => format!("u64:{}", u),
            CompositeIntermediateKey::F64(f) => format!("f64:{}", f),
            CompositeIntermediateKey::IpAddr(ip) => format!("ip:{}", ip),
            CompositeIntermediateKey::DateTime(dt) => format!("dt:{}", dt),
            CompositeIntermediateKey::Null => "null:".to_string(),
        };
        serializer.serialize_str(&s)
    }
}

impl<'de> Deserialize<'de> for AfterKey {
    /// Parses an after key from its `"<type>:<value>"` string encoding.
    ///
    /// The string is split at the first `:` only, so the value part may itself
    /// contain colons (IPv6 addresses, arbitrary strings).
    ///
    /// Fails with a custom serde error when the separator is missing, the type
    /// tag is unknown, the value does not parse as the tagged type, or an
    /// `f64` value is NaN.
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: serde::Deserializer<'de> {
        let encoded = String::deserialize(deserializer)?;
        // `split_once` borrows both halves directly instead of collecting a
        // `splitn` iterator into a `Vec` and indexing into it.
        let Some((type_tag, raw_value)) = encoded.split_once(':') else {
            return Err(serde::de::Error::custom("invalid after key format"));
        };

        let key = match type_tag {
            "bool" => {
                let b = raw_value.parse::<bool>().map_err(|e| {
                    serde::de::Error::custom(format!("failed to parse bool: {}", e))
                })?;
                CompositeIntermediateKey::Bool(b)
            }
            "str" => CompositeIntermediateKey::Str(raw_value.to_string()),
            "i64" => {
                let i = raw_value
                    .parse::<i64>()
                    .map_err(|e| serde::de::Error::custom(format!("failed to parse i64: {}", e)))?;
                CompositeIntermediateKey::I64(i)
            }
            "u64" => {
                let u = raw_value
                    .parse::<u64>()
                    .map_err(|e| serde::de::Error::custom(format!("failed to parse u64: {}", e)))?;
                CompositeIntermediateKey::U64(u)
            }
            "f64" => {
                let f = raw_value
                    .parse::<f64>()
                    .map_err(|e| serde::de::Error::custom(format!("failed to parse f64: {}", e)))?;
                // NaN is rejected explicitly.
                if f.is_nan() {
                    return Err(serde::de::Error::custom(
                        "NaN is not supported in after key",
                    ));
                }
                CompositeIntermediateKey::F64(f)
            }
            "ip" => {
                let ip = IpAddr::from_str(raw_value).map_err(|e: AddrParseError| {
                    serde::de::Error::custom(format!("failed to parse ip: {}", e))
                })?;
                // IPv4 and IPv6 inputs are both converted with `into_ipv6_addr`.
                CompositeIntermediateKey::IpAddr(ip.into_ipv6_addr())
            }
            "dt" => {
                let dt = raw_value.parse::<i64>().map_err(|e| {
                    serde::de::Error::custom(format!("failed to parse datetime: {}", e))
                })?;
                CompositeIntermediateKey::DateTime(dt)
            }
            // The value part is ignored for null keys.
            "null" => CompositeIntermediateKey::Null,
            _ => {
                return Err(serde::de::Error::custom("invalid after key type"));
            }
        };

        Ok(AfterKey(key))
    }
}

impl From<CompositeIntermediateKey> for AfterKey {
    fn from(key: CompositeIntermediateKey) -> Self {
        AfterKey(key)
    }
}

impl From<AfterKey> for CompositeIntermediateKey {
    fn from(value: AfterKey) -> Self {
        value.0
    }
}

/// Calculates the ordering between two intermediate keys.
///
/// The comparison is evaluated in ascending terms and then reversed when `order`
/// is [`Order::Desc`]. The exception is a null key compared with a non-null key
/// while `missing_order` is `First` or `Last`: the position of the null key is
/// then fixed and `order` is not applied.
///
/// Keys of the same type use their natural ordering, numeric keys of different
/// types go through the `cmp_*` helpers, and every remaining type combination
/// is ordered by `column_pagination_order()`.
///
/// # Errors
///
/// Returns [`TantivyError::InvalidArgument`] when both keys are `F64` and either
/// of them is NaN. Errors reported by the integer/float comparison helpers are
/// propagated.
pub fn composite_intermediate_key_ordering(
    left_opt: &CompositeIntermediateKey,
    right_opt: &CompositeIntermediateKey,
    order: Order,
    missing_order: MissingOrder,
) -> crate::Result<Ordering> {
    use CompositeIntermediateKey as CIKey;

    // An explicit `First`/`Last` pins the null key regardless of `order`.
    let null_is_pinned = missing_order != MissingOrder::Default;
    // Ascending ordering of a null key (left) against a non-null key (right).
    let null_vs_value = match missing_order {
        MissingOrder::Last => Ordering::Greater,
        MissingOrder::First | MissingOrder::Default => Ordering::Less,
    };

    let asc_ordering = match (left_opt, right_opt) {
        // null comparisons
        (CIKey::Null, CIKey::Null) => Ordering::Equal,
        (CIKey::Null, _) if null_is_pinned => return Ok(null_vs_value),
        (_, CIKey::Null) if null_is_pinned => return Ok(null_vs_value.reverse()),
        (CIKey::Null, _) => null_vs_value,
        (_, CIKey::Null) => null_vs_value.reverse(),
        // same type comparisons
        (CIKey::Bool(lhs), CIKey::Bool(rhs)) => lhs.cmp(rhs),
        (CIKey::I64(lhs), CIKey::I64(rhs)) => lhs.cmp(rhs),
        (CIKey::Str(lhs), CIKey::Str(rhs)) => lhs.cmp(rhs),
        (CIKey::IpAddr(lhs), CIKey::IpAddr(rhs)) => lhs.cmp(rhs),
        (CIKey::DateTime(lhs), CIKey::DateTime(rhs)) => lhs.cmp(rhs),
        (CIKey::U64(lhs), CIKey::U64(rhs)) => lhs.cmp(rhs),
        (CIKey::F64(lhs), CIKey::F64(rhs)) => {
            if lhs.is_nan() || rhs.is_nan() {
                return Err(TantivyError::InvalidArgument(
                    "NaN comparison is not supported".to_string(),
                ));
            }
            lhs.partial_cmp(rhs).unwrap_or(Ordering::Equal)
        }
        // numeric cross-type comparisons; the helpers take the integer first, so
        // the result is reversed when the integer is the right-hand key
        (CIKey::F64(lhs), CIKey::I64(rhs)) => cmp_i64_f64(*rhs, *lhs)?.reverse(),
        (CIKey::F64(lhs), CIKey::U64(rhs)) => cmp_u64_f64(*rhs, *lhs)?.reverse(),
        (CIKey::I64(lhs), CIKey::F64(rhs)) => cmp_i64_f64(*lhs, *rhs)?,
        (CIKey::I64(lhs), CIKey::U64(rhs)) => cmp_i64_u64(*lhs, *rhs),
        (CIKey::U64(lhs), CIKey::I64(rhs)) => cmp_i64_u64(*rhs, *lhs).reverse(),
        (CIKey::U64(lhs), CIKey::F64(rhs)) => cmp_u64_f64(*lhs, *rhs)?,
        // other cross-type comparisons
        (lhs, rhs) => lhs
            .column_pagination_order()
            .cmp(&rhs.column_pagination_order()),
    };

    Ok(if order == Order::Desc {
        asc_ordering.reverse()
    } else {
        asc_ordering
    })
}

#[cfg(test)]
mod tests {
    use std::net::{Ipv4Addr, Ipv6Addr};

    use serde_json::json;
    use time::format_description::well_known::Rfc3339;
    use time::OffsetDateTime;

    use crate::aggregation::agg_req::Aggregations;
    use crate::aggregation::tests::exec_request;
    use crate::schema::{Schema, FAST, STRING};
    use crate::Index;

    /// Parses an RFC 3339 date string into a `common::DateTime`.
    ///
    /// # Panics
    ///
    /// Panics if `date_str` is not valid RFC 3339, or if the nanosecond timestamp
    /// does not fit in an `i64`.
    fn datetime_from_iso_str(date_str: &str) -> common::DateTime {
        // The panic message is only built on failure and matches what
        // `expect` would have printed.
        let dt = OffsetDateTime::parse(date_str, &Rfc3339)
            .unwrap_or_else(|err| panic!("Failed to parse date: {}: {:?}", date_str, err));
        // `unix_timestamp_nanos` yields an `i128`; convert with a range check
        // instead of a silently truncating cast.
        let timestamp_nanos = i64::try_from(dt.unix_timestamp_nanos())
            .expect("nanosecond timestamp does not fit in i64");
        common::DateTime::from_timestamp_nanos(timestamp_nanos)
    }

    /// Parses an RFC 3339 date string and returns its Unix timestamp in
    /// milliseconds (nanosecond timestamp divided by 1_000_000).
    ///
    /// # Panics
    ///
    /// Panics if `date_str` is not valid RFC 3339, or if the millisecond
    /// timestamp does not fit in an `i64`.
    fn ms_timestamp_from_iso_str(date_str: &str) -> i64 {
        // The panic message is only built on failure and matches what
        // `expect` would have printed.
        let dt = OffsetDateTime::parse(date_str, &Rfc3339)
            .unwrap_or_else(|err| panic!("Failed to parse date: {}: {:?}", date_str, err));
        // Range-checked conversion from `i128` rather than a truncating cast.
        i64::try_from(dt.unix_timestamp_nanos() / 1_000_000)
            .expect("millisecond timestamp does not fit in i64")
    }

    /// Runs the composite aggregation and compares the returned buckets to the
    /// expected buckets, for every page size from 1 up to the number of expected
    /// buckets. For each page size, all pages are walked by feeding the
    /// `after_key` of one response into the `after` of the next request.
    ///
    /// `composite_agg_sources` is used as the `sources` of the composite
    /// aggregation and `expected_buckets` must be a JSON array holding the full,
    /// ordered list of buckets.
    ///
    /// # Panics
    ///
    /// Panics if `expected_buckets` is not an array, if a request fails to
    /// deserialize or execute, or if any page differs from the expectation.
    fn exec_and_assert_all_paginations(
        index: &Index,
        composite_agg_sources: serde_json::Value,
        expected_buckets: serde_json::Value,
    ) {
        let expected_buckets_vec = expected_buckets.as_array().unwrap();

        for page_size in 1..=expected_buckets_vec.len() {
            // `chunks` yields exactly the expected pages, the last one possibly
            // shorter than `page_size`.
            let expected_pages = expected_buckets_vec.chunks(page_size);
            let page_count = expected_pages.len();
            let mut after_key = None;
            for (page_idx, expected_page_buckets) in expected_pages.enumerate() {
                let mut agg_req_json = json!({
                    "my_composite": {
                        "composite": {
                            "sources": composite_agg_sources,
                            "size": page_size,
                        }
                    }
                });
                // Set on every page but the first one.
                if let Some(after) = after_key.take() {
                    agg_req_json["my_composite"]["composite"]["after"] = after;
                }
                let agg_req: Aggregations = serde_json::from_value(agg_req_json).unwrap();
                let res = exec_request(agg_req.clone(), index).unwrap();
                assert_eq!(
                    &res["my_composite"]["buckets"],
                    &json!(expected_page_buckets),
                    "pagination failed at page {}, size {}, query: {:?}",
                    page_idx,
                    page_size,
                    agg_req,
                );
                if page_idx + 1 < page_count {
                    assert!(
                        res["my_composite"].get("after_key").is_some(),
                        "expected after_key on all but last page"
                    );
                    after_key = Some(res["my_composite"]["after_key"].clone());
                } else if res["my_composite"].get("after_key").is_some() {
                    // Currently we sometimes get an after_key on the last page;
                    // check that the next "page" is empty.
                    let agg_req_json = json!({
                        "my_composite": {
                            "composite": {
                                "sources": composite_agg_sources,
                                "size": page_size,
                                "after": res["my_composite"]["after_key"].clone(),
                            }
                        }
                    });
                    let agg_req: Aggregations = serde_json::from_value(agg_req_json).unwrap();
                    let res = exec_request(agg_req.clone(), index).unwrap();
                    assert_eq!(
                        res["my_composite"]["buckets"],
                        json!([]),
                        "expected no buckets when using after_key from last page, query: {:?}",
                        agg_req
                    );
                }
            }
        }
    }

    /// Indexes eight single-term documents over two commits and checks that a
    /// composite aggregation with one `terms` source returns the per-term
    /// document counts in ascending term order.
    ///
    /// When `merge_segments` is true, the writer's merging threads are awaited
    /// before the query runs.
    fn composite_aggregation_test(merge_segments: bool) -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let string_field = schema_builder.add_text_field("string_id", STRING | FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            // One inner array per commit.
            let terms_per_commit = [
                ["terma", "termb", "termc", "terma"],
                ["terma", "terma", "termb", "terma"],
            ];
            for terms in terms_per_commit {
                for term in terms {
                    writer.add_document(doc!(string_field => term))?;
                }
                writer.commit()?;
            }
            // NOTE(review): this only waits for merges that were scheduled; confirm
            // that it actually results in a single segment.
            if merge_segments {
                writer.wait_merging_threads()?;
            }
        }

        let request_json = json!({
            "my_composite": {
                "composite": {
                    "sources": [
                        {"term1": {"terms": {"field": "string_id"}}}
                    ],
                    "size": 10
                }
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request_json).unwrap();

        let response = exec_request(agg_req, &index)?;

        assert_eq!(
            &response["my_composite"]["buckets"],
            &json!([
                {"key": {"term1": "terma"}, "doc_count": 5},
                {"key": {"term1": "termb"}, "doc_count": 2},
                {"key": {"term1": "termc"}, "doc_count": 1}
            ])
        );

        Ok(())
    }

    /// Runs `composite_aggregation_test` with `merge_segments = true`.
    #[test]
    fn composite_aggregation_term_single_segment() -> crate::Result<()> {
        composite_aggregation_test(true)
    }

    /// Runs `composite_aggregation_test` with `merge_segments = false`, i.e.
    /// without waiting on the merging threads after the two commits.
    #[test]
    fn composite_aggregation_term_multi_segment() -> crate::Result<()> {
        composite_aggregation_test(false)
    }

    /// Indexes five distinct terms over two commits and checks that a composite
    /// aggregation with `size: 3` returns the first three buckets, and that the
    /// follow-up request using the returned `after_key` yields the remaining two
    /// buckets without an `after_key`.
    ///
    /// When `merge_segments` is true, the writer's merging threads are awaited
    /// before the queries run.
    fn composite_aggregation_term_size_limit(merge_segments: bool) -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let string_field = schema_builder.add_text_field("string_id", STRING | FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            for term in ["terma", "termb"] {
                writer.add_document(doc!(string_field => term))?;
            }
            writer.commit()?;
            for term in ["termc", "termd", "terme"] {
                writer.add_document(doc!(string_field => term))?;
            }
            writer.commit()?;
            if merge_segments {
                writer.wait_merging_threads()?;
            }
        }

        // First page: the size limit caps the response at 3 buckets.
        let first_page_req: Aggregations = serde_json::from_value(json!({
            "my_composite": {
                "composite": {
                    "sources": [
                        {"myterm": {"terms": {"field": "string_id"}}}
                    ],
                    "size": 3
                }
            }
        }))
        .unwrap();
        let first_page = exec_request(first_page_req, &index)?;
        assert_eq!(
            &first_page["my_composite"]["buckets"],
            &json!([
                {"key": {"myterm": "terma"}, "doc_count": 1},
                {"key": {"myterm": "termb"}, "doc_count": 1},
                {"key": {"myterm": "termc"}, "doc_count": 1}
            ])
        );

        // Second page: resume after the key returned by the first page.
        let second_page_req: Aggregations = serde_json::from_value(json!({
            "my_composite": {
                "composite": {
                    "sources": [
                        {"myterm": {"terms": {"field": "string_id"}}}
                    ],
                    "size": 3,
                    "after":  &first_page["my_composite"]["after_key"]
                }
            }
        }))
        .unwrap();
        let second_page = exec_request(second_page_req, &index)?;
        assert_eq!(
            &second_page["my_composite"]["buckets"],
            &json!([
                {"key": {"myterm": "termd"}, "doc_count": 1},
                {"key": {"myterm": "terme"}, "doc_count": 1}
            ])
        );
        assert!(second_page["my_composite"].get("after_key").is_none());

        Ok(())
    }

    /// Runs `composite_aggregation_term_size_limit` with `merge_segments = true`.
    #[test]
    fn composite_aggregation_term_size_limit_single_segment() -> crate::Result<()> {
        composite_aggregation_term_size_limit(true)
    }

    /// Runs `composite_aggregation_term_size_limit` with `merge_segments = false`,
    /// i.e. without waiting on the merging threads after the two commits.
    #[test]
    fn composite_aggregation_term_size_limit_multi_segment() -> crate::Result<()> {
        composite_aggregation_term_size_limit(false)
    }

    /// Checks the `order` option of a `terms` source: ascending order, descending
    /// order, and pagination through the descending results via `after`.
    #[test]
    fn composite_aggregation_term_ordering() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let string_field = schema_builder.add_text_field("string_id", STRING | FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            let terms = [
                "zebra", "apple", "banana", "cherry", "dog", "elephant", "fox", "grape",
            ];
            for term in terms {
                writer.add_document(doc!(string_field => term))?;
            }
            writer.commit()?;
        }

        // Executes one page of size 5 with the given order, optionally resuming
        // after a previously returned key.
        let run_page = |order: &str, after: Option<serde_json::Value>| {
            let mut composite = json!({
                "sources": [
                    {"myterm": {"terms": {"field": "string_id", "order": order}}}
                ],
                "size": 5
            });
            if let Some(after) = after {
                composite["after"] = after;
            }
            let agg_req: Aggregations =
                serde_json::from_value(json!({"fruity_aggreg": {"composite": composite}}))
                    .unwrap();
            exec_request(agg_req, &index)
        };

        // Ascending order: only 5 buckets because of the size limit.
        let asc_page = run_page("asc", None)?;
        assert_eq!(
            &asc_page["fruity_aggreg"]["buckets"],
            &json!([
                {"key": {"myterm": "apple"}, "doc_count": 1},
                {"key": {"myterm": "banana"}, "doc_count": 1},
                {"key": {"myterm": "cherry"}, "doc_count": 1},
                {"key": {"myterm": "dog"}, "doc_count": 1},
                {"key": {"myterm": "elephant"}, "doc_count": 1}
            ])
        );

        // Descending order: only 5 buckets because of the size limit.
        let desc_first_page = run_page("desc", None)?;
        assert_eq!(
            &desc_first_page["fruity_aggreg"]["buckets"],
            &json!([
                {"key": {"myterm": "zebra"}, "doc_count": 1},
                {"key": {"myterm": "grape"}, "doc_count": 1},
                {"key": {"myterm": "fox"}, "doc_count": 1},
                {"key": {"myterm": "elephant"}, "doc_count": 1},
                {"key": {"myterm": "dog"}, "doc_count": 1}
            ])
        );

        // Next page in descending order: the 3 remaining buckets.
        let desc_second_page = run_page(
            "desc",
            Some(desc_first_page["fruity_aggreg"]["after_key"].clone()),
        )?;
        assert_eq!(
            &desc_second_page["fruity_aggreg"]["buckets"],
            &json!([
                {"key": {"myterm": "cherry"}, "doc_count": 1},
                {"key": {"myterm": "banana"}, "doc_count": 1},
                {"key": {"myterm": "apple"}, "doc_count": 1}
            ])
        );
        assert!(desc_second_page["fruity_aggreg"].get("after_key").is_none());

        Ok(())
    }

    /// Checks how documents without a value are handled: they are ignored when
    /// `missing_bucket` is false and collected in a `null` bucket, listed first,
    /// when it is true.
    #[test]
    fn composite_aggregation_term_missing_values() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let string_field = schema_builder.add_text_field("string_id", STRING | FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            // `None` stands for a document without the field.
            for maybe_term in [Some("terma"), Some("termb"), None, Some("terma")] {
                let document = match maybe_term {
                    Some(term) => doc!(string_field => term),
                    None => doc!(),
                };
                writer.add_document(document)?;
            }
            writer.commit()?;
        }

        let terms_source = |missing_bucket: bool| {
            json!([
                {"myterm": {"terms": {"field": "string_id", "missing_bucket": missing_bucket}}}
            ])
        };

        // Without the missing bucket, the document without a value is ignored.
        exec_and_assert_all_paginations(
            &index,
            terms_source(false),
            json!([
                {"key": {"myterm": "terma"}, "doc_count": 2},
                {"key": {"myterm": "termb"}, "doc_count": 1}
            ]),
        );

        // With the missing bucket there are 3 buckets; the null bucket comes
        // first in the default (ascending) order.
        exec_and_assert_all_paginations(
            &index,
            terms_source(true),
            json!([
                {"key": {"myterm": null}, "doc_count": 1},
                {"key": {"myterm": "terma"}, "doc_count": 2},
                {"key": {"myterm": "termb"}, "doc_count": 1}
            ]),
        );

        Ok(())
    }

    /// Checks where the `null` bucket is placed for `missing_order` set to
    /// `first`, `last` (both ascending) and `default` (descending).
    #[test]
    fn composite_aggregation_term_missing_order() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let string_field = schema_builder.add_text_field("string_id", STRING | FAST);
        let index = Index::create_in_ram(schema_builder.build());

        {
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            // `None` stands for a document without the field.
            for maybe_term in [Some("termb"), None, Some("terma")] {
                let document = match maybe_term {
                    Some(term) => doc!(string_field => term),
                    None => doc!(),
                };
                writer.add_document(document)?;
            }
            writer.commit()?;
        }

        // (missing_order, order, expected buckets)
        let cases = [
            (
                "first",
                "asc",
                json!([
                    {"key": {"myterm": null}, "doc_count": 1},
                    {"key": {"myterm": "terma"}, "doc_count": 1},
                    {"key": {"myterm": "termb"}, "doc_count": 1}
                ]),
            ),
            (
                "last",
                "asc",
                json!([
                    {"key": {"myterm": "terma"}, "doc_count": 1},
                    {"key": {"myterm": "termb"}, "doc_count": 1},
                    {"key": {"myterm": null}, "doc_count": 1}
                ]),
            ),
            (
                "default",
                "desc",
                json!([
                    {"key": {"myterm": "termb"}, "doc_count": 1},
                    {"key": {"myterm": "terma"}, "doc_count": 1},
                    {"key": {"myterm": null}, "doc_count": 1}
                ]),
            ),
        ];

        for (missing_order, order, expected_buckets) in cases {
            let sources = json!([
                {
                    "myterm": {
                        "terms": {
                            "field": "string_id",
                            "missing_bucket": true,
                            "missing_order": missing_order,
                            "order": order
                        }
                    }
                }
            ]);
            exec_and_assert_all_paginations(&index, sources, expected_buckets);
        }

        Ok(())
    }

    /// Checks a composite aggregation over two `terms` sources: buckets are keyed
    /// by both fields and sorted by the first source, then the second.
    #[test]
    fn composite_aggregation_term_multi_source() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let cat = schema_builder.add_text_field("category", STRING | FAST);
        let status = schema_builder.add_text_field("status", STRING | FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            let rows = [
                ("electronics", "active"),
                ("electronics", "inactive"),
                ("electronics", "active"),
                ("books", "active"),
                ("books", "inactive"),
                ("clothing", "active"),
            ];
            for (category, state) in rows {
                writer.add_document(doc!(cat => category, status => state))?;
            }
            writer.commit()?;
        }

        let sources = json!([
            {"category": {"terms": {"field": "category"}}},
            {"status": {"terms": {"field": "status"}}}
        ]);
        // Composite keys carry both dimensions, in sorted order.
        let expected_buckets = json!([
            {"key": {"category": "books", "status": "active"}, "doc_count": 1},
            {"key": {"category": "books", "status": "inactive"}, "doc_count": 1},
            {"key": {"category": "clothing", "status": "active"}, "doc_count": 1},
            {"key": {"category": "electronics", "status": "active"}, "doc_count": 2},
            {"key": {"category": "electronics", "status": "inactive"}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, sources, expected_buckets);

        Ok(())
    }

    /// Checks that each source of a composite aggregation applies its own
    /// `order`: the first source ascending, the second descending.
    #[test]
    fn composite_aggregation_term_multi_source_ordering() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let cat = schema_builder.add_text_field("category", STRING | FAST);
        let priority = schema_builder.add_text_field("priority", STRING | FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            let rows = [
                ("zebra", "high"),
                ("apple", "low"),
                ("zebra", "low"),
                ("apple", "high"),
            ];
            for (category, level) in rows {
                writer.add_document(doc!(cat => category, priority => level))?;
            }
            writer.commit()?;
        }

        // A different ordering on each source.
        let sources = json!([
            {"category": {"terms": {"field": "category", "order": "asc"}}},
            {"priority": {"terms": {"field": "priority", "order": "desc"}}}
        ]);
        let expected_buckets = json!([
            {"key": {"category": "apple", "priority": "low"}, "doc_count": 1},
            {"key": {"category": "apple", "priority": "high"}, "doc_count": 1},
            {"key": {"category": "zebra", "priority": "low"}, "doc_count": 1},
            {"key": {"category": "zebra", "priority": "high"}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, sources, expected_buckets);

        Ok(())
    }

    /// Checks that `avg` and `max` sub-aggregations are computed per composite
    /// bucket.
    #[test]
    fn composite_aggregation_term_with_sub_aggregations() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let score_field = schema_builder.add_f64_field("score_f64", FAST);
        let string_field = schema_builder.add_text_field("string_id", STRING | FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            let rows = [
                (5.0f64, "terma"),
                (2.0f64, "termb"),
                (3.0f64, "terma"),
                (7.0f64, "termb"),
            ];
            for (score, term) in rows {
                writer.add_document(doc!(score_field => score, string_field => term))?;
            }
            writer.commit()?;
        }

        let request_json = json!({
            "my_composite": {
                "composite": {
                    "sources": [
                        {"myterm": {"terms": {"field": "string_id"}}}
                    ],
                    "size": 10
                },
                "aggs": {
                    "avg_score": {
                        "avg": {
                            "field": "score_f64"
                        }
                    },
                    "max_score": {
                        "max": {
                            "field": "score_f64"
                        }
                    }
                }
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request_json).unwrap();

        let response = exec_request(agg_req, &index)?;

        // Each bucket carries its own sub-aggregation results.
        assert_eq!(
            &response["my_composite"]["buckets"],
            &json!([
                {
                    "key": {"myterm": "terma"},
                    "doc_count": 2,
                    "avg_score": {"value": 4.0}, // (5+3)/2
                    "max_score": {"value": 5.0}
                },
                {
                    "key": {"myterm": "termb"},
                    "doc_count": 2,
                    "avg_score": {"value": 4.5}, // (2+7)/2
                    "max_score": {"value": 7.0}
                }
            ])
        );

        Ok(())
    }

    /// Checks that executing a composite aggregation with an empty `sources`
    /// list, or with `size` set to 0, returns an error.
    #[test]
    fn composite_aggregation_term_validation_errors() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let string_field = schema_builder.add_text_field("string_id", STRING | FAST);
        let index = Index::create_in_ram(schema_builder.build());

        {
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            writer.add_document(doc!(string_field => "term"))?;
            writer.commit()?;
        }

        let invalid_composites = [
            // Empty sources
            json!({
                "sources": [],
                "size": 10
            }),
            // size = 0
            json!({
                "sources": [
                    {"myterm": {"terms": {"field": "string_id"}}}
                ],
                "size": 0
            }),
        ];

        for composite in invalid_composites {
            // The request itself deserializes; the failure is expected at
            // execution time.
            let agg_req: Aggregations = serde_json::from_value(json!({
                "my_composite": {
                    "composite": composite
                }
            }))
            .unwrap();

            let outcome = exec_request(agg_req, &index);
            assert!(outcome.is_err());
        }

        Ok(())
    }

    /// Checks a `terms` source on an `f64` fast field, with the documents spread
    /// over two commits.
    #[test]
    fn composite_aggregation_term_numeric_fields() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let score_field = schema_builder.add_f64_field("score", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            // One slice per commit.
            let scores_per_commit: [&[f64]; 2] = [&[1.0, 2.0, 1.0, 3.33], &[1.0]];
            for scores in scores_per_commit {
                for &score in scores {
                    writer.add_document(doc!(score_field => score))?;
                }
                writer.commit()?;
            }
        }

        // Composite aggregation on the numeric field.
        let sources = json!([
            {"score": {"terms": {"field": "score"}}}
        ]);
        let expected_buckets = json!([
            {"key": {"score": 1}, "doc_count": 3},
            {"key": {"score": 2}, "doc_count": 1},
            {"key": {"score": 3.33}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, sources, expected_buckets);

        Ok(())
    }

    /// Checks a `terms` source on a date fast field; the expected bucket keys
    /// are integer timestamps.
    #[test]
    fn composite_aggregation_term_date_fields() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let date_field = schema_builder.add_date_field("timestamp", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            // Three distinct dates; the first one appears twice.
            let dates = [
                "2021-01-01T00:00:00Z",
                "2022-01-01T00:00:00Z",
                "2021-01-01T00:00:00Z",
                "2023-01-01T00:00:00Z",
            ];
            for iso_date in dates {
                writer.add_document(doc!(date_field => datetime_from_iso_str(iso_date)))?;
            }
            writer.commit()?;
        }

        // Composite aggregation on the date field.
        let sources = json!([
            {"timestamp": {"terms": {"field": "timestamp"}}}
        ]);
        let expected_buckets = json!([
            {"key": {"timestamp": 1609459200000i64}, "doc_count": 2},
            {"key": {"timestamp": 1640995200000i64}, "doc_count": 1},
            {"key": {"timestamp": 1672531200000i64}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, sources, expected_buckets);

        Ok(())
    }

    /// Checks a `terms` source on an IP address fast field holding IPv4
    /// (stored as IPv6-mapped) and IPv6 addresses, plus one document without a
    /// value.
    #[test]
    fn composite_aggregation_term_ip_fields() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let ip_field = schema_builder.add_ip_addr_field("ip_addr", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let ipv4 = |ip: &str| ip.parse::<Ipv4Addr>().unwrap().to_ipv6_mapped();
            let ipv6 = |ip: &str| ip.parse::<Ipv6Addr>().unwrap();
            // `None` stands for a document without the field.
            let addresses = [
                Some(ipv4("192.168.1.1")),
                Some(ipv4("10.0.0.1")),
                Some(ipv4("192.168.1.1")), // duplicate
                Some(ipv4("172.16.0.1")),
                Some(ipv6("2001:db8::1")),
                Some(ipv6("::1")), // localhost
                None,
                Some(ipv6("2001:db8::1")), // duplicate
            ];
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            for maybe_address in addresses {
                let document = match maybe_address {
                    Some(address) => doc!(ip_field => address),
                    None => doc!(),
                };
                writer.add_document(document)?;
            }
            writer.commit()?;
        }

        // Composite aggregation on the IP field.
        let sources = json!([
            {"ip_addr": {"terms": {"field": "ip_addr"}}}
        ]);
        let expected_buckets = json!([
            {"key": {"ip_addr": "::1"}, "doc_count": 1},
            {"key": {"ip_addr": "10.0.0.1"}, "doc_count": 1},
            {"key": {"ip_addr": "172.16.0.1"}, "doc_count": 1},
            {"key": {"ip_addr": "192.168.1.1"}, "doc_count": 2},
            {"key": {"ip_addr": "2001:db8::1"}, "doc_count": 2}
        ]);
        exec_and_assert_all_paginations(&index, sources, expected_buckets);

        Ok(())
    }

    /// Composite aggregation combining a text `terms` source (ascending) with
    /// a numeric `terms` source (descending).
    #[test]
    fn composite_aggregation_term_multiple_column_types() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let score_field = builder.add_f64_field("score", FAST);
        let string_field = builder.add_text_field("string_id", STRING | FAST);
        let index = Index::create_in_ram(builder.build());
        {
            let rows = vec![
                (1.0f64, "apple"),
                (2.0f64, "banana"),
                (1.0f64, "apple"),
                (2.0f64, "banana"),
                (3.0f64, "cherry"),
                (1.0f64, "banana"),
            ];

            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            for (score, name) in rows {
                writer.add_document(doc!(score_field => score, string_field => name))?;
            }
            writer.commit()?;
        }

        // Within one category the scores are expected from highest to lowest.
        let sources = json!([
            {"category": {"terms": {"field": "string_id", "order": "asc"}}},
            {"score": {"terms": {"field": "score", "order": "desc"}}}
        ]);
        let expected_buckets = json!([
            {"key": {"category": "apple", "score": 1}, "doc_count": 2},
            {"key": {"category": "banana", "score": 2}, "doc_count": 2},
            {"key": {"category": "banana", "score": 1}, "doc_count": 1},
            {"key": {"category": "cherry", "score": 3}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, sources, expected_buckets);

        Ok(())
    }

    /// Composite aggregation over three paths of a JSON field holding a
    /// string, a boolean and a number respectively.
    #[test]
    fn composite_aggregation_term_json_various_types() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let json_field = builder.add_json_field("json_data", FAST);
        let index = Index::create_in_ram(builder.build());
        {
            let payloads = vec![
                json!({"cat": "elec", "price": 999, "avail": true}),
                json!({"cat": "books", "price": 15, "avail": false}),
                json!({"cat": "elec", "price": 200, "avail": true}),
                json!({"cat": "books", "price": 25, "avail": true}),
            ];

            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            for payload in payloads {
                writer.add_document(doc!(json_field => payload))?;
            }
            writer.commit()?;
        }

        // Only the last source (price) is sorted in descending order.
        let sources = json!([
            {"cat": {"terms": {"field": "json_data.cat"}}},
            {"avail": {"terms": {"field": "json_data.avail"}}},
            {"price": {"terms": {"field": "json_data.price", "order": "desc"}}}
        ]);
        let expected_buckets = json!([
            {"key": {"cat": "books", "avail": false, "price": 15}, "doc_count": 1},
            {"key": {"cat": "books", "avail": true, "price": 25}, "doc_count": 1},
            {"key": {"cat": "elec", "avail": true, "price": 999}, "doc_count": 1},
            {"key": {"cat": "elec", "avail": true, "price": 200}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, sources, expected_buckets);

        Ok(())
    }

    /// Composite aggregation over JSON paths that are absent from some
    /// documents, with `missing_bucket` enabled on both sources.
    ///
    /// The two runs differ only in the `missing_order` of the second source.
    #[test]
    fn composite_aggregation_term_json_missing_fields() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let json_field = builder.add_json_field("json_data", FAST);
        let index = Index::create_in_ram(builder.build());
        {
            let payloads = vec![
                json!({"cat": "elec", "brand": "apple"}),
                json!({"cat": "books", "brand": "gut"}),
                json!({"cat": "books"}),    // missing brand
                json!({"brand": "samsung"}), // missing category
                json!({"cat": "elec", "brand": "samsung"}),
            ];

            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            for payload in payloads {
                writer.add_document(doc!(json_field => payload))?;
            }
            writer.commit()?;
        }

        // Missing brand sorted last within its category.
        let sources_missing_last = json!([
            {"cat": {"terms": {"field": "json_data.cat", "missing_bucket": true}}},
            {"brand": {"terms": {"field": "json_data.brand", "missing_bucket": true, "missing_order": "last"}}}
        ]);
        let expected_missing_last = json!([
            {"key": {"cat": null, "brand": "samsung"}, "doc_count": 1},
            {"key": {"cat": "books", "brand": "gut"}, "doc_count": 1},
            {"key": {"cat": "books", "brand": null}, "doc_count": 1},
            {"key": {"cat": "elec", "brand": "apple"}, "doc_count": 1},
            {"key": {"cat": "elec", "brand": "samsung"}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, sources_missing_last, expected_missing_last);

        // Same request, but the missing brand now comes first within its
        // category.
        let sources_missing_first = json!([
            {"cat": {"terms": {"field": "json_data.cat", "missing_bucket": true}}},
            {"brand": {"terms": {"field": "json_data.brand", "missing_bucket": true, "missing_order": "first"}}}
        ]);
        let expected_missing_first = json!([
            {"key": {"cat": null, "brand": "samsung"}, "doc_count": 1},
            {"key": {"cat": "books", "brand": null}, "doc_count": 1},
            {"key": {"cat": "books", "brand": "gut"}, "doc_count": 1},
            {"key": {"cat": "elec", "brand": "apple"}, "doc_count": 1},
            {"key": {"cat": "elec", "brand": "samsung"}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, sources_missing_first, expected_missing_first);

        Ok(())
    }

    /// Composite aggregation over two paths nested one level deep inside a
    /// JSON field (`json_data.prod.name` and `json_data.prod.cpu`).
    #[test]
    fn composite_aggregation_term_json_nested_fields() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let json_field = builder.add_json_field("json_data", FAST);
        let index = Index::create_in_ram(builder.build());
        {
            let products = vec![
                ("laptop", "intel"),
                ("phone", "snap"),
                ("laptop", "amd"),
                ("tablet", "intel"),
            ];

            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            for (name, cpu) in products {
                writer.add_document(
                    doc!(json_field => json!({"prod": {"name": name, "cpu": cpu}})),
                )?;
            }
            writer.commit()?;
        }

        let sources = json!([
            {"name": {"terms": {"field": "json_data.prod.name"}}},
            {"cpu": {"terms": {"field": "json_data.prod.cpu"}}}
        ]);
        let expected_buckets = json!([
            {"key": {"name": "laptop", "cpu": "amd"}, "doc_count": 1},
            {"key": {"name": "laptop", "cpu": "intel"}, "doc_count": 1},
            {"key": {"name": "phone", "cpu": "snap"}, "doc_count": 1},
            {"key": {"name": "tablet", "cpu": "intel"}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, sources, expected_buckets);

        Ok(())
    }

    /// Composite `terms` source over a JSON path whose values have different
    /// types across documents and segments (strings, booleans, integers,
    /// floats and date-like strings).
    ///
    /// Each inner list below is committed separately, in the given order.
    #[test]
    fn composite_aggregation_term_json_mixed_types() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let json_field = builder.add_json_field("json_data", FAST);
        let index = Index::create_in_ram(builder.build());
        {
            let ids_per_commit = vec![
                // this segment's numeric is i64
                vec![
                    json!("doc1"),
                    json!(100),
                    json!(true),
                    json!("doc2"),
                    json!(50),
                    json!(false),
                    json!("doc3"),
                ],
                // this segment's numeric is f64
                vec![json!(33.3), json!(50)],
                // this segment contains dates
                vec![
                    json!("doc4"),
                    json!("2023-01-01T00:00:00Z"),
                    json!("2023-01-02T00:00:00Z"),
                ],
            ];

            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            for ids in ids_per_commit {
                for id in ids {
                    writer.add_document(doc!(json_field => json!({"id": id})))?;
                }
                writer.commit()?;
            }
        }

        let first_day = ms_timestamp_from_iso_str("2023-01-01T00:00:00Z");
        let second_day = ms_timestamp_from_iso_str("2023-01-02T00:00:00Z");

        // Ascending order: the expected sequence is booleans, strings,
        // numbers, then dates.
        let ascending_sources = json!([
            {"id": {"terms": {"field": "json_data.id", "order": "asc"}}}
        ]);
        let ascending_buckets = json!([
            {"key": {"id": false}, "doc_count": 1},
            {"key": {"id": true}, "doc_count": 1},
            {"key": {"id": "doc1"}, "doc_count": 1},
            {"key": {"id": "doc2"}, "doc_count": 1},
            {"key": {"id": "doc3"}, "doc_count": 1},
            {"key": {"id": "doc4"}, "doc_count": 1},
            {"key": {"id": 33.3}, "doc_count": 1},
            {"key": {"id": 50}, "doc_count": 2},
            {"key": {"id": 100}, "doc_count": 1},
            {"key": {"id": first_day}, "doc_count": 1},
            {"key": {"id": second_day}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, ascending_sources, ascending_buckets);

        // Descending order: exactly the reverse sequence.
        let descending_sources = json!([
            {"id": {"terms": {"field": "json_data.id", "order": "desc"}}}
        ]);
        let descending_buckets = json!([
            {"key": {"id": second_day}, "doc_count": 1},
            {"key": {"id": first_day}, "doc_count": 1},
            {"key": {"id": 100}, "doc_count": 1},
            {"key": {"id": 50}, "doc_count": 2},
            {"key": {"id": 33.3}, "doc_count": 1},
            {"key": {"id": "doc4"}, "doc_count": 1},
            {"key": {"id": "doc3"}, "doc_count": 1},
            {"key": {"id": "doc2"}, "doc_count": 1},
            {"key": {"id": "doc1"}, "doc_count": 1},
            {"key": {"id": true}, "doc_count": 1},
            {"key": {"id": false}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, descending_sources, descending_buckets);

        Ok(())
    }

    /// Composite `terms` sources over fields that hold several values per
    /// document, including a document that repeats the same value.
    #[test]
    fn composite_aggregation_term_multi_value_fields() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let text_field = builder.add_text_field("text", FAST | STRING);
        let num_field = builder.add_u64_field("num", FAST);
        let index = Index::create_in_ram(builder.build());

        {
            let documents = vec![
                // Two values for both the text and the num field
                doc!(
                    text_field => "apple",
                    text_field => "banana",
                    num_field => 10u64,
                    num_field => 20u64,
                ),
                doc!(
                    text_field => "cherry",
                    num_field => 30u64,
                ),
                // Multi-valued document repeating "elderberry"
                doc!(
                    text_field => "elderberry",
                    text_field => "date",
                    text_field => "elderberry",
                    num_field => 40u64,
                ),
            ];

            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            for document in documents {
                writer.add_document(document)?;
            }
            writer.commit()?;
        }

        let text_sources = json!([
            {"text_terms": {"terms": {"field": "text"}}}
        ]);
        let text_buckets = json!([
            {"key": {"text_terms": "apple"}, "doc_count": 1},
            {"key": {"text_terms": "banana"}, "doc_count": 1},
            {"key": {"text_terms": "cherry"}, "doc_count": 1},
            {"key": {"text_terms": "date"}, "doc_count": 1},
            // this is not the doc count but the term occurrence count
            // https://github.com/quickwit-oss/tantivy/issues/2721
            {"key": {"text_terms": "elderberry"}, "doc_count": 2}
        ]);
        exec_and_assert_all_paginations(&index, text_sources, text_buckets);

        let num_sources = json!([
            {"num_terms": {"terms": {"field": "num"}}}
        ]);
        let num_buckets = json!([
            {"key": {"num_terms": 10}, "doc_count": 1},
            {"key": {"num_terms": 20}, "doc_count": 1},
            {"key": {"num_terms": 30}, "doc_count": 1},
            {"key": {"num_terms": 40}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, num_sources, num_buckets);

        Ok(())
    }

    /// Composite `histogram` source with an interval of 5 over an f64 column
    /// that also contains a negative value.
    #[test]
    fn composite_aggregation_histogram_basic() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let num_field = builder.add_f64_field("value", FAST);
        let index = Index::create_in_ram(builder.build());
        {
            let values = vec![-0.5f64, 1.0f64, 2.0f64, 5.0f64, 7.0f64, 11.0f64];

            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            for value in values {
                writer.add_document(doc!(num_field => value))?;
            }
            writer.commit()?;
        }

        // -0.5 is expected in the bucket keyed -5, i.e. keys are the lower
        // bound of each interval.
        let sources = json!([
            {"val_hist": {"histogram": {"field": "value", "interval": 5.0}}}
        ]);
        let expected_buckets = json!([
            {"key": {"val_hist": -5.0}, "doc_count": 1},
            {"key": {"val_hist": 0.0}, "doc_count": 2},
            {"key": {"val_hist": 5.0}, "doc_count": 2},
            {"key": {"val_hist": 10.0}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, sources, expected_buckets);
        Ok(())
    }

    /// Composite `histogram` source over a JSON path with mixed value types
    /// spread over two segments.
    ///
    /// Only numeric and date values appear in the expected buckets; string
    /// and boolean values do not.
    #[test]
    fn composite_aggregation_histogram_json_mixed_types() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let json_field = builder.add_json_field("json_data", FAST);
        let index = Index::create_in_ram(builder.build());
        {
            let ids_per_commit = vec![
                // this segment's numeric is i64
                vec![
                    json!("doc1"),
                    json!(100),
                    json!(true),
                    json!("doc2"),
                    json!(50),
                    json!(false),
                    json!("doc3"),
                ],
                // this segment's numeric is f64 and it also contains a date column
                vec![
                    json!(33.3),
                    json!(50),
                    json!(-0.01),
                    json!("2023-01-01T00:00:00Z"),
                ],
            ];

            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            for ids in ids_per_commit {
                for id in ids {
                    writer.add_document(doc!(json_field => json!({"id": id})))?;
                }
                writer.commit()?;
            }
        }

        let date_key = ms_timestamp_from_iso_str("2023-01-01T00:00:00Z") as f64;

        let ascending_sources = json!([
            {"id": {"histogram": {"field": "json_data.id", "interval": 50, "order": "asc"}}}
        ]);
        let ascending_buckets = json!([
            {"key": {"id": -50.0}, "doc_count": 1},
            {"key": {"id": 0.0}, "doc_count": 1},
            {"key": {"id": 50.0}, "doc_count": 2},
            {"key": {"id": 100.0}, "doc_count": 1},
            {"key": {"id": date_key}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, ascending_sources, ascending_buckets);

        // Descending order: the same buckets in reverse.
        let descending_sources = json!([
            {"id": {"histogram": {"field": "json_data.id", "interval": 50, "order": "desc"}}}
        ]);
        let descending_buckets = json!([
            {"key": {"id": date_key}, "doc_count": 1},
            {"key": {"id": 100.0}, "doc_count": 1},
            {"key": {"id": 50.0}, "doc_count": 2},
            {"key": {"id": 0.0}, "doc_count": 1},
            {"key": {"id": -50.0}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, descending_sources, descending_buckets);

        Ok(())
    }

    /// Composite `date_histogram` source using `calendar_interval = "year"`.
    #[test]
    fn composite_aggregation_date_histogram_calendar_interval() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let date_field = builder.add_date_field("dt", FAST);
        let index = Index::create_in_ram(builder.build());
        {
            let instants = vec![
                "2021-01-01T00:00:00Z",
                "2021-02-01T00:00:00Z",
                "2022-01-01T00:00:00Z",
                "2023-01-01T00:00:00Z",
            ];

            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            for iso in instants {
                writer.add_document(doc!(date_field => datetime_from_iso_str(iso)))?;
            }
            writer.commit()?;
        }

        // Both 2021 documents are expected in the bucket keyed by the start of
        // that year.
        let sources = json!([
            {"dt_hist": {"date_histogram": {"field": "dt", "calendar_interval": "year"}}}
        ]);
        let year_2021 = ms_timestamp_from_iso_str("2021-01-01T00:00:00Z");
        let year_2022 = ms_timestamp_from_iso_str("2022-01-01T00:00:00Z");
        let year_2023 = ms_timestamp_from_iso_str("2023-01-01T00:00:00Z");
        let expected_buckets = json!([
            {"key": {"dt_hist": year_2021}, "doc_count": 2},
            {"key": {"dt_hist": year_2022}, "doc_count": 1},
            {"key": {"dt_hist": year_2023}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, sources, expected_buckets);
        Ok(())
    }

    /// Composite `date_histogram` source using `fixed_interval = "6h"` over
    /// documents that all fall on the same day.
    #[test]
    fn composite_aggregation_date_histogram_fixed_interval() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let date_field = builder.add_date_field("dt", FAST);
        let index = Index::create_in_ram(builder.build());
        {
            let instants = vec![
                "2021-01-01T00:00:00Z",
                "2021-01-01T05:30:00Z",
                "2021-01-01T06:00:00Z",
                "2021-01-01T12:00:00Z",
                "2021-01-01T18:00:00Z",
            ];

            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            for iso in instants {
                writer.add_document(doc!(date_field => datetime_from_iso_str(iso)))?;
            }
            writer.commit()?;
        }

        // 00:00 and 05:30 share the first bucket; 06:00 opens the next one.
        let sources = json!([
            {"dt_hist": {"date_histogram": {"field": "dt", "fixed_interval": "6h"}}}
        ]);
        let at_00h = ms_timestamp_from_iso_str("2021-01-01T00:00:00Z");
        let at_06h = ms_timestamp_from_iso_str("2021-01-01T06:00:00Z");
        let at_12h = ms_timestamp_from_iso_str("2021-01-01T12:00:00Z");
        let at_18h = ms_timestamp_from_iso_str("2021-01-01T18:00:00Z");
        let expected_buckets = json!([
            {"key": {"dt_hist": at_00h}, "doc_count": 2},
            {"key": {"dt_hist": at_06h}, "doc_count": 1},
            {"key": {"dt_hist": at_12h}, "doc_count": 1},
            {"key": {"dt_hist": at_18h}, "doc_count": 1}
        ]);
        exec_and_assert_all_paginations(&index, sources, expected_buckets);
        Ok(())
    }

    /// Composite aggregation mixing a `terms` source and a monthly
    /// `date_histogram` source.
    ///
    /// The second half pages manually through a size-limited request with the
    /// sources swapped and the category in descending order, and checks that
    /// the last page carries no `after_key`.
    #[test]
    fn composite_aggregation_mixed_term_and_date_histogram() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let date_field = builder.add_date_field("timestamp", FAST);
        let category_field = builder.add_text_field("category", STRING | FAST);
        let index = Index::create_in_ram(builder.build());

        {
            let rows = vec![
                ("2021-01-01T05:00:00Z", "electronics"),
                ("2021-01-15T10:30:00Z", "electronics"),
                ("2021-01-05T12:00:00Z", "books"),
                ("2021-02-10T08:45:00Z", "books"),
                ("2021-02-05T14:20:00Z", "clothing"),
                ("2021-02-20T09:15:00Z", "clothing"),
            ];

            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            for (iso, category) in rows {
                writer.add_document(doc!(
                    date_field => datetime_from_iso_str(iso),
                    category_field => category
                ))?;
            }
            writer.commit()?;
        }

        let january = ms_timestamp_from_iso_str("2021-01-01T00:00:00Z");
        let february = ms_timestamp_from_iso_str("2021-02-01T00:00:00Z");

        let sources = json!([
            {"category": {"terms": {"field": "category"}}},
            {"month": {"date_histogram": {"field": "timestamp", "calendar_interval": "month"}}}
        ]);
        let expected_buckets = json!([
            {"key": {"category": "books", "month": january}, "doc_count": 1},
            {"key": {"category": "books", "month": february}, "doc_count": 1},
            {"key": {"category": "clothing", "month": february}, "doc_count": 2},
            {"key": {"category": "electronics", "month": january}, "doc_count": 2}
        ]);
        exec_and_assert_all_paginations(&index, sources, expected_buckets);

        // Different source ordering, paged manually with a size limit of 3.
        let paged_sources = json!([
            {"month": {"date_histogram": {"field": "timestamp", "calendar_interval": "month"}}},
            {"category": {"terms": {"field": "category", "order": "desc"}}}
        ]);

        let first_request: Aggregations = serde_json::from_value(json!({
            "my_composite": {
                "composite": {
                    "sources": paged_sources,
                    "size": 3
                }
            }
        }))
        .unwrap();
        let first_page = exec_request(first_request, &index)?;
        assert_eq!(
            &first_page["my_composite"]["buckets"],
            &json!([
                {"key": {"month": january, "category": "electronics"}, "doc_count": 2},
                {"key": {"month": january, "category": "books"}, "doc_count": 1},
                {"key": {"month": february, "category": "clothing"}, "doc_count": 2}
            ]),
        );

        // Next page: resume from the `after_key` returned by the first page.
        let second_request: Aggregations = serde_json::from_value(json!({
            "my_composite": {
                "composite": {
                    "sources": paged_sources,
                    "size": 3,
                    "after": first_page["my_composite"]["after_key"]
                }
            }
        }))
        .unwrap();
        let second_page = exec_request(second_request, &index)?;
        assert_eq!(
            &second_page["my_composite"]["buckets"],
            &json!([
                {"key": {"month": february, "category": "books"}, "doc_count": 1}
            ]),
        );
        assert!(second_page["my_composite"].get("after_key").is_none());

        Ok(())
    }

    /// Requests a `date_histogram` source on a field that only has an f64
    /// column.
    ///
    /// Without `missing_bucket` no bucket is expected; with it, both
    /// documents are expected in a single bucket with a `null` key.
    #[test]
    fn composite_aggregation_no_matching_columns() -> crate::Result<()> {
        let mut builder = Schema::builder();
        // Deliberately an f64 field, even though it is queried as a date.
        let float_field = builder.add_f64_field("dt", FAST);
        let index = Index::create_in_ram(builder.build());
        {
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            for value in vec![1.0f64, 2.0f64] {
                writer.add_document(doc!(float_field => value))?;
            }
            writer.commit()?;
        }

        let plain_request: Aggregations = serde_json::from_value(json!({
            "my_composite": {
                "composite": {
                    "sources": [
                        {"dt_hist": {"date_histogram": {"field": "dt", "fixed_interval": "6h"}}}
                    ],
                    "size": 10
                }
            }
        }))
        .unwrap();
        let plain_response = exec_request(plain_request, &index)?;
        assert_eq!(&plain_response["my_composite"]["buckets"], &json!([]));

        let missing_bucket_request: Aggregations = serde_json::from_value(json!({
            "my_composite": {
                "composite": {
                    "sources": [
                        {"dt_hist": {"date_histogram": {"field": "dt", "fixed_interval": "6h", "missing_bucket": true}}}
                    ],
                    "size": 10
                }
            }
        }))
        .unwrap();
        let missing_bucket_response = exec_request(missing_bucket_request, &index)?;
        assert_eq!(
            &missing_bucket_response["my_composite"]["buckets"],
            &json!([{"key": {"dt_hist": null}, "doc_count": 2}])
        );
        Ok(())
    }
}


================================================
FILE: src/aggregation/bucket/composite/numeric_types.rs
================================================
/// This module helps compare numerical values of different types (i64, u64
/// and f64).
pub(super) mod num_cmp {
    use std::cmp::Ordering;

    use crate::TantivyError;

    /// Compares an `i64` with an `f64` without converting the integer to a
    /// float (which could lose precision).
    ///
    /// Returns the ordering of `left_i` relative to `right_f`.
    ///
    /// # Errors
    ///
    /// Returns `TantivyError::InvalidArgument` if `right_f` is NaN.
    pub fn cmp_i64_f64(left_i: i64, right_f: f64) -> crate::Result<Ordering> {
        if right_f.is_nan() {
            return Err(TantivyError::InvalidArgument(
                "NaN comparison is not supported".to_string(),
            ));
        }

        // i64::MIN = -2^63 is exactly representable as f64, so a float strictly
        // below it is smaller than every i64.
        let below_i64_range = right_f < i64::MIN as f64;
        if below_i64_range {
            return Ok(Ordering::Greater);
        }
        // i64::MAX = 2^63-1 is not representable as f64: the cast yields 2^63,
        // so a float at or above it is larger than every i64.
        let above_i64_range = right_f >= i64::MAX as f64;
        if above_i64_range {
            return Ok(Ordering::Less);
        }

        // right_f now fits in the i64 range, so the cast is a plain truncation
        // toward zero.
        let truncated = right_f as i64;

        // Compare the integer parts first; only when they match does the
        // fractional part of right_f decide.
        let ordering = left_i.cmp(&truncated).then_with(|| {
            let fraction = right_f - (truncated as f64);
            if fraction == 0.0 {
                Ordering::Equal
            } else if right_f > 0.0 {
                // positive float with a fraction lies above its truncation
                Ordering::Less
            } else {
                // negative float with a fraction lies below its truncation
                Ordering::Greater
            }
        });
        Ok(ordering)
    }

    /// Compares a `u64` with an `f64` without converting the integer to a
    /// float (which could lose precision).
    ///
    /// Returns the ordering of `left_u` relative to `right_f`.
    ///
    /// # Errors
    ///
    /// Returns `TantivyError::InvalidArgument` if `right_f` is NaN.
    pub fn cmp_u64_f64(left_u: u64, right_f: f64) -> crate::Result<Ordering> {
        if right_f.is_nan() {
            return Err(TantivyError::InvalidArgument(
                "NaN comparison is not supported".to_string(),
            ));
        }

        // Negative floats are always less than any u64 >= 0
        if right_f < 0.0 {
            return Ok(Ordering::Greater);
        }

        // u64::MAX = 2^64-1 cannot be exactly represented as f64: the cast
        // yields 2^64. A float at or above that bound is therefore strictly
        // greater than every u64. The comparison must be `>=`: with `>`, the
        // value 2^64 would fall through, saturate to u64::MAX in the cast below
        // and wrongly compare as equal to u64::MAX.
        let max_as_f = u64::MAX as f64;
        if right_f >= max_as_f {
            return Ok(Ordering::Less);
        }

        // Now right_f is in [0, 2^64), so `right_f as u64` is well-defined
        // (truncation toward 0)
        let right_as_u = right_f as u64;

        let result = match left_u.cmp(&right_as_u) {
            Ordering::Less => Ordering::Less,
            Ordering::Greater => Ordering::Greater,
            Ordering::Equal => {
                // they have the same integer part, compare the fraction
                let rem = right_f - (right_as_u as f64);
                if rem == 0.0 {
                    Ordering::Equal
                } else {
                    // right_f is non-negative here, so a fraction puts it above
                    // its truncation
                    Ordering::Less
                }
            }
        };
        Ok(result)
    }

    /// Compares an `i64` with a `u64`.
    ///
    /// Returns the ordering of `left_i` relative to `right_u`.
    pub fn cmp_i64_u64(left_i: i64, right_u: u64) -> Ordering {
        match u64::try_from(left_i) {
            // non-negative: both sides can be compared as u64
            Ok(left_as_u) => left_as_u.cmp(&right_u),
            // negative: smaller than any u64
            Err(_) => Ordering::Less,
        }
    }
}

/// This module helps project numerical values onto other numerical types.
/// When the target value space cannot exactly represent the source value, the
/// next representable value is returned (or AfterLast if the source value is
/// larger than the largest representable value).
///
/// All functions in this module assume that f64 values are not NaN.
pub(super) mod num_proj {
    /// Outcome of projecting a numerical value into the value space of type `T`.
    #[derive(Debug, PartialEq)]
    pub enum ProjectedNumber<T> {
        /// The target type represents the source value exactly.
        Exact(T),
        /// The target type cannot represent the source value exactly; the payload is the
        /// next representable value.
        Next(T),
        /// The source value is larger than the largest value representable in the target
        /// type.
        AfterLast,
    }

    /// Projects an `i64` into the `u64` value space.
    ///
    /// Negative values have no `u64` counterpart and project to `Next(0)`; every other
    /// value is exact.
    pub fn i64_to_u64(value: i64) -> ProjectedNumber<u64> {
        match value {
            negative if negative < 0 => ProjectedNumber::Next(0),
            non_negative => ProjectedNumber::Exact(non_negative as u64),
        }
    }

    /// Projects a `u64` into the `i64` value space.
    ///
    /// Values up to `i64::MAX` are exact; anything larger is `AfterLast`.
    pub fn u64_to_i64(value: u64) -> ProjectedNumber<i64> {
        let largest_i64 = i64::MAX as u64;
        if value <= largest_i64 {
            ProjectedNumber::Exact(value as i64)
        } else {
            ProjectedNumber::AfterLast
        }
    }

    /// Projects an `f64` into the `u64` value space.
    ///
    /// - Negative values project to `Next(0)`.
    /// - Values at or above 2^64 project to `AfterLast`.
    /// - Integral values in between are `Exact`.
    /// - Fractional values project to the next integer above them.
    ///
    /// `value` must not be NaN.
    pub fn f64_to_u64(value: f64) -> ProjectedNumber<u64> {
        if value < 0.0 {
            ProjectedNumber::Next(0)
        } else if value >= u64::MAX as f64 {
            // `u64::MAX as f64` rounds up to 2^64, which is already out of range for u64.
            // The bound must be inclusive: otherwise 2^64 would saturate in the cast below
            // and be reported as `Exact(u64::MAX)`.
            ProjectedNumber::AfterLast
        } else if value.fract() == 0.0 {
            ProjectedNumber::Exact(value as u64)
        } else {
            // casting f64 to u64 truncates toward zero; a fractional f64 is far below
            // u64::MAX, so the `+ 1` cannot overflow
            ProjectedNumber::Next(value as u64 + 1)
        }
    }

    /// Projects an `f64` into the `i64` value space.
    ///
    /// - Values below `i64::MIN` project to `Next(i64::MIN)`.
    /// - Values at or above `i64::MAX as f64` project to `AfterLast`.
    /// - Integral values in between are `Exact`.
    /// - Fractional values project to the next integer above them.
    ///
    /// `value` must not be NaN.
    pub fn f64_to_i64(value: f64) -> ProjectedNumber<i64> {
        if value < (i64::MIN as f64) {
            return ProjectedNumber::Next(i64::MIN);
        }
        if value >= (i64::MAX as f64) {
            return ProjectedNumber::AfterLast;
        }

        // casting f64 to i64 truncates toward zero
        let truncated = value as i64;
        if value.fract() == 0.0 {
            return ProjectedNumber::Exact(truncated);
        }

        // Truncation rounds positive values down and negative values up, so only the
        // positive case needs a bump to reach the next integer above `value`.
        let next = if value > 0.0 { truncated + 1 } else { truncated };
        ProjectedNumber::Next(next)
    }

    /// Projects an `i64` into the `f64` value space.
    ///
    /// Returns `Exact` when the value is exactly representable as `f64` (always the case
    /// between -2^53 and 2^53), otherwise `Next` with the smallest `f64` greater than the
    /// value.
    pub fn i64_to_f64(value: i64) -> ProjectedNumber<f64> {
        // for very large/small i64 values, the cast approximates to the closest f64
        let value_f = value as f64;

        // Round-trip through i128 rather than i64: values close to `i64::MAX` are rounded
        // up to 2^63, and casting 2^63 back to i64 saturates to `i64::MAX`, which would
        // make `i64::MAX` look exactly representable.
        let roundtrip = value_f as i128;
        let exact = value as i128;

        if roundtrip == exact {
            ProjectedNumber::Exact(value_f)
        } else if roundtrip > exact {
            // the cast rounded up: `value_f` already is the next representable value
            ProjectedNumber::Next(value_f)
        } else {
            // the cast rounded down: step to the following representable f64
            ProjectedNumber::Next(value_f.next_up())
        }
    }

    /// Projects a `u64` into the `f64` value space.
    ///
    /// Returns `Exact` when the value is exactly representable as `f64` (always the case
    /// between 0 and 2^53), otherwise `Next` with the smallest `f64` greater than the
    /// value.
    pub fn u64_to_f64(value: u64) -> ProjectedNumber<f64> {
        let value_f = value as f64;

        // Round-trip through u128 rather than u64: values close to `u64::MAX` are rounded
        // up to 2^64, and casting 2^64 back to u64 saturates to `u64::MAX`, which would
        // make `u64::MAX` look exactly representable.
        let roundtrip = value_f as u128;
        let exact = value as u128;

        if roundtrip == exact {
            ProjectedNumber::Exact(value_f)
        } else if roundtrip > exact {
            // the cast rounded up: `value_f` already is the next representable value
            ProjectedNumber::Next(value_f)
        } else {
            // the cast rounded down: step to the following representable f64
            ProjectedNumber::Next(value_f.next_up())
        }
    }
}

// Unit tests for the mixed-type comparison helpers of `num_cmp`.
#[cfg(test)]
mod num_cmp_tests {
    use std::cmp::Ordering;

    use super::num_cmp::*;

    // u64 vs f64: basic ordering, negative floats, out-of-range floats, integers that are
    // not exactly representable as f64, and NaN rejection.
    #[test]
    fn test_cmp_u64_f64() {
        // Basic comparisons
        assert_eq!(cmp_u64_f64(5, 5.0).unwrap(), Ordering::Equal);
        assert_eq!(cmp_u64_f64(5, 6.0).unwrap(), Ordering::Less);
        assert_eq!(cmp_u64_f64(6, 5.0).unwrap(), Ordering::Greater);
        assert_eq!(cmp_u64_f64(0, 0.0).unwrap(), Ordering::Equal);
        assert_eq!(cmp_u64_f64(0, 0.1).unwrap(), Ordering::Less);

        // Negative float values are always less than any u64, so the u64 side compares
        // as Greater
        assert_eq!(cmp_u64_f64(0, -0.1).unwrap(), Ordering::Greater);
        assert_eq!(cmp_u64_f64(5, -5.0).unwrap(), Ordering::Greater);
        assert_eq!(cmp_u64_f64(u64::MAX, -1e20).unwrap(), Ordering::Greater);

        // Tests with extreme values
        assert_eq!(cmp_u64_f64(u64::MAX, 1e20).unwrap(), Ordering::Less);

        // Precision edge cases: large u64 that loses precision when converted to f64
        // => 2^54, exactly represented as f64
        let large_f64 = 18_014_398_509_481_984.0;
        let large_u64 = 18_014_398_509_481_984;
        // prove that large_u64 is exactly represented as f64
        assert_eq!(large_u64 as f64, large_f64);
        assert_eq!(cmp_u64_f64(large_u64, large_f64).unwrap(), Ordering::Equal);
        // => (2^54 + 1) cannot be exactly represented in f64
        let large_u64_plus_1 = 18_014_398_509_481_985;
        // prove that it is represented as f64 by large_f64
        assert_eq!(large_u64_plus_1 as f64, large_f64);
        assert_eq!(
            cmp_u64_f64(large_u64_plus_1, large_f64).unwrap(),
            Ordering::Greater
        );
        // => (2^54 - 1) cannot be exactly represented in f64
        let large_u64_minus_1 = 18_014_398_509_481_983;
        // prove that it is also represented as f64 by large_f64
        assert_eq!(large_u64_minus_1 as f64, large_f64);
        assert_eq!(
            cmp_u64_f64(large_u64_minus_1, large_f64).unwrap(),
            Ordering::Less
        );

        // NaN comparison results in an error
        assert!(cmp_u64_f64(0, f64::NAN).is_err());
    }

    // i64 vs f64: basic ordering on both signs, out-of-range floats, integers that are
    // not exactly representable as f64 (positive and negative), and NaN rejection.
    #[test]
    fn test_cmp_i64_f64() {
        // Basic comparisons
        assert_eq!(cmp_i64_f64(5, 5.0).unwrap(), Ordering::Equal);
        assert_eq!(cmp_i64_f64(5, 6.0).unwrap(), Ordering::Less);
        assert_eq!(cmp_i64_f64(6, 5.0).unwrap(), Ordering::Greater);
        assert_eq!(cmp_i64_f64(-5, -5.0).unwrap(), Ordering::Equal);
        assert_eq!(cmp_i64_f64(-5, -4.0).unwrap(), Ordering::Less);
        assert_eq!(cmp_i64_f64(-4, -5.0).unwrap(), Ordering::Greater);
        assert_eq!(cmp_i64_f64(-5, 5.0).unwrap(), Ordering::Less);
        assert_eq!(cmp_i64_f64(5, -5.0).unwrap(), Ordering::Greater);
        assert_eq!(cmp_i64_f64(0, -0.1).unwrap(), Ordering::Greater);
        assert_eq!(cmp_i64_f64(0, 0.1).unwrap(), Ordering::Less);
        assert_eq!(cmp_i64_f64(-1, -0.5).unwrap(), Ordering::Less);
        assert_eq!(cmp_i64_f64(-1, 0.0).unwrap(), Ordering::Less);
        assert_eq!(cmp_i64_f64(0, 0.0).unwrap(), Ordering::Equal);

        // Tests with extreme values
        assert_eq!(cmp_i64_f64(i64::MAX, 1e20).unwrap(), Ordering::Less);
        assert_eq!(cmp_i64_f64(i64::MIN, -1e20).unwrap(), Ordering::Greater);

        // Precision edge cases: large i64 that loses precision when converted to f64
        // => 2^54, exactly represented as f64
        let large_f64 = 18_014_398_509_481_984.0;
        let large_i64 = 18_014_398_509_481_984;
        // prove that large_i64 is exactly represented as f64
        assert_eq!(large_i64 as f64, large_f64);
        assert_eq!(cmp_i64_f64(large_i64, large_f64).unwrap(), Ordering::Equal);
        // => (1_i64 << 54) + 1 cannot be exactly represented in f64
        let large_i64_plus_1 = 18_014_398_509_481_985;
        // prove that it is represented as f64 by large_f64
        assert_eq!(large_i64_plus_1 as f64, large_f64);
        assert_eq!(
            cmp_i64_f64(large_i64_plus_1, large_f64).unwrap(),
            Ordering::Greater
        );
        // => (1_i64 << 54) - 1 cannot be exactly represented in f64
        let large_i64_minus_1 = 18_014_398_509_481_983;
        // prove that it is also represented as f64 by large_f64
        assert_eq!(large_i64_minus_1 as f64, large_f64);
        assert_eq!(
            cmp_i64_f64(large_i64_minus_1, large_f64).unwrap(),
            Ordering::Less
        );

        // Same precision edge case but with negative values
        // (the `_plus_1` / `_minus_1` suffixes below refer to the magnitude)
        // => -2^54, exactly represented as f64
        let large_neg_f64 = -18_014_398_509_481_984.0;
        let large_neg_i64 = -18_014_398_509_481_984;
        // prove that large_neg_i64 is exactly represented as f64
        assert_eq!(large_neg_i64 as f64, large_neg_f64);
        assert_eq!(
            cmp_i64_f64(large_neg_i64, large_neg_f64).unwrap(),
            Ordering::Equal
        );
        // => -(2^54 + 1) cannot be exactly represented in f64
        let large_neg_i64_plus_1 = -18_014_398_509_481_985;
        // prove that it is represented as f64 by large_neg_f64
        assert_eq!(large_neg_i64_plus_1 as f64, large_neg_f64);
        assert_eq!(
            cmp_i64_f64(large_neg_i64_plus_1, large_neg_f64).unwrap(),
            Ordering::Less
        );
        // => -(2^54 - 1) cannot be exactly represented in f64
        let large_neg_i64_minus_1 = -18_014_398_509_481_983;
        // prove that it is also represented as f64 by large_neg_f64
        assert_eq!(large_neg_i64_minus_1 as f64, large_neg_f64);
        assert_eq!(
            cmp_i64_f64(large_neg_i64_minus_1, large_neg_f64).unwrap(),
            Ordering::Greater
        );

        // NaN comparison results in an error
        assert!(cmp_i64_f64(0, f64::NAN).is_err());
    }

    // i64 vs u64: negative values, small values, and the i64::MAX / u64::MAX boundaries.
    #[test]
    fn test_cmp_i64_u64() {
        // Test with negative i64 values (should always be less than any u64)
        assert_eq!(cmp_i64_u64(-1, 0), Ordering::Less);
        assert_eq!(cmp_i64_u64(i64::MIN, 0), Ordering::Less);
        assert_eq!(cmp_i64_u64(i64::MIN, u64::MAX), Ordering::Less);

        // Test with non-negative i64 values
        assert_eq!(cmp_i64_u64(0, 0), Ordering::Equal);
        assert_eq!(cmp_i64_u64(1, 0), Ordering::Greater);
        assert_eq!(cmp_i64_u64(1, 1), Ordering::Equal);
        assert_eq!(cmp_i64_u64(0, 1), Ordering::Less);
        assert_eq!(cmp_i64_u64(5, 10), Ordering::Less);
        assert_eq!(cmp_i64_u64(10, 5), Ordering::Greater);

        // Test with values near i64::MAX and u64 conversion
        assert_eq!(cmp_i64_u64(i64::MAX, i64::MAX as u64), Ordering::Equal);
        assert_eq!(cmp_i64_u64(i64::MAX, (i64::MAX as u64) + 1), Ordering::Less);
        assert_eq!(cmp_i64_u64(i64::MAX, u64::MAX), Ordering::Less);
    }
}

// Unit tests for the numerical projections of `num_proj`.
#[cfg(test)]
mod num_proj_tests {
    use super::num_proj::{self, ProjectedNumber};

    // Negative i64 values project to Next(0), non-negative ones are exact.
    #[test]
    fn test_i64_to_u64() {
        assert_eq!(num_proj::i64_to_u64(-1), ProjectedNumber::Next(0));
        assert_eq!(num_proj::i64_to_u64(i64::MIN), ProjectedNumber::Next(0));
        assert_eq!(num_proj::i64_to_u64(0), ProjectedNumber::Exact(0));
        assert_eq!(num_proj::i64_to_u64(42), ProjectedNumber::Exact(42));
        assert_eq!(
            num_proj::i64_to_u64(i64::MAX),
            ProjectedNumber::Exact(i64::MAX as u64)
        );
    }

    // u64 values up to i64::MAX are exact, larger ones are AfterLast.
    #[test]
    fn test_u64_to_i64() {
        assert_eq!(num_proj::u64_to_i64(0), ProjectedNumber::Exact(0));
        assert_eq!(num_proj::u64_to_i64(42), ProjectedNumber::Exact(42));
        assert_eq!(
            num_proj::u64_to_i64(i64::MAX as u64),
            ProjectedNumber::Exact(i64::MAX)
        );
        assert_eq!(
            num_proj::u64_to_i64((i64::MAX as u64) + 1),
            ProjectedNumber::AfterLast
        );
        assert_eq!(num_proj::u64_to_i64(u64::MAX), ProjectedNumber::AfterLast);
    }

    // Negative floats, floats beyond the u64 range, integral floats and fractional floats.
    #[test]
    fn test_f64_to_u64() {
        assert_eq!(num_proj::f64_to_u64(-1e25), ProjectedNumber::Next(0));
        assert_eq!(num_proj::f64_to_u64(-0.1), ProjectedNumber::Next(0));
        assert_eq!(num_proj::f64_to_u64(1e20), ProjectedNumber::AfterLast);
        assert_eq!(
            num_proj::f64_to_u64(f64::INFINITY),
            ProjectedNumber::AfterLast
        );
        assert_eq!(num_proj::f64_to_u64(0.0), ProjectedNumber::Exact(0));
        assert_eq!(num_proj::f64_to_u64(42.0), ProjectedNumber::Exact(42));
        assert_eq!(num_proj::f64_to_u64(0.5), ProjectedNumber::Next(1));
        assert_eq!(num_proj::f64_to_u64(42.1), ProjectedNumber::Next(43));
    }

    // Floats outside the i64 range on both sides, integral floats, and fractional floats
    // of both signs (which project to the next integer above them).
    #[test]
    fn test_f64_to_i64() {
        assert_eq!(num_proj::f64_to_i64(-1e20), ProjectedNumber::Next(i64::MIN));
        assert_eq!(
            num_proj::f64_to_i64(f64::NEG_INFINITY),
            ProjectedNumber::Next(i64::MIN)
        );
        assert_eq!(num_proj::f64_to_i64(1e20), ProjectedNumber::AfterLast);
        assert_eq!(
            num_proj::f64_to_i64(f64::INFINITY),
            ProjectedNumber::AfterLast
        );
        assert_eq!(num_proj::f64_to_i64(0.0), ProjectedNumber::Exact(0));
        assert_eq!(num_proj::f64_to_i64(42.0), ProjectedNumber::Exact(42));
        assert_eq!(num_proj::f64_to_i64(-42.0), ProjectedNumber::Exact(-42));
        assert_eq!(num_proj::f64_to_i64(0.5), ProjectedNumber::Next(1));
        assert_eq!(num_proj::f64_to_i64(42.1), ProjectedNumber::Next(43));
        assert_eq!(num_proj::f64_to_i64(-0.5), ProjectedNumber::Next(0));
        assert_eq!(num_proj::f64_to_i64(-42.1), ProjectedNumber::Next(-42));
    }

    // Exactly representable integers, then integers just beyond 2^53 in magnitude that
    // the f64 cast has to round.
    #[test]
    fn test_i64_to_f64() {
        assert_eq!(num_proj::i64_to_f64(0), ProjectedNumber::Exact(0.0));
        assert_eq!(num_proj::i64_to_f64(42), ProjectedNumber::Exact(42.0));
        assert_eq!(num_proj::i64_to_f64(-42), ProjectedNumber::Exact(-42.0));

        let max_exact = 9_007_199_254_740_992; // 2^53
        assert_eq!(
            num_proj::i64_to_f64(max_exact),
            ProjectedNumber::Exact(max_exact as f64)
        );

        // Test values that cannot be exactly represented as f64 (integers above 2^53)
        let large_i64 = 9_007_199_254_740_993; // 2^53 + 1
        let closest_f64 = 9_007_199_254_740_992.0;
        assert_eq!(large_i64 as f64, closest_f64);
        if let ProjectedNumber::Next(val) = num_proj::i64_to_f64(large_i64) {
            // Verify that the returned float is different from the direct cast
            assert!(val > closest_f64);
            // ... and that it is only a small relative step above it
            assert!(val - closest_f64 < 2. * f64::EPSILON * closest_f64);
        } else {
            panic!("Expected ProjectedNumber::Next for large_i64");
        }

        // Test with very large negative value
        let large_neg_i64 = -9_007_199_254_740_993; // -(2^53 + 1)
        let closest_neg_f64 = -9_007_199_254_740_992.0;
        assert_eq!(large_neg_i64 as f64, closest_neg_f64);
        if let ProjectedNumber::Next(val) = num_proj::i64_to_f64(large_neg_i64) {
            // Verify that the returned float is the closest representable f64
            // (the cast rounded up here, so it already is the next value)
            assert_eq!(val, closest_neg_f64);
        } else {
            panic!("Expected ProjectedNumber::Next for large_neg_i64");
        }
    }

    // Exactly representable integers, then an integer just above 2^53 that the f64 cast
    // has to round.
    #[test]
    fn test_u64_to_f64() {
        assert_eq!(num_proj::u64_to_f64(0), ProjectedNumber::Exact(0.0));
        assert_eq!(num_proj::u64_to_f64(42), ProjectedNumber::Exact(42.0));

        // Test 2^53, the upper end of the range in which every integer is exactly
        // representable as f64
        let max_exact = 9_007_199_254_740_992; // 2^53
        assert_eq!(
            num_proj::u64_to_f64(max_exact),
            ProjectedNumber::Exact(max_exact as f64)
        );

        // Test values that cannot be exactly represented as f64 (integers above 2^53)
        let large_u64 = 9_007_199_254_740_993; // 2^53 + 1
        let closest_f64 = 9_007_199_254_740_992.0;
        assert_eq!(large_u64 as f64, closest_f64);
        if let ProjectedNumber::Next(val) = num_proj::u64_to_f64(large_u64) {
            // Verify that the returned float is different from the direct cast
            assert!(val > closest_f64);
            // ... and that it is only a small relative step above it
            assert!(val - closest_f64 < 2. * f64::EPSILON * closest_f64);
        } else {
            panic!("Expected ProjectedNumber::Next for large_u64");
        }
    }
}


================================================
FILE: src/aggregation/bucket/filter.rs
================================================
use std::fmt::Debug;

use common::BitSet;
use serde::{Deserialize, Deserializer, Serialize, Serializer};

use crate::aggregation::agg_data::{
    build_segment_agg_collectors, AggRefNode, AggregationsSegmentCtx,
};
use crate::aggregation::cached_sub_aggs::{
    CachedSubAggs, HighCardSubAggCache, LowCardSubAggCache, SubAggCache,
};
use crate::aggregation::intermediate_agg_result::{
    IntermediateAggregationResult, IntermediateAggregationResults, IntermediateBucketResult,
};
use crate::aggregation::segment_agg_result::{BucketIdProvider, SegmentAggregationCollector};
use crate::aggregation::BucketId;
use crate::docset::DocSet;
use crate::query::{AllQuery, EnableScoring, Query, QueryParser};
use crate::schema::Schema;
use crate::tokenizer::TokenizerManager;
use crate::{DocId, SegmentReader, TantivyError};

/// A trait for query builders that can build queries programmatically.
///
/// This trait enables programmatic query construction for filter aggregations with
/// full serialization/deserialization support for distributed aggregation scenarios.
///
/// # Why This Exists
///
/// Filter aggregations need to support both:
/// - Query strings (simple, always serializable)
/// - Programmatic query construction (flexible, with serialization support)
///
/// This trait provides the programmatic query construction capability with full
/// serialization support via the `typetag` crate.
///
/// # Implementation Requirements
///
/// Implementers must:
/// 1. Derive `Debug`, `Clone`, `Serialize`, and `Deserialize`
/// 2. Use `#[typetag::serde]` attribute on the impl block
/// 3. Implement `build_query()` to construct the query from schema/tokenizers
/// 4. Implement `box_clone()` to enable cloning (typically just `Box::new(self.clone())`)
///
/// # Example
///
/// ```rust
/// use tantivy::aggregation::bucket::QueryBuilder;
/// use tantivy::query::{Query, TermQuery};
/// use tantivy::schema::{Schema, IndexRecordOption};
/// use tantivy::tokenizer::TokenizerManager;
/// use tantivy::Term;
/// use serde::{Serialize, Deserialize};
///
/// #[derive(Debug, Clone, Serialize, Deserialize)]
/// struct TermQueryBuilder {
///     field_name: String,
///     term_text: String,
/// }
///
/// #[typetag::serde]
/// impl QueryBuilder for TermQueryBuilder {
///     fn build_query(
///         &self,
///         schema: &Schema,
///         _tokenizers: &TokenizerManager,
///     ) -> tantivy::Result<Box<dyn Query>> {
///         let field = schema.get_field(&self.field_name)?;
///         let term = Term::from_field_text(field, &self.term_text);
///         Ok(Box::new(TermQuery::new(term, IndexRecordOption::Basic)))
///     }
///
///     fn box_clone(&self) -> Box<dyn QueryBuilder> {
///         Box::new(self.clone())
///     }
/// }
///
/// // Create an instance
/// let builder = TermQueryBuilder {
///     field_name: "category".to_string(),
///     term_text: "electronics".to_string(),
/// };
/// ```
#[typetag::serde(tag = "type")]
pub trait QueryBuilder: Debug + Send + Sync {
    /// Build a query from the given schema and tokenizer manager.
    ///
    /// This method is called once when creating the FilterAggReqData for a segment.
    /// Within this file it is invoked by `FilterAggregation::parse_query` for the
    /// `FilterQuery::CustomBuilder` variant.
    ///
    /// # Parameters
    /// - `schema`: The index schema for field lookups
    /// - `tokenizers`: The tokenizer manager for text analysis
    ///
    /// # Returns
    /// A boxed Query object, or an error if construction fails
    fn build_query(
        &self,
        schema: &Schema,
        tokenizers: &TokenizerManager,
    ) -> crate::Result<Box<dyn Query>>;

    /// Clone this builder into a boxed trait object.
    ///
    /// `FilterQuery`'s `Clone` implementation relies on this method to duplicate the
    /// `CustomBuilder` variant.
    ///
    /// Since builders are just data (no state), this simply clones the data.
    /// The typical implementation is:
    /// ```rust,ignore
    /// fn box_clone(&self) -> Box<dyn QueryBuilder> {
    ///     Box::new(self.clone())
    /// }
    /// ```
    fn box_clone(&self) -> Box<dyn QueryBuilder>;
}

/// Filter aggregation creates a single bucket containing documents that match a query.
///
/// # Usage
///
/// ## Query String (Recommended)
/// ```rust
/// use tantivy::aggregation::bucket::FilterAggregation;
///
/// // Query strings are parsed using Tantivy's standard QueryParser
/// let filter_agg = FilterAggregation::new("category:electronics AND price:[100 TO 500]".to_string());
/// ```
///
/// ## Custom Query Builder
/// ```rust
/// use tantivy::aggregation::bucket::{FilterAggregation, QueryBuilder};
/// use tantivy::query::{Query, TermQuery};
/// use tantivy::schema::{Schema, IndexRecordOption};
/// use tantivy::tokenizer::TokenizerManager;
/// use tantivy::Term;
/// use serde::{Serialize, Deserialize};
///
/// #[derive(Debug, Clone, Serialize, Deserialize)]
/// struct MyBuilder {
///     field_name: String,
///     term_text: String,
/// }
///
/// #[typetag::serde]
/// impl QueryBuilder for MyBuilder {
///     fn build_query(
///         &self,
///         schema: &Schema,
///         _tokenizers: &TokenizerManager,
///     ) -> tantivy::Result<Box<dyn Query>> {
///         let field = schema.get_field(&self.field_name)?;
///         let term = Term::from_field_text(field, &self.term_text);
///         Ok(Box::new(TermQuery::new(term, IndexRecordOption::Basic)))
///     }
///
///     fn box_clone(&self) -> Box<dyn QueryBuilder> {
///         Box::new(self.clone())
///     }
/// }
///
/// let builder = MyBuilder {
///     field_name: "category".to_string(),
///     term_text: "electronics".to_string(),
/// };
/// let filter_agg = FilterAggregation::new_with_builder(Box::new(builder));
/// ```
///
/// # Result
/// The filter aggregation returns a single bucket with:
/// - `doc_count`: Number of documents matching the filter
/// - Sub-aggregation results computed on the filtered document set
#[derive(Debug, Clone)]
pub struct FilterAggregation {
    /// The query for filtering - can be either a query string or a query builder
    /// (see [`FilterQuery`]).
    ///
    /// The field is private; it is set through [`FilterAggregation::new`] or
    /// [`FilterAggregation::new_with_builder`].
    query: FilterQuery,
}

/// Represents different ways to specify a filter query
///
/// `Debug` and `Clone` are implemented by hand for this enum: cloning the
/// `CustomBuilder` variant goes through [`QueryBuilder::box_clone`], and its debug
/// output does not print the builder itself.
pub enum FilterQuery {
    /// Query string that will be parsed using Tantivy's standard parsing facilities
    ///
    /// This is the recommended approach as it's serializable and doesn't carry runtime state.
    QueryString(String),

    /// Custom query builder for programmatic query building
    ///
    /// This variant stores a builder that builds the query once when creating FilterAggReqData.
    ///
    /// This is useful for:
    /// - Custom query types not expressible as query strings
    /// - Programmatic query construction based on schema
    /// - Extension query types
    ///
    /// **Note**: The builder is serializable and can be deserialized.
    CustomBuilder(Box<dyn QueryBuilder>),
}

impl Debug for FilterQuery {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        match self {
            FilterQuery::QueryString(s) => f.debug_tuple("QueryString").field(s).finish(),
            FilterQuery::CustomBuilder(_) => {
                f.debug_struct("CustomBuilder").finish_non_exhaustive()
            }
        }
    }
}

impl Clone for FilterQuery {
    fn clone(&self) -> Self {
        match self {
            FilterQuery::QueryString(query_string) => {
                FilterQuery::QueryString(query_string.clone())
            }
            FilterQuery::CustomBuilder(builder) => FilterQuery::CustomBuilder(builder.box_clone()),
        }
    }
}

impl FilterAggregation {
    /// Creates a filter aggregation from a query string.
    ///
    /// The string is not parsed here; parsing happens in `parse_query` (or
    /// `parse_query_with_parser`) through `QueryParser::parse_query()`.
    pub fn new(query_string: String) -> Self {
        let query = FilterQuery::QueryString(query_string);
        Self { query }
    }

    /// Creates a filter aggregation from a programmatic query builder.
    ///
    /// The builder will be called once when creating the FilterAggReqData for each segment.
    ///
    /// # Example
    /// ```rust
    /// use tantivy::aggregation::bucket::{FilterAggregation, QueryBuilder};
    /// use tantivy::query::{Query, TermQuery};
    /// use tantivy::schema::{Schema, IndexRecordOption};
    /// use tantivy::tokenizer::TokenizerManager;
    /// use tantivy::Term;
    /// use serde::{Serialize, Deserialize};
    ///
    /// #[derive(Debug, Clone, Serialize, Deserialize)]
    /// struct MyBuilder {
    ///     field_name: String,
    ///     term_text: String,
    /// }
    ///
    /// #[typetag::serde]
    /// impl QueryBuilder for MyBuilder {
    ///     fn build_query(
    ///         &self,
    ///         schema: &Schema,
    ///         _tokenizers: &TokenizerManager,
    ///     ) -> tantivy::Result<Box<dyn Query>> {
    ///         let field = schema.get_field(&self.field_name)?;
    ///         let term = Term::from_field_text(field, &self.term_text);
    ///         Ok(Box::new(TermQuery::new(term, IndexRecordOption::Basic)))
    ///     }
    ///
    ///     fn box_clone(&self) -> Box<dyn QueryBuilder> {
    ///         Box::new(self.clone())
    ///     }
    /// }
    ///
    /// let builder = MyBuilder {
    ///     field_name: "category".to_string(),
    ///     term_text: "electronics".to_string(),
    /// };
    /// let filter_agg = FilterAggregation::new_with_builder(Box::new(builder));
    /// ```
    pub fn new_with_builder(builder: Box<dyn QueryBuilder>) -> Self {
        let query = FilterQuery::CustomBuilder(builder);
        Self { query }
    }

    /// Turns the stored filter into a Tantivy `Query`.
    ///
    /// - Query strings are parsed with a `QueryParser` built from `schema` and
    ///   `tokenizer_manager`, without any default fields.
    /// - Custom builders are asked to build the query from the same schema and
    ///   tokenizers.
    ///
    /// # Errors
    ///
    /// A query string that fails to parse is reported as
    /// `TantivyError::InvalidArgument`; errors from a custom builder are returned as is.
    pub(crate) fn parse_query(
        &self,
        schema: &Schema,
        tokenizer_manager: &TokenizerManager,
    ) -> crate::Result<Box<dyn Query>> {
        let query_str = match &self.query {
            // Custom builders produce the query themselves.
            FilterQuery::CustomBuilder(builder) => {
                return builder.build_query(schema, tokenizer_manager);
            }
            FilterQuery::QueryString(query_str) => query_str,
        };

        let query_parser =
            QueryParser::new(schema.clone(), Vec::new(), tokenizer_manager.clone());
        query_parser
            .parse_query(query_str)
            .map_err(|err| TantivyError::InvalidArgument(err.to_string()))
    }

    /// Parses the stored query string with a caller-provided `QueryParser`.
    ///
    /// This allows using a pre-configured parser with custom settings like field boosts,
    /// fuzzy matching, default fields, etc.
    ///
    /// # Errors
    ///
    /// - Returns `TantivyError::InvalidArgument` if the query string fails to parse.
    /// - Returns `TantivyError::InvalidArgument` for custom builders, which are not
    ///   supported here: they need a schema and tokenizers, which are not accessible
    ///   from a `QueryParser`.
    pub fn parse_query_with_parser(
        &self,
        query_parser: &QueryParser,
    ) -> crate::Result<Box<dyn Query>> {
        if let FilterQuery::QueryString(query_str) = &self.query {
            return query_parser
                .parse_query(query_str)
                .map_err(|err| TantivyError::InvalidArgument(err.to_string()));
        }

        Err(TantivyError::InvalidArgument(
            "parse_query_with_parser is not supported for custom query builders. Use \
             parse_query with explicit schema and tokenizers instead."
                .to_string(),
        ))
    }

    /// Get the fast field names used by this aggregation (none for filter aggregation)
    pub fn get_fast_field_names(&self) -> Vec<&str> {
        // Filter aggregation cannot introspect query fast field dependencies.
        //
        // As of PR #2693, queries can fall back to fast fields when fields are not indexed
        // (e.g., TermQuery falls back to RangeQuery on fast fields). However, the Query
        // trait has no mechanism to report these dependencies.
        //
        // For prefetching optimization, callers must analyze the query themselves to
        // determine fast field usage. This requires:
        // 1. Parsing the query string to extract field references
        // 2. Checking the schema to see if those fields are indexed or fast-only
        // 3. Collecting fast field names for non-indexed fields
        //
        // This limitation exists because:
        // - Query::weight() is called during execution, not during planning
        // - The fallback decision is based on schema configuration
        // - There's no Query trait method to declare potential fast field dependencies
        Vec::new()
    }
}

// Hand-written serialization: the wire format is either a bare string (query string) or
// whatever the custom builder serializes to.
impl Serialize for FilterAggregation {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: Serializer {
        match self.query {
            // Query strings are written as plain strings
            FilterQuery::QueryString(ref text) => serializer.serialize_str(text),
            // Custom builders are written through typetag (includes type information)
            FilterQuery::CustomBuilder(ref builder) => builder.serialize(serializer),
        }
    }
}

// Hand-written deserialization mirroring `Serialize`: a string becomes a query string,
// every other value is handed to the typetag-based `QueryBuilder` deserializer.
impl<'de> Deserialize<'de> for FilterAggregation {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: Deserializer<'de> {
        use serde::de::Error;
        use serde_json::Value;

        // The input is buffered into a `serde_json::Value` first so that its shape can be
        // inspected before choosing the variant.
        let query = match Value::deserialize(deserializer)? {
            // A plain string is a query string
            Value::String(query_string) => FilterQuery::QueryString(query_string),
            // Anything else is expected to be a typetag-encoded custom builder
            other => serde_json::from_value::<Box<dyn QueryBuilder>>(other)
                .map(FilterQuery::CustomBuilder)
                .map_err(|e| {
                    D::Error::custom(format!("Failed to deserialize QueryBuilder: {}", e))
                })?,
        };

        Ok(FilterAggregation { query })
    }
}

// PartialEq is required because AggregationVariants derives it.
// It is written by hand because custom builders cannot be compared: two aggregations are
// equal only when both hold the same query string. An aggregation holding a custom
// builder is never equal to anything, not even to itself.
impl PartialEq for FilterAggregation {
    fn eq(&self, other: &Self) -> bool {
        if let (FilterQuery::QueryString(lhs), FilterQuery::QueryString(rhs)) =
            (&self.query, &other.query)
        {
            return lhs == rhs;
        }
        // At least one side is a custom builder
        false
    }
}

/// Request data for filter aggregation
/// This struct holds the per-segment data needed to execute a filter aggregation
///
/// Its approximate memory footprint is reported by `get_memory_consumption`.
pub struct FilterAggReqData {
    /// The name of the filter aggregation
    pub name: String,
    /// The filter aggregation
    pub req: FilterAggregation,
    /// The segment reader (held by value)
    pub segment_reader: SegmentReader,
    /// Document evaluator for the filter query (precomputed BitSet)
    /// This is built once when the request data is created
    pub evaluator: DocumentQueryEvaluator,
    /// Reusable buffer for matching documents to minimize allocations during collection
    pub matching_docs_buffer: Vec<DocId>,
    /// True if this filter aggregation is at the top level of the aggregation tree (not nested).
    pub is_top_level: bool,
}

impl FilterAggReqData {
    /// Returns a rough estimate, in bytes, of the memory held by this request data.
    ///
    /// The estimate adds up the name length, the size of a `SegmentReader`, the
    /// evaluator's BitSet, the capacity of the reusable doc buffer and the
    /// `is_top_level` flag. The `req` field is not accounted for.
    pub(crate) fn get_memory_consumption(&self) -> usize {
        let name_bytes = self.name.len();
        let segment_reader_bytes = std::mem::size_of::<SegmentReader>();
        // BitSet memory (bits to bytes)
        // NOTE(review): this assumes `BitSet::len()` reports the size of the set in bits;
        // if it reports the number of inserted elements, the estimate is too low - confirm.
        let bitset_bytes = self.evaluator.bitset.len() / 8;
        let buffer_bytes = self.matching_docs_buffer.capacity() * std::mem::size_of::<DocId>();
        let flag_bytes = std::mem::size_of::<bool>();

        name_bytes + segment_reader_bytes + bitset_bytes + buffer_bytes + flag_bytes
    }
}

/// Document evaluator for filter queries using BitSet
///
/// The BitSet is filled once in `DocumentQueryEvaluator::new`; `matches_document` and
/// `filter_batch` only read it.
pub struct DocumentQueryEvaluator {
    /// BitSet containing all matching documents for this segment.
    /// For AllQuery, this is a full BitSet (all bits set).
    /// For other queries, only matching document bits are set.
    pub(crate) bitset: BitSet,
}

impl DocumentQueryEvaluator {
    /// Builds the evaluator for one segment by materializing the query's matches.
    ///
    /// The query is executed once against `segment_reader` and every matching doc id is
    /// recorded in a `BitSet` sized by the segment's `max_doc`. An `AllQuery` is
    /// special-cased: no weight or scorer is built and the bitset is created already full.
    ///
    /// # Errors
    /// Propagates any error raised while building the weight or the scorer.
    pub(crate) fn new(
        query: Box<dyn Query>,
        schema: Schema,
        segment_reader: &SegmentReader,
    ) -> crate::Result<Self> {
        let max_doc = segment_reader.max_doc();

        // Fast path: an `AllQuery` matches everything, so there is nothing to iterate.
        let matches_everything = query.as_any().downcast_ref::<AllQuery>().is_some();
        if matches_everything {
            let bitset = BitSet::with_max_value_and_full(max_doc);
            return Ok(Self { bitset });
        }

        // Only membership matters for a filter, so scoring is disabled.
        let scoring = EnableScoring::disabled_from_schema(&schema);
        let weight = query.weight(scoring)?;
        let mut scorer = weight.scorer(segment_reader, 1.0)?;

        // Walk the scorer once and remember every hit; this is the upfront cost that
        // later turns each membership test into a bitset lookup.
        let mut bitset = BitSet::with_max_value(max_doc);
        let mut current = scorer.doc();
        loop {
            if current == crate::TERMINATED {
                break;
            }
            bitset.insert(current);
            current = scorer.advance();
        }

        Ok(Self { bitset })
    }

    /// Returns `true` if `doc` matches the filter query.
    ///
    /// This is a lookup in the precomputed BitSet.
    #[inline]
    pub fn matches_document(&self, doc: DocId) -> bool {
        self.bitset.contains(doc)
    }

    /// Filters a batch of documents.
    ///
    /// Every doc of `docs` that matches the filter is appended to `output`, in input
    /// order. `output` is not cleared first; callers that want only this batch must
    /// clear it themselves.
    #[inline]
    pub fn filter_batch(&self, docs: &[DocId], output: &mut Vec<DocId>) {
        let matching = docs
            .iter()
            .copied()
            .filter(|&doc| self.bitset.contains(doc));
        output.extend(matching);
    }
}

impl Debug for DocumentQueryEvaluator {
    /// Prints only the number of matching docs rather than the bitset contents.
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let num_matches = self.bitset.len();
        let mut out = f.debug_struct("DocumentQueryEvaluator");
        out.field("num_matches", &num_matches);
        out.finish()
    }
}

/// Per-parent-bucket state of a filter collector.
#[derive(Debug, Clone, PartialEq, Copy)]
struct DocCount {
    /// Number of documents that matched the filter in this bucket so far.
    doc_count: u64,
    /// Bucket id under which matching docs are pushed to the sub-aggregations.
    bucket_id: BucketId,
}

/// Segment collector for filter aggregation.
///
/// `C` selects the sub-aggregation cache implementation used by `CachedSubAggs`.
pub struct SegmentFilterCollector<C: SubAggCache> {
    /// Document counts per parent bucket, indexed by the parent bucket id.
    parent_buckets: Vec<DocCount>,
    /// Sub-aggregation collectors (`None` when the filter has no sub-aggregations).
    sub_aggregations: Option<CachedSubAggs<C>>,
    /// Hands out the bucket ids this collector assigns to its own buckets.
    bucket_id_provider: BucketIdProvider,
    /// Accessor index for this filter aggregation (to access FilterAggReqData)
    accessor_idx: usize,
}

impl<C: SubAggCache> SegmentFilterCollector<C> {
    /// Creates a filter segment collector for `node`.
    ///
    /// When the node has children, their segment collectors are built and wrapped in a
    /// `CachedSubAggs`; otherwise the collector carries no sub-aggregations. The parent
    /// bucket list starts out empty.
    ///
    /// # Errors
    /// Propagates any error raised while building the sub-aggregation collectors.
    pub(crate) fn from_req_and_validate(
        req: &mut AggregationsSegmentCtx,
        node: &AggRefNode,
    ) -> crate::Result<Self> {
        let sub_aggregations = if node.children.is_empty() {
            None
        } else {
            let collector = build_segment_agg_collectors(req, &node.children)?;
            Some(CachedSubAggs::new(collector))
        };

        Ok(Self {
            parent_buckets: Vec::new(),
            sub_aggregations,
            bucket_id_provider: BucketIdProvider::default(),
            accessor_idx: node.idx_in_req_data,
        })
    }
}

/// Builds the boxed segment collector for the filter aggregation at `node`.
///
/// A top-level filter gets a collector backed by `LowCardSubAggCache`; a nested filter
/// gets one backed by `HighCardSubAggCache`.
///
/// # Panics
/// Panics if the `filter_req_data` slot of the node is empty.
pub(crate) fn build_segment_filter_collector(
    req: &mut AggregationsSegmentCtx,
    node: &AggRefNode,
) -> crate::Result<Box<dyn SegmentAggregationCollector>> {
    let filter_req = req.per_request.filter_req_data[node.idx_in_req_data]
        .as_ref()
        .expect("filter_req_data slot is empty");
    let is_top_level = filter_req.is_top_level;

    let collector: Box<dyn SegmentAggregationCollector> = if is_top_level {
        Box::new(SegmentFilterCollector::<LowCardSubAggCache>::from_req_and_validate(req, node)?)
    } else {
        Box::new(SegmentFilterCollector::<HighCardSubAggCache>::from_req_and_validate(req, node)?)
    };
    Ok(collector)
}

impl<C: SubAggCache> Debug for SegmentFilterCollector<C> {
    /// Prints the bucket counts, whether sub-aggregations are present and the accessor
    /// index; the sub-aggregation collectors themselves are not dumped.
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let has_sub_aggs = self.sub_aggregations.is_some();
        let mut out = f.debug_struct("SegmentFilterCollector");
        out.field("buckets", &self.parent_buckets);
        out.field("has_sub_aggs", &has_sub_aggs);
        out.field("accessor_idx", &self.accessor_idx);
        out.finish()
    }
}

impl<C: SubAggCache> SegmentAggregationCollector for SegmentFilterCollector<C> {
    /// Emits the filter bucket for `parent_bucket_id` into `results`.
    ///
    /// The bucket carries the doc count accumulated by `collect` (0 when no bucket exists
    /// for this parent) together with the intermediate results of the sub-aggregations.
    ///
    /// # Panics
    /// Panics if the `filter_req_data` slot of this collector is empty.
    fn add_intermediate_aggregation_result(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
        results: &mut IntermediateAggregationResults,
        parent_bucket_id: BucketId,
    ) -> crate::Result<()> {
        let mut sub_results = IntermediateAggregationResults::default();
        // `DocCount` is `Copy`, so take a snapshot instead of holding a borrow.
        let bucket = self.parent_buckets.get(parent_bucket_id as usize).copied();

        if let Some(sub_aggs) = &mut self.sub_aggregations {
            // If the bucket doesn't exist, a new bucket id is created so that the
            // sub-aggregations can still produce results (e.g., zero doc count).
            // The id is allocated lazily: an existing bucket must not consume a fresh id.
            let sub_bucket_id = match bucket {
                Some(bucket) => bucket.bucket_id,
                None => self.bucket_id_provider.next_bucket_id(),
            };
            sub_aggs
                .get_sub_agg_collector()
                .add_intermediate_aggregation_result(agg_data, &mut sub_results, sub_bucket_id)?;
        }

        // Create the filter bucket result
        let filter_bucket_result = IntermediateBucketResult::Filter {
            doc_count: bucket.map(|b| b.doc_count).unwrap_or(0),
            sub_aggregations: sub_results,
        };

        // Get the name of this filter aggregation
        let name = agg_data.per_request.filter_req_data[self.accessor_idx]
            .as_ref()
            .expect("filter_req_data slot is empty")
            .name
            .clone();

        results.push(
            name,
            IntermediateAggregationResult::Bucket(filter_bucket_result),
        )?;

        Ok(())
    }

    /// Collects a batch of docs for `parent_bucket_id`.
    ///
    /// The batch is filtered through the precomputed evaluator; the number of matches is
    /// added to the bucket's doc count and the matching docs are pushed to the
    /// sub-aggregations under the bucket's own id.
    ///
    /// # Panics
    /// Panics if no bucket exists for `parent_bucket_id` (see `prepare_max_bucket`).
    fn collect(
        &mut self,
        parent_bucket_id: BucketId,
        docs: &[crate::DocId],
        agg_data: &mut AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        if docs.is_empty() {
            return Ok(());
        }

        // Resolve the bucket first so an out-of-range id fails before any state is taken.
        let bucket_idx = parent_bucket_id as usize;
        let bucket_id = self.parent_buckets[bucket_idx].bucket_id;

        // Take the request data to avoid borrow checker issues with sub-aggregations
        let mut req = agg_data.take_filter_req_data(self.accessor_idx);

        // Use batch filtering with BitSet lookups; the buffer is reused across batches.
        req.matching_docs_buffer.clear();
        req.evaluator
            .filter_batch(docs, &mut req.matching_docs_buffer);

        self.parent_buckets[bucket_idx].doc_count += req.matching_docs_buffer.len() as u64;

        // Forward the matches to the sub-aggregations (a no-op for an empty buffer).
        if let Some(sub_aggs) = &mut self.sub_aggregations {
            for &doc_id in &req.matching_docs_buffer {
                sub_aggs.push(bucket_id, doc_id);
            }
        }

        // Put the request data back before anything below can return early.
        agg_data.put_back_filter_req_data(self.accessor_idx, req);
        if let Some(sub_aggs) = &mut self.sub_aggregations {
            sub_aggs.check_flush_local(agg_data)?;
        }

        Ok(())
    }

    /// Flushes the sub-aggregations, if there are any.
    fn flush(&mut self, agg_data: &mut AggregationsSegmentCtx) -> crate::Result<()> {
        if let Some(sub_aggs) = &mut self.sub_aggregations {
            sub_aggs.flush(agg_data)?;
        }
        Ok(())
    }

    /// Ensures a bucket exists for every parent bucket id up to and including `max_bucket`.
    ///
    /// Each newly created bucket starts with a doc count of 0 and receives a fresh id from
    /// the bucket id provider.
    fn prepare_max_bucket(
        &mut self,
        max_bucket: BucketId,
        _agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        while self.parent_buckets.len() <= max_bucket as usize {
            let bucket_id = self.bucket_id_provider.next_bucket_id();
            self.parent_buckets.push(DocCount {
                doc_count: 0,
                bucket_id,
            });
        }
        Ok(())
    }
}

/// Intermediate result for filter aggregation.
///
/// Carries the same two pieces of data as the `IntermediateBucketResult::Filter` variant
/// emitted by the segment collector: a doc count and the sub-aggregation results.
#[derive(Debug, Clone, PartialEq)]
pub struct IntermediateFilterBucketResult {
    /// Document count in this bucket
    pub doc_count: u64,
    /// Sub-aggregation results
    pub sub_aggregations: IntermediateAggregationResults,
}

#[cfg(test)]
mod tests {
    use serde_json::{json, Value};

    use super::*;
    use crate::aggregation::agg_req::Aggregations;
    use crate::aggregation::agg_result::AggregationResults;
    use crate::aggregation::{AggContextParams, AggregationCollector};
    use crate::query::{AllQuery, TermQuery};
    use crate::schema::{IndexRecordOption, Schema, Term, FAST, INDEXED, TEXT};
    use crate::{doc, Index, IndexWriter};

    // Test helper functions
    /// Serializes aggregation results into a `serde_json::Value`, panicking on failure.
    fn aggregation_results_to_json(results: &AggregationResults) -> Value {
        let serialized = serde_json::to_value(results);
        serialized.expect("Failed to serialize aggregation results")
    }

    /// Recursively compares two JSON values, treating numbers as equal when they differ
    /// by less than `tolerance`.
    ///
    /// Objects must have the same number of entries and every expected key must be present
    /// with a matching value; arrays must have the same length and match element-wise.
    /// Every other combination falls back to exact equality.
    fn json_values_match(actual: &Value, expected: &Value, tolerance: f64) -> bool {
        match (actual, expected) {
            (Value::Number(actual_num), Value::Number(expected_num)) => {
                // Numbers that have no f64 representation are compared as 0.0.
                let lhs = actual_num.as_f64().unwrap_or(0.0);
                let rhs = expected_num.as_f64().unwrap_or(0.0);
                (lhs - rhs).abs() < tolerance
            }
            (Value::Object(actual_map), Value::Object(expected_map)) => {
                actual_map.len() == expected_map.len()
                    && expected_map.iter().all(|(key, expected_val)| {
                        actual_map.get(key).is_some_and(|actual_val| {
                            json_values_match(actual_val, expected_val, tolerance)
                        })
                    })
            }
            (Value::Array(actual_items), Value::Array(expected_items)) => {
                actual_items.len() == expected_items.len()
                    && actual_items.iter().zip(expected_items.iter()).all(
                        |(actual_item, expected_item)| {
                            json_values_match(actual_item, expected_item, tolerance)
                        },
                    )
            }
            _ => actual == expected,
        }
    }

    /// Panics with a pretty-printed diff-style message unless the serialized results match
    /// `expected_json` within `tolerance`.
    fn assert_aggregation_results_match(
        actual_results: &AggregationResults,
        expected_json: Value,
        tolerance: f64,
    ) {
        let actual_json = aggregation_results_to_json(actual_results);
        if json_values_match(&actual_json, &expected_json, tolerance) {
            return;
        }

        let actual_pretty = serde_json::to_string_pretty(&actual_json).unwrap();
        let expected_pretty = serde_json::to_string_pretty(&expected_json).unwrap();
        panic!(
            "Aggregation results do not match expected JSON.\nActual:\n{}\nExpected:\n{}",
            actual_pretty, expected_pretty
        );
    }

    // Asserts that aggregation results match the expected JSON.
    // The two-argument form uses a numeric tolerance of 0.1; the three-argument form
    // takes the tolerance explicitly.
    macro_rules! assert_agg_results {
        ($actual:expr, $expected:expr) => {
            assert_aggregation_results_match($actual, $expected, 0.1)
        };
        ($actual:expr, $expected:expr, $tolerance:expr) => {
            assert_aggregation_results_match($actual, $expected, $tolerance)
        };
    }

    /// Builds the in-RAM index shared by the tests: four products with `category`,
    /// `brand`, `price`, `rating` and `in_stock` fields.
    ///
    /// The writer commits after the first document and again after the remaining three,
    /// so the documents are written in two separate commits.
    fn create_standard_test_index() -> crate::Result<Index> {
        let mut schema_builder = Schema::builder();
        let category = schema_builder.add_text_field("category", TEXT | FAST);
        let brand = schema_builder.add_text_field("brand", TEXT | FAST);
        let price = schema_builder.add_u64_field("price", FAST | INDEXED);
        let rating = schema_builder.add_f64_field("rating", FAST);
        let in_stock = schema_builder.add_bool_field("in_stock", FAST | INDEXED);

        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut writer: IndexWriter = index.writer_for_tests()?;

        writer.add_document(doc!(
            category => "electronics", brand => "apple",
            price => 999u64, rating => 4.5f64, in_stock => true
        ))?;
        // First commit: the apple document alone.
        writer.commit()?;
        writer.add_document(doc!(
            category => "electronics", brand => "samsung",
            price => 799u64, rating => 4.2f64, in_stock => true
        ))?;
        writer.add_document(doc!(
            category => "clothing", brand => "nike",
            price => 120u64, rating => 4.1f64, in_stock => false
        ))?;
        writer.add_document(doc!(
            category => "books", brand => "penguin",
            price => 25u64, rating => 4.8f64, in_stock => true
        ))?;

        // Second commit: samsung, nike and penguin.
        writer.commit()?;
        Ok(index)
    }

    /// Builds an `AggregationCollector` after round-tripping the request through JSON.
    ///
    /// Serializing and deserializing first makes every test also check that the
    /// aggregation request survives a serde round trip.
    fn create_collector(
        index: &Index,
        aggregations: Aggregations,
    ) -> crate::Result<AggregationCollector> {
        // Round trip: request -> JSON string -> request.
        let json = serde_json::to_string(&aggregations)?;
        let roundtripped: Aggregations = serde_json::from_str(&json)?;

        // The collector is built from the round-tripped request only.
        let params = AggContextParams::new(Default::default(), index.tokenizers().clone());
        Ok(AggregationCollector::from_aggs(roundtripped, params))
    }

    /// A single `category:electronics` filter with an `avg` sub-aggregation on `price`.
    #[test]
    fn test_basic_filter_with_metric_agg() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();

        let agg = json!({
            "electronics": {
                "filter": "category:electronics",
                "aggs": {
                    "avg_price": { "avg": { "field": "price" } }
                }
            }
        });

        let aggregations: Aggregations = serde_json::from_value(agg)?;
        let collector = create_collector(&index, aggregations)?;
        let result = searcher.search(&AllQuery, &collector)?;

        let expected = json!({
            "electronics": {
                "doc_count": 2,
                "avg_price": { "value": 899.0 }  // (999 + 799) / 2
            }
        });

        assert_agg_results!(&result, expected);
        Ok(())
    }

    /// A filter that matches nothing must still produce a bucket: doc count 0 and a
    /// `null` average from the sub-aggregation.
    #[test]
    fn test_filter_with_no_matches() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();

        let agg = json!({
            "furniture": {
                "filter": "category:furniture",
                "aggs": {
                    "avg_price": { "avg": { "field": "price" } }
                }
            }
        });

        let aggregations: Aggregations = serde_json::from_value(agg)?;
        let collector = create_collector(&index, aggregations)?;
        let result = searcher.search(&AllQuery, &collector)?;

        let expected = json!({
            "furniture": {
                "doc_count": 0,
                "avg_price": { "value": null }
            }
        });

        assert_agg_results!(&result, expected);
        Ok(())
    }

    /// Three sibling top-level filters (term, bool field, f64 range) are evaluated
    /// independently of each other in one request.
    #[test]
    fn test_multiple_independent_filters() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();

        let agg = json!({
            "electronics": {
                "filter": "category:electronics",
                "aggs": { "avg_price": { "avg": { "field": "price" } } }
            },
            "in_stock": {
                "filter": "in_stock:true",
                "aggs": { "count": { "value_count": { "field": "brand" } } }
            },
            "high_rated": {
                "filter": "rating:[4.5 TO *]",
                "aggs": { "count": { "value_count": { "field": "brand" } } }
            }
        });

        let aggregations: Aggregations = serde_json::from_value(agg)?;
        let collector = create_collector(&index, aggregations)?;
        let result = searcher.search(&AllQuery, &collector)?;

        let expected = json!({
            "electronics": {
                "doc_count": 2,
                "avg_price": { "value": 899.0 }
            },
            "in_stock": {
                "doc_count": 3,  // apple, samsung, penguin
                "count": { "value": 3.0 }
            },
            "high_rated": {
                "doc_count": 2,  // apple (4.5), penguin (4.8)
                "count": { "value": 2.0 }
            }
        });

        assert_agg_results!(&result, expected);
        Ok(())
    }

    // ============================================================================
    // Query Type Tests
    // ============================================================================

    /// A term filter on `brand` with a `max` sub-aggregation on `price`.
    #[test]
    fn test_term_query_filter() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();

        let agg = json!({
            "apple_products": {
                "filter": "brand:apple",
                "aggs": { "max_price": { "max": { "field": "price" } } }
            }
        });

        let aggregations: Aggregations = serde_json::from_value(agg)?;
        let collector = create_collector(&index, aggregations)?;
        let result = searcher.search(&AllQuery, &collector)?;

        let expected = json!({
            "apple_products": {
                "doc_count": 1,
                "max_price": { "value": 999.0 }
            }
        });

        assert_agg_results!(&result, expected);
        Ok(())
    }

    /// A bounded range filter on the `price` field.
    #[test]
    fn test_range_query_filter() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();

        let agg = json!({
            "mid_price": {
                "filter": "price:[100 TO 900]",
                "aggs": { "count": { "value_count": { "field": "brand" } } }
            }
        });

        let aggregations: Aggregations = serde_json::from_value(agg)?;
        let collector = create_collector(&index, aggregations)?;
        let result = searcher.search(&AllQuery, &collector)?;

        let expected = json!({
            "mid_price": {
                "doc_count": 2,  // samsung (799), nike (120)
                "count": { "value": 2.0 }
            }
        });

        assert_agg_results!(&result, expected);
        Ok(())
    }

    /// A boolean (`AND`) filter combining a term clause and an open-ended range clause.
    /// Also pins the assumption that the standard test index has two segments.
    #[test]
    fn test_boolean_query_filter() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();
        assert_eq!(searcher.segment_readers().len(), 2);
        let agg = json!({
            "premium_electronics": {
                "filter": "category:electronics AND price:[800 TO *]",
                "aggs": { "avg_rating": { "avg": { "field": "rating" } } }
            }
        });

        let aggregations: Aggregations = serde_json::from_value(agg)?;
        let collector = create_collector(&index, aggregations)?;
        let result = searcher.search(&AllQuery, &collector)?;

        let expected = json!({
            "premium_electronics": {
                "doc_count": 1,  // Only apple (999) is electronics with price >= 800; samsung is 799
                "avg_rating": { "value": 4.5 }
            }
        });

        assert_agg_results!(&result, expected);
        Ok(())
    }

    /// Filters on both values of the boolean `in_stock` field.
    /// Uses a tolerance of 1.0 because the expected average is rounded.
    #[test]
    fn test_bool_field_filter() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();

        let agg = json!({
            "in_stock": {
                "filter": "in_stock:true",
                "aggs": { "avg_price": { "avg": { "field": "price" } } }
            },
            "out_of_stock": {
                "filter": "in_stock:false",
                "aggs": { "count": { "value_count": { "field": "brand" } } }
            }
        });

        let aggregations: Aggregations = serde_json::from_value(agg)?;
        let collector = create_collector(&index, aggregations)?;
        let result = searcher.search(&AllQuery, &collector)?;

        let expected = json!({
            "in_stock": {
                "doc_count": 3,  // apple, samsung, penguin
                "avg_price": { "value": 607.67 }  // (999 + 799 + 25) / 3 ≈ 607.67
            },
            "out_of_stock": {
                "doc_count": 1,  // nike
                "count": { "value": 1.0 }
            }
        });

        assert_agg_results!(&result, expected, 1.0);
        Ok(())
    }

    // ============================================================================
    // Nested Filter Tests
    // ============================================================================

    /// Filters nested inside filters: a match-all root, then a term filter, then a range
    /// filter. Each level only sees the docs that passed the level above it.
    #[test]
    fn test_two_level_nested_filters() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();

        let agg = json!({
            "all": {
                "filter": "*",
                "aggs": {
                    "electronics": {
                        "filter": "category:electronics",
                        "aggs": {
                            "expensive": {
                                "filter": "price:[900 TO *]",
                                "aggs": {
                                    "count": { "value_count": { "field": "brand" } }
                                }
                            }
                        }
                    }
                }
            }
        });

        let aggregations: Aggregations = serde_json::from_value(agg)?;
        let collector = create_collector(&index, aggregations)?;
        let result = searcher.search(&AllQuery, &collector)?;

        let expected = json!({
            "all": {
                "doc_count": 4,
                "electronics": {
                    "doc_count": 2,
                    "expensive": {
                        "doc_count": 1,  // Only apple (999) is >= 900
                        "count": { "value": 1.0 }
                    }
                }
            }
        });

        assert_agg_results!(&result, expected);
        Ok(())
    }

    /// A chain of four nested filters with a metric at the innermost level; the doc count
    /// can only stay equal or shrink from one level to the next.
    #[test]
    fn test_deeply_nested_filters() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();

        let agg = json!({
            "level1": {
                "filter": "*",
                "aggs": {
                    "level2": {
                        "filter": "in_stock:true",
                        "aggs": {
                            "level3": {
                                "filter": "rating:[4.0 TO *]",
                                "aggs": {
                                    "level4": {
                                        "filter": "price:[500 TO *]",
                                        "aggs": {
                                            "final_count": { "value_count": { "field": "brand" } }
                                        }
                                    }
                                }
                            }
                        }
                    }
                }
            }
        });

        let aggregations: Aggregations = serde_json::from_value(agg)?;
        let collector = create_collector(&index, aggregations)?;
        let result = searcher.search(&AllQuery, &collector)?;

        let expected = json!({
            "level1": {
                "doc_count": 4,
                "level2": {
                    "doc_count": 3,  // in_stock: apple, samsung, penguin
                    "level3": {
                        "doc_count": 3,  // all have rating >= 4.0
                        "level4": {
                            "doc_count": 2,  // apple (999), samsung (799)
                            "final_count": { "value": 2.0 }
                        }
                    }
                }
            }
        });

        assert_agg_results!(&result, expected);
        Ok(())
    }

    /// Two sibling filters nested under a common match-all root filter.
    #[test]
    fn test_multiple_nested_branches() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();

        let agg = json!({
            "root": {
                "filter": "*",
                "aggs": {
                    "electronics_branch": {
                        "filter": "category:electronics",
                        "aggs": {
                            "avg_price": { "avg": { "field": "price" } }
                        }
                    },
                    "in_stock_branch": {
                        "filter": "in_stock:true",
                        "aggs": {
                            "count": { "value_count": { "field": "brand" } }
                        }
                    }
                }
            }
        });

        let aggregations: Aggregations = serde_json::from_value(agg)?;
        let collector = create_collector(&index, aggregations)?;
        let result = searcher.search(&AllQuery, &collector)?;

        let expected = json!({
            "root": {
                "doc_count": 4,
                "electronics_branch": {
                    "doc_count": 2,
                    "avg_price": { "value": 899.0 }
                },
                "in_stock_branch": {
                    "doc_count": 3,
                    "count": { "value": 3.0 }
                }
            }
        });

        assert_agg_results!(&result, expected);
        Ok(())
    }

    /// A three-level tree in which every nested level has two sibling filters, each with
    /// its own metric sub-aggregation.
    #[test]
    fn test_nested_filters_with_multiple_siblings_at_each_level() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();

        // Test complex nesting: multiple branches at each level
        let agg = json!({
            "all": {
                "filter": "*",
                "aggs": {
                    // Level 2: Two independent filters
                    "expensive": {
                        "filter": "price:[500 TO *]",
                        "aggs": {
                            // Level 3: Multiple branches under "expensive"
                            "electronics": {
                                "filter": "category:electronics",
                                "aggs": {
                                    "avg_rating": { "avg": { "field": "rating" } }
                                }
                            },
                            "in_stock": {
                                "filter": "in_stock:true",
                                "aggs": {
                                    "count": { "value_count": { "field": "brand" } }
                                }
                            }
                        }
                    },
                    "affordable": {
                        "filter": "price:[0 TO 200]",
                        "aggs": {
                            // Level 3: Multiple branches under "affordable"
                            "books": {
                                "filter": "category:books",
                                "aggs": {
                                    "max_rating": { "max": { "field": "rating" } }
                                }
                            },
                            "clothing": {
                                "filter": "category:clothing",
                                "aggs": {
                                    "min_price": { "min": { "field": "price" } }
                                }
                            }
                        }
                    }
                }
            }
        });

        let aggregations: Aggregations = serde_json::from_value(agg)?;
        let collector = create_collector(&index, aggregations)?;
        let result = searcher.search(&AllQuery, &collector)?;

        let expected = json!({
            "all": {
                "doc_count": 4,
                "expensive": {
                    "doc_count": 2,  // apple (999), samsung (799)
                    "electronics": {
                        "doc_count": 2,  // both are electronics
                        "avg_rating": { "value": 4.35 }  // (4.5 + 4.2) / 2
                    },
                    "in_stock": {
                        "doc_count": 2,  // both are in stock
                        "count": { "value": 2.0 }
                    }
                },
                "affordable": {
                    "doc_count": 2,  // nike (120), penguin (25)
                    "books": {
                        "doc_count": 1,  // penguin (25)
                        "max_rating": { "value": 4.8 }
                    },
                    "clothing": {
                        "doc_count": 1,  // nike (120)
                        "min_price": { "value": 120.0 }
                    }
                }
            }
        });

        assert_agg_results!(&result, expected);
        Ok(())
    }

    // ============================================================================
    // Sub-Aggregation Combination Tests
    // ============================================================================

    /// A filter whose sub-aggregation is a `terms` bucket aggregation that itself carries
    /// a metric sub-aggregation.
    #[test]
    fn test_filter_with_terms_sub_agg() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();

        let agg = json!({
            "electronics": {
                "filter": "category:electronics",
                "aggs": {
                    "brands": {
                        "terms": { "field": "brand" },
                        "aggs": {
                            "avg_price": { "avg": { "field": "price" } }
                        }
                    }
                }
            }
        });

        let aggregations: Aggregations = serde_json::from_value(agg)?;
        let collector = create_collector(&index, aggregations)?;
        let result = searcher.search(&AllQuery, &collector)?;

        // The full result is compared, including the order of the term buckets.
        let expected = json!({
            "electronics": {
                "doc_count": 2,
                "brands": {
                    "buckets": [
                        {
                            "key": "samsung",
                            "doc_count": 1,
                            "avg_price": { "value": 799.0 }
                        },
                        {
                            "key": "apple",
                            "doc_count": 1,
                            "avg_price": { "value": 999.0 }
                        }
                    ],
                    "sum_other_doc_count": 0,
                    "doc_count_error_upper_bound": 0
                }
            }
        });

        assert_agg_results!(&result, expected);
        Ok(())
    }

    /// One filter with several metric sub-aggregations (`stats`, `avg`, `value_count`)
    /// computed over the same filtered docs.
    #[test]
    fn test_filter_with_multiple_metric_aggs() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();

        let agg = json!({
            "electronics": {
                "filter": "category:electronics",
                "aggs": {
                    "price_stats": { "stats": { "field": "price" } },
                    "rating_avg": { "avg": { "field": "rating" } },
                    "count": { "value_count": { "field": "brand" } }
                }
            }
        });

        let aggregations: Aggregations = serde_json::from_value(agg)?;
        let collector = create_collector(&index, aggregations)?;
        let result = searcher.search(&AllQuery, &collector)?;

        let expected = json!({
            "electronics": {
                "doc_count": 2,
                "price_stats": {
                    "count": 2,
                    "min": 799.0,
                    "max": 999.0,
                    "sum": 1798.0,
                    "avg": 899.0
                },
                "rating_avg": { "value": 4.35 },
                "count": { "value": 2.0 }
            }
        });

        assert_agg_results!(&result, expected);
        Ok(())
    }

    // ============================================================================
    // Edge Cases and Error Handling
    // ============================================================================

    /// Running a filter aggregation against an index without any document yields an empty
    /// bucket (`doc_count` of 0) and a `null` average.
    #[test]
    fn test_filter_on_empty_index() -> crate::Result<()> {
        let schema = {
            let mut builder = Schema::builder();
            builder.add_text_field("category", TEXT | FAST);
            builder.add_u64_field("price", FAST);
            builder.build()
        };
        let index = Index::create_in_ram(schema);

        // Commit without adding anything so that the index is searchable but empty.
        let mut index_writer: IndexWriter = index.writer(50_000_000)?;
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();

        let request: Aggregations = serde_json::from_value(json!({
            "electronics": {
                "filter": "category:electronics",
                "aggs": { "avg_price": { "avg": { "field": "price" } } }
            }
        }))?;
        let collector = create_collector(&index, request)?;
        let agg_result = searcher.search(&AllQuery, &collector)?;

        let want = json!({
            "electronics": {
                "doc_count": 0,
                "avg_price": { "value": null }
            }
        });

        assert_agg_results!(&agg_result, want);
        Ok(())
    }

    /// An empty filter query string must be handled gracefully: the request either produces a
    /// well-formed aggregation result or a descriptive error, but it must not panic.
    #[test]
    fn test_malformed_query_string() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();

        // Empty query string
        let agg = json!({
            "test": {
                "filter": "",
                "aggs": { "count": { "value_count": { "field": "brand" } } }
            }
        });

        // Funnel deserialization, collector creation and search errors into a single `Result`
        // so that a failure at any stage is treated as the "graceful error" outcome.
        let result = serde_json::from_value::<Aggregations>(agg)
            .map_err(|e| crate::TantivyError::InvalidArgument(e.to_string()))
            .and_then(|aggregations| {
                let collector = create_collector(&index, aggregations)?;
                searcher.search(&AllQuery, &collector)
            });

        // Either outcome is acceptable, but each one has to be well-formed. Asserting
        // `is_ok() || is_err()` would be a tautology and verify nothing.
        match result {
            Ok(agg_result) => {
                let result_json = serde_json::to_value(&agg_result)?;
                assert!(
                    result_json["test"]["doc_count"].is_u64(),
                    "filter bucket should report an integer doc_count, got: {result_json}"
                );
            }
            Err(err) => assert!(
                !err.to_string().is_empty(),
                "error for an empty filter query should carry a message"
            ),
        }
        Ok(())
    }

    /// The filter aggregation is evaluated on top of whatever the top-level search query
    /// selects; here the search itself is restricted to in-stock documents.
    #[test]
    fn test_filter_with_base_query() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let searcher = index.reader()?.searcher();

        // Top-level query: only documents with `in_stock == true`.
        let in_stock = index.schema().get_field("in_stock").unwrap();
        let only_in_stock = TermQuery::new(
            Term::from_field_bool(in_stock, true),
            IndexRecordOption::Basic,
        );

        let request: Aggregations = serde_json::from_value(json!({
            "electronics": {
                "filter": "category:electronics",
                "aggs": { "count": { "value_count": { "field": "brand" } } }
            }
        }))?;
        let collector = create_collector(&index, request)?;
        let agg_result = searcher.search(&only_in_stock, &collector)?;

        // Both electronics documents are in stock.
        let want = json!({
            "electronics": {
                "doc_count": 2,
                "count": { "value": 2.0 }
            }
        });

        assert_agg_results!(&agg_result, want);
        Ok(())
    }

    // ============================================================================
    // Custom Query Integration Tests
    // ============================================================================

    /// A user-defined [`QueryBuilder`] can back a `FilterAggregation`: it builds a query,
    /// survives cloning, and round-trips through serde thanks to its typetag registration.
    #[test]
    fn test_custom_query_builder() -> crate::Result<()> {
        // Query builder with full serde support, producing a term query on a text field.
        #[derive(Debug, Clone, Serialize, Deserialize)]
        struct TestTermQueryBuilder {
            field_name: String,
            term_text: String,
        }

        #[typetag::serde(name = "TestTermQueryBuilder")]
        impl QueryBuilder for TestTermQueryBuilder {
            fn build_query(
                &self,
                schema: &Schema,
                _tokenizers: &TokenizerManager,
            ) -> crate::Result<Box<dyn Query>> {
                let field = schema.get_field(&self.field_name)?;
                let term_query = TermQuery::new(
                    Term::from_field_text(field, &self.term_text),
                    IndexRecordOption::Basic,
                );
                Ok(Box::new(term_query))
            }

            fn box_clone(&self) -> Box<dyn QueryBuilder> {
                Box::new(self.clone())
            }
        }

        let index = create_standard_test_index()?;
        let schema = index.schema();
        let tokenizers = index.tokenizers();

        let filter_agg = FilterAggregation::new_with_builder(Box::new(TestTermQueryBuilder {
            field_name: "category".to_string(),
            term_text: "electronics".to_string(),
        }));

        // The builder is invoked when the filter parses its query; the debug output of the
        // resulting query should name `TermQuery`.
        let built = filter_agg.parse_query(&schema, tokenizers)?;
        let built_repr = format!("{built:?}");
        assert!(built_repr.contains("TermQuery"));

        // A clone must build the same kind of query.
        let from_clone = filter_agg.clone().parse_query(&schema, tokenizers)?;
        let from_clone_repr = format!("{from_clone:?}");
        assert!(from_clone_repr.contains("TermQuery"));

        // Custom builders are serializable through typetag.
        let serialized = serde_json::to_string(&filter_agg)?;
        assert!(
            serialized.contains("TestTermQueryBuilder"),
            "Serialized JSON should contain the type tag"
        );
        assert!(
            serialized.contains("electronics"),
            "Serialized JSON should contain the field data"
        );

        // ... and deserializable back into a working filter.
        let restored: FilterAggregation = serde_json::from_str(&serialized)?;
        let from_restored = restored.parse_query(&schema, tokenizers)?;
        let from_restored_repr = format!("{from_restored:?}");
        assert!(from_restored_repr.contains("TermQuery"));

        Ok(())
    }

    /// A query-string based `FilterAggregation` survives a serde round-trip and still
    /// selects the two electronics documents afterwards.
    #[test]
    fn test_query_string_serialization() -> crate::Result<()> {
        let original = FilterAggregation::new("category:electronics".to_string());

        let as_json = serde_json::to_string(&original)?;
        assert!(as_json.contains("electronics"));
        let restored: FilterAggregation = serde_json::from_str(&as_json)?;

        // Exercise the restored filter in a real aggregation request.
        let index = create_standard_test_index()?;
        let searcher = index.reader()?.searcher();

        let request: Aggregations = serde_json::from_value(json!({
            "test": {
                "filter": restored,
                "aggs": { "count": { "value_count": { "field": "brand" } } }
            }
        }))?;
        let collector = create_collector(&index, request)?;
        let agg_result = searcher.search(&AllQuery, &collector)?;

        // Should match 2 electronics
        let agg_result_json = serde_json::to_value(&agg_result)?;
        assert_eq!(agg_result_json["test"]["doc_count"], 2);

        Ok(())
    }

    /// A `FilterAggregation` backed by a custom builder is serialized, deserialized and then
    /// executed, and must still produce the expected document count.
    #[test]
    fn test_query_builder_serialization_roundtrip() -> crate::Result<()> {
        // Serializable query builder producing a term query on a text field.
        #[derive(Debug, Clone, Serialize, Deserialize)]
        struct RoundtripTermQueryBuilder {
            field_name: String,
            term_text: String,
        }

        #[typetag::serde(name = "RoundtripTermQueryBuilder")]
        impl QueryBuilder for RoundtripTermQueryBuilder {
            fn build_query(
                &self,
                schema: &Schema,
                _tokenizers: &TokenizerManager,
            ) -> crate::Result<Box<dyn Query>> {
                let field = schema.get_field(&self.field_name)?;
                let term_query = TermQuery::new(
                    Term::from_field_text(field, &self.term_text),
                    IndexRecordOption::Basic,
                );
                Ok(Box::new(term_query))
            }

            fn box_clone(&self) -> Box<dyn QueryBuilder> {
                Box::new(self.clone())
            }
        }

        let index = create_standard_test_index()?;

        let filter_agg = FilterAggregation::new_with_builder(Box::new(RoundtripTermQueryBuilder {
            field_name: "category".to_string(),
            term_text: "electronics".to_string(),
        }));

        let serialized = serde_json::to_string(&filter_agg)?;

        // The serialized form has to carry the type tag as well as both builder fields.
        let required_fragments = [
            (
                "RoundtripTermQueryBuilder",
                "Serialized JSON should contain type tag",
            ),
            ("category", "Serialized JSON should contain field_name"),
            ("electronics", "Serialized JSON should contain term_text"),
        ];
        for (fragment, message) in required_fragments {
            assert!(serialized.contains(fragment), "{message}");
        }

        let restored: FilterAggregation = serde_json::from_str(&serialized)?;

        // Run the restored filter to make sure it still selects the right documents.
        let request: Aggregations = serde_json::from_value(json!({
            "filtered": {
                "filter": restored
            }
        }))?;
        let searcher = index.reader()?.searcher();
        let collector = create_collector(&index, request)?;
        let agg_result = searcher.search(&AllQuery, &collector)?;

        let agg_result_json = serde_json::to_value(&agg_result)?;
        assert_eq!(agg_result_json["filtered"]["doc_count"], 2);

        Ok(())
    }

    // ============================================================================
    // Correctness Validation Tests
    // ============================================================================

    /// Computes the same average twice, once inside a filter aggregation under `AllQuery` and
    /// once as a plain aggregation under an equivalent `TermQuery`, and checks that both report
    /// the same value.
    #[test]
    fn test_filter_result_correctness_vs_separate_query() -> crate::Result<()> {
        let index = create_standard_test_index()?;
        let searcher = index.reader()?.searcher();

        // Method 1: the condition lives in the filter aggregation.
        let via_filter_request: Aggregations = serde_json::from_value(json!({
            "electronics": {
                "filter": "category:electronics",
                "aggs": { "avg_price": { "avg": { "field": "price" } } }
            }
        }))?;
        let via_filter_collector = create_collector(&index, via_filter_request)?;
        let via_filter = searcher.search(&AllQuery, &via_filter_collector)?;

        // Method 2: the condition lives in the search query.
        let category = index.schema().get_field("category").unwrap();
        let electronics_query = TermQuery::new(
            Term::from_field_text(category, "electronics"),
            IndexRecordOption::Basic,
        );
        let via_query_request: Aggregations = serde_json::from_value(json!({
            "result": { "avg": { "field": "price" } }
        }))?;
        let via_query_collector =
            AggregationCollector::from_aggs(via_query_request, Default::default());
        let via_query = searcher.search(&electronics_query, &via_query_collector)?;

        // Both approaches have to agree on the average price.
        let via_filter_want = json!({
            "electronics": {
                "doc_count": 2,
                "avg_price": { "value": 899.0 }
            }
        });
        let via_query_want = json!({
            "result": {
                "value": 899.0
            }
        });

        assert_agg_results!(&via_filter, via_filter_want);
        assert_agg_results!(&via_query, via_query_want);

        Ok(())
    }

    /// The filter query has to be parsed with the index's own tokenizers: with them the
    /// case-sensitive field matches exactly, without them the search fails because the
    /// tokenizer named by the schema is unknown.
    #[test]
    fn test_custom_tokenizer_required() -> crate::Result<()> {
        use crate::schema::{TextFieldIndexing, TextOptions};
        use crate::tokenizer::{SimpleTokenizer, TextAnalyzer, TokenizerManager};

        // Analyzer built from `SimpleTokenizer` alone, i.e. without a lowercasing filter,
        // registered under a name the default manager is not expected to know.
        let tokenizer_manager = TokenizerManager::default();
        tokenizer_manager.register(
            "my_custom",
            TextAnalyzer::builder(SimpleTokenizer::default()).build(),
        );

        // Schema with a single stored text field indexed through that analyzer.
        let indexing = TextFieldIndexing::default()
            .set_tokenizer("my_custom")
            .set_index_option(IndexRecordOption::Basic);
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field(
            "text",
            TextOptions::default()
                .set_indexing_options(indexing)
                .set_stored(),
        );

        let index = crate::IndexBuilder::new()
            .schema(schema_builder.build())
            .tokenizers(tokenizer_manager)
            .create_in_ram()?;
        let mut writer = index.writer(50_000_000)?;

        // Two uppercase documents plus a lowercase twin of the first one.
        for text in ["HELLO", "WORLD", "hello"] {
            writer.add_document(doc!(text_field => text))?;
        }
        writer.commit()?;

        let searcher = index.reader()?.searcher();

        let request: Aggregations = serde_json::from_value(json!({
            "uppercase_hello": {
                "filter": "text:HELLO"
            }
        }))?;

        // Case 1: collector created from the index, so the custom tokenizer is available.
        let index_aware_collector = create_collector(&index, request.clone())?;
        let index_aware_result = searcher.search(&AllQuery, &index_aware_collector)?;
        let index_aware_json = serde_json::to_value(&index_aware_result)?;
        assert_eq!(
            index_aware_json["uppercase_hello"]["doc_count"], 1,
            "With custom tokenizer from index, should match exactly 1 UPPERCASE document"
        );

        // Case 2: collector built with a fresh default manager that lacks "my_custom".
        let default_collector = AggregationCollector::from_aggs(
            request,
            AggContextParams::new(Default::default(), TokenizerManager::default()),
        );
        let failure = match searcher.search(&AllQuery, &default_collector) {
            Ok(_) => panic!("Without proper tokenizers, query parsing should fail"),
            Err(err) => err,
        };
        assert!(
            failure.to_string().contains("my_custom"),
            "Error should mention the missing tokenizer"
        );

        Ok(())
    }
}


================================================
FILE: src/aggregation/bucket/histogram/date_histogram.rs
================================================
use serde::{Deserialize, Serialize};

use super::{HistogramAggregation, HistogramBounds};
use crate::aggregation::*;

/// DateHistogramAggregation is similar to `HistogramAggregation`, but it can only be used with date
/// type.
///
/// Currently only **fixed time** intervals are supported. Calendar-aware time intervals are not
/// supported.
///
/// Like the histogram, values are rounded down into the closest bucket.
///
/// For this calculation all fastfield values are converted to f64.
///
/// # Limitations/Compatibility
/// Only fixed time intervals are supported.
///
/// # JSON Format
/// ```json
/// {
///     "prices": {
///         "date_histogram": {
///             "field": "price",
///             "fixed_interval": "30d"
///         }
///     }
/// }
/// ```
///
/// Response
/// See [`BucketEntry`](crate::aggregation::agg_result::BucketEntry)
#[derive(Clone, Debug, Default, PartialEq, Serialize, Deserialize)]
pub struct DateHistogramAggregationReq {
    #[doc(hidden)]
    /// Only for validation: the `interval` parameter is unsupported, and a request that sets it
    /// is rejected with an error pointing to `fixed_interval`.
    pub interval: Option<String>,
    #[doc(hidden)]
    /// Only for validation: the `calendar_interval` parameter is unsupported, and a request
    /// that sets it is rejected with an error pointing to `fixed_interval`.
    pub calendar_interval: Option<String>,
    /// The field to aggregate on.
    pub field: String,
    /// The format to format dates. Currently unsupported: a request that sets it is rejected.
    pub format: Option<String>,
    /// The interval to chunk your data range. Each bucket spans a value range of
    /// [0..fixed_interval).
    ///
    /// Fixed intervals are configured with the `fixed_interval` parameter.
    /// In contrast to calendar-aware intervals, fixed intervals are a fixed number of SI units and
    /// never deviate, regardless of where they fall on the calendar. One second is always
    /// composed of 1000ms. This allows fixed intervals to be specified in any multiple of the
    /// supported units. However, it means fixed intervals cannot express other units such as
    /// months, since the duration of a month is not a fixed quantity. Attempting to specify a
    /// calendar interval like month or quarter will return an Error.
    ///
    /// The accepted units for fixed intervals are:
    /// * `ms` (or `milliseconds`): milliseconds
    /// * `s` (or `seconds`): seconds. Defined as 1000 milliseconds each.
    /// * `m` (or `minutes`): minutes. Defined as 60 seconds each (60_000 milliseconds).
    /// * `h` (or `hours`): hours. Defined as 60 minutes each (3_600_000 milliseconds).
    /// * `d` (or `days`): days. Defined as 24 hours (86_400_000 milliseconds).
    ///
    /// Fractional time values are not supported, but you can address this by shifting to another
    /// time unit (e.g., `1.5h` could instead be specified as `90m`).
    ///
    /// `Option` for validation, the parameter is not optional
    pub fixed_interval: Option<String>,
    /// Intervals implicitly defines an absolute grid of buckets `[interval * k, interval * (k +
    /// 1))`.
    ///
    /// Offset makes it possible to shift this grid into
    /// `[offset + interval * k, offset + interval * (k + 1))`. Offset has to be in the range [0,
    /// interval).
    ///
    /// The `offset` parameter has the same syntax as the `fixed_interval` parameter, but
    /// additionally accepts a leading `+` or `-` sign, which allows for negative values.
    pub offset: Option<String>,
    /// The minimum number of documents in a bucket to be returned. Defaults to 0.
    pub min_doc_count: Option<u64>,
    /// Limits the data range to `[min, max]` closed interval.
    ///
    /// This can be used to filter values if they are not in the data range.
    ///
    /// hard_bounds only limits the buckets, to force a range set both extended_bounds and
    /// hard_bounds to the same range.
    ///
    /// Needs to be provided as timestamp in millisecond precision.
    ///
    /// ## Example
    /// ```json
    /// {
    ///     "sales_over_time": {
    ///        "date_histogram": {
    ///            "field": "dates",
    ///            "fixed_interval": "1d",
    ///            "hard_bounds": {
    ///                "min": 0,
    ///                "max": 1420502400000
    ///            }
    ///        }
    ///    }
    /// }
    /// ```
    pub hard_bounds: Option<HistogramBounds>,
    /// Can be set to extend your bounds. The range of the buckets is by default defined by the
    /// data range of the values of the documents. As the name suggests, this can only be used to
    /// extend the value range. If the bounds for min or max are not extending the range, the value
    /// has no effect on the returned buckets.
    ///
    /// Cannot be set in conjunction with min_doc_count > 0, since the empty buckets from extended
    /// bounds would not be returned.
    pub extended_bounds: Option<HistogramBounds>,

    /// Whether to return the buckets as a hash map
    #[serde(default)]
    pub keyed: bool,
}

impl DateHistogramAggregationReq {
    /// Converts this request into the equivalent numeric [`HistogramAggregation`].
    ///
    /// The request is validated first; `fixed_interval` and the optional `offset` are then
    /// parsed into milliseconds and stored as `f64`. All remaining settings are copied over.
    ///
    /// # Errors
    /// Returns an error if validation fails or if `offset` cannot be parsed.
    pub(crate) fn to_histogram_req(&self) -> crate::Result<HistogramAggregation> {
        self.validate()?;

        // `validate` has already rejected a missing `fixed_interval`, so this cannot panic.
        let fixed_interval = self.fixed_interval.as_deref().unwrap();
        let interval = parse_into_milliseconds(fixed_interval)? as f64;

        let offset = match self.offset.as_deref() {
            Some(raw_offset) => Some(parse_offset_into_milliseconds(raw_offset)? as f64),
            None => None,
        };

        Ok(HistogramAggregation {
            field: self.field.clone(),
            interval,
            offset,
            min_doc_count: self.min_doc_count,
            hard_bounds: self.hard_bounds,
            extended_bounds: self.extended_bounds,
            keyed: self.keyed,
            is_normalized_to_ns: false,
        })
    }

    /// Checks that only supported parameters are used and that `fixed_interval` is present
    /// and parseable.
    ///
    /// # Errors
    /// Returns `InvalidArgument` if `interval`, `calendar_interval` or `format` is set, or if
    /// `fixed_interval` is missing. A `fixed_interval` that fails to parse yields the
    /// corresponding parse error.
    fn validate(&self) -> crate::Result<()> {
        // Unsupported parameters are checked in a fixed order; the first one found is reported.
        let unsupported = if let Some(interval) = &self.interval {
            Some(format!(
                "`interval` parameter {interval:?} in date histogram is unsupported, only \
                 `fixed_interval` is supported"
            ))
        } else if let Some(interval) = &self.calendar_interval {
            Some(format!(
                "`calendar_interval` parameter {interval:?} in date histogram is unsupported, \
                 only `fixed_interval` is supported"
            ))
        } else if self.format.is_some() {
            Some("format parameter on date_histogram is unsupported".to_string())
        } else {
            None
        };
        if let Some(message) = unsupported {
            return Err(crate::TantivyError::InvalidArgument(message));
        }

        let fixed_interval = self.fixed_interval.as_deref().ok_or_else(|| {
            crate::TantivyError::InvalidArgument(
                "fixed_interval in date histogram is missing".to_string(),
            )
        })?;

        // Only the parse outcome matters here; the value itself is discarded.
        parse_into_milliseconds(fixed_interval)?;

        Ok(())
    }
}

#[derive(Debug, Clone, PartialEq, Eq, Error)]
/// Errors when parsing the fixed interval or the offset for `DateHistogramAggregationReq`.
///
/// Unless noted otherwise, the payload is the string that was passed to the parser.
pub enum DateHistogramParseError {
    /// Unit not recognized in passed String. The payload is the unrecognized unit only, not
    /// the whole input.
    #[error("Unit not recognized in passed String {0:?}")]
    UnitNotRecognized(String),
    /// Number not found in passed String, i.e. the input does not start with an ASCII digit
    /// (also used when the leading digits cannot be parsed as a number).
    #[error("Number not found in passed String {0:?}")]
    NumberMissing(String),
    /// Unit not found in passed String, i.e. nothing follows the leading digits.
    #[error("Unit not found in passed String {0:?}")]
    UnitMissing(String),
    /// Offset invalid. Returned when the offset string is empty.
    #[error("passed offset is invalid {0:?}")]
    InvalidOffset(String),
    /// Value out of bounds. Returned when the duration does not fit into an `i64` once
    /// converted to nanoseconds.
    #[error("passed value is out of bounds: {0:?}")]
    OutOfBounds(String),
}

/// Parses an offset such as `"-4d"`, `"+1m"` or `"90s"` into a number of milliseconds.
///
/// The syntax is the one accepted by `parse_into_milliseconds`, optionally preceded by a single
/// `+` or `-` sign. A leading `-` negates the parsed value.
///
/// # Errors
/// Returns [`DateHistogramParseError::InvalidOffset`] for an empty input. Otherwise any error
/// from parsing the part after the optional sign is passed through unchanged.
fn parse_offset_into_milliseconds(input: &str) -> Result<i64, AggregationError> {
    if input.is_empty() {
        return Err(DateHistogramParseError::InvalidOffset(input.to_string()).into());
    }

    // At most one sign is consumed; whatever follows is handed to the unsigned parser.
    if let Some(magnitude) = input.strip_prefix('-') {
        return parse_into_milliseconds(magnitude).map(|millis| -millis);
    }
    parse_into_milliseconds(input.strip_prefix('+').unwrap_or(input))
}

/// Parses a duration such as `"30d"` or `"90minutes"` into a number of milliseconds.
///
/// The input must consist of a run of ASCII digits immediately followed by one of the units
/// `ms`/`milliseconds`, `s`/`seconds`, `m`/`minutes`, `h`/`hours` or `d`/`days`. Signs,
/// fractional values and surrounding whitespace are not accepted.
///
/// # Errors
/// * [`DateHistogramParseError::NumberMissing`] if the input does not start with an ASCII
///   digit, or if the digits cannot be parsed as an `i64`.
/// * [`DateHistogramParseError::UnitMissing`] if nothing follows the digits.
/// * [`DateHistogramParseError::UnitNotRecognized`] if the unit is not one of those listed
///   above.
/// * [`DateHistogramParseError::OutOfBounds`] if the duration in milliseconds, or its
///   equivalent in nanoseconds, does not fit into an `i64`.
pub(crate) fn parse_into_milliseconds(input: &str) -> Result<i64, AggregationError> {
    // Split on bytes rather than chars so that only ASCII digits count as part of the number.
    let split_boundary = input
        .as_bytes()
        .iter()
        .take_while(|byte| byte.is_ascii_digit())
        .count();
    let (number, unit) = input.split_at(split_boundary);
    if number.is_empty() {
        return Err(DateHistogramParseError::NumberMissing(input.to_string()).into());
    }
    if unit.is_empty() {
        return Err(DateHistogramParseError::UnitMissing(input.to_string()).into());
    }
    let number: i64 = number
        .parse()
        // `number` is a non-empty run of ASCII digits here, so parsing can only fail when the
        // value does not fit into an `i64`.
        .map_err(|_err| DateHistogramParseError::NumberMissing(input.to_string()))?;

    let unit_in_ms: i64 = match unit {
        "ms" | "milliseconds" => 1,
        "s" | "seconds" => 1000,
        "m" | "minutes" => 60 * 1000,
        "h" | "hours" => 60 * 60 * 1000,
        "d" | "days" => 24 * 60 * 60 * 1000,
        _ => return Err(DateHistogramParseError::UnitNotRecognized(unit.to_string()).into()),
    };

    // Both multiplications are checked: the conversion to milliseconds can itself overflow
    // for very large numbers, and the field type is in nanoseconds precision, so the value
    // must also still fit once scaled by 1_000_000.
    let val = number
        .checked_mul(unit_in_ms)
        .filter(|millis| millis.checked_mul(1_000_000).is_some())
        .ok_or_else(|| DateHistogramParseError::OutOfBounds(input.to_string()))?;

    Ok(val)
}

#[cfg(test)]
pub(crate) mod tests {
    use pretty_assertions::assert_eq;

    use super::*;
    use crate::aggregation::agg_req::Aggregations;
    use crate::aggregation::tests::exec_request;
    use crate::indexer::NoMergePolicy;
    use crate::schema::{Schema, FAST, STRING};
    use crate::{Index, IndexWriter, TantivyDocument};

    /// Covers the happy path (short and long unit spellings) and one input for each of the
    /// "unknown unit", "missing unit" and "missing number" errors.
    #[test]
    fn test_parse_into_millisecs() {
        let accepted = [("1m", 60_000), ("2m", 120_000), ("2minutes", 120_000)];
        for (input, expected_ms) in accepted {
            assert_eq!(parse_into_milliseconds(input).unwrap(), expected_ms);
        }

        let rejected = [
            (
                "2y",
                DateHistogramParseError::UnitNotRecognized("y".to_string()),
            ),
            (
                "2000",
                DateHistogramParseError::UnitMissing("2000".to_string()),
            ),
            (
                "ms",
                DateHistogramParseError::NumberMissing("ms".to_string()),
            ),
        ];
        for (input, expected_err) in rejected {
            assert_eq!(
                parse_into_milliseconds(input).unwrap_err(),
                expected_err.into()
            );
        }
    }

    /// Offsets accept an optional leading sign; apart from that they parse, and fail, exactly
    /// like unsigned durations.
    #[test]
    fn test_parse_offset_into_milliseconds() {
        let accepted = [
            ("1m", 60_000),
            ("+1m", 60_000),
            ("-1m", -60_000),
            ("2m", 120_000),
            ("+2m", 120_000),
            ("-2m", -120_000),
            ("-2ms", -2),
        ];
        for (input, expected_ms) in accepted {
            assert_eq!(parse_offset_into_milliseconds(input).unwrap(), expected_ms);
        }

        let rejected = [
            (
                "2y",
                DateHistogramParseError::UnitNotRecognized("y".to_string()),
            ),
            (
                "2000",
                DateHistogramParseError::UnitMissing("2000".to_string()),
            ),
            (
                "ms",
                DateHistogramParseError::NumberMissing("ms".to_string()),
            ),
        ];
        for (input, expected_err) in rejected {
            assert_eq!(
                parse_offset_into_milliseconds(input).unwrap_err(),
                expected_err.into()
            );
        }
    }

    /// Only ASCII digits are accepted as the numeric part of a duration.
    #[test]
    fn test_parse_into_milliseconds_do_not_accept_non_ascii() {
        // The leading character is the fullwidth digit one (U+FF11), not the ASCII `1`.
        assert!(parse_into_milliseconds("１m").is_err());
    }

    /// Builds an in-RAM index with the fields `date`, `mixed`, `text` and `text2` from JSON
    /// documents.
    ///
    /// Each inner `Vec` of `segment_and_docs` is committed separately, with merging disabled
    /// through `NoMergePolicy`. When `merge_segments` is `true` and more than one searchable
    /// segment exists afterwards, those segments are merged before the index is returned.
    pub fn get_test_index_from_docs(
        merge_segments: bool,
        segment_and_docs: &[Vec<&str>],
    ) -> crate::Result<Index> {
        let schema = {
            let mut builder = Schema::builder();
            builder.add_date_field("date", FAST);
            builder.add_json_field("mixed", FAST);
            builder.add_text_field("text", FAST | STRING);
            builder.add_text_field("text2", FAST | STRING);
            builder.build()
        };
        let index = Index::create_in_ram(schema.clone());

        {
            let mut writer = index.writer_with_num_threads(1, 30_000_000)?;
            writer.set_merge_policy(Box::new(NoMergePolicy));
            for segment_docs in segment_and_docs {
                for raw_doc in segment_docs {
                    let parsed = TantivyDocument::parse_json(&schema, raw_doc)?;
                    writer.add_document(parsed)?;
                }
                // One commit per group of documents.
                writer.commit()?;
            }
        }

        if !merge_segments {
            return Ok(index);
        }

        let segment_ids = index
            .searchable_segment_ids()
            .expect("Searchable segments failed.");
        // Merging is only attempted when there is more than one segment.
        if segment_ids.len() > 1 {
            let mut merge_writer: IndexWriter = index.writer_for_tests()?;
            merge_writer.merge(&segment_ids).wait()?;
            merge_writer.wait_merging_threads()?;
        }

        Ok(index)
    }

    /// Runs the shared date histogram scenario with `merge_segments` set to `true`.
    #[test]
    fn histogram_test_date_force_merge_segments() {
        histogram_test_date_merge_segments(true)
    }

    /// Runs the shared date histogram scenario with `merge_segments` set to `false`.
    #[test]
    fn histogram_test_date() {
        histogram_test_date_merge_segments(false)
    }

    /// Runs a series of `date_histogram` requests against a six-document index and checks the
    /// exact JSON result of each one.
    ///
    /// The documents carry three dates on 2015-01-01, one on 2015-01-02 and two on 2015-01-06.
    /// `merge_segments` is forwarded unchanged to `get_test_index_from_docs`.
    fn histogram_test_date_merge_segments(merge_segments: bool) {
        let docs = vec![
            vec![r#"{ "date": "2015-01-01T12:10:30Z", "text": "aaa" }"#],
            vec![r#"{ "date": "2015-01-01T11:11:30Z", "text": "bbb" }"#],
            vec![r#"{ "date": "2015-01-01T11:11:30Z", "text": "bbb" }"#],
            vec![r#"{ "date": "2015-01-02T00:00:00Z", "text": "bbb" }"#],
            vec![r#"{ "date": "2015-01-06T00:00:00Z", "text": "ccc" }"#],
            vec![r#"{ "date": "2015-01-06T00:00:00Z", "text": "ccc" }"#],
        ];
        let index = get_test_index_from_docs(merge_segments, &docs).unwrap();

        {
            // 30day + offset: all six documents are expected in a single bucket
            let elasticsearch_compatible_json = json!(
                {
                "sales_over_time": {
                    "date_histogram": {
                    "field": "date",
                    "fixed_interval": "30d",
                    "offset": "-4d"
                    }
                }
                }
            );

            let agg_req: Aggregations = serde_json::from_str(
                &serde_json::to_string(&elasticsearch_compatible_json).unwrap(),
            )
            .unwrap();
            let res = exec_request(agg_req, &index).unwrap();
            let expected_res = json!({
                "sales_over_time" : {
                    "buckets" : [
                        {
                            "key_as_string" : "2015-01-01T00:00:00Z",
                            "key" : 1420070400000.0,
                            "doc_count" : 6
                        }
                    ]
                }
            });
            assert_eq!(res, expected_res);
        }

        {
            // 30day + offset + sub_agg: same single bucket, with a terms sub-aggregation on `text`
            let elasticsearch_compatible_json = json!(
                {
                    "sales_over_time": {
                        "date_histogram": {
                        "field": "date",
                        "fixed_interval": "30d",
                        "offset": "-4d"
                        },
                        "aggs": {
                            "texts": {
                                "terms": {"field": "text"}
                            }
                        }
                    }
                }
            );

            let agg_req: Aggregations = serde_json::from_str(
                &serde_json::to_string(&elasticsearch_compatible_json).unwrap(),
            )
            .unwrap();
            let res = exec_request(agg_req, &index).unwrap();
            let expected_res = json!({
                "sales_over_time" : {
                "buckets" : [
                    {
                        "key_as_string" : "2015-01-01T00:00:00Z",
                        "key" : 1420070400000.0,
                        "doc_count" : 6,
                        "texts": {
                            "buckets": [
                                {
                                "doc_count": 3,
                                "key": "bbb"
                                },
                                {
                                "doc_count": 2,
                                "key": "ccc"
                                },
                                {
                                "doc_count": 1,
                                "key": "aaa"
                                }
                            ],
                            "doc_count_error_upper_bound": 0,
                            "sum_other_doc_count": 0
                            }
                        }
                    ]
                }
            });
            assert_eq!(res, expected_res);
        }
        {
            // 1day: empty buckets between the first and last populated day are expected
            let elasticsearch_compatible_json = json!(
                {
                    "sales_over_time": {
                        "date_histogram": {
                            "field": "date",
                            "fixed_interval": "1d"
                        }
                    }
                }
            );

            let agg_req: Aggregations = serde_json::from_str(
                &serde_json::to_string(&elasticsearch_compatible_json).unwrap(),
            )
            .unwrap();
            let res = exec_request(agg_req, &index).unwrap();
            let expected_res = json!( {
                "sales_over_time": {
                    "buckets": [
                        {
                            "doc_count": 3,
                            "key": 1420070400000.0,
                            "key_as_string": "2015-01-01T00:00:00Z"
                        },
                        {
                            "doc_count": 1,
                            "key": 1420156800000.0,
                            "key_as_string": "2015-01-02T00:00:00Z"
                        },
                        {
                            "doc_count": 0,
                            "key": 1420243200000.0,
                            "key_as_string": "2015-01-03T00:00:00Z"
                        },
                        {
                            "doc_count": 0,
                            "key": 1420329600000.0,
                            "key_as_string": "2015-01-04T00:00:00Z"
                        },
                        {
                            "doc_count": 0,
                            "key": 1420416000000.0,
                            "key_as_string": "2015-01-05T00:00:00Z"
                        },
                        {
                            "doc_count": 2,
                            "key": 1420502400000.0,
                            "key_as_string": "2015-01-06T00:00:00Z"
                        }
                    ]
                }
            });
            assert_eq!(res, expected_res);
        }

        {
            // 1day + extended_bounds: one extra empty bucket is expected on each side of the data
            let elasticsearch_compatible_json = json!(
                {
                    "sales_over_time": {
                        "date_histogram": {
                            "field": "date",
                            "fixed_interval": "1d",
                            "extended_bounds": {
                                "min": 1419984000000.0,
                                "max": 1420588800000.0
                            }
                        }
                    }
                }
            );

            let agg_req: Aggregations = serde_json::from_str(
                &serde_json::to_string(&elasticsearch_compatible_json).unwrap(),
            )
            .unwrap();
            let res = exec_request(agg_req, &index).unwrap();
            let expected_res = json!({
                "sales_over_time" : {
                    "buckets": [
                        {
                            "doc_count": 0,
                            "key": 1419984000000.0,
                            "key_as_string": "2014-12-31T00:00:00Z"
                        },
                        {
                            "doc_count": 3,
                            "key": 1420070400000.0,
                            "key_as_string": "2015-01-01T00:00:00Z"
                        },
                        {
                            "doc_count": 1,
                            "key": 1420156800000.0,
                            "key_as_string": "2015-01-02T00:00:00Z"
                        },
                        {
                            "doc_count": 0,
                            "key": 1420243200000.0,
                            "key_as_string": "2015-01-03T00:00:00Z"
                        },
                        {
                            "doc_count": 0,
                            "key": 1420329600000.0,
                            "key_as_string": "2015-01-04T00:00:00Z"
                        },
                        {
                            "doc_count": 0,
                            "key": 1420416000000.0,
                            "key_as_string": "2015-01-05T00:00:00Z"
                        },
                        {
                            "doc_count": 2,
                            "key": 1420502400000.0,
                            "key_as_string": "2015-01-06T00:00:00Z"
                        },
                        {
                            "doc_count": 0,
                            "key": 1420588800000.0,
                            "key_as_string": "2015-01-07T00:00:00Z"
                        }
                    ]
                }
            });
            assert_eq!(res, expected_res);
        }
        {
            // 1day + hard_bounds given as millisecond timestamps
            let elasticsearch_compatible_json = json!(
                {
                    "sales_over_time": {
                        "date_histogram": {
                            "field": "date",
                            "fixed_interval": "1d",
                            "hard_bounds": {
                                "min": 1420156800000.0,
                                "max": 1420243200000.0
                            }
                        }
                    }
                }
            );

            let agg_req: Aggregations = serde_json::from_str(
                &serde_json::to_string(&elasticsearch_compatible_json).unwrap(),
            )
            .unwrap();
            let res = exec_request(agg_req, &index).unwrap();
            let expected_res = json!({
                "sales_over_time" : {
                    "buckets": [
                        {
                            "doc_count": 1,
                            "key": 1420156800000.0,
                            "key_as_string": "2015-01-02T00:00:00Z"
                        }
                    ]
                }
            });
            assert_eq!(res, expected_res);
        }

        {
            // 1day + hard_bounds as Rfc3339
            let elasticsearch_compatible_json = json!(
                {
                    "sales_over_time": {
                        "date_histogram": {
                            "field": "date",
                            "fixed_interval": "1d",
                            "hard_bounds": {
                                "min": "2015-01-02T00:00:00Z",
                                "max": "2015-01-02T12:00:00Z"
                            }
                        }
                    }
                }
            );

            let agg_req: Aggregations = serde_json::from_str(
                &serde_json::to_string(&elasticsearch_compatible_json).unwrap(),
            )
            .unwrap();
            let res = exec_request(agg_req, &index).unwrap();
            let expected_res = json!({
                "sales_over_time" : {
                    "buckets": [
                        {
                            "doc_count": 1,
                            "key": 1420156800000.0,
                            "key_as_string": "2015-01-02T00:00:00Z"
                        }
                    ]
                }
            });
            assert_eq!(res, expected_res);
        }
    }
    /// A date histogram that uses the legacy `interval` parameter instead of `fixed_interval`
    /// must be rejected with a descriptive error.
    #[test]
    fn histogram_test_invalid_req() {
        let no_docs = vec![];
        let index = get_test_index_from_docs(false, &no_docs).unwrap();

        let request = json!({
            "sales_over_time": {
                "date_histogram": {
                    "field": "date",
                    "interval": "30d",
                    "offset": "-4d"
                }
            }
        });
        let request_str = serde_json::to_string(&request).unwrap();
        let agg_req: Aggregations = serde_json::from_str(&request_str).unwrap();

        let message = exec_request(agg_req, &index).unwrap_err().to_string();
        assert_eq!(
            message,
            r#"An invalid argument was passed: '`interval` parameter "30d" in date histogram is unsupported, only `fixed_interval` is supported'"#
        );
    }
}


================================================
FILE: src/aggregation/bucket/histogram/histogram.rs
================================================
use std::cmp::Ordering;

use columnar::{Column, ColumnType};
use rustc_hash::FxHashMap;
use serde::{Deserialize, Serialize};
use tantivy_bitpacker::minmax;

use crate::aggregation::agg_data::{
    build_segment_agg_collectors, AggRefNode, AggregationsSegmentCtx,
};
use crate::aggregation::agg_req::Aggregations;
use crate::aggregation::agg_result::BucketEntry;
use crate::aggregation::cached_sub_aggs::{CachedSubAggs, HighCardCachedSubAggs};
use crate::aggregation::intermediate_agg_result::{
    IntermediateAggregationResult, IntermediateAggregationResults, IntermediateBucketResult,
    IntermediateHistogramBucketEntry,
};
use crate::aggregation::segment_agg_result::{BucketIdProvider, SegmentAggregationCollector};
use crate::aggregation::*;
use crate::TantivyError;

/// Contains all information required by the SegmentHistogramCollector to perform the
/// histogram or date_histogram aggregation on a segment.
///
/// `bounds` and `offset` are derived from `req` when the collector is built in
/// `SegmentHistogramCollector::from_req_and_validate`.
pub struct HistogramAggReqData {
    /// The column accessor to access the fast field values.
    pub accessor: Column<u64>,
    /// The field type of the fast field.
    pub field_type: ColumnType,
    /// The name of the aggregation.
    pub name: String,
    /// The histogram aggregation request.
    pub req: HistogramAggregation,
    /// True if this is a date_histogram aggregation.
    pub is_date_histogram: bool,
    /// The bounds to limit the buckets to.
    ///
    /// Taken from the request's `hard_bounds`; `[f64::MIN, f64::MAX]` when none are set.
    pub bounds: HistogramBounds,
    /// The offset used to calculate the bucket position.
    ///
    /// Taken from the request's `offset`; `0.0` when none is set.
    pub offset: f64,
}
impl HistogramAggReqData {
    /// Returns the in-place size of this struct in bytes.
    ///
    /// Heap data owned by the fields is not included.
    pub fn get_memory_consumption(&self) -> usize {
        std::mem::size_of_val(self)
    }
}

/// Histogram is a bucket aggregation, where buckets are created dynamically for given `interval`.
/// Each document value is rounded down to its bucket.
///
/// E.g. if we have a price 18 and an interval of 5, the document will fall into the bucket with
/// the key 15. The formula used for this is:
/// `((val - offset) / interval).floor() * interval + offset`
///
/// For this calculation all fastfield values are converted to f64.
///
/// # Returned Buckets
/// By default buckets are returned between the min and max value of the documents, including empty
/// buckets.
/// Setting min_doc_count to != 0 will filter empty buckets.
///
/// The value range of the buckets can be extended via
/// [extended_bounds](HistogramAggregation::extended_bounds) or limited via
/// [hard_bounds](HistogramAggregation::hard_bounds).
///
/// # Result
/// Result type is [`BucketResult`](crate::aggregation::agg_result::BucketResult) with
/// [`BucketEntry`](crate::aggregation::agg_result::BucketEntry) on the
/// `AggregationCollector`.
///
/// Result type is
/// [`IntermediateBucketResult`](crate::aggregation::intermediate_agg_result::IntermediateBucketResult) with
/// [`IntermediateHistogramBucketEntry`](crate::aggregation::intermediate_agg_result::IntermediateHistogramBucketEntry) on the
/// `DistributedAggregationCollector`.
///
/// # Limitations/Compatibility
///
/// # JSON Format
/// ```json
/// {
///     "prices": {
///         "histogram": {
///             "field": "price",
///             "interval": 10
///         }
///     }
/// }
/// ```
///
/// Response
/// See [`BucketEntry`](crate::aggregation::agg_result::BucketEntry)
#[derive(Clone, Debug, Default, PartialEq, Serialize, Deserialize)]
pub struct HistogramAggregation {
    /// The field to aggregate on.
    pub field: String,
    /// The interval to chunk your data range. Each bucket spans a value range of [0..interval).
    /// Must be a positive value.
    #[serde(deserialize_with = "deserialize_f64")]
    pub interval: f64,
    /// Intervals implicitly defines an absolute grid of buckets `[interval * k, interval * (k +
    /// 1))`.
    ///
    /// Offset makes it possible to shift this grid into
    /// `[offset + interval * k, offset + interval * (k + 1))`. Offset has to be in the range [0,
    /// interval).
    ///
    /// As an example, if there are two documents with value 9 and 12 and interval 10.0, they would
    /// fall into the buckets with the key 0 and 10.
    /// With offset 5 and interval 10, they would both fall into the bucket with the key 5 and the
    /// range [5..15)
    #[serde(default, deserialize_with = "deserialize_option_f64")]
    pub offset: Option<f64>,
    /// The minimum number of documents in a bucket to be returned. Defaults to 0.
    pub min_doc_count: Option<u64>,
    /// Limits the data range to `[min, max]` closed interval.
    ///
    /// This can be used to filter values if they are not in the data range.
    ///
    /// hard_bounds only limits the buckets, to force a range set both extended_bounds and
    /// hard_bounds to the same range.
    ///
    /// ## Example
    /// ```json
    /// {
    ///     "prices": {
    ///        "histogram": {
    ///            "field": "price",
    ///            "interval": 10,
    ///            "hard_bounds": {
    ///                "min": 0,
    ///                "max": 100
    ///            }
    ///        }
    ///    }
    /// }
    /// ```
    pub hard_bounds: Option<HistogramBounds>,
    /// Can be set to extend your bounds. The range of the buckets is by default defined by the
    /// data range of the values of the documents. As the name suggests, this can only be used to
    /// extend the value range. If the bounds for min or max are not extending the range, the value
    /// has no effect on the returned buckets.
    ///
    /// Cannot be set in conjunction with min_doc_count > 0, since the empty buckets from extended
    /// bounds would not be returned.
    pub extended_bounds: Option<HistogramBounds>,
    /// Whether to return the buckets as a hash map
    #[serde(default)]
    pub keyed: bool,
    /// Whether the values are normalized to ns for date time values. Defaults to false.
    ///
    /// Set to true by `normalize_date_time`, which uses it to avoid scaling the request twice.
    #[serde(default)]
    pub is_normalized_to_ns: bool,
}

impl HistogramAggregation {
    pub(crate) fn normalize_date_time(&mut self) {
        if !self.is_normalized_to_ns {
            // values are provided in ms, but the fastfield is in nano seconds
            self.interval *= 1_000_000.0;
            self.offset = self.offset.map(|off| off * 1_000_000.0);
            self.hard_bounds = self.hard_bounds.map(|bounds| HistogramBounds {
                min: bounds.min * 1_000_000.0,
                max: bounds.max * 1_000_000.0,
            });
            self.extended_bounds = self.extended_bounds.map(|bounds| HistogramBounds {
                min: bounds.min * 1_000_000.0,
                max: bounds.max * 1_000_000.0,
            });
            self.is_normalized_to_ns = true;
        }
    }

    fn validate(&self) -> crate::Result<()> {
        if self.interval <= 0.0f64 {
            return Err(TantivyError::InvalidArgument(
                "interval must be a positive value".to_string(),
            ));
        }

        if self.min_doc_count.unwrap_or(0) > 0 && self.extended_bounds.is_some() {
            return Err(TantivyError::InvalidArgument(
                "Cannot set min_doc_count and extended_bounds at the same time".to_string(),
            ));
        }

        if let (Some(hard_bounds), Some(extended_bounds)) = (self.hard_bounds, self.extended_bounds)
        {
            if extended_bounds.min < hard_bounds.min || extended_bounds.max > hard_bounds.max {
                return Err(TantivyError::InvalidArgument(format!(
                    "extended_bounds have to be inside hard_bounds, extended_bounds: \
                     {extended_bounds}, hard_bounds {hard_bounds}"
                )));
            }
        }

        Ok(())
    }

    /// Returns the minimum number of documents required for a bucket to be returned.
    pub fn min_doc_count(&self) -> u64 {
        self.min_doc_count.unwrap_or(0)
    }
}

/// Used to set extended or hard bounds on the histogram.
///
/// When deserialized, each bound may be given either as a number or as an RFC 3339 date
/// string; a date string is converted to milliseconds since the Unix epoch (see
/// `deserialize_date_or_num`).
#[derive(Clone, Copy, Debug, PartialEq, Serialize, Deserialize)]
pub struct HistogramBounds {
    /// The lower bounds.
    #[serde(deserialize_with = "deserialize_date_or_num")]
    pub min: f64,
    /// The upper bounds.
    #[serde(deserialize_with = "deserialize_date_or_num")]
    pub max: f64,
}

fn deserialize_date_or_num<'de, D>(deserializer: D) -> Result<f64, D::Error>
where D: serde::Deserializer<'de> {
    let value: serde_json::Value = Deserialize::deserialize(deserializer)?;

    // Check if the value is a string representing an Rfc3339 formatted date
    if let serde_json::Value::String(date_str) = value {
        // Parse the Rfc3339 formatted date string into a DateTime<Utc>
        let date =
            time::OffsetDateTime::parse(&date_str, &time::format_description::well_known::Rfc3339)
                .map_err(|_| serde::de::Error::custom("Invalid Rfc3339 formatted date"))?;

        let milliseconds: i64 = (date.unix_timestamp_nanos() / 1_000_000)
            .try_into()
            .map_err(|_| serde::de::Error::custom("{date_str} out of allowed range"))?;

        // Return the milliseconds as f64
        Ok(milliseconds as f64)
    } else {
        // The value is not a string, so assume it's a regular f64 number
        value
            .as_f64()
            .ok_or_else(|| serde::de::Error::custom("Invalid number format"))
    }
}

impl Display for HistogramBounds {
    /// Formats the bounds as `[min,max]`.
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let Self { min, max } = self;
        write!(f, "[{},{}]", min, max)
    }
}

impl HistogramBounds {
    /// Returns true if `val` lies within the closed interval `[min, max]`.
    fn contains(&self, val: f64) -> bool {
        (self.min..=self.max).contains(&val)
    }
}

/// A single histogram bucket as collected on one segment.
#[derive(Default, Clone, Debug, PartialEq)]
pub(crate) struct SegmentHistogramBucketEntry {
    /// The key of the bucket, i.e. the lower end of its value range.
    pub key: f64,
    /// Number of collected values that fell into this bucket.
    pub doc_count: u64,
    /// Id under which the docs of this bucket are pushed to the sub-aggregations.
    pub bucket_id: BucketId,
}

impl SegmentHistogramBucketEntry {
    /// Converts this segment bucket into its intermediate representation.
    ///
    /// If sub-aggregations are present, their results for this bucket's `bucket_id` are
    /// collected into the returned entry; otherwise the sub-aggregation result stays at its
    /// default.
    pub(crate) fn into_intermediate_bucket_entry(
        self,
        sub_aggregation: &mut Option<HighCardCachedSubAggs>,
        agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<IntermediateHistogramBucketEntry> {
        let Self {
            key,
            doc_count,
            bucket_id,
        } = self;

        let mut sub_results = IntermediateAggregationResults::default();
        if let Some(cached_sub_aggs) = sub_aggregation.as_mut() {
            cached_sub_aggs
                .get_sub_agg_collector()
                .add_intermediate_aggregation_result(agg_data, &mut sub_results, bucket_id)?;
        }

        Ok(IntermediateHistogramBucketEntry {
            key,
            doc_count,
            sub_aggregation: sub_results,
        })
    }
}

/// The histogram buckets collected for a single parent bucket.
#[derive(Clone, Debug, Default)]
struct HistogramBuckets {
    /// Buckets keyed by their bucket position, i.e. `((val - offset) / interval).floor()`
    /// cast to `i64`.
    pub buckets: FxHashMap<i64, SegmentHistogramBucketEntry>,
}

/// The collector puts values from the fast field into the correct buckets and does a conversion to
/// the correct datatype.
#[derive(Debug)]
pub struct SegmentHistogramCollector {
    /// The buckets containing the aggregation data.
    /// One Histogram bucket per parent bucket id.
    parent_buckets: Vec<HistogramBuckets>,
    /// Sub-aggregations of this histogram, `None` if the request has no children.
    sub_agg: Option<HighCardCachedSubAggs>,
    /// Index used to look up this aggregation's `HistogramAggReqData` in the segment context.
    accessor_idx: usize,
    /// Hands out a fresh bucket id for every newly created histogram bucket.
    bucket_id_provider: BucketIdProvider,
}

impl SegmentAggregationCollector for SegmentHistogramCollector {
    fn add_intermediate_aggregation_result(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
        results: &mut IntermediateAggregationResults,
        parent_bucket_id: BucketId,
    ) -> crate::Result<()> {
        let name = agg_data
            .get_histogram_req_data(self.accessor_idx)
            .name
            .clone();
        // TODO: avoid prepare_max_bucket here and handle empty buckets.
        self.prepare_max_bucket(parent_bucket_id, agg_data)?;
        let histogram = std::mem::take(&mut self.parent_buckets[parent_bucket_id as usize]);
        let bucket = self.add_intermediate_bucket_result(agg_data, histogram)?;
        results.push(name, IntermediateAggregationResult::Bucket(bucket))?;

        Ok(())
    }

    #[inline]
    fn collect(
        &mut self,
        parent_bucket_id: BucketId,
        docs: &[crate::DocId],
        agg_data: &mut AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        let req = agg_data.take_histogram_req_data(self.accessor_idx);
        let mem_pre = self.get_memory_consumption();
        let buckets = &mut self.parent_buckets[parent_bucket_id as usize].buckets;

        let bounds = req.bounds;
        let interval = req.req.interval;
        let offset = req.offset;
        let get_bucket_pos = |val| get_bucket_pos_f64(val, interval, offset) as i64;

        agg_data
            .column_block_accessor
            .fetch_block(docs, &req.accessor);
        for (doc, val) in agg_data
            .column_block_accessor
            .iter_docid_vals(docs, &req.accessor)
        {
            let val = f64_from_fastfield_u64(val, req.field_type);
            let bucket_pos = get_bucket_pos(val);
            if bounds.contains(val) {
                let bucket = buckets.entry(bucket_pos).or_insert_with(|| {
                    let key = get_bucket_key_from_pos(bucket_pos as f64, interval, offset);
                    SegmentHistogramBucketEntry {
                        key,
                        doc_count: 0,
                        bucket_id: self.bucket_id_provider.next_bucket_id(),
                    }
                });
                bucket.doc_count += 1;
                if let Some(sub_agg) = &mut self.sub_agg {
                    sub_agg.push(bucket.bucket_id, doc);
                }
            }
        }
        agg_data.put_back_histogram_req_data(self.accessor_idx, req);

        let mem_delta = self.get_memory_consumption() - mem_pre;
        if mem_delta > 0 {
            agg_data
                .context
                .limits
                .add_memory_consumed(mem_delta as u64)?;
        }

        if let Some(sub_agg) = &mut self.sub_agg {
            sub_agg.check_flush_local(agg_data)?;
        }

        Ok(())
    }

    fn flush(&mut self, agg_data: &mut AggregationsSegmentCtx) -> crate::Result<()> {
        if let Some(sub_aggregation) = &mut self.sub_agg {
            sub_aggregation.flush(agg_data)?;
        }
        Ok(())
    }

    fn prepare_max_bucket(
        &mut self,
        max_bucket: BucketId,
        _agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        while self.parent_buckets.len() <= max_bucket as usize {
            self.parent_buckets.push(HistogramBuckets {
                buckets: FxHashMap::default(),
            });
        }
        Ok(())
    }
}

impl SegmentHistogramCollector {
    /// Returns the memory accounted for this collector in bytes.
    ///
    /// This covers the collector itself plus one `HistogramBuckets` per parent bucket. The
    /// entries stored inside the bucket maps are not included.
    fn get_memory_consumption(&self) -> usize {
        let per_parent_bucket = std::mem::size_of::<HistogramBuckets>();
        std::mem::size_of::<Self>() + self.parent_buckets.len() * per_parent_bucket
    }

    /// Converts the collector result into a intermediate bucket result.
    ///
    /// The buckets are returned sorted by key.
    fn add_intermediate_bucket_result(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
        histogram: HistogramBuckets,
    ) -> crate::Result<IntermediateBucketResult> {
        let mut buckets = histogram
            .buckets
            .into_values()
            .map(|bucket| bucket.into_intermediate_bucket_entry(&mut self.sub_agg, agg_data))
            .collect::<crate::Result<Vec<_>>>()?;
        buckets.sort_unstable_by(|left, right| left.key.total_cmp(&right.key));

        let field_type = agg_data
            .get_histogram_req_data(self.accessor_idx)
            .field_type;
        Ok(IntermediateBucketResult::Histogram {
            buckets,
            is_date_agg: field_type == ColumnType::DateTime,
        })
    }

    /// Builds the collector for `node` and prepares its request data.
    ///
    /// The sub-aggregation collectors are built first. The request is then validated,
    /// normalized to nanoseconds for date columns that are not a date_histogram, and the
    /// effective `bounds` and `offset` are stored in the request data.
    pub(crate) fn from_req_and_validate(
        agg_data: &mut AggregationsSegmentCtx,
        node: &AggRefNode,
    ) -> crate::Result<Self> {
        let sub_agg_collectors = if node.children.is_empty() {
            None
        } else {
            Some(build_segment_agg_collectors(agg_data, &node.children)?)
        };

        let req_data = agg_data.get_histogram_req_data_mut(node.idx_in_req_data);
        req_data.req.validate()?;
        let is_plain_histogram_on_date =
            req_data.field_type == ColumnType::DateTime && !req_data.is_date_histogram;
        if is_plain_histogram_on_date {
            req_data.req.normalize_date_time();
        }
        // Without hard bounds every value is accepted.
        let unbounded = HistogramBounds {
            min: f64::MIN,
            max: f64::MAX,
        };
        req_data.bounds = req_data.req.hard_bounds.unwrap_or(unbounded);
        req_data.offset = req_data.req.offset.unwrap_or(0.0);

        Ok(Self {
            parent_buckets: Default::default(),
            sub_agg: sub_agg_collectors.map(CachedSubAggs::new),
            accessor_idx: node.idx_in_req_data,
            bucket_id_provider: BucketIdProvider::default(),
        })
    }
}

/// Returns the position of the bucket `val` falls into on the grid defined by `interval`
/// and `offset`, i.e. `((val - offset) / interval).floor()`.
#[inline]
fn get_bucket_pos_f64(val: f64, interval: f64, offset: f64) -> f64 {
    let shifted = val - offset;
    let fractional_pos = shifted / interval;
    fractional_pos.floor()
}

/// Returns the key of the bucket at `bucket_pos`, i.e. `bucket_pos * interval + offset`.
#[inline]
fn get_bucket_key_from_pos(bucket_pos: f64, interval: f64, offset: f64) -> f64 {
    let unshifted_key = bucket_pos * interval;
    offset + unshifted_key
}

// Convert to BucketEntry and fill gaps
fn intermediate_buckets_to_final_buckets_fill_gaps(
    buckets: Vec<IntermediateHistogramBucketEntry>,
    histogram_req: &HistogramAggregation,
    sub_aggregation: &Aggregations,
    limits: &mut AggregationLimitsGuard,
) -> crate::Result<Vec<BucketEntry>> {
    // Generate the full list of buckets without gaps.
    //
    // The bounds are the min max from the current buckets, optionally extended by
    // extended_bounds from the request
    let min_max = minmax(buckets.iter().map(|bucket| bucket.key));

    // memory check upfront
    let (_, first_bucket_num, last_bucket_num) =
        generate_bucket_pos_with_opt_minmax(histogram_req, min_max);

    // It's based on user input, so we need to account for overflows
    let added_buckets = ((last_bucket_num.saturating_sub(first_bucket_num)).max(0) as u64)
        .saturating_sub(buckets.len() as u64);
    limits.add_memory_consumed(
        added_buckets * std::mem::size_of::<IntermediateHistogramBucketEntry>() as u64,
    )?;
    // create buckets
    let fill_gaps_buckets = generate_buckets_with_opt_minmax(histogram_req, min_max);

    let empty_sub_aggregation = IntermediateAggregationResults::empty_from_req(sub_aggregation);

    // Use merge_join_by to fill in gaps, since buckets are sorted

    let final_buckets: Vec<BucketEntry> = buckets
        .into_iter()
        .merge_join_by(fill_gaps_buckets, |existing_bucket, fill_gaps_bucket| {
            existing_bucket
                .key
                .partial_cmp(fill_gaps_bucket)
                .unwrap_or(Ordering::Equal)
        })
        .map(|either| match either {
            // Ignore the generated bucket
            itertools::EitherOrBoth::Both(existing, _) => existing,
            itertools::EitherOrBoth::Left(existing) => existing,
            // Add missing bucket
            itertools::EitherOrBoth::Right(missing_bucket) => IntermediateHistogramBucketEntry {
                key: missing_bucket,
                doc_count: 0,
                sub_aggregation: empty_sub_aggregation.clone(),
            },
        })
        .map(|intermediate_bucket| {
            intermediate_bucket.into_final_bucket_entry(sub_aggregation, limits)
        })
        .collect::<crate::Result<Vec<_>>>()?;

    Ok(final_buckets)
}

/// Converts intermediate histogram buckets into final `BucketEntry`s.
///
/// With a `min_doc_count` of 0 the gaps between buckets are filled with empty buckets;
/// otherwise buckets with fewer than `min_doc_count` documents are dropped. For date
/// aggregations the keys are converted from nanoseconds to milliseconds and `key_as_string`
/// is set to the formatted date.
pub(crate) fn intermediate_histogram_buckets_to_final_buckets(
    buckets: Vec<IntermediateHistogramBucketEntry>,
    is_date_agg: bool,
    histogram_req: &HistogramAggregation,
    sub_aggregation: &Aggregations,
    limits: &mut AggregationLimitsGuard,
) -> crate::Result<Vec<BucketEntry>> {
    // Normalization depends on the column type, so the request passed in here has not been
    // normalized yet. Normalizing changes the precision from milliseconds to nanoseconds.
    let mut histogram_req = histogram_req.clone();
    if is_date_agg {
        histogram_req.normalize_date_time();
    }

    let min_doc_count = histogram_req.min_doc_count();
    let mut final_buckets = if min_doc_count > 0 {
        buckets
            .into_iter()
            .filter(|entry| entry.doc_count >= min_doc_count)
            .map(|entry| entry.into_final_bucket_entry(sub_aggregation, limits))
            .collect::<crate::Result<Vec<_>>>()?
    } else {
        // With min_doc_count == 0 empty buckets are part of the result. The intermediate
        // result does not contain them (they are filtered to reduce serialization size), so
        // the gaps have to be filled here.
        intermediate_buckets_to_final_buckets_fill_gaps(
            buckets,
            &histogram_req,
            sub_aggregation,
            limits,
        )?
    };

    // Date buckets get a `key_as_string` with the formatted date, and their key is converted
    // from nanoseconds back to milliseconds.
    if is_date_agg {
        for bucket in &mut final_buckets {
            if let crate::aggregation::Key::F64(key_val) = &mut bucket.key {
                let key_as_string = format_date(*key_val as i64)?;
                *key_val /= 1_000_000.0;
                bucket.key_as_string = Some(key_as_string);
            }
        }
    }

    Ok(final_buckets)
}

/// Computes the value range to span: `min_max` widened by the request's `extended_bounds`
/// and then clamped by its `hard_bounds`.
///
/// May return `(f64::MAX, f64::MIN)`, if there is no range.
fn get_req_min_max(req: &HistogramAggregation, min_max: Option<(f64, f64)>) -> (f64, f64) {
    let (data_min, data_max) = min_max.unwrap_or((f64::MAX, f64::MIN));

    // extended_bounds can only widen the range
    let (widened_min, widened_max) = match &req.extended_bounds {
        Some(extended) => (data_min.min(extended.min), data_max.max(extended.max)),
        None => (data_min, data_max),
    };

    // hard_bounds can only narrow the range
    match &req.hard_bounds {
        Some(hard) => (widened_min.max(hard.min), widened_max.min(hard.max)),
        None => (widened_min, widened_max),
    }
}

/// Computes the positions of the first and the last bucket for the request.
///
/// The value range is taken from the provided `min_max`, adjusted by the request's
/// `extended_bounds`/`hard_bounds`. Both ends of that range are converted to a bucket position
/// using `req.interval` and the offset.
///
/// Returns `(offset, first_bucket_num, last_bucket_num)`, where `offset` is `req.offset` or
/// `0.0` if unset.
pub(crate) fn generate_bucket_pos_with_opt_minmax(
    req: &HistogramAggregation,
    min_max: Option<(f64, f64)>,
) -> (f64, i64, i64) {
    let offset = req.offset.unwrap_or(0.0);
    let (range_min, range_max) = get_req_min_max(req, min_max);

    let bucket_num = |val: f64| get_bucket_pos_f64(val, req.interval, offset) as i64;

    (offset, bucket_num(range_min), bucket_num(range_max))
}

/// Generates the keys of all buckets for the request.
///
/// The first and last bucket positions are computed from the provided `min_max` and the
/// request's `extended_bounds`/`hard_bounds`. Every position in between yields one key, computed
/// as `bucket_pos * interval + offset`.
///
/// Returns an empty vec when the first bucket position is greater than the last one.
pub(crate) fn generate_buckets_with_opt_minmax(
    req: &HistogramAggregation,
    min_max: Option<(f64, f64)>,
) -> Vec<f64> {
    let (offset, first_pos, last_pos) = generate_bucket_pos_with_opt_minmax(req, min_max);
    let positions = first_pos..=last_pos;

    let mut bucket_keys = Vec::with_capacity(positions.clone().count());
    bucket_keys.extend(positions.map(|pos| pos as f64 * req.interval + offset));
    bucket_keys
}

#[cfg(test)]
mod tests {

    use pretty_assertions::assert_eq;
    use serde_json::Value;

    use super::*;
    use crate::aggregation::agg_result::AggregationResults;
    use crate::aggregation::tests::{
        exec_request, exec_request_with_query, exec_request_with_query_and_memory_limit,
        get_test_index_2_segments, get_test_index_from_values, get_test_index_with_num_docs,
    };
    use crate::query::AllQuery;

    /// Buckets non-integral values with a fractional interval, first without and then with an
    /// offset.
    #[test]
    fn histogram_test_crooked_values() -> crate::Result<()> {
        let scores = vec![-12.0, 12.31, 14.33, 16.23];
        let index = get_test_index_from_values(false, &scores)?;

        // Both runs share the request shape; only the offset differs.
        let request_with_offset = |offset: f64| -> Aggregations {
            serde_json::from_value(json!({
                "my_interval": {
                    "histogram": {
                        "field": "score_f64",
                        "interval": 3.5,
                        "offset": offset,
                    }
                }
            }))
            .unwrap()
        };

        // Without offset
        let res = exec_request(request_with_offset(0.0), &index)?;
        let buckets = &res["my_interval"]["buckets"];

        assert_eq!(buckets[0]["key"], -14.0);
        assert_eq!(buckets[0]["doc_count"], 1);
        assert_eq!(buckets[7]["key"], 10.5);
        assert_eq!(buckets[7]["doc_count"], 1);
        assert_eq!(buckets[8]["key"], 14.0);
        assert_eq!(buckets[8]["doc_count"], 2);
        assert_eq!(buckets[9], Value::Null);

        // With offset
        let res = exec_request(request_with_offset(1.2), &index)?;
        let buckets = &res["my_interval"]["buckets"];

        assert_eq!(buckets[0]["key"], -12.8);
        assert_eq!(buckets[0]["doc_count"], 1);
        assert_eq!(buckets[1]["key"], -9.3);
        assert_eq!(buckets[1]["doc_count"], 0);
        assert_eq!(buckets[2]["key"], -5.8);
        assert_eq!(buckets[2]["doc_count"], 0);
        assert_eq!(buckets[3]["key"], -2.3);
        assert_eq!(buckets[3]["doc_count"], 0);

        assert_eq!(buckets[7]["key"], 11.7);
        assert_eq!(buckets[7]["doc_count"], 2);
        assert_eq!(buckets[8]["key"], 15.2);
        assert_eq!(buckets[8]["doc_count"], 1);
        assert_eq!(buckets[9], Value::Null);

        Ok(())
    }

    /// Shared body of the two tests below: all values are positive, the first bucket starts at
    /// the smallest value and the gaps between populated buckets are filled with empty buckets.
    fn histogram_test_min_value_positive_merge_segments(merge_segments: bool) -> crate::Result<()> {
        let scores = vec![10.0, 12.0, 14.0, 16.23];
        let index = get_test_index_from_values(merge_segments, &scores)?;

        let request: Aggregations = serde_json::from_value(json!({
            "my_interval": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 1.0,
                }
            }
        }))
        .unwrap();

        let res = exec_request(request, &index)?;
        let buckets = &res["my_interval"]["buckets"];

        assert_eq!(buckets[0]["key"], 10.0);
        assert_eq!(buckets[0]["doc_count"], 1);
        assert_eq!(buckets[1]["key"], 11.0);
        assert_eq!(buckets[1]["doc_count"], 0);
        assert_eq!(buckets[2]["key"], 12.0);
        assert_eq!(buckets[2]["doc_count"], 1);
        assert_eq!(buckets[3]["key"], 13.0);
        assert_eq!(buckets[3]["doc_count"], 0);
        assert_eq!(buckets[6]["key"], 16.0);
        assert_eq!(buckets[6]["doc_count"], 1);
        assert_eq!(buckets[7], Value::Null);

        Ok(())
    }

    /// Runs the positive-min-value scenario with `merge_segments = true`.
    #[test]
    fn histogram_test_min_value_positive_force_merge_segments() -> crate::Result<()> {
        histogram_test_min_value_positive_merge_segments(true)
    }

    /// Runs the positive-min-value scenario with `merge_segments = false`.
    #[test]
    fn histogram_test_min_value_positive() -> crate::Result<()> {
        histogram_test_min_value_positive_merge_segments(false)
    }

    /// With an interval of 1.0 over an index of 100 docs, expects exactly 100 buckets holding
    /// one doc each.
    #[test]
    fn histogram_simple_test() -> crate::Result<()> {
        let index = get_test_index_with_num_docs(false, 100)?;

        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 1.0,
                }
            }
        }))
        .unwrap();

        let res = exec_request(request, &index)?;
        let buckets = &res["histogram"]["buckets"];

        assert_eq!(buckets[0]["key"], 0.0);
        assert_eq!(buckets[0]["doc_count"], 1);
        assert_eq!(buckets[1]["key"], 1.0);
        assert_eq!(buckets[1]["doc_count"], 1);
        assert_eq!(buckets[99]["key"], 99.0);
        assert_eq!(buckets[99]["doc_count"], 1);
        assert_eq!(buckets[100], Value::Null);
        Ok(())
    }

    /// A fine-grained histogram under a memory limit of `5_000` must abort with the
    /// memory-limit error (reported as `5.00 KB` in the message).
    #[test]
    fn histogram_memory_limit() -> crate::Result<()> {
        let index = get_test_index_with_num_docs(true, 100)?;

        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 0.1,
                }
            }
        }))
        .unwrap();

        let limits = AggregationLimitsGuard::new(Some(5_000), None);
        let err =
            exec_request_with_query_and_memory_limit(request, &index, None, limits).unwrap_err();

        let message = err.to_string();
        assert!(message.starts_with(
            "Aborting aggregation because memory limit was exceeded. Limit: 5.00 KB, Current"
        ));

        Ok(())
    }

    /// Bucket counts coming from different segments have to be merged into a single bucket.
    #[test]
    fn histogram_merge_test() -> crate::Result<()> {
        let scores = vec![10.0, 12.0, 14.0, 16.23, 10.0, 13.0, 10.0, 12.0];
        let index = get_test_index_from_values(false, &scores)?;

        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 1.0,
                }
            }
        }))
        .unwrap();

        let res = exec_request(request, &index)?;
        let buckets = &res["histogram"]["buckets"];

        assert_eq!(buckets[0]["key"], 10.0);
        assert_eq!(buckets[0]["doc_count"], 3);
        assert_eq!(buckets[1]["key"], 11.0);
        assert_eq!(buckets[1]["doc_count"], 0);
        assert_eq!(buckets[2]["key"], 12.0);
        assert_eq!(buckets[2]["doc_count"], 2);
        assert_eq!(buckets[3]["key"], 13.0);
        assert_eq!(buckets[3]["doc_count"], 1);

        Ok(())
    }
    /// Shared body of the two tests below: with `min_doc_count: 2` only buckets holding at least
    /// two docs are returned.
    fn histogram_min_doc_test_with_opt(merge_segments: bool) -> crate::Result<()> {
        let scores = vec![10.0, 12.0, 14.0, 16.23, 10.0, 13.0, 10.0, 12.0];
        let index = get_test_index_from_values(merge_segments, &scores)?;

        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 1.0,
                    "min_doc_count": 2,
                }
            }
        }))
        .unwrap();

        let res = exec_request(request, &index)?;
        let buckets = &res["histogram"]["buckets"];

        assert_eq!(buckets[0]["key"], 10.0);
        assert_eq!(buckets[0]["doc_count"], 3);
        assert_eq!(buckets[1]["key"], 12.0);
        assert_eq!(buckets[1]["doc_count"], 2);
        assert_eq!(buckets[2], Value::Null);

        Ok(())
    }

    /// Runs the `min_doc_count` scenario with `merge_segments = false`.
    #[test]
    fn histogram_min_doc_test_multi_segments() -> crate::Result<()> {
        histogram_min_doc_test_with_opt(false)
    }

    /// Runs the `min_doc_count` scenario with `merge_segments = true`.
    #[test]
    fn histogram_min_doc_test_single_segments() -> crate::Result<()> {
        histogram_min_doc_test_with_opt(true)
    }

    /// Shared body of the two tests below: `extended_bounds` adds empty buckets around the data,
    /// also in combination with `hard_bounds`.
    fn histogram_extended_bounds_test_with_opt(merge_segments: bool) -> crate::Result<()> {
        // 1 hit inside the bounds
        let scores = vec![5.0];
        let index = get_test_index_from_values(merge_segments, &scores)?;

        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 1.0,
                    "extended_bounds": {
                        "min": 2.0,
                        "max": 12.0,
                    },
                }
            }
        }))
        .unwrap();

        let res = exec_request(request, &index)?;
        let buckets = &res["histogram"]["buckets"];

        assert_eq!(buckets[0]["key"], 2.0);
        assert_eq!(buckets[0]["doc_count"], 0);
        assert_eq!(buckets[1]["key"], 3.0);
        assert_eq!(buckets[1]["doc_count"], 0);
        assert_eq!(buckets[2]["doc_count"], 0);
        assert_eq!(buckets[10]["key"], 12.0);
        assert_eq!(buckets[10]["doc_count"], 0);

        // 2 hits
        let scores = vec![5.0, 5.5];
        let index = get_test_index_from_values(merge_segments, &scores)?;

        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 1.0,
                    "extended_bounds": {
                        "min": 3.0,
                        "max": 6.0,
                    },
                }
            }
        }))
        .unwrap();

        let res = exec_request(request, &index)?;
        let buckets = &res["histogram"]["buckets"];

        assert_eq!(buckets[0]["key"], 3.0);
        assert_eq!(buckets[0]["doc_count"], 0);
        assert_eq!(buckets[1]["key"], 4.0);
        assert_eq!(buckets[1]["doc_count"], 0);
        assert_eq!(buckets[2]["key"], 5.0);
        assert_eq!(buckets[2]["doc_count"], 2);
        assert_eq!(buckets[3]["key"], 6.0);
        assert_eq!(buckets[3]["doc_count"], 0);
        assert_eq!(buckets[4], Value::Null);

        // 1 hit outside bounds
        let scores = vec![15.0];
        let index = get_test_index_from_values(merge_segments, &scores)?;

        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 1.0,
                    "extended_bounds": {
                        "min": 3.0,
                        "max": 6.0,
                    },
                    "hard_bounds": {
                        "min": 3.0,
                        "max": 6.0,
                    },
                }
            }
        }))
        .unwrap();

        let res = exec_request(request, &index)?;
        let buckets = &res["histogram"]["buckets"];

        assert_eq!(buckets[0]["key"], 3.0);
        assert_eq!(buckets[0]["doc_count"], 0);
        assert_eq!(buckets[1]["key"], 4.0);
        assert_eq!(buckets[1]["doc_count"], 0);
        assert_eq!(buckets[2]["key"], 5.0);
        assert_eq!(buckets[2]["doc_count"], 0);
        assert_eq!(buckets[3]["key"], 6.0);
        assert_eq!(buckets[3]["doc_count"], 0);
        assert_eq!(buckets[4], Value::Null);

        Ok(())
    }

    /// Runs the `extended_bounds` scenario with `merge_segments = false`.
    #[test]
    fn histogram_extended_bounds_test_multi_segment() -> crate::Result<()> {
        histogram_extended_bounds_test_with_opt(false)
    }

    /// Runs the `extended_bounds` scenario with `merge_segments = true`.
    #[test]
    fn histogram_extended_bounds_test_single_segment() -> crate::Result<()> {
        histogram_extended_bounds_test_with_opt(true)
    }

    /// Shared body of the two tests below: `hard_bounds` cuts off buckets outside the bounds, and
    /// `extended_bounds` reaching outside of `hard_bounds` is rejected as an invalid request.
    fn histogram_hard_bounds_test_with_opt(merge_segments: bool) -> crate::Result<()> {
        let scores = vec![10.0, 12.0, 14.0, 16.23, 10.0, 13.0, 10.0, 12.0];
        let index = get_test_index_from_values(merge_segments, &scores)?;

        // hard_bounds only
        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 1.0,
                    "hard_bounds": {
                        "min": 2.0,
                        "max": 12.0,
                    },
                }
            }
        }))
        .unwrap();

        let res = exec_request(request, &index)?;
        let buckets = &res["histogram"]["buckets"];

        assert_eq!(buckets[0]["key"], 10.0);
        assert_eq!(buckets[0]["doc_count"], 3);
        assert_eq!(buckets[1]["key"], 11.0);
        assert_eq!(buckets[1]["doc_count"], 0);
        assert_eq!(buckets[2]["key"], 12.0);
        assert_eq!(buckets[2]["doc_count"], 2);

        assert_eq!(buckets[3], Value::Null);

        // hard_bounds and extended_bounds together act like forced bounds
        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 1.0,
                    "extended_bounds": {
                        "min": 2.0,
                        "max": 12.0,
                    },
                    "hard_bounds": {
                        "min": 2.0,
                        "max": 12.0,
                    },
                }
            }
        }))
        .unwrap();

        let res = exec_request(request, &index)?;
        let buckets = &res["histogram"]["buckets"];

        assert_eq!(buckets[0]["key"], 2.0);
        assert_eq!(buckets[0]["doc_count"], 0);
        assert_eq!(buckets[1]["key"], 3.0);
        assert_eq!(buckets[1]["doc_count"], 0);
        assert_eq!(buckets[10]["key"], 12.0);
        assert_eq!(buckets[10]["doc_count"], 2);

        assert_eq!(buckets[11], Value::Null);

        // invalid request: extended_bounds reach outside of hard_bounds
        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 1.0,
                    "extended_bounds": {
                        "min": 1.0,
                        "max": 12.0,
                    },
                    "hard_bounds": {
                        "min": 2.0,
                        "max": 12.0,
                    },
                }
            }
        }))
        .unwrap();

        let err = exec_request(request, &index).unwrap_err();
        assert_eq!(
            err.to_string(),
            "An invalid argument was passed: 'extended_bounds have to be inside hard_bounds, \
             extended_bounds: [1,12], hard_bounds [2,12]'"
        );

        Ok(())
    }

    /// Runs the `hard_bounds` scenario with `merge_segments = false`.
    #[test]
    fn histogram_hard_bounds_test_multi_segment() -> crate::Result<()> {
        histogram_hard_bounds_test_with_opt(false)
    }

    /// Runs the `hard_bounds` scenario with `merge_segments = true`.
    #[test]
    fn histogram_hard_bounds_test_single_segment() -> crate::Result<()> {
        histogram_hard_bounds_test_with_opt(true)
    }

    /// Runs the empty-result scenario with `merge_segments = true`.
    #[test]
    fn histogram_empty_result_behaviour_test_single_segment() -> crate::Result<()> {
        histogram_empty_result_behaviour_test_with_opt(true)
    }

    /// Runs the empty-result scenario with `merge_segments = false`.
    #[test]
    fn histogram_empty_result_behaviour_test_multi_segment() -> crate::Result<()> {
        histogram_empty_result_behaviour_test_with_opt(false)
    }

    /// Shared body of the two tests above: checks the result when no document matches or the
    /// index holds no values, with and without `extended_bounds`/`hard_bounds` and
    /// sub-aggregations.
    fn histogram_empty_result_behaviour_test_with_opt(merge_segments: bool) -> crate::Result<()> {
        // Result expected whenever no bucket is created at all.
        let no_buckets = json!({
            "histogram": {
                "buckets": []
            }
        });

        let index = get_test_index_2_segments(merge_segments)?;

        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 1.0,
                }
            }
        }))
        .unwrap();

        // The query matches no document
        let res = exec_request_with_query(request.clone(), &index, Some(("text", "blubberasdf")))?;
        assert_eq!(res, no_buckets);

        // test index without segments
        let no_values = vec![];

        // Don't merge empty segments
        let index = get_test_index_from_values(false, &no_values)?;

        let res = exec_request_with_query(request, &index, Some(("text", "blubberasdf")))?;
        assert_eq!(res, no_buckets);

        // test index without segments
        let no_values = vec![];

        // Don't merge empty segments
        let index = get_test_index_from_values(false, &no_values)?;

        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 1.0,
                    "extended_bounds": {
                        "min": 2.0,
                        "max": 12.0,
                    },
                }
            }
        }))
        .unwrap();

        let res = exec_request(request, &index)?;
        let buckets = &res["histogram"]["buckets"];

        assert_eq!(buckets[0]["key"], 2.0);
        assert_eq!(buckets[0]["doc_count"], 0);
        assert_eq!(buckets[1]["key"], 3.0);
        assert_eq!(buckets[1]["doc_count"], 0);
        assert_eq!(buckets[2]["doc_count"], 0);
        assert_eq!(buckets[10]["key"], 12.0);
        assert_eq!(buckets[10]["doc_count"], 0);

        // extended_bounds narrower than hard_bounds
        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 1.0,
                    "extended_bounds": {
                        "min": 2.0,
                        "max": 5.0,
                    },
                    "hard_bounds": {
                        "min": 2.0,
                        "max": 12.0,
                    },

                }
            }
        }))
        .unwrap();

        let res = exec_request(request, &index)?;
        let buckets = &res["histogram"]["buckets"];

        assert_eq!(buckets[0]["key"], 2.0);
        assert_eq!(buckets[0]["doc_count"], 0);
        assert_eq!(buckets[1]["key"], 3.0);
        assert_eq!(buckets[1]["doc_count"], 0);
        assert_eq!(buckets[2]["doc_count"], 0);
        assert_eq!(buckets[10], Value::Null);

        // hard_bounds will not extend the result
        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 1.0,
                    "hard_bounds": {
                        "min": 2.0,
                        "max": 12.0,
                    },

                }
            }
        }))
        .unwrap();

        let res = exec_request(request, &index)?;
        assert_eq!(res, no_buckets);

        // Empty buckets created by extended_bounds carry empty sub-aggregation results
        let sub_request: Aggregations = serde_json::from_value(json!({
            "stats": { "stats": { "field": "score_f64", } },
            "avg": { "avg": { "field": "score_f64", } }

        }))
        .unwrap();

        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 1.0,
                    "extended_bounds": {
                        "min": 2.0,
                        "max": 12.0,
                    },
                },
                "aggs": sub_request
            }
        }))
        .unwrap();

        let res = exec_request(request, &index)?;
        let buckets = &res["histogram"]["buckets"];

        assert_eq!(
            buckets[0],
            json!({
                "avg": {
                    "value": Value::Null
                },
                "doc_count": 0,
                "key": 2.0,
                "stats": {
                    "sum": 0.0,
                    "count": 0,
                    "min": Value::Null,
                    "max": Value::Null,
                    "avg": Value::Null,
                }
            })
        );
        assert_eq!(buckets[0]["key"], 2.0);
        assert_eq!(buckets[0]["doc_count"], 0);
        assert_eq!(buckets[1]["key"], 3.0);
        assert_eq!(buckets[1]["doc_count"], 0);
        assert_eq!(buckets[2]["doc_count"], 0);
        assert_eq!(buckets[10]["key"], 12.0);
        assert_eq!(buckets[10]["doc_count"], 0);

        Ok(())
    }

    /// Runs the single-bucket scenario with `merge_segments = true`.
    #[test]
    fn histogram_single_bucket_test_single_segment() -> crate::Result<()> {
        histogram_single_bucket_test_with_opt(true)
    }

    /// Runs the single-bucket scenario with `merge_segments = false`.
    #[test]
    fn histogram_single_bucket_test_multi_segment() -> crate::Result<()> {
        histogram_single_bucket_test_with_opt(false)
    }

    /// Shared body of the two tests above: the interval is large enough for all docs to end up
    /// in one single bucket.
    fn histogram_single_bucket_test_with_opt(merge_segments: bool) -> crate::Result<()> {
        let index = get_test_index_2_segments(merge_segments)?;

        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 100000.0,
                },
            }
        }))
        .unwrap();

        let agg_res = exec_request(request, &index)?;

        // Round-trip through the serialized form before inspecting the result.
        let serialized = serde_json::to_string(&agg_res)?;
        let res: Value = serde_json::from_str(&serialized)?;
        let buckets = &res["histogram"]["buckets"];

        assert_eq!(buckets[0]["key"], 0.0);
        assert_eq!(buckets[0]["doc_count"], 9);
        assert_eq!(buckets[1], Value::Null);

        Ok(())
    }

    /// Runs the date scenario with `merge_segments = true`.
    #[test]
    fn histogram_date_test_single_segment() -> crate::Result<()> {
        histogram_date_test_with_opt(true)
    }

    /// Runs the date scenario with `merge_segments = false`.
    #[test]
    fn histogram_date_test_multi_segment() -> crate::Result<()> {
        histogram_date_test_with_opt(false)
    }

    /// Shared body of the two tests above: a histogram on a date field returns millisecond keys
    /// together with a `key_as_string` date string.
    fn histogram_date_test_with_opt(merge_segments: bool) -> crate::Result<()> {
        let index = get_test_index_2_segments(merge_segments)?;

        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "date",
                    "interval": 86400000.0, // one day in milliseconds
                },
            }
        }))
        .unwrap();

        let agg_res = exec_request(request, &index)?;

        // Round-trip through the serialized form before inspecting the result.
        let serialized = serde_json::to_string(&agg_res)?;
        let res: Value = serde_json::from_str(&serialized)?;
        let buckets = &res["histogram"]["buckets"];

        assert_eq!(buckets[0]["key"], 1546300800000.0);
        assert_eq!(buckets[0]["key_as_string"], "2019-01-01T00:00:00Z");
        assert_eq!(buckets[0]["doc_count"], 1);

        assert_eq!(buckets[1]["key"], 1546387200000.0);
        assert_eq!(buckets[1]["key_as_string"], "2019-01-02T00:00:00Z");
        assert_eq!(buckets[1]["doc_count"], 5);

        assert_eq!(buckets[2]["key"], 1546473600000.0);
        assert_eq!(buckets[2]["key_as_string"], "2019-01-03T00:00:00Z");

        assert_eq!(buckets[3], Value::Null);

        Ok(())
    }

    /// An interval of `0.0` is not a valid request and has to produce an error.
    #[test]
    fn histogram_invalid_request() -> crate::Result<()> {
        let index = get_test_index_2_segments(true)?;

        let zero_interval_request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 0.0,
                },
            }
        }))
        .unwrap();

        assert!(exec_request(zero_interval_request, &index).is_err());

        Ok(())
    }

    /// With `keyed: true` the buckets are returned as a map from bucket key to bucket instead
    /// of an array.
    #[test]
    fn histogram_keyed_buckets_test() -> crate::Result<()> {
        let index = get_test_index_with_num_docs(false, 100)?;

        let request: Aggregations = serde_json::from_value(json!({
            "histogram": {
                "histogram": {
                    "field": "score_f64",
                    "interval": 50.0,
                    "keyed": true
                },
            }
        }))
        .unwrap();

        let expected = json!({
            "histogram": {
                "buckets": {
                    "0": {
                        "key": 0.0,
                        "doc_count": 50
                    },
                    "50": {
                        "key": 50.0,
                        "doc_count": 50
                    }
                }
            }
        });

        let res = exec_request(request, &index)?;
        assert_eq!(res, expected);

        Ok(())
    }
    /// A histogram on an index without segments still returns a well-formed, empty bucket list.
    #[test]
    fn test_aggregation_histogram_empty_index() -> crate::Result<()> {
        // test index without segments
        let no_values = vec![];
        let index = get_test_index_from_values(false, &no_values)?;

        let request: Aggregations = serde_json::from_value(json!({
            "myhisto": {
                "histogram": {
                    "field": "score",
                    "interval": 10.0
                },
            }
        }))
        .unwrap();

        let collector = AggregationCollector::from_aggs(request, Default::default());

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();

        let serialized = serde_json::to_string(&agg_res)?;
        let res: Value = serde_json::from_str(&serialized)?;

        // Make sure the result structure is correct
        let buckets = res["myhisto"]["buckets"].as_array().unwrap();
        assert_eq!(buckets.len(), 0);

        Ok(())
    }
}


================================================
FILE: src/aggregation/bucket/histogram/mod.rs
================================================
mod date_histogram;
mod histogram;
pub use date_histogram::*;
pub use histogram::*;


================================================
FILE: src/aggregation/bucket/mod.rs
================================================
//! Module for all bucket aggregations.
//!
//! BucketAggregations create buckets of documents.
//! Each bucket is associated with a rule which
//! determines whether or not a document falls into it. In other words, the buckets
//! effectively define document sets. Buckets are not necessarily disjoint, therefore a document can
//! fall into multiple buckets. In addition to the buckets themselves, the bucket aggregations also
//! compute and return the number of documents for each bucket. Bucket aggregations, as opposed to
//! metric aggregations, can hold sub-aggregations. These sub-aggregations will be aggregated for
//! the buckets created by their "parent" bucket aggregation. There are different bucket
//! aggregators, each with a different "bucketing" strategy. Some define a single bucket, some
//! define fixed number of multiple buckets, and others dynamically create the buckets during the
//! aggregation process.
//!
//! Results of final buckets are [`BucketResult`](super::agg_result::BucketResult).
//! Results of intermediate buckets are
//! [`IntermediateBucketResult`](super::intermediate_agg_result::IntermediateBucketResult)
//!
//! ## Supported Bucket Aggregations
//! - [Histogram](HistogramAggregation)
//! - [DateHistogram](DateHistogramAggregationReq)
//! - [Range](RangeAggregation)
//! - [Terms](TermsAggregation)

mod composite;
mod filter;
mod histogram;
mod range;
mod term_agg;
mod term_missing_agg;

use std::collections::HashMap;
use std::fmt;

pub use composite::*;
pub use filter::*;
pub use histogram::*;
pub use range::*;
use serde::{de, Deserialize, Deserializer, Serialize, Serializer};
pub use term_agg::*;
pub use term_missing_agg::*;

/// Sort direction for the buckets of a bucket aggregation.
///
/// De/serializes as the lowercase strings `"asc"` and `"desc"`. The default is [`Order::Desc`].
#[derive(Clone, Copy, Debug, Default, PartialEq, Serialize, Deserialize)]
#[serde(rename_all = "lowercase")]
pub enum Order {
    /// Ascending order
    Asc,
    /// Descending order
    #[default]
    Desc,
}

/// The bucket property the order is applied to.
///
/// The default is [`OrderTarget::Count`].
#[derive(Clone, Debug, Default, PartialEq)]
pub enum OrderTarget {
    /// Order by the key of the bucket
    Key,
    /// Order by the doc count of the bucket
    #[default]
    Count,
    /// Order by the value of the metric sub aggregation identified by the given `String`.
    ///
    /// Only single value metrics are supported currently
    SubAggregation(String),
}

impl From<&str> for OrderTarget {
    fn from(val: &str) -> Self {
        match val {
            "_key" => OrderTarget::Key,
            "_count" => OrderTarget::Count,
            _ => OrderTarget::SubAggregation(val.to_string()),
        }
    }
}

impl fmt::Display for OrderTarget {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        match self {
            OrderTarget::Key => f.write_str("_key"),
            OrderTarget::Count => f.write_str("_count"),
            OrderTarget::SubAggregation(agg) => agg.fmt(f),
        }
    }
}

/// Defines how the buckets are ordered: by which property (`target`) and in which direction
/// (`order`).
///
/// The target is either "_count", "_key", or the name of a metric sub_aggregation.
///
/// De/Serializes to elasticsearch compatible JSON.
///
/// Examples in JSON format:
/// { "_count": "asc" }
/// { "_key": "asc" }
/// { "average_price": "asc" }
#[derive(Clone, Debug, Default, PartialEq)]
pub struct CustomOrder {
    /// The bucket property to sort by
    pub target: OrderTarget,
    /// The sort direction, asc or desc
    pub order: Order,
}

impl Serialize for CustomOrder {
    /// Serializes the order as a map with a single entry: the target name mapped to the
    /// order, e.g. `{"_key":"desc"}`.
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: Serializer {
        let mut single_entry: HashMap<String, Order> = HashMap::with_capacity(1);
        single_entry.insert(self.target.to_string(), self.order);
        single_entry.serialize(serializer)
    }
}

impl<'de> Deserialize<'de> for CustomOrder {
    fn deserialize<D>(deserializer: D) -> Result<CustomOrder, D::Error>
    where D: Deserializer<'de> {
        let value = serde_json::Value::deserialize(deserializer)?;
        let return_err = |message, val: serde_json::Value| {
            de::Error::custom(format!(
                "{}, but got {}",
                message,
                serde_json::to_string(&val).unwrap()
            ))
        };

        match value {
            serde_json::Value::Object(map) => {
                if map.len() != 1 {
                    return Err(return_err(
                        "expected exactly one key-value pair in the order map",
                        map.into(),
                    ));
                }

                let (key, value) = map.into_iter().next().unwrap();
                let order = serde_json::from_value(value).map_err(de::Error::custom)?;

                Ok(CustomOrder {
                    target: key.as_str().into(),
                    order,
                })
            }
            serde_json::Value::Array(arr) => {
                if arr.is_empty() {
                    return Err(return_err("unexpected empty array in order", arr.into()));
                }
                if arr.len() != 1 {
                    return Err(return_err(
                        "only one sort order supported currently",
                        arr.into(),
                    ));
                }
                let entry = arr.into_iter().next().unwrap();
                let map = entry
                    .as_object()
                    .ok_or_else(|| return_err("expected object as sort order", entry.clone()))?;
                let (key, value) = map.into_iter().next().ok_or_else(|| {
                    return_err(
                        "expected exactly one key-value pair in the order map",
                        entry.clone(),
                    )
                })?;
                let order = serde_json::from_value(value.clone()).map_err(de::Error::custom)?;

                Ok(CustomOrder {
                    target: key.as_str().into(),
                    order,
                })
            }
            _ => Err(return_err(
                "unexpected type, expected an object or array",
                value,
            )),
        }
    }
}

/// Round-trips a [`CustomOrder`] through JSON and checks the rejected input shapes.
#[test]
fn custom_order_serde_test() {
    let order = CustomOrder {
        target: OrderTarget::Key,
        order: Order::Desc,
    };

    // Object form: serialize and read back.
    let order_str = serde_json::to_string(&order).unwrap();
    assert_eq!(order_str, "{\"_key\":\"desc\"}");
    let order_deser = serde_json::from_str(&order_str).unwrap();

    assert_eq!(order, order_deser);
    // Array form with a single object is accepted as well.
    let order_deser: CustomOrder = serde_json::from_str("[{\"_key\":\"desc\"}]").unwrap();
    assert_eq!(order, order_deser);

    // An empty object has no order entry.
    let order_deser: serde_json::Result<CustomOrder> = serde_json::from_str("{}");
    assert!(order_deser.is_err());

    // An empty array is rejected with a dedicated message.
    let order_deser: serde_json::Result<CustomOrder> = serde_json::from_str("[]");
    assert!(order_deser
        .unwrap_err()
        .to_string()
        .contains("unexpected empty array in order"));

    // More than one sort order is not supported.
    let order_deser: serde_json::Result<CustomOrder> =
        serde_json::from_str(r#"[{"_key":"desc"},{"_key":"desc"}]"#);
    assert_eq!(
        order_deser.unwrap_err().to_string(),
        r#"only one sort order supported currently, but got [{"_key":"desc"},{"_key":"desc"}]"#
    );
}


================================================
FILE: src/aggregation/bucket/range.rs
================================================
use std::fmt::Debug;
use std::ops::Range;

use columnar::{Column, ColumnType};
use rustc_hash::FxHashMap;
use serde::{Deserialize, Serialize};

use crate::aggregation::agg_data::{
    build_segment_agg_collectors, AggRefNode, AggregationsSegmentCtx,
};
use crate::aggregation::agg_limits::AggregationLimitsGuard;
use crate::aggregation::cached_sub_aggs::{
    CachedSubAggs, HighCardSubAggCache, LowCardCachedSubAggs, LowCardSubAggCache, SubAggCache,
};
use crate::aggregation::intermediate_agg_result::{
    IntermediateAggregationResult, IntermediateAggregationResults, IntermediateBucketResult,
    IntermediateRangeBucketEntry, IntermediateRangeBucketResult,
};
use crate::aggregation::segment_agg_result::{BucketIdProvider, SegmentAggregationCollector};
use crate::aggregation::*;
use crate::TantivyError;

/// Contains all information required by the SegmentRangeCollector to perform the
/// range aggregation on a segment.
pub struct RangeAggReqData {
    /// The column accessor to access the fast field values. Values are read as `u64`.
    pub accessor: Column<u64>,
    /// The type of the fast field. Used to convert between the user-facing `f64` range
    /// bounds and the `u64` values read from the column.
    pub field_type: ColumnType,
    /// The range aggregation request.
    pub req: RangeAggregation,
    /// The name of the aggregation. Used as the key under which the result is stored.
    pub name: String,
    /// Whether this is a top-level aggregation.
    pub is_top_level: bool,
}

impl RangeAggReqData {
    /// Estimate the memory consumption of this struct in bytes.
    ///
    /// Only the inline size of the struct is reported; heap allocations owned by its
    /// fields are not included.
    pub fn get_memory_consumption(&self) -> usize {
        std::mem::size_of_val(self)
    }
}

/// Provide user-defined buckets to aggregate on.
///
/// Additional buckets are created automatically so that the whole range of values is
/// covered: before the first range, after the last range, and in any gap between two
/// provided ranges.
/// During the aggregation, the values extracted from the fast_field `field` will be checked
/// against each bucket range. Note that this aggregation includes the from value and excludes the
/// to value for each range.
///
/// Result type is [`BucketResult`](crate::aggregation::agg_result::BucketResult) with
/// [`RangeBucketEntry`](crate::aggregation::agg_result::RangeBucketEntry) on the
/// `AggregationCollector`.
///
/// Result type is
/// [`IntermediateBucketResult`](crate::aggregation::intermediate_agg_result::IntermediateBucketResult) with
/// [`IntermediateRangeBucketEntry`](crate::aggregation::intermediate_agg_result::IntermediateRangeBucketEntry) on the
/// `DistributedAggregationCollector`.
///
/// # Limitations/Compatibility
/// Overlapping ranges are not yet supported and are rejected with an error.
///
/// # Request JSON Format
/// ```json
/// {
///     "my_ranges": {
///         "field": "score",
///         "ranges": [
///             { "to": 3.0 },
///             { "from": 3.0, "to": 7.0 },
///             { "from": 7.0, "to": 20.0 },
///             { "from": 20.0 }
///         ]
///     }
/// }
/// ```
#[derive(Clone, Debug, Default, PartialEq, Serialize, Deserialize)]
pub struct RangeAggregation {
    /// The field to aggregate on.
    pub field: String,
    /// Note that this aggregation includes the from value and excludes the to value for each
    /// range. Extra buckets will be created until the first to, and last from, if necessary.
    pub ranges: Vec<RangeAggregationRange>,
    /// Whether to return the buckets as a hash map. Defaults to `false` when omitted.
    #[serde(default)]
    pub keyed: bool,
}

#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
/// The range for one range bucket.
///
/// The range is half-open: `from` is inclusive, `to` is exclusive. Fields that are `None`
/// are omitted when serializing and default to `None` when missing on deserialization.
pub struct RangeAggregationRange {
    /// Custom key for the range bucket. When `None`, a key is generated from the range.
    #[serde(skip_serializing_if = "Option::is_none", default)]
    pub key: Option<String>,
    /// The from range value, which is inclusive in the range.
    /// `None` means the range is open-ended towards lower values.
    #[serde(
        skip_serializing_if = "Option::is_none",
        default,
        deserialize_with = "deserialize_option_f64"
    )]
    pub from: Option<f64>,
    /// The to range value, which is not inclusive in the range.
    /// `None` means the range is open-ended towards higher values.
    #[serde(
        skip_serializing_if = "Option::is_none",
        default,
        deserialize_with = "deserialize_option_f64"
    )]
    pub to: Option<f64>,
}

impl From<Range<f64>> for RangeAggregationRange {
    /// Builds a range without a custom key.
    ///
    /// A start of `f64::MIN` and an end of `f64::MAX` are treated as "unbounded" and
    /// become `None`.
    fn from(range: Range<f64>) -> Self {
        let Range { start, end } = range;
        RangeAggregationRange {
            key: None,
            from: (start != f64::MIN).then_some(start),
            to: (end != f64::MAX).then_some(end),
        }
    }
}

#[derive(Clone, Debug, PartialEq)]
/// Internally used u64 range for one range bucket.
///
/// This is the request range after conversion into the `u64` space in which the fast
/// field values are read.
pub(crate) struct InternalRangeAggregationRange {
    /// Custom key for the range bucket. `None` for ranges without a user-provided key,
    /// including the buckets added to cover the whole value range.
    key: Option<String>,
    /// `u64` range value. `u64::MIN` as start and `u64::MAX` as end mark open ends.
    range: Range<u64>,
}

impl From<Range<u64>> for InternalRangeAggregationRange {
    fn from(range: Range<u64>) -> Self {
        InternalRangeAggregationRange { key: None, range }
    }
}

/// Pairs the `u64` range used for value lookup with the bucket state collected for it.
#[derive(Clone, Debug)]
pub(crate) struct SegmentRangeAndBucketEntry {
    /// The range in fast field `u64` value space. Buckets are located by `range.start`.
    range: Range<u64>,
    /// The key, doc count and user-facing bounds of the bucket.
    bucket: SegmentRangeBucketEntry,
}

/// The collector puts values from the fast field into the correct buckets and does a conversion to
/// the correct datatype.
pub struct SegmentRangeCollector<C: SubAggCache> {
    /// The buckets containing the aggregation data.
    /// One `Vec` of range buckets for each ParentBucketId, indexed by the parent bucket id.
    parent_buckets: Vec<Vec<SegmentRangeAndBucketEntry>>,
    /// The type of the fast field the ranges are applied to.
    column_type: ColumnType,
    /// Index used to look up this aggregation's request data in the segment context.
    pub(crate) accessor_idx: usize,
    /// Sub-aggregation collectors, `None` if the range aggregation has no children.
    sub_agg: Option<CachedSubAggs<C>>,
    /// Bucket ids need to be unique across all parent buckets, so the next available
    /// bucket id is tracked here.
    /// This allows a kind of flattening of the bucket ids across all parent buckets.
    /// E.g. in nested aggregations:
    /// Term Agg -> Range aggregation -> Stats aggregation
    /// E.g. the Term Agg creates 3 buckets ["INFO", "ERROR", "WARN"], each of these has a Range
    /// aggregation with 4 buckets. The Range aggregation will create buckets with ids:
    /// - INFO: 0,1,2,3
    /// - ERROR: 4,5,6,7
    /// - WARN: 8,9,10,11
    ///
    /// This allows the Stats aggregation to have unique bucket ids to refer to.
    bucket_id_provider: BucketIdProvider,
    /// Guard used to account for the memory consumed by newly created buckets.
    limits: AggregationLimitsGuard,
}

impl<C: SubAggCache> Debug for SegmentRangeCollector<C> {
    /// Prints a summary of the collector: the number of parent buckets, the column type,
    /// the accessor index and whether sub-aggregations are present.
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let has_sub_agg = self.sub_agg.is_some();
        let num_parent_buckets = self.parent_buckets.len();

        let mut summary = f.debug_struct("SegmentRangeCollector");
        summary.field("parent_buckets_len", &num_parent_buckets);
        summary.field("column_type", &self.column_type);
        summary.field("accessor_idx", &self.accessor_idx);
        summary.field("has_sub_agg", &has_sub_agg);
        summary.finish()
    }
}

/// State of a single range bucket on segment level.
///
/// TODO: Bad naming, there's also SegmentRangeAndBucketEntry
#[derive(Clone)]
pub(crate) struct SegmentRangeBucketEntry {
    /// The key of the bucket: either the custom key from the request or a key generated
    /// from the range.
    pub key: Key,
    /// Number of values that fell into this bucket.
    pub doc_count: u64,
    // pub sub_aggregation: Option<Box<dyn SegmentAggregationCollector>>,
    /// Id under which sub-aggregations collect the docs of this bucket.
    pub bucket_id: BucketId,
    /// The from range of the bucket. `None` when the bucket is unbounded below.
    pub from: Option<f64>,
    /// The to range of the bucket. `None` when the bucket is unbounded above. Open interval,
    /// `to` is not inclusive.
    pub to: Option<f64>,
}

impl Debug for SegmentRangeBucketEntry {
    /// Prints the key, doc count and bounds of the bucket. The bucket id is not included.
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let mut repr = f.debug_struct("SegmentRangeBucketEntry");
        repr.field("key", &self.key);
        repr.field("doc_count", &self.doc_count);
        repr.field("from", &self.from);
        repr.field("to", &self.to);
        repr.finish()
    }
}
impl SegmentRangeBucketEntry {
    pub(crate) fn into_intermediate_bucket_entry(
        self,
    ) -> crate::Result<IntermediateRangeBucketEntry> {
        let sub_aggregation = IntermediateAggregationResults::default();

        Ok(IntermediateRangeBucketEntry {
            key: self.key.into(),
            doc_count: self.doc_count,
            sub_aggregation_res: sub_aggregation,
            from: self.from,
            to: self.to,
        })
    }
}

impl<C: SubAggCache> SegmentAggregationCollector for SegmentRangeCollector<C> {
    /// Converts the buckets collected for `parent_bucket_id` into an intermediate range
    /// result and pushes it into `results` under the name of the aggregation.
    ///
    /// The buckets of that parent are taken out of the collector, leaving an empty list
    /// in their place.
    fn add_intermediate_aggregation_result(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
        results: &mut IntermediateAggregationResults,
        parent_bucket_id: BucketId,
    ) -> crate::Result<()> {
        // Make sure the bucket list for this parent exists, even if no doc was collected.
        self.prepare_max_bucket(parent_bucket_id, agg_data)?;
        let field_type = self.column_type;
        let name = agg_data
            .get_range_req_data(self.accessor_idx)
            .name
            .to_string();

        let buckets = std::mem::take(&mut self.parent_buckets[parent_bucket_id as usize]);

        // The map is keyed by the string rendering of the range, not by the custom key.
        let buckets: FxHashMap<SerializedKey, IntermediateRangeBucketEntry> = buckets
            .into_iter()
            .map(|range_bucket| {
                let bucket_id = range_bucket.bucket.bucket_id;
                let mut agg = range_bucket.bucket.into_intermediate_bucket_entry()?;
                // Attach the sub-aggregation results collected for this bucket id.
                if let Some(sub_aggregation) = &mut self.sub_agg {
                    sub_aggregation
                        .get_sub_agg_collector()
                        .add_intermediate_aggregation_result(
                            agg_data,
                            &mut agg.sub_aggregation_res,
                            bucket_id,
                        )?;
                }
                Ok((range_to_string(&range_bucket.range, &field_type)?, agg))
            })
            .collect::<crate::Result<_>>()?;

        let bucket = IntermediateBucketResult::Range(IntermediateRangeBucketResult {
            buckets,
            column_type: Some(self.column_type),
        });

        results.push(name, IntermediateAggregationResult::Bucket(bucket))?;

        Ok(())
    }

    /// Assigns the values of `docs` to the range buckets of `parent_bucket_id`.
    ///
    /// The bucket list for `parent_bucket_id` must already exist (see
    /// `prepare_max_bucket`); the list is indexed directly.
    #[inline]
    fn collect(
        &mut self,
        parent_bucket_id: BucketId,
        docs: &[crate::DocId],
        agg_data: &mut AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        // The request data is taken out of `agg_data` and put back below.
        // NOTE(review): presumably so that `agg_data` can be borrowed mutably while the
        // accessor is in use - confirm.
        let req = agg_data.take_range_req_data(self.accessor_idx);

        agg_data
            .column_block_accessor
            .fetch_block(docs, &req.accessor);

        let buckets = &mut self.parent_buckets[parent_bucket_id as usize];

        for (doc, val) in agg_data
            .column_block_accessor
            .iter_docid_vals(docs, &req.accessor)
        {
            let bucket_pos = get_bucket_pos(val, buckets);
            let bucket = &mut buckets[bucket_pos];
            bucket.bucket.doc_count += 1;
            // Forward the doc to the sub-aggregations under the id of the matched bucket.
            if let Some(sub_agg) = self.sub_agg.as_mut() {
                sub_agg.push(bucket.bucket.bucket_id, doc);
            }
        }

        agg_data.put_back_range_req_data(self.accessor_idx, req);
        if let Some(sub_agg) = self.sub_agg.as_mut() {
            sub_agg.check_flush_local(agg_data)?;
        }

        Ok(())
    }

    /// Flushes the sub-aggregations, if there are any.
    fn flush(&mut self, agg_data: &mut AggregationsSegmentCtx) -> crate::Result<()> {
        if let Some(sub_agg) = self.sub_agg.as_mut() {
            sub_agg.flush(agg_data)?;
        }
        Ok(())
    }

    /// Creates bucket lists for all parent bucket ids up to and including `max_bucket`
    /// that do not have one yet.
    fn prepare_max_bucket(
        &mut self,
        max_bucket: BucketId,
        agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        while self.parent_buckets.len() <= max_bucket as usize {
            let new_buckets = self.create_new_buckets(agg_data)?;
            self.parent_buckets.push(new_buckets);
        }

        Ok(())
    }
}
/// Build a concrete `SegmentRangeCollector`, choosing the sub-aggregation cache type.
///
/// The low-cardinality cache (`LowCardSubAggCache`) is used when the aggregation is
/// top-level and has at most 64 requested ranges, the high-cardinality cache
/// (`HighCardSubAggCache`) otherwise. Collectors for the child aggregations of `node` are
/// built first, if there are any.
pub(crate) fn build_segment_range_collector(
    agg_data: &mut AggregationsSegmentCtx,
    node: &AggRefNode,
) -> crate::Result<Box<dyn SegmentAggregationCollector>> {
    let accessor_idx = node.idx_in_req_data;
    let req_data = agg_data.get_range_req_data(node.idx_in_req_data);
    let field_type = req_data.field_type;

    // TODO: A better metric instead of is_top_level would be the number of buckets expected.
    // E.g. if the range agg is not top level, but the parent is a bucket agg with less than 10
    // buckets, we are still in low cardinality territory.
    let is_low_card = req_data.is_top_level && req_data.req.ranges.len() <= 64;

    let sub_agg = if !node.children.is_empty() {
        Some(build_segment_agg_collectors(agg_data, &node.children)?)
    } else {
        None
    };

    // The two branches differ only in the cache type parameter of the collector.
    if is_low_card {
        Ok(Box::new(SegmentRangeCollector::<LowCardSubAggCache> {
            sub_agg: sub_agg.map(LowCardCachedSubAggs::new),
            column_type: field_type,
            accessor_idx,
            parent_buckets: Vec::new(),
            bucket_id_provider: BucketIdProvider::default(),
            limits: agg_data.context.limits.clone(),
        }))
    } else {
        Ok(Box::new(SegmentRangeCollector::<HighCardSubAggCache> {
            sub_agg: sub_agg.map(CachedSubAggs::new),
            column_type: field_type,
            accessor_idx,
            parent_buckets: Vec::new(),
            bucket_id_provider: BucketIdProvider::default(),
            limits: agg_data.context.limits.clone(),
        }))
    }
}

impl<C: SubAggCache> SegmentRangeCollector<C> {
    /// Creates a fresh, empty set of range buckets for one parent bucket.
    ///
    /// The requested ranges are converted to `u64` space and extended so that they cover
    /// the whole value range. Every bucket gets a new id from the bucket id provider, and
    /// the memory for the bucket entries is registered with the aggregation limits.
    ///
    /// # Errors
    /// Fails if the ranges cannot be converted or validated, if a key cannot be
    /// generated, or if registering the memory consumption fails.
    pub(crate) fn create_new_buckets(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<Vec<SegmentRangeAndBucketEntry>> {
        let field_type = self.column_type;
        let req_data = agg_data.get_range_req_data(self.accessor_idx);
        // The range input on the request is f64.
        // We need to convert to u64 ranges, because we read the values as u64.
        // The mapping from the conversion is monotonic so ordering is preserved.
        let buckets: Vec<_> = extend_validate_ranges(&req_data.req.ranges, &field_type)?
            .iter()
            .map(|range| {
                let bucket_id = self.bucket_id_provider.next_bucket_id();
                // Prefer the custom key; otherwise generate one from the range.
                let key = range
                    .key
                    .clone()
                    .map(|key| Ok(Key::Str(key)))
                    .unwrap_or_else(|| range_to_key(&range.range, &field_type))?;
                // `u64::MAX` as end marks a bucket that is unbounded above.
                let to = if range.range.end == u64::MAX {
                    None
                } else {
                    Some(f64_from_fastfield_u64(range.range.end, field_type))
                };
                // `u64::MIN` as start marks a bucket that is unbounded below.
                let from = if range.range.start == u64::MIN {
                    None
                } else {
                    Some(f64_from_fastfield_u64(range.range.start, field_type))
                };
                // let sub_aggregation = sub_agg_prototype.clone();

                Ok(SegmentRangeAndBucketEntry {
                    range: range.range.clone(),
                    bucket: SegmentRangeBucketEntry {
                        doc_count: 0,
                        bucket_id,
                        key,
                        from,
                        to,
                    },
                })
            })
            .collect::<crate::Result<_>>()?;

        // Accounts for the inline size of the entries only.
        self.limits.add_memory_consumed(
            buckets.len() as u64 * std::mem::size_of::<SegmentRangeAndBucketEntry>() as u64,
        )?;
        Ok(buckets)
    }
}
/// Returns the index of the bucket whose range contains `val`.
///
/// `buckets` must be sorted by range start and the first bucket must start at
/// `u64::MIN`; otherwise a value below the first start would underflow the index.
#[inline]
fn get_bucket_pos(val: u64, buckets: &[SegmentRangeAndBucketEntry]) -> usize {
    let pos = match buckets.binary_search_by_key(&val, |probe| probe.range.start) {
        // `val` is exactly the start of a bucket.
        Ok(exact) => exact,
        // `val` lies inside the bucket preceding the insertion point.
        Err(insertion_point) => insertion_point - 1,
    };
    debug_assert!(buckets[pos].range.contains(&val));
    pos
}

/// Maps a user provided `f64` range into fast field value space.
///
/// Fast field values are always stored as `u64` internally. A `u64` fast field with
/// `[1, 2, 5]` stores these values as is, while an `f64` fast field with `[1.0, 2.0, 5.0]`
/// is mapped into `u64` space by a monotonic mapping function that preserves the order.
///
/// A user range such as `1.0..3.0` therefore has to go through the same monotonic mapping,
/// so that the resulting range contains the `u64` values read from the fast field.
/// Converting every value read back to `f64` instead would be more expensive when many
/// documents are hit.
///
/// A missing `from` maps to `u64::MIN`, a missing `to` maps to `u64::MAX`.
fn to_u64_range(
    range: &RangeAggregationRange,
    field_type: &ColumnType,
) -> crate::Result<InternalRangeAggregationRange> {
    // Converts one bound, falling back to `open_end` when the bound is not set.
    let convert_bound = |bound: Option<f64>, open_end: u64| -> crate::Result<u64> {
        match bound {
            Some(val) => f64_to_fastfield_u64(val, field_type)
                .ok_or_else(|| TantivyError::InvalidArgument("invalid field type".to_string())),
            None => Ok(open_end),
        }
    };

    let start = convert_bound(range.from, u64::MIN)?;
    let end = convert_bound(range.to, u64::MAX)?;

    Ok(InternalRangeAggregationRange {
        key: range.key.clone(),
        range: start..end,
    })
}

/// Extends the provided buckets to contain the whole value range, by inserting buckets at the
/// beginning and end and filling gaps.
///
/// The ranges are converted to `u64` space and sorted by their start. The returned list is
/// sorted, starts at `u64::MIN`, ends at `u64::MAX`, and each bucket starts where the
/// previous one ends. Inserted buckets have no custom key.
///
/// # Errors
/// Returns `TantivyError::InvalidArgument` if `buckets` is empty, if a bound cannot be
/// converted for the given field type, or if two ranges overlap.
fn extend_validate_ranges(
    buckets: &[RangeAggregationRange],
    field_type: &ColumnType,
) -> crate::Result<Vec<InternalRangeAggregationRange>> {
    // The ranges come from the user request; reject an empty list instead of panicking.
    if buckets.is_empty() {
        return Err(TantivyError::InvalidArgument(
            "range aggregation requires at least one range".to_string(),
        ));
    }

    let mut converted_buckets = buckets
        .iter()
        .map(|range| to_u64_range(range, field_type))
        .collect::<crate::Result<Vec<_>>>()?;

    converted_buckets.sort_by_key(|bucket| bucket.range.start);

    // At most one filler bucket per requested range, plus one at the end.
    let mut covering: Vec<InternalRangeAggregationRange> =
        Vec::with_capacity(2 * converted_buckets.len() + 1);
    // End of the value space covered so far.
    let mut covered_until = u64::MIN;

    for bucket in converted_buckets {
        // The last pushed element is always the previous requested range, because fillers
        // are pushed right before the range they precede.
        if let Some(previous) = covering.last() {
            if previous.range.end > bucket.range.start {
                return Err(TantivyError::InvalidArgument(format!(
                    "Overlapping ranges not supported range {:?}, range+1 {:?}",
                    previous, bucket
                )));
            }
        }
        // Fill the gap before this range: either the leading gap or a hole between ranges.
        if covered_until != bucket.range.start {
            covering.push((covered_until..bucket.range.start).into());
        }
        covered_until = bucket.range.end;
        covering.push(bucket);
    }

    // Cover the remaining value space after the last range.
    if covered_until != u64::MAX {
        covering.push((covered_until..u64::MAX).into());
    }

    Ok(covering)
}

/// Renders a `u64` range as `"<start>-<end>"` in the value space of `field_type`.
///
/// An open start (`u64::MIN`) or open end (`u64::MAX`) is rendered as `*`. Date values are
/// rendered with `format_date`, all other values as `f64`.
pub(crate) fn range_to_string(
    range: &Range<u64>,
    field_type: &ColumnType,
) -> crate::Result<String> {
    // Renders a bound that is not open-ended.
    let render_bound = |val: u64| {
        if *field_type == ColumnType::DateTime {
            format_date(i64::from_u64(val))
        } else {
            Ok(f64_from_fastfield_u64(val, *field_type).to_string())
        }
    };

    // The open-end markers are checked per side for malformed requests: if the user passes
    // the range u64::MIN..0.0, it should be rendered as "*-0" and not "*-*".
    let start = if range.start == u64::MIN {
        "*".to_string()
    } else {
        render_bound(range.start)?
    };
    let end = if range.end == u64::MAX {
        "*".to_string()
    } else {
        render_bound(range.end)?
    };

    Ok(format!("{}-{}", start, end))
}

/// Builds the generated bucket key for a range: its string rendering wrapped in `Key::Str`.
pub(crate) fn range_to_key(range: &Range<u64>, field_type: &ColumnType) -> crate::Result<Key> {
    range_to_string(range, field_type).map(Key::Str)
}

#[cfg(test)]
mod tests {

    use serde_json::Value;

    use super::*;
    use crate::aggregation::agg_req::Aggregations;
    use crate::aggregation::tests::{
        exec_request, exec_request_with_query, get_test_index_2_segments,
        get_test_index_with_num_docs,
    };

    /// Builds a `SegmentRangeCollector` with a single parent bucket list for the given
    /// ranges, without sub-aggregations.
    ///
    /// Panics if the ranges cannot be validated or a key cannot be generated.
    pub fn get_collector_from_ranges(
        ranges: Vec<RangeAggregationRange>,
        field_type: ColumnType,
    ) -> SegmentRangeCollector<HighCardSubAggCache> {
        let req = RangeAggregation {
            field: "dummy".to_string(),
            ranges,
            ..Default::default()
        };
        // Build the buckets the same way as `SegmentRangeCollector::create_new_buckets`, but
        // without needing an `AggregationsSegmentCtx`. Every bucket gets `bucket_id` 0.
        let buckets: Vec<_> = extend_validate_ranges(&req.ranges, &field_type)
            .expect("unexpected error in extend_validate_ranges")
            .iter()
            .map(|range| {
                let key = range
                    .key
                    .clone()
                    .map(|key| Ok(Key::Str(key)))
                    .unwrap_or_else(|| range_to_key(&range.range, &field_type))
                    .expect("unexpected error in range_to_key");
                let to = if range.range.end == u64::MAX {
                    None
                } else {
                    Some(f64_from_fastfield_u64(range.range.end, field_type))
                };
                let from = if range.range.start == u64::MIN {
                    None
                } else {
                    Some(f64_from_fastfield_u64(range.range.start, field_type))
                };
                SegmentRangeAndBucketEntry {
                    range: range.range.clone(),
                    bucket: SegmentRangeBucketEntry {
                        doc_count: 0,
                        key,
                        from,
                        to,
                        bucket_id: 0,
                    },
                }
            })
            .collect();

        SegmentRangeCollector {
            parent_buckets: vec![buckets],
            column_type: field_type,
            accessor_idx: 0,
            sub_agg: None,
            bucket_id_provider: Default::default(),
            limits: AggregationLimitsGuard::default(),
        }
    }

    /// Two adjacent ranges on an f64 field: checks that the leading and trailing buckets
    /// are added and that the doc counts are as expected.
    #[test]
    fn range_fraction_test() -> crate::Result<()> {
        let index = get_test_index_with_num_docs(false, 100)?;

        let agg_req: Aggregations = serde_json::from_value(json!({
            "range": {
                "range": {
                    "field": "fraction_f64",
                    "ranges": [
                        {"from": 0.0, "to": 0.1},
                        {"from": 0.1, "to": 0.2},
                    ]
                },
            }
        }))
        .unwrap();

        let res = exec_request_with_query(agg_req, &index, None)?;

        // Bucket 0 and 3 are the automatically added open-ended buckets.
        assert_eq!(res["range"]["buckets"][0]["key"], "*-0");
        assert_eq!(res["range"]["buckets"][0]["doc_count"], 0);
        assert_eq!(res["range"]["buckets"][1]["key"], "0-0.1");
        assert_eq!(res["range"]["buckets"][1]["doc_count"], 10);
        assert_eq!(res["range"]["buckets"][2]["key"], "0.1-0.2");
        assert_eq!(res["range"]["buckets"][2]["doc_count"], 10);
        assert_eq!(res["range"]["buckets"][3]["key"], "0.2-*");
        assert_eq!(res["range"]["buckets"][3]["doc_count"], 80);

        Ok(())
    }

    /// Same request as `range_fraction_test`, with an `avg` sub-aggregation attached.
    ///
    /// Only the keys and doc counts of the range buckets are asserted; the values of the
    /// sub-aggregation are not checked here.
    #[test]
    fn range_fraction_test_with_sub_agg() -> crate::Result<()> {
        let index = get_test_index_with_num_docs(false, 100)?;

        let sub_agg_req: Aggregations = serde_json::from_value(json!({
            "avg": { "avg": { "field": "score_f64", } }

        }))
        .unwrap();

        let agg_req: Aggregations = serde_json::from_value(json!({
            "range": {
                "range": {
                    "field": "fraction_f64",
                    "ranges": [
                        {"from": 0.0, "to": 0.1},
                        {"from": 0.1, "to": 0.2},
                    ]
                },
                "aggs": sub_agg_req
            }
        }))
        .unwrap();

        let res = exec_request_with_query(agg_req, &index, None)?;

        assert_eq!(res["range"]["buckets"][0]["key"], "*-0");
        assert_eq!(res["range"]["buckets"][0]["doc_count"], 0);
        assert_eq!(res["range"]["buckets"][1]["key"], "0-0.1");
        assert_eq!(res["range"]["buckets"][1]["doc_count"], 10);
        assert_eq!(res["range"]["buckets"][2]["key"], "0.1-0.2");
        assert_eq!(res["range"]["buckets"][2]["doc_count"], 10);
        assert_eq!(res["range"]["buckets"][3]["key"], "0.2-*");
        assert_eq!(res["range"]["buckets"][3]["doc_count"], 80);

        Ok(())
    }

    /// With `"keyed": true` the buckets are returned as a map from bucket key to bucket.
    #[test]
    fn range_keyed_buckets_test() -> crate::Result<()> {
        let index = get_test_index_with_num_docs(false, 100)?;

        let agg_req: Aggregations = serde_json::from_value(json!({
            "range": {
                "range": {
                    "field": "fraction_f64",
                    "ranges": [
                        {"from": 0.0, "to": 0.1},
                        {"from": 0.1, "to": 0.2},
                    ],
                    "keyed": true
                },
            }
        }))
        .unwrap();

        let res = exec_request_with_query(agg_req, &index, None)?;

        // Open-ended buckets omit the missing `from` / `to` bound.
        assert_eq!(
            res,
            json!({
                "range": {
                    "buckets": {
                        "*-0": { "key": "*-0", "doc_count": 0, "to": 0.0},
                        "0-0.1": {"key": "0-0.1", "doc_count": 10, "from": 0.0, "to": 0.1},
                        "0.1-0.2": {"key": "0.1-0.2", "doc_count": 10, "from": 0.1, "to": 0.2},
                        "0.2-*": {"key": "0.2-*", "doc_count": 80, "from": 0.2},
                    }
                }
            })
        );

        Ok(())
    }

    /// A custom `key` on a range replaces the generated key of that bucket only.
    #[test]
    fn range_custom_key_test() -> crate::Result<()> {
        let index = get_test_index_with_num_docs(false, 100)?;

        let agg_req: Aggregations = serde_json::from_value(json!({
            "range": {
                "range": {
                    "field": "fraction_f64",
                    "ranges": [
                        {"key": "custom-key-0-to-0.1", "from": 0.0, "to": 0.1},
                        {"from": 0.1, "to": 0.2},
                    ],
                    "keyed": false
                },
            }
        }))
        .unwrap();

        let res = exec_request_with_query(agg_req, &index, None)?;

        assert_eq!(
            res,
            json!({
                "range": {
                    "buckets": [
                        {"key": "*-0", "doc_count": 0, "to": 0.0},
                        {"key": "custom-key-0-to-0.1", "doc_count": 10, "from": 0.0, "to": 0.1},
                        {"key": "0.1-0.2", "doc_count": 10, "from": 0.1, "to": 0.2},
                        {"key": "0.2-*", "doc_count": 80, "from": 0.2}
                    ]
                }
            })
        );

        Ok(())
    }

    /// Runs the date range test with `merge_segments` set to `true`.
    #[test]
    fn range_date_test_single_segment() -> crate::Result<()> {
        range_date_test_with_opt(true)
    }

    /// Runs the date range test with `merge_segments` set to `false`.
    #[test]
    fn range_date_test_multi_segment() -> crate::Result<()> {
        range_date_test_with_opt(false)
    }

    /// Range aggregation on a date field: checks the generated key and the
    /// `from_as_string` / `to_as_string` values of the buckets.
    ///
    /// `merge_segments` is forwarded to `get_test_index_2_segments`.
    fn range_date_test_with_opt(merge_segments: bool) -> crate::Result<()> {
        let index = get_test_index_2_segments(merge_segments)?;

        let agg_req: Aggregations = serde_json::from_value(json!({
            "date_ranges": {
                "range": {
                    "field": "date",
                    "ranges": [
                        {"to": 1546300800000000000i64},
                        {"from": 1546300800000000000i64, "to": 1546387200000000000i64},
                    ],
                    "keyed": false
                },
            }
        }))
        .unwrap();

        let agg_res = exec_request(agg_req, &index)?;

        let res: Value = serde_json::from_str(&serde_json::to_string(&agg_res)?)?;

        // The first bucket is open-ended below, so it has no `from_as_string`.
        assert_eq!(
            res["date_ranges"]["buckets"][0]["from_as_string"],
            Value::Null
        );
        assert_eq!(
            res["date_ranges"]["buckets"][0]["key"],
            "*-2019-01-01T00:00:00Z"
        );
        assert_eq!(
            res["date_ranges"]["buckets"][1]["from_as_string"],
            "2019-01-01T00:00:00Z"
        );
        assert_eq!(
            res["date_ranges"]["buckets"][1]["to_as_string"],
            "2019-01-02T00:00:00Z"
        );

        // The third bucket was not requested; it is added to cover the remaining values.
        assert_eq!(
            res["date_ranges"]["buckets"][2]["from_as_string"],
            "2019-01-02T00:00:00Z"
        );
        assert_eq!(
            res["date_ranges"]["buckets"][2]["to_as_string"],
            Value::Null
        );

        Ok(())
    }

    /// A keyed range aggregation must use the custom `key` of a range both as the map key
    /// and as the `key` property of the bucket.
    #[test]
    fn range_custom_key_keyed_buckets_test() -> crate::Result<()> {
        let index = get_test_index_with_num_docs(false, 100)?;

        let request = json!({
            "range": {
                "range": {
                    "field": "fraction_f64",
                    "ranges": [
                        {"key": "custom-key-0-to-0.1", "from": 0.0, "to": 0.1},
                    ],
                    "keyed": true
                },
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();

        let res = exec_request_with_query(agg_req, &index, None)?;

        let expected = json!({
            "range": {
                "buckets": {
                    "*-0": { "key": "*-0", "doc_count": 0, "to": 0.0},
                    "custom-key-0-to-0.1": {"key": "custom-key-0-to-0.1", "doc_count": 10, "from": 0.0, "to": 0.1},
                    "0.1-*": {"key": "0.1-*", "doc_count": 90, "from": 0.1},
                }
            }
        });
        assert_eq!(res, expected);

        Ok(())
    }

    /// A hole between two requested ranges must be filled with an additional bucket.
    #[test]
    fn bucket_test_extend_range_hole() {
        let requested = vec![(10f64..20f64).into(), (30f64..40f64).into()];
        let collector = get_collector_from_ranges(requested, ColumnType::F64);
        let buckets = collector.parent_buckets[0].clone();

        // Expected (start, end) bounds of the first four buckets, in order.
        let expected_bounds = [
            (u64::MIN, 10f64.to_u64()),
            (10f64.to_u64(), 20f64.to_u64()),
            // Added bucket to fill hole
            (20f64.to_u64(), 30f64.to_u64()),
            (30f64.to_u64(), 40f64.to_u64()),
        ];
        for (idx, &(start, end)) in expected_bounds.iter().enumerate() {
            assert_eq!(buckets[idx].range.start, start);
            assert_eq!(buckets[idx].range.end, end);
        }
    }

    /// Ranges starting at `f64::MIN` or ending at `f64::MAX` must map to the full u64 space
    /// without any extra bucket being added.
    #[test]
    fn bucket_test_range_conversion_special_case() {
        // the monotonic conversion between f64 and u64, does not map f64::MIN.to_u64() ==
        // u64::MIN, but the into trait converts f64::MIN/MAX to None
        let requested = vec![
            (f64::MIN..10f64).into(),
            (10f64..20f64).into(),
            (20f64..f64::MAX).into(),
        ];
        let collector = get_collector_from_ranges(requested, ColumnType::F64);
        let buckets = collector.parent_buckets[0].clone();

        // Expected (start, end) bounds of the three buckets, in order.
        let expected_bounds = [
            (u64::MIN, 10f64.to_u64()),
            (10f64.to_u64(), 20f64.to_u64()),
            (20f64.to_u64(), u64::MAX),
        ];
        for (idx, &(start, end)) in expected_bounds.iter().enumerate() {
            assert_eq!(buckets[idx].range.start, start);
            assert_eq!(buckets[idx].range.end, end);
        }
        assert_eq!(buckets.len(), 3);
    }

    /// Keys of the first and last bucket when the requested range has negative bounds.
    #[test]
    fn bucket_range_test_negative_vals() {
        let requested = vec![(-10f64..-1f64).into()];
        let collector = get_collector_from_ranges(requested, ColumnType::F64);
        let buckets = collector.parent_buckets[0].clone();

        let first_key = buckets[0].bucket.key.to_string();
        assert_eq!(&first_key, "*--10");

        let last_key = buckets[buckets.len() - 1].bucket.key.to_string();
        assert_eq!(&last_key, "-1-*");
    }
    /// Keys of the first and last bucket when the requested range has non-negative bounds.
    #[test]
    fn bucket_range_test_positive_vals() {
        let requested = vec![(0f64..10f64).into()];
        let collector = get_collector_from_ranges(requested, ColumnType::F64);
        let buckets = collector.parent_buckets[0].clone();

        let first_key = buckets[0].bucket.key.to_string();
        assert_eq!(&first_key, "*-0");

        let last_key = buckets[buckets.len() - 1].bucket.key.to_string();
        assert_eq!(&last_key, "10-*");
    }

    /// The bucket lookup on a u64 column must return the same positions whether the open
    /// ranges below 10 and above 100 are requested explicitly or not.
    #[test]
    fn range_binary_search_test_u64() {
        let check_ranges = |ranges: Vec<RangeAggregationRange>| {
            let collector = get_collector_from_ranges(ranges, ColumnType::U64);
            let search = |val: u64| get_bucket_pos(val, &collector.parent_buckets[0]);

            // (probed value, expected bucket position)
            let cases = [
                (u64::MIN, 0),
                (9, 0),
                (10, 1),
                (11, 1),
                (99, 1),
                (100, 2),
                // `u64::MAX - 1` rather than `u64::MAX`: the end of a range is never
                // included.
                (u64::MAX - 1, 2),
            ];
            for &(val, expected_pos) in cases.iter() {
                assert_eq!(search(val), expected_pos);
            }
        };

        // Open-ended range covering everything below 10.
        let below_10 = || RangeAggregationRange {
            key: None,
            from: None,
            to: Some(10.0),
        };
        // Open-ended range covering everything from 100 upwards.
        let from_100 = || RangeAggregationRange {
            key: None,
            from: Some(100.0),
            to: None,
        };

        check_ranges(vec![(10.0..100.0).into()]);
        check_ranges(vec![below_10(), (10.0..100.0).into()]);
        check_ranges(vec![below_10(), (10.0..100.0).into(), from_100()]);
    }

    /// Bucket lookup on an f64 column: probes are given in the u64 mapping of the f64 values.
    #[test]
    fn range_binary_search_test_f64() {
        let requested = vec![(10.0..100.0).into()];
        let collector = get_collector_from_ranges(requested, ColumnType::F64);
        let search = |val: u64| get_bucket_pos(val, &collector.parent_buckets[0]);

        // (probed value, expected bucket position)
        let cases = [
            (u64::MIN, 0),
            (9f64.to_u64(), 0),
            (10f64.to_u64(), 1),
            (11f64.to_u64(), 1),
            (99f64.to_u64(), 1),
            (100f64.to_u64(), 2),
            // `u64::MAX - 1` rather than `u64::MAX`: the end of a range is never included.
            (u64::MAX - 1, 2),
        ];
        for &(val, expected_pos) in cases.iter() {
            assert_eq!(search(val), expected_pos);
        }
    }
}


================================================
FILE: src/aggregation/bucket/term_agg.rs
================================================
use std::fmt::Debug;
use std::io;
use std::net::Ipv6Addr;

use columnar::column_values::CompactSpaceU64Accessor;
use columnar::{
    Column, ColumnType, Dictionary, MonotonicallyMappableToU128, MonotonicallyMappableToU64,
    NumericalValue, StrColumn,
};
use common::{BitSet, TinySet};
use rustc_hash::FxHashMap;
use serde::{Deserialize, Serialize};

use super::{CustomOrder, Order, OrderTarget};
use crate::aggregation::agg_data::{
    build_segment_agg_collectors, AggRefNode, AggregationsSegmentCtx,
};
use crate::aggregation::agg_limits::MemoryConsumption;
use crate::aggregation::agg_req::Aggregations;
use crate::aggregation::cached_sub_aggs::{
    CachedSubAggs, HighCardSubAggCache, LowCardCachedSubAggs, LowCardSubAggCache, SubAggCache,
};
use crate::aggregation::intermediate_agg_result::{
    IntermediateAggregationResult, IntermediateAggregationResults, IntermediateBucketResult,
    IntermediateKey, IntermediateTermBucketEntry, IntermediateTermBucketResult,
};
use crate::aggregation::segment_agg_result::{BucketIdProvider, SegmentAggregationCollector};
use crate::aggregation::{format_date, BucketId, Key};
use crate::error::DataCorruption;
use crate::TantivyError;

/// Contains all information required by the SegmentTermCollector to perform the
/// terms aggregation on a segment.
#[derive(Debug, Clone)]
pub struct TermsAggReqData {
    /// The column accessor to access the fast field values.
    pub accessor: Column<u64>,
    /// The type of the column.
    pub column_type: ColumnType,
    /// The string dictionary column if the field is of type text.
    pub str_dict_column: Option<StrColumn>,
    /// The missing value as u64 value.
    pub missing_value_for_accessor: Option<u64>,
    /// Used to build the correct nested result when we have an empty result.
    // NOTE(review): the field name looks like a typo of `sub_aggregations`; it is public, so
    // renaming it would be a breaking change.
    pub sug_aggregations: Aggregations,
    /// The name of the aggregation.
    pub name: String,
    /// The normalized term aggregation request.
    pub req: TermsAggregationInternal,
    /// Preloaded allowed term ords (string columns only). If set, only ords present are collected.
    pub allowed_term_ids: Option<BitSet>,
    /// True if this terms aggregation is at the top level of the aggregation tree (not nested).
    pub is_top_level: bool,
}

impl TermsAggReqData {
    /// Returns an estimate, in bytes, of the memory held by this request data.
    ///
    /// The estimate is the size of the struct itself, plus the size of a
    /// `TermsAggregationInternal`, plus one eighth of `allowed_term_ids.len()` when the
    /// allowed term set is present.
    pub fn get_memory_consumption(&self) -> usize {
        // NOTE(review): this assumes `BitSet::len()` reflects the number of bits backing the
        // set — confirm against the `BitSet` implementation.
        let allowed_terms_bytes = match &self.allowed_term_ids {
            Some(bitset) => bitset.len() / 8,
            None => 0,
        };
        let self_bytes = std::mem::size_of::<Self>();
        let req_bytes = std::mem::size_of::<TermsAggregationInternal>();
        self_bytes + req_bytes + allowed_terms_bytes
    }
}

/// Creates a bucket for every unique term and counts the number of occurrences.
/// Note that doc_count in the response buckets equals term count here.
///
/// If the text is untokenized and single value, that means one term per document and therefore it
/// is in fact doc count.
///
/// ## Prerequisite
/// Term aggregations work only on [fast fields](`crate::fastfield`) of type `u64`, `f64`, `i64` and
/// text.
///
/// ## Document count error
/// To improve performance, results from one segment are cut off at `segment_size`. On an index with
/// a single segment this is fine. When combining results of multiple segments, terms that
/// don't make it in the top n of a shard increase the theoretical upper bound error by lowest
/// term-count.
///
/// Even with a larger `segment_size` value, doc_count values for a terms aggregation may be
/// approximate. As a result, any sub-aggregations on the terms aggregation may also be approximate.
/// `sum_other_doc_count` is the number of documents that didn’t make it into the top size
/// terms. If this is greater than 0, you can be sure that the terms agg had to throw away some
/// buckets, either because they didn’t fit into size on the root node or they didn’t fit into
/// `segment_size` on the segment node.
///
/// ## Per bucket document count error
/// If you set the `show_term_doc_count_error` parameter to true, the terms aggregation will include
/// doc_count_error_upper_bound, which is an upper bound to the error on the doc_count returned by
/// each segment. It’s the sum of the size of the largest bucket on each segment that didn’t fit
/// into segment_size.
///
/// Result type is [`BucketResult`](crate::aggregation::agg_result::BucketResult) with
/// [`BucketEntry`](crate::aggregation::agg_result::BucketEntry) on the
/// `AggregationCollector`.
///
/// Result type is
/// [`IntermediateBucketResult`](crate::aggregation::intermediate_agg_result::IntermediateBucketResult) with
/// [`IntermediateTermBucketEntry`](crate::aggregation::intermediate_agg_result::IntermediateTermBucketEntry) on the
/// `DistributedAggregationCollector`.
///
/// # Limitations/Compatibility
///
/// Each segment returns up to [segment_size](TermsAggregation::segment_size) results. This
/// differs from Elasticsearch's behaviour.
///
/// # Request JSON Format
/// ```json
/// {
///     "genres": {
///         "terms":{ "field": "genre" }
///     }
/// }
/// ```
///
/// # Response JSON Format
/// ```json
/// {
///     ...
///     "aggregations": {
///         "genres": {
///             "doc_count_error_upper_bound": 0,
///             "sum_other_doc_count": 0,
///             "buckets": [
///                 { "key": "drumnbass", "doc_count": 6 },
///                 { "key": "raggae", "doc_count": 4 },
///                 { "key": "jazz", "doc_count": 2 }
///             ]
///         }
///     }
/// }
/// ```

/// Value of the `include` / `exclude` parameters of a terms aggregation.
///
/// It is serialized as a plain string for [`IncludeExcludeParam::Regex`] and as an array of
/// strings for [`IncludeExcludeParam::Values`].
#[derive(Clone, Debug, PartialEq)]
pub enum IncludeExcludeParam {
    /// A single string pattern is treated as regex.
    Regex(String),
    /// An array of strings is treated as exact values.
    Values(Vec<String>),
}

// Serializes a regex as a plain string and exact values as a sequence of strings, mirroring
// the two shapes accepted on deserialization.
impl Serialize for IncludeExcludeParam {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: serde::Serializer {
        match self {
            Self::Regex(pattern) => serializer.serialize_str(pattern),
            Self::Values(values) => serializer.collect_seq(values),
        }
    }
}

// Custom deserializer: a single string is read as a regex, an array of strings is read as a
// list of exact values.
impl<'de> Deserialize<'de> for IncludeExcludeParam {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: serde::Deserializer<'de> {
        use serde::de::{self, SeqAccess, Visitor};

        /// Visitor building the parameter from whichever shape the input has.
        struct ParamVisitor;

        impl<'de> Visitor<'de> for ParamVisitor {
            type Value = IncludeExcludeParam;

            fn expecting(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
                f.write_str("a string (regex) or an array of strings")
            }

            fn visit_str<E>(self, pattern: &str) -> Result<Self::Value, E>
            where E: de::Error {
                Ok(IncludeExcludeParam::Regex(pattern.to_owned()))
            }

            fn visit_borrowed_str<E>(self, pattern: &'de str) -> Result<Self::Value, E>
            where E: de::Error {
                Ok(IncludeExcludeParam::Regex(pattern.to_owned()))
            }

            fn visit_string<E>(self, pattern: String) -> Result<Self::Value, E>
            where E: de::Error {
                // Already owned: no copy needed.
                Ok(IncludeExcludeParam::Regex(pattern))
            }

            fn visit_seq<A>(self, mut seq: A) -> Result<Self::Value, A::Error>
            where A: SeqAccess<'de> {
                let mut values: Vec<String> = Vec::new();
                loop {
                    match seq.next_element::<String>()? {
                        Some(value) => values.push(value),
                        None => return Ok(IncludeExcludeParam::Values(values)),
                    }
                }
            }
        }

        // The input shape is not known upfront, so let the format drive the visitor.
        deserializer.deserialize_any(ParamVisitor)
    }
}

/// The terms aggregation allows you to group documents by unique values of a field.
///
/// All parameters except `field` are optional; unset parameters are omitted when serializing.
#[derive(Clone, Debug, Default, PartialEq, Serialize, Deserialize)]
pub struct TermsAggregation {
    /// The field to aggregate on.
    pub field: String,
    /// By default, the top 10 terms with the most documents are returned.
    /// Larger values for size are more expensive.
    #[serde(skip_serializing_if = "Option::is_none", default)]
    pub size: Option<u32>,

    /// To get more accurate results, we fetch more than `size` from each segment.
    ///
    /// Increasing this value will increase the cost in exchange for more accuracy.
    ///
    /// Defaults to 10 * size.
    ///
    /// Also accepted under the names `shard_size` and `split_size` when deserializing.
    #[serde(skip_serializing_if = "Option::is_none", default)]
    #[serde(alias = "shard_size")]
    #[serde(alias = "split_size")]
    pub segment_size: Option<u32>,

    /// If you set the `show_term_doc_count_error` parameter to true, the terms aggregation will
    /// include doc_count_error_upper_bound, which is an upper bound to the error on the
    /// doc_count returned by each shard. It’s the sum of the size of the largest bucket on
    /// each segment that didn’t fit into `shard_size`.
    ///
    /// Defaults to true when ordering by count desc.
    #[serde(skip_serializing_if = "Option::is_none", default)]
    pub show_term_doc_count_error: Option<bool>,

    /// Filter all terms that are lower than `min_doc_count`. Defaults to 1.
    ///
    /// **Expensive**: When set to 0, this will return all terms in the field.
    #[serde(skip_serializing_if = "Option::is_none", default)]
    pub min_doc_count: Option<u64>,

    /// Set the order. `String` is here a target, which is either "_count", "_key", or the name of
    /// a metric sub_aggregation.
    ///
    /// Single value metrics like average can be addressed by its name.
    /// Multi value metrics like stats are required to address their field by name e.g.
    /// "stats.avg"
    ///
    /// Examples in JSON format:
    /// { "_count": "asc" }
    /// { "_key": "asc" }
    /// { "average_price": "asc" }
    #[serde(skip_serializing_if = "Option::is_none", default)]
    pub order: Option<CustomOrder>,

    /// The missing parameter defines how documents that are missing a value should be treated.
    /// By default they will be ignored but it is also possible to treat them as if they had a
    /// value. Examples in JSON format:
    /// { "missing": "NO_DATA" }
    ///
    /// # Internal
    ///
    /// Internally, `missing` requires some specialized handling in some scenarios.
    ///
    /// Simple Case:
    /// In the simplest case, we can just put the missing value in the termmap and use that. In
    /// case of text we put a special u64::MAX and replace it at the end with the actual
    /// missing value, when loading the text.
    /// Special Case 1:
    /// If we have multiple columns on one field, we need to have a union on the indices on both
    /// columns, to find docids without a value. That requires a special missing aggregation.
    /// Special Case 2: if the key is of type text and the column is numerical, we also need to use
    /// the special missing aggregation, since there is no mechanism in the numerical column to
    /// add text.
    #[serde(skip_serializing_if = "Option::is_none", default)]
    pub missing: Option<Key>,

    /// Include terms by either regex (single string) or exact values (array).
    #[serde(skip_serializing_if = "Option::is_none", default)]
    pub include: Option<IncludeExcludeParam>,
    /// Exclude terms by either regex (single string) or exact values (array).
    #[serde(skip_serializing_if = "Option::is_none", default)]
    pub exclude: Option<IncludeExcludeParam>,
}

/// Same as TermsAggregation, but with populated defaults.
///
/// Note that the `include` and `exclude` parameters of the request are not carried over
/// into this struct.
#[derive(Clone, Debug, PartialEq)]
pub struct TermsAggregationInternal {
    /// The field to aggregate on.
    pub field: String,
    /// By default, the top 10 terms with the most documents are returned.
    /// Larger values for size are more expensive.
    ///
    /// Defaults to 10.
    pub size: u32,

    /// If you set the `show_term_doc_count_error` parameter to true, the terms aggregation will
    /// include doc_count_error_upper_bound, which is an upper bound to the error on the
    /// doc_count returned by each shard. It’s the sum of the size of the largest bucket on
    /// each segment that didn’t fit into `segment_size`.
    pub show_term_doc_count_error: bool,

    /// To get more accurate results, we fetch more than `size` from each segment.
    ///
    /// Increasing this value will increase the cost in exchange for more accuracy.
    pub segment_size: u32,

    /// Filter all terms that are lower than `min_doc_count`. Defaults to 1.
    ///
    /// *Expensive*: When set to 0, this will return all terms in the field.
    pub min_doc_count: u64,

    /// Set the order. `String` is here a target, which is either "_count", "_key", or the name of
    /// a metric sub_aggregation.
    pub order: CustomOrder,

    /// The missing parameter defines how documents that are missing a value should be treated.
    pub missing: Option<Key>,
}

impl TermsAggregationInternal {
    /// Builds the normalized request from a user-provided [`TermsAggregation`], populating
    /// every unset parameter with its default:
    ///
    /// - `size` defaults to 10.
    /// - `segment_size` defaults to `10 * size` (saturating at `u32::MAX`) and is always
    ///   raised to at least `size`.
    /// - `order` defaults to `CustomOrder::default()`.
    /// - `show_term_doc_count_error` defaults to `true` if and only if the resolved order is
    ///   the default order.
    /// - `min_doc_count` defaults to 1.
    pub(crate) fn from_req(req: &TermsAggregation) -> Self {
        let size = req.size.unwrap_or(10);

        // `size` comes straight from the request: a plain `size * 10` would overflow for
        // large values (panic in debug builds, wrap-around in release builds). The default
        // is also computed lazily so that it is skipped when `segment_size` is provided.
        let segment_size = req
            .segment_size
            .unwrap_or_else(|| size.saturating_mul(10))
            .max(size);

        let order = req.order.clone().unwrap_or_default();
        let show_term_doc_count_error = req
            .show_term_doc_count_error
            .unwrap_or_else(|| order == CustomOrder::default());

        TermsAggregationInternal {
            field: req.field.clone(),
            size,
            segment_size,
            show_term_doc_count_error,
            min_doc_count: req.min_doc_count.unwrap_or(1),
            order,
            missing: req.missing.clone(),
        }
    }
}

/// The threshold on the maximum term id below which a Vec-backed bucket storage is used.
/// TODO: Benchmark to validate the threshold
pub const MAX_NUM_TERMS_FOR_VEC: u64 = 100;

/// Build a concrete `SegmentTermCollector` with either a Vec-, paged- or HashMap-backed
/// bucket storage, depending on the maximum term id, the presence of sub-aggregations and
/// the aggregation level.
///
/// # Errors
///
/// Returns `TantivyError::InvalidArgument` if the column type is `ColumnType::Bytes`, or if
/// the request orders by a sub-aggregation that cannot be found among the children of `node`.
/// Errors from building the sub-aggregation collectors are propagated.
pub(crate) fn build_segment_term_collector(
    req_data: &mut AggregationsSegmentCtx,
    node: &AggRefNode,
) -> crate::Result<Box<dyn SegmentAggregationCollector>> {
    // Cloned so that `req_data` can be borrowed mutably again further down.
    let terms_req_data = req_data.get_term_req_data(node.idx_in_req_data).clone();
    let column_type = terms_req_data.column_type;

    if column_type == ColumnType::Bytes {
        return Err(TantivyError::InvalidArgument(format!(
            "terms aggregation is not supported for column type {column_type:?}"
        )));
    }

    // Validate sub aggregation exists when ordering by sub-aggregation.
    {
        if let OrderTarget::SubAggregation(sub_agg_name) = &terms_req_data.req.order.target {
            let (agg_name, _agg_property) = get_agg_name_and_property(sub_agg_name);

            node.get_sub_agg(agg_name, &req_data.per_request)
                .ok_or_else(|| {
                    TantivyError::InvalidArgument(format!(
                        "could not find aggregation with name {agg_name} in metric \
                         sub_aggregations"
                    ))
                })?;
        }
    }

    // Whether this node has child aggregations to collect per bucket.
    let has_sub_aggregations = !node.children.is_empty();

    // TODO: A better metric instead of is_top_level would be the number of buckets expected.
    // E.g. If term agg is not top level, but the parent is a bucket agg with less than 10 buckets,
    // we can still use Vec.
    let is_top_level = terms_req_data.is_top_level;

    // Let's see if we can use a vec to aggregate our data
    // instead of a hashmap.
    // The largest term id to expect is the column maximum, or the missing value if that one
    // is larger.
    let col_max_value = terms_req_data.accessor.max_value();
    let max_term_id: u64 =
        col_max_value.max(terms_req_data.missing_value_for_accessor.unwrap_or(0u64));

    // Build the sub-aggregation collector if there are children.
    let sub_agg_collector = if has_sub_aggregations {
        Some(build_segment_agg_collectors(req_data, &node.children)?)
    } else {
        None
    };

    let mut bucket_id_provider = BucketIdProvider::default();
    // Decide which bucket storage is best suited for this aggregation.
    // The dense storages are created with `max_term_id + 1` so that `max_term_id` itself is
    // a valid slot.
    if is_top_level && max_term_id < MAX_NUM_TERMS_FOR_VEC && !has_sub_aggregations {
        // Few terms and no sub-aggregations: plain vector of counts.
        let term_buckets = VecTermBucketsNoAgg::new(max_term_id + 1, &mut bucket_id_provider);
        let collector: SegmentTermCollector<_, HighCardSubAggCache> = SegmentTermCollector {
            parent_buckets: vec![term_buckets],
            sub_agg: None,
            bucket_id_provider,
            max_term_id,
            terms_req_data,
        };
        Ok(Box::new(collector))
    } else if is_top_level && max_term_id < MAX_NUM_TERMS_FOR_VEC {
        // Few terms with sub-aggregations: vector of buckets and the low cardinality cache.
        let term_buckets = VecTermBuckets::new(max_term_id + 1, &mut bucket_id_provider);
        let sub_agg = sub_agg_collector.map(LowCardCachedSubAggs::new);
        let collector: SegmentTermCollector<_, LowCardSubAggCache> = SegmentTermCollector {
            parent_buckets: vec![term_buckets],
            sub_agg,
            bucket_id_provider,
            max_term_id,
            terms_req_data,
        };
        Ok(Box::new(collector))
    } else if max_term_id < 8_000_000 && is_top_level {
        // Moderate number of terms: paged storage.
        // NOTE(review): the 8_000_000 limit is not explained here — presumably it bounds the
        // size of the page directory; confirm.
        let term_buckets: PagedTermMap =
            PagedTermMap::new(max_term_id + 1, &mut bucket_id_provider);
        // Build sub-aggregation blueprint (flat pairs)
        let sub_agg = sub_agg_collector.map(CachedSubAggs::new);
        let collector: SegmentTermCollector<PagedTermMap, HighCardSubAggCache> =
            SegmentTermCollector {
                parent_buckets: vec![term_buckets],
                sub_agg,
                bucket_id_provider,
                max_term_id,
                terms_req_data,
            };
        Ok(Box::new(collector))
    } else {
        // Fallback (nested aggregation or very large term ids): hash map storage.
        let term_buckets: HashMapTermBuckets = HashMapTermBuckets::default();
        // Build sub-aggregation blueprint (flat pairs)
        let sub_agg = sub_agg_collector.map(CachedSubAggs::new);
        let collector: SegmentTermCollector<HashMapTermBuckets, HighCardSubAggCache> =
            SegmentTermCollector {
                parent_buckets: vec![term_buckets],
                sub_agg,
                bucket_id_provider,
                max_term_id,
                terms_req_data,
            };
        Ok(Box::new(collector))
    }
}

/// Per-term aggregation state: an occurrence counter and the id of the associated bucket.
#[derive(Debug, Clone, Copy, Default)]
struct Bucket {
    /// Number of times the term was seen.
    pub count: u32,
    /// Id handed out by the `BucketIdProvider` for this term.
    pub bucket_id: BucketId,
}

impl Bucket {
    #[inline(always)]
    fn new(bucket_id: BucketId) -> Self {
        Self {
            count: 0,
            bucket_id,
        }
    }
}

/// Abstraction over the storage used for term buckets (counts only).
///
/// Implementations map a term id to a [`Bucket`], i.e. an occurrence count and a bucket id.
trait TermAggregationMap: Clone + Debug + 'static {
    /// Create a new instance with a strict upper bound on term ids.
    ///
    /// Implementations that do not need the bound or the bucket id provider ignore them.
    fn new(max_term_id: u64, bucket_id_provider: &mut BucketIdProvider) -> Self;

    /// Estimate the memory consumption of this struct in bytes.
    fn get_memory_consumption(&self) -> usize;

    /// Increments the count and returns the bucket_id associated to a given term_id.
    fn term_entry(&mut self, term_id: u64, bucket_id_provider: &mut BucketIdProvider) -> BucketId;

    /// Returns the term aggregation as a vector of (term_id, bucket) pairs,
    /// in any order.
    fn into_vec(self) -> Vec<(u64, Bucket)>;
}

#[derive(Clone, Debug)]
struct HashMapTermBuckets {
    bucket_map: FxHashMap<u64, Bucket>,
}

impl Default for HashMapTermBuckets {
    #[inline(always)]
    fn default() -> Self {
        Self {
            bucket_map: FxHashMap::default(),
        }
    }
}

/// Number of low bits of a term id that select the slot within a page.
const PAGE_SHIFT: usize = 10;
/// Number of term slots per page.
const PAGE_SIZE: usize = 1 << PAGE_SHIFT; // 1024
/// Mask extracting the in-page offset from a term id.
const PAGE_MASK: usize = PAGE_SIZE - 1;
/// Number of 64-slot presence words needed to cover one page.
const BITMASK_LEN: usize = PAGE_SIZE / 64;

/// One page of a `PagedTermMap`: `PAGE_SIZE` bucket slots plus a bitmask telling which of
/// them are in use.
#[derive(Clone, Debug)]
struct Page {
    /// Bitmask indicating which offsets are present.
    /// It is chunked into TinySet words.
    presence: [TinySet; BITMASK_LEN],
    /// Bucket slots, indexed by offset. A slot is only meaningful if its presence bit is set.
    data: [Bucket; PAGE_SIZE],
}

impl Page {
    fn new() -> Self {
        Self {
            presence: [TinySet::empty(); BITMASK_LEN],
            data: [Bucket::default(); PAGE_SIZE],
        }
    }

    #[inline]
    fn is_set(&self, offset: usize) -> bool {
        let bucket_idx = offset / 64;
        let bit_idx = offset % 64;
        self.presence[bucket_idx].contains(bit_idx as u32)
    }

    #[inline]
    fn set_present(&mut self, offset: usize) {
        let bucket_idx = offset / 64;
        let bit_idx = offset % 64;
        self.presence[bucket_idx].insert_mut(bit_idx as u32);
    }

    // Flattened iteration logic
    fn collect_items(&self, base_term_id: u64, result: &mut Vec<(u64, Bucket)>) {
        for (bucket_pos, &tiny_set) in self.presence.iter().enumerate() {
            let base_offset = bucket_pos * 64;

            for bit in tiny_set.into_iter() {
                let offset = base_offset + bit as usize;
                result.push((base_term_id + offset as u64, self.data[offset]));
            }
        }
    }
}

/// A paged term map implementation for moderately sized term id sets.
/// Uses a fixed size vector of pages, each page containing a fixed size array of buckets.
///
/// Each page covers a range of term ids. Pages are allocated on demand.
/// This implementation is more memory efficient than a full Vec for high cardinality term id
/// sets.
///
/// It has a fixed cost of `num_pages * 8 bytes` for the page directory.
/// For 1 million terms, this is 8 * 1024 = 8KB.
///
/// Note that for nested aggregations we create one TermAggregationMap per parent bucket.
/// For example, with 100 parent buckets and 1 million terms, this is 800KB overhead for the page
/// directories only. Therefore, this implementation is only enabled for top-level aggregations.
/// TODO: pass expected number of buckets from parent instead of strict is_top_level flag.
#[derive(Clone, Debug, Default)]
struct PagedTermMap {
    // Fixed size vector based on max_term_id
    pages: Vec<Option<Box<Page>>>,
    // Running estimate in bytes: the page directory plus every page allocated so far.
    mem_usage: usize,
}

impl PagedTermMap {}

impl TermAggregationMap for PagedTermMap {
    /// Initialize with a strict upper bound.
    /// Inserting a term id whose page lies beyond the page of `max_term_id` panics.
    fn new(max_term_id: u64, _bucket_id_provider: &mut BucketIdProvider) -> Self {
        let num_pages = ((max_term_id as usize) >> PAGE_SHIFT) + 1;

        // Pre-allocate the directory (pointers only, not the heavy pages)
        // Memory cost: num_pages * 8 bytes
        let pages: Vec<Option<Box<Page>>> = vec![None; num_pages];
        let mem_usage = pages.capacity() * std::mem::size_of::<Option<Box<Page>>>();

        Self { pages, mem_usage }
    }

    /// Returns the tracked heap usage plus the size of the struct itself.
    #[inline]
    fn get_memory_consumption(&self) -> usize {
        std::mem::size_of::<Self>() + self.mem_usage
    }

    /// Counts one occurrence of `term_id` and returns its bucket id, allocating the page
    /// and a fresh bucket id on first use.
    #[inline]
    fn term_entry(&mut self, term_id: u64, bucket_id_provider: &mut BucketIdProvider) -> BucketId {
        let term_idx = term_id as usize;
        let page_idx = term_idx >> PAGE_SHIFT;
        let offset = term_idx & PAGE_MASK;

        // Indexing panics if the page index is outside of the directory.
        let slot = &mut self.pages[page_idx];
        if slot.is_none() {
            // Account for the page that is about to be allocated.
            self.mem_usage += std::mem::size_of::<Page>();
        }
        let page = slot.get_or_insert_with(|| Box::new(Page::new()));

        if !page.is_set(offset) {
            // First occurrence of this term: hand out a new bucket id.
            let new_id = bucket_id_provider.next_bucket_id();
            page.data[offset] = Bucket {
                count: 1,
                bucket_id: new_id,
            };
            page.set_present(offset);
            return new_id;
        }

        let bucket = &mut page.data[offset];
        bucket.count += 1;
        bucket.bucket_id
    }

    /// Flattens all present slots of all allocated pages into `(term_id, bucket)` pairs.
    fn into_vec(self) -> Vec<(u64, Bucket)> {
        // estimate 16 entries per non-empty page
        let allocated_pages = self.pages.iter().flatten().count();
        let mut items = Vec::with_capacity(allocated_pages * 16);

        let allocated = self
            .pages
            .into_iter()
            .enumerate()
            .filter_map(|(page_idx, page)| Some((page_idx, page?)));
        for (page_idx, page) in allocated {
            let base_term_id = (page_idx << PAGE_SHIFT) as u64;
            page.collect_items(base_term_id, &mut items);
        }
        items
    }
}

impl TermAggregationMap for HashMapTermBuckets {
    #[inline]
    fn get_memory_consumption(&self) -> usize {
        self.bucket_map.memory_consumption()
    }

    #[inline(always)]
    fn term_entry(&mut self, term_id: u64, bucket_id_provider: &mut BucketIdProvider) -> BucketId {
        let bucket = self
            .bucket_map
            .entry(term_id)
            .or_insert_with(|| Bucket::new(bucket_id_provider.next_bucket_id()));
        bucket.count += 1;
        bucket.bucket_id
    }

    fn into_vec(self) -> Vec<(u64, Bucket)> {
        self.bucket_map.into_iter().collect()
    }

    #[inline]
    fn new(_max_term_id: u64, _bucket_id_provider: &mut BucketIdProvider) -> Self {
        Self::default()
    }
}

/// An optimized term map implementation for a compact set of term ordinals.
///
/// Only counts are stored: this variant does not track bucket ids and is meant for
/// aggregations without sub-aggregations.
#[derive(Clone, Debug)]
struct VecTermBucketsNoAgg {
    /// Occurrence count per term id; the term id is the index.
    buckets: Vec<u32>,
}

impl TermAggregationMap for VecTermBucketsNoAgg {
    /// Estimate the memory consumption of this struct in bytes.
    fn get_memory_consumption(&self) -> usize {
        // `std::mem::size_of::<Self>()` is deliberately not included:
        // it is already measured by the parent aggregation.
        self.buckets.capacity() * std::mem::size_of::<u32>()
    }

    /// Add an occurrence of the given term id.
    ///
    /// The returned bucket id is always `0`: this map has no sub-aggregations, so the id is
    /// never used.
    #[inline(always)]
    fn term_entry(&mut self, term_id: u64, _bucket_id_provider: &mut BucketIdProvider) -> BucketId {
        let term_id_usize = term_id as usize;
        debug_assert!(
            term_id_usize < self.buckets.len(),
            "term_id {} out of bounds for VecTermBucketsNoAgg (len={})",
            term_id,
            self.buckets.len()
        );
        // SAFETY: soundness relies on callers only passing term ids strictly below the
        // `num_terms` this map was created with. The assertion above verifies that in debug
        // builds only; release builds perform no bounds check here.
        let count = unsafe { self.buckets.get_unchecked_mut(term_id_usize) };
        *count += 1;
        0 // unused
    }

    /// Consumes the map and returns one `(term_id, bucket)` pair per term id that was seen at
    /// least once, in ascending term id order.
    fn into_vec(self) -> Vec<(u64, Bucket)> {
        self.buckets
            .into_iter()
            .enumerate()
            .filter(|(_term_id, count)| *count > 0)
            .map(|(term_id, count)| {
                (
                    term_id as u64,
                    Bucket {
                        count,
                        bucket_id: 0, // unused, there are no sub-aggregations
                    },
                )
            })
            .collect()
    }

    /// Creates a map with `num_terms` zeroed counters (valid term ids are `0..num_terms`).
    fn new(num_terms: u64, _bucket_id_provider: &mut BucketIdProvider) -> Self {
        Self {
            buckets: vec![0; num_terms as usize],
        }
    }
}

/// An optimized term map implementation for a compact set of term ordinals.
///
/// Unlike the count-only variant, every slot holds a full `Bucket` (count plus bucket id).
#[derive(Clone, Debug)]
struct VecTermBuckets {
    /// One bucket per term id; the vector index is the term id.
    buckets: Vec<Bucket>,
}

impl TermAggregationMap for VecTermBuckets {
    /// Estimate the memory consumption of this struct in bytes.
    fn get_memory_consumption(&self) -> usize {
        // `std::mem::size_of::<Self>()` is left out on purpose: the parent aggregation already
        // measures it. The root aggregation's own size is not measured, which is acceptable.
        std::mem::size_of::<Bucket>() * self.buckets.capacity()
    }

    /// Add an occurrence of the given term id and return the bucket id of its slot.
    #[inline(always)]
    fn term_entry(&mut self, term_id: u64, _bucket_id_provider: &mut BucketIdProvider) -> BucketId {
        let slot_idx = term_id as usize;
        debug_assert!(
            slot_idx < self.buckets.len(),
            "term_id {} out of bounds for VecTermBuckets (len={})",
            term_id,
            self.buckets.len()
        );
        // SAFETY: relies on callers only passing term ids below the `num_terms` given to
        // `new`; this is asserted in debug builds only.
        let slot = unsafe { self.buckets.get_unchecked_mut(slot_idx) };
        slot.count += 1;
        slot.bucket_id
    }

    /// Consumes the map and returns the buckets that were hit at least once, keyed by term id
    /// in ascending order.
    fn into_vec(self) -> Vec<(u64, Bucket)> {
        self.buckets
            .into_iter()
            .enumerate()
            .filter_map(|(ord, bucket)| (bucket.count > 0).then(|| (ord as u64, bucket)))
            .collect()
    }

    /// Creates `num_terms` buckets up front, drawing one bucket id per slot from the provider
    /// in ascending term id order.
    fn new(num_terms: u64, bucket_id_provider: &mut BucketIdProvider) -> Self {
        let buckets = (0..num_terms as usize)
            .map(|_| Bucket::new(bucket_id_provider.next_bucket_id()))
            .collect();
        VecTermBuckets { buckets }
    }
}

/// The collector puts values from the fast field into the correct buckets and does a conversion to
/// the correct datatype.
///
/// `TermMap` selects the term-id-to-bucket storage strategy; `C` selects the cache used for
/// sub-aggregations.
#[derive(Debug)]
struct SegmentTermCollector<TermMap: TermAggregationMap, C: SubAggCache> {
    /// The buckets containing the aggregation data.
    /// One term map per parent bucket, indexed by the parent bucket id.
    parent_buckets: Vec<TermMap>,
    /// Cached sub-aggregation collectors; `None` when the request has no sub-aggregations.
    sub_agg: Option<CachedSubAggs<C>>,
    /// Source of bucket ids handed to the term maps.
    bucket_id_provider: BucketIdProvider,
    /// Upper bound passed to `TermMap::new` whenever a new parent bucket is created.
    max_term_id: u64,
    /// Request data for this terms aggregation (column accessor, missing value, filters, ...).
    terms_req_data: TermsAggReqData,
}

/// Splits an aggregation path at its first `.` into `(agg_name, agg_property)`.
///
/// When `name` contains no `.`, the whole input is the aggregation name and the property is
/// the empty string.
pub(crate) fn get_agg_name_and_property(name: &str) -> (&str, &str) {
    match name.find('.') {
        // '.' is a single byte, so skipping one byte lands right after the separator.
        Some(dot_pos) => (&name[..dot_pos], &name[dot_pos + 1..]),
        None => (name, ""),
    }
}

impl<TermMap: TermAggregationMap, C: SubAggCache> SegmentAggregationCollector
    for SegmentTermCollector<TermMap, C>
{
    /// Converts the term map of parent bucket `bucket` into an intermediate terms result and
    /// pushes it into `results` under this aggregation's name.
    ///
    /// The term map is moved out of `parent_buckets` and replaced by a map created with
    /// `TermMap::new(0, ..)`.
    fn add_intermediate_aggregation_result(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
        results: &mut IntermediateAggregationResults,
        bucket: BucketId,
    ) -> crate::Result<()> {
        // TODO: avoid prepare_max_bucket here and handle empty buckets.
        // Makes sure `parent_buckets[bucket]` exists before it is indexed below.
        self.prepare_max_bucket(bucket, agg_data)?;
        // Take ownership of the term map, leaving a placeholder in its slot.
        let bucket = std::mem::replace(
            &mut self.parent_buckets[bucket as usize],
            TermMap::new(0, &mut self.bucket_id_provider),
        );
        let term_req = &self.terms_req_data;
        let name = term_req.name.clone();

        let bucket =
            Self::into_intermediate_bucket_result(term_req, &mut self.sub_agg, bucket, agg_data)?;
        results.push(name, IntermediateAggregationResult::Bucket(bucket))?;
        Ok(())
    }

    /// Collects a block of documents into the term map of `parent_bucket_id`.
    ///
    /// Fetches the column values for `docs` (substituting the configured missing value),
    /// applies the optional allowed-term filter, updates the term counts and, when
    /// sub-aggregations exist, forwards each `(bucket_id, doc)` pair to them. Any growth in
    /// term map memory is reported to the aggregation limits, which may return an error.
    #[inline]
    fn collect(
        &mut self,
        parent_bucket_id: BucketId,
        docs: &[crate::DocId],
        agg_data: &mut AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        // Snapshot so that only the memory added by this call is charged below.
        let mem_pre = self.get_memory_consumption();

        let req_data = &mut self.terms_req_data;

        agg_data.column_block_accessor.fetch_block_with_missing(
            docs,
            &req_data.accessor,
            req_data.missing_value_for_accessor,
        );

        if let Some(sub_agg) = &mut self.sub_agg {
            // With sub-aggregations the doc id is needed alongside each term id.
            let term_buckets = &mut self.parent_buckets[parent_bucket_id as usize];
            let it = agg_data
                .column_block_accessor
                .iter_docid_vals(docs, &req_data.accessor);
            if let Some(allowed_bs) = req_data.allowed_term_ids.as_ref() {
                // Only term ids present in the allowed set are counted.
                let it = it.filter(move |&(_doc, term_id)| allowed_bs.contains(term_id as u32));
                Self::collect_terms_with_docs(
                    it,
                    term_buckets,
                    &mut self.bucket_id_provider,
                    sub_agg,
                );
            } else {
                Self::collect_terms_with_docs(
                    it,
                    term_buckets,
                    &mut self.bucket_id_provider,
                    sub_agg,
                );
            }
        } else {
            // Without sub-aggregations only the values themselves are iterated.
            let term_buckets = &mut self.parent_buckets[parent_bucket_id as usize];
            let it = agg_data.column_block_accessor.iter_vals();
            if let Some(allowed_bs) = req_data.allowed_term_ids.as_ref() {
                let it = it.filter(move |&term_id| allowed_bs.contains(term_id as u32));
                Self::collect_terms(it, term_buckets, &mut self.bucket_id_provider);
            } else {
                Self::collect_terms(it, term_buckets, &mut self.bucket_id_provider);
            }
        }

        // NOTE(review): this unsigned subtraction assumes the term maps never shrink while
        // collecting — confirm for every `TermAggregationMap` implementation.
        let mem_delta = self.get_memory_consumption() - mem_pre;
        if mem_delta > 0 {
            agg_data
                .context
                .limits
                .add_memory_consumed(mem_delta as u64)?;
        }
        if let Some(sub_agg) = &mut self.sub_agg {
            sub_agg.check_flush_local(agg_data)?;
        }

        Ok(())
    }

    /// Flushes the cached sub-aggregations, if there are any.
    #[inline]
    fn flush(&mut self, agg_data: &mut AggregationsSegmentCtx) -> crate::Result<()> {
        if let Some(sub_agg) = &mut self.sub_agg {
            sub_agg.flush(agg_data)?;
        }
        Ok(())
    }

    /// Grows `parent_buckets` until index `max_bucket` is valid, creating each new term map
    /// with `max_term_id` as its bound.
    fn prepare_max_bucket(
        &mut self,
        max_bucket: BucketId,
        _agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        while self.parent_buckets.len() <= max_bucket as usize {
            let term_buckets: TermMap =
                TermMap::new(self.max_term_id, &mut self.bucket_id_provider);
            self.parent_buckets.push(term_buckets);
        }
        Ok(())
    }
}

/// Missing values are represented as a sentinel value in the column.
///
/// This function removes the entry whose term id equals that sentinel from `entries`,
/// builds the intermediate key from the request's `missing` setting, and returns the key
/// together with the removed bucket.
///
/// Returns `None` when no sentinel is configured, when no entry carries the sentinel, or
/// when the request has no `missing` key. The removal uses `swap_remove`, so the order of
/// `entries` is not preserved.
fn extract_missing_value<T>(
    entries: &mut Vec<(u64, T)>,
    term_req: &TermsAggReqData,
) -> Option<(IntermediateKey, T)> {
    let sentinel = term_req.missing_value_for_accessor?;
    let sentinel_pos = entries.iter().position(|entry| entry.0 == sentinel)?;
    let bucket = entries.swap_remove(sentinel_pos).1;

    let key = match term_req.req.missing.as_ref()? {
        Key::Str(text) => IntermediateKey::Str(text.clone()),
        Key::F64(num) => IntermediateKey::F64(*num),
        Key::U64(num) => IntermediateKey::U64(*num),
        Key::I64(num) => IntermediateKey::I64(*num),
    };
    Some((key, bucket))
}

impl<TermMap, C> SegmentTermCollector<TermMap, C>
where
    TermMap: TermAggregationMap,
    C: SubAggCache,
{
    /// Sums the memory consumption reported by the term map of every parent bucket.
    fn get_memory_consumption(&self) -> usize {
        self.parent_buckets
            .iter()
            .map(|b| b.get_memory_consumption())
            .sum()
    }

    /// Converts one term map into an `IntermediateBucketResult::Terms`.
    ///
    /// Steps:
    /// 1. Flatten the map into `(term_id, bucket)` entries and sort them according to the
    ///    requested order (entries ordered by a sub-aggregation are left unsorted).
    /// 2. Unless ordering by a sub-aggregation, cut the entries off at `segment_size`.
    /// 3. Translate each term id into an `IntermediateKey` according to the column type and
    ///    attach the sub-aggregation results of its bucket.
    ///
    /// # Errors
    ///
    /// Propagates errors from the sub-aggregation collectors, the term dictionary and date
    /// formatting. Also fails when a dictionary term is not valid UTF-8, or when the `IpAddr`
    /// column accessor is not a `CompactSpaceU64Accessor`.
    #[inline]
    pub(crate) fn into_intermediate_bucket_result(
        term_req: &TermsAggReqData,
        sub_agg: &mut Option<CachedSubAggs<C>>,
        term_buckets: TermMap,
        agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<IntermediateBucketResult> {
        let mut entries: Vec<(u64, Bucket)> = term_buckets.into_vec();

        let order_by_sub_aggregation =
            matches!(term_req.req.order.target, OrderTarget::SubAggregation(_));

        match &term_req.req.order.target {
            OrderTarget::Key => {
                // We rely on the fact, that term ordinals match the order of the strings
                // TODO: We could have a special collector, that keeps only TOP n results at any
                // time.
                if term_req.req.order.order == Order::Desc {
                    entries.sort_unstable_by_key(|bucket| std::cmp::Reverse(bucket.0));
                } else {
                    entries.sort_unstable_by_key(|bucket| bucket.0);
                }
            }
            OrderTarget::SubAggregation(_name) => {
                // don't sort and cut off since it's hard to make assumptions on the quality of the
                // results when cutting off due to unknown nature of the sub_aggregation (possible
                // to check).
            }
            OrderTarget::Count => {
                if term_req.req.order.order == Order::Desc {
                    entries.sort_unstable_by_key(|bucket| std::cmp::Reverse(bucket.1.count));
                } else {
                    entries.sort_unstable_by_key(|bucket| bucket.1.count);
                }
            }
        }

        let (term_doc_count_before_cutoff, sum_other_doc_count) = if order_by_sub_aggregation {
            (0, 0)
        } else {
            cut_off_buckets(&mut entries, term_req.req.segment_size as usize)
        };

        let mut dict: FxHashMap<IntermediateKey, IntermediateTermBucketEntry> = Default::default();
        dict.reserve(entries.len());

        // Builds the intermediate entry for one bucket, pulling the sub-aggregation results
        // registered under the bucket's id when sub-aggregations exist.
        let into_intermediate_bucket_entry =
            |bucket: Bucket,
             sub_agg: &mut Option<CachedSubAggs<C>>|
             -> crate::Result<IntermediateTermBucketEntry> {
                if let Some(sub_agg) = sub_agg {
                    let mut sub_aggregation_res = IntermediateAggregationResults::default();
                    sub_agg
                        .get_sub_agg_collector()
                        .add_intermediate_aggregation_result(
                            agg_data,
                            &mut sub_aggregation_res,
                            bucket.bucket_id,
                        )?;
                    Ok(IntermediateTermBucketEntry {
                        doc_count: bucket.count,
                        sub_aggregation: sub_aggregation_res,
                    })
                } else {
                    Ok(IntermediateTermBucketEntry {
                        doc_count: bucket.count,
                        sub_aggregation: Default::default(),
                    })
                }
            };

        if term_req.column_type == ColumnType::Str {
            let fallback_dict = Dictionary::empty();
            let term_dict = term_req
                .str_dict_column
                .as_ref()
                .map(|el| el.dictionary())
                .unwrap_or_else(|| &fallback_dict);

            // The missing-value sentinel is not a dictionary ordinal, so it is pulled out of
            // `entries` before the ordinals are resolved against the dictionary.
            if let Some((intermediate_key, bucket)) = extract_missing_value(&mut entries, term_req)
            {
                let intermediate_entry = into_intermediate_bucket_entry(bucket, sub_agg)?;
                dict.insert(intermediate_key, intermediate_entry);
            }

            // Sort by term ord
            entries.sort_unstable_by_key(|bucket| bucket.0);

            let (term_ids, buckets): (Vec<u64>, Vec<Bucket>) = entries.into_iter().unzip();
            let mut buckets_it = buckets.into_iter();

            term_dict.sorted_ords_to_term_cb(term_ids.into_iter(), |term| {
                // The callback is expected to fire once per ordinal, in the same order as
                // `term_ids`, so the buckets iterator stays aligned with the terms.
                let bucket = buckets_it.next().unwrap();
                let intermediate_entry =
                    into_intermediate_bucket_entry(bucket, sub_agg).map_err(io::Error::other)?;
                // Report invalid UTF-8 as an error instead of panicking, in line with the
                // `min_doc_count == 0` path below.
                let term_str = String::from_utf8(term.to_vec())
                    .map_err(|utf8_err| io::Error::new(io::ErrorKind::InvalidData, utf8_err))?;
                dict.insert(IntermediateKey::Str(term_str), intermediate_entry);
                Ok(())
            })?;

            if term_req.req.min_doc_count == 0 {
                // Terms without any hit must also be reported: fill up with zero-count
                // entries from the dictionary until `segment_size` entries are reached.
                // TODO: Handle rev streaming for descending sorting by keys
                let mut stream = term_dict.stream()?;
                let empty_sub_aggregation =
                    IntermediateAggregationResults::empty_from_req(&term_req.sug_aggregations);
                while stream.advance() {
                    if dict.len() >= term_req.req.segment_size as usize {
                        break;
                    }

                    // Respect allowed filters if present
                    if let Some(allowed_bs) = term_req.allowed_term_ids.as_ref() {
                        if !allowed_bs.contains(stream.term_ord() as u32) {
                            continue;
                        }
                    }

                    let key = IntermediateKey::Str(
                        std::str::from_utf8(stream.key())
                            .map_err(|utf8_err| DataCorruption::comment_only(utf8_err.to_string()))?
                            .to_string(),
                    );

                    // Existing entries (terms that did get hits) are left untouched.
                    dict.entry(key)
                        .or_insert_with(|| IntermediateTermBucketEntry {
                            doc_count: 0,
                            sub_aggregation: empty_sub_aggregation.clone(),
                        });
                }
            }
        } else if term_req.column_type == ColumnType::DateTime {
            for (val, bucket) in entries {
                let intermediate_entry = into_intermediate_bucket_entry(bucket, sub_agg)?;
                let val = i64::from_u64(val);
                let date = format_date(val)?;
                dict.insert(IntermediateKey::Str(date), intermediate_entry);
            }
        } else if term_req.column_type == ColumnType::Bool {
            for (val, bucket) in entries {
                let intermediate_entry = into_intermediate_bucket_entry(bucket, sub_agg)?;
                let val = bool::from_u64(val);
                dict.insert(IntermediateKey::Bool(val), intermediate_entry);
            }
        } else if term_req.column_type == ColumnType::IpAddr {
            let compact_space_accessor = term_req
                .accessor
                .values
                .clone()
                .downcast_arc::<CompactSpaceU64Accessor>()
                .map_err(|_| {
                    TantivyError::AggregationError(
                        crate::aggregation::AggregationError::InternalError(
                            "Type mismatch: Could not downcast to CompactSpaceU64Accessor"
                                .to_string(),
                        ),
                    )
                })?;

            for (val, bucket) in entries {
                let intermediate_entry = into_intermediate_bucket_entry(bucket, sub_agg)?;
                // Collected values are compact-space codes; map them back to the u128 address.
                let val: u128 = compact_space_accessor.compact_to_u128(val as u32);
                let val = Ipv6Addr::from_u128(val);
                dict.insert(IntermediateKey::IpAddr(val), intermediate_entry);
            }
        } else {
            for (val, bucket) in entries {
                let intermediate_entry = into_intermediate_bucket_entry(bucket, sub_agg)?;
                if term_req.column_type == ColumnType::U64 {
                    dict.insert(IntermediateKey::U64(val), intermediate_entry);
                } else if term_req.column_type == ColumnType::I64 {
                    dict.insert(IntermediateKey::I64(i64::from_u64(val)), intermediate_entry);
                } else {
                    // Remaining column types are decoded as f64 and normalized, so the key
                    // variant follows whatever `normalize` returns.
                    let val = f64::from_u64(val);
                    let val: NumericalValue = val.into();

                    match val.normalize() {
                        NumericalValue::U64(val) => {
                            dict.insert(IntermediateKey::U64(val), intermediate_entry);
                        }
                        NumericalValue::I64(val) => {
                            dict.insert(IntermediateKey::I64(val), intermediate_entry);
                        }
                        NumericalValue::F64(val) => {
                            dict.insert(IntermediateKey::F64(val), intermediate_entry);
                        }
                    }
                };
            }
        };

        Ok(IntermediateBucketResult::Terms {
            buckets: IntermediateTermBucketResult {
                entries: dict,
                sum_other_doc_count,
                doc_count_error_upper_bound: term_doc_count_before_cutoff,
            },
        })
    }
}

impl<TermMap: TermAggregationMap, C: SubAggCache> SegmentTermCollector<TermMap, C> {
    /// Registers every `(doc, term_id)` pair: the term is counted in `term_buckets` and the
    /// document is pushed to the sub-aggregations under the bucket id of that term.
    #[inline]
    fn collect_terms_with_docs(
        iter: impl Iterator<Item = (crate::DocId, u64)>,
        term_buckets: &mut TermMap,
        bucket_id_provider: &mut BucketIdProvider,
        sub_agg: &mut CachedSubAggs<C>,
    ) {
        iter.for_each(|(doc, term_id)| {
            let target_bucket = term_buckets.term_entry(term_id, bucket_id_provider);
            sub_agg.push(target_bucket, doc);
        });
    }

    /// Counts every term id in `term_buckets`; the returned bucket ids are not needed because
    /// there are no sub-aggregations to feed.
    #[inline]
    fn collect_terms(
        iter: impl Iterator<Item = u64>,
        term_buckets: &mut TermMap,
        bucket_id_provider: &mut BucketIdProvider,
    ) {
        iter.for_each(|term_id| {
            term_buckets.term_entry(term_id, bucket_id_provider);
        });
    }
}

/// Access to the document count of a bucket-like entry.
///
/// Used as the bound of `cut_off_buckets`, which only needs the counts of the entries it drops.
pub(crate) trait GetDocCount {
    /// Number of documents in this entry.
    fn doc_count(&self) -> u64;
}

impl GetDocCount for (String, IntermediateTermBucketEntry) {
    /// Document count of the bucket entry (second tuple element), widened to `u64`.
    fn doc_count(&self) -> u64 {
        let (_key, entry) = self;
        u64::from(entry.doc_count)
    }
}

impl GetDocCount for (u64, Bucket) {
    /// Document count of the bucket (second tuple element), widened to `u64`.
    fn doc_count(&self) -> u64 {
        let (_term_id, bucket) = self;
        u64::from(bucket.count)
    }
}

/// Truncates `entries` to at most `num_elem` elements and reports what was dropped.
///
/// Returns `(term_doc_count_before_cutoff, sum_other_doc_count)`:
/// - the doc count of the first dropped entry (`0` if nothing is dropped),
/// - the sum of the doc counts of all dropped entries.
///
/// The entries are expected to be sorted already; this function does not reorder them.
pub(crate) fn cut_off_buckets<T: GetDocCount + Debug>(
    entries: &mut Vec<T>,
    num_elem: usize,
) -> (u64, u64) {
    // `get(num_elem..)` is `None` only when `num_elem` exceeds the length, in which case
    // nothing is cut off.
    let dropped = match entries.get(num_elem..) {
        Some(tail) => {
            let first_dropped_count = tail.first().map_or(0, |entry| entry.doc_count());
            let dropped_total = tail.iter().map(|entry| entry.doc_count()).sum::<u64>();
            (first_dropped_count, dropped_total)
        }
        None => (0, 0),
    };

    entries.truncate(num_elem);
    dropped
}

#[cfg(test)]
mod tests {
    use std::net::IpAddr;
    use std::str::FromStr;

    use common::DateTime;
    use time::{Date, Month};

    use super::{PagedTermMap, TermAggregationMap, PAGE_SIZE};
    use crate::aggregation::agg_req::Aggregations;
    use crate::aggregation::intermediate_agg_result::IntermediateAggregationResults;
    use crate::aggregation::segment_agg_result::BucketIdProvider;
    use crate::aggregation::tests::{
        exec_request, exec_request_with_query, exec_request_with_query_and_memory_limit,
        get_test_index_from_terms, get_test_index_from_values_and_terms,
    };
    use crate::aggregation::{AggregationLimitsGuard, DistributedAggregationCollector};
    use crate::indexer::NoMergePolicy;
    use crate::query::AllQuery;
    use crate::schema::{IntoIpv6Addr, Schema, FAST, STRING};
    use crate::{Index, IndexWriter};

    /// Inserting the same term id twice must return the same bucket id and bump its count,
    /// for term ids on the first page as well as on the second page.
    #[test]
    fn paged_term_map_reuses_buckets_and_counts() {
        let mut bucket_id_provider = BucketIdProvider::default();
        // Bound of two page sizes, so term ids up to `PAGE_SIZE + 7` are addressable.
        let mut map = PagedTermMap::new((PAGE_SIZE * 2) as u64, &mut bucket_id_provider);

        let bucket_first = map.term_entry(5, &mut bucket_id_provider);
        let bucket_second_page = map.term_entry((PAGE_SIZE + 7) as u64, &mut bucket_id_provider);

        // Reinsertions should increment counts and reuse bucket ids
        assert_eq!(map.term_entry(5, &mut bucket_id_provider), bucket_first);
        assert_eq!(
            map.term_entry((PAGE_SIZE + 7) as u64, &mut bucket_id_provider),
            bucket_second_page
        );

        // High offset exercises the TinySet presence word boundaries.
        let bucket_high_bit = map.term_entry(63, &mut bucket_id_provider);

        // Sort the output so the comparison does not depend on `into_vec`'s ordering.
        let mut entries = map.into_vec();
        entries.sort_by_key(|(term_id, _)| *term_id);

        // (term id, expected bucket id, expected count)
        let expected = vec![
            (5u64, bucket_first, 2u32),
            (63u64, bucket_high_bit, 1u32),
            ((PAGE_SIZE + 7) as u64, bucket_second_page, 2u32),
        ];

        assert_eq!(entries.len(), expected.len());
        for ((term_id, bucket), (expected_term, expected_bucket_id, expected_count)) in
            entries.into_iter().zip(expected)
        {
            assert_eq!(term_id, expected_term);
            assert_eq!(bucket.bucket_id, expected_bucket_id);
            assert_eq!(bucket.count, expected_count);
        }
    }

    /// Runs the shared terms-aggregation scenario with `merge_segments = true`.
    #[test]
    fn terms_aggregation_test_single_segment() -> crate::Result<()> {
        terms_aggregation_test_merge_segment(true)
    }
    /// Runs the shared terms-aggregation scenario with `merge_segments = false`.
    #[test]
    fn terms_aggregation_test() -> crate::Result<()> {
        terms_aggregation_test_merge_segment(false)
    }
    /// Shared scenario for terms aggregations on the string field `string_id`.
    ///
    /// The fixture contains "terma" five times, "termb" twice and "termc" once. Covered
    /// requests: default settings, `size`/`segment_size` cut-off, `include`/`exclude` as
    /// arrays and as regex strings, and `min_doc_count`.
    fn terms_aggregation_test_merge_segment(merge_segments: bool) -> crate::Result<()> {
        // One inner vec per entry passed to the index helper; each holds a single term.
        let segment_and_terms = vec![
            vec!["terma"],
            vec!["termb"],
            vec!["termc"],
            vec!["terma"],
            vec!["terma"],
            vec!["terma"],
            vec!["termb"],
            vec!["terma"],
        ];
        let index = get_test_index_from_terms(merge_segments, &segment_and_terms)?;

        // default request: all three terms, highest doc count first
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                },
            }
        }))
        .unwrap();

        let res = exec_request(agg_req, &index)?;
        assert_eq!(res["my_texts"]["buckets"][0]["key"], "terma");
        assert_eq!(res["my_texts"]["buckets"][0]["doc_count"], 5);
        assert_eq!(res["my_texts"]["buckets"][1]["key"], "termb");
        assert_eq!(res["my_texts"]["buckets"][1]["doc_count"], 2);
        assert_eq!(res["my_texts"]["buckets"][2]["key"], "termc");
        assert_eq!(res["my_texts"]["buckets"][2]["doc_count"], 1);
        assert_eq!(res["my_texts"]["sum_other_doc_count"], 0);

        // size / segment_size of 2: termc is cut off and counted in sum_other_doc_count
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "size": 2,
                    "segment_size": 2
                },
            }
        }))
        .unwrap();

        let res = exec_request(agg_req, &index)?;
        assert_eq!(res["my_texts"]["buckets"][0]["key"], "terma");
        assert_eq!(res["my_texts"]["buckets"][0]["doc_count"], 5);
        assert_eq!(res["my_texts"]["buckets"][1]["key"], "termb");
        assert_eq!(res["my_texts"]["buckets"][1]["doc_count"], 2);
        assert_eq!(
            res["my_texts"]["buckets"][2]["key"],
            serde_json::Value::Null
        );
        assert_eq!(res["my_texts"]["sum_other_doc_count"], 1);

        // include filter: only terma and termc
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "include": ["terma", "termc"],
                },
            }
        }))
        .unwrap();

        let res = exec_request(agg_req, &index)?;
        assert_eq!(res["my_texts"]["buckets"][0]["key"], "terma");
        assert_eq!(res["my_texts"]["buckets"][0]["doc_count"], 5);
        assert_eq!(res["my_texts"]["buckets"][1]["key"], "termc");
        assert_eq!(res["my_texts"]["buckets"][1]["doc_count"], 1);
        assert_eq!(res["my_texts"]["sum_other_doc_count"], 0);

        // exclude filter: remove termc
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "exclude": ["termc"],
                },
            }
        }))
        .unwrap();

        let res = exec_request(agg_req, &index)?;
        assert_eq!(res["my_texts"]["buckets"][0]["key"], "terma");
        assert_eq!(res["my_texts"]["buckets"][0]["doc_count"], 5);
        assert_eq!(res["my_texts"]["buckets"][1]["key"], "termb");
        assert_eq!(res["my_texts"]["buckets"][1]["doc_count"], 2);
        assert_eq!(res["my_texts"]["sum_other_doc_count"], 0);

        // include regex (single string): only termb
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "include": "termb",
                },
            }
        }))
        .unwrap();

        let res = exec_request(agg_req, &index)?;
        assert_eq!(res["my_texts"]["buckets"][0]["key"], "termb");
        assert_eq!(res["my_texts"]["buckets"][0]["doc_count"], 2);
        assert_eq!(res["my_texts"]["sum_other_doc_count"], 0);

        // include regex (term.*) with exclude regex (termc): expect terma and termb
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "include": "term.*",
                    "exclude": "termc",
                },
            }
        }))
        .unwrap();

        let res = exec_request(agg_req, &index)?;
        assert_eq!(res["my_texts"]["buckets"][0]["key"], "terma");
        assert_eq!(res["my_texts"]["buckets"][0]["doc_count"], 5);
        assert_eq!(res["my_texts"]["buckets"][1]["key"], "termb");
        assert_eq!(res["my_texts"]["buckets"][1]["doc_count"], 2);
        assert_eq!(res["my_texts"]["sum_other_doc_count"], 0);

        // test min_doc_count
        // Only terma (5 docs) reaches the minimum of 3.
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "size": 2,
                    "min_doc_count": 3,
                },
            }
        }))
        .unwrap();

        let res = exec_request(agg_req, &index)?;
        assert_eq!(res["my_texts"]["buckets"][0]["key"], "terma");
        assert_eq!(res["my_texts"]["buckets"][0]["doc_count"], 5);
        assert_eq!(
            res["my_texts"]["buckets"][1]["key"],
            serde_json::Value::Null
        );
        assert_eq!(res["my_texts"]["sum_other_doc_count"], 0); // TODO sum_other_doc_count with min_doc_count
        Ok(())
    }

    /// Runs the count-ordering scenario with `merge_segments = true`.
    #[test]
    fn terms_aggregation_test_order_count_single_segment() -> crate::Result<()> {
        terms_aggregation_test_order_count_merge_segment(true)
    }
    /// Runs the count-ordering scenario with `merge_segments = false`.
    #[test]
    fn terms_aggregation_test_count_order() -> crate::Result<()> {
        terms_aggregation_test_order_count_merge_segment(false)
    }
    /// Shared scenario for terms aggregations ordered by `_count` ascending, each with `avg`
    /// and `stats` sub-aggregations on `score`.
    ///
    /// Covers the string field `string_id` as well as the numeric fields `score`,
    /// `score_f64` and `score_i64`.
    fn terms_aggregation_test_order_count_merge_segment(merge_segments: bool) -> crate::Result<()> {
        // (score, term) pairs: terma x6 (avg 4.5), termb x2 (avg 5.0), termc x3 (avg 1.0).
        let segment_and_terms = vec![
            vec![(5.0, "terma".to_string())],
            vec![(2.0, "termb".to_string())],
            vec![(2.0, "terma".to_string())],
            vec![(1.0, "termc".to_string())],
            vec![(1.0, "termc".to_string())],
            vec![(1.0, "termc".to_string())],
            vec![(5.0, "terma".to_string())],
            vec![(5.0, "terma".to_string())],
            vec![(5.0, "terma".to_string())],
            vec![(8.0, "termb".to_string())],
            vec![(5.0, "terma".to_string())],
        ];
        let index = get_test_index_from_values_and_terms(merge_segments, &segment_and_terms)?;

        // Sub-aggregations attached to every terms aggregation below.
        let sub_agg: Aggregations = serde_json::from_value(json!({
            "avg_score": {
                "avg": {
                    "field": "score",
                }
            },
            "stats_score": {
                "stats": {
                    "field": "score",
                }
            }
        }))
        .unwrap();

        // order by _count ascending, with sub aggregations
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "order": {
                        "_count": "asc",
                    },
                },
                "aggs": sub_agg,
            }
        }))
        .unwrap();

        let res = exec_request(agg_req, &index)?;
        assert_eq!(res["my_texts"]["buckets"][0]["key"], "termb");
        assert_eq!(res["my_texts"]["buckets"][0]["doc_count"], 2);
        assert_eq!(res["my_texts"]["buckets"][0]["avg_score"]["value"], 5.0);

        assert_eq!(res["my_texts"]["buckets"][1]["key"], "termc");
        assert_eq!(res["my_texts"]["buckets"][1]["doc_count"], 3);
        assert_eq!(res["my_texts"]["buckets"][1]["avg_score"]["value"], 1.0);

        assert_eq!(res["my_texts"]["buckets"][2]["key"], "terma");
        assert_eq!(res["my_texts"]["buckets"][2]["doc_count"], 6);
        assert_eq!(res["my_texts"]["buckets"][2]["avg_score"]["value"], 4.5);

        assert_eq!(res["my_texts"]["sum_other_doc_count"], 0);

        // Agg on non string
        //
        // Same ordering, but bucketing on the numeric score columns.
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_scores1": {
                "terms": {
                    "field": "score",
                    "order": {
                        "_count": "asc",
                    },
                },
                "aggs": sub_agg,
            },
            "my_scores2": {
                "terms": {
                    "field": "score_f64",
                    "order": {
                        "_count": "asc",
                    },
                },
                "aggs": sub_agg,
            },
            "my_scores3": {
                "terms": {
                    "field": "score_i64",
                    "order": {
                        "_count": "asc",
                    },
                },
                "aggs": sub_agg,
            }

        }))
        .unwrap();

        let res = exec_request(agg_req, &index)?;
        // Score 8.0 occurs once, 2.0 twice, 1.0 three times and 5.0 five times.
        assert_eq!(res["my_scores1"]["buckets"][0]["key"], 8.0);
        assert_eq!(res["my_scores1"]["buckets"][0]["doc_count"], 1);
        assert_eq!(res["my_scores1"]["buckets"][0]["avg_score"]["value"], 8.0);

        assert_eq!(res["my_scores1"]["buckets"][1]["key"], 2.0);
        assert_eq!(res["my_scores1"]["buckets"][1]["doc_count"], 2);
        assert_eq!(res["my_scores1"]["buckets"][1]["avg_score"]["value"], 2.0);

        assert_eq!(res["my_scores1"]["buckets"][2]["key"], 1.0);
        assert_eq!(res["my_scores1"]["buckets"][2]["doc_count"], 3);
        assert_eq!(res["my_scores1"]["buckets"][2]["avg_score"]["value"], 1.0);

        assert_eq!(res["my_scores1"]["buckets"][3]["key"], 5.0);
        assert_eq!(res["my_scores1"]["buckets"][3]["doc_count"], 5);
        assert_eq!(res["my_scores1"]["buckets"][3]["avg_score"]["value"], 5.0);

        assert_eq!(res["my_scores1"]["sum_other_doc_count"], 0);

        assert_eq!(res["my_scores2"]["buckets"][0]["key"], 8.0);
        assert_eq!(res["my_scores2"]["buckets"][0]["doc_count"], 1);
        assert_eq!(res["my_scores2"]["buckets"][0]["avg_score"]["value"], 8.0);

        assert_eq!(res["my_scores2"]["buckets"][1]["key"], 2.0);
        assert_eq!(res["my_scores2"]["buckets"][1]["doc_count"], 2);
        assert_eq!(res["my_scores2"]["buckets"][1]["avg_score"]["value"], 2.0);

        assert_eq!(res["my_scores2"]["buckets"][2]["key"], 1.0);
        assert_eq!(res["my_scores2"]["buckets"][2]["doc_count"], 3);
        assert_eq!(res["my_scores2"]["buckets"][2]["avg_score"]["value"], 1.0);

        assert_eq!(res["my_scores2"]["sum_other_doc_count"], 0);

        assert_eq!(res["my_scores3"]["buckets"][0]["key"], 8.0);
        assert_eq!(res["my_scores3"]["buckets"][0]["doc_count"], 1);
        assert_eq!(res["my_scores3"]["buckets"][0]["avg_score"]["value"], 8.0);

        assert_eq!(res["my_scores3"]["buckets"][1]["key"], 2.0);
        assert_eq!(res["my_scores3"]["buckets"][1]["doc_count"], 2);
        assert_eq!(res["my_scores3"]["buckets"][1]["avg_score"]["value"], 2.0);

        assert_eq!(res["my_scores3"]["buckets"][2]["key"], 1.0);
        assert_eq!(res["my_scores3"]["buckets"][2]["doc_count"], 3);
        assert_eq!(res["my_scores3"]["buckets"][2]["avg_score"]["value"], 1.0);

        assert_eq!(res["my_scores3"]["sum_other_doc_count"], 0);

        Ok(())
    }

    /// Smoke test: terms aggregation with an `avg` sub-aggregation over an index built from a
    /// single `(score, term)` entry.
    #[test]
    fn test_simple_agg() {
        let entries = vec![vec![(5.0, "terma".to_string())]];
        let index = get_test_index_from_values_and_terms(true, &entries).unwrap();

        let sub_agg: Aggregations = serde_json::from_value(json!({
            "avg_score": {
                "avg": {
                    "field": "score",
                }
            }
        }))
        .unwrap();

        // Terms ordered by ascending doc count, carrying the avg sub-aggregation.
        let request = json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "order": {
                        "_count": "asc",
                    },
                },
                "aggs": sub_agg,
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();

        let res = exec_request(agg_req, &index).unwrap();
        let first_bucket = &res["my_texts"]["buckets"][0];
        assert_eq!(first_bucket["key"], "terma");
        assert_eq!(first_bucket["doc_count"], 1);
        assert_eq!(first_bucket["avg_score"]["value"], 5.0);
    }

    /// Runs the sub-aggregation ordering checks with `merge_segments = true`.
    #[test]
    fn terms_aggregation_test_order_sub_agg_single_segment() -> crate::Result<()> {
        terms_aggregation_test_order_sub_agg_merge_segment(true)
    }
    /// Runs the sub-aggregation ordering checks with `merge_segments = false`.
    #[test]
    fn terms_aggregation_test_sub_agg_order() -> crate::Result<()> {
        terms_aggregation_test_order_sub_agg_merge_segment(false)
    }
    /// Shared body of the sub-aggregation ordering tests.
    ///
    /// Builds an index from ten `(score, term)` entries (forwarding `merge_segments` to the index
    /// helper) and checks that terms buckets can be ordered by a single-value sub-aggregation
    /// (`avg_score`), by one value of a multi-value sub-aggregation (`stats_score.avg`), and that
    /// ordering by an unknown sub-aggregation is rejected.
    fn terms_aggregation_test_order_sub_agg_merge_segment(
        merge_segments: bool,
    ) -> crate::Result<()> {
        // One (score, term) pair per inner vec, in insertion order.
        let segment_and_terms: Vec<_> = [
            (5.0, "terma"),
            (4.0, "termb"),
            (1.0, "termc"),
            (1.0, "termc"),
            (1.0, "termc"),
            (5.0, "terma"),
            (5.0, "terma"),
            (5.0, "terma"),
            (8.0, "termb"),
            (5.0, "terma"),
        ]
        .iter()
        .map(|&(score, term)| vec![(score, term.to_string())])
        .collect();
        let index = get_test_index_from_values_and_terms(merge_segments, &segment_and_terms)?;

        let sub_agg: Aggregations = serde_json::from_value(json!({
            "avg_score": {
                "avg": {
                    "field": "score",
                }
            },
            "stats_score": {
                "stats": {
                    "field": "score",
                }
            }
        }))
        .unwrap();

        // Checks the leading buckets as (key, doc_count, avg_score) in order, then verifies that
        // no documents were left out of the returned buckets.
        let assert_buckets = |res: &serde_json::Value, expected: &[(&str, i32, f64)]| {
            let buckets = &res["my_texts"]["buckets"];
            for (idx, &(key, doc_count, avg_score)) in expected.iter().enumerate() {
                assert_eq!(buckets[idx]["key"], key);
                assert_eq!(buckets[idx]["doc_count"], doc_count);
                assert_eq!(buckets[idx]["avg_score"]["value"], avg_score);
            }
            assert_eq!(res["my_texts"]["sum_other_doc_count"], 0);
        };

        // Order by the avg sub-aggregation, descending.
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "order": {
                        "avg_score": "desc"
                    }
                },
                "aggs": sub_agg,
            }
        }))
        .unwrap();
        let res = exec_request(agg_req, &index)?;
        assert_buckets(&res, &[("termb", 2, 6.0), ("terma", 5, 5.0), ("termc", 3, 1.0)]);

        // Order by the avg sub-aggregation, ascending.
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "order": {
                        "avg_score": "asc"
                    }
                },
                "aggs": sub_agg,
            }
        }))
        .unwrap();
        let res = exec_request(agg_req, &index)?;
        assert_buckets(&res, &[("termc", 3, 1.0), ("terma", 5, 5.0), ("termb", 2, 6.0)]);

        // Order by one value (`avg`) of the multi-value stats sub-aggregation, ascending.
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "order": {
                        "stats_score.avg": "asc"
                    }
                },
                "aggs": sub_agg,
            }
        }))
        .unwrap();
        let res = exec_request(agg_req, &index)?;
        assert_buckets(&res, &[("termc", 3, 1.0), ("terma", 5, 5.0), ("termb", 2, 6.0)]);

        // Ordering by a sub-aggregation that was never declared must fail.
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "order": {
                        "doesnotexist": "asc"
                    }
                },
                "aggs": sub_agg,
            }
        }))
        .unwrap();
        assert!(exec_request(agg_req, &index).is_err());

        Ok(())
    }

    /// Runs the `_key` ordering checks with `merge_segments = true`.
    #[test]
    fn terms_aggregation_test_order_key_single_segment() -> crate::Result<()> {
        terms_aggregation_test_order_key_merge_segment(true)
    }
    /// Runs the `_key` ordering checks with `merge_segments = false`.
    #[test]
    fn terms_aggregation_test_key_order() -> crate::Result<()> {
        terms_aggregation_test_order_key_merge_segment(false)
    }
    /// Shared body of the `_key` ordering tests.
    ///
    /// Builds an index from ten `(score, term)` entries (forwarding `merge_segments` to the index
    /// helper) and checks ascending and descending key order, each without a limit, with a
    /// `size` cut-off, and with both `size` and `segment_size` cut-offs.
    fn terms_aggregation_test_order_key_merge_segment(merge_segments: bool) -> crate::Result<()> {
        // One (score, term) pair per inner vec, in insertion order.
        let segment_and_terms: Vec<_> = [
            (5.0, "terma"),
            (4.0, "termb"),
            (1.0, "termc"),
            (1.0, "termc"),
            (1.0, "termc"),
            (5.0, "terma"),
            (5.0, "terma"),
            (5.0, "terma"),
            (8.0, "termb"),
            (5.0, "terma"),
        ]
        .iter()
        .map(|&(score, term)| vec![(score, term.to_string())])
        .collect();
        let index = get_test_index_from_values_and_terms(merge_segments, &segment_and_terms)?;

        // Checks the leading buckets as (key, doc_count), in order.
        let assert_leading_buckets = |res: &serde_json::Value, expected: &[(&str, i32)]| {
            let buckets = &res["my_texts"]["buckets"];
            for (idx, &(key, doc_count)) in expected.iter().enumerate() {
                assert_eq!(buckets[idx]["key"], key);
                assert_eq!(buckets[idx]["doc_count"], doc_count);
            }
        };

        // key asc, no cut-off
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "order": {
                        "_key": "asc"
                    }
                },
            }
        }))
        .unwrap();
        let res = exec_request(agg_req, &index)?;
        assert_leading_buckets(&res, &[("terma", 5), ("termb", 2), ("termc", 3)]);
        assert_eq!(res["my_texts"]["sum_other_doc_count"], 0);

        // key asc, size cut-off
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "order": {
                        "_key": "asc"
                    },
                    "size": 2
                },
            }
        }))
        .unwrap();
        let res = exec_request(agg_req, &index)?;
        assert_leading_buckets(&res, &[("terma", 5), ("termb", 2)]);
        // There is no third bucket.
        assert_eq!(
            res["my_texts"]["buckets"][2]["doc_count"],
            serde_json::Value::Null
        );
        assert_eq!(res["my_texts"]["sum_other_doc_count"], 3);

        // key asc, size and segment_size cut-off
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "order": {
                        "_key": "asc"
                    },
                    "size": 2,
                    "segment_size": 2
                },
            }
        }))
        .unwrap();
        let res = exec_request(agg_req, &index)?;
        assert_leading_buckets(&res, &[("terma", 5), ("termb", 2)]);
        assert_eq!(
            res["my_texts"]["buckets"][2]["doc_count"],
            serde_json::Value::Null
        );

        // key desc, no cut-off
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "order": {
                        "_key": "desc"
                    },
                },
            }
        }))
        .unwrap();
        let res = exec_request(agg_req, &index)?;
        assert_leading_buckets(&res, &[("termc", 3), ("termb", 2), ("terma", 5)]);
        assert_eq!(res["my_texts"]["sum_other_doc_count"], 0);

        // key desc, size cut-off
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "order": {
                        "_key": "desc"
                    },
                    "size": 2
                },
            }
        }))
        .unwrap();
        let res = exec_request(agg_req, &index)?;
        assert_leading_buckets(&res, &[("termc", 3), ("termb", 2)]);
        assert_eq!(
            res["my_texts"]["buckets"][2]["doc_count"],
            serde_json::Value::Null
        );
        assert_eq!(res["my_texts"]["sum_other_doc_count"], 5);

        // key desc, size and segment_size cut-off
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "order": {
                        "_key": "desc"
                    },
                    "size": 2,
                    "segment_size": 2
                },
            }
        }))
        .unwrap();
        let res = exec_request(agg_req, &index)?;
        assert_leading_buckets(&res, &[("termc", 3), ("termb", 2)]);
        assert_eq!(
            res["my_texts"]["buckets"][2]["doc_count"],
            serde_json::Value::Null
        );

        Ok(())
    }

    /// With `min_doc_count: 0`, terms that the query did not match are still reported, with a
    /// doc count of zero.
    #[test]
    fn terms_aggregation_min_doc_count_special_case() -> crate::Result<()> {
        let first_segment = vec!["terma", "terma", "termb", "termb", "termb"];
        let second_segment = vec!["terma", "terma", "termb"];
        let terms_per_segment = vec![first_segment, second_segment];

        let index = get_test_index_from_terms(false, &terms_per_segment)?;

        let request = json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "min_doc_count": 0,
                },
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();

        // The query only matches "terma"; min_doc_count == 0 still surfaces "termb".
        let res = exec_request_with_query(agg_req, &index, Some(("string_id", "terma")))?;

        let agg = &res["my_texts"];
        let buckets = &agg["buckets"];
        assert_eq!(buckets[0]["key"], "terma");
        assert_eq!(buckets[0]["doc_count"], 4);
        assert_eq!(buckets[1]["key"], "termb");
        assert_eq!(buckets[1]["doc_count"], 0);
        assert_eq!(agg["sum_other_doc_count"], 0);
        assert_eq!(agg["doc_count_error_upper_bound"], 0);

        Ok(())
    }

    /// `min_doc_count: 0` combined with a histogram sub-aggregation, across two commits where
    /// one term ("B") has a filtered-out document in the first commit and a hit in the second.
    #[test]
    fn terms_aggregation_min_doc_count_special_case_with_sub_agg_empty_merge() -> crate::Result<()>
    {
        let mut schema_builder = Schema::builder();
        let term_field = schema_builder.add_text_field("string1", STRING | FAST);
        let filter_field = schema_builder.add_text_field("string2", STRING | FAST);
        let score_field = schema_builder.add_u64_field(
            "score",
            crate::schema::NumericOptions::default().set_fast(),
        );
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
            index_writer.set_merge_policy(Box::new(NoMergePolicy));

            // First commit.
            index_writer.add_document(doc!(
                term_field => "A".to_string(),
                filter_field => "hit".to_string(),
                score_field => 1u64,
            ))?;
            // This doc gets filtered in this segment, but the term will still be loaded because
            // min_doc_count == 0.
            index_writer.add_document(doc!(
                term_field => "B".to_string(),
                filter_field => "nohit".to_string(),
                score_field => 2u64,
            ))?;
            index_writer.commit()?;

            // Second commit: both terms are hits.
            index_writer.add_document(doc!(
                term_field => "A".to_string(),
                filter_field => "hit".to_string(),
                score_field => 2u64,
            ))?;
            index_writer.add_document(doc!(
                term_field => "B".to_string(),
                filter_field => "hit".to_string(),
                score_field => 4u64,
            ))?;
            index_writer.commit()?;
        }

        let request = json!({
            "my_texts": {
                "terms": {
                    "field": "string1",
                    "min_doc_count": 0,
                },
                "aggs":{
                    "elhistogram": {
                        "histogram": {
                            "field": "score",
                            "interval": 1
                        }
                    }
                }
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();

        // Only documents whose `string2` is "hit" are matched by the query.
        let res = exec_request_with_query(agg_req, &index, Some(("string2", "hit")))?;

        let agg = &res["my_texts"];
        let bucket_a = &agg["buckets"][0];
        assert_eq!(bucket_a["key"], "A");
        assert_eq!(bucket_a["doc_count"], 2);
        assert_eq!(
            bucket_a["elhistogram"]["buckets"],
            json!([{ "doc_count": 1, "key": 1.0 }, { "doc_count": 1, "key": 2.0 } ])
        );
        let bucket_b = &agg["buckets"][1];
        assert_eq!(bucket_b["key"], "B");
        assert_eq!(bucket_b["doc_count"], 1);
        assert_eq!(
            bucket_b["elhistogram"]["buckets"],
            json!([ { "doc_count": 1, "key": 4.0 } ])
        );
        assert_eq!(agg["sum_other_doc_count"], 0);
        assert_eq!(agg["doc_count_error_upper_bound"], 0);

        Ok(())
    }

    /// Checks `sum_other_doc_count` and `doc_count_error_upper_bound` when `segment_size` cuts
    /// terms off per segment, and that `show_term_doc_count_error: false` hides the error bound.
    #[test]
    fn terms_aggregation_error_count_test() -> crate::Result<()> {
        // termc doesn't make it from this segment
        let first_segment = vec!["terma", "terma", "termb", "termb", "termb", "termc"];
        // termb doesn't make it from this segment
        let second_segment = vec!["terma", "terma", "termb", "termc", "termc"];
        let terms_per_segment = vec![first_segment, second_segment];

        let index = get_test_index_from_terms(false, &terms_per_segment)?;
        assert_eq!(index.searchable_segments().unwrap().len(), 2);

        // Error bound reporting left at its default.
        let request = json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "size": 2,
                    "segment_size": 2
                },
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();

        let res = exec_request(agg_req, &index)?;
        let agg = &res["my_texts"];
        let buckets = &agg["buckets"];

        assert_eq!(buckets[0]["key"], "terma");
        assert_eq!(buckets[0]["doc_count"], 4);
        assert_eq!(buckets[1]["key"], "termb");
        assert_eq!(buckets[1]["doc_count"], 3);
        assert_eq!(buckets[2]["doc_count"], serde_json::Value::Null);
        assert_eq!(agg["sum_other_doc_count"], 4);
        assert_eq!(agg["doc_count_error_upper_bound"], 2);

        // Same request with doc_count_error_upper_bound disabled.
        let request = json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "size": 2,
                    "segment_size": 2,
                    "show_term_doc_count_error": false
                },
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();

        let res = exec_request(agg_req, &index)?;
        let agg = &res["my_texts"];

        assert_eq!(agg["sum_other_doc_count"], 4);
        assert_eq!(agg["doc_count_error_upper_bound"], serde_json::Value::Null);

        Ok(())
    }

    /// A terms aggregation over 20,000 distinct terms must abort once the configured memory
    /// limit (50,000 bytes here) is exceeded.
    #[test]
    fn terms_aggregation_term_bucket_limit() -> crate::Result<()> {
        let owned_terms: Vec<String> = (0..20_000).map(|num| num.to_string()).collect();
        let terms_per_segment = vec![owned_terms.iter().map(String::as_str).collect()];

        let index = get_test_index_from_terms(true, &terms_per_segment)?;

        let request = json!({
            "my_texts": {
                "terms": {
                    "field": "string_id",
                    "min_doc_count": 0,
                },
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();

        let limits = AggregationLimitsGuard::new(Some(50_000), None);
        let err = exec_request_with_query_and_memory_limit(agg_req, &index, None, limits)
            .unwrap_err();
        let message = err.to_string();
        assert!(
            message.contains("Aborting aggregation because memory limit was exceeded. Limit: 50.00 KB")
        );

        Ok(())
    }

    /// Terms aggregation on the `text_id` field: multi-word values are expected to come back as
    /// whole bucket keys ("Hallo Hallo", "Hello Hello").
    #[test]
    fn terms_aggregation_different_tokenizer_on_ff_test() -> crate::Result<()> {
        let segment_terms = vec!["Hello Hello", "Hallo Hallo", "Hallo Hallo"];

        let index = get_test_index_from_terms(true, &[segment_terms])?;

        let request = json!({
            "my_texts": {
                "terms": {
                    "field": "text_id",
                    "min_doc_count": 0,
                },
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();

        let res = exec_request_with_query(agg_req, &index, None).unwrap();
        let pretty = serde_json::to_string_pretty(&res).unwrap();
        println!("{}", pretty);

        let buckets = &res["my_texts"]["buckets"];
        assert_eq!(buckets[0]["key"], "Hallo Hallo");
        assert_eq!(buckets[0]["doc_count"], 2);

        assert_eq!(buckets[1]["key"], "Hello Hello");
        assert_eq!(buckets[1]["doc_count"], 1);

        Ok(())
    }

    /// Checks that terms aggregation requests deserialize identically from a JSON value and from
    /// its string form, and that `split_size` and `shard_size` deserialize to the same request.
    #[test]
    fn test_json_format() -> crate::Result<()> {
        // Serializes the JSON value to a string and parses that string as an aggregation request.
        let parse_via_string = |value: &serde_json::Value| -> Aggregations {
            let serialized = serde_json::to_string(value).unwrap();
            serde_json::from_str(&serialized).unwrap()
        };

        let agg_req: Aggregations = serde_json::from_value(json!({
            "term_agg_test": {
                "terms": {
                    "field": "string_id",
                    "size": 2,
                    "segment_size": 2,
                    "order": {
                        "_key": "desc"
                    }
                },
            }
        }))
        .unwrap();

        let elasticsearch_compatible_json = json!(
        {
        "term_agg_test":{
            "terms": {
                "field": "string_id",
                "size": 2u64,
                "segment_size": 2u64,
                "order": {"_key": "desc"}
            }
        }
        });
        assert_eq!(agg_req, parse_via_string(&elasticsearch_compatible_json));

        // Aliases: a request written with `split_size` is the reference for both spellings.
        let agg_req: Aggregations = serde_json::from_value(json!({
            "term_agg_test": {
                "terms": {
                    "field": "string_id",
                    "split_size": 2,
                },
            }
        }))
        .unwrap();

        let with_split_size = json!(
        {
        "term_agg_test":{
            "terms": {
                "field": "string_id",
                "split_size": 2u64,
            }
        }
        });
        assert_eq!(agg_req, parse_via_string(&with_split_size));

        let with_shard_size = json!(
        {
        "term_agg_test":{
            "terms": {
                "field": "string_id",
                "shard_size": 2u64,
            }
        }
        });
        assert_eq!(agg_req, parse_via_string(&with_shard_size));

        Ok(())
    }
    /// Terms aggregation on a JSON sub-field that is absent from some commits and only partially
    /// populated in another.
    #[test]
    fn terms_empty_json() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();

        // Commit 1: a document with no json at all.
        index_writer.add_document(doc!()).unwrap();
        index_writer.commit().unwrap();

        // Commit 2: json is present, but without the `partially_empty` field.
        let other_field_doc = doc!(json_field => json!({"different_field": "blue"}));
        index_writer.add_document(other_field_doc).unwrap();
        index_writer.commit().unwrap();

        // Commit 3: one document with `partially_empty`, one empty document.
        let target_field_doc = doc!(json_field => json!({"partially_empty": "blue"}));
        index_writer.add_document(target_field_doc).unwrap();
        index_writer.add_document(doc!())?;
        index_writer.commit().unwrap();

        let request = json!({
            "my_texts": {
                "terms": {
                    "field": "json.partially_empty"
                },
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();

        let res = exec_request_with_query(agg_req, &index, None)?;

        let agg = &res["my_texts"];
        assert_eq!(agg["buckets"][0]["key"], "blue");
        assert_eq!(agg["buckets"][0]["doc_count"], 1);
        assert_eq!(agg["buckets"][1], serde_json::Value::Null);
        assert_eq!(agg["sum_other_doc_count"], 0);
        assert_eq!(agg["doc_count_error_upper_bound"], 0);

        Ok(())
    }

    /// Terms aggregation on a bytes fast field: currently yields no buckets rather than an error.
    #[test]
    fn terms_aggregation_bytes() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let bytes_field = schema_builder.add_bytes_field("bytes", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
            index_writer.set_merge_policy(Box::new(NoMergePolicy));
            index_writer.add_document(doc!(
                bytes_field => vec![1,2,3],
            ))?;
            index_writer.commit()?;
        }

        let request = json!({
            "my_texts": {
                "terms": {
                    "field": "bytes"
                },
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();

        let res = exec_request_with_query(agg_req, &index, None)?;

        // TODO: Returning an error would be better instead of an empty result, since this is not a
        // JSON field
        let agg = &res["my_texts"];
        assert_eq!(agg["buckets"][0]["key"], serde_json::Value::Null);
        assert_eq!(agg["sum_other_doc_count"], 0);
        assert_eq!(agg["doc_count_error_upper_bound"], 0);

        Ok(())
    }

    /// Exercises the `missing` parameter of the terms aggregation on multi-valued text and u64
    /// fields, across three commits: mixed, entirely empty, and fully populated.
    #[test]
    fn terms_aggregation_missing_multi_value() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", FAST);
        let id_field = schema_builder.add_u64_field("id", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
            index_writer.set_merge_policy(Box::new(NoMergePolicy));

            // Mixed commit: a multi-valued doc, a doc missing both fields, two docs without id.
            index_writer.add_document(doc!(
                text_field => "Hello Hello",
                text_field => "Hello Hello",
                id_field => 1u64,
                id_field => 1u64,
            ))?;
            index_writer.add_document(doc!())?;
            for _ in 0..2 {
                index_writer.add_document(doc!(
                    text_field => "Hello Hello",
                ))?;
            }
            index_writer.commit()?;

            // Empty segment special case
            index_writer.add_document(doc!())?;
            index_writer.commit()?;

            // Full segment special case
            index_writer.add_document(doc!(
                text_field => "Hello Hello",
                id_field => 1u64,
            ))?;
            index_writer.commit()?;
        }

        let request = json!({
            "my_texts": {
                "terms": {
                    "field": "text",
                    "missing": "Empty"
                },
            },
            "my_texts2": {
                "terms": {
                    "field": "text",
                    "missing": 1337
                },
            },
            "my_ids": {
                "terms": {
                    "field": "id",
                    "missing": 1337
                },
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();

        let res = exec_request_with_query(agg_req, &index, None)?;

        // Text field with a string fallback for missing values.
        let text_buckets = &res["my_texts"]["buckets"];
        assert_eq!(text_buckets[0]["key"], "Hello Hello");
        assert_eq!(text_buckets[0]["doc_count"], 5);
        assert_eq!(text_buckets[1]["key"], "Empty");
        assert_eq!(text_buckets[1]["doc_count"], 2);
        assert_eq!(text_buckets[2]["key"], serde_json::Value::Null);

        // Text field with a number as the missing fallback.
        let text2_buckets = &res["my_texts2"]["buckets"];
        assert_eq!(text2_buckets[0]["key"], "Hello Hello");
        assert_eq!(text2_buckets[0]["doc_count"], 5);
        assert_eq!(text2_buckets[1]["key"], 1337.0);
        assert_eq!(text2_buckets[1]["doc_count"], 2);
        assert_eq!(text2_buckets[2]["key"], serde_json::Value::Null);
        assert_eq!(res["my_texts"]["sum_other_doc_count"], 0);
        assert_eq!(res["my_texts"]["doc_count_error_upper_bound"], 0);

        // Numeric id field.
        let id_buckets = &res["my_ids"]["buckets"];
        assert_eq!(id_buckets[0]["key"], 1337.0);
        assert_eq!(id_buckets[0]["doc_count"], 4);
        assert_eq!(id_buckets[1]["key"], 1.0);
        assert_eq!(id_buckets[1]["doc_count"], 3);
        assert_eq!(id_buckets[2]["key"], serde_json::Value::Null);

        Ok(())
    }
    /// `missing` on a single u64 field: documents without an id are counted under the fallback
    /// key.
    #[test]
    fn terms_aggregation_missing_simple_id() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let id_field = schema_builder.add_u64_field("id", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
            index_writer.set_merge_policy(Box::new(NoMergePolicy));
            index_writer.add_document(doc!(
                id_field => 1u64,
            ))?;
            // Two documents with no id.
            for _ in 0..2 {
                index_writer.add_document(doc!())?;
            }
            index_writer.commit()?;
        }

        let request = json!({
            "my_ids": {
                "terms": {
                    "field": "id",
                    "missing": 1337
                },
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();

        let res = exec_request_with_query(agg_req, &index, None)?;

        // The fallback bucket is asserted first, then the real id.
        let id_buckets = &res["my_ids"]["buckets"];
        assert_eq!(id_buckets[0]["key"], 1337.0);
        assert_eq!(id_buckets[0]["doc_count"], 2);
        assert_eq!(id_buckets[1]["key"], 1.0);
        assert_eq!(id_buckets[1]["doc_count"], 1);
        assert_eq!(id_buckets[2]["key"], serde_json::Value::Null);

        Ok(())
    }

    /// Large u64 values must come back from a terms aggregation without being truncated.
    #[test]
    fn terms_aggregation_u64_value() -> crate::Result<()> {
        let frequent_id = 1_769_070_189_829_214_202u64;
        let rare_id = 9_223_372_036_854_775_807u64;

        let mut schema_builder = Schema::builder();
        let id_field = schema_builder.add_u64_field("id", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        {
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            writer.set_merge_policy(Box::new(NoMergePolicy));
            for id in [rare_id, frequent_id, frequent_id] {
                writer.add_document(doc!(id_field => id))?;
            }
            writer.commit()?;
        }

        let request = json!({
            "my_ids": {
                "terms": {
                    "field": "id"
                }
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();
        let res = exec_request_with_query(agg_req, &index, None)?;

        // Expected: the id indexed twice, then the id indexed once, and no third bucket.
        let id_buckets = &res["my_ids"]["buckets"];
        assert_eq!(id_buckets[0]["key"], frequent_id);
        assert_eq!(id_buckets[0]["doc_count"], 2);
        assert_eq!(id_buckets[1]["key"], rare_id);
        assert_eq!(id_buckets[1]["doc_count"], 1);
        assert_eq!(id_buckets[2]["key"], serde_json::Value::Null);

        Ok(())
    }

    /// `missing` handling for text and u64 fields across three commits: one with a mix of
    /// documents, one holding only an empty document, and one holding only a complete document.
    #[test]
    fn terms_aggregation_missing1() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", FAST);
        let id_field = schema_builder.add_u64_field("id", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        {
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            writer.set_merge_policy(Box::new(NoMergePolicy));

            // First commit: a complete document, an empty one, and two without an id.
            writer.add_document(doc!(text_field => "Hello Hello", id_field => 1u64))?;
            writer.add_document(doc!())?;
            for _ in 0..2 {
                writer.add_document(doc!(text_field => "Hello Hello"))?;
            }
            writer.commit()?;

            // Second commit: only an empty document.
            writer.add_document(doc!())?;
            writer.commit()?;

            // Third commit: only a complete document.
            writer.add_document(doc!(text_field => "Hello Hello", id_field => 1u64))?;
            writer.commit()?;
        }

        let request = json!({
            "my_texts": {
                "terms": { "field": "text", "missing": "Empty" }
            },
            "my_texts2": {
                "terms": { "field": "text", "missing": 1337 }
            },
            "my_ids": {
                "terms": { "field": "id", "missing": 1337 }
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();
        let res = exec_request_with_query(agg_req, &index, None)?;

        // Text field with a string as missing fallback.
        let text_buckets = &res["my_texts"]["buckets"];
        assert_eq!(text_buckets[0]["key"], "Hello Hello");
        assert_eq!(text_buckets[0]["doc_count"], 4);
        assert_eq!(text_buckets[1]["key"], "Empty");
        assert_eq!(text_buckets[1]["doc_count"], 2);
        assert_eq!(text_buckets[2]["key"], serde_json::Value::Null);

        // Text field with a number as missing fallback.
        let text_buckets2 = &res["my_texts2"]["buckets"];
        assert_eq!(text_buckets2[0]["key"], "Hello Hello");
        assert_eq!(text_buckets2[0]["doc_count"], 4);
        assert_eq!(text_buckets2[1]["key"], 1337.0);
        assert_eq!(text_buckets2[1]["doc_count"], 2);
        assert_eq!(text_buckets2[2]["key"], serde_json::Value::Null);

        assert_eq!(res["my_texts"]["sum_other_doc_count"], 0);
        assert_eq!(res["my_texts"]["doc_count_error_upper_bound"], 0);

        // Id field: four documents carry no id, two carry the id 1.
        let id_buckets = &res["my_ids"]["buckets"];
        assert_eq!(id_buckets[0]["key"], 1337.0);
        assert_eq!(id_buckets[0]["doc_count"], 4);
        assert_eq!(id_buckets[1]["key"], 1.0);
        assert_eq!(id_buckets[1]["doc_count"], 2);
        assert_eq!(id_buckets[2]["key"], serde_json::Value::Null);

        Ok(())
    }
    /// `missing` handling when the only indexed document has no value for any field: each
    /// aggregation must return exactly one bucket keyed by its `missing` value.
    #[test]
    fn terms_aggregation_missing_empty() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("text", FAST);
        schema_builder.add_u64_field("id", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        {
            let mut writer = index.writer_with_num_threads(1, 20_000_000)?;
            writer.set_merge_policy(Box::new(NoMergePolicy));
            // A single document without any field value.
            writer.add_document(doc!())?;
            writer.commit()?;
        }

        let request = json!({
            "my_texts": {
                "terms": { "field": "text", "missing": "Empty" }
            },
            "my_texts2": {
                "terms": { "field": "text", "missing": 1337 }
            },
            "my_ids": {
                "terms": { "field": "id", "missing": 1337 }
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();
        let res = exec_request_with_query(agg_req, &index, None)?;

        // Text field with a string as missing fallback.
        let text_buckets = &res["my_texts"]["buckets"];
        assert_eq!(text_buckets[0]["key"], "Empty");
        assert_eq!(text_buckets[0]["doc_count"], 1);
        assert_eq!(text_buckets[1]["key"], serde_json::Value::Null);

        // Text field with a number as missing fallback.
        let text_buckets2 = &res["my_texts2"]["buckets"];
        assert_eq!(text_buckets2[0]["key"], 1337.0);
        assert_eq!(text_buckets2[0]["doc_count"], 1);
        assert_eq!(text_buckets2[1]["key"], serde_json::Value::Null);

        assert_eq!(res["my_texts"]["sum_other_doc_count"], 0);
        assert_eq!(res["my_texts"]["doc_count_error_upper_bound"], 0);

        // Id field.
        let id_buckets = &res["my_ids"]["buckets"];
        assert_eq!(id_buckets[0]["key"], 1337.0);
        assert_eq!(id_buckets[0]["doc_count"], 1);
        assert_eq!(id_buckets[1]["key"], serde_json::Value::Null);

        Ok(())
    }

    /// Terms aggregation on a date fast field: the bucket keys are expected as RFC 3339 strings.
    #[test]
    fn terms_aggregation_date() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let date_field = schema_builder.add_date_field("date_field", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut writer = index.writer_with_num_threads(1, 15_000_000)?;
            // (year, day of September), all at midnight.
            for (year, day) in [(1982, 17), (1982, 17), (1983, 27)] {
                let midnight =
                    Date::from_calendar_date(year, Month::September, day)?.with_hms(0, 0, 0)?;
                writer.add_document(doc!(date_field => DateTime::from_primitive(midnight)))?;
            }
            writer.commit()?;
        }

        let request = json!({
            "my_date": {
                "terms": {
                    "field": "date_field"
                }
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();
        let res = exec_request_with_query(agg_req, &index, None)?;

        // Expected: the date indexed twice, then the date indexed once, and no third bucket.
        let date_buckets = &res["my_date"]["buckets"];
        assert_eq!(date_buckets[0]["key"], "1982-09-17T00:00:00Z");
        assert_eq!(date_buckets[0]["doc_count"], 2);
        assert_eq!(date_buckets[1]["key"], "1983-09-27T00:00:00Z");
        assert_eq!(date_buckets[1]["doc_count"], 1);
        assert_eq!(date_buckets[2]["key"], serde_json::Value::Null);

        Ok(())
    }
    /// Terms aggregation on a date fast field with a `missing` date given as a string: the
    /// document without a date must be counted in the bucket of the `missing` date.
    #[test]
    fn terms_aggregation_date_missing() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let date_field = schema_builder.add_date_field("date_field", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut writer = index.writer_with_num_threads(1, 15_000_000)?;
            // (year, day of September), all at midnight.
            for (year, day) in [(1982, 17), (1982, 17), (1983, 27)] {
                let midnight =
                    Date::from_calendar_date(year, Month::September, day)?.with_hms(0, 0, 0)?;
                writer.add_document(doc!(date_field => DateTime::from_primitive(midnight)))?;
            }
            // One document without a date.
            writer.add_document(doc!())?;
            writer.commit()?;
        }

        let request = json!({
            "my_date": {
                "terms": {
                    "field": "date_field",
                    "missing": "1982-09-17T00:00:00Z"
                }
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();
        let res = exec_request_with_query(agg_req, &index, None)?;

        // Expected: two real occurrences plus the missing document in the first bucket.
        let date_buckets = &res["my_date"]["buckets"];
        assert_eq!(date_buckets[0]["key"], "1982-09-17T00:00:00Z");
        assert_eq!(date_buckets[0]["doc_count"], 3);
        assert_eq!(date_buckets[1]["key"], "1983-09-27T00:00:00Z");
        assert_eq!(date_buckets[1]["doc_count"], 1);
        assert_eq!(date_buckets[2]["key"], serde_json::Value::Null);

        Ok(())
    }

    /// Terms aggregation on a bool fast field: keys are expected as `1.0` / `0.0` with a
    /// `key_as_string` of `"true"` / `"false"`.
    #[test]
    fn terms_aggregation_bool() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let field = schema_builder.add_bool_field("bool_field", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut writer = index.writer_with_num_threads(1, 15_000_000)?;
            for flag in [true, false, true] {
                writer.add_document(doc!(field => flag))?;
            }
            writer.commit()?;
        }

        let request = json!({
            "my_bool": {
                "terms": {
                    "field": "bool_field"
                }
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();
        let res = exec_request_with_query(agg_req, &index, None)?;

        let bool_buckets = &res["my_bool"]["buckets"];

        // `true` was indexed twice.
        assert_eq!(bool_buckets[0]["key"], 1.0);
        assert_eq!(bool_buckets[0]["key_as_string"], "true");
        assert_eq!(bool_buckets[0]["doc_count"], 2);

        // `false` was indexed once.
        assert_eq!(bool_buckets[1]["key"], 0.0);
        assert_eq!(bool_buckets[1]["key_as_string"], "false");
        assert_eq!(bool_buckets[1]["doc_count"], 1);

        // No third bucket.
        assert_eq!(bool_buckets[2]["key"], serde_json::Value::Null);

        Ok(())
    }

    /// Terms aggregation on an IP address fast field: the bucket keys are expected as the
    /// textual form of the address (`"::1"` for the IPv6 loopback, `"127.0.0.1"` for the IPv4
    /// address that was indexed through `into_ipv6_addr`).
    #[test]
    fn terms_aggregation_ip_addr() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let field = schema_builder.add_ip_addr_field("ip_field", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        {
            let mut writer = index.writer_with_num_threads(1, 15_000_000)?;
            // The IPv6 loopback twice, followed by one IPv4 address.
            for addr in ["::1", "::1", "127.0.0.1"] {
                writer
                    .add_document(doc!(field => IpAddr::from_str(addr).unwrap().into_ipv6_addr()))?;
            }
            writer.commit()?;
        }

        // The aggregation is named after the field type it runs on.
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_ips": {
                "terms": {
                    "field": "ip_field"
                },
            }
        }))
        .unwrap();

        let res = exec_request_with_query(agg_req, &index, None)?;

        let ip_buckets = &res["my_ips"]["buckets"];
        assert_eq!(ip_buckets[0]["key"], "::1");
        assert_eq!(ip_buckets[0]["doc_count"], 2);
        assert_eq!(ip_buckets[1]["key"], "127.0.0.1");
        assert_eq!(ip_buckets[1]["doc_count"], 1);
        assert_eq!(ip_buckets[2]["key"], serde_json::Value::Null);

        Ok(())
    }

    /// Merging intermediate aggregation results must work even if the aggregation requests were
    /// assembled in a different order and were executed on different indexes holding the same
    /// data.
    #[test]
    fn terms_aggs_hosts_and_tags_merge_on_mixed_order_request() -> crate::Result<()> {
        /// Creates an in-memory index with four text fast fields and two commits.
        fn build_index() -> crate::Result<Index> {
            let mut schema_builder = Schema::builder();
            let fielda = schema_builder.add_text_field("fielda", FAST);
            let fieldb = schema_builder.add_text_field("fieldb", FAST);
            let host = schema_builder.add_text_field("host", FAST);
            let tags = schema_builder.add_text_field("tags", FAST);

            let index = Index::create_in_ram(schema_builder.build());
            let mut writer = index.writer(50_000_000).unwrap();

            // First commit: every document has a host and at least one tag.
            writer.add_document(doc!(
                host => "192.168.0.10",
                tags => "nice",
                fielda => "a",
                fieldb => "b",
            ))?;
            writer.add_document(doc!(host => "192.168.0.1", tags => "nice"))?;
            writer.add_document(doc!(host => "192.168.0.11", tags => "nice"))?;
            writer.add_document(doc!(host => "192.168.0.10", tags => "nice", tags => "cool"))?;
            writer.add_document(doc!(host => "192.168.0.1", tags => "nice", tags => "cool"))?;
            writer.commit()?;

            // Second commit: empty documents and documents that only have a host.
            for _ in 0..2 {
                writer.add_document(doc!())?;
            }
            for _ in 0..2 {
                writer.add_document(doc!(host => "192.168.0.10"))?;
            }
            writer.add_document(doc!())?;
            writer.commit()?;

            Ok(index)
        }

        /// Runs `agg_req` against all documents of `idx` and returns the intermediate results.
        fn search(
            idx: &Index,
            agg_req: &Aggregations,
        ) -> crate::Result<IntermediateAggregationResults> {
            let collector =
                DistributedAggregationCollector::from_aggs(agg_req.clone(), Default::default());
            let searcher = idx.reader()?.searcher();
            let intermediate = searcher.search(&AllQuery, &collector)?;
            Ok(intermediate)
        }

        let index = build_index()?;
        let index2 = build_index()?;

        // First request: deserialized in one go.
        let agg_req: Aggregations = serde_json::from_value(json!({
            "hosts": { "terms": { "field": "host" } },
            "tags":  { "terms": { "field": "tags" } },
            "fielda":  { "terms": { "field": "fielda" } },
            "fieldb":  { "terms": { "field": "fieldb" } },
        }))
        .unwrap();
        let mut agg_res = search(&index, &agg_req)?;

        // Second request: the same aggregations, inserted one by one in another order.
        let mut agg_req2: Aggregations =
            Aggregations::with_capacity_and_hasher(20, Default::default());
        let named_fields = [
            ("tags", "tags"),
            ("fielda", "fielda"),
            ("hosts", "host"),
            ("fieldb", "fieldb"),
        ];
        for (agg_name, field_name) in named_fields {
            agg_req2.insert(
                agg_name.to_string(),
                serde_json::from_value(json!({ "terms": { "field": field_name } }))?,
            );
        }
        // Checking that the key order of both requests really differs is disabled to avoid a
        // flaky test with hashmap changes:
        // assert_ne!(agg_req.keys().next(), agg_req2.keys().next());
        let agg_res2 = search(&index2, &agg_req2)?;

        agg_res.merge_fruits(agg_res2).unwrap();
        let final_result = agg_res.into_final_result(agg_req2, Default::default())?;
        let agg_json = serde_json::to_value(&final_result)?;

        // hosts: counts are doubled because both indexes contain the same documents.
        let hosts = &agg_json["hosts"]["buckets"];
        let expected_hosts = [("192.168.0.10", 8), ("192.168.0.1", 4), ("192.168.0.11", 2)];
        for (rank, &(key, doc_count)) in expected_hosts.iter().enumerate() {
            assert_eq!(hosts[rank]["key"], key);
            assert_eq!(hosts[rank]["doc_count"], doc_count);
        }
        // Implementation currently reports error bounds/other count; ensure zero.
        assert_eq!(agg_json["hosts"]["doc_count_error_upper_bound"], 0);
        assert_eq!(agg_json["hosts"]["sum_other_doc_count"], 0);

        // tags:
        let tags_buckets = &agg_json["tags"]["buckets"];
        let expected_tags = [("nice", 10), ("cool", 4)];
        for (rank, &(key, doc_count)) in expected_tags.iter().enumerate() {
            assert_eq!(tags_buckets[rank]["key"], key);
            assert_eq!(tags_buckets[rank]["doc_count"], doc_count);
        }
        assert_eq!(agg_json["tags"]["doc_count_error_upper_bound"], 0);
        assert_eq!(agg_json["tags"]["sum_other_doc_count"], 0);

        Ok(())
    }
}


================================================
FILE: src/aggregation/bucket/term_missing_agg.rs
================================================
use columnar::{Column, ColumnType};
use rustc_hash::FxHashMap;

use crate::aggregation::agg_data::{
    build_segment_agg_collectors, AggRefNode, AggregationsSegmentCtx,
};
use crate::aggregation::bucket::term_agg::TermsAggregation;
use crate::aggregation::cached_sub_aggs::{CachedSubAggs, HighCardCachedSubAggs};
use crate::aggregation::intermediate_agg_result::{
    IntermediateAggregationResult, IntermediateAggregationResults, IntermediateBucketResult,
    IntermediateKey, IntermediateTermBucketEntry, IntermediateTermBucketResult,
};
use crate::aggregation::segment_agg_result::{BucketIdProvider, SegmentAggregationCollector};
use crate::aggregation::BucketId;

/// Request data for the special aggregation that handles missing values for term aggregations.
/// This missing aggregation will check multiple columns for existence: a document counts as
/// missing only if none of the `accessors` has a value for it.
///
/// This is needed when:
/// - The field is multi-valued and we therefore have multiple columns
/// - The field is not text and missing is provided as string (we cannot use the numeric missing
///   value optimization)
#[derive(Default)]
pub struct MissingTermAggReqData {
    /// The accessors to check for existence of a value. `TermMissingAgg::collect` only
    /// consults the column index of each entry; the `ColumnType` is not read there.
    pub accessors: Vec<(Column<u64>, ColumnType)>,
    /// The name of the aggregation. The collector pushes its intermediate result under this
    /// name.
    pub name: String,
    /// The original terms aggregation request. Its `missing` value becomes the key of the
    /// bucket produced by the collector.
    pub req: TermsAggregation,
}

impl MissingTermAggReqData {
    /// Estimates the memory consumption of this struct in bytes.
    ///
    /// Only the inline size of the struct is reported; heap memory owned by its fields is not
    /// included.
    pub fn get_memory_consumption(&self) -> usize {
        std::mem::size_of_val(self)
    }
}

/// State that `TermMissingAgg` keeps for one parent bucket.
#[derive(Default, Debug, Clone)]
struct MissingCount {
    /// Number of collected documents that had no value in any of the checked accessors.
    missing_count: u32,
    /// Bucket id under which the missing documents are pushed to the sub-aggregations and under
    /// which the sub-aggregation results are requested again.
    bucket_id: BucketId,
}

/// The specialized missing term aggregation.
///
/// Counts, per parent bucket, the documents that have no value in any accessor of the
/// associated `MissingTermAggReqData` and forwards those documents to the optional
/// sub-aggregations.
#[derive(Default, Debug)]
pub struct TermMissingAgg {
    /// Index used to look up the `MissingTermAggReqData` in the segment context.
    accessor_idx: usize,
    /// Cached sub-aggregation collectors; `None` if the aggregation node has no children.
    sub_agg: Option<HighCardCachedSubAggs>,
    /// Idx = parent bucket id, Value = missing count for that bucket
    missing_count_per_bucket: Vec<MissingCount>,
    /// Hands out the bucket ids stored in `missing_count_per_bucket`.
    bucket_id_provider: BucketIdProvider,
}
impl TermMissingAgg {
    /// Creates the collector for the aggregation node `node`.
    ///
    /// Sub-aggregation collectors are only built when the node has children. The per-bucket
    /// counters start out empty and are grown by `prepare_max_bucket`.
    ///
    /// Returns an error if building the sub-aggregation collectors fails.
    pub(crate) fn new(
        agg_data: &mut AggregationsSegmentCtx,
        node: &AggRefNode,
    ) -> crate::Result<Self> {
        let sub_agg = if node.children.is_empty() {
            None
        } else {
            let collectors = build_segment_agg_collectors(agg_data, &node.children)?;
            Some(CachedSubAggs::new(collectors))
        };

        Ok(Self {
            accessor_idx: node.idx_in_req_data,
            sub_agg,
            missing_count_per_bucket: Vec::new(),
            bucket_id_provider: BucketIdProvider::default(),
        })
    }
}

impl SegmentAggregationCollector for TermMissingAgg {
    /// Pushes a terms bucket result with a single entry into `results`: the configured
    /// `missing` key together with the number of missing documents counted for
    /// `parent_bucket_id` and, if sub-aggregations exist, their intermediate results.
    ///
    /// # Panics
    ///
    /// Panics if the terms aggregation request has no `missing` value.
    fn add_intermediate_aggregation_result(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
        results: &mut IntermediateAggregationResults,
        parent_bucket_id: BucketId,
    ) -> crate::Result<()> {
        // Makes sure a counter slot exists for `parent_bucket_id` before it is indexed below.
        self.prepare_max_bucket(parent_bucket_id, agg_data)?;

        let req_data = agg_data.get_missing_term_req_data(self.accessor_idx);
        let missing_key = req_data
            .req
            .missing
            .clone()
            .expect("TermMissingAgg collector, but no missing found in agg req");

        let MissingCount {
            missing_count,
            bucket_id,
        } = self.missing_count_per_bucket[parent_bucket_id as usize].clone();

        // The sub-aggregations were fed under the bucket id of this counter slot.
        let sub_aggregation = match self.sub_agg.as_mut() {
            Some(sub_agg) => {
                let mut sub_results = IntermediateAggregationResults::default();
                sub_agg
                    .get_sub_agg_collector()
                    .add_intermediate_aggregation_result(agg_data, &mut sub_results, bucket_id)?;
                sub_results
            }
            None => IntermediateAggregationResults::default(),
        };

        let missing_entry = IntermediateTermBucketEntry {
            doc_count: missing_count,
            sub_aggregation,
        };
        let entries: FxHashMap<IntermediateKey, IntermediateTermBucketEntry> =
            std::iter::once((missing_key.into(), missing_entry)).collect();

        let terms_result = IntermediateTermBucketResult {
            entries,
            sum_other_doc_count: 0,
            doc_count_error_upper_bound: 0,
        };
        results.push(
            req_data.name.clone(),
            IntermediateAggregationResult::Bucket(IntermediateBucketResult::Terms {
                buckets: terms_result,
            }),
        )?;

        Ok(())
    }

    /// Counts every document of `docs` that has no value in any accessor and forwards it to
    /// the sub-aggregations, if there are any.
    ///
    /// # Panics
    ///
    /// Panics if no counter slot exists for `parent_bucket_id`; slots are created by
    /// `prepare_max_bucket`.
    fn collect(
        &mut self,
        parent_bucket_id: BucketId,
        docs: &[crate::DocId],
        agg_data: &mut AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        let counter = &mut self.missing_count_per_bucket[parent_bucket_id as usize];
        let req_data = agg_data.get_missing_term_req_data(self.accessor_idx);

        for &doc in docs {
            // A document is missing only if none of the columns holds a value for it.
            let is_missing = req_data
                .accessors
                .iter()
                .all(|(column, _)| !column.index.has_value(doc));
            if !is_missing {
                continue;
            }
            counter.missing_count += 1;
            if let Some(sub_agg) = &mut self.sub_agg {
                sub_agg.push(counter.bucket_id, doc);
            }
        }

        if let Some(sub_agg) = &mut self.sub_agg {
            sub_agg.check_flush_local(agg_data)?;
        }
        Ok(())
    }

    /// Grows the per-bucket counters until a slot for `max_bucket` exists. Every new slot
    /// starts with a count of zero and receives a fresh id from the bucket id provider.
    fn prepare_max_bucket(
        &mut self,
        max_bucket: BucketId,
        _agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        // The range is empty if the slot for `max_bucket` already exists.
        for _ in self.missing_count_per_bucket.len()..=max_bucket as usize {
            let bucket_id = self.bucket_id_provider.next_bucket_id();
            self.missing_count_per_bucket.push(MissingCount {
                missing_count: 0,
                bucket_id,
            });
        }
        Ok(())
    }

    /// Flushes the cached sub-aggregations, if there are any.
    fn flush(&mut self, agg_data: &mut AggregationsSegmentCtx) -> crate::Result<()> {
        if let Some(sub_agg) = &mut self.sub_agg {
            sub_agg.flush(agg_data)?;
        }
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use crate::aggregation::agg_req::Aggregations;
    use crate::aggregation::tests::exec_request_with_query;
    use crate::schema::{Schema, FAST};
    use crate::{Index, IndexWriter};

    /// Documents without `json.mixed_type` must be grouped under the string `missing` key while
    /// the path holds numeric, text and bool values; the `sum` sub-aggregation is evaluated on
    /// that bucket.
    #[test]
    fn terms_aggregation_missing_mixed_type_mult_seg_sub_agg() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", FAST);
        let score = schema_builder.add_f64_field("score", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();

        // NOTE: the commits between the groups below are disabled (they were commented out), so
        // all documents are written by the single commit at the end.

        // Group with a numeric value.
        index_writer
            .add_document(doc!(score => 1.0, json_field => json!({"mixed_type": 10.0})))
            .unwrap();
        index_writer.add_document(doc!(score => 5.0))?;

        // Group with a text value.
        index_writer
            .add_document(doc!(score => 1.0, json_field => json!({"mixed_type": "blue"})))
            .unwrap();
        index_writer.add_document(doc!(score => 5.0))?;

        // Group with mixed values.
        for mixed_value in [json!("red"), json!(-20.5), json!(true)] {
            index_writer.add_document(doc!(json_field => json!({"mixed_type": mixed_value})))?;
        }
        index_writer.add_document(doc!(score => 5.0))?;

        index_writer.commit().unwrap();

        let request = json!({
            "replace_null": {
                "terms": {
                    "field": "json.mixed_type",
                    "missing": "NULL"
                },
                "aggs": {
                    "sum_score": {
                        "sum": { "field": "score" }
                    }
                }
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();
        let res = exec_request_with_query(agg_req, &index, None)?;

        // Three documents have no `mixed_type`, each with a score of 5.0.
        let null_bucket = &res["replace_null"]["buckets"][0];
        assert_eq!(null_bucket["key"], "NULL");
        assert_eq!(null_bucket["doc_count"], 3);
        assert_eq!(null_bucket["sum_score"]["value"], 15.0);
        assert_eq!(res["replace_null"]["sum_other_doc_count"], 0);
        assert_eq!(res["replace_null"]["doc_count_error_upper_bound"], 0);

        Ok(())
    }

    /// The `missing` bucket with a `sum` sub-aggregation when a single commit holds one
    /// document with a numeric `json.mixed_type` and two documents without it.
    #[test]
    fn terms_aggregation_missing_mixed_type_sub_agg_reg1() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", FAST);
        let score = schema_builder.add_f64_field("score", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();

        // One document with a numeric value, then two documents without the JSON path.
        index_writer
            .add_document(doc!(score => 1.0, json_field => json!({"mixed_type": 10.0})))?;
        for _ in 0..2 {
            index_writer.add_document(doc!(score => 5.0))?;
        }
        index_writer.commit().unwrap();

        let request = json!({
            "replace_null": {
                "terms": {
                    "field": "json.mixed_type",
                    "missing": "NULL"
                },
                "aggs": {
                    "sum_score": {
                        "sum": { "field": "score" }
                    }
                }
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();
        let res = exec_request_with_query(agg_req, &index, None)?;

        // Two documents have no `mixed_type`, each with a score of 5.0.
        let null_bucket = &res["replace_null"]["buckets"][0];
        assert_eq!(null_bucket["key"], "NULL");
        assert_eq!(null_bucket["doc_count"], 2);
        assert_eq!(null_bucket["sum_score"]["value"], 10.0);
        assert_eq!(res["replace_null"]["sum_other_doc_count"], 0);
        assert_eq!(res["replace_null"]["doc_count_error_upper_bound"], 0);

        Ok(())
    }

    /// The aggregated field `json.mixed_type` is not part of the schema and the documents are
    /// spread over three commits: every document must end up in the `missing` bucket.
    #[test]
    fn terms_aggregation_missing_mult_seg_empty() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let score = schema_builder.add_f64_field("score", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();

        // One document per commit.
        for _ in 0..3 {
            index_writer.add_document(doc!(score => 5.0))?;
            index_writer.commit().unwrap();
        }

        let request = json!({
            "replace_null": {
                "terms": {
                    "field": "json.mixed_type",
                    "missing": "NULL"
                },
                "aggs": {
                    "sum_score": {
                        "sum": { "field": "score" }
                    }
                }
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();
        let res = exec_request_with_query(agg_req, &index, None)?;

        // All three documents are missing, each with a score of 5.0.
        let null_bucket = &res["replace_null"]["buckets"][0];
        assert_eq!(null_bucket["key"], "NULL");
        assert_eq!(null_bucket["doc_count"], 3);
        assert_eq!(null_bucket["sum_score"]["value"], 15.0);
        assert_eq!(res["replace_null"]["sum_other_doc_count"], 0);
        assert_eq!(res["replace_null"]["doc_count_error_upper_bound"], 0);

        Ok(())
    }

    /// The aggregated field `json.mixed_type` is not part of the schema and all documents are
    /// written by one commit: every document must end up in the `missing` bucket.
    #[test]
    fn terms_aggregation_missing_single_seg_empty() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let score = schema_builder.add_f64_field("score", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();

        // Three documents, one commit.
        for _ in 0..3 {
            index_writer.add_document(doc!(score => 5.0))?;
        }
        index_writer.commit().unwrap();

        let request = json!({
            "replace_null": {
                "terms": {
                    "field": "json.mixed_type",
                    "missing": "NULL"
                },
                "aggs": {
                    "sum_score": {
                        "sum": { "field": "score" }
                    }
                }
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();
        let res = exec_request_with_query(agg_req, &index, None)?;

        // All three documents are missing, each with a score of 5.0.
        let null_bucket = &res["replace_null"]["buckets"][0];
        assert_eq!(null_bucket["key"], "NULL");
        assert_eq!(null_bucket["doc_count"], 3);
        assert_eq!(null_bucket["sum_score"]["value"], 15.0);
        assert_eq!(res["replace_null"]["sum_other_doc_count"], 0);
        assert_eq!(res["replace_null"]["doc_count_error_upper_bound"], 0);

        Ok(())
    }

    // A JSON path holding numbers, strings and a bool, written in three commits. Each commit
    // also contains one document without the path; those three documents are expected in the
    // `missing` bucket, for a string as well as for a numeric `missing` value.
    #[test]
    fn terms_aggregation_missing_mixed_type_mult_seg() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let json_field = builder.add_json_field("json", FAST);
        let index = Index::create_in_ram(builder.build());
        let mut writer: IndexWriter = index.writer_for_tests().unwrap();

        // Values written per commit: numeric only, text only, then a mix of types.
        let commits = [
            vec![json!({"mixed_type": 10.0})],
            vec![json!({"mixed_type": "blue"})],
            vec![
                json!({"mixed_type": "red"}),
                json!({"mixed_type": -20.5}),
                json!({"mixed_type": true}),
            ],
        ];
        for values in commits {
            for value in values {
                writer.add_document(doc!(json_field => value)).unwrap();
            }
            // One document per commit that lacks the aggregated path.
            writer.add_document(doc!())?;
            writer.commit().unwrap();
        }

        let request: Aggregations = serde_json::from_value(json!({
            "replace_null": {
                "terms": {
                    "field": "json.mixed_type",
                    "missing": "NULL"
                },
            },
            "replace_num": {
                "terms": {
                    "field": "json.mixed_type",
                    "missing": 1337
                },
            },
        }))
        .unwrap();

        let response = exec_request_with_query(request, &index, None)?;
        let with_str = &response["replace_null"];
        let with_num = &response["replace_num"];

        // The three documents without the path are reported under the `missing` key.
        assert_eq!(with_str["buckets"][0]["key"], "NULL");
        assert_eq!(with_str["buckets"][0]["doc_count"], 3);
        assert_eq!(with_num["buckets"][0]["key"], 1337.0);
        assert_eq!(with_num["buckets"][0]["doc_count"], 3);
        assert_eq!(with_str["sum_other_doc_count"], 0);
        assert_eq!(with_str["doc_count_error_upper_bound"], 0);

        Ok(())
    }

    // The JSON path only ever holds numbers, while the `missing` replacement is a string. The
    // three documents without the path are expected under the string key.
    #[test]
    fn terms_aggregation_missing_str_on_numeric_field() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let json_field = builder.add_json_field("json", FAST);
        let index = Index::create_in_ram(builder.build());
        let mut writer: IndexWriter = index.writer_for_tests().unwrap();

        // `Some(n)` writes a document with a numeric value, `None` a document without the path.
        // Everything goes into a single commit.
        let documents = [Some(10.0), None, None, Some(-20.5), None];
        for maybe_number in documents {
            match maybe_number {
                Some(number) => writer
                    .add_document(doc!(json_field => json!({"mixed_type": number})))
                    .unwrap(),
                None => writer.add_document(doc!())?,
            };
        }
        writer.commit().unwrap();

        let request: Aggregations = serde_json::from_value(json!({
            "replace_null": {
                "terms": {
                    "field": "json.mixed_type",
                    "missing": "NULL"
                },
            },
        }))
        .unwrap();

        let response = exec_request_with_query(request, &index, None)?;
        let agg = &response["replace_null"];

        // The three documents without the path are reported under the `missing` key.
        assert_eq!(agg["buckets"][0]["key"], "NULL");
        assert_eq!(agg["buckets"][0]["doc_count"], 3);
        assert_eq!(agg["sum_other_doc_count"], 0);
        assert_eq!(agg["doc_count_error_upper_bound"], 0);

        Ok(())
    }

    // Same documents as the multi-commit mixed-type test, but written in one single commit: the
    // JSON path holds numbers, strings and a bool, and three documents lack the path entirely.
    #[test]
    fn terms_aggregation_missing_mixed_type_one_seg() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let json_field = builder.add_json_field("json", FAST);
        let index = Index::create_in_ram(builder.build());
        let mut writer: IndexWriter = index.writer_for_tests().unwrap();

        // Each group of values is followed by one document without the aggregated path.
        let groups = [
            vec![json!({"mixed_type": 10.0})],
            vec![json!({"mixed_type": "blue"})],
            vec![
                json!({"mixed_type": "red"}),
                json!({"mixed_type": -20.5}),
                json!({"mixed_type": true}),
            ],
        ];
        for values in groups {
            for value in values {
                writer.add_document(doc!(json_field => value)).unwrap();
            }
            writer.add_document(doc!())?;
        }
        writer.commit().unwrap();

        let request: Aggregations = serde_json::from_value(json!({
            "replace_null": {
                "terms": {
                    "field": "json.mixed_type",
                    "missing": "NULL"
                },
            },
        }))
        .unwrap();

        let response = exec_request_with_query(request, &index, None)?;
        let agg = &response["replace_null"];

        // The three documents without the path are reported under the `missing` key.
        assert_eq!(agg["buckets"][0]["key"], "NULL");
        assert_eq!(agg["buckets"][0]["doc_count"], 3);
        assert_eq!(agg["sum_other_doc_count"], 0);
        assert_eq!(agg["doc_count_error_upper_bound"], 0);

        Ok(())
    }
}


================================================
FILE: src/aggregation/cached_sub_aggs.rs
================================================
use std::fmt::Debug;

use super::segment_agg_result::SegmentAggregationCollector;
use crate::aggregation::agg_data::AggregationsSegmentCtx;
use crate::aggregation::bucket::MAX_NUM_TERMS_FOR_VEC;
use crate::aggregation::BucketId;
use crate::DocId;

/// A cache for sub-aggregations, storing doc ids per bucket id.
/// Depending on the cardinality of the parent aggregation, we use different
/// storage strategies (see the `SubAggCache` implementations in this file).
///
/// ## Low Cardinality
/// Cardinality here refers to the number of unique flattened buckets that can be created
/// by the parent aggregation.
/// Flattened buckets are the result of combining all buckets per collector
/// into a single list of buckets, where each bucket is identified by its BucketId.
///
/// ## Usage
/// Since this is caching for sub-aggregations, it is used by bucket aggregations. The root
/// segment collector uses it as well and feeds every document into bucket `0`.
///
/// Documents are buffered with `push`. `check_flush_local` hands the buffered documents to the
/// wrapped collector once `FLUSH_THRESHOLD` documents have been pushed, and `flush` does so
/// unconditionally before flushing the wrapped collector itself.
///
/// TODO: consider using a more advanced data structure for high cardinality
/// aggregations.
/// What this data structure does in general is to group docs by bucket id.
#[derive(Debug)]
pub(crate) struct CachedSubAggs<C: SubAggCache> {
    /// Buffer of `(bucket id, doc id)` pairs that were pushed but not yet collected.
    cache: C,
    /// The sub-aggregation collector that receives the buffered documents on flush.
    sub_agg_collector: Box<dyn SegmentAggregationCollector>,
    /// Number of documents pushed since the cache was last flushed.
    num_docs: usize,
}

/// `CachedSubAggs` backed by `LowCardSubAggCache`, which keeps one doc id buffer per bucket id.
pub type LowCardCachedSubAggs = CachedSubAggs<LowCardSubAggCache>;
/// `CachedSubAggs` backed by `HighCardSubAggCache`, which spreads the bucket ids over a fixed
/// number of partitions.
pub type HighCardCachedSubAggs = CachedSubAggs<HighCardSubAggCache>;

/// Number of buffered documents at which `CachedSubAggs::check_flush_local` flushes the cache.
const FLUSH_THRESHOLD: usize = 2048;

/// A trait for caching sub-aggregation doc ids per bucket id.
/// Different implementations can be used depending on the cardinality
/// of the parent aggregation.
pub trait SubAggCache: Debug {
    /// Creates an empty cache.
    fn new() -> Self;
    /// Buffers `doc_id` as belonging to `bucket_id`.
    fn push(&mut self, bucket_id: BucketId, doc_id: DocId);
    /// Hands buffered documents over to `sub_agg`.
    ///
    /// `force` is `true` for the final flush (`CachedSubAggs::flush`) and `false` for the
    /// threshold-triggered flush (`CachedSubAggs::check_flush_local`). The caller resets its
    /// document counter after every successful call, and both implementations in this file
    /// empty the cache before returning `Ok`.
    ///
    /// # Errors
    /// Propagates any error returned by the sub-aggregation collector.
    fn flush_local(
        &mut self,
        sub_agg: &mut Box<dyn SegmentAggregationCollector>,
        agg_data: &mut AggregationsSegmentCtx,
        force: bool,
    ) -> crate::Result<()>;
}

impl<Backend: SubAggCache + Debug> CachedSubAggs<Backend> {
    /// Wraps `sub_agg` together with an empty cache of the chosen backend.
    pub fn new(sub_agg: Box<dyn SegmentAggregationCollector>) -> Self {
        let cache = Backend::new();
        Self {
            cache,
            sub_agg_collector: sub_agg,
            num_docs: 0,
        }
    }

    /// Gives direct access to the wrapped sub-aggregation collector, bypassing the cache.
    pub fn get_sub_agg_collector(&mut self) -> &mut Box<dyn SegmentAggregationCollector> {
        &mut self.sub_agg_collector
    }

    /// Buffers `doc_id` for `bucket_id` and counts it towards the flush threshold.
    #[inline]
    pub fn push(&mut self, bucket_id: BucketId, doc_id: DocId) {
        self.num_docs += 1;
        self.cache.push(bucket_id, doc_id);
    }

    /// Flushes the cache to the wrapped collector, but only once at least `FLUSH_THRESHOLD`
    /// documents have been buffered. Below the threshold this is a no-op.
    pub fn check_flush_local(
        &mut self,
        agg_data: &mut AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        if self.num_docs < FLUSH_THRESHOLD {
            return Ok(());
        }
        let Self {
            cache,
            sub_agg_collector,
            num_docs,
        } = self;
        cache.flush_local(sub_agg_collector, agg_data, false)?;
        *num_docs = 0;
        Ok(())
    }

    /// Forces out everything that is still buffered and then flushes the wrapped collector.
    ///
    /// Note: this _does_ flush the sub aggregations.
    pub fn flush(&mut self, agg_data: &mut AggregationsSegmentCtx) -> crate::Result<()> {
        let has_buffered_docs = self.num_docs != 0;
        if has_buffered_docs {
            self.cache
                .flush_local(&mut self.sub_agg_collector, agg_data, true)?;
            self.num_docs = 0;
        }
        self.sub_agg_collector.flush(agg_data)?;
        Ok(())
    }
}

/// Number of partitions for high cardinality sub-aggregation cache.
/// A bucket id is assigned to the partition `bucket_id % NUM_PARTITIONS`.
const NUM_PARTITIONS: usize = 16;

/// Sub-aggregation cache for parent aggregations that are not treated as low cardinality.
/// Buffered docs are spread over a fixed number of partitions instead of one buffer per bucket.
#[derive(Debug)]
pub(crate) struct HighCardSubAggCache {
    /// This partitioning is used to do some cheap grouping on the bucket ids.
    /// Bucket ids are dense, e.g. when we don't detect the cardinality as low cardinality,
    /// but there are just 16 bucket ids, each bucket id will go to its own partition.
    ///
    /// We want to keep this cheap, because high cardinality aggregations can have a lot of
    /// buckets, and there may be nothing to group.
    partitions: Box<[PartitionEntry; NUM_PARTITIONS]>,
}

impl HighCardSubAggCache {
    #[inline]
    fn clear(&mut self) {
        for partition in self.partitions.iter_mut() {
            partition.clear();
        }
    }
}

/// The documents buffered in one partition, stored as two parallel vectors:
/// `docs[i]` was pushed for bucket `bucket_ids[i]`.
#[derive(Debug, Clone, Default)]
struct PartitionEntry {
    bucket_ids: Vec<BucketId>,
    docs: Vec<DocId>,
}

impl PartitionEntry {
    /// Removes all buffered entries from both vectors.
    #[inline]
    fn clear(&mut self) {
        let Self { bucket_ids, docs } = self;
        bucket_ids.clear();
        docs.clear();
    }
}

impl SubAggCache for HighCardSubAggCache {
    fn new() -> Self {
        Self {
            partitions: Box::new(core::array::from_fn(|_| PartitionEntry::default())),
        }
    }

    fn push(&mut self, bucket_id: BucketId, doc_id: DocId) {
        let idx = bucket_id % NUM_PARTITIONS as u32;
        let slot = &mut self.partitions[idx as usize];
        slot.bucket_ids.push(bucket_id);
        slot.docs.push(doc_id);
    }

    fn flush_local(
        &mut self,
        sub_agg: &mut Box<dyn SegmentAggregationCollector>,
        agg_data: &mut AggregationsSegmentCtx,
        _force: bool,
    ) -> crate::Result<()> {
        let mut max_bucket = 0u32;
        for partition in self.partitions.iter() {
            if let Some(&local_max) = partition.bucket_ids.iter().max() {
                max_bucket = max_bucket.max(local_max);
            }
        }

        sub_agg.prepare_max_bucket(max_bucket, agg_data)?;

        for slot in self.partitions.iter() {
            if !slot.bucket_ids.is_empty() {
                // Reduce dynamic dispatch overhead by collecting a full partition in one call.
                sub_agg.collect_multiple(&slot.bucket_ids, &slot.docs, agg_data)?;
            }
        }

        self.clear();
        Ok(())
    }
}

/// Sub-aggregation cache for low cardinality parent aggregations: one doc id buffer per
/// bucket id.
#[derive(Debug)]
pub(crate) struct LowCardSubAggCache {
    /// Cache doc ids per bucket for sub-aggregations.
    ///
    /// The outer Vec is indexed by BucketId.
    per_bucket_docs: Vec<Vec<DocId>>,
}

impl LowCardSubAggCache {
    /// Empties every per-bucket buffer. The outer vector keeps its length, so bucket ids seen
    /// so far remain valid indices.
    #[inline]
    fn clear(&mut self) {
        self.per_bucket_docs.iter_mut().for_each(Vec::clear);
    }
}

impl SubAggCache for LowCardSubAggCache {
    /// Creates an empty cache. The per-bucket buffers are created on demand by `push`.
    fn new() -> Self {
        Self {
            per_bucket_docs: Vec::new(),
        }
    }

    /// Appends `doc_id` to the buffer of `bucket_id`, growing the outer vector first if
    /// `bucket_id` is not yet a valid index.
    fn push(&mut self, bucket_id: BucketId, doc_id: DocId) {
        let idx = bucket_id as usize;
        if self.per_bucket_docs.len() <= idx {
            self.per_bucket_docs.resize_with(idx + 1, Vec::new);
        }
        self.per_bucket_docs[idx].push(doc_id);
    }

    /// Hands every buffered doc id to `sub_agg`, one `collect` call per non-empty bucket, and
    /// then empties the cache.
    ///
    /// Every non-empty bucket is collected, whether or not the flush is forced. Skipping
    /// buckets below a per-bucket threshold is not safe here:
    /// * the cache is emptied as a whole at the end, so skipped documents would be dropped
    ///   without ever reaching the sub-aggregation, and
    /// * `CachedSubAggs` resets its document counter after every flush and skips the final
    ///   cache flush when that counter is zero, so documents kept back could be lost as well.
    ///
    /// # Errors
    /// Propagates any error returned by `sub_agg`. In that case the cache is left untouched.
    fn flush_local(
        &mut self,
        sub_agg: &mut Box<dyn SegmentAggregationCollector>,
        agg_data: &mut AggregationsSegmentCtx,
        _force: bool,
    ) -> crate::Result<()> {
        const _: () = {
            // MAX_NUM_TERMS_FOR_VEC threshold is used for term aggregations
            // Note: There may be other flexible values, for other aggregations, but we can use the
            // const value here as an upper bound. (better than nothing)
            //
            // Compile-time check that a flush of FLUSH_THRESHOLD docs spread over that many
            // buckets still averages at least two docs per bucket.
            let bucket_threshold_limit = FLUSH_THRESHOLD / (MAX_NUM_TERMS_FOR_VEC as usize * 2);
            assert!(
                bucket_threshold_limit > 0,
                "Bucket threshold must be greater than 0"
            );
        };

        // Pre-aggregated: call collect per bucket.
        let max_bucket = (self.per_bucket_docs.len() as BucketId).saturating_sub(1);
        sub_agg.prepare_max_bucket(max_bucket, agg_data)?;

        for (bucket_id, docs) in self
            .per_bucket_docs
            .iter()
            .enumerate()
            .filter(|(_, docs)| !docs.is_empty())
        {
            sub_agg.collect(bucket_id as BucketId, docs, agg_data)?;
        }

        self.clear();
        Ok(())
    }
}


================================================
FILE: src/aggregation/collector.rs
================================================
use super::agg_req::Aggregations;
use super::agg_result::AggregationResults;
use super::cached_sub_aggs::LowCardCachedSubAggs;
use super::intermediate_agg_result::IntermediateAggregationResults;
use super::AggContextParams;
// group buffering strategy is chosen explicitly by callers; no need to hash-group on the fly.
use crate::aggregation::agg_data::{
    build_aggregations_data_from_req, build_segment_agg_collectors_root, AggregationsSegmentCtx,
};
use crate::collector::{Collector, SegmentCollector};
use crate::index::SegmentReader;
use crate::{DocId, SegmentOrdinal, TantivyError};

/// The default maximum number of buckets. An aggregation exceeding it fails.
pub const DEFAULT_BUCKET_LIMIT: u32 = 65000;

/// The default memory limit in bytes (500 MB, i.e. 500 * 10^6 bytes). An aggregation exceeding
/// it fails.
pub const DEFAULT_MEMORY_LIMIT: u64 = 500_000_000;

/// Collector for aggregations.
///
/// The collector collects all aggregations by the underlying aggregation request and returns
/// the final `AggregationResults`.
pub struct AggregationCollector {
    /// The aggregation request to execute.
    agg: Aggregations,
    /// Context parameters handed to every segment collector; includes the aggregation limits.
    context: AggContextParams,
}

impl AggregationCollector {
    /// Create collector from aggregation request.
    ///
    /// Aggregation fails when the limits in `AggregationLimits` are exceeded (memory limit and
    /// bucket limit).
    pub fn from_aggs(agg: Aggregations, context: AggContextParams) -> Self {
        Self { agg, context }
    }
}

/// Collector for distributed aggregations.
///
/// The collector collects all aggregations by the underlying aggregation request.
///
/// # Purpose
/// `DistributedAggregationCollector` returns `IntermediateAggregationResults` and not the final
/// `AggregationResults`, so that results from different indices can be merged and then converted
/// into the final `AggregationResults` via the `into_final_result()` method.
pub struct DistributedAggregationCollector {
    /// The aggregation request to execute.
    agg: Aggregations,
    /// Context parameters handed to every segment collector.
    context: AggContextParams,
}

impl DistributedAggregationCollector {
    /// Create collector from aggregation request.
    ///
    /// Aggregation fails when the limits in `AggregationLimits` are exceeded (memory limit and
    /// bucket limit).
    pub fn from_aggs(agg: Aggregations, context: AggContextParams) -> Self {
        Self { agg, context }
    }
}

impl Collector for DistributedAggregationCollector {
    type Fruit = IntermediateAggregationResults;
    type Child = AggregationSegmentCollector;

    /// Builds the segment collector for `reader` from the stored request and context.
    fn for_segment(
        &self,
        segment_local_id: crate::SegmentOrdinal,
        reader: &crate::SegmentReader,
    ) -> crate::Result<Self::Child> {
        let Self { agg, context } = self;
        AggregationSegmentCollector::from_agg_req_and_reader(agg, reader, segment_local_id, context)
    }

    /// Aggregations never need scores.
    fn requires_scoring(&self) -> bool {
        false
    }

    /// Merges the per-segment results, but keeps them in their intermediate (mergeable) form.
    fn merge_fruits(
        &self,
        segment_fruits: Vec<crate::Result<IntermediateAggregationResults>>,
    ) -> crate::Result<Self::Fruit> {
        merge_fruits(segment_fruits)
    }
}

impl Collector for AggregationCollector {
    type Fruit = AggregationResults;

    type Child = AggregationSegmentCollector;

    fn for_segment(
        &self,
        segment_local_id: crate::SegmentOrdinal,
        reader: &crate::SegmentReader,
    ) -> crate::Result<Self::Child> {
        AggregationSegmentCollector::from_agg_req_and_reader(
            &self.agg,
            reader,
            segment_local_id,
            &self.context,
        )
    }

    fn requires_scoring(&self) -> bool {
        false
    }

    fn merge_fruits(
        &self,
        segment_fruits: Vec<<Self::Child as SegmentCollector>::Fruit>,
    ) -> crate::Result<Self::Fruit> {
        let res = merge_fruits(segment_fruits)?;
        res.into_final_result(self.agg.clone(), self.context.limits.clone())
    }
}

/// Merges the per-segment results into one intermediate result.
///
/// The last element serves as the accumulator; the remaining ones are merged into it in their
/// original order. An empty input yields the default (empty) result.
///
/// # Errors
/// Returns the error of the last element first, otherwise the first error met while merging.
fn merge_fruits(
    mut segment_fruits: Vec<crate::Result<IntermediateAggregationResults>>,
) -> crate::Result<IntermediateAggregationResults> {
    let accumulator = match segment_fruits.pop() {
        Some(last) => last?,
        None => return Ok(IntermediateAggregationResults::default()),
    };
    segment_fruits.into_iter().try_fold(
        accumulator,
        |mut merged, next| -> crate::Result<IntermediateAggregationResults> {
            merged.merge_fruits(next?)?;
            Ok(merged)
        },
    )
}

/// `AggregationSegmentCollector` does the aggregation collection on a segment.
pub struct AggregationSegmentCollector {
    /// Per-segment aggregation context that is passed to every collector call.
    aggs_with_accessor: AggregationsSegmentCtx,
    /// The root collector, wrapped in a cache. All documents are collected into bucket `0`.
    agg_collector: LowCardCachedSubAggs,
    /// First error met during collection. Once set, further documents are ignored and the
    /// error is returned by `harvest`.
    error: Option<TantivyError>,
}

impl AggregationSegmentCollector {
    /// Creates an `AggregationSegmentCollector` from an [`Aggregations`] request and a segment
    /// reader. Also includes validation, e.g. checking field types and existence.
    ///
    /// # Errors
    /// Fails if the segment context or the root collector cannot be built, or if preparing
    /// bucket `0` fails.
    pub fn from_agg_req_and_reader(
        agg: &Aggregations,
        reader: &SegmentReader,
        segment_ordinal: SegmentOrdinal,
        context: &AggContextParams,
    ) -> crate::Result<Self> {
        let mut segment_ctx =
            build_aggregations_data_from_req(agg, reader, segment_ordinal, context.clone())?;
        let root_collector = build_segment_agg_collectors_root(&mut segment_ctx)?;
        let mut cached_root = LowCardCachedSubAggs::new(root_collector);

        // The root level only ever uses bucket zero, so prepare it up front.
        cached_root
            .get_sub_agg_collector()
            .prepare_max_bucket(0, &segment_ctx)?;

        Ok(Self {
            aggs_with_accessor: segment_ctx,
            agg_collector: cached_root,
            error: None,
        })
    }
}

impl SegmentCollector for AggregationSegmentCollector {
    type Fruit = crate::Result<IntermediateAggregationResults>;

    /// Buffers a single document for bucket `0` and flushes the buffer once it is full.
    /// After the first error, all further documents are ignored.
    #[inline]
    fn collect(&mut self, doc: DocId, _score: crate::Score) {
        if self.error.is_some() {
            return;
        }
        self.agg_collector.push(0, doc);
        let flushed = self
            .agg_collector
            .check_flush_local(&mut self.aggs_with_accessor);
        if let Err(err) = flushed {
            self.error = Some(err);
        }
    }

    /// Passes a whole block of documents straight to the root collector (bucket `0`), without
    /// going through the buffer. After the first error, all further blocks are ignored.
    fn collect_block(&mut self, docs: &[DocId]) {
        if self.error.is_some() {
            return;
        }

        let collected = self.agg_collector.get_sub_agg_collector().collect(
            0,
            docs,
            &mut self.aggs_with_accessor,
        );
        if let Err(err) = collected {
            self.error = Some(err);
        }
    }

    /// Returns the error recorded during collection, if any. Otherwise flushes everything that
    /// is still buffered and extracts the intermediate result of bucket `0`.
    fn harvest(mut self) -> Self::Fruit {
        if let Some(err) = self.error.take() {
            return Err(err);
        }
        self.agg_collector.flush(&mut self.aggs_with_accessor)?;

        let mut intermediate = IntermediateAggregationResults::default();
        let root_collector = self.agg_collector.get_sub_agg_collector();
        root_collector.add_intermediate_aggregation_result(
            &self.aggs_with_accessor,
            &mut intermediate,
            0,
        )?;

        Ok(intermediate)
    }
}


================================================
FILE: src/aggregation/date.rs
================================================
use time::format_description::well_known::Rfc3339;
use time::OffsetDateTime;

use crate::TantivyError;

/// Formats `val`, interpreted as nanoseconds since the Unix epoch, as an RFC 3339 string.
///
/// # Errors
/// Returns `TantivyError::InvalidArgument` if `val` cannot be converted to an
/// `OffsetDateTime` or if the date cannot be serialized.
pub(crate) fn format_date(val: i64) -> crate::Result<String> {
    let datetime = match OffsetDateTime::from_unix_timestamp_nanos(i128::from(val)) {
        Ok(datetime) => datetime,
        Err(err) => {
            return Err(TantivyError::InvalidArgument(format!(
                "Could not convert {val:?} to OffsetDateTime, err {err:?}"
            )));
        }
    };
    datetime
        .format(&Rfc3339)
        .map_err(|_| TantivyError::InvalidArgument("Could not serialize date".to_string()))
}


================================================
FILE: src/aggregation/error.rs
================================================
use common::ByteCount;

use super::bucket::DateHistogramParseError;

/// Errors that may occur while validating or executing an aggregation.
#[derive(Debug, Clone, PartialEq, Eq, Error)]
pub enum AggregationError {
    /// Internal error during aggregation, carrying a description
    #[error("InternalError: {0:?}")]
    InternalError(String),
    /// Invalid Aggregation Request
    #[error("InvalidRequest: {0:?}")]
    InvalidRequest(String),
    /// Date histogram parse error
    #[error("Date histogram parse error: {0:?}")]
    DateHistogramParseError(#[from] DateHistogramParseError),
    /// Memory limit exceeded
    #[error(
        "Aborting aggregation because memory limit was exceeded. Limit: {limit:?}, Current: \
         {current:?}"
    )]
    MemoryExceeded {
        /// Memory consumption limit
        limit: ByteCount,
        /// Current memory consumption
        current: ByteCount,
    },
    /// Bucket limit exceeded
    #[error(
        "Aborting aggregation because bucket limit was exceeded. Limit: {limit:?}, Current: \
         {current:?}"
    )]
    BucketLimitExceeded {
        /// Bucket limit
        limit: u32,
        /// Current num buckets
        current: u32,
    },
}


================================================
FILE: src/aggregation/intermediate_agg_result.rs
================================================
//! Contains the intermediate aggregation tree, that can be merged.
//! Intermediate aggregation results can be used to merge results between segments or between
//! indices.

use std::cmp::Ordering;
use std::collections::hash_map::Entry;
use std::hash::Hash;
use std::net::Ipv6Addr;

use columnar::ColumnType;
use itertools::Itertools;
use rustc_hash::FxHashMap;
use serde::{Deserialize, Serialize};

use super::agg_req::{Aggregation, AggregationVariants, Aggregations};
use super::agg_result::{AggregationResult, BucketResult, MetricResult, RangeBucketEntry};
use super::bucket::{
    composite_intermediate_key_ordering, cut_off_buckets, get_agg_name_and_property,
    intermediate_histogram_buckets_to_final_buckets, CompositeAggregation, GetDocCount,
    MissingOrder, Order, OrderTarget, RangeAggregation, TermsAggregation,
};
use super::metric::{
    IntermediateAverage, IntermediateCount, IntermediateExtendedStats, IntermediateMax,
    IntermediateMin, IntermediateStats, IntermediateSum, PercentilesCollector, TopHitsTopNComputer,
};
use super::segment_agg_result::AggregationLimitsGuard;
use super::{format_date, AggregationError, Key, SerializedKey};
use crate::aggregation::agg_result::{
    AggregationResults, BucketEntries, BucketEntry, CompositeBucketEntry, FilterBucketResult,
};
use crate::aggregation::bucket::TermsAggregationInternal;
use crate::aggregation::metric::CardinalityCollector;
use crate::TantivyError;

/// Contains the intermediate aggregation result, which is optimized to be merged with other
/// intermediate results.
///
/// Notice: This struct should not be de/serialized via JSON format.
#[derive(Default, Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct IntermediateAggregationResults {
    /// The intermediate result of each aggregation, keyed by a `String` (see `push` and `get`).
    pub(crate) aggs_res: FxHashMap<String, IntermediateAggregationResult>,
}

#[derive(Clone, Debug, Serialize, Deserialize, PartialOrd, PartialEq)]
/// The key to identify a bucket.
/// This might seem redundant with `Key`, but the point is to have a different
/// Serialize implementation.
///
/// Unlike `Key`, it has dedicated variants for IP addresses and bools. When converted into a
/// `Key`, these become a string and a `u64` respectively.
pub enum IntermediateKey {
    /// Ip Addr key
    IpAddr(Ipv6Addr),
    /// Bool key
    Bool(bool),
    /// String key
    Str(String),
    /// `f64` key
    F64(f64),
    /// `i64` key
    I64(i64),
    /// `u64` key
    U64(u64),
}
impl From<Key> for IntermediateKey {
    fn from(value: Key) -> Self {
        match value {
            Key::Str(s) => Self::Str(s),
            Key::F64(f) => Self::F64(f),
            Key::U64(f) => Self::U64(f),
            Key::I64(f) => Self::I64(f),
        }
    }
}
impl From<IntermediateKey> for Key {
    fn from(value: IntermediateKey) -> Self {
        match value {
            IntermediateKey::Str(s) => Self::Str(s),
            IntermediateKey::IpAddr(s) => {
                // Prefer to use the IPv4 representation if possible
                if let Some(ip) = s.to_ipv4_mapped() {
                    Self::Str(ip.to_string())
                } else {
                    Self::Str(s.to_string())
                }
            }
            IntermediateKey::F64(f) => Self::F64(f),
            IntermediateKey::Bool(f) => Self::U64(f as u64),
            IntermediateKey::U64(f) => Self::U64(f),
            IntermediateKey::I64(f) => Self::I64(f),
        }
    }
}

// `Eq` cannot be derived because of the `f64` payload of `F64`, so it is asserted manually.
// NOTE(review): under the derived `PartialEq`, an `F64` key holding NaN is not equal to
// itself, so such a key would not behave like a regular map key.
impl Eq for IntermediateKey {}

impl std::fmt::Display for IntermediateKey {
    /// Writes the payload of the key using its default `Display` formatting.
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        match self {
            IntermediateKey::Str(text) => f.write_str(text),
            IntermediateKey::F64(float) => write!(f, "{float}"),
            IntermediateKey::U64(unsigned) => write!(f, "{unsigned}"),
            IntermediateKey::I64(signed) => write!(f, "{signed}"),
            IntermediateKey::Bool(flag) => write!(f, "{flag}"),
            IntermediateKey::IpAddr(addr) => write!(f, "{addr}"),
        }
    }
}

impl std::hash::Hash for IntermediateKey {
    /// Hashes the variant discriminant followed by the payload.
    ///
    /// `f64` payloads are hashed through their bit pattern. `0.0` and `-0.0` compare equal
    /// under the derived `PartialEq` but have different bit patterns, so the zero sign is
    /// canonicalised first. Otherwise two equal keys could hash differently, which breaks the
    /// `Hash`/`Eq` contract that hash maps rely on.
    fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
        core::mem::discriminant(self).hash(state);
        match self {
            IntermediateKey::Str(text) => text.hash(state),
            IntermediateKey::F64(val) => {
                // `*val == 0.0` is true for both zeroes; map them onto `+0.0`.
                let canonical = if *val == 0.0 { 0.0f64 } else { *val };
                canonical.to_bits().hash(state)
            }
            IntermediateKey::U64(val) => val.hash(state),
            IntermediateKey::I64(val) => val.hash(state),
            IntermediateKey::Bool(val) => val.hash(state),
            IntermediateKey::IpAddr(val) => val.hash(state),
        }
    }
}

impl IntermediateAggregationResults {
    /// Returns a reference to the intermediate aggregation result for the given key.
    ///
    /// Returns `None` when no result is stored under `key`.
    pub fn get(&self, key: &str) -> Option<&IntermediateAggregationResult> {
        self.aggs_res.get(key)
    }

    /// Removes and returns the intermediate aggregation result for the given key.
    ///
    /// Returns `None`, leaving the collection untouched, when no result is stored under `key`.
    pub fn remove(&mut self, key: &str) -> Option<IntermediateAggregationResult> {
        self.aggs_res.remove(key)
    }

    /// Returns an iterator over the keys in the intermediate aggregation results.
    ///
    /// The keys are borrowed from the underlying map; the iteration order is whatever that map
    /// yields.
    pub fn keys(&self) -> impl Iterator<Item = &String> {
        self.aggs_res.keys()
    }

    /// Stores `value` under `key`.
    ///
    /// If a result is already stored under `key`, `value` is merged into it instead of
    /// replacing it.
    ///
    /// # Errors
    /// Returns the error produced by the merge, if there is one.
    pub fn push(&mut self, key: String, value: IntermediateAggregationResult) -> crate::Result<()> {
        match self.aggs_res.entry(key) {
            // In case of term aggregation over different types, we need to merge the results.
            Entry::Occupied(mut occupied) => occupied.get_mut().merge_fruits(value)?,
            Entry::Vacant(vacant) => {
                vacant.insert(value);
            }
        }
        Ok(())
    }

    /// Convert intermediate result and its aggregation request to the final result.
    pub fn into_final_result(
        self,
        req: Aggregations,
        mut limits: AggregationLimitsGuard,
    ) -> crate::Result<AggregationResults> {
        let res = self.into_final_result_internal(&req, &mut limits)?;
        let bucket_count = res.get_bucket_count() as u32;
        if bucket_count > limits.get_bucket_limit() {
            return Err(TantivyError::AggregationError(
                AggregationError::BucketLimitExceeded {
                    limit: limits.get_bucket_limit(),
                    current: bucket_count,
                },
            ));
        }
        Ok(res)
    }

    /// Converts every stored intermediate result into its final form, using the request entry
    /// registered under the same key.
    ///
    /// Request entries without a stored result get the final form of an empty intermediate
    /// result, so the output has an entry for every key of `req`.
    ///
    /// # Panics
    /// Panics if a stored key has no matching entry in `req`.
    pub(crate) fn into_final_result_internal(
        self,
        req: &Aggregations,
        limits: &mut AggregationLimitsGuard,
    ) -> crate::Result<AggregationResults> {
        let mut final_results: FxHashMap<String, AggregationResult> = FxHashMap::default();
        for (name, intermediate) in self.aggs_res {
            let agg_req = match req.get(name.as_str()) {
                Some(agg_req) => agg_req,
                None => panic!(
                    "Could not find key {:?} in request keys {:?}. This probably means that \
                     add_intermediate_aggregation_result passed the wrong agg object.",
                    name,
                    req.keys().collect::<Vec<_>>()
                ),
            };
            let converted = intermediate.into_final_result(agg_req, limits)?;
            final_results.insert(name, converted);
        }

        // Handle empty results
        let has_missing_entries = final_results.len() != req.len();
        if has_missing_entries {
            for (name, agg_req) in req.iter() {
                if final_results.contains_key(name) {
                    continue;
                }
                let converted = empty_from_req(agg_req).into_final_result(agg_req, limits)?;
                final_results.insert(name.to_string(), converted);
            }
        }

        Ok(AggregationResults(final_results))
    }

    /// Builds a result set holding one empty intermediate result per entry of `req`.
    pub(crate) fn empty_from_req(req: &Aggregations) -> Self {
        let aggs_res: FxHashMap<String, IntermediateAggregationResult> = req
            .iter()
            .map(|(name, agg_req)| (name.to_string(), empty_from_req(agg_req)))
            .collect();

        Self { aggs_res }
    }

    /// Merge another intermediate aggregation result into this result.
    ///
    /// Results stored under the same key are merged pairwise; results only present in `other`
    /// are moved over unchanged.
    ///
    /// # Errors
    /// Returns the first error raised while merging two results.
    pub fn merge_fruits(&mut self, mut other: IntermediateAggregationResults) -> crate::Result<()> {
        for (name, ours) in self.aggs_res.iter_mut() {
            if let Some(theirs) = other.aggs_res.remove(name) {
                ours.merge_fruits(theirs)?;
            }
        }
        // Move remainder of other aggs_res into self.
        // Note: Currently we don't expect this to happen, as we create empty intermediate results
        // via [IntermediateAggregationResults::empty_from_req].
        self.aggs_res.extend(other.aggs_res);
        Ok(())
    }
}

pub(crate) fn empty_from_req(req: &Aggregation) -> IntermediateAggregationResult {
    use AggregationVariants::*;
    match req.agg {
        Terms(_) => IntermediateAggregationResult::Bucket(IntermediateBucketResult::Terms {
            buckets: Default::default(),
        }),
        Range(_) => IntermediateAggregationResult::Bucket(IntermediateBucketResult::Range(
            Default::default(),
        )),
        Histogram(_) => {
            IntermediateAggregationResult::Bucket(IntermediateBucketResult::Histogram {
                buckets: Vec::new(),
                is_date_agg: false,
            })
        }
        DateHistogram(_) => {
            IntermediateAggregationResult::Bucket(IntermediateBucketResult::Histogram {
                buckets: Vec::new(),
                is_date_agg: true,
            })
        }
        Average(_) => IntermediateAggregationResult::Metric(IntermediateMetricResult::Average(
            IntermediateAverage::default(),
        )),
        Count(_) => IntermediateAggregationResult::Metric(IntermediateMetricResult::Count(
            IntermediateCount::default(),
        )),
        Max(_) => IntermediateAggregationResult::Metric(IntermediateMetricResult::Max(
            IntermediateMax::default(),
        )),
        Min(_) => IntermediateAggregationResult::Metric(IntermediateMetricResult::Min(
            IntermediateMin::default(),
        )),
        Stats(_) => IntermediateAggregationResult::Metric(IntermediateMetricResult::Stats(
            IntermediateStats::default(),
        )),
        ExtendedStats(_) => IntermediateAggregationResult::Metric(
            IntermediateMetricResult::ExtendedStats(IntermediateExtendedStats::default()),
        ),
        Sum(_) => IntermediateAggregationResult::Metric(IntermediateMetricResult::Sum(
            IntermediateSum::default(),
        )),
        Percentiles(_) => IntermediateAggregationResult::Metric(
            IntermediateMetricResult::Percentiles(PercentilesCollector::default()),
        ),
        TopHits(ref req) => IntermediateAggregationResult::Metric(
            IntermediateMetricResult::TopHits(TopHitsTopNComputer::new(req)),
        ),
        Cardinality(_) => IntermediateAggregationResult::Metric(
            IntermediateMetricResult::Cardinality(CardinalityCollector::default()),
        ),
        Filter(_) => IntermediateAggregationResult::Bucket(IntermediateBucketResult::Filter {
            doc_count: 0,
            sub_aggregations: IntermediateAggregationResults::default(),
        }),
        Composite(_) => {
            IntermediateAggregationResult::Bucket(IntermediateBucketResult::Composite {
                buckets: IntermediateCompositeBucketResult::default(),
            })
        }
    }
}

/// An aggregation is either a bucket or a metric.
///
/// Intermediate results of the same variant can be merged with one another and are converted
/// into a final `AggregationResult` once merging is done.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
// Silences clippy's `large_enum_variant` lint for this enum; the variants are stored inline.
#[allow(clippy::large_enum_variant)]
pub enum IntermediateAggregationResult {
    /// Bucket variant
    Bucket(IntermediateBucketResult),
    /// Metric variant
    Metric(IntermediateMetricResult),
}

impl IntermediateAggregationResult {
    pub(crate) fn into_final_result(
        self,
        req: &Aggregation,
        limits: &mut AggregationLimitsGuard,
    ) -> crate::Result<AggregationResult> {
        let res = match self {
            IntermediateAggregationResult::Bucket(bucket) => {
                AggregationResult::BucketResult(bucket.into_final_bucket_result(req, limits)?)
            }
            IntermediateAggregationResult::Metric(metric) => {
                AggregationResult::MetricResult(metric.into_final_metric_result(req))
            }
        };
        Ok(res)
    }
    fn merge_fruits(&mut self, other: IntermediateAggregationResult) -> crate::Result<()> {
        match (self, other) {
            (
                IntermediateAggregationResult::Bucket(b1),
                IntermediateAggregationResult::Bucket(b2),
            ) => b1.merge_fruits(b2),
            (
                IntermediateAggregationResult::Metric(m1),
                IntermediateAggregationResult::Metric(m2),
            ) => m1.merge_fruits(m2),
            _ => panic!("aggregation result type mismatch (mixed metric and buckets)"),
        }
    }
}

/// Holds the intermediate data for metric results
///
/// Each variant wraps the mergeable state of one metric aggregation kind.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub enum IntermediateMetricResult {
    /// Intermediate percentiles result.
    Percentiles(PercentilesCollector),
    /// Intermediate average result.
    Average(IntermediateAverage),
    /// Intermediate count result.
    Count(IntermediateCount),
    /// Intermediate max result.
    Max(IntermediateMax),
    /// Intermediate min result.
    Min(IntermediateMin),
    /// Intermediate stats result.
    Stats(IntermediateStats),
    /// Intermediate extended stats result.
    ExtendedStats(IntermediateExtendedStats),
    /// Intermediate sum result.
    Sum(IntermediateSum),
    /// Intermediate top_hits result
    TopHits(TopHitsTopNComputer),
    /// Intermediate cardinality result
    Cardinality(CardinalityCollector),
}

impl IntermediateMetricResult {
    fn into_final_metric_result(self, req: &Aggregation) -> MetricResult {
        match self {
            IntermediateMetricResult::Average(intermediate_avg) => {
                MetricResult::Average(intermediate_avg.finalize().into())
            }
            IntermediateMetricResult::Count(intermediate_count) => {
                MetricResult::Count(intermediate_count.finalize().into())
            }
            IntermediateMetricResult::Max(intermediate_max) => {
                MetricResult::Max(intermediate_max.finalize().into())
            }
            IntermediateMetricResult::Min(intermediate_min) => {
                MetricResult::Min(intermediate_min.finalize().into())
            }
            IntermediateMetricResult::Stats(intermediate_stats) => {
                MetricResult::Stats(intermediate_stats.finalize())
            }
            IntermediateMetricResult::ExtendedStats(intermediate_stats) => {
                MetricResult::ExtendedStats(intermediate_stats.finalize())
            }
            IntermediateMetricResult::Sum(intermediate_sum) => {
                MetricResult::Sum(intermediate_sum.finalize().into())
            }
            IntermediateMetricResult::Percentiles(percentiles) => MetricResult::Percentiles(
                percentiles
                    .into_final_result(req.agg.as_percentile().expect("unexpected metric type")),
            ),
            IntermediateMetricResult::TopHits(top_hits) => {
                MetricResult::TopHits(top_hits.into_final_result())
            }
            IntermediateMetricResult::Cardinality(cardinality) => {
                MetricResult::Cardinality(cardinality.finalize().into())
            }
        }
    }

    // TODO: this is our top-of-the-chain fruit merge mech
    fn merge_fruits(&mut self, other: IntermediateMetricResult) -> crate::Result<()> {
        match (self, other) {
            (
                IntermediateMetricResult::Average(avg_left),
                IntermediateMetricResult::Average(avg_right),
            ) => {
                avg_left.merge_fruits(avg_right);
            }
            (
                IntermediateMetricResult::Count(count_left),
                IntermediateMetricResult::Count(count_right),
            ) => {
                count_left.merge_fruits(count_right);
            }
            (IntermediateMetricResult::Max(max_left), IntermediateMetricResult::Max(max_right)) => {
                max_left.merge_fruits(max_right);
            }
            (IntermediateMetricResult::Min(min_left), IntermediateMetricResult::Min(min_right)) => {
                min_left.merge_fruits(min_right);
            }
            (
                IntermediateMetricResult::Stats(stats_left),
                IntermediateMetricResult::Stats(stats_right),
            ) => {
                stats_left.merge_fruits(stats_right);
            }
            (
                IntermediateMetricResult::ExtendedStats(extended_stats_left),
                IntermediateMetricResult::ExtendedStats(extended_stats_right),
            ) => {
                extended_stats_left.merge_fruits(extended_stats_right);
            }
            (IntermediateMetricResult::Sum(sum_left), IntermediateMetricResult::Sum(sum_right)) => {
                sum_left.merge_fruits(sum_right);
            }
            (
                IntermediateMetricResult::Percentiles(left),
                IntermediateMetricResult::Percentiles(right),
            ) => {
                left.merge_fruits(right)?;
            }
            (IntermediateMetricResult::TopHits(left), IntermediateMetricResult::TopHits(right)) => {
                left.merge_fruits(right)?;
            }
            (
                IntermediateMetricResult::Cardinality(left),
                IntermediateMetricResult::Cardinality(right),
            ) => {
                left.merge_fruits(right)?;
            }
            _ => {
                panic!("incompatible fruit types in tree or missing merge_fruits handler");
            }
        }

        Ok(())
    }
}

/// The intermediate bucket results. Internally they can be easily merged via the keys of the
/// buckets.
///
/// There is one variant per bucket aggregation kind; histogram and date histogram share the
/// `Histogram` variant and are told apart by `is_date_agg`.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub enum IntermediateBucketResult {
    /// Range aggregation: the range buckets together with the optional column type of the
    /// aggregated field.
    Range(IntermediateRangeBucketResult),
    /// Histogram (or date histogram) aggregation: a list of bucket entries, each with a key,
    /// a count, and optionally sub_aggregations.
    Histogram {
        /// The column_type of the underlying `Column` is DateTime
        is_date_agg: bool,
        /// The histogram buckets
        buckets: Vec<IntermediateHistogramBucketEntry>,
    },
    /// Term aggregation
    Terms {
        /// The term buckets
        buckets: IntermediateTermBucketResult,
    },
    /// Filter aggregation - a single bucket with sub-aggregations
    Filter {
        /// Document count in the filter bucket
        doc_count: u64,
        /// Sub-aggregation results
        sub_aggregations: IntermediateAggregationResults,
    },
    /// Composite aggregation
    Composite {
        /// The composite buckets
        buckets: IntermediateCompositeBucketResult,
    },
}

impl IntermediateBucketResult {
    /// Converts the intermediate bucket result into the final `BucketResult` for `req`.
    ///
    /// * Range buckets are sorted by their `from` bound (a missing bound sorts as `f64::MIN`) and
    ///   returned as a map when the request is `keyed`, as a list otherwise.
    /// * Histogram buckets are finalized by `intermediate_histogram_buckets_to_final_buckets`
    ///   and likewise returned as a map when the request is `keyed`.
    /// * Terms and composite results delegate to their own `into_final_result`.
    /// * Filter results convert their sub-aggregations and keep the document count.
    ///
    /// # Errors
    /// Propagates any error raised while converting buckets or sub-aggregations.
    ///
    /// # Panics
    /// Panics if the kind of `req` does not match the variant of `self`.
    pub(crate) fn into_final_bucket_result(
        self,
        req: &Aggregation,
        limits: &mut AggregationLimitsGuard,
    ) -> crate::Result<BucketResult> {
        match self {
            IntermediateBucketResult::Range(range_res) => {
                // Resolve the range request once, up front, instead of once per bucket.
                let range_req = req
                    .agg
                    .as_range()
                    .expect("unexpected aggregation, expected range aggregation");
                let mut buckets: Vec<RangeBucketEntry> = range_res
                    .buckets
                    .into_values()
                    .map(|bucket| {
                        bucket.into_final_bucket_entry(
                            req.sub_aggregation(),
                            range_req,
                            range_res.column_type,
                            limits,
                        )
                    })
                    .collect::<crate::Result<Vec<_>>>()?;

                // Open-ended lower bounds sort first.
                buckets.sort_by(|left, right| {
                    left.from
                        .unwrap_or(f64::MIN)
                        .total_cmp(&right.from.unwrap_or(f64::MIN))
                });

                let buckets = if range_req.keyed {
                    let mut bucket_map =
                        FxHashMap::with_capacity_and_hasher(buckets.len(), Default::default());
                    for bucket in buckets {
                        bucket_map.insert(bucket.key.to_string(), bucket);
                    }
                    BucketEntries::HashMap(bucket_map)
                } else {
                    BucketEntries::Vec(buckets)
                };
                Ok(BucketResult::Range { buckets })
            }
            IntermediateBucketResult::Histogram {
                is_date_agg,
                buckets,
            } => {
                let histogram_req = &req
                    .agg
                    .as_histogram()?
                    .expect("unexpected aggregation, expected histogram aggregation");
                let buckets = intermediate_histogram_buckets_to_final_buckets(
                    buckets,
                    is_date_agg,
                    histogram_req,
                    req.sub_aggregation(),
                    limits,
                )?;

                let buckets = if histogram_req.keyed {
                    let mut bucket_map =
                        FxHashMap::with_capacity_and_hasher(buckets.len(), Default::default());
                    for bucket in buckets {
                        bucket_map.insert(bucket.key.to_string(), bucket);
                    }
                    BucketEntries::HashMap(bucket_map)
                } else {
                    BucketEntries::Vec(buckets)
                };
                Ok(BucketResult::Histogram { buckets })
            }
            IntermediateBucketResult::Terms { buckets: terms } => terms.into_final_result(
                req.agg
                    .as_term()
                    .expect("unexpected aggregation, expected term aggregation"),
                req.sub_aggregation(),
                limits,
            ),
            IntermediateBucketResult::Filter {
                doc_count,
                sub_aggregations,
            } => {
                // Convert sub-aggregation results to final format.
                // NOTE(review): unlike the other arms, this goes through the public
                // `into_final_result` with a cloned request and a cloned limits guard.
                let final_sub_aggregations = sub_aggregations
                    .into_final_result(req.sub_aggregation().clone(), limits.clone())?;
                Ok(BucketResult::Filter(FilterBucketResult {
                    doc_count,
                    sub_aggregations: final_sub_aggregations,
                }))
            }
            IntermediateBucketResult::Composite { buckets } => {
                let composite_req = req
                    .agg
                    .as_composite()
                    .expect("unexpected aggregation, expected composite aggregation");
                buckets.into_final_result(composite_req, req.sub_aggregation(), limits)
            }
        }
    }

    fn merge_fruits(&mut self, other: IntermediateBucketResult) -> crate::Result<()> {
        match (self, other) {
            (
                IntermediateBucketResult::Terms {
                    buckets: term_res_left,
                },
                IntermediateBucketResult::Terms {
                    buckets: term_res_right,
                },
            ) => {
                merge_maps(&mut term_res_left.entries, term_res_right.entries)?;
                term_res_left.sum_other_doc_count += term_res_right.sum_other_doc_count;
                term_res_left.doc_count_error_upper_bound +=
                    term_res_right.doc_count_error_upper_bound;
            }

            (
                IntermediateBucketResult::Range(range_res_left),
                IntermediateBucketResult::Range(range_res_right),
            ) => {
                merge_maps(&mut range_res_left.buckets, range_res_right.buckets)?;
            }
            (
                IntermediateBucketResult::Histogram {
                    buckets: buckets_left,
                    is_date_agg: _,
                },
                IntermediateBucketResult::Histogram {
                    buckets: buckets_right,
                    is_date_agg: _,
                },
            ) => {
                let buckets: Result<Vec<IntermediateHistogramBucketEntry>, TantivyError> =
                    buckets_left
                        .drain(..)
                        .merge_join_by(buckets_right, |left, right| {
                            left.key.partial_cmp(&right.key).unwrap_or(Ordering::Equal)
                        })
                        .map(|either| match either {
                            itertools::EitherOrBoth::Both(mut left, right) => {
                                left.merge_fruits(right)?;
                                Ok(left)
                            }
                            itertools::EitherOrBoth::Left(left) => Ok(left),
                            itertools::EitherOrBoth::Right(right) => Ok(right),
                        })
                        .collect::<Result<_, _>>();

                *buckets_left = buckets?;
            }
            (
                IntermediateBucketResult::Filter {
                    doc_count: doc_count_left,
                    sub_aggregations: sub_aggs_left,
                },
                IntermediateBucketResult::Filter {
                    doc_count: doc_count_right,
                    sub_aggregations: sub_aggs_right,
                },
            ) => {
                *doc_count_left += doc_count_right;
                sub_aggs_left.merge_fruits(sub_aggs_right)?;
            }
            (
                IntermediateBucketResult::Composite {
                    buckets: composite_left,
                },
                IntermediateBucketResult::Composite {
                    buckets: composite_right,
                },
            ) => {
                composite_left.merge_fruits(composite_right)?;
            }
            (IntermediateBucketResult::Range(_), _) => {
                panic!("try merge on different types")
            }
            (IntermediateBucketResult::Histogram { .. }, _) => {
                panic!("try merge on different types")
            }
            (IntermediateBucketResult::Terms { .. }, _) => {
                panic!("try merge on different types")
            }
            (IntermediateBucketResult::Filter { .. }, _) => {
                panic!("try merge on different types")
            }
            (IntermediateBucketResult::Composite { .. }, _) => {
                panic!("try merge on different types")
            }
        }
        Ok(())
    }
}

#[derive(Default, Clone, Debug, PartialEq, Serialize, Deserialize)]
/// Intermediate result of a range aggregation: the range buckets plus the optional column type
/// of the aggregated field.
pub struct IntermediateRangeBucketResult {
    /// The range buckets, indexed by their serialized key.
    pub(crate) buckets: FxHashMap<SerializedKey, IntermediateRangeBucketEntry>,
    /// Optional column type, handed to each bucket when the final result is built; for
    /// `ColumnType::DateTime` the bucket bounds are additionally rendered as date strings.
    pub(crate) column_type: Option<ColumnType>,
}

#[derive(Default, Clone, Debug, PartialEq, Serialize, Deserialize)]
/// Term aggregation including error counts
pub struct IntermediateTermBucketResult {
    /// The term buckets, indexed by their key.
    pub(crate) entries: FxHashMap<IntermediateKey, IntermediateTermBucketEntry>,
    /// Count of documents not included in `entries`; summed up when results are merged.
    pub(crate) sum_other_doc_count: u64,
    /// Upper bound of the error on the document counts; summed up when results are merged.
    pub(crate) doc_count_error_upper_bound: u64,
}

impl IntermediateTermBucketResult {
    /// Returns a reference to the map of bucket entries keyed by [`IntermediateKey`].
    ///
    /// The map is returned as stored; no filtering, sorting or cut-off has been applied to it.
    pub fn entries(&self) -> &FxHashMap<IntermediateKey, IntermediateTermBucketEntry> {
        &self.entries
    }

    /// Returns the count of documents not included in the returned buckets.
    ///
    /// This is the stored intermediate value; documents of buckets cut off during finalization
    /// are only added when the final result is built.
    pub fn sum_other_doc_count(&self) -> u64 {
        self.sum_other_doc_count
    }

    /// Returns the upper bound of the error on document counts in the returned buckets.
    ///
    /// The bound is the sum of the bounds of all results merged into this one.
    pub fn doc_count_error_upper_bound(&self) -> u64 {
        self.doc_count_error_upper_bound
    }

    /// Builds the final terms `BucketResult` for `req`.
    ///
    /// Buckets below the request's minimum document count are dropped, the remaining buckets
    /// are converted (including their sub-aggregations), sorted by the requested order target
    /// (key, count or a sub-aggregation value) and finally cut off at the requested size. The
    /// document counts removed by the cut-off are added to `sum_other_doc_count`.
    ///
    /// # Errors
    /// Propagates errors from converting sub-aggregations or from reading the sub-aggregation
    /// value used for ordering.
    ///
    /// # Panics
    /// Panics when ordering by key and two keys cannot be compared.
    pub(crate) fn into_final_result(
        self,
        req: &TermsAggregation,
        sub_aggregation_req: &Aggregations,
        limits: &mut AggregationLimitsGuard,
    ) -> crate::Result<BucketResult> {
        let req = TermsAggregationInternal::from_req(req);
        let order = req.order.order;
        let ascending = order == Order::Asc;

        let mut buckets: Vec<BucketEntry> = self
            .entries
            .into_iter()
            .filter(|(_, entry)| u64::from(entry.doc_count) >= req.min_doc_count)
            .map(|(key, entry)| {
                // Only boolean keys get a textual representation next to the key itself.
                let key_as_string = if let IntermediateKey::Bool(flag) = key {
                    Some(flag.to_string())
                } else {
                    None
                };
                let sub_aggregation = entry
                    .sub_aggregation
                    .into_final_result_internal(sub_aggregation_req, limits)?;
                Ok(BucketEntry {
                    key_as_string,
                    key: key.into(),
                    doc_count: u64::from(entry.doc_count),
                    sub_aggregation,
                })
            })
            .collect::<crate::Result<_>>()?;

        match req.order.target {
            OrderTarget::Key => {
                buckets.sort_by(|left, right| {
                    let ordering = if ascending {
                        left.key.partial_cmp(&right.key)
                    } else {
                        right.key.partial_cmp(&left.key)
                    };
                    ordering.expect("expected type string, which is always sortable")
                });
            }
            OrderTarget::Count => {
                if ascending {
                    buckets.sort_unstable_by_key(|bucket| bucket.doc_count());
                } else {
                    buckets.sort_unstable_by_key(|bucket| std::cmp::Reverse(bucket.doc_count()));
                }
            }
            OrderTarget::SubAggregation(name) => {
                let (agg_name, agg_property) = get_agg_name_and_property(&name);
                // Pair every bucket with the value it is ordered by; buckets without a value
                // are ordered as `f64::MIN`.
                let mut keyed_buckets = buckets
                    .into_iter()
                    .map(|bucket| {
                        let sort_value = bucket
                            .sub_aggregation
                            .get_value_from_aggregation(agg_name, agg_property)?
                            .unwrap_or(f64::MIN);
                        Ok((bucket, sort_value))
                    })
                    .collect::<crate::Result<Vec<_>>>()?;

                keyed_buckets.sort_by(|(_, left), (_, right)| {
                    if ascending {
                        left.total_cmp(right)
                    } else {
                        right.total_cmp(left)
                    }
                });
                buckets = keyed_buckets
                    .into_iter()
                    .map(|(bucket, _)| bucket)
                    .collect();
            }
        }

        // We ignore _term_doc_count_before_cutoff here, because it increases the upperbound error
        // only for terms that didn't make it into the top N.
        //
        // This can be interesting, as a value of quality of the results, but not good to check the
        // actual error count for the returned terms.
        let (_term_doc_count_before_cutoff, cut_off_doc_count) =
            cut_off_buckets(&mut buckets, req.size as usize);

        let doc_count_error_upper_bound = req
            .show_term_doc_count_error
            .then_some(self.doc_count_error_upper_bound);

        Ok(BucketResult::Terms {
            buckets,
            sum_other_doc_count: self.sum_other_doc_count + cut_off_doc_count,
            doc_count_error_upper_bound,
        })
    }
}

/// A value that can absorb another value of the same type.
///
/// `merge_maps` uses this to combine two map entries stored under the same key.
trait MergeFruits {
    /// Merges `other` into `self`, consuming `other`.
    fn merge_fruits(&mut self, other: Self) -> crate::Result<()>;
}

/// Merges `entries_right` into `entries_left`.
///
/// Values stored under a key present in both maps are combined with
/// `MergeFruits::merge_fruits`; entries only present on the right are moved over unchanged.
///
/// # Errors
/// Returns the first error raised while merging two values.
fn merge_maps<V: MergeFruits + Clone, T: Eq + PartialEq + Hash>(
    entries_left: &mut FxHashMap<T, V>,
    mut entries_right: FxHashMap<T, V>,
) -> crate::Result<()> {
    for (key, left_value) in entries_left.iter_mut() {
        if let Some(right_value) = entries_right.remove(key) {
            left_value.merge_fruits(right_value)?;
        }
    }

    // Every key shared with the left map has been removed above, so what remains on the
    // right is new to the left map.
    entries_left.extend(entries_right);
    Ok(())
}

/// This is the histogram entry for a bucket, which contains a key, count, and optionally
/// sub_aggregations.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct IntermediateHistogramBucketEntry {
    /// The unique key the bucket is identified with.
    pub key: f64,
    /// The number of documents in the bucket.
    pub doc_count: u64,
    /// The sub_aggregation in this bucket.
    pub sub_aggregation: IntermediateAggregationResults,
}

impl IntermediateHistogramBucketEntry {
    pub(crate) fn into_final_bucket_entry(
        self,
        req: &Aggregations,
        limits: &mut AggregationLimitsGuard,
    ) -> crate::Result<BucketEntry> {
        Ok(BucketEntry {
            key_as_string: None,
            key: Key::F64(self.key),
            doc_count: self.doc_count,
            sub_aggregation: self
                .sub_aggregation
                .into_final_result_internal(req, limits)?,
        })
    }
}

/// This is the range entry for a bucket, which contains a key, count, the `from`/`to` bounds of
/// the range, and optionally sub_aggregations.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct IntermediateRangeBucketEntry {
    /// The unique key the bucket is identified with.
    pub key: IntermediateKey,
    /// The number of documents in the bucket.
    pub doc_count: u64,
    /// The sub_aggregation in this bucket.
    pub sub_aggregation_res: IntermediateAggregationResults,
    /// The from range of the bucket. Equals `f64::MIN` when `None`.
    pub from: Option<f64>,
    /// The to range of the bucket. Equals `f64::MAX` when `None`.
    pub to: Option<f64>,
}

impl IntermediateRangeBucketEntry {
    pub(crate) fn into_final_bucket_entry(
        self,
        req: &Aggregations,
        _range_req: &RangeAggregation,
        column_type: Option<ColumnType>,
        limits: &mut AggregationLimitsGuard,
    ) -> crate::Result<RangeBucketEntry> {
        let mut range_bucket_entry = RangeBucketEntry {
            key: self.key.into(),
            doc_count: self.doc_count,
            sub_aggregation: self
                .sub_aggregation_res
                .into_final_result_internal(req, limits)?,
            to: self.to,
            from: self.from,
            to_as_string: None,
            from_as_string: None,
        };

        // If we have a date type on the histogram buckets, we add the `key_as_string` field as
        // rfc3339
        if column_type == Some(ColumnType::DateTime) {
            if let Some(val) = range_bucket_entry.to {
                let key_as_string = format_date(val as i64)?;
                range_bucket_entry.to_as_string = Some(key_as_string);
            }
            if let Some(val) = range_bucket_entry.from {
                let key_as_string = format_date(val as i64)?;
                range_bucket_entry.from_as_string = Some(key_as_string);
            }
        }

        Ok(range_bucket_entry)
    }
}

/// This is the term entry for a bucket, which contains a count, and optionally
/// sub_aggregations.
///
/// The key of the bucket is not part of the entry; entries are stored in maps indexed by key.
#[derive(Clone, Default, Debug, PartialEq, Serialize, Deserialize)]
pub struct IntermediateTermBucketEntry {
    /// The number of documents in the bucket.
    pub doc_count: u32,
    /// The sub_aggregation in this bucket.
    pub sub_aggregation: IntermediateAggregationResults,
}

impl MergeFruits for IntermediateTermBucketEntry {
    fn merge_fruits(&mut self, other: IntermediateTermBucketEntry) -> crate::Result<()> {
        self.doc_count += other.doc_count;
        self.sub_aggregation.merge_fruits(other.sub_aggregation)?;
        Ok(())
    }
}

impl MergeFruits for IntermediateRangeBucketEntry {
    fn merge_fruits(&mut self, other: IntermediateRangeBucketEntry) -> crate::Result<()> {
        self.doc_count += other.doc_count;
        self.sub_aggregation_res
            .merge_fruits(other.sub_aggregation_res)?;
        Ok(())
    }
}

impl MergeFruits for IntermediateHistogramBucketEntry {
    fn merge_fruits(&mut self, other: IntermediateHistogramBucketEntry) -> crate::Result<()> {
        self.doc_count += other.doc_count;
        self.sub_aggregation.merge_fruits(other.sub_aggregation)?;
        Ok(())
    }
}

/// Entry for the composite bucket.
///
/// This is an alias of [`IntermediateTermBucketEntry`]: a composite bucket carries the same
/// `doc_count` and `sub_aggregation` fields and is merged the same way.
pub type IntermediateCompositeBucketEntry = IntermediateTermBucketEntry;

/// The fully typed key for composite aggregation
///
/// A composite bucket is identified by a `Vec<CompositeIntermediateKey>`; that vector is the
/// map key in [`IntermediateCompositeBucketResult`].
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub enum CompositeIntermediateKey {
    /// Bool key
    Bool(bool),
    /// String key
    Str(String),
    /// Float key
    F64(f64),
    /// Signed integer key
    I64(i64),
    /// Unsigned integer key
    U64(u64),
    /// DateTime key, nanoseconds since epoch
    DateTime(i64),
    /// IP Address key
    IpAddr(Ipv6Addr),
    /// Missing value key
    Null,
}

// `f64` does not implement `Eq`, so the marker trait is asserted by hand to make the key usable
// in hash maps.
// NOTE(review): the derived `PartialEq` is not reflexive for `F64(NaN)`; this presumes NaN keys
// are never produced by the collectors — confirm.
impl Eq for CompositeIntermediateKey {}

impl std::hash::Hash for CompositeIntermediateKey {
    /// Hashes the variant discriminant followed by the payload.
    ///
    /// Floats are hashed through their bit pattern. Because the derived `PartialEq` considers
    /// `0.0` and `-0.0` equal while their bit patterns differ, both zeros are canonicalised to
    /// `0.0` first so that equal keys always produce equal hashes.
    fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
        core::mem::discriminant(self).hash(state);
        match self {
            CompositeIntermediateKey::Bool(val) => val.hash(state),
            CompositeIntermediateKey::Str(text) => text.hash(state),
            CompositeIntermediateKey::F64(val) => {
                // `*val == 0.0` is true for both `0.0` and `-0.0`.
                let canonical: f64 = if *val == 0.0 { 0.0 } else { *val };
                canonical.to_bits().hash(state)
            }
            CompositeIntermediateKey::U64(val) => val.hash(state),
            CompositeIntermediateKey::I64(val) => val.hash(state),
            CompositeIntermediateKey::DateTime(val) => val.hash(state),
            CompositeIntermediateKey::IpAddr(val) => val.hash(state),
            CompositeIntermediateKey::Null => {}
        }
    }
}

/// Composite aggregation page.
#[derive(Default, Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct IntermediateCompositeBucketResult {
    /// Buckets of the page, keyed by their composite key (one component per position).
    pub(crate) entries: FxHashMap<Vec<CompositeIntermediateKey>, IntermediateCompositeBucketEntry>,
    /// Number of entries kept when the page is trimmed.
    pub(crate) target_size: u32,
    /// Ordering applied to the key components when trimming; `orders[i]` is used to compare
    /// the key components at position `i`.
    pub(crate) orders: Vec<(Order, MissingOrder)>,
}

impl IntermediateCompositeBucketResult {
    /// Converts this intermediate page into the final [`BucketResult::Composite`].
    ///
    /// Entries are sorted according to `self.orders` and truncated to `self.target_size`. Each
    /// key component is paired with the name of the source at the same position in
    /// `req.sources`. `after_key` is the key of the last returned bucket when the page holds
    /// exactly `req.size` buckets, and an empty map otherwise (including the case of an empty
    /// page, which previously panicked when `req.size` was `0`).
    ///
    /// # Errors
    /// Propagates errors from ordering the keys and from finalizing the sub-aggregations.
    ///
    /// # Panics
    /// Panics if a key has more components than `req.sources` has entries.
    pub(crate) fn into_final_result(
        self,
        req: &CompositeAggregation,
        sub_aggregation_req: &Aggregations,
        limits: &mut AggregationLimitsGuard,
    ) -> crate::Result<BucketResult> {
        let trimmed_entry_vec =
            trim_composite_buckets(self.entries, &self.orders, self.target_size)?;

        // Only a full page gets an `after_key`. Matching on `last()` (instead of unwrapping it)
        // keeps an empty page from panicking.
        let after_key = match trimmed_entry_vec.last() {
            Some((last_key, _entry)) if trimmed_entry_vec.len() == req.size as usize => last_key
                .iter()
                .enumerate()
                .map(|(idx, key_part)| {
                    (
                        req.sources[idx].name().to_string(),
                        key_part.clone().into(),
                    )
                })
                .collect(),
            _ => FxHashMap::default(),
        };

        let buckets = trimmed_entry_vec
            .into_iter()
            .map(|(intermediate_key, entry)| {
                let key = intermediate_key
                    .into_iter()
                    .enumerate()
                    .map(|(idx, key_part)| (req.sources[idx].name().to_string(), key_part.into()))
                    .collect();
                let sub_aggregation = entry
                    .sub_aggregation
                    .into_final_result_internal(sub_aggregation_req, limits)?;
                Ok(CompositeBucketEntry {
                    key,
                    doc_count: u64::from(entry.doc_count),
                    sub_aggregation,
                })
            })
            .collect::<crate::Result<Vec<_>>>()?;

        Ok(BucketResult::Composite { after_key, buckets })
    }

    /// Merges the entries of `other` into `self`.
    ///
    /// To bound memory, the page is trimmed once it holds more than twice `target_size`
    /// entries. The threshold is computed in `usize` with saturation so that a large
    /// `target_size` can neither overflow nor be compared against a truncated length.
    fn merge_fruits(&mut self, other: IntermediateCompositeBucketResult) -> crate::Result<()> {
        merge_maps(&mut self.entries, other.entries)?;
        let trim_threshold = (self.target_size as usize).saturating_mul(2);
        if self.entries.len() > trim_threshold {
            self.trim()?;
        }
        Ok(())
    }

    /// Trim the composite buckets to the target size, according to the ordering.
    ///
    /// Does nothing when the page already holds at most `target_size` entries.
    pub(crate) fn trim(&mut self) -> crate::Result<()> {
        if self.entries.len() <= self.target_size as usize {
            return Ok(());
        }

        // `take` leaves an empty map behind; it is overwritten below on success.
        let sorted_entries = trim_composite_buckets(
            std::mem::take(&mut self.entries),
            &self.orders,
            self.target_size,
        )?;

        self.entries = sorted_entries.into_iter().collect();
        Ok(())
    }
}

/// Sorts the composite buckets by key and keeps the first `target_size` of them.
///
/// Keys are compared component by component: component `i` of both keys is compared using
/// `orders[i]`, and the first non-equal comparison decides. If comparing two components fails,
/// the first such error is remembered, every later comparison is reported as equal, and the
/// error is returned once sorting is done.
fn trim_composite_buckets(
    entries: FxHashMap<Vec<CompositeIntermediateKey>, IntermediateCompositeBucketEntry>,
    orders: &[(Order, MissingOrder)],
    target_size: u32,
) -> crate::Result<
    Vec<(
        Vec<CompositeIntermediateKey>,
        IntermediateCompositeBucketEntry,
    )>,
> {
    let mut sorted: Vec<_> = entries.into_iter().collect();
    let mut first_error: Option<TantivyError> = None;

    sorted.sort_by(|(lhs, _), (rhs, _)| {
        // A comparison already failed: the result will be discarded, so stop comparing.
        if first_error.is_some() {
            return Ordering::Equal;
        }

        for (idx, &(order, missing_order)) in orders.iter().enumerate() {
            match composite_intermediate_key_ordering(&lhs[idx], &rhs[idx], order, missing_order)
            {
                Ok(Ordering::Equal) => {}
                Ok(decided) => return decided,
                Err(err) => {
                    first_error = Some(err);
                    return Ordering::Equal;
                }
            }
        }
        Ordering::Equal
    });

    match first_error {
        Some(err) => Err(err),
        None => {
            sorted.truncate(target_size as usize);
            Ok(sorted)
        }
    }
}

#[cfg(test)]
mod tests {
    use std::collections::HashMap;

    use pretty_assertions::assert_eq;

    use super::*;

    /// Builds the inner level of the test tree: a range aggregation named `my_agg_level2` with
    /// one bucket per `(key, doc_count)` pair and no further sub-aggregations.
    fn get_sub_test_tree(data: &[(String, u64)]) -> IntermediateAggregationResults {
        let buckets: FxHashMap<_, _> = data
            .iter()
            .map(|(key, doc_count)| {
                let entry = IntermediateRangeBucketEntry {
                    key: IntermediateKey::Str(key.to_string()),
                    doc_count: *doc_count,
                    sub_aggregation_res: Default::default(),
                    from: None,
                    to: None,
                };
                (key.to_string(), entry)
            })
            .collect();

        let range_result = IntermediateRangeBucketResult {
            buckets,
            column_type: None,
        };
        let mut aggs = HashMap::new();
        aggs.insert(
            "my_agg_level2".to_string(),
            IntermediateAggregationResult::Bucket(IntermediateBucketResult::Range(range_result)),
        );
        IntermediateAggregationResults {
            aggs_res: aggs.into_iter().collect(),
        }
    }

    /// Builds the outer level of the test tree: a range aggregation named `my_agg_level1` with
    /// one bucket per row, each holding a single-bucket sub-tree built by `get_sub_test_tree`.
    fn get_intermediate_tree_with_ranges(
        data: &[(String, u64, String, u64)],
    ) -> IntermediateAggregationResults {
        let buckets: FxHashMap<_, _> = data
            .iter()
            .map(|(key, doc_count, sub_aggregation_key, sub_aggregation_count)| {
                let sub_tree = get_sub_test_tree(&[(
                    sub_aggregation_key.to_string(),
                    *sub_aggregation_count,
                )]);
                let entry = IntermediateRangeBucketEntry {
                    key: IntermediateKey::Str(key.to_string()),
                    doc_count: *doc_count,
                    from: None,
                    to: None,
                    sub_aggregation_res: sub_tree,
                };
                (key.to_string(), entry)
            })
            .collect();

        let range_result = IntermediateRangeBucketResult {
            buckets,
            column_type: None,
        };
        let mut aggs = HashMap::new();
        aggs.insert(
            "my_agg_level1".to_string(),
            IntermediateAggregationResult::Bucket(IntermediateBucketResult::Range(range_result)),
        );
        IntermediateAggregationResults {
            aggs_res: aggs.into_iter().collect(),
        }
    }

    /// Shorthand for one fixture row: `(key, doc_count, sub_key, sub_doc_count)`.
    fn row(
        key: &str,
        doc_count: u64,
        sub_key: &str,
        sub_doc_count: u64,
    ) -> (String, u64, String, u64) {
        (key.to_string(), doc_count, sub_key.to_string(), sub_doc_count)
    }

    /// Both trees hold the same keys: counts are summed on both levels.
    #[test]
    fn test_merge_fruits_tree_1() {
        let mut merged = get_intermediate_tree_with_ranges(&[
            row("red", 50, "1900", 25),
            row("blue", 30, "1900", 30),
        ]);
        let incoming = get_intermediate_tree_with_ranges(&[
            row("red", 60, "1900", 30),
            row("blue", 25, "1900", 50),
        ]);

        merged.merge_fruits(incoming).unwrap();

        let expected = get_intermediate_tree_with_ranges(&[
            row("red", 110, "1900", 55),
            row("blue", 55, "1900", 80),
        ]);
        assert_eq!(merged, expected);
    }

    /// Keys present on only one side are carried over unchanged.
    #[test]
    fn test_merge_fruits_tree_2() {
        let mut merged = get_intermediate_tree_with_ranges(&[
            row("red", 50, "1900", 25),
            row("blue", 30, "1900", 30),
        ]);
        let incoming = get_intermediate_tree_with_ranges(&[
            row("red", 60, "1900", 30),
            row("green", 25, "1900", 50),
        ]);

        merged.merge_fruits(incoming).unwrap();

        let expected = get_intermediate_tree_with_ranges(&[
            row("red", 110, "1900", 55),
            row("blue", 30, "1900", 30),
            row("green", 25, "1900", 50),
        ]);
        assert_eq!(merged, expected);
    }

    /// Merging an empty result leaves the tree unchanged.
    #[test]
    fn test_merge_fruits_tree_empty() {
        let mut merged = get_intermediate_tree_with_ranges(&[
            row("red", 50, "1900", 25),
            row("blue", 30, "1900", 30),
        ]);
        let before_merge = merged.clone();

        merged
            .merge_fruits(IntermediateAggregationResults::default())
            .unwrap();

        assert_eq!(merged, before_merge);
    }
}


================================================
FILE: src/aggregation/metric/average.rs
================================================
use std::fmt::Debug;

use serde::{Deserialize, Serialize};

use super::*;
use crate::aggregation::*;

/// A single-value metric aggregation that computes the average of numeric values that are
/// extracted from the aggregated documents.
/// See [super::SingleMetricResult] for return value.
///
/// # JSON Format
/// ```json
/// {
///     "avg": {
///         "field": "score"
///     }
/// }
/// ```
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct AverageAggregation {
    /// The field name to compute the average on.
    pub field: String,
    /// The missing parameter defines how documents that are missing a value should be treated.
    /// By default they will be ignored but it is also possible to treat them as if they had a
    /// value. Examples in JSON format:
    /// { "field": "my_numbers", "missing": "10.0" }
    ///
    /// The value may be given as a JSON number or as a string holding a number (`"10.0"`,
    /// `"10"`). Strings that do not parse as a number, and `"NaN"`, are rejected when
    /// deserializing.
    #[serde(default, deserialize_with = "deserialize_option_f64")]
    pub missing: Option<f64>,
}

impl AverageAggregation {
    /// Creates a new [`AverageAggregation`] instance from a field name.
    pub fn from_field_name(field_name: String) -> Self {
        Self {
            field: field_name,
            missing: None,
        }
    }
    /// Returns the field name the aggregation is computed on.
    pub fn field_name(&self) -> &str {
        &self.field
    }
}

/// Intermediate result of the average aggregation that can be combined with other intermediate
/// results.
///
/// It wraps an [`IntermediateStats`]; the average is read from the finalized stats.
#[derive(Default, Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct IntermediateAverage {
    /// The stats the average is derived from.
    stats: IntermediateStats,
}

impl IntermediateAverage {
    /// Creates a new [`IntermediateAverage`] instance from a [`SegmentStatsCollector`].
    pub(crate) fn from_stats(stats: IntermediateStats) -> Self {
        Self { stats }
    }

    /// Returns a reference to the underlying [`IntermediateStats`].
    pub fn stats(&self) -> &IntermediateStats {
        &self.stats
    }

    /// Merges the other intermediate result into self.
    pub fn merge_fruits(&mut self, other: IntermediateAverage) {
        self.stats.merge_fruits(other.stats);
    }
    /// Computes the final average value.
    pub fn finalize(&self) -> Option<f64> {
        self.stats.finalize().avg
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// `missing` is accepted both as a numeric string and as a JSON number.
    #[test]
    fn deserialization_with_missing_test1() {
        let json = r#"{
            "field": "score",
            "missing": "10.0"
        }"#;
        let parsed: AverageAggregation = serde_json::from_str(json).unwrap();
        assert_eq!(parsed.field, "score");
        assert_eq!(parsed.missing, Some(10.0));
        // no dot
        let json = r#"{
            "field": "score",
            "missing": "10"
        }"#;
        let parsed: AverageAggregation = serde_json::from_str(json).unwrap();
        assert_eq!(parsed.field, "score");
        assert_eq!(parsed.missing, Some(10.0));

        // from value: unsigned, narrower unsigned and signed integers all map to 10.0
        for missing in [json!(10u64), json!(10u32), json!(10i8)] {
            let parsed: AverageAggregation = serde_json::from_value(json!({
                "field": "score_f64",
                "missing": missing,
            }))
            .unwrap();
            assert_eq!(parsed.missing, Some(10.0));
        }
    }

    /// Non-numeric strings and NaN are rejected with a descriptive error.
    #[test]
    fn deserialization_with_missing_test_fail() {
        let json = r#"{
            "field": "score",
            "missing": "a"
        }"#;
        let error_message = serde_json::from_str::<AverageAggregation>(json)
            .unwrap_err()
            .to_string();
        assert!(error_message.contains("Failed to parse f64 from string: \"a\""));

        // Disallow NaN
        let json = r#"{
            "field": "score",
            "missing": "NaN"
        }"#;
        let error_message = serde_json::from_str::<AverageAggregation>(json)
            .unwrap_err()
            .to_string();
        assert!(error_message.contains("NaN"));
    }
}


================================================
FILE: src/aggregation/metric/cardinality.rs
================================================
use std::hash::Hash;

use columnar::column_values::CompactSpaceU64Accessor;
use columnar::{Column, ColumnType, Dictionary, StrColumn};
use common::f64_to_u64;
use datasketches::hll::{HllSketch, HllType, HllUnion};
use rustc_hash::FxHashSet;
use serde::{Deserialize, Deserializer, Serialize, Serializer};

use crate::aggregation::agg_data::AggregationsSegmentCtx;
use crate::aggregation::intermediate_agg_result::{
    IntermediateAggregationResult, IntermediateAggregationResults, IntermediateMetricResult,
};
use crate::aggregation::segment_agg_result::SegmentAggregationCollector;
use crate::aggregation::*;
use crate::TantivyError;

/// Log2 of the number of registers for the HLL sketch.
/// 2^11 = 2048 registers, giving ~2.3% relative error and ~1KB per sketch (Hll4).
///
/// The same value is used when creating a sketch and when building the union that merges two
/// sketches.
const LG_K: u8 = 11;

/// # Cardinality
///
/// The cardinality aggregation allows for computing an estimate
/// of the number of different values in a data set based on the
/// Apache DataSketches HyperLogLog algorithm. This is particularly useful for
/// understanding the uniqueness of values in a large dataset where counting
/// each unique value individually would be computationally expensive.
///
/// For example, you might use a cardinality aggregation to estimate the number
/// of unique visitors to a website by aggregating on a field that contains
/// user IDs or session IDs.
///
/// To use the cardinality aggregation, you'll need to provide a field to
/// aggregate on. The following example demonstrates a request for the cardinality
/// of the "user_id" field:
///
/// ```JSON
/// {
///     "cardinality": {
///         "field": "user_id"
///     }
/// }
/// ```
///
/// This request will return an estimate of the number of unique values in the
/// "user_id" field.
///
/// ## Missing Values
///
/// The `missing` parameter defines how documents that are missing a value should be treated.
/// By default, documents without a value for the specified field are ignored. However, you can
/// specify a default value for these documents using the `missing` parameter. This can be useful
/// when you want to include documents with missing values in the aggregation.
///
/// For example, the following request treats documents with missing values in the "user_id"
/// field as if they had a value of "unknown":
///
/// ```JSON
/// {
///     "cardinality": {
///         "field": "user_id",
///         "missing": "unknown"
///     }
/// }
/// ```
///
/// # Estimation Accuracy
///
/// The cardinality aggregation provides an approximate count, which is usually
/// accurate within a small error range. This trade-off allows for efficient
/// computation even on very large datasets.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct CardinalityAggregationReq {
    /// The field name to compute the cardinality on.
    pub field: String,
    /// The missing parameter defines how documents that are missing a value should be treated.
    /// By default they will be ignored but it is also possible to treat them as if they had a
    /// value. Examples in JSON format:
    /// { "field": "user_id", "missing": "unknown" }
    ///
    /// The field is omitted from the serialized request when it is `None`.
    #[serde(skip_serializing_if = "Option::is_none", default)]
    pub missing: Option<Key>,
}

/// Contains all information required by the SegmentCardinalityCollector to perform the
/// cardinality aggregation on a segment.
pub struct CardinalityAggReqData {
    /// The column accessor to access the fast field values.
    pub accessor: Column<u64>,
    /// The column_type of the field.
    pub column_type: ColumnType,
    /// The string dictionary column if the field is of type string.
    /// It is used to resolve collected term ordinals back to their terms.
    pub str_dict_column: Option<StrColumn>,
    /// The missing value normalized to the internal u64 representation of the field type.
    pub missing_value_for_accessor: Option<u64>,
    /// The name of the aggregation.
    /// The intermediate result is stored under this name.
    pub name: String,
    /// The aggregation request.
    pub req: CardinalityAggregationReq,
}

impl CardinalityAggReqData {
    /// Estimate the memory consumption of this struct in bytes.
    ///
    /// Only the size of the struct itself is reported.
    pub fn get_memory_consumption(&self) -> usize {
        std::mem::size_of_val(self)
    }
}

impl CardinalityAggregationReq {
    /// Creates a new [`CardinalityAggregationReq`] instance from a field name.
    pub fn from_field_name(field_name: String) -> Self {
        Self {
            field: field_name,
            missing: None,
        }
    }
    /// Returns the field name the aggregation is computed on.
    pub fn field_name(&self) -> &str {
        &self.field
    }
}

/// Segment-level collector of the cardinality aggregation.
#[derive(Clone, Debug)]
pub(crate) struct SegmentCardinalityCollector {
    /// One bucket per parent bucket, indexed by the parent bucket id.
    buckets: Vec<SegmentCardinalityCollectorBucket>,
    /// Index used to look up the request data of this aggregation in the segment context.
    accessor_idx: usize,
    /// The column accessor to access the fast field values.
    accessor: Column<u64>,
    /// The column_type of the field.
    column_type: ColumnType,
    /// The missing value normalized to the internal u64 representation of the field type.
    missing_value_for_accessor: Option<u64>,
}

/// Per-bucket state of the segment cardinality collector.
#[derive(Clone, Debug, PartialEq, Default)]
pub(crate) struct SegmentCardinalityCollectorBucket {
    /// The sketch receiving the values of this bucket.
    cardinality: CardinalityCollector,
    /// Term ordinals seen for string columns. They are resolved to their terms and inserted
    /// into `cardinality` when the bucket is converted into an intermediate result.
    entries: FxHashSet<u64>,
}
impl SegmentCardinalityCollectorBucket {
    /// Creates an empty bucket whose sketch is salted with `column_type`.
    pub fn new(column_type: ColumnType) -> Self {
        Self {
            cardinality: CardinalityCollector::new(column_type as u8),
            entries: FxHashSet::default(),
        }
    }

    /// Converts the bucket into an [`IntermediateMetricResult::Cardinality`].
    ///
    /// For string columns the collected term ordinals are resolved through the dictionary and
    /// the terms are inserted into the sketch. The sentinel ordinal `u64::MAX` stands for a
    /// document without a value; it is replaced by the `missing` value of the request.
    ///
    /// A string `missing` value is hashed as bytes, the same representation as the dictionary
    /// terms. `str` and `[u8]` feed different data to the hasher, so hashing it as a `&str`
    /// would count a `missing` value equal to an existing term as a separate distinct value.
    ///
    /// # Errors
    /// Propagates errors from the dictionary lookup.
    ///
    /// # Panics
    /// Panics if the sentinel ordinal was collected although the request has no `missing`
    /// value.
    fn into_intermediate_metric_result(
        mut self,
        req_data: &CardinalityAggReqData,
    ) -> crate::Result<IntermediateMetricResult> {
        if req_data.column_type == ColumnType::Str {
            let fallback_dict = Dictionary::empty();
            let dict = req_data
                .str_dict_column
                .as_ref()
                .map(|el| el.dictionary())
                .unwrap_or_else(|| &fallback_dict);
            let mut has_missing = false;

            // TODO: replace FxHashSet with something that allows iterating in order
            // (e.g. sparse bitvec)
            let mut term_ids = Vec::new();
            for term_ord in self.entries {
                if term_ord == u64::MAX {
                    has_missing = true;
                } else {
                    // we can reasonably exclude values above u32::MAX
                    term_ids.push(term_ord as u32);
                }
            }

            // The dictionary lookup expects the ordinals in ascending order.
            term_ids.sort_unstable();
            dict.sorted_ords_to_term_cb(term_ids.iter().map(|&ord| u64::from(ord)), |term| {
                self.cardinality.insert(term);
                Ok(())
            })?;
            if has_missing {
                // Replace missing with the actual value provided
                let missing_key =
                    req_data.req.missing.as_ref().expect(
                        "Found sentinel value u64::MAX for term_ord but `missing` is not set",
                    );
                match missing_key {
                    Key::Str(missing) => {
                        // Same representation as the dictionary terms inserted above.
                        self.cardinality.insert(missing.as_bytes());
                    }
                    Key::F64(val) => {
                        let val = f64_to_u64(*val);
                        self.cardinality.insert(val);
                    }
                    Key::U64(val) => {
                        self.cardinality.insert(*val);
                    }
                    Key::I64(val) => {
                        self.cardinality.insert(*val);
                    }
                }
            }
        }

        Ok(IntermediateMetricResult::Cardinality(self.cardinality))
    }
}

impl SegmentCardinalityCollector {
    pub fn from_req(
        column_type: ColumnType,
        accessor_idx: usize,
        accessor: Column<u64>,
        missing_value_for_accessor: Option<u64>,
    ) -> Self {
        Self {
            buckets: vec![SegmentCardinalityCollectorBucket::new(column_type); 1],
            column_type,
            accessor_idx,
            accessor,
            missing_value_for_accessor,
        }
    }

    fn fetch_block_with_field(
        &mut self,
        docs: &[crate::DocId],
        agg_data: &mut AggregationsSegmentCtx,
    ) {
        agg_data.column_block_accessor.fetch_block_with_missing(
            docs,
            &self.accessor,
            self.missing_value_for_accessor,
        );
    }
}

impl SegmentAggregationCollector for SegmentCardinalityCollector {
    /// Moves the bucket of `parent_bucket_id` into `results` under the aggregation name.
    ///
    /// The slot is refilled with an empty bucket salted with the column type. A
    /// `Default` bucket would carry salt 0, so values collected into a reused slot
    /// would be hashed differently from the values of every other bucket.
    fn add_intermediate_aggregation_result(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
        results: &mut IntermediateAggregationResults,
        parent_bucket_id: BucketId,
    ) -> crate::Result<()> {
        self.prepare_max_bucket(parent_bucket_id, agg_data)?;
        let req_data = &agg_data.get_cardinality_req_data(self.accessor_idx);
        let name = req_data.name.to_string();
        // take the bucket in buckets and replace it with a new empty one
        let fresh_bucket = SegmentCardinalityCollectorBucket::new(self.column_type);
        let bucket = std::mem::replace(
            &mut self.buckets[parent_bucket_id as usize],
            fresh_bucket,
        );

        let intermediate_result = bucket.into_intermediate_metric_result(req_data)?;
        results.push(
            name,
            IntermediateAggregationResult::Metric(intermediate_result),
        )?;

        Ok(())
    }

    /// Collects the values of `docs` into the bucket of `parent_bucket_id`.
    ///
    /// String columns only record term ordinals; they are resolved when the bucket is turned
    /// into an intermediate result. IP address columns convert each compact value to its
    /// `u128` form before it is inserted. All other columns insert the `u64` values directly.
    fn collect(
        &mut self,
        parent_bucket_id: BucketId,
        docs: &[crate::DocId],
        agg_data: &mut AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        self.fetch_block_with_field(docs, agg_data);
        let bucket = &mut self.buckets[parent_bucket_id as usize];

        let col_block_accessor = &agg_data.column_block_accessor;
        if self.column_type == ColumnType::Str {
            bucket.entries.extend(col_block_accessor.iter_vals());
        } else if self.column_type == ColumnType::IpAddr {
            let compact_space_accessor = self
                .accessor
                .values
                .clone()
                .downcast_arc::<CompactSpaceU64Accessor>()
                .map_err(|_| {
                    TantivyError::AggregationError(
                        crate::aggregation::AggregationError::InternalError(
                            "Type mismatch: Could not downcast to CompactSpaceU64Accessor"
                                .to_string(),
                        ),
                    )
                })?;
            for val in col_block_accessor.iter_vals() {
                let val: u128 = compact_space_accessor.compact_to_u128(val as u32);
                bucket.cardinality.insert(val);
            }
        } else {
            for val in col_block_accessor.iter_vals() {
                bucket.cardinality.insert(val);
            }
        }

        Ok(())
    }

    /// Grows `buckets` so that `max_bucket` is a valid index; new slots get empty buckets
    /// salted with the column type.
    fn prepare_max_bucket(
        &mut self,
        max_bucket: BucketId,
        _agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        let required_len = max_bucket as usize + 1;
        if required_len > self.buckets.len() {
            let column_type = self.column_type;
            self.buckets.resize_with(required_len, || {
                SegmentCardinalityCollectorBucket::new(column_type)
            });
        }
        Ok(())
    }
}

#[derive(Clone, Debug)]
/// The cardinality collector used during segment collection and for merging results.
/// Uses Apache DataSketches HLL (lg_k=11, Hll4) for compact binary serialization
/// and cross-language compatibility (e.g. Java `datasketches` library).
///
/// Only the sketch is serialized; a deserialized collector always has a salt of `0`.
pub struct CardinalityCollector {
    /// The HLL sketch holding the inserted values.
    sketch: HllSketch,
    /// Salt derived from `ColumnType`, used to differentiate values of different column types
    /// that map to the same u64 (e.g. bool `false` = 0 vs i64 `0`).
    /// Not serialized — only needed during insertion, not after sketch registers are populated.
    salt: u8,
}

impl Default for CardinalityCollector {
    /// Creates an empty collector with a salt of `0`.
    fn default() -> Self {
        Self::new(0)
    }
}

impl PartialEq for CardinalityCollector {
    /// Always returns `false`: two collectors never compare equal, not even a collector with
    /// itself or with its own clone.
    ///
    /// NOTE(review): presumably the impl only exists so that containing types can derive
    /// `PartialEq`; any equality assertion on a value holding a collector will fail — confirm
    /// this is intended.
    fn eq(&self, _other: &Self) -> bool {
        false
    }
}

impl Serialize for CardinalityCollector {
    /// Writes the binary form of the sketch as a byte string. The salt is not written.
    fn serialize<S: Serializer>(&self, serializer: S) -> Result<S::Ok, S::Error> {
        let sketch_bytes = self.to_sketch_bytes();
        serializer.serialize_bytes(sketch_bytes.as_slice())
    }
}

impl<'de> Deserialize<'de> for CardinalityCollector {
    fn deserialize<D: Deserializer<'de>>(deserializer: D) -> Result<Self, D::Error> {
        let bytes: Vec<u8> = Deserialize::deserialize(deserializer)?;
        let sketch = HllSketch::deserialize(&bytes).map_err(serde::de::Error::custom)?;
        Ok(Self { sketch, salt: 0 })
    }
}

impl CardinalityCollector {
    fn new(salt: u8) -> Self {
        Self {
            sketch: HllSketch::new(LG_K, HllType::Hll4),
            salt,
        }
    }

    /// Insert a value into the HLL sketch, salted by the column type.
    /// The salt ensures that identical u64 values from different column types
    /// (e.g. bool `false` vs i64 `0`) are counted as distinct.
    pub(crate) fn insert<T: Hash>(&mut self, value: T) {
        self.sketch.update((self.salt, value));
    }

    /// Compute the final cardinality estimate.
    pub fn finalize(self) -> Option<f64> {
        Some(self.sketch.estimate().trunc())
    }

    /// Serialize the HLL sketch to its compact binary representation.
    /// The format is cross-language compatible with Apache DataSketches (Java, C++, Python).
    pub fn to_sketch_bytes(&self) -> Vec<u8> {
        self.sketch.serialize()
    }

    pub(crate) fn merge_fruits(&mut self, right: CardinalityCollector) -> crate::Result<()> {
        let mut union = HllUnion::new(LG_K);
        union.update(&self.sketch);
        union.update(&right.sketch);
        self.sketch = union.get_result(HllType::Hll4);
        Ok(())
    }
}

#[cfg(test)]
mod tests {

    use std::net::IpAddr;
    use std::str::FromStr;

    use columnar::MonotonicallyMappableToU64;

    use crate::aggregation::agg_req::Aggregations;
    use crate::aggregation::tests::{exec_request, get_test_index_from_terms};
    use crate::schema::{IntoIpv6Addr, Schema, FAST};
    use crate::Index;

    #[test]
    fn cardinality_aggregation_test_empty_index() -> crate::Result<()> {
        let values = vec![];
        let index = get_test_index_from_terms(false, &values)?;
        let agg_req: Aggregations = serde_json::from_value(json!({
            "cardinality": {
                "cardinality": {
                    "field": "string_id",
                }
            },
        }))
        .unwrap();

        let res = exec_request(agg_req, &index)?;
        assert_eq!(res["cardinality"]["value"], 0.0);

        Ok(())
    }

    #[test]
    fn cardinality_aggregation_test_single_segment() -> crate::Result<()> {
        cardinality_aggregation_test_merge_segment(true)
    }
    #[test]
    fn cardinality_aggregation_test() -> crate::Result<()> {
        cardinality_aggregation_test_merge_segment(false)
    }
    fn cardinality_aggregation_test_merge_segment(merge_segments: bool) -> crate::Result<()> {
        let segment_and_terms = vec![
            vec!["terma"],
            vec!["termb"],
            vec!["termc"],
            vec!["terma"],
            vec!["terma"],
            vec!["terma"],
            vec!["termb"],
            vec!["terma"],
        ];
        let index = get_test_index_from_terms(merge_segments, &segment_and_terms)?;
        let agg_req: Aggregations = serde_json::from_value(json!({
            "cardinality": {
                "cardinality": {
                    "field": "string_id",
                }
            },
        }))
        .unwrap();

        let res = exec_request(agg_req, &index)?;
        assert_eq!(res["cardinality"]["value"], 3.0);

        Ok(())
    }

    #[test]
    fn cardinality_aggregation_u64() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let id_field = schema_builder.add_u64_field("id", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut writer = index.writer_for_tests()?;
            writer.add_document(doc!(id_field => 1u64))?;
            writer.add_document(doc!(id_field => 2u64))?;
            writer.add_document(doc!(id_field => 3u64))?;
            writer.add_document(doc!())?;
            writer.commit()?;
        }

        let agg_req: Aggregations = serde_json::from_value(json!({
            "cardinality": {
                "cardinality": {
                    "field": "id",
                    "missing": 0u64
                },
            }
        }))
        .unwrap();

        let res = exec_request(agg_req, &index)?;
        assert_eq!(res["cardinality"]["value"], 4.0);

        Ok(())
    }

    /// Cardinality over an IP address fast field: the same loopback address is
    /// indexed twice next to one other address, so two distinct values are expected.
    #[test]
    fn cardinality_aggregation_ip_addr() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let ip_field = builder.add_ip_addr_field("ip_field", FAST);
        let index = Index::create_in_ram(builder.build());
        {
            let mut index_writer = index.writer_for_tests()?;
            // Twice the IpV6 loopback, then one IpV4 address.
            for address in ["::1", "::1", "127.0.0.1"] {
                let ip = IpAddr::from_str(address).unwrap().into_ipv6_addr();
                index_writer.add_document(doc!(ip_field => ip))?;
            }
            index_writer.commit()?;
        }

        let request = json!({
            "cardinality": {
                "cardinality": {
                    "field": "ip_field"
                },
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();

        let response = exec_request(agg_req, &index)?;
        assert_eq!(response["cardinality"]["value"], 2.0);

        Ok(())
    }

    /// Cardinality over a JSON path that holds both booleans and integers:
    /// all four indexed values are expected to be counted as distinct.
    #[test]
    fn cardinality_aggregation_json() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let json_field = builder.add_json_field("json", FAST);
        let index = Index::create_in_ram(builder.build());
        {
            let mut index_writer = index.writer_for_tests()?;
            let payloads = [
                json!(false),
                json!(true),
                json!(i64::from_u64(0u64)),
                json!(i64::from_u64(1u64)),
            ];
            for payload in payloads {
                index_writer.add_document(doc!(json_field => json!({"value": payload})))?;
            }
            index_writer.commit()?;
        }

        let request = json!({
            "cardinality": {
                "cardinality": {
                    "field": "json.value"
                },
            }
        });
        let agg_req: Aggregations = serde_json::from_value(request).unwrap();

        let response = exec_request(agg_req, &index)?;
        assert_eq!(response["cardinality"]["value"], 4.0);

        Ok(())
    }

    /// A collector serialized to JSON and read back must report the same
    /// estimate as the collector it was created from.
    #[test]
    fn cardinality_collector_serde_roundtrip() {
        use super::CardinalityCollector;

        let mut original = CardinalityCollector::default();
        // "hello" appears twice on purpose: duplicates must not be counted again.
        for term in ["hello", "world", "hello"] {
            original.insert(term);
        }

        let json_bytes = serde_json::to_vec(&original).unwrap();
        let restored: CardinalityCollector = serde_json::from_slice(&json_bytes).unwrap();

        let estimate_before = original.finalize().unwrap();
        let estimate_after = restored.finalize().unwrap();
        assert_eq!(estimate_before, estimate_after);
        assert_eq!(estimate_before, 2.0);
    }

    /// Merging two collectors that share one value yields the size of the union.
    #[test]
    fn cardinality_collector_merge() {
        use super::CardinalityCollector;

        let mut merged = CardinalityCollector::default();
        for term in ["a", "b"] {
            merged.insert(term);
        }

        let mut incoming = CardinalityCollector::default();
        for term in ["b", "c"] {
            incoming.insert(term);
        }

        merged.merge_fruits(incoming).unwrap();
        let union_estimate = merged.finalize().unwrap();
        assert_eq!(union_estimate, 3.0);
    }

    /// The bytes produced by `to_sketch_bytes` must be readable by
    /// `HllSketch::deserialize` and give an estimate close to the inserted count.
    #[test]
    fn cardinality_collector_serialize_deserialize_binary() {
        use datasketches::hll::HllSketch;

        use super::CardinalityCollector;

        let mut collector = CardinalityCollector::default();
        for fruit in ["apple", "banana", "cherry"] {
            collector.insert(fruit);
        }

        let sketch_bytes = collector.to_sketch_bytes();
        let sketch = HllSketch::deserialize(&sketch_bytes).unwrap();
        let error = (sketch.estimate() - 3.0).abs();
        assert!(error < 0.01);
    }

    /// Collectors created with different salts must keep identical raw `u64`
    /// values apart once they are merged.
    #[test]
    fn cardinality_collector_salt_differentiates_types() {
        use super::CardinalityCollector;

        // Without salt, same u64 value from different column types would collide
        let mut bool_collector = CardinalityCollector::new(5); // e.g. ColumnType::Bool
        let mut i64_collector = CardinalityCollector::new(2); // e.g. ColumnType::I64
        for raw in [0u64, 1u64] {
            // For the bool collector these stand for false / true.
            bool_collector.insert(raw);
        }
        for raw in [0u64, 1u64] {
            i64_collector.insert(raw);
        }

        // Merge them
        bool_collector.merge_fruits(i64_collector).unwrap();
        let merged_estimate = bool_collector.finalize().unwrap();
        // Should be 4 because salt makes (5, 0) != (2, 0) and (5, 1) != (2, 1)
        assert_eq!(merged_estimate, 4.0);
    }
}


================================================
FILE: src/aggregation/metric/count.rs
================================================
use std::fmt::Debug;

use serde::{Deserialize, Serialize};

use super::*;
use crate::aggregation::*;

/// A single-value metric aggregation that counts the number of values that are
/// extracted from the aggregated documents.
/// See [super::SingleMetricResult] for return value.
///
/// # JSON Format
/// ```json
/// {
///     "value_count": {
///         "field": "score"
///     }
/// }
/// ```
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct CountAggregation {
    /// The name of the field whose values are counted.
    pub field: String,
    /// The missing parameter defines how documents that are missing a value should be treated.
    /// By default they will be ignored but it is also possible to treat them as if they had a
    /// value. Example in JSON format:
    /// `{ "field": "my_numbers", "missing": "10.0" }`
    ///
    /// The key is optional: when it is absent the field is `None`. When present it is
    /// read through the `deserialize_option_f64` helper.
    #[serde(default, deserialize_with = "deserialize_option_f64")]
    pub missing: Option<f64>,
}

impl CountAggregation {
    /// Creates a new [`CountAggregation`] instance from a field name.
    pub fn from_field_name(field_name: String) -> Self {
        Self {
            field: field_name,
            missing: None,
        }
    }
    /// Returns the field name the aggregation is computed on.
    pub fn field_name(&self) -> &str {
        &self.field
    }
}

/// Intermediate result of the count aggregation that can be combined with other intermediate
/// results.
#[derive(Default, Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct IntermediateCount {
    /// The underlying stats accumulator; the count aggregation only reports its `count`.
    stats: IntermediateStats,
}

impl IntermediateCount {
    /// Creates a new [`IntermediateCount`] instance from a [`SegmentStatsCollector`].
    pub(crate) fn from_stats(stats: IntermediateStats) -> Self {
        Self { stats }
    }
    /// Merges the other intermediate result into self.
    pub fn merge_fruits(&mut self, other: IntermediateCount) {
        self.stats.merge_fruits(other.stats);
    }
    /// Computes the final count value.
    pub fn finalize(&self) -> Option<f64> {
        Some(self.stats.finalize().count as f64)
    }
}


================================================
FILE: src/aggregation/metric/extended_stats.rs
================================================
use std::fmt::Debug;
use std::mem;

use serde::{Deserialize, Serialize};

use super::*;
use crate::aggregation::agg_data::AggregationsSegmentCtx;
use crate::aggregation::intermediate_agg_result::{
    IntermediateAggregationResult, IntermediateAggregationResults, IntermediateMetricResult,
};
use crate::aggregation::segment_agg_result::SegmentAggregationCollector;
use crate::aggregation::*;
use crate::TantivyError;

/// A multi-value metric aggregation that computes a collection of extended statistics
/// on numeric values that are extracted
/// from the aggregated documents.
/// See [`ExtendedStats`] for returned statistics.
///
/// # JSON Format
/// ```json
/// {
///     "extended_stats": {
///         "field": "score"
///     }
///  }
/// ```
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct ExtendedStatsAggregation {
    /// The field name to compute the stats on.
    pub field: String,
    /// The missing parameter defines how documents that are missing a value should be treated.
    /// By default they will be ignored but it is also possible to treat them as if they had a
    /// value. Example in JSON format:
    /// `{ "field": "my_numbers", "missing": "10.0" }`
    ///
    /// Read through `deserialize_option_f64`, like the `missing` parameter of
    /// [`CountAggregation`], so that the string form shown above is not rejected.
    #[serde(default, deserialize_with = "deserialize_option_f64")]
    pub missing: Option<f64>,
    /// The sigma parameter defines how the standard deviation bounds are calculated.
    /// This can be a useful way to visualize variance of your data.
    /// The default value is 2. Example in JSON format:
    /// `{ "field": "my_numbers", "sigma": 3.0 }`
    #[serde(default)]
    pub sigma: Option<f64>,
}

impl ExtendedStatsAggregation {
    /// Creates a new [`ExtendedStatsAggregation`] instance from a field name.
    pub fn from_field_name(field_name: String) -> Self {
        ExtendedStatsAggregation {
            field: field_name,
            missing: None,
            sigma: None,
        }
    }
    /// Returns the field name the aggregation is computed on.
    pub fn field_name(&self) -> &str {
        &self.field
    }
}

/// Extended stats contains a collection of statistics:
/// it extends the basic stats with variance, standard deviation
/// and bound information.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct ExtendedStats {
    /// The number of documents.
    pub count: u64,
    /// The sum of the fast field values.
    pub sum: f64,
    /// The min value of the fast field values. `None` if count equals zero.
    pub min: Option<f64>,
    /// The max value of the fast field values. `None` if count equals zero.
    pub max: Option<f64>,
    /// The average of the fast field values. `None` if count equals zero.
    pub avg: Option<f64>,
    /// The sum of squares of the fast field values. `None` if count equals zero.
    pub sum_of_squares: Option<f64>,
    /// The (population) variance of the fast field values. `None` if count is 0 or 1.
    pub variance: Option<f64>,
    /// The population variance of the fast field values, always equal to `variance`.
    /// `None` if count is 0 or 1.
    pub variance_population: Option<f64>,
    /// The sampling variance of the fast field values, i.e. divided by `count - 1`
    /// instead of `count`. `None` if count is 0 or 1.
    pub variance_sampling: Option<f64>,
    /// The standard deviation of the fast field values (square root of `variance`).
    /// `None` if count is 0 or 1.
    pub std_deviation: Option<f64>,
    /// The population standard deviation of the fast field values, always equal to
    /// `std_deviation`. `None` if count is 0 or 1.
    pub std_deviation_population: Option<f64>,
    /// The sampling standard deviation of the fast field values (square root of
    /// `variance_sampling`). `None` if count is 0 or 1.
    pub std_deviation_sampling: Option<f64>,
    /// The standard deviation bounds of the fast field values, see
    /// [`StandardDeviationBounds`]. `None` if count is 0 or 1.
    pub std_deviation_bounds: Option<StandardDeviationBounds>,
}

/// A sub struct of [`ExtendedStats`] containing the deviation bounds.
/// The values depend on sigma and represent
/// the bounds around the average at a distance of
/// `std_deviation * sigma`.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct StandardDeviationBounds {
    /// Upper bound: `avg + std_deviation * sigma`.
    pub upper: f64,
    /// Lower bound: `avg - std_deviation * sigma`.
    pub lower: f64,
    /// Upper sampling bound: `avg + std_deviation_sampling * sigma`.
    pub upper_sampling: f64,
    /// Lower sampling bound: `avg - std_deviation_sampling * sigma`.
    pub lower_sampling: f64,
    /// Same value as `upper`.
    pub upper_population: f64,
    /// Same value as `lower`.
    pub lower_population: f64,
}

impl ExtendedStats {
    /// Looks up a single statistic by its property name.
    ///
    /// Plain statistics are addressed by their field name (`"count"`, `"avg"`, ...), the
    /// members of the deviation bounds with a `std_deviation_bounds.` prefix.
    ///
    /// Returns `Ok(None)` when the statistic exists but holds no value, and
    /// [`TantivyError::InvalidArgument`] when `agg_property` is not a known name.
    pub(crate) fn get_value(&self, agg_property: &str) -> crate::Result<Option<f64>> {
        // `Option<&_>` is `Copy`, so it can be shared by all the bounds arms below.
        let bounds = self.std_deviation_bounds.as_ref();
        let value = match agg_property {
            "count" => Some(self.count as f64),
            "sum" => Some(self.sum),
            "min" => self.min,
            "max" => self.max,
            "avg" => self.avg,
            "variance" => self.variance,
            "variance_sampling" => self.variance_sampling,
            "variance_population" => self.variance_population,
            "sum_of_squares" => self.sum_of_squares,
            "std_deviation" => self.std_deviation,
            "std_deviation_sampling" => self.std_deviation_sampling,
            "std_deviation_population" => self.std_deviation_population,
            "std_deviation_bounds.lower" => bounds.map(|b| b.lower),
            "std_deviation_bounds.lower_population" => bounds.map(|b| b.lower_population),
            "std_deviation_bounds.lower_sampling" => bounds.map(|b| b.lower_sampling),
            "std_deviation_bounds.upper" => bounds.map(|b| b.upper),
            "std_deviation_bounds.upper_population" => bounds.map(|b| b.upper_population),
            "std_deviation_bounds.upper_sampling" => bounds.map(|b| b.upper_sampling),
            _ => {
                return Err(TantivyError::InvalidArgument(format!(
                    "Unknown property {agg_property} on stats metric aggregation"
                )));
            }
        };
        Ok(value)
    }
}

/// Intermediate result of the extended stats aggregation that can be combined with other
/// intermediate results.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct IntermediateExtendedStats {
    /// The basic stats accumulator; its `count`, `sum`, `min` and `max` are read when
    /// merging and finalizing.
    intermediate_stats: IntermediateStats,
    /// The running sum of squared differences from the mean, referred to as M2 in
    /// Welford's online algorithm. The variances are derived from it.
    sum_of_squares: f64,
    /// The sum of the squared values as computed by Elasticsearch; this is the value
    /// reported as `sum_of_squares` in the final result.
    sum_of_squares_elastic: f64,
    /// The running compensation term of the Kahan summation used for
    /// `sum_of_squares_elastic`.
    delta_sum_for_squares_elastic: f64,
    /// The mean is an intermediate value needed for calculating the variance
    /// as per [Welford's online algorithm](https://en.wikipedia.org/wiki/Algorithms_for_calculating_variance#Welford's_online_algorithm)
    mean: f64,
    /// The value used for computing standard deviation bounds
    sigma: f64,
}

impl Default for IntermediateExtendedStats {
    fn default() -> Self {
        Self {
            intermediate_stats: IntermediateStats::default(),
            sum_of_squares: 0.0,
            sum_of_squares_elastic: 0.0,
            delta_sum_for_squares_elastic: 0.0,
            mean: 0.0,
            // The default value is the same of ElasticSearch
            sigma: 2.0,
        }
    }
}

impl IntermediateExtendedStats {
    /// Creates an empty accumulator.
    ///
    /// `sigma` is the factor used for the standard deviation bounds; `None` selects `2.0`,
    /// the same default as ElasticSearch.
    pub fn with_sigma(sigma: Option<f64>) -> Self {
        let sigma = match sigma {
            Some(requested) => requested,
            None => 2.0,
        };
        Self {
            sigma,
            mean: 0.0,
            delta_sum_for_squares_elastic: 0.0,
            sum_of_squares_elastic: 0.0,
            sum_of_squares: 0.0,
            intermediate_stats: IntermediateStats::default(),
        }
    }

    /// Merges the other stats intermediate result into self.
    ///
    /// An empty `other` is ignored and an empty `self` is overwritten by `other`.
    /// Otherwise the two sums of squared differences are combined with a correction
    /// term based on the gap between both means.
    pub fn merge_fruits(&mut self, other: IntermediateExtendedStats) {
        let own_count = self.intermediate_stats.count;
        let other_count = other.intermediate_stats.count;
        if other_count == 0 {
            return;
        }
        if own_count == 0 {
            drop(mem::replace(self, other));
            return;
        }

        let merged_count = own_count + other_count;
        let mean_gap = other.mean - self.mean;
        let correction =
            mean_gap * mean_gap * own_count as f64 * other_count as f64 / merged_count as f64;
        self.sum_of_squares += other.sum_of_squares + correction;

        // The sums are still unmerged here, so the merged mean is computed from both.
        let merged_sum = self.intermediate_stats.sum + other.intermediate_stats.sum;
        self.mean = merged_sum / merged_count as f64;

        self.sum_of_squares_elastic += other.sum_of_squares_elastic;
        self.delta_sum_for_squares_elastic += other.delta_sum_for_squares_elastic;
        self.intermediate_stats
            .merge_fruits(other.intermediate_stats);
    }

    /// Computes the final stats value.
    ///
    /// `min`, `max`, `avg` and `sum_of_squares` are `None` without any value; the
    /// variances, standard deviations and bounds are `None` with fewer than two values.
    pub fn finalize(&self) -> Box<ExtendedStats> {
        let stats = &self.intermediate_stats;
        let count = stats.count;

        let has_values = count != 0;
        let min = has_values.then(|| stats.min);
        let max = has_values.then(|| stats.max);
        let avg = has_values.then(|| self.mean);
        let sum_of_squares = has_values.then(|| self.sum_of_squares_elastic);

        // The closures keep `count - 1` from being evaluated when count is 0.
        let has_spread = count > 1;
        let variance = has_spread.then(|| self.sum_of_squares / count as f64);
        let variance_sampling = has_spread.then(|| self.sum_of_squares / (count - 1) as f64);

        let std_deviation = variance.map(f64::sqrt);
        let std_deviation_sampling = variance_sampling.map(f64::sqrt);

        let std_deviation_bounds =
            std_deviation
                .zip(std_deviation_sampling)
                .map(|(population, sampling)| {
                    let upper = self.mean + population * self.sigma;
                    let lower = self.mean - population * self.sigma;
                    StandardDeviationBounds {
                        upper,
                        lower,
                        upper_sampling: self.mean + sampling * self.sigma,
                        lower_sampling: self.mean - sampling * self.sigma,
                        upper_population: upper,
                        lower_population: lower,
                    }
                });

        Box::new(ExtendedStats {
            count,
            sum: stats.sum,
            min,
            max,
            avg,
            sum_of_squares,
            variance,
            variance_population: variance,
            variance_sampling,
            std_deviation,
            std_deviation_population: std_deviation,
            std_deviation_sampling,
            std_deviation_bounds,
        })
    }

    /// Updates the mean and the sum of squared differences for one value.
    /// Expects `intermediate_stats` to already account for `value`.
    fn update_variance(&mut self, value: f64) {
        let gap_to_old_mean = value - self.mean;
        // Welford's online algorithm would update the mean incrementally
        // (mean += delta / count). Recomputing it from sum and count instead
        // avoids a small rounding error (in the 15th decimal place) that made
        // test_aggregation_level1 in agg_test.rs fail.
        self.mean = self.intermediate_stats.sum / self.intermediate_stats.count as f64;
        let gap_to_new_mean = value - self.mean;
        self.sum_of_squares += gap_to_old_mean * gap_to_new_mean;
    }

    /// Adds one value to every accumulator.
    #[inline]
    fn collect(&mut self, value: f64) {
        self.intermediate_stats.collect(value);

        // Kahan summation of `value * value` into sum_of_squares_elastic.
        let compensated_square = value * value - self.delta_sum_for_squares_elastic;
        let running_total = self.sum_of_squares_elastic + compensated_square;
        self.delta_sum_for_squares_elastic =
            (running_total - self.sum_of_squares_elastic) - compensated_square;
        self.sum_of_squares_elastic = running_total;

        self.update_variance(value);
    }
}

/// Segment-level collector of the extended stats aggregation. It keeps one
/// [`IntermediateExtendedStats`] accumulator per parent bucket.
#[derive(Clone, Debug)]
pub(crate) struct SegmentExtendedStatsCollector {
    /// The key under which the intermediate result is pushed.
    name: String,
    /// The `missing` value of the request converted to its fast field `u64` form, if any.
    missing: Option<u64>,
    /// The column type, used to convert the stored `u64` values back to `f64`.
    field_type: ColumnType,
    /// The column the values are read from.
    accessor: columnar::Column<u64>,
    /// One accumulator per parent bucket, indexed by the bucket id.
    buckets: Vec<IntermediateExtendedStats>,
    /// The sigma of the request, handed to every newly created accumulator.
    sigma: Option<f64>,
}

impl SegmentExtendedStatsCollector {
    /// Builds the collector for one metric request.
    ///
    /// The `missing` value of the request is converted with `f64_to_fastfield_u64`,
    /// and 16 accumulators using `sigma` are created up front.
    pub fn from_req(req: &MetricAggReqData, sigma: Option<f64>) -> Self {
        let missing = match req.missing {
            Some(val) => f64_to_fastfield_u64(val, &req.field_type),
            None => None,
        };
        let empty_bucket = IntermediateExtendedStats::with_sigma(sigma);
        Self {
            name: req.name.clone(),
            missing,
            field_type: req.field_type,
            accessor: req.accessor.clone(),
            buckets: vec![empty_bucket; 16],
            sigma,
        }
    }
}

impl SegmentAggregationCollector for SegmentExtendedStatsCollector {
    /// Moves the accumulator of `parent_bucket_id` into `results` under this
    /// collector's name.
    ///
    /// The emptied slot is refilled with an accumulator that carries the configured
    /// sigma, exactly like the slots created by `prepare_max_bucket`. A plain
    /// `Default` value would silently fall back to sigma `2.0`.
    #[inline]
    fn add_intermediate_aggregation_result(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
        results: &mut IntermediateAggregationResults,
        parent_bucket_id: BucketId,
    ) -> crate::Result<()> {
        let name = self.name.clone();
        // Make sure the slot exists before it is indexed.
        self.prepare_max_bucket(parent_bucket_id, agg_data)?;
        let fresh_bucket = IntermediateExtendedStats::with_sigma(self.sigma);
        let extended_stats =
            std::mem::replace(&mut self.buckets[parent_bucket_id as usize], fresh_bucket);
        results.push(
            name,
            IntermediateAggregationResult::Metric(IntermediateMetricResult::ExtendedStats(
                extended_stats,
            )),
        )?;

        Ok(())
    }

    /// Collects the values of `docs` into the accumulator of `parent_bucket_id`.
    ///
    /// The slot is indexed directly, so it must already exist
    /// (see `prepare_max_bucket`).
    #[inline]
    fn collect(
        &mut self,
        parent_bucket_id: BucketId,
        docs: &[crate::DocId],
        agg_data: &mut AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        // Work on a local copy of the accumulator and write it back after the loop.
        let mut extended_stats = self.buckets[parent_bucket_id as usize].clone();

        agg_data
            .column_block_accessor
            .fetch_block_with_missing(docs, &self.accessor, self.missing);
        for val in agg_data.column_block_accessor.iter_vals() {
            // The column stores `u64`; convert back according to the column type.
            let val1 = f64_from_fastfield_u64(val, self.field_type);
            extended_stats.collect(val1);
        }

        // store back
        self.buckets[parent_bucket_id as usize] = extended_stats;

        Ok(())
    }

    /// Grows `buckets` so that `max_bucket` is a valid index. New slots are empty
    /// accumulators using the configured sigma. Never shrinks.
    fn prepare_max_bucket(
        &mut self,
        max_bucket: BucketId,
        _agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        if self.buckets.len() <= max_bucket as usize {
            self.buckets.resize_with(max_bucket as usize + 1, || {
                IntermediateExtendedStats::with_sigma(self.sigma)
            });
        }
        Ok(())
    }
}

#[cfg(test)]
mod tests {

    use crate::aggregation::agg_req::Aggregations;
    use crate::aggregation::agg_result::AggregationResults;
    use crate::aggregation::metric::IntermediateExtendedStats;
    use crate::aggregation::tests::get_test_index_from_values;
    use crate::aggregation::AggregationCollector;
    use crate::assert_nearly_equals;
    use crate::query::AllQuery;

    const EPSILON_FOR_TEST: f64 = 0.000000000002;

    /// With a single value the basic statistics are defined, while every variance,
    /// standard deviation and bound must be absent.
    #[test]
    fn test_aggregation_extended_stats_no_variance() -> crate::Result<()> {
        let scores = vec![1.0];
        let index = get_test_index_from_values(false, &scores)?;

        let request = json!({
            "my_stats": {
                "extended_stats": {
                    "field": "score_f64",
                },
            }
        });
        let agg_req_1: Aggregations = serde_json::from_value(request).unwrap();
        let collector = AggregationCollector::from_aggs(agg_req_1, Default::default());

        let index_reader = index.reader()?;
        let searcher = index_reader.searcher();
        let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();
        let value_of = |property: &str| agg_res.get_value_from_aggregation("my_stats", property);

        for property in ["count", "min", "max", "sum", "avg"] {
            assert_eq!(value_of(property)?.unwrap(), 1.0, "{property}");
        }

        let absent_deviations = [
            "std_deviation",
            "std_deviation_population",
            "std_deviation_sampling",
            "std_deviation_bounds.lower",
            "std_deviation_bounds.lower_population",
            "std_deviation_bounds.lower_sampling",
            "std_deviation_bounds.upper",
            "std_deviation_bounds.upper_population",
            "std_deviation_bounds.upper_sampling",
        ];
        for property in absent_deviations {
            assert!(value_of(property)?.is_none(), "{property}");
        }

        assert_eq!(value_of("sum_of_squares")?.unwrap(), 1.0);

        for property in ["variance_population", "variance", "variance_sampling"] {
            assert!(value_of(property)?.is_none(), "{property}");
        }

        Ok(())
    }

    /// Checks every extended statistic for six values with the default sigma.
    #[test]
    fn test_aggregation_extended_stats() -> crate::Result<()> {
        const EXPECTED_VARIANCE: f64 = 9.138888888888888;

        let scores = vec![1.0, 3.0, 4.0, 5.0, 8.0, 10.0];
        let index = get_test_index_from_values(false, &scores)?;

        let request = json!({
            "my_stats": {
                "extended_stats": {
                    "field": "score_f64",
                },
            }
        });
        let agg_req_1: Aggregations = serde_json::from_value(request).unwrap();
        let collector = AggregationCollector::from_aggs(agg_req_1, Default::default());

        let index_reader = index.reader()?;
        let searcher = index_reader.searcher();
        let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();
        let value_of = |property: &str| agg_res.get_value_from_aggregation("my_stats", property);

        // Statistics that must match exactly.
        let exact = [
            ("count", 6.0),
            ("min", 1.0),
            ("max", 10.0),
            ("sum", 31.0),
            ("sum_of_squares", 215.0),
        ];
        for (property, expected) in exact {
            assert_eq!(value_of(property)?.unwrap(), expected, "{property}");
        }

        // Statistics compared with a tolerance: (property, expected value, epsilon).
        let expected_std_deviation = EXPECTED_VARIANCE.sqrt();
        let approximate = [
            ("avg", 5.166666666666667, EPSILON_FOR_TEST),
            ("std_deviation", expected_std_deviation, EPSILON_FOR_TEST),
            (
                "std_deviation_population",
                expected_std_deviation,
                EPSILON_FOR_TEST,
            ),
            (
                "std_deviation_sampling",
                3.311595788538611,
                EPSILON_FOR_TEST,
            ),
            (
                "std_deviation_bounds.lower",
                -0.8794523824056837,
                EPSILON_FOR_TEST,
            ),
            (
                "std_deviation_bounds.lower_population",
                -0.8794523824056837,
                0.00000000000001,
            ),
            (
                "std_deviation_bounds.lower_sampling",
                -1.4565249104105549,
                EPSILON_FOR_TEST,
            ),
            (
                "std_deviation_bounds.upper",
                11.212785715739017,
                EPSILON_FOR_TEST,
            ),
            (
                "std_deviation_bounds.upper_population",
                11.212785715739017,
                EPSILON_FOR_TEST,
            ),
            (
                "std_deviation_bounds.upper_sampling",
                11.78985824374389,
                EPSILON_FOR_TEST,
            ),
            ("variance_population", EXPECTED_VARIANCE, EPSILON_FOR_TEST),
            ("variance", EXPECTED_VARIANCE, EPSILON_FOR_TEST),
            ("variance_sampling", 10.966666666666663, EPSILON_FOR_TEST),
        ];
        for (property, expected, epsilon) in approximate {
            assert_nearly_equals!(value_of(property)?.unwrap(), expected, epsilon);
        }

        Ok(())
    }

    #[test]
    fn test_aggregation_extended_stats_with_sigma() -> crate::Result<()> {
        // `variance`/`std_deviation` and their `_population` twins are asserted against this
        // same value below.
        const EXPECTED_VARIANCE: f64 = 2.9166666666666665;

        let values = vec![1.0, 2.0, 3.0, 4.0, 5.0, 6.0];
        let index = get_test_index_from_values(false, &values)?;

        let request: Aggregations = serde_json::from_value(json!({
            "my_stats": {
                "extended_stats": {
                    "field": "score_f64",
                    "sigma": 1.5
                },
            }
        }))
        .unwrap();
        let collector = AggregationCollector::from_aggs(request, Default::default());

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();

        // Looks up one property of the "my_stats" aggregation and unwraps the optional value.
        let stat = |property: &str| -> crate::Result<f64> {
            let value = agg_res.get_value_from_aggregation("my_stats", property)?;
            Ok(value.unwrap())
        };

        // Basic stats, compared for exact equality.
        assert_eq!(stat("count")?, 6.0);
        assert_eq!(stat("min")?, 1.0);
        assert_eq!(stat("max")?, 6.0);
        assert_eq!(stat("sum")?, 21.0);
        assert_eq!(stat("avg")?, 3.5);

        // Standard deviations.
        assert_nearly_equals!(
            stat("std_deviation")?,
            EXPECTED_VARIANCE.sqrt(),
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            stat("std_deviation_population")?,
            EXPECTED_VARIANCE.sqrt(),
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            stat("std_deviation_sampling")?,
            1.8708286933869709,
            EPSILON_FOR_TEST
        );

        // Bounds computed with the requested sigma of 1.5.
        assert_nearly_equals!(
            stat("std_deviation_bounds.lower")?,
            0.9382623085101005,
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            stat("std_deviation_bounds.lower_population")?,
            0.9382623085101005,
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            stat("std_deviation_bounds.lower_sampling")?,
            0.6937569599195434,
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            stat("std_deviation_bounds.upper")?,
            6.061737691489899,
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            stat("std_deviation_bounds.upper_population")?,
            6.061737691489899,
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            stat("std_deviation_bounds.upper_sampling")?,
            6.3062430400804566,
            EPSILON_FOR_TEST
        );

        assert_eq!(stat("sum_of_squares")?, 91.0);

        // Variances.
        assert_nearly_equals!(
            stat("variance_population")?,
            EXPECTED_VARIANCE,
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(stat("variance")?, EXPECTED_VARIANCE, EPSILON_FOR_TEST);
        assert_nearly_equals!(stat("variance_sampling")?, 3.5, EPSILON_FOR_TEST);

        Ok(())
    }

    #[test]
    fn test_aggregation_extended_stats_with_variance_similar_to_mean() -> crate::Result<()> {
        // `variance`/`std_deviation` and their `_population` twins are asserted against this
        // same value below.
        const EXPECTED_VARIANCE: f64 = 5.5555555555608854e-5;

        // Values that sit very close to each other (and hence to their mean).
        let values = vec![50.01, 50.02, 50.01, 50.03, 50.01, 50.02];
        let index = get_test_index_from_values(false, &values)?;

        let request: Aggregations = serde_json::from_value(json!({
            "my_stats": {
                "extended_stats": {
                    "field": "score_f64",
                    "sigma": 1.5
                },
            }
        }))
        .unwrap();
        let collector = AggregationCollector::from_aggs(request, Default::default());

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();

        // Looks up one property of the "my_stats" aggregation and unwraps the optional value.
        let stat = |property: &str| -> crate::Result<f64> {
            let value = agg_res.get_value_from_aggregation("my_stats", property)?;
            Ok(value.unwrap())
        };

        // Basic stats, compared for exact equality.
        assert_eq!(stat("count")?, 6.0);
        assert_eq!(stat("min")?, 50.01);
        assert_eq!(stat("max")?, 50.03);
        assert_eq!(stat("sum")?, 300.1);

        assert_nearly_equals!(stat("avg")?, 50.01666666666667, EPSILON_FOR_TEST);

        // Standard deviations.
        assert_nearly_equals!(
            stat("std_deviation")?,
            EXPECTED_VARIANCE.sqrt(),
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            stat("std_deviation_population")?,
            EXPECTED_VARIANCE.sqrt(),
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            stat("std_deviation_sampling")?,
            0.008164965809279263,
            EPSILON_FOR_TEST
        );

        // Bounds computed with the requested sigma of 1.5.
        assert_nearly_equals!(
            stat("std_deviation_bounds.lower")?,
            50.00548632677917,
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            stat("std_deviation_bounds.lower_population")?,
            50.00548632677917,
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            stat("std_deviation_bounds.lower_sampling")?,
            50.00441921795275,
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            stat("std_deviation_bounds.upper")?,
            50.027847006554175,
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            stat("std_deviation_bounds.upper_population")?,
            50.027847006554175,
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            stat("std_deviation_bounds.upper_sampling")?,
            50.028914115380594,
            EPSILON_FOR_TEST
        );

        assert_nearly_equals!(stat("sum_of_squares")?, 15010.002, EPSILON_FOR_TEST);

        // Variances.
        assert_nearly_equals!(
            stat("variance_population")?,
            EXPECTED_VARIANCE,
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(stat("variance")?, EXPECTED_VARIANCE, EPSILON_FOR_TEST);
        assert_nearly_equals!(
            stat("variance_sampling")?,
            6.666666666670718e-5,
            EPSILON_FOR_TEST
        );

        Ok(())
    }

    #[test]
    fn extended_stat_zero_value() {
        // Nothing was collected, so every derived statistic is expected to be absent.
        let empty = IntermediateExtendedStats::default();
        let finalized = empty.finalize();

        let scalar_stats = [
            ("variance", finalized.variance),
            ("variance_population", finalized.variance_population),
            ("variance_sampling", finalized.variance_sampling),
            ("sum_of_squares", finalized.sum_of_squares),
            ("std_deviation", finalized.std_deviation),
            ("std_deviation_population", finalized.std_deviation_population),
            ("std_deviation_sampling", finalized.std_deviation_sampling),
        ];
        for (name, value) in scalar_stats.iter() {
            assert!(value.is_none(), "{} should be None", name);
        }
        assert!(finalized.std_deviation_bounds.is_none());
    }

    #[test]
    fn extended_stat_one_value() {
        // A single sample: only the sum of squares is expected, all spread statistics are absent.
        let mut single = IntermediateExtendedStats::default();
        single.collect(1.0f64);
        let finalized = single.finalize();

        let spread_stats = [
            ("variance", finalized.variance),
            ("variance_population", finalized.variance_population),
            ("variance_sampling", finalized.variance_sampling),
            ("std_deviation", finalized.std_deviation),
            ("std_deviation_population", finalized.std_deviation_population),
            ("std_deviation_sampling", finalized.std_deviation_sampling),
        ];
        for (name, value) in spread_stats.iter() {
            assert!(value.is_none(), "{} should be None", name);
        }
        assert!(finalized.std_deviation_bounds.is_none());
        assert_eq!(Some(1.0f64), finalized.sum_of_squares);
    }

    #[test]
    fn extended_stat_multiple_values() {
        const EXPECTED_VARIANCE: f64 = 9.138888888888888;
        const EXPECTED_VARIANCE_SAMPLING: f64 = 10.966666666666665;

        let mut accumulator = IntermediateExtendedStats::default();
        for &sample in &[1.0f64, 3.0, 4.0, 5.0, 8.0, 10.0] {
            accumulator.collect(sample);
        }
        let stats = accumulator.finalize();

        // Variances: the unqualified value is checked against the population variance.
        assert_eq!(EXPECTED_VARIANCE, stats.variance.unwrap());
        assert_eq!(EXPECTED_VARIANCE, stats.variance_population.unwrap());
        assert_eq!(EXPECTED_VARIANCE_SAMPLING, stats.variance_sampling.unwrap());

        // Standard deviations are the square roots of the matching variances.
        assert_eq!(EXPECTED_VARIANCE.sqrt(), stats.std_deviation.unwrap());
        assert_eq!(EXPECTED_VARIANCE.sqrt(), stats.std_deviation_population.unwrap());
        assert_eq!(EXPECTED_VARIANCE_SAMPLING.sqrt(), stats.std_deviation_sampling.unwrap());

        assert_eq!(215.0, stats.sum_of_squares.unwrap());
        assert_eq!(5.166666666666667, stats.avg.unwrap());
    }

    #[test]
    fn merge_empty_with_one_value() {
        // Merging a one-sample accumulator into an empty one.
        let mut merged = IntermediateExtendedStats::default();
        let mut single = IntermediateExtendedStats::default();
        single.collect(1.0f64);
        merged.merge_fruits(single);
        let finalized = merged.finalize();

        let spread_stats = [
            ("variance", finalized.variance),
            ("variance_population", finalized.variance_population),
            ("variance_sampling", finalized.variance_sampling),
            ("std_deviation", finalized.std_deviation),
            ("std_deviation_population", finalized.std_deviation_population),
            ("std_deviation_sampling", finalized.std_deviation_sampling),
        ];
        for (name, value) in spread_stats.iter() {
            assert!(value.is_none(), "{} should be None", name);
        }
        assert_eq!(Some(1.0f64), finalized.sum_of_squares);
    }

    #[test]
    fn merge_empty_with_multiple_values() {
        const EXPECTED_VARIANCE: f64 = 2.0;
        const EXPECTED_VARIANCE_SAMPLING: f64 = 2.5;

        let mut populated = IntermediateExtendedStats::default();
        for &sample in &[1.0f64, 2.0, 3.0, 4.0, 5.0] {
            populated.collect(sample);
        }

        // Merge the populated accumulator into a fresh, empty one.
        let mut merged = IntermediateExtendedStats::default();
        merged.merge_fruits(populated);
        let stats = merged.finalize();

        assert_eq!(EXPECTED_VARIANCE, stats.variance.unwrap());
        assert_eq!(EXPECTED_VARIANCE, stats.variance_population.unwrap());
        assert_eq!(EXPECTED_VARIANCE_SAMPLING, stats.variance_sampling.unwrap());
        assert_eq!(EXPECTED_VARIANCE.sqrt(), stats.std_deviation.unwrap());
        assert_eq!(EXPECTED_VARIANCE.sqrt(), stats.std_deviation_population.unwrap());
        assert_eq!(EXPECTED_VARIANCE_SAMPLING.sqrt(), stats.std_deviation_sampling.unwrap());
        assert_eq!(55f64, stats.sum_of_squares.unwrap());
    }

    #[test]
    fn merge_non_empty_extended_stats() {
        // Builds an accumulator that has collected `samples` in order.
        fn collected(samples: &[f64]) -> IntermediateExtendedStats {
            let mut accumulator = IntermediateExtendedStats::default();
            for &sample in samples {
                accumulator.collect(sample);
            }
            accumulator
        }

        // First scenario: {1, 2} merged with {3, 4, 5}.
        {
            let other = collected(&[3.0, 4.0, 5.0]);
            let mut merged = collected(&[1.0, 2.0]);
            merged.merge_fruits(other);
            let stats = merged.finalize();

            assert_eq!(2.0f64, stats.variance.unwrap());
            assert_eq!(2.0f64, stats.variance_population.unwrap());
            assert_eq!(2.5f64, stats.variance_sampling.unwrap());
            assert_eq!(2.0f64.sqrt(), stats.std_deviation.unwrap());
            assert_eq!(2.0f64.sqrt(), stats.std_deviation_population.unwrap());
            assert_eq!(2.5f64.sqrt(), stats.std_deviation_sampling.unwrap());
            assert_eq!(55f64, stats.sum_of_squares.unwrap());
        }

        // Second scenario: {1, 3, 4} merged with {5, 8, 10}.
        {
            const EXPECTED_VARIANCE: f64 = 9.138888888888888;
            const EXPECTED_VARIANCE_SAMPLING: f64 = 10.966666666666665;

            let mut merged = collected(&[1.0, 3.0, 4.0]);
            let other = collected(&[5.0, 8.0, 10.0]);
            merged.merge_fruits(other);
            let stats = merged.finalize();

            assert_eq!(EXPECTED_VARIANCE, stats.variance.unwrap());
            assert_eq!(EXPECTED_VARIANCE, stats.variance_population.unwrap());
            assert_eq!(EXPECTED_VARIANCE_SAMPLING, stats.variance_sampling.unwrap());
            assert_eq!(EXPECTED_VARIANCE.sqrt(), stats.std_deviation.unwrap());
            assert_eq!(EXPECTED_VARIANCE.sqrt(), stats.std_deviation_population.unwrap());
            assert_eq!(
                EXPECTED_VARIANCE_SAMPLING.sqrt(),
                stats.std_deviation_sampling.unwrap()
            );
            assert_eq!(215f64, stats.sum_of_squares.unwrap());
            assert_eq!(5.166666666666667, stats.avg.unwrap());
        }
    }

    #[test]
    fn merge_and_then_collect_non_empty_extended_stats() {
        const EXPECTED_VARIANCE: f64 = 9.138888888888888;
        const EXPECTED_VARIANCE_SAMPLING: f64 = 10.966666666666665;

        let mut merged = IntermediateExtendedStats::default();
        for &sample in &[1.0f64, 3.0] {
            merged.collect(sample);
        }

        let mut other = IntermediateExtendedStats::default();
        for &sample in &[5.0f64, 8.0, 10.0] {
            other.collect(sample);
        }

        // Collecting must keep working on an accumulator that already absorbed a merge.
        merged.merge_fruits(other);
        merged.collect(4.0f64);
        let stats = merged.finalize();

        assert_nearly_equals!(EXPECTED_VARIANCE, stats.variance.unwrap(), EPSILON_FOR_TEST);
        assert_nearly_equals!(
            EXPECTED_VARIANCE,
            stats.variance_population.unwrap(),
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            EXPECTED_VARIANCE_SAMPLING,
            stats.variance_sampling.unwrap(),
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            EXPECTED_VARIANCE.sqrt(),
            stats.std_deviation.unwrap(),
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            EXPECTED_VARIANCE.sqrt(),
            stats.std_deviation_population.unwrap(),
            EPSILON_FOR_TEST
        );
        assert_nearly_equals!(
            EXPECTED_VARIANCE_SAMPLING.sqrt(),
            stats.std_deviation_sampling.unwrap(),
            EPSILON_FOR_TEST
        );
        assert_eq!(215.0, stats.sum_of_squares.unwrap());
        assert_eq!(5.166666666666667, stats.avg.unwrap());
    }
}


================================================
FILE: src/aggregation/metric/max.rs
================================================
use std::fmt::Debug;

use serde::{Deserialize, Serialize};

use super::*;
use crate::aggregation::*;

/// A single-value metric aggregation that computes the maximum of numeric values that are
/// extracted from the aggregated documents.
/// See [super::SingleMetricResult] for return value.
///
/// # JSON Format
/// ```json
/// {
///     "max": {
///         "field": "score"
///     }
/// }
/// ```
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct MaxAggregation {
    /// The field name to compute the maximum on.
    pub field: String,
    /// The `missing` parameter defines how documents that are missing a value should be
    /// treated. By default they are ignored, but it is also possible to treat them as if they
    /// had a value. Optional: it defaults to `None` when absent from the request.
    /// Example in JSON format:
    /// { "field": "my_numbers", "missing": "10.0" }
    #[serde(default, deserialize_with = "deserialize_option_f64")]
    pub missing: Option<f64>,
}

impl MaxAggregation {
    /// Creates a new [`MaxAggregation`] instance from a field name.
    pub fn from_field_name(field_name: String) -> Self {
        Self {
            field: field_name,
            missing: None,
        }
    }
    /// Returns the field name the aggregation is computed on.
    pub fn field_name(&self) -> &str {
        &self.field
    }
}

/// Intermediate result of the maximum aggregation that can be combined with other intermediate
/// results.
#[derive(Default, Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct IntermediateMax {
    /// Underlying stats accumulator; the maximum is read from its finalized result.
    stats: IntermediateStats,
}

impl IntermediateMax {
    /// Creates a new [`IntermediateMax`] instance from a [`SegmentStatsCollector`].
    pub(crate) fn from_stats(stats: IntermediateStats) -> Self {
        Self { stats }
    }
    /// Merges the other intermediate result into self.
    pub fn merge_fruits(&mut self, other: IntermediateMax) {
        self.stats.merge_fruits(other.stats);
    }
    /// Computes the final maximum value.
    pub fn finalize(&self) -> Option<f64> {
        self.stats.finalize().max
    }
}

#[cfg(test)]
mod tests {
    use crate::aggregation::agg_req::Aggregations;
    use crate::aggregation::tests::exec_request_with_query;
    use crate::schema::{Schema, FAST};
    use crate::{Index, IndexWriter};

    /// Checks the `max` aggregation with a `missing` value on a JSON sub-field that most
    /// documents do not have.
    #[test]
    fn test_max_agg_with_missing() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let json = schema_builder.add_json_field("json", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        // => Segment with empty json
        index_writer.add_document(doc!()).unwrap();
        index_writer.commit().unwrap();
        // => Segment with json, but no field partially_empty
        index_writer
            .add_document(doc!(json => json!({"different_field": "blue"})))
            .unwrap();
        index_writer.commit().unwrap();
        // => Segment with field partially_empty
        index_writer
            .add_document(doc!(json => json!({"partially_empty": 10.0})))
            .unwrap();
        index_writer.add_document(doc!())?;
        index_writer.commit().unwrap();

        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_stats": {
                "max": {
                    "field": "json.partially_empty",
                    "missing": 100.0,
                }
            }
        }))
        .unwrap();

        let res = exec_request_with_query(agg_req, &index, None)?;

        // The only indexed value is 10.0, so a maximum of 100.0 can only come from the
        // `missing` value being used for documents without the field.
        assert_eq!(
            res["my_stats"],
            json!({
                "value": 100.0,
            })
        );

        Ok(())
    }
}


================================================
FILE: src/aggregation/metric/min.rs
================================================
use std::fmt::Debug;

use serde::{Deserialize, Serialize};

use super::*;
use crate::aggregation::*;

/// A single-value metric aggregation that computes the minimum of numeric values that are
/// extracted from the aggregated documents.
/// See [super::SingleMetricResult] for return value.
///
/// # JSON Format
/// ```json
/// {
///     "min": {
///         "field": "score"
///     }
/// }
/// ```
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct MinAggregation {
    /// The field name to compute the minimum on.
    pub field: String,
    /// The `missing` parameter defines how documents that are missing a value should be
    /// treated. By default they are ignored, but it is also possible to treat them as if they
    /// had a value. Optional: it defaults to `None` when absent from the request.
    /// Example in JSON format:
    /// { "field": "my_numbers", "missing": "10.0" }
    #[serde(default, deserialize_with = "deserialize_option_f64")]
    pub missing: Option<f64>,
}

impl MinAggregation {
    /// Creates a new [`MinAggregation`] instance from a field name.
    pub fn from_field_name(field_name: String) -> Self {
        Self {
            field: field_name,
            missing: None,
        }
    }
    /// Returns the field name the aggregation is computed on.
    pub fn field_name(&self) -> &str {
        &self.field
    }
}

/// Intermediate result of the minimum aggregation that can be combined with other intermediate
/// results.
#[derive(Default, Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct IntermediateMin {
    /// Underlying stats accumulator; the minimum is read from its finalized result.
    stats: IntermediateStats,
}

impl IntermediateMin {
    /// Creates a new [`IntermediateMin`] instance from a [`SegmentStatsCollector`].
    pub(crate) fn from_stats(stats: IntermediateStats) -> Self {
        Self { stats }
    }
    /// Merges the other intermediate result into self.
    pub fn merge_fruits(&mut self, other: IntermediateMin) {
        self.stats.merge_fruits(other.stats);
    }
    /// Computes the final minimum value.
    pub fn finalize(&self) -> Option<f64> {
        self.stats.finalize().min
    }
}


================================================
FILE: src/aggregation/metric/mod.rs
================================================
//! Module for all metric aggregations.
//!
//! The aggregations in this family compute metrics based on values extracted
//! from the documents that are being aggregated. Values are extracted from the fast field of
//! the document.
//! Some aggregations output a single numeric metric (e.g. Average) and are called
//! single-value numeric metrics aggregation, others generate multiple metrics (e.g. Stats) and are
//! called multi-value numeric metrics aggregation.
//!
//! ## Supported Metric Aggregations
//! - [Average](AverageAggregation)
//! - [Stats](StatsAggregation)
//! - [Min](MinAggregation)
//! - [Max](MaxAggregation)
//! - [Sum](SumAggregation)
//! - [Count](CountAggregation)
//! - [Percentiles](PercentilesAggregationReq)
//! - Extended Stats
//! - Cardinality
//! - Top Hits

mod average;
mod cardinality;
mod count;
mod extended_stats;
mod max;
mod min;
mod percentiles;
mod stats;
mod sum;
mod top_hits;

use std::collections::HashMap;

pub use average::*;
pub use cardinality::*;
use columnar::{Column, ColumnType};
pub use count::*;
pub use extended_stats::*;
pub use max::*;
pub use min::*;
pub use percentiles::*;
use rustc_hash::FxHashMap;
use serde::{Deserialize, Serialize};
pub use stats::*;
pub use sum::*;
pub use top_hits::*;

use crate::schema::OwnedValue;

/// Contains all information required by metric aggregations like avg, min, max, sum, stats,
/// extended_stats, count, percentiles.
#[repr(C)]
pub struct MetricAggReqData {
    /// True if the field is of number or date type.
    pub is_number_or_date_type: bool,
    /// The type of the field.
    pub field_type: ColumnType,
    /// The missing value normalized to the internal u64 representation of the field type.
    pub missing_u64: Option<u64>,
    /// The column accessor to access the fast field values.
    pub accessor: Column<u64>,
    /// Used when converting to intermediate result
    pub collecting_for: StatsType,
    /// The missing value as a float, if any (see `missing_u64` for the normalized form).
    pub missing: Option<f64>,
    /// The name of the aggregation.
    pub name: String,
}

impl MetricAggReqData {
    /// Estimate the memory consumption of this struct in bytes.
    ///
    /// Only the inline size of the struct itself is reported; heap data owned by its fields
    /// (for instance the contents of `name`) is not included.
    pub fn get_memory_consumption(&self) -> usize {
        std::mem::size_of_val(self)
    }
}

/// Single-metric aggregations use this common result structure.
///
/// The main reason to wrap the number in a `value` field is to match the elasticsearch output
/// structure.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct SingleMetricResult {
    /// The value of the single-value metric, if any.
    pub value: Option<f64>,
}

impl From<f64> for SingleMetricResult {
    fn from(value: f64) -> Self {
        Self { value: Some(value) }
    }
}

impl From<Option<f64>> for SingleMetricResult {
    fn from(value: Option<f64>) -> Self {
        Self { value }
    }
}

/// Wrapper around the percentile entries, which are either a vector or a hashmap depending on
/// whether the result is keyed or not.
///
/// The enum is `#[serde(untagged)]`, so it is serialized as the bare vector or map without a
/// variant name.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(untagged)]
pub enum PercentileValues {
    /// Vector format percentile entries
    Vec(Vec<PercentileValuesVecEntry>),
    /// HashMap format percentile entries. Key is the serialized percentile
    HashMap(FxHashMap<String, f64>),
}

#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
/// A single entry of the percentile results when requesting percentiles with `keyed: false`.
pub struct PercentileValuesVecEntry {
    /// The percentile this entry is for.
    pub key: f64,

    /// Value at the percentile
    pub value: f64,
}

/// Result structure of the percentiles metric aggregation.
///
/// The percentile entries are wrapped in a `values` field; presumably, as for the other
/// metric results, this is to match the elasticsearch output structure.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct PercentilesMetricResult {
    /// The result of the percentile metric.
    pub values: PercentileValues,
}

/// A single entry of the top_hits metric results.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct TopHitsVecEntry {
    /// The sort values of the document, depending on the sort criteria in the request.
    pub sort: Vec<Option<u64>>,

    /// Search results, for queries that include field retrieval requests
    /// (`docvalue_fields`).
    ///
    /// Serialized under the key `docvalue_fields`, and left out of the serialized output
    /// when the map is empty.
    #[serde(rename = "docvalue_fields")]
    #[serde(skip_serializing_if = "HashMap::is_empty")]
    pub doc_value_fields: HashMap<String, OwnedValue>,
}

/// The top_hits metric aggregation returns a list of top hits by sort criteria.
///
/// The main reason for wrapping it in `hits` is to match elasticsearch output structure.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct TopHitsMetricResult {
    /// The result of the top_hits metric.
    pub hits: Vec<TopHitsVecEntry>,
}

#[cfg(test)]
mod tests {
    use crate::aggregation::agg_req::Aggregations;
    use crate::aggregation::agg_result::AggregationResults;
    use crate::aggregation::AggregationCollector;
    use crate::query::AllQuery;
    use crate::schema::{NumericOptions, Schema};
    use crate::{Index, IndexWriter};

    /// Runs the metric aggregations over the prices 0..6, written in two separately
    /// committed batches, and checks the reported `value` of each single-value metric.
    #[test]
    fn test_metric_aggregations() {
        let mut schema_builder = Schema::builder();
        let price = schema_builder.add_f64_field("price", NumericOptions::default().set_fast());
        let index = Index::create_in_ram(schema_builder.build());
        let mut writer: IndexWriter = index.writer_for_tests().unwrap();

        // One commit per batch: prices 0..3 first, then 3..6.
        for &(start, end) in &[(0, 3), (3, 6)] {
            for i in start..end {
                writer.add_document(doc!(price => i as f64)).unwrap();
            }
            writer.commit().unwrap();
        }

        let aggregations_json = r#"{
            "price_avg": { "avg": { "field": "price" } },
            "price_count": { "value_count": { "field": "price" } },
            "price_max": { "max": { "field": "price" } },
            "price_min": { "min": { "field": "price" } },
            "price_stats": { "stats": { "field": "price" } },
            "price_sum": { "sum": { "field": "price" } }
        }"#;
        let request: Aggregations = serde_json::from_str(aggregations_json).unwrap();
        let collector = AggregationCollector::from_aggs(request, Default::default());

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let results: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();
        let results_json = serde_json::to_value(results).unwrap();

        let expected_values = [
            ("price_avg", 2.5),
            ("price_count", 6.0),
            ("price_max", 5.0),
            ("price_min", 0.0),
            ("price_sum", 15.0),
        ];
        for &(name, expected) in expected_values.iter() {
            assert_eq!(results_json[name]["value"], expected);
        }
    }
}


================================================
FILE: src/aggregation/metric/percentiles.rs
================================================
use std::fmt::Debug;

use serde::{Deserialize, Serialize};

use super::*;
use crate::aggregation::agg_data::AggregationsSegmentCtx;
use crate::aggregation::intermediate_agg_result::{
    IntermediateAggregationResult, IntermediateAggregationResults, IntermediateMetricResult,
};
use crate::aggregation::segment_agg_result::SegmentAggregationCollector;
use crate::aggregation::*;
use crate::TantivyError;

/// # Percentiles
///
/// The percentiles aggregation is a useful tool for understanding the distribution
/// of a data set. It calculates the values below which a given percentage of the
/// data falls. For instance, the 95th percentile indicates the value below which
/// 95% of the data points can be found.
///
/// This aggregation can be particularly interesting for analyzing website or service response
/// times. For example, if the 95th percentile website load time is significantly higher than the
/// median, this indicates that a small percentage of users are experiencing much slower load times
/// than the majority.
///
/// To use the percentiles aggregation, you'll need to provide a field to
/// aggregate on. In the case of website load times, this would typically be a
/// field containing the duration of time it takes for the site to load.
///
/// The following example demonstrates a request for the percentiles of the "load_time"
/// field:
///
/// ```JSON
/// {
///     "percentiles": {
///         "field": "load_time"
///     }
/// }
/// ```
///
/// This request will return an object containing the default percentiles (1, 5,
/// 25, 50 (median), 75, 95, and 99). You can also customize the percentiles you want to
/// calculate by providing an array of values in the "percents" parameter:
///
/// ```JSON
/// {
///     "percentiles": {
///         "field": "load_time",
///         "percents": [10, 20, 30, 40, 50, 60, 70, 80, 90]
///     }
/// }
/// ```
///
/// In this example, the aggregation will return the 10th, 20th, 30th, 40th, 50th,
/// 60th, 70th, 80th, and 90th percentiles of the "load_time" field.
///
/// Analyzing the percentiles of website load times can help you understand the
/// user experience and identify areas for optimization. For example, if the 95th
/// percentile load time is significantly higher than the median, this indicates
/// that a small percentage of users are experiencing much slower load times than
/// the majority.
///
/// # Estimating Percentiles
///
/// While percentiles provide valuable insights into the distribution of data, it's
/// important to understand that they are often estimates. This is because
/// calculating exact percentiles for large data sets can be computationally
/// expensive and time-consuming. As a result, many percentile aggregation
/// algorithms use approximation techniques to provide faster results.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct PercentilesAggregationReq {
    /// The field name to compute the percentiles on.
    pub field: String,
    /// The percentiles to compute, each expressed as a percentage.
    /// [`PercentilesAggregationReq::validate`] rejects values outside `0.0..=100.0`.
    /// Defaults to `[1.0, 5.0, 25.0, 50.0, 75.0, 95.0, 99.0]`
    pub percents: Option<Vec<f64>>,
    /// Whether to return the percentiles as a hash map keyed by the formatted percentile
    /// (e.g. `"95.0"`). When `false`, the result is a list of `key`/`value` entries instead.
    /// Defaults to `true` when the parameter is omitted from the request.
    #[serde(default = "default_as_true")]
    pub keyed: bool,
    /// The missing parameter defines how documents that are missing a value should be treated.
    /// By default they will be ignored but it is also possible to treat them as if they had a
    /// value. Examples in JSON format:
    /// { "field": "my_numbers", "missing": "10.0" }
    #[serde(
        skip_serializing_if = "Option::is_none",
        default,
        deserialize_with = "deserialize_option_f64"
    )]
    pub missing: Option<f64>,
}
/// Percentiles reported when a request does not specify `percents`.
fn default_percentiles() -> &'static [f64] {
    static DEFAULT_PERCENTILES: [f64; 7] = [1.0, 5.0, 25.0, 50.0, 75.0, 95.0, 99.0];
    &DEFAULT_PERCENTILES
}
/// Serde default helper: yields `true`. Used as the default for
/// `PercentilesAggregationReq::keyed`.
fn default_as_true() -> bool {
    true
}

impl PercentilesAggregationReq {
    /// Creates a new [`PercentilesAggregationReq`] instance from a field name.
    pub fn from_field_name(field_name: String) -> Self {
        PercentilesAggregationReq {
            field: field_name,
            percents: None,
            keyed: default_as_true(),
            missing: None,
        }
    }
    /// Returns the field name the aggregation is computed on.
    pub fn field_name(&self) -> &str {
        &self.field
    }

    /// Validates the request parameters.
    pub fn validate(&self) -> crate::Result<()> {
        if let Some(percents) = self.percents.as_ref() {
            let all_in_range = percents
                .iter()
                .cloned()
                .all(|percent| (0.0..=100.0).contains(&percent));
            if !all_in_range {
                return Err(TantivyError::AggregationError(
                    AggregationError::InvalidRequest(
                        "All percentiles have to be between 0.0 and 100.0".to_string(),
                    ),
                ));
            }
        }

        Ok(())
    }
}

/// Segment-level collector for the percentiles aggregation.
///
/// Holds one [`PercentilesCollector`] per parent bucket; `buckets` is indexed by the
/// parent bucket id.
#[derive(Clone, Debug)]
pub(crate) struct SegmentPercentilesCollector {
    /// One sketch per parent bucket id, grown on demand by `prepare_max_bucket`.
    pub(crate) buckets: Vec<PercentilesCollector>,
    /// Index handed to `AggregationsSegmentCtx::get_metric_req_data` to look up the request
    /// data (e.g. the aggregation name) of this collector.
    pub(crate) accessor_idx: usize,
    /// The type of the field.
    pub field_type: ColumnType,
    /// The missing value normalized to the internal u64 representation of the field type.
    pub missing_u64: Option<u64>,
    /// The column accessor to access the fast field values.
    pub accessor: Column<u64>,
}

#[derive(Clone, Serialize, Deserialize)]
/// The percentiles collector used during segment collection and for merging results.
///
/// Thin wrapper around a [`sketches_ddsketch::DDSketch`]; the reported percentiles are
/// whatever the sketch returns for the requested quantiles.
pub struct PercentilesCollector {
    /// The underlying sketch that receives every collected value.
    sketch: sketches_ddsketch::DDSketch,
}
impl Default for PercentilesCollector {
    fn default() -> Self {
        Self::new()
    }
}

impl Debug for PercentilesCollector {
    /// Prints only the length reported by the sketch instead of dumping the whole sketch.
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        let sketch_len = self.sketch.length();
        let mut debug_struct = f.debug_struct("IntermediatePercentiles");
        debug_struct.field("sketch_len", &sketch_len);
        debug_struct.finish()
    }
}
impl PartialEq for PercentilesCollector {
    /// Always returns `false`: two collectors never compare equal, not even a collector
    /// compared with itself.
    // NOTE(review): presumably present only so that enclosing types can derive `PartialEq`
    // without comparing sketches — confirm before relying on equality of results.
    fn eq(&self, _other: &Self) -> bool {
        false
    }
}

/// Renders a percentile as a map key that always carries a decimal part,
/// e.g. `95.0` becomes `"95.0"` and `99.9` stays `"99.9"`.
fn format_percentile(percentile: f64) -> String {
    let rendered = percentile.to_string();
    if rendered.contains('.') {
        rendered
    } else {
        // `to_string` drops the fraction of whole numbers; add it back.
        format!("{rendered}.0")
    }
}

impl PercentilesCollector {
    /// Converts the collector into the final result by querying the underlying sketch for
    /// every requested percentile (or the default set when the request has none).
    ///
    /// A percentile for which the sketch has no estimate is reported as `NaN`.
    /// With `req.keyed` the values are returned as a map keyed by the formatted percentile,
    /// otherwise as a list of key/value entries.
    ///
    /// # Panics
    ///
    /// Panics if the sketch rejects a quantile as out of range; the request is expected to
    /// have gone through [`PercentilesAggregationReq::validate`] beforehand.
    pub fn into_final_result(self, req: &PercentilesAggregationReq) -> PercentilesMetricResult {
        let requested: &[f64] = match req.percents.as_deref() {
            Some(percents) => percents,
            None => default_percentiles(),
        };
        // The sketch works with quantiles in 0..=1, the request with percentages.
        let estimate = |percentile: f64| -> f64 {
            self.sketch
                .quantile(percentile / 100.0)
                .expect(
                    "quantil out of range. This error should have been caught during \
                     validation phase",
                )
                .unwrap_or(f64::NAN)
        };

        let values = if req.keyed {
            PercentileValues::HashMap(
                requested
                    .iter()
                    .map(|&percentile| (format_percentile(percentile), estimate(percentile)))
                    .collect(),
            )
        } else {
            PercentileValues::Vec(
                requested
                    .iter()
                    .map(|&percentile| PercentileValuesVecEntry {
                        key: percentile,
                        value: estimate(percentile),
                    })
                    .collect(),
            )
        };
        PercentilesMetricResult { values }
    }

    /// Creates an empty collector backed by a sketch with the default configuration.
    fn new() -> Self {
        let config = sketches_ddsketch::Config::defaults();
        Self {
            sketch: sketches_ddsketch::DDSketch::new(config),
        }
    }

    /// Records a single value in the sketch.
    fn collect(&mut self, val: f64) {
        self.sketch.add(val);
    }

    /// Encode the underlying DDSketch to Java-compatible binary format
    /// for cross-language serialization with Java consumers.
    pub fn to_sketch_bytes(&self) -> Vec<u8> {
        self.sketch.to_java_bytes()
    }

    /// Merges the sketch of `right` into this collector.
    ///
    /// # Errors
    ///
    /// A failure reported by the sketch is surfaced as an
    /// [`AggregationError::InternalError`].
    pub(crate) fn merge_fruits(&mut self, right: PercentilesCollector) -> crate::Result<()> {
        if let Err(err) = self.sketch.merge(&right.sketch) {
            let message = format!("Error while merging percentiles {err:?}");
            return Err(TantivyError::AggregationError(
                AggregationError::InternalError(message),
            ));
        }
        Ok(())
    }
}

impl SegmentPercentilesCollector {
    /// Assembles a collector from its already resolved parts.
    ///
    /// The bucket list starts empty with room for 64 entries. Despite the name, this
    /// constructor performs no validation itself.
    pub fn from_req_and_validate(
        field_type: ColumnType,
        missing_u64: Option<u64>,
        accessor: Column<u64>,
        accessor_idx: usize,
    ) -> Self {
        let buckets = Vec::with_capacity(64);
        Self {
            accessor_idx,
            accessor,
            missing_u64,
            field_type,
            buckets,
        }
    }
}

impl SegmentAggregationCollector for SegmentPercentilesCollector {
    /// Moves the sketch collected for `parent_bucket_id` into `results`, registered under the
    /// name of this aggregation. The bucket slot is left holding a fresh, empty collector.
    #[inline]
    fn add_intermediate_aggregation_result(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
        results: &mut IntermediateAggregationResults,
        parent_bucket_id: BucketId,
    ) -> crate::Result<()> {
        let name = agg_data.get_metric_req_data(self.accessor_idx).name.clone();
        // Make sure the slot exists even if nothing was collected for this bucket.
        self.prepare_max_bucket(parent_bucket_id, agg_data)?;
        // Take the sketch out of its slot rather than cloning it.
        let slot = &mut self.buckets[parent_bucket_id as usize];
        let sketch = std::mem::take(slot);

        results.push(
            name,
            IntermediateAggregationResult::Metric(IntermediateMetricResult::Percentiles(sketch)),
        )?;

        Ok(())
    }

    /// Feeds the values of `docs` into the sketch of `parent_bucket_id`. The values are
    /// fetched with `missing_u64` passed along as the replacement for missing values.
    ///
    /// The bucket slot must already exist (see `prepare_max_bucket`); indexing panics
    /// otherwise.
    #[inline]
    fn collect(
        &mut self,
        parent_bucket_id: BucketId,
        docs: &[crate::DocId],
        agg_data: &mut AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        let bucket = &mut self.buckets[parent_bucket_id as usize];
        let field_type = self.field_type;
        agg_data.column_block_accessor.fetch_block_with_missing(
            docs,
            &self.accessor,
            self.missing_u64,
        );

        agg_data
            .column_block_accessor
            .iter_vals()
            .map(|raw| f64_from_fastfield_u64(raw, field_type))
            .for_each(|value| bucket.collect(value));

        Ok(())
    }

    /// Grows `buckets` with empty collectors until `max_bucket` is a valid index.
    fn prepare_max_bucket(
        &mut self,
        max_bucket: BucketId,
        _agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        let required_buckets = (max_bucket as usize) + 1;
        if self.buckets.len() < required_buckets {
            self.buckets
                .resize_with(required_buckets, PercentilesCollector::new);
        }
        Ok(())
    }
}

#[cfg(test)]
mod tests {

    use itertools::Itertools;
    use more_asserts::{assert_ge, assert_le};
    use rand::rngs::StdRng;
    use rand::SeedableRng;
    use serde_json::Value;

    use crate::aggregation::agg_req::Aggregations;
    use crate::aggregation::agg_result::AggregationResults;
    use crate::aggregation::tests::{
        exec_request_with_query, get_test_index_from_values, get_test_index_from_values_and_terms,
    };
    use crate::aggregation::AggregationCollector;
    use crate::query::AllQuery;
    use crate::schema::{Schema, FAST};
    use crate::{assert_nearly_equals, Index};

    /// With an index built from no values, every default percentile must serialize as
    /// JSON `null`.
    #[test]
    fn test_aggregation_percentiles_empty_index() -> crate::Result<()> {
        // test index without segments
        let values = vec![];

        let index = get_test_index_from_values(false, &values)?;

        let agg_req_1: Aggregations = serde_json::from_value(json!({
            "percentiles": {
                "percentiles": {
                    "field": "score",
                }
            },
        }))
        .unwrap();

        let collector = AggregationCollector::from_aggs(agg_req_1, Default::default());

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();

        let res: Value = serde_json::from_str(&serde_json::to_string(&agg_res)?)?;
        assert_eq!(
            res["percentiles"]["values"],
            json!({
                "1.0": Value::Null,
                "5.0": Value::Null,
                "25.0": Value::Null,
                "50.0": Value::Null,
                "75.0": Value::Null,
                "95.0": Value::Null,
                "99.0": Value::Null,
            })
        );

        Ok(())
    }

    /// With a single value of 10.0, every default percentile must fall within
    /// `9.9..10.1`.
    #[test]
    fn test_aggregation_percentile_simple() -> crate::Result<()> {
        let values = vec![10.0];

        let index = get_test_index_from_values(false, &values)?;

        let agg_req_1: Aggregations = serde_json::from_value(json!({
            "percentiles": {
                "percentiles": {
                    "field": "score",
                }
            },
        }))
        .unwrap();

        let collector = AggregationCollector::from_aggs(agg_req_1, Default::default());

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();

        let res: Value = serde_json::from_str(&serde_json::to_string(&agg_res)?)?;

        // Keys are the default percentiles as rendered in the keyed output.
        let percents = vec!["1.0", "5.0", "25.0", "50.0", "75.0", "95.0", "99.0"];
        let range = 9.9..10.1;
        for percent in percents {
            let val = res["percentiles"]["values"][percent].as_f64().unwrap();
            assert!(range.contains(&val));
        }

        Ok(())
    }

    /// Exercises the `percents` and `keyed` request parameters: first the keyed (map)
    /// output for custom percents, then the `"keyed": false` (list) output.
    #[test]
    fn test_aggregation_percentile_parameters() -> crate::Result<()> {
        let values = vec![10.0];

        let index = get_test_index_from_values(false, &values)?;

        let agg_req_str = r#"
        {
          "mypercentiles": {
            "percentiles": {
              "field": "score",
              "percents": [ 95, 99, 99.9 ]
            }
          }
        } "#;
        let agg_req_1: Aggregations = serde_json::from_str(agg_req_str).unwrap();

        let collector = AggregationCollector::from_aggs(agg_req_1, Default::default());

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();

        let res: Value = serde_json::from_str(&serde_json::to_string(&agg_res)?)?;

        // Integer percents from the request show up with a trailing ".0" in the keys.
        let percents = vec!["95.0", "99.0", "99.9"];
        let expected_range = 9.9..10.1;
        for percent in percents {
            let val = res["mypercentiles"]["values"][percent].as_f64().unwrap();
            assert!(expected_range.contains(&val));
        }
        // Keyed false
        //
        let agg_req_str = r#"
        {
          "mypercentiles": {
            "percentiles": {
              "field": "score",
              "percents": [ 95, 99, 99.9 ],
              "keyed": false
            }
          }
        } "#;
        let agg_req_1: Aggregations = serde_json::from_str(agg_req_str).unwrap();

        let collector = AggregationCollector::from_aggs(agg_req_1, Default::default());

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();

        let res: Value = serde_json::from_str(&serde_json::to_string(&agg_res)?)?;

        let vals = &res["mypercentiles"]["values"];
        assert_eq!(vals[0]["key"].as_f64().unwrap(), 95.0);
        assert_eq!(vals[1]["key"].as_f64().unwrap(), 99.0);
        assert_eq!(vals[2]["key"].as_f64().unwrap(), 99.9);
        // Only three percents were requested, so there is no fourth entry.
        assert_eq!(vals[3]["key"], serde_json::Value::Null);
        assert!(expected_range.contains(&vals[0]["value"].as_f64().unwrap()));
        assert!(expected_range.contains(&vals[1]["value"].as_f64().unwrap()));
        assert!(expected_range.contains(&vals[2]["value"].as_f64().unwrap()));

        Ok(())
    }

    /// Runs the shared percentile accuracy check with `merge_segments = true`.
    #[test]
    fn test_aggregation_percentiles_single_seg() -> crate::Result<()> {
        test_aggregation_percentiles(true)
    }

    /// Runs the shared percentile accuracy check with `merge_segments = false`.
    #[test]
    fn test_aggregation_percentiles_multi_seg() -> crate::Result<()> {
        test_aggregation_percentiles(false)
    }

    /// Shared accuracy check: indexes three batches of log-normally distributed values
    /// (generated from a fixed seed) and asserts that the reported 95th, 99th and 99.9th
    /// percentiles are within 2% of the value picked from the sorted input.
    ///
    /// `merge_segments` is forwarded to `get_test_index_from_values_and_terms`.
    fn test_aggregation_percentiles(merge_segments: bool) -> crate::Result<()> {
        use rand_distr::Distribution;
        let num_values_in_segment = [100, 30_000, 8000];
        let lg_norm = rand_distr::LogNormal::new(2.996f64, 0.979f64).unwrap();
        let mut rng = StdRng::from_seed([1u8; 32]);

        let segment_data = |i| {
            (0..num_values_in_segment[i])
                .map(|_| lg_norm.sample(&mut rng))
                .collect_vec()
        };

        let values = (0..=2).map(segment_data).collect_vec();

        // Sorted copy of all values, used as the reference for the exact quantiles.
        let mut all_values = values
            .iter()
            .flat_map(|el| el.iter().cloned())
            .collect_vec();
        all_values.sort_unstable_by(|a, b| a.total_cmp(b));

        // Reference quantile: `q` is a percentage; the index is clamped to the last element.
        fn get_exact_quantil(q: f64, all_values: &[f64]) -> f64 {
            let q = q / 100.0;
            assert!((0f64..=1f64).contains(&q));

            let index = (all_values.len() as f64 * q).ceil() as usize;
            let index = index.min(all_values.len() - 1);
            all_values[index]
        }

        let segment_and_values = values
            .into_iter()
            .map(|segment_data| {
                segment_data
                    .into_iter()
                    .map(|val| (val, val.to_string()))
                    .collect_vec()
            })
            .collect_vec();

        let index =
            get_test_index_from_values_and_terms(merge_segments, &segment_and_values).unwrap();

        let reader = index.reader()?;

        let agg_req_str = r#"
        {
          "mypercentiles": {
            "percentiles": {
              "field": "score_f64",
              "percents": [ 95, 99, 99.9 ]
            }
          }
        } "#;
        let agg_req_1: Aggregations = serde_json::from_str(agg_req_str).unwrap();

        let collector = AggregationCollector::from_aggs(agg_req_1, Default::default());

        let searcher = reader.searcher();
        let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();

        let res: Value = serde_json::from_str(&serde_json::to_string(&agg_res)?)?;
        let vals = &res["mypercentiles"]["values"];

        // Accept estimates within +/- 2% of the exact value.
        let check_quantil = |exact_quantil: f64, val: f64| {
            let lower = exact_quantil - exact_quantil * 0.02;
            let upper = exact_quantil + exact_quantil * 0.02;
            assert_le!(val, upper);
            assert_ge!(val, lower);
        };

        let val = vals["95.0"].as_f64().unwrap();
        let exact_quantil = get_exact_quantil(95.0, &all_values);
        check_quantil(exact_quantil, val);

        let val = vals["99.0"].as_f64().unwrap();
        let exact_quantil = get_exact_quantil(99.0, &all_values);
        check_quantil(exact_quantil, val);

        let val = vals["99.9"].as_f64().unwrap();
        let exact_quantil = get_exact_quantil(99.9, &all_values);
        check_quantil(exact_quantil, val);

        Ok(())
    }

    /// Percentiles with a `missing` value, nested as a sub-aggregation of a terms
    /// aggregation: two docs carry a score of 10.0 and one doc has no score, for which
    /// `missing: 5.0` is substituted.
    #[test]
    fn test_percentiles_missing_sub_agg() -> crate::Result<()> {
        // This test verifies the `collect` method (in contrast to `collect_block`), which is
        // called when the sub-aggregations are flushed.
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("texts", FAST);
        let score_field_f64 = schema_builder.add_f64_field("score", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);

        {
            let mut index_writer = index.writer_for_tests()?;
            // writing the segment
            index_writer.add_document(doc!(
                score_field_f64 => 10.0f64,
                text_field => "a"
            ))?;
            index_writer.add_document(doc!(
                score_field_f64 => 10.0f64,
                text_field => "a"
            ))?;

            // This document has no score and is covered by the `missing` parameter.
            index_writer.add_document(doc!(text_field => "a"))?;

            index_writer.commit()?;
        }

        let agg_req: Aggregations = {
            serde_json::from_value(json!({
                "range_with_stats": {
                    "terms": {
                        "field": "texts"
                    },
                    "aggs": {
                        "percentiles": {
                            "percentiles": {
                                "field": "score",
                                "missing": 5.0
                            }
                        }
                    }
                }
            }))
            .unwrap()
        };

        let res = exec_request_with_query(agg_req, &index, None)?;
        assert_eq!(res["range_with_stats"]["buckets"][0]["doc_count"], 3);

        assert_nearly_equals!(
            res["range_with_stats"]["buckets"][0]["percentiles"]["values"]["1.0"]
                .as_f64()
                .unwrap(),
            5.0028295751107414
        );
        assert_nearly_equals!(
            res["range_with_stats"]["buckets"][0]["percentiles"]["values"]["99.0"]
                .as_f64()
                .unwrap(),
            10.07469668951144
        );

        Ok(())
    }

    /// Top-level percentiles with a `missing` value: two docs carry a score of 10.0 and
    /// one doc has no score, for which `missing: 5.0` is substituted.
    #[test]
    fn test_percentiles_missing() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("texts", FAST);
        let score_field_f64 = schema_builder.add_f64_field("score", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);

        {
            let mut index_writer = index.writer_for_tests()?;
            // writing the segment
            index_writer.add_document(doc!(
                score_field_f64 => 10.0f64,
                text_field => "a"
            ))?;
            index_writer.add_document(doc!(
                score_field_f64 => 10.0f64,
                text_field => "a"
            ))?;

            // This document has no score and is covered by the `missing` parameter.
            index_writer.add_document(doc!(text_field => "a"))?;

            index_writer.commit()?;
        }

        let agg_req: Aggregations = {
            serde_json::from_value(json!({
                "percentiles": {
                    "percentiles": {
                        "field": "score",
                        "missing": 5.0
                    }
                }
            }))
            .unwrap()
        };

        let res = exec_request_with_query(agg_req, &index, None)?;

        assert_nearly_equals!(
            res["percentiles"]["values"]["1.0"].as_f64().unwrap(),
            5.0028295751107414
        );
        assert_nearly_equals!(
            res["percentiles"]["values"]["99.0"].as_f64().unwrap(),
            10.07469668951144
        );

        Ok(())
    }
}


================================================
FILE: src/aggregation/metric/stats.rs
================================================
use std::fmt::Debug;

use columnar::{Column, ColumnType};
use serde::{Deserialize, Serialize};

use super::*;
use crate::aggregation::agg_data::AggregationsSegmentCtx;
use crate::aggregation::intermediate_agg_result::{
    IntermediateAggregationResult, IntermediateAggregationResults, IntermediateMetricResult,
};
use crate::aggregation::segment_agg_result::SegmentAggregationCollector;
use crate::aggregation::*;
use crate::TantivyError;

/// A multi-value metric aggregation that computes a collection of statistics on numeric values that
/// are extracted from the aggregated documents.
/// See [`Stats`] for returned statistics.
///
/// # JSON Format
/// ```json
/// {
///     "stats": {
///         "field": "score"
///     }
/// }
/// ```
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct StatsAggregation {
    /// The field name to compute the stats on.
    pub field: String,
    /// The missing parameter defines how documents that are missing a value should be treated.
    /// By default they will be ignored but it is also possible to treat them as if they had a
    /// value. Examples in JSON format:
    /// { "field": "my_numbers", "missing": "10.0" }
    #[serde(default, deserialize_with = "deserialize_option_f64")]
    pub missing: Option<f64>,
}

impl StatsAggregation {
    /// Creates a new [`StatsAggregation`] instance from a field name.
    pub fn from_field_name(field_name: String) -> Self {
        StatsAggregation {
            field: field_name,
            missing: None,
        }
    }
    /// Returns the field name the aggregation is computed on.
    pub fn field_name(&self) -> &str {
        &self.field
    }
}

/// Stats contains a collection of statistics.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct Stats {
    /// The number of values that were collected.
    pub count: u64,
    /// The sum of the fast field values.
    pub sum: f64,
    /// The min value of the fast field values. `None` if count equals zero.
    pub min: Option<f64>,
    /// The max value of the fast field values. `None` if count equals zero.
    pub max: Option<f64>,
    /// The average of the fast field values. `None` if count equals zero.
    pub avg: Option<f64>,
}

impl Stats {
    /// Looks up a single statistic by name.
    ///
    /// Supported names are `"count"`, `"sum"`, `"min"`, `"max"` and `"avg"`. The result is
    /// `Ok(None)` when the statistic itself is `None`.
    ///
    /// # Errors
    ///
    /// Returns [`TantivyError::InvalidArgument`] for any other property name.
    pub(crate) fn get_value(&self, agg_property: &str) -> crate::Result<Option<f64>> {
        let value = match agg_property {
            "count" => Some(self.count as f64),
            "sum" => Some(self.sum),
            "min" => self.min,
            "max" => self.max,
            "avg" => self.avg,
            _ => {
                let message =
                    format!("Unknown property {agg_property} on stats metric aggregation");
                return Err(TantivyError::InvalidArgument(message));
            }
        };
        Ok(value)
    }
}

/// Intermediate result of the stats aggregation that can be combined with other intermediate
/// results.
#[derive(Clone, Copy, Debug, PartialEq, Serialize, Deserialize)]
pub struct IntermediateStats {
    /// The number of extracted values.
    pub(crate) count: u64,
    /// The sum of the extracted values.
    pub(crate) sum: f64,
    /// delta for sum needed for [Kahan algorithm for summation](https://en.wikipedia.org/wiki/Kahan_summation_algorithm)
    pub(crate) delta: f64,
    /// The min value. Holds `f64::MAX` in a default-constructed instance, i.e. before any
    /// value was collected.
    pub(crate) min: f64,
    /// The max value. Holds `f64::MIN` in a default-constructed instance, i.e. before any
    /// value was collected.
    pub(crate) max: f64,
}

impl Default for IntermediateStats {
    fn default() -> Self {
        Self {
            count: 0,
            sum: 0.0,
            delta: 0.0,
            min: f64::MAX,
            max: f64::MIN,
        }
    }
}

impl IntermediateStats {
    /// Number of values collected so far.
    pub fn count(&self) -> u64 {
        self.count
    }

    /// Sum of all values collected so far.
    pub fn sum(&self) -> f64 {
        self.sum
    }

    /// Folds `other` into `self`: counts are added, sums are combined with a compensated
    /// (Kahan) addition and min/max are widened.
    pub fn merge_fruits(&mut self, other: IntermediateStats) {
        self.count += other.count;

        // Kahan summation step; the compensation terms of both sides are applied to the
        // incoming sum before it is added.
        let compensated = other.sum - (self.delta + other.delta);
        let new_sum = self.sum + compensated;
        self.delta = (new_sum - self.sum) - compensated;
        self.sum = new_sum;

        self.min = self.min.min(other.min);
        self.max = self.max.max(other.max);
    }

    /// Produces the final [`Stats`]. `min`, `max` and `avg` are `None` when no value was
    /// collected.
    pub fn finalize(&self) -> Stats {
        let has_values = self.count != 0;
        let if_any = |value: f64| if has_values { Some(value) } else { None };
        Stats {
            count: self.count,
            sum: self.sum,
            min: if_any(self.min),
            max: if_any(self.max),
            avg: if_any(self.sum / (self.count as f64)),
        }
    }

    /// Records a single value: bumps the count, adds the value to the sum with a
    /// compensated (Kahan) addition and updates min/max.
    #[inline]
    pub(in crate::aggregation::metric) fn collect(&mut self, value: f64) {
        self.count += 1;

        // Kahan summation step for the incoming value.
        let compensated = value - self.delta;
        let new_sum = self.sum + compensated;
        self.delta = (new_sum - self.sum) - compensated;
        self.sum = new_sum;

        self.min = self.min.min(value);
        self.max = self.max.max(value);
    }
}

/// The type of stats aggregation to perform.
/// Note that not all stats types are supported in the stats aggregation.
#[derive(Clone, Copy, Debug)]
pub enum StatsType {
    /// The average of the values.
    Average,
    /// The count of the values.
    Count,
    /// The maximum value.
    Max,
    /// The minimum value.
    Min,
    /// The stats (count, sum, min, max, avg) of the values.
    Stats,
    /// The extended stats (count, sum, min, max, avg, sum_of_squares, variance, std_deviation,
    /// ...) of the values. The payload is the optional sigma parameter.
    ExtendedStats(Option<f64>), // sigma
    /// The sum of the values.
    Sum,
    /// The percentiles of the values.
    Percentiles,
}

/// Instantiates a boxed [`SegmentStatsCollector`] for the column type encoded in `TYPE_ID`,
/// copying the relevant settings from `req`. The collector starts with a single empty bucket.
fn create_collector<const TYPE_ID: u8>(
    req: &MetricAggReqData,
) -> Box<dyn SegmentAggregationCollector> {
    let collector = SegmentStatsCollector::<TYPE_ID> {
        name: req.name.clone(),
        collecting_for: req.collecting_for,
        is_number_or_date_type: req.is_number_or_date_type,
        missing_u64: req.missing_u64,
        accessor: req.accessor.clone(),
        buckets: vec![IntermediateStats::default()],
    };
    Box::new(collector)
}

/// Builds the `SegmentStatsCollector` specialization matching the column type of `req`.
///
/// The column type is turned into the const generic parameter of the collector, so each
/// type gets its own monomorphized instance.
pub(crate) fn build_segment_stats_collector(
    req: &MetricAggReqData,
) -> crate::Result<Box<dyn SegmentAggregationCollector>> {
    let collector = match req.field_type {
        ColumnType::I64 => create_collector::<{ ColumnType::I64 as u8 }>(req),
        ColumnType::U64 => create_collector::<{ ColumnType::U64 as u8 }>(req),
        ColumnType::F64 => create_collector::<{ ColumnType::F64 as u8 }>(req),
        ColumnType::Bool => create_collector::<{ ColumnType::Bool as u8 }>(req),
        ColumnType::DateTime => create_collector::<{ ColumnType::DateTime as u8 }>(req),
        ColumnType::Bytes => create_collector::<{ ColumnType::Bytes as u8 }>(req),
        ColumnType::Str => create_collector::<{ ColumnType::Str as u8 }>(req),
        ColumnType::IpAddr => create_collector::<{ ColumnType::IpAddr as u8 }>(req),
    };
    Ok(collector)
}

/// Segment-level collector shared by the stats-based metric aggregations.
///
/// `COLUMN_TYPE_ID` is a `ColumnType` cast to `u8` (see `build_segment_stats_collector`);
/// it is forwarded to `convert_to_f64` when values are collected.
// NOTE(review): `#[repr(C)]` pins the field order; presumably for memory-layout reasons —
// confirm before reordering fields.
#[repr(C)]
#[derive(Clone, Debug)]
pub(crate) struct SegmentStatsCollector<const COLUMN_TYPE_ID: u8> {
    /// Replacement passed to `fetch_block_with_missing` for missing values, if any.
    pub(crate) missing_u64: Option<u64>,
    /// The column accessor to access the fast field values.
    pub(crate) accessor: Column<u64>,
    /// When `false`, values are not converted; each value is recorded as `0.0` so that only
    /// the count is meaningful.
    pub(crate) is_number_or_date_type: bool,
    /// One set of statistics per parent bucket id.
    pub(crate) buckets: Vec<IntermediateStats>,
    /// Name under which the result is pushed into the intermediate results.
    pub(crate) name: String,
    /// Which metric the collected statistics are reported as.
    pub(crate) collecting_for: StatsType,
}

impl<const COLUMN_TYPE_ID: u8> SegmentAggregationCollector
    for SegmentStatsCollector<COLUMN_TYPE_ID>
{
    #[inline]
    fn add_intermediate_aggregation_result(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
        results: &mut IntermediateAggregationResults,
        parent_bucket_id: BucketId,
    ) -> crate::Result<()> {
        let name = self.name.clone();

        self.prepare_max_bucket(parent_bucket_id, agg_data)?;
        let stats = self.buckets[parent_bucket_id as usize];
        let intermediate_metric_result = match self.collecting_for {
            StatsType::Average => {
                IntermediateMetricResult::Average(IntermediateAverage::from_stats(stats))
            }
            StatsType::Count => {
                IntermediateMetricResult::Count(IntermediateCount::from_stats(stats))
            }
            StatsType::Max => IntermediateMetricResult::Max(IntermediateMax::from_stats(stats)),
            StatsType::Min => IntermediateMetricResult::Min(IntermediateMin::from_stats(stats)),
            StatsType::Stats => IntermediateMetricResult::Stats(stats),
            StatsType::Sum => IntermediateMetricResult::Sum(IntermediateSum::from_stats(stats)),
            _ => {
                return Err(TantivyError::InvalidArgument(format!(
                    "Unsupported stats type for stats aggregation: {:?}",
                    self.collecting_for
                )))
            }
        };

        results.push(
            name,
            IntermediateAggregationResult::Metric(intermediate_metric_result),
        )?;

        Ok(())
    }

    #[inline]
    fn collect(
        &mut self,
        parent_bucket_id: BucketId,
        docs: &[crate::DocId],
        agg_data: &mut AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        // TODO: remove once we fetch all values for all bucket ids in one go
        if docs.len() == 1 && self.missing_u64.is_none() {
            collect_stats::<COLUMN_TYPE_ID>(
                &mut self.buckets[parent_bucket_id as usize],
                self.accessor.values_for_doc(docs[0]),
                self.is_number_or_date_type,
            )?;

            return Ok(());
        }
        agg_data.column_block_accessor.fetch_block_with_missing(
            docs,
            &self.accessor,
            self.missing_u64,
        );
        collect_stats::<COLUMN_TYPE_ID>(
            &mut self.buckets[parent_bucket_id as usize],
            agg_data.column_block_accessor.iter_vals(),
            self.is_number_or_date_type,
        )?;

        Ok(())
    }

    fn prepare_max_bucket(
        &mut self,
        max_bucket: BucketId,
        _agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        let required_buckets = (max_bucket as usize) + 1;
        if self.buckets.len() < required_buckets {
            self.buckets
                .resize_with(required_buckets, IntermediateStats::default);
        }
        Ok(())
    }
}

/// Feeds every value of `vals` into `stats`.
///
/// With `is_number_or_date_type` the raw `u64` values are converted through
/// `convert_to_f64::<COLUMN_TYPE_ID>` first. Otherwise each value is recorded as `0.0`,
/// which only registers that a value was present.
#[inline]
fn collect_stats<const COLUMN_TYPE_ID: u8>(
    stats: &mut IntermediateStats,
    vals: impl Iterator<Item = u64>,
    is_number_or_date_type: bool,
) -> crate::Result<()> {
    if !is_number_or_date_type {
        // we ignore the value and simply record that we got something
        vals.for_each(|_raw| stats.collect(0.0));
        return Ok(());
    }

    vals.map(|raw| convert_to_f64::<COLUMN_TYPE_ID>(raw))
        .for_each(|value| stats.collect(value));

    Ok(())
}

// Tests for the `stats` metric aggregation (and `value_count`, which is requested
// alongside it), run both at the top level and nested as a sub-aggregation.
#[cfg(test)]
mod tests {
    use serde_json::Value;

    use crate::aggregation::agg_req::{Aggregation, Aggregations};
    use crate::aggregation::agg_result::AggregationResults;
    use crate::aggregation::tests::{
        exec_request_with_query, get_test_index_2_segments, get_test_index_from_values,
    };
    use crate::aggregation::AggregationCollector;
    use crate::query::{AllQuery, TermQuery};
    use crate::schema::{IndexRecordOption, Schema, FAST};
    use crate::{Index, IndexWriter, Term};

    // An index built from no values must yield a count of 0, a sum of 0.0 and `null`
    // for avg/min/max.
    #[test]
    fn test_aggregation_stats_empty_index() -> crate::Result<()> {
        // test index without segments
        let values = vec![];

        let index = get_test_index_from_values(false, &values)?;

        let agg_req_1: Aggregations = serde_json::from_value(json!({
            "stats": {
                "stats": {
                    "field": "score",
                },
            }
        }))
        .unwrap();

        let collector = AggregationCollector::from_aggs(agg_req_1, Default::default());

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();

        // Round-trip through a JSON string to compare against plain `serde_json` values.
        let res: Value = serde_json::from_str(&serde_json::to_string(&agg_res)?)?;
        assert_eq!(
            res["stats"],
            json!({
                "avg": Value::Null,
                "count": 0,
                "max": Value::Null,
                "min": Value::Null,
                "sum": 0.0
            })
        );

        Ok(())
    }

    // A single value: avg, min, max and sum all equal that value and count is 1.
    #[test]
    fn test_aggregation_stats_simple() -> crate::Result<()> {
        let values = vec![10.0];

        let index = get_test_index_from_values(false, &values)?;

        let agg_req_1: Aggregations = serde_json::from_value(json!({
            "stats": {
                "stats": {
                    "field": "score",
                },
            }
        }))
        .unwrap();

        let collector = AggregationCollector::from_aggs(agg_req_1, Default::default());

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();

        let res: Value = serde_json::from_str(&serde_json::to_string(&agg_res)?)?;
        assert_eq!(
            res["stats"],
            json!({
                "avg": 10.0,
                "count": 1,
                "max": 10.0,
                "min": 10.0,
                "sum": 10.0
            })
        );

        Ok(())
    }

    // Stats over several field names on the two-segment test index, restricted by a term
    // query, plus stats nested inside a range aggregation.
    #[test]
    fn test_aggregation_stats() -> crate::Result<()> {
        let index = get_test_index_2_segments(false)?;

        let reader = index.reader()?;
        let text_field = reader.searcher().schema().get_field("text").unwrap();

        let term_query = TermQuery::new(
            Term::from_field_text(text_field, "cool"),
            IndexRecordOption::Basic,
        );

        // Range aggregation carrying a `stats` sub-aggregation on the same field.
        let range_agg: Aggregation = {
            serde_json::from_value(json!({
                "range": {
                    "field": "score",
                    "ranges": [ { "from": 3.0f64, "to": 7.0f64 }, { "from": 7.0f64, "to": 19.0f64 }, { "from": 19.0f64, "to": 20.0f64 }  ]
                },
                "aggs": {
                    "stats": {
                        "stats": {
                            "field": "score"
                        }
                    }
                }
            }))
            .unwrap()
        };

        let agg_req_1: Aggregations = serde_json::from_value(json!({
            "stats_i64": {
                "stats": {
                    "field": "score_i64",
                },
            },
            "stats_f64": {
                "stats": {
                    "field": "score_f64",
                },
            },
            "stats": {
                "stats": {
                    "field": "score",
                },
            },
            "count_str": {
                "value_count": {
                    "field": "text",
                },
            },
            "range": range_agg
        }))
        .unwrap();

        let collector = AggregationCollector::from_aggs(agg_req_1, Default::default());

        let searcher = reader.searcher();
        let agg_res: AggregationResults = searcher.search(&term_query, &collector).unwrap();

        let res: Value = serde_json::from_str(&serde_json::to_string(&agg_res)?)?;
        assert_eq!(
            res["stats"],
            json!({
                "avg": 12.142857142857142,
                "count": 7,
                "max": 44.0,
                "min": 1.0,
                "sum": 85.0
            })
        );

        assert_eq!(
            res["stats_i64"],
            json!({
                "avg": 12.142857142857142,
                "count": 7,
                "max": 44.0,
                "min": 1.0,
                "sum": 85.0
            })
        );

        assert_eq!(
            res["stats_f64"],
            json!({
                "avg":  12.214285714285714,
                "count": 7,
                "max": 44.5,
                "min": 1.0,
                "sum": 85.5
            })
        );

        // NOTE(review): only three ranges are requested, yet bucket index 3 is read below;
        // presumably the range aggregation adds implicit open-ended buckets - confirm.
        assert_eq!(
            res["range"]["buckets"][2]["stats"],
            json!({
                "avg": 10.666666666666666,
                "count": 3,
                "max": 14.0,
                "min": 7.0,
                "sum": 32.0
            })
        );

        // A bucket without any document reports the same "empty" stats as an empty index.
        assert_eq!(
            res["range"]["buckets"][3]["stats"],
            json!({
                "avg": serde_json::Value::Null,
                "count": 0,
                "max": serde_json::Value::Null,
                "min": serde_json::Value::Null,
                "sum": 0.0,
            })
        );

        // `value_count` on the text field counts values without interpreting them.
        assert_eq!(
            res["count_str"],
            json!({
                "value": 7.0,
            })
        );

        Ok(())
    }

    // Stats on a JSON sub-field that exists in only one of four documents, spread over
    // three segments: documents without the field are ignored.
    #[test]
    fn test_stats_json() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let json = schema_builder.add_json_field("json", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        // => Segment with empty json
        index_writer.add_document(doc!()).unwrap();
        index_writer.commit().unwrap();
        // => Segment with json, but no field partially_empty
        index_writer
            .add_document(doc!(json => json!({"different_field": "blue"})))
            .unwrap();
        index_writer.commit().unwrap();
        // => Segment with field partially_empty
        index_writer
            .add_document(doc!(json => json!({"partially_empty": 10.0})))
            .unwrap();
        index_writer.add_document(doc!())?;
        index_writer.commit().unwrap();

        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_stats": {
                "stats": {
                    "field": "json.partially_empty"
                },
            }
        }))
        .unwrap();

        let res = exec_request_with_query(agg_req, &index, None)?;

        assert_eq!(
            res["my_stats"],
            json!({
                "avg":  10.0,
                "count": 1,
                "max": 10.0,
                "min": 10.0,
                "sum": 10.0
            })
        );

        Ok(())
    }

    // Same index as `test_stats_json`, but with a `missing` value: all four documents are
    // counted, the three without the field contributing 0.0. The `missing` parameter is
    // accepted both as a number and as a string.
    #[test]
    fn test_stats_json_missing() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let json = schema_builder.add_json_field("json", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        // => Segment with empty json
        index_writer.add_document(doc!()).unwrap();
        index_writer.commit().unwrap();
        // => Segment with json, but no field partially_empty
        index_writer
            .add_document(doc!(json => json!({"different_field": "blue"})))
            .unwrap();
        index_writer.commit().unwrap();
        // => Segment with field partially_empty
        index_writer
            .add_document(doc!(json => json!({"partially_empty": 10.0})))
            .unwrap();
        index_writer.add_document(doc!())?;
        index_writer.commit().unwrap();

        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_stats": {
                "stats": {
                    "field": "json.partially_empty",
                    "missing": 0.0
                },
            }
        }))
        .unwrap();

        let res = exec_request_with_query(agg_req, &index, None)?;

        assert_eq!(
            res["my_stats"],
            json!({
                "avg":  2.5,
                "count": 4,
                "max": 10.0,
                "min": 0.0,
                "sum": 10.0
            })
        );

        // From string
        let agg_req: Aggregations = serde_json::from_value(json!({
            "my_stats": {
                "stats": {
                    "field": "json.partially_empty",
                    "missing": "0.0"
                },
            }
        }))
        .unwrap();

        let res = exec_request_with_query(agg_req, &index, None)?;

        assert_eq!(
            res["my_stats"],
            json!({
                "avg":  2.5,
                "count": 4,
                "max": 10.0,
                "min": 0.0,
                "sum": 10.0
            })
        );

        Ok(())
    }

    #[test]
    fn test_stats_json_missing_sub_agg() -> crate::Result<()> {
        // This test verifies the `collect` method (in contrast to `collect_block`), which is
        // called when the sub-aggregations are flushed.
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("texts", FAST);
        let score_field_f64 = schema_builder.add_f64_field("score", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);

        {
            let mut index_writer = index.writer_for_tests()?;
            // writing the segment
            index_writer.add_document(doc!(
                score_field_f64 => 10.0f64,
                text_field => "a"
            ))?;

            // Second document shares the term "a" but has no score, so `missing` applies.
            index_writer.add_document(doc!(text_field => "a"))?;

            index_writer.commit()?;
        }

        // Despite its name, `range_with_stats` is a `terms` aggregation with a `stats`
        // sub-aggregation.
        let agg_req: Aggregations = {
            serde_json::from_value(json!({
                "range_with_stats": {
                    "terms": {
                        "field": "texts"
                    },
                    "aggs": {
                        "my_stats": {
                            "stats": {
                                "field": "score",
                                "missing": 0.0
                            }
                        }
                    }
                }
            }))
            .unwrap()
        };

        let res = exec_request_with_query(agg_req, &index, None)?;

        assert_eq!(
            res["range_with_stats"]["buckets"][0]["my_stats"]["count"],
            2
        );
        assert_eq!(
            res["range_with_stats"]["buckets"][0]["my_stats"]["min"],
            0.0
        );
        assert_eq!(
            res["range_with_stats"]["buckets"][0]["my_stats"]["avg"],
            5.0
        );

        Ok(())
    }
}


================================================
FILE: src/aggregation/metric/sum.rs
================================================
use std::fmt::Debug;

use serde::{Deserialize, Serialize};

use super::*;
use crate::aggregation::*;

/// A single-value metric aggregation that sums up numeric values that are
/// extracted from the aggregated documents.
/// See [super::SingleMetricResult] for return value.
///
/// # JSON Format
/// ```json
/// {
///     "sum": {
///         "field": "score"
///     }
/// }
/// ```
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct SumAggregation {
    /// The field name to compute the sum on.
    pub field: String,
    /// The missing parameter defines how documents that are missing a value should be treated.
    /// By default they will be ignored but it is also possible to treat them as if they had a
    /// value. Examples in JSON format:
    /// { "field": "my_numbers", "missing": "10.0" }
    #[serde(default, deserialize_with = "deserialize_option_f64")]
    pub missing: Option<f64>,
}

impl SumAggregation {
    /// Creates a new [`SumAggregation`] instance from a field name.
    pub fn from_field_name(field_name: String) -> Self {
        Self {
            field: field_name,
            missing: None,
        }
    }
    /// Returns the field name the aggregation is computed on.
    pub fn field_name(&self) -> &str {
        &self.field
    }
}

/// Intermediate result of the sum aggregation that can be combined with other intermediate
/// results.
#[derive(Default, Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct IntermediateSum {
    /// The underlying stats accumulator; only its `sum` is exposed by the final result.
    stats: IntermediateStats,
}

impl IntermediateSum {
    /// Creates a new [`IntermediateSum`] instance from a [`SegmentStatsCollector`].
    pub(crate) fn from_stats(stats: IntermediateStats) -> Self {
        Self { stats }
    }
    /// Merges the other intermediate result into self.
    pub fn merge_fruits(&mut self, other: IntermediateSum) {
        self.stats.merge_fruits(other.stats);
    }
    /// Computes the final minimum value.
    pub fn finalize(&self) -> Option<f64> {
        Some(self.stats.finalize().sum)
    }
}


================================================
FILE: src/aggregation/metric/top_hits.rs
================================================
use std::collections::HashMap;
use std::net::Ipv6Addr;

use columnar::{Column, ColumnType, ColumnarReader, DynamicColumn};
use common::json_path_writer::JSON_PATH_SEGMENT_SEP_STR;
use common::DateTime;
use regex::Regex;
use serde::ser::SerializeMap;
use serde::{Deserialize, Deserializer, Serialize, Serializer};

use super::{TopHitsMetricResult, TopHitsVecEntry};
use crate::aggregation::agg_data::AggregationsSegmentCtx;
use crate::aggregation::bucket::Order;
use crate::aggregation::intermediate_agg_result::{
    IntermediateAggregationResult, IntermediateMetricResult,
};
use crate::aggregation::segment_agg_result::SegmentAggregationCollector;
use crate::aggregation::{AggregationError, BucketId};
use crate::collector::sort_key::ReverseComparator;
use crate::collector::TopNComputer;
use crate::schema::OwnedValue;
use crate::{DocAddress, DocId, SegmentOrdinal};

/// Contains all information required by the TopHitsSegmentCollector to perform the
/// top_hits aggregation on a segment.
#[derive(Default)]
pub struct TopHitsAggReqData {
    /// The accessors to access the fast field values, each paired with the type of its column.
    pub accessors: Vec<(Column<u64>, ColumnType)>,
    /// The accessors to access the fast field values for retrieving document fields,
    /// keyed by field name. A field may be backed by several columns.
    pub value_accessors: HashMap<String, Vec<DynamicColumn>>,
    /// The ordinal of the segment this request data is for.
    pub segment_ordinal: SegmentOrdinal,
    /// The name of the aggregation.
    pub name: String,
    /// The top_hits aggregation request.
    pub req: TopHitsAggregationReq,
}

impl TopHitsAggReqData {
    /// Estimate the memory consumption of this struct in bytes.
    ///
    /// Only the size of the struct itself is reported; heap data owned by its fields
    /// is not included.
    pub fn get_memory_consumption(&self) -> usize {
        std::mem::size_of_val(self)
    }
}

/// # Top Hits
///
/// The top hits aggregation is a useful tool to answer questions like:
/// - "What are the most recent posts by each author?"
/// - "What are the most popular items in each category?"
///
/// It does so by keeping track of the most relevant document being aggregated,
/// in terms of a sort criterion that can consist of multiple fields and their
/// sort-orders (ascending or descending).
///
/// `top_hits` should not be used as a top-level aggregation. It is intended to be
/// used as a sub-aggregation, inside a `terms` aggregation or a `filters` aggregation,
/// for example.
///
/// Note that this aggregator does not return the actual document addresses, but
/// rather a list of the values of the fields that were requested to be retrieved.
/// These values can be specified in the `docvalue_fields` parameter, which can include
/// a list of fast fields to be retrieved. At the moment, only fast fields are supported
/// but it is possible that we support the `fields` parameter to retrieve any stored
/// field in the future.
///
/// The following example demonstrates a request for the top_hits aggregation:
/// ```JSON
/// {
///     "aggs": {
///         "top_authors": {
///             "terms": {
///                 "field": "author",
///                 "size": 5
///             },
///             "aggs": {
///                 "top_posts": {
///                     "top_hits": {
///                         "size": 2,
///                         "from": 0,
///                         "sort": [
///                             { "date": "desc" }
///                         ],
///                         "docvalue_fields": ["date", "title", "iden"]
///                     }
///                 }
///             }
///         }
///     }
/// }
/// ```
///
/// This request will return an object containing the top two documents, sorted
/// by the `date` field in descending order. You can also sort by multiple fields, which
/// helps to resolve ties. The aggregation object for each bucket will look like:
/// ```JSON
/// {
///     "hits": [
///         {
///           "score": [<time_u64>],
///           "docvalue_fields": {
///             "date": "<date_RFC3339>",
///             "title": "<title>",
///             "iden": "<iden>"
///           }
///         },
///         {
///           "score": [<time_u64>],
///           "docvalue_fields": {
///             "date": "<date_RFC3339>",
///             "title": "<title>",
///             "iden": "<iden>"
///           }
///         }
///     ]
/// }
/// ```
#[derive(Debug, Clone, PartialEq, Serialize, Deserialize, Default)]
pub struct TopHitsAggregationReq {
    // Sort criteria; each entry is a single `{ "<field>": "<order>" }` pair.
    sort: Vec<KeyOrder>,
    // Number of hits to return.
    size: usize,
    // Number of leading hits to skip before returning `size` hits.
    from: Option<usize>,

    // Fast fields whose values are returned with each hit. Entries may contain `*` globs,
    // which `validate_and_resolve_field_names` expands to concrete column names.
    #[serde(rename = "docvalue_fields")]
    #[serde(default)]
    doc_value_fields: Vec<String>,

    // Not supported: these are only deserialized so that
    // `validate_and_resolve_field_names` can reject them with an explicit error.
    _source: Option<serde_json::Value>,
    fields: Option<serde_json::Value>,
    script_fields: Option<serde_json::Value>,
    highlight: Option<serde_json::Value>,
    explain: Option<serde_json::Value>,
    version: Option<serde_json::Value>,
}

/// One sort criterion of a `top_hits` request: a field name and the order to sort it in.
///
/// It is (de)serialized as a map with exactly one entry, `{ "<field>": "<order>" }`.
#[derive(Debug, Clone, PartialEq, Default)]
struct KeyOrder {
    /// Name of the field to sort on.
    field: String,
    /// Order to sort the field in.
    order: Order,
}

impl Serialize for KeyOrder {
    /// Serializes the criterion as a one-entry map: `{ "<field>": "<order>" }`.
    fn serialize<S: Serializer>(&self, serializer: S) -> Result<S::Ok, S::Error> {
        let mut single_entry = serializer.serialize_map(Some(1))?;
        single_entry.serialize_entry(&self.field, &self.order)?;
        single_entry.end()
    }
}

impl<'de> Deserialize<'de> for KeyOrder {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: Deserializer<'de> {
        let mut key_order = <HashMap<String, Order>>::deserialize(deserializer)?.into_iter();
        let (field, order) = key_order.next().ok_or(serde::de::Error::custom(
            "Expected exactly one key-value pair in sort parameter of top_hits, found none",
        ))?;
        if key_order.next().is_some() {
            return Err(serde::de::Error::custom(format!(
                "Expected exactly one key-value pair in sort parameter of top_hits, found \
                 {key_order:?}"
            )));
        }
        Ok(Self { field, order })
    }
}

/// Transforms a glob (`pattern*`, for example) into an anchored [`Regex`] (`^pattern.*$`).
///
/// Every regex metacharacter of `glob` is escaped, so `*` is the only character with a
/// special meaning: it matches any sequence of characters, including the empty one.
///
/// # Errors
/// Returns a `SchemaError` if the resulting pattern cannot be compiled.
fn globbed_string_to_regex(glob: &str) -> Result<Regex, crate::TantivyError> {
    // After escaping, every `*` of the glob reads `\*`; turn exactly those into `.*`.
    // No further replacement may follow: it would hit the `*` just inserted and turn
    // `.*` into `..*`, which no longer matches the empty sequence.
    let pattern = format!("^{}$", regex::escape(glob).replace(r"\*", ".*"));
    Regex::new(&pattern).map_err(|e| {
        crate::TantivyError::SchemaError(format!("Invalid regex '{glob}' in docvalue_fields: {e}"))
    })
}

/// Always returns an `InvalidRequest` error stating that `parameter` is not supported and
/// that `docvalue_fields` is the supported way to retrieve field values.
fn use_doc_value_fields_err(parameter: &str) -> crate::Result<()> {
    let message = format!(
        "The `{parameter}` parameter is not supported, only `docvalue_fields` is supported in \
         `top_hits` aggregation"
    );
    let invalid_request = AggregationError::InvalidRequest(message);
    Err(crate::TantivyError::AggregationError(invalid_request))
}
/// Always returns an `InvalidRequest` error stating that `parameter` is not supported by
/// the `top_hits` aggregation.
fn unsupported_err(parameter: &str) -> crate::Result<()> {
    let message =
        format!("The `{parameter}` parameter is not supported in the `top_hits` aggregation");
    let invalid_request = AggregationError::InvalidRequest(message);
    Err(crate::TantivyError::AggregationError(invalid_request))
}

impl TopHitsAggregationReq {
    /// Validate and resolve field retrieval parameters
    pub fn validate_and_resolve_field_names(
        &mut self,
        reader: &ColumnarReader,
    ) -> crate::Result<()> {
        if self._source.is_some() {
            use_doc_value_fields_err("_source")?;
        }
        if self.fields.is_some() {
            use_doc_value_fields_err("fields")?;
        }
        if self.script_fields.is_some() {
            use_doc_value_fields_err("script_fields")?;
        }
        if self.explain.is_some() {
            unsupported_err("explain")?;
        }
        if self.highlight.is_some() {
            unsupported_err("highlight")?;
        }
        if self.version.is_some() {
            unsupported_err("version")?;
        }

        self.doc_value_fields = self
            .doc_value_fields
            .iter()
            .map(|field| {
                if !field.contains('*')
                    && reader
                        .iter_columns()?
                        .any(|(name, _)| name.as_str() == field)
                {
                    return Ok(vec![field.to_owned()]);
                }

                let pattern = globbed_string_to_regex(field)?;
                let fields = reader
                    .iter_columns()?
                    .map(|(name, _)| {
                        // normalize path from internal fast field repr
                        name.replace(JSON_PATH_SEGMENT_SEP_STR, ".")
                    })
                    .filter(|name| pattern.is_match(name))
                    .collect::<Vec<_>>();
                assert!(
                    !fields.is_empty(),
                    "No fields matched the glob '{field}' in docvalue_fields"
                );
                Ok(fields)
            })
            .collect::<crate::Result<Vec<_>>>()?
            .into_iter()
            .flatten()
            .collect();

        Ok(())
    }

    /// Return fields accessed by the aggregator, in order.
    pub fn field_names(&self) -> Vec<&str> {
        self.sort
            .iter()
            .map(|KeyOrder { field, .. }| field.as_str())
            .chain(self.doc_value_fields.iter().map(|s| s.as_str()))
            .collect()
    }

    /// Return fields accessed by the aggregator's value retrieval.
    pub fn value_field_names(&self) -> Vec<&str> {
        self.doc_value_fields.iter().map(|s| s.as_str()).collect()
    }

    fn get_document_field_data(
        &self,
        accessors: &HashMap<String, Vec<DynamicColumn>>,
        doc_id: DocId,
    ) -> HashMap<String, FastFieldValue> {
        let doc_value_fields = self
            .doc_value_fields
            .iter()
            .map(|field| {
                let accessors = accessors
                    .get(field)
                    .unwrap_or_else(|| panic!("field '{field}' not found in accessors"));

                let values: Vec<FastFieldValue> = accessors
                    .iter()
                    .flat_map(|accessor| match accessor {
                        DynamicColumn::U64(accessor) => accessor
                            .values_for_doc(doc_id)
                            .map(FastFieldValue::U64)
                            .collect::<Vec<_>>(),
                        DynamicColumn::I64(accessor) => accessor
                            .values_for_doc(doc_id)
                            .map(FastFieldValue::I64)
                            .collect::<Vec<_>>(),
                        DynamicColumn::F64(accessor) => accessor
                            .values_for_doc(doc_id)
                            .map(FastFieldValue::F64)
                            .collect::<Vec<_>>(),
                        DynamicColumn::Bytes(accessor) => accessor
                            .term_ords(doc_id)
                            .map(|term_ord| {
                                let mut buffer = vec![];
                                assert!(
                                    accessor
                                        .ord_to_bytes(term_ord, &mut buffer)
                                        .expect("could not read term dictionary"),
                                    "term corresponding to term_ord does not exist"
                                );
                                FastFieldValue::Bytes(buffer)
                            })
                            .collect::<Vec<_>>(),
                        DynamicColumn::Str(accessor) => accessor
                            .term_ords(doc_id)
                            .map(|term_ord| {
                                let mut buffer = vec![];
                                assert!(
                                    accessor
                                        .ord_to_bytes(term_ord, &mut buffer)
                                        .expect("could not read term dictionary"),
                                    "term corresponding to term_ord does not exist"
                                );
                                FastFieldValue::Str(String::from_utf8(buffer).unwrap())
                            })
                            .collect::<Vec<_>>(),
                        DynamicColumn::Bool(accessor) => accessor
                            .values_for_doc(doc_id)
                            .map(FastFieldValue::Bool)
                            .collect::<Vec<_>>(),
                        DynamicColumn::IpAddr(accessor) => accessor
                            .values_for_doc(doc_id)
                            .map(FastFieldValue::IpAddr)
                            .collect::<Vec<_>>(),
                        DynamicColumn::DateTime(accessor) => accessor
                            .values_for_doc(doc_id)
                            .map(FastFieldValue::Date)
                            .collect::<Vec<_>>(),
                    })
                    .collect();

                (field.to_owned(), FastFieldValue::Array(values))
            })
            .collect();
        doc_value_fields
    }
}

/// A retrieved value from a fast field.
///
/// Every variant converts into the [`OwnedValue`] variant of the same name.
#[derive(Debug, Clone, PartialEq, Serialize, Deserialize)]
pub enum FastFieldValue {
    /// The str type is used for any text information.
    Str(String),
    /// Unsigned 64-bits Integer `u64`
    U64(u64),
    /// Signed 64-bits Integer `i64`
    I64(i64),
    /// 64-bits Float `f64`
    F64(f64),
    /// Bool value
    Bool(bool),
    /// Date/time with nanoseconds precision
    Date(DateTime),
    /// Arbitrarily sized byte array
    Bytes(Vec<u8>),
    /// IpV6 Address. Internally there is no IpV4, it needs to be converted to `Ipv6Addr`.
    IpAddr(Ipv6Addr),
    /// A list of values, which may themselves be of any variant.
    Array(Vec<Self>),
}

impl From<FastFieldValue> for OwnedValue {
    /// Converts a fast field value into the [`OwnedValue`] variant of the same name.
    /// Arrays are converted element by element.
    fn from(value: FastFieldValue) -> Self {
        match value {
            FastFieldValue::Array(items) => {
                let converted = items.into_iter().map(Into::<OwnedValue>::into).collect();
                OwnedValue::Array(converted)
            }
            FastFieldValue::Str(text) => OwnedValue::Str(text),
            FastFieldValue::Bytes(bytes) => OwnedValue::Bytes(bytes),
            FastFieldValue::U64(unsigned) => OwnedValue::U64(unsigned),
            FastFieldValue::I64(signed) => OwnedValue::I64(signed),
            FastFieldValue::F64(float) => OwnedValue::F64(float),
            FastFieldValue::Bool(flag) => OwnedValue::Bool(flag),
            FastFieldValue::Date(date) => OwnedValue::Date(date),
            FastFieldValue::IpAddr(addr) => OwnedValue::IpAddr(addr),
        }
    }
}

/// Holds a fast field value in its u64 representation, and the order in which it should be sorted.
///
/// When compared, an absent value (`None`) ranks below any present value, whatever the
/// `order`; `order` only affects the comparison of two present values.
#[derive(Clone, Serialize, Deserialize, Debug)]
struct DocValueAndOrder {
    /// A fast field value in its u64 representation.
    value: Option<u64>,
    /// Sort order for the value
    order: Order,
}

impl Ord for DocValueAndOrder {
    /// Compares two values according to the sort order of `self`.
    ///
    /// Two present values are compared numerically, reversed for `Order::Desc`. An absent
    /// value always ranks below a present one, and two absent values are equal; the
    /// order has no influence on these cases.
    fn cmp(&self, other: &Self) -> std::cmp::Ordering {
        use std::cmp::Ordering;

        match (self.value, other.value) {
            (None, None) => Ordering::Equal,
            (None, Some(_)) => Ordering::Less,
            (Some(_), None) => Ordering::Greater,
            (Some(lhs), Some(rhs)) => {
                let natural = lhs.cmp(&rhs);
                match self.order {
                    Order::Asc => natural,
                    Order::Desc => natural.reverse(),
                }
            }
        }
    }
}

impl PartialOrd for DocValueAndOrder {
    /// Total by construction: simply defers to the [`Ord`] implementation.
    fn partial_cmp(&self, other: &Self) -> Option<std::cmp::Ordering> {
        let ordering = Ord::cmp(self, other);
        Some(ordering)
    }
}

impl PartialEq for DocValueAndOrder {
    /// Two entries are equal when their values are equal; the sort order is not compared.
    fn eq(&self, other: &Self) -> bool {
        self.value == other.value
    }
}

// Marker impl: `Ord` requires `Eq`, and equality on the `Option<u64>` value is total.
impl Eq for DocValueAndOrder {}

/// The sort values of a document together with the field values retrieved for it.
///
/// Ordering and equality only take `sorts` into account; `doc_value_fields` is payload.
#[derive(Clone, Serialize, Deserialize, Debug)]
struct DocSortValuesAndFields {
    /// One entry per sort criterion, compared in sequence.
    sorts: Vec<DocValueAndOrder>,

    /// Retrieved field values, keyed by field name. Omitted from the serialized form
    /// when empty.
    #[serde(rename = "docvalue_fields")]
    #[serde(skip_serializing_if = "HashMap::is_empty")]
    doc_value_fields: HashMap<String, FastFieldValue>,
}

impl Ord for DocSortValuesAndFields {
    /// Compares the sort values pairwise, in sequence; the first pair that differs
    /// decides. Only as many pairs as the shorter of the two lists are compared, and
    /// the result is `Equal` when none of them differs.
    fn cmp(&self, other: &Self) -> std::cmp::Ordering {
        self.sorts
            .iter()
            .zip(&other.sorts)
            .map(|(lhs, rhs)| lhs.cmp(rhs))
            .find(|ordering| ordering.is_ne())
            .unwrap_or(std::cmp::Ordering::Equal)
    }
}

impl PartialOrd for DocSortValuesAndFields {
    /// Total by construction: simply defers to the [`Ord`] implementation.
    fn partial_cmp(&self, other: &Self) -> Option<std::cmp::Ordering> {
        let ordering = Ord::cmp(self, other);
        Some(ordering)
    }
}

impl PartialEq for DocSortValuesAndFields {
    /// Equality follows the ordering: two entries are equal when [`Ord::cmp`] says so,
    /// which means the retrieved field values play no part in it.
    fn eq(&self, other: &Self) -> bool {
        matches!(Ord::cmp(self, other), std::cmp::Ordering::Equal)
    }
}

// Marker impl: `Ord` requires `Eq`; equality is derived from the total order above.
impl Eq for DocSortValuesAndFields {}

/// The TopHitsCollector used for collecting over segments and merging results.
#[derive(Clone, Serialize, Deserialize, Debug)]
pub struct TopHitsTopNComputer {
    /// The request this computer serves; its `from` offset is applied when finalizing.
    req: TopHitsAggregationReq,
    /// Keeps the best `size + from` documents seen so far, keyed by their sort values.
    top_n: TopNComputer<DocSortValuesAndFields, DocAddress, ReverseComparator>,
}

// Two computers never compare equal, not even a computer with itself.
// NOTE(review): presumably this impl only exists to satisfy a `PartialEq` bound on the
// types embedding the computer - confirm before relying on equality of those types.
impl std::cmp::PartialEq for TopHitsTopNComputer {
    fn eq(&self, _other: &Self) -> bool {
        false
    }
}

impl TopHitsTopNComputer {
    /// Create a new TopHitsCollector
    ///
    /// The underlying top-n buffer is sized to `size + from`, since the first `from` hits are
    /// dropped again in [`Self::into_final_result`].
    pub fn new(req: &TopHitsAggregationReq) -> Self {
        Self {
            top_n: TopNComputer::new_with_comparator(
                req.size + req.from.unwrap_or(0),
                ReverseComparator,
            ),
            req: req.clone(),
        }
    }

    /// Offers a document, identified by `doc`, with its sort values and doc value fields to
    /// the top-n buffer.
    fn collect(&mut self, features: DocSortValuesAndFields, doc: DocAddress) {
        self.top_n.push(features, doc);
    }

    /// Merges the documents collected by `other_fruit` into `self`.
    pub(crate) fn merge_fruits(&mut self, other_fruit: Self) -> crate::Result<()> {
        for doc in other_fruit.top_n.into_vec() {
            self.collect(doc.sort_key, doc.doc);
        }
        Ok(())
    }

    /// Finalize by converting self into the final result form
    ///
    /// The first `from` hits (in sorted order) are left out of the result. If fewer than
    /// `from` hits were collected, the result is empty.
    pub fn into_final_result(self) -> TopHitsMetricResult {
        let from = self.req.from.unwrap_or(0);
        // The hits to drop are at the front of the sorted vec, so they are skipped rather
        // than truncated from the end. `skip` stops at the end of the iterator, so a `from`
        // larger than the number of collected hits yields no hits instead of panicking
        // (which `Vec::drain(..from)` would do).
        let hits: Vec<TopHitsVecEntry> = self
            .top_n
            .into_sorted_vec()
            .into_iter()
            .skip(from)
            .map(|doc| TopHitsVecEntry {
                sort: doc.sort_key.sorts.iter().map(|f| f.value).collect(),
                doc_value_fields: doc
                    .sort_key
                    .doc_value_fields
                    .into_iter()
                    .map(|(k, v)| (k, v.into()))
                    .collect(),
            })
            .collect();

        TopHitsMetricResult { hits }
    }
}

/// Segment-level collector of the top hits aggregation.
///
/// Keeps one top-n buffer per parent bucket; the buffers only store the sort values and the
/// document address.
#[derive(Clone, Debug)]
pub(crate) struct TopHitsSegmentCollector {
    /// Ordinal of the segment; stored in the `DocAddress` of every collected document.
    segment_ordinal: SegmentOrdinal,
    /// Index used to look up this aggregation's request data in the segment context.
    accessor_idx: usize,
    /// Top-n buffers, indexed by the parent `BucketId`.
    buckets: Vec<TopNComputer<Vec<DocValueAndOrder>, DocAddress, ReverseComparator>>,
    /// Capacity of each buffer: `size + from` of the request.
    num_hits: usize,
}

impl TopHitsSegmentCollector {
    /// Creates the collector for one segment, starting out with a single bucket.
    ///
    /// Every bucket keeps up to `size + from` documents.
    pub fn from_req(
        req: &TopHitsAggregationReq,
        accessor_idx: usize,
        segment_ordinal: SegmentOrdinal,
    ) -> Self {
        let num_hits = req.size + req.from.unwrap_or(0);
        let first_bucket = TopNComputer::new_with_comparator(num_hits, ReverseComparator);
        Self {
            segment_ordinal,
            accessor_idx,
            buckets: vec![first_bucket],
            num_hits,
        }
    }

    /// Takes the documents collected for `parent_bucket_id` out of the collector and returns
    /// them as a `TopHitsTopNComputer`, with the doc value fields of each document attached.
    ///
    /// The bucket is left behind as an empty computer of capacity 0. An unknown bucket id
    /// yields an empty computer.
    fn get_top_hits_computer(
        &mut self,
        parent_bucket_id: BucketId,
        value_accessors: &HashMap<String, Vec<DynamicColumn>>,
        req: &TopHitsAggregationReq,
    ) -> TopHitsTopNComputer {
        let mut top_hits_computer = TopHitsTopNComputer::new(req);
        let bucket = match self.buckets.get_mut(parent_bucket_id as usize) {
            Some(bucket) => bucket,
            None => return top_hits_computer,
        };
        let collected = std::mem::replace(bucket, TopNComputer::new(0));

        for entry in collected.into_vec() {
            let sort_values_and_fields = DocSortValuesAndFields {
                doc_value_fields: req.get_document_field_data(value_accessors, entry.doc.doc_id),
                sorts: entry.sort_key,
            };
            top_hits_computer.collect(sort_values_and_fields, entry.doc);
        }

        top_hits_computer
    }
}

impl SegmentAggregationCollector for TopHitsSegmentCollector {
    /// Moves the hits collected for `parent_bucket_id` into `results`, under the name of
    /// the aggregation request.
    fn add_intermediate_aggregation_result(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
        results: &mut crate::aggregation::intermediate_agg_result::IntermediateAggregationResults,
        parent_bucket_id: BucketId,
    ) -> crate::Result<()> {
        let req_data = agg_data.get_top_hits_req_data(self.accessor_idx);

        let top_hits = self.get_top_hits_computer(
            parent_bucket_id,
            &req_data.value_accessors,
            &req_data.req,
        );
        let metric = IntermediateMetricResult::TopHits(top_hits);

        results.push(
            req_data.name.to_string(),
            IntermediateAggregationResult::Metric(metric),
        )
    }

    /// Pushes every doc of `docs` into the top-n buffer of `parent_bucket_id`, keyed by the
    /// first value of each sort column (`None` if the doc has no value in that column).
    ///
    /// TODO: Consider a caching layer to reduce the call overhead
    fn collect(
        &mut self,
        parent_bucket_id: BucketId,
        docs: &[crate::DocId],
        agg_data: &mut AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        let bucket = &mut self.buckets[parent_bucket_id as usize];
        let segment_ord = self.segment_ordinal;
        let req_data = agg_data.get_top_hits_req_data(self.accessor_idx);
        let sort_keys = &req_data.req.sort;
        let accessors = &req_data.accessors;

        for &doc_id in docs {
            // TODO: this is terrible, a new vec is allocated for every doc
            // We can fetch blocks instead
            // We don't need to store the order for every value
            let sorts: Vec<DocValueAndOrder> = sort_keys
                .iter()
                .enumerate()
                .map(|(idx, key_order)| {
                    let accessor = accessors
                        .get(idx)
                        .expect("could not find field in accessors");
                    DocValueAndOrder {
                        value: accessor.0.values_for_doc(doc_id).next(),
                        order: key_order.order,
                    }
                })
                .collect();

            let doc_address = DocAddress {
                segment_ord,
                doc_id,
            };
            bucket.push(sorts, doc_address);
        }
        Ok(())
    }

    /// Resizes the bucket list to `max_bucket + 1` entries; added entries are empty buffers
    /// with the capacity of this collector.
    fn prepare_max_bucket(
        &mut self,
        max_bucket: BucketId,
        _agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        let num_buckets = (max_bucket as usize) + 1;
        let empty_bucket = TopNComputer::new_with_comparator(self.num_hits, ReverseComparator);
        self.buckets.resize(num_buckets, empty_bucket);
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use common::DateTime;
    use pretty_assertions::assert_eq;
    use serde_json::Value;
    use time::macros::datetime;

    use super::{DocSortValuesAndFields, DocValueAndOrder, Order};
    use crate::aggregation::agg_req::Aggregations;
    use crate::aggregation::agg_result::AggregationResults;
    use crate::aggregation::bucket::tests::get_test_index_from_docs;
    use crate::aggregation::tests::get_test_index_from_values;
    use crate::aggregation::AggregationCollector;
    use crate::collector::sort_key::ReverseComparator;
    use crate::collector::ComparableDoc;
    use crate::query::AllQuery;
    use crate::schema::OwnedValue;

    /// Returns `cmp_feature` with the same value but the opposite sort order.
    fn invert_order(cmp_feature: DocValueAndOrder) -> DocValueAndOrder {
        let flipped = match cmp_feature.order {
            Order::Desc => Order::Asc,
            Order::Asc => Order::Desc,
        };
        DocValueAndOrder {
            value: cmp_feature.value,
            order: flipped,
        }
    }

    /// Builds a `TopHitsTopNComputer` around a default request, with a top-n buffer of the
    /// given `capacity`.
    fn collector_with_capacity(capacity: usize) -> super::TopHitsTopNComputer {
        super::TopHitsTopNComputer {
            top_n: super::TopNComputer::new_with_comparator(capacity, ReverseComparator),
            req: Default::default(),
        }
    }

    fn invert_order_features(mut cmp_features: DocSortValuesAndFields) -> DocSortValuesAndFields {
        cmp_features.sorts = cmp_features
            .sorts
            .into_iter()
            .map(invert_order)
            .collect::<Vec<_>>();
        cmp_features
    }

    /// Checks the ordering of single sort values: ascending order compares by value,
    /// inverting the order flips the comparison of present values, and a missing value
    /// compares as smaller than a present one in both cases.
    #[test]
    fn test_comparable_doc_feature() -> crate::Result<()> {
        let small = DocValueAndOrder {
            value: Some(1),
            order: Order::Asc,
        };
        let big = DocValueAndOrder {
            value: Some(2),
            order: Order::Asc,
        };
        let none = DocValueAndOrder {
            value: None,
            order: Order::Asc,
        };

        assert!(small < big);
        assert!(none < small);
        assert!(none < big);

        // Same values with the opposite sort order.
        let small = invert_order(small);
        let big = invert_order(big);
        let none = invert_order(none);

        assert!(small > big);
        assert!(none < small);
        assert!(none < big);

        Ok(())
    }

    /// Checks that `DocSortValuesAndFields` compares by its sort values and that inverting
    /// the sort order inverts the comparison.
    #[test]
    fn test_comparable_doc_features() -> crate::Result<()> {
        let features_1 = DocSortValuesAndFields {
            sorts: vec![DocValueAndOrder {
                value: Some(1),
                order: Order::Asc,
            }],
            doc_value_fields: Default::default(),
        };

        let features_2 = DocSortValuesAndFields {
            sorts: vec![DocValueAndOrder {
                value: Some(2),
                order: Order::Asc,
            }],
            doc_value_fields: Default::default(),
        };

        assert!(features_1 < features_2);

        assert!(invert_order_features(features_1.clone()) > invert_order_features(features_2));

        Ok(())
    }

    /// A top hits aggregation over an index built from no values returns an empty `hits`
    /// list.
    #[test]
    fn test_aggregation_top_hits_empty_index() -> crate::Result<()> {
        let values = vec![];

        let index = get_test_index_from_values(false, &values)?;

        let d: Aggregations = serde_json::from_value(json!({
            "top_hits_req": {
                "top_hits": {
                    "size": 2,
                    "sort": [
                        { "date": "desc" }
                    ],
                    "from": 0,
                }
            }
        }))
        .unwrap();

        let collector = AggregationCollector::from_aggs(d, Default::default());

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();

        // Round-trip through a JSON string to compare against a plain `serde_json::Value`.
        let res: Value = serde_json::from_str(
            &serde_json::to_string(&agg_res).expect("JSON serialization failed"),
        )
        .expect("JSON parsing failed");

        assert_eq!(
            res,
            json!({
                "top_hits_req": {
                    "hits": []
                }
            })
        );

        Ok(())
    }

    /// Feeds three documents with a single ascending sort value (1, 3, 5) into a collector
    /// of capacity 3 and expects the final result to list them in that order.
    #[test]
    fn test_top_hits_collector_single_feature() -> crate::Result<()> {
        let docs = vec![
            ComparableDoc::<_, _> {
                doc: crate::DocAddress {
                    segment_ord: 0,
                    doc_id: 0,
                },
                sort_key: DocSortValuesAndFields {
                    sorts: vec![DocValueAndOrder {
                        value: Some(1),
                        order: Order::Asc,
                    }],
                    doc_value_fields: Default::default(),
                },
            },
            ComparableDoc {
                doc: crate::DocAddress {
                    segment_ord: 0,
                    doc_id: 2,
                },
                sort_key: DocSortValuesAndFields {
                    sorts: vec![DocValueAndOrder {
                        value: Some(3),
                        order: Order::Asc,
                    }],
                    doc_value_fields: Default::default(),
                },
            },
            ComparableDoc {
                doc: crate::DocAddress {
                    segment_ord: 0,
                    doc_id: 1,
                },
                sort_key: DocSortValuesAndFields {
                    sorts: vec![DocValueAndOrder {
                        value: Some(5),
                        order: Order::Asc,
                    }],
                    doc_value_fields: Default::default(),
                },
            },
        ];

        let mut collector = collector_with_capacity(3);
        for doc in docs.clone() {
            collector.collect(doc.sort_key, doc.doc);
        }

        let res = collector.into_final_result();

        // The hits only carry the sort values, so the expectation is built from `docs`.
        assert_eq!(
            res,
            super::TopHitsMetricResult {
                hits: vec![
                    super::TopHitsVecEntry {
                        sort: vec![docs[0].sort_key.sorts[0].value],
                        doc_value_fields: Default::default(),
                    },
                    super::TopHitsVecEntry {
                        sort: vec![docs[1].sort_key.sorts[0].value],
                        doc_value_fields: Default::default(),
                    },
                    super::TopHitsVecEntry {
                        sort: vec![docs[2].sort_key.sorts[0].value],
                        doc_value_fields: Default::default(),
                    },
                ]
            }
        );

        Ok(())
    }

    /// Runs a top hits aggregation (`size: 2`, `from: 1`, sorted by `date` descending) over
    /// four documents and checks the returned sort values and doc value fields.
    ///
    /// With `from: 1` the newest document (2018) is left out, so the documents from 2017
    /// and 2016 are expected. `merge_segments` is forwarded to `get_test_index_from_docs`.
    fn test_aggregation_top_hits(merge_segments: bool) -> crate::Result<()> {
        let docs = vec![
            vec![
                r#"{ "date": "2015-01-02T00:00:00Z", "text": "bbb", "text2": "bbb", "mixed": { "dyn_arr": [1, "2"] } }"#,
                r#"{ "date": "2017-06-15T00:00:00Z", "text": "ccc", "text2": "ddd", "mixed": { "dyn_arr": [3, "4"] } }"#,
            ],
            vec![
                r#"{ "text": "aaa", "text2": "bbb", "date": "2018-01-02T00:00:00Z", "mixed": { "dyn_arr": ["9", 8] } }"#,
                r#"{ "text": "aaa", "text2": "bbb", "date": "2016-01-02T00:00:00Z", "mixed": { "dyn_arr": ["7", 6] } }"#,
            ],
        ];

        let index = get_test_index_from_docs(merge_segments, &docs)?;

        let d: Aggregations = serde_json::from_value(json!({
            "top_hits_req": {
                "top_hits": {
                    "size": 2,
                    "sort": [
                        { "date": "desc" }
                    ],
                    "from": 1,
                    "docvalue_fields": [
                        "date",
                        "tex*",
                        "mixed.*",
                    ],
                }
            }
        }))?;

        let collector = AggregationCollector::from_aggs(d, Default::default());
        let reader = index.reader()?;
        let searcher = reader.searcher();

        let agg_res =
            serde_json::to_value(searcher.search(&AllQuery, &collector).unwrap()).unwrap();

        let date_2017 = datetime!(2017-06-15 00:00:00 UTC);
        let date_2016 = datetime!(2016-01-02 00:00:00 UTC);

        // The sort value is the nanosecond timestamp, mapped with `common::i64_to_u64`.
        assert_eq!(
            agg_res["top_hits_req"],
            json!({
                "hits": [
                    {
                        "sort": [common::i64_to_u64(date_2017.unix_timestamp_nanos() as i64)],
                        "docvalue_fields": {
                            "date": [ OwnedValue::Date(DateTime::from_utc(date_2017)) ],
                            "text": [ "ccc" ],
                            "text2": [ "ddd" ],
                            "mixed.dyn_arr": [ 3, "4" ],
                        }
                    },
                    {
                        "sort": [common::i64_to_u64(date_2016.unix_timestamp_nanos() as i64)],
                        "docvalue_fields": {
                            "date": [ OwnedValue::Date(DateTime::from_utc(date_2016)) ],
                            "text": [ "aaa" ],
                            "text2": [ "bbb" ],
                            "mixed.dyn_arr": [ 6, "7" ],
                        }
                    }
                ]
            }),
        );

        Ok(())
    }

    /// Runs the top hits scenario with `merge_segments = true`.
    #[test]
    fn test_aggregation_top_hits_single_segment() -> crate::Result<()> {
        test_aggregation_top_hits(true)
    }

    /// Runs the top hits scenario with `merge_segments = false`.
    #[test]
    fn test_aggregation_top_hits_multi_segment() -> crate::Result<()> {
        test_aggregation_top_hits(false)
    }
}


================================================
FILE: src/aggregation/mod.rs
================================================
//! # Aggregations
//!
//! An aggregation summarizes your data as statistics on buckets or metrics.
//!
//! Aggregations can provide answers to questions like:
//! - What is the average price of all sold articles?
//! - How many errors with status code 500 do we have per day?
//! - What is the average listing price of cars grouped by color?
//!
//! There are two categories: [Metrics](metric) and [Buckets](bucket).
//!
//! ## Prerequisite
//! Currently aggregations work only on [fast fields](`crate::fastfield`): fast fields
//! of type `u64`, `f64`, `i64`, `date`, and fast fields on text fields.
//!
//! ## Usage
//! To use aggregations, build an aggregation request by constructing
//! [`Aggregations`](agg_req::Aggregations).
//! Create an [`AggregationCollector`] from this request. `AggregationCollector` implements the
//! [`Collector`](crate::collector::Collector) trait and can be passed as collector into
//! [`Searcher::search()`](crate::Searcher::search).
//!
//!
//! ## JSON Format
//! Aggregations request and result structures de/serialize into elasticsearch compatible JSON.
//!
//! Notice: Intermediate aggregation results should not be de/serialized via JSON format.
//! Postcard is a good choice.
//!
//! ```verbatim
//! let agg_req: Aggregations = serde_json::from_str(json_request_string).unwrap();
//! let collector = AggregationCollector::from_aggs(agg_req, Default::default());
//! let searcher = reader.searcher();
//! let agg_res = searcher.search(&term_query, &collector).unwrap();
//! let json_response_string: String = serde_json::to_string(&agg_res)?;
//! ```
//!
//! ## Supported Aggregations
//! - [Bucket](bucket)
//!     - [Histogram](bucket::HistogramAggregation)
//!     - [DateHistogram](bucket::DateHistogramAggregationReq)
//!     - [Range](bucket::RangeAggregation)
//!     - [Terms](bucket::TermsAggregation)
//! - [Metric](metric)
//!     - [Average](metric::AverageAggregation)
//!     - [Stats](metric::StatsAggregation)
//!     - [ExtendedStats](metric::ExtendedStatsAggregation)
//!     - [Min](metric::MinAggregation)
//!     - [Max](metric::MaxAggregation)
//!     - [Sum](metric::SumAggregation)
//!     - [Count](metric::CountAggregation)
//!     - [Percentiles](metric::PercentilesAggregationReq)
//!     - [Cardinality](metric::CardinalityAggregationReq)
//!     - [TopHits](metric::TopHitsAggregationReq)
//!
//! # Example
//! Compute the average metric, by building [`agg_req::Aggregations`], which is built from an
//! `(String, agg_req::Aggregation)` iterator.
//!
//! Requests are compatible with the elasticsearch JSON request format.
//!
//! ```
//! use tantivy::aggregation::agg_req::Aggregations;
//!
//! let elasticsearch_compatible_json_req = r#"
//! {
//!   "average": {
//!     "avg": { "field": "score" }
//!   },
//!   "range": {
//!     "range": {
//!       "field": "score",
//!       "ranges": [
//!         { "to": 3.0 },
//!         { "from": 3.0, "to": 7.0 },
//!         { "from": 7.0, "to": 20.0 },
//!         { "from": 20.0 }
//!       ]
//!     },
//!     "aggs": {
//!       "average_in_range": { "avg": { "field": "score" } }
//!     }
//!   }
//! }
//! "#;
//! let agg_req: Aggregations =
//!     serde_json::from_str(elasticsearch_compatible_json_req).unwrap();
//! ```
//! # Code Organization
//!
//! Check the [README](https://github.com/quickwit-oss/tantivy/tree/main/src/aggregation#readme) on github to see how the code is organized.
//!
//! # Nested Aggregation
//!
//! Buckets can contain sub-aggregations. In this example we create buckets with the range
//! aggregation and then calculate the average on each bucket.
//! ```
//! use tantivy::aggregation::agg_req::*;
//! use serde_json::json;
//!
//! let agg_req_1: Aggregations = serde_json::from_value(json!({
//!     "rangef64": {
//!         "range": {
//!             "field": "score",
//!             "ranges": [
//!                 { "from": 3, "to": 7000 },
//!                 { "from": 7000, "to": 20000 },
//!                 { "from": 50000, "to": 60000 }
//!             ]
//!         },
//!         "aggs": {
//!             "average_in_range": { "avg": { "field": "score" } }
//!         }
//!     },
//! }))
//! .unwrap();
//! ```
//!
//! # Distributed Aggregation
//! When the data is distributed on different [`Index`](crate::Index) instances, the
//! [`DistributedAggregationCollector`] provides functionality to merge data between independent
//! search calls by returning
//! [`IntermediateAggregationResults`](intermediate_agg_result::IntermediateAggregationResults).
//! `IntermediateAggregationResults` provides the
//! [`merge_fruits`](intermediate_agg_result::IntermediateAggregationResults::merge_fruits) method
//! to merge multiple results. The merged result can then be converted into
//! [`AggregationResults`](agg_result::AggregationResults) via the
//! [`into_final_result`](intermediate_agg_result::IntermediateAggregationResults::into_final_result) method.

mod accessor_helpers;
mod agg_data;
mod agg_limits;
pub mod agg_req;
pub mod agg_result;
pub mod bucket;
pub(crate) mod cached_sub_aggs;
mod collector;
mod date;
mod error;
pub mod intermediate_agg_result;
pub mod metric;

mod segment_agg_result;
use std::fmt::Display;

#[cfg(test)]
mod agg_tests;

use core::fmt;

pub use agg_limits::AggregationLimitsGuard;
pub use collector::{
    AggregationCollector, AggregationSegmentCollector, DistributedAggregationCollector,
    DEFAULT_BUCKET_LIMIT,
};
use columnar::{ColumnType, MonotonicallyMappableToU64};
pub(crate) use date::format_date;
pub use error::AggregationError;
use itertools::Itertools;
use serde::de::{self, Visitor};
use serde::{Deserialize, Deserializer, Serialize};

use crate::tokenizer::TokenizerManager;

/// A bucket id is a dense identifier for a bucket within an aggregation.
/// It is used to index into a Vec that holds per-bucket data.
///
/// For example, in a terms aggregation, each unique term will be assigned an incremental
/// BucketId. This BucketId will be forwarded to sub-aggregations to identify the parent bucket.
///
/// This makes it possible to have a single AggregationCollector instance per aggregation
/// that can handle multiple buckets efficiently.
///
/// The API to call sub-aggregations is therefore a &[(BucketId, &[DocId])].
/// For that we'll need a buffer. One Vec per bucket aggregation is needed.
pub type BucketId = u32;

/// Context parameters for aggregation execution
///
/// This struct holds shared resources needed during aggregation execution:
/// - `limits`: Memory and bucket limits for the aggregation
/// - `tokenizers`: TokenizerManager for parsing query strings in filter aggregations
///
/// `AggContextParams::default()` uses the default value of both fields.
#[derive(Clone, Default)]
pub struct AggContextParams {
    /// Aggregation limits (memory and bucket count)
    pub limits: AggregationLimitsGuard,
    /// Tokenizer manager for query string parsing
    pub tokenizers: TokenizerManager,
}

impl AggContextParams {
    /// Create new aggregation context parameters from the given limits and tokenizer
    /// manager.
    pub fn new(limits: AggregationLimitsGuard, tokenizers: TokenizerManager) -> Self {
        Self { limits, tokenizers }
    }
}

fn parse_str_into_f64<E: de::Error>(value: &str) -> Result<f64, E> {
    let parsed = value
        .parse::<f64>()
        .map_err(|_err| de::Error::custom(format!("Failed to parse f64 from string: {value:?}")))?;

    // Check if the parsed value is NaN or infinity
    if parsed.is_nan() || parsed.is_infinite() {
        Err(de::Error::custom(format!(
            "Value is not a valid f64 (NaN or Infinity): {value:?}"
        )))
    } else {
        Ok(parsed)
    }
}

/// deserialize Option<f64> from string or float
pub(crate) fn deserialize_option_f64<'de, D>(deserializer: D) -> Result<Option<f64>, D::Error>
where D: Deserializer<'de> {
    struct StringOrFloatVisitor;

    impl Visitor<'_> for StringOrFloatVisitor {
        type Value = Option<f64>;

        fn expecting(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
            formatter.write_str("a string or a float")
        }

        fn visit_str<E>(self, value: &str) -> Result<Self::Value, E>
        where E: de::Error {
            parse_str_into_f64(value).map(Some)
        }

        fn visit_f64<E>(self, value: f64) -> Result<Self::Value, E>
        where E: de::Error {
            Ok(Some(value))
        }

        fn visit_i64<E>(self, value: i64) -> Result<Self::Value, E>
        where E: de::Error {
            Ok(Some(value as f64))
        }

        fn visit_u64<E>(self, value: u64) -> Result<Self::Value, E>
        where E: de::Error {
            Ok(Some(value as f64))
        }

        fn visit_none<E>(self) -> Result<Self::Value, E>
        where E: de::Error {
            Ok(None)
        }

        fn visit_unit<E>(self) -> Result<Self::Value, E>
        where E: de::Error {
            Ok(None)
        }
    }

    deserializer.deserialize_any(StringOrFloatVisitor)
}

/// deserialize f64 from string or float
pub(crate) fn deserialize_f64<'de, D>(deserializer: D) -> Result<f64, D::Error>
where D: Deserializer<'de> {
    struct StringOrFloatVisitor;

    impl Visitor<'_> for StringOrFloatVisitor {
        type Value = f64;

        fn expecting(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
            formatter.write_str("a string or a float")
        }

        fn visit_str<E>(self, value: &str) -> Result<Self::Value, E>
        where E: de::Error {
            parse_str_into_f64(value)
        }

        fn visit_f64<E>(self, value: f64) -> Result<Self::Value, E>
        where E: de::Error {
            Ok(value)
        }

        fn visit_i64<E>(self, value: i64) -> Result<Self::Value, E>
        where E: de::Error {
            Ok(value as f64)
        }

        fn visit_u64<E>(self, value: u64) -> Result<Self::Value, E>
        where E: de::Error {
            Ok(value as f64)
        }
    }

    deserializer.deserialize_any(StringOrFloatVisitor)
}

/// A key in its serialized form, which is a `String`.
/// The serialized key is used in a `HashMap`.
pub type SerializedKey = String;

#[derive(Clone, Debug, Serialize, Deserialize, PartialOrd)]
/// The key to identify a bucket.
///
/// The order of the variants is important: with `#[serde(untagged)]` the variants are tried
/// in declaration order during deserialization, so an integer is tried as `i64` before `u64`
/// and `f64`.
#[serde(untagged)]
pub enum Key {
    /// String key
    Str(String),
    /// `i64` key
    I64(i64),
    /// `u64` key
    U64(u64),
    /// `f64` key
    F64(f64),
}
impl Eq for Key {}
// Hashing mirrors the `PartialEq` impl of `Key`: the variant is hashed first, then the
// payload, with `f64` payloads hashed through their bit pattern.
impl std::hash::Hash for Key {
    fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
        let variant = core::mem::discriminant(self);
        variant.hash(state);
        match self {
            Key::I64(number) => number.hash(state),
            Key::U64(number) => number.hash(state),
            Key::F64(number) => number.to_bits().hash(state),
            Key::Str(text) => text.hash(state),
        }
    }
}

impl PartialEq for Key {
    fn eq(&self, other: &Self) -> bool {
        match (self, other) {
            (Self::Str(l), Self::Str(r)) => l == r,
            (Self::F64(l), Self::F64(r)) => l.to_bits() == r.to_bits(),
            (Self::I64(l), Self::I64(r)) => l == r,
            (Self::U64(l), Self::U64(r)) => l == r,
            // we list all variant of left operand to make sure this gets updated when we add
            // variants to the enum
            (Self::Str(_) | Self::F64(_) | Self::I64(_) | Self::U64(_), _) => false,
        }
    }
}

// Writes the payload of the key: strings as they are, numbers in their default `Display`
// form. Formatting flags of the caller (width, fill, ...) are not applied.
impl Display for Key {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        match self {
            Key::Str(text) => f.write_str(text),
            Key::I64(number) => write!(f, "{}", number),
            Key::U64(number) => write!(f, "{}", number),
            Key::F64(number) => write!(f, "{}", number),
        }
    }
}

/// Converts a fast field `u64` value to `f64`, for the column type given by
/// `COLUMN_TYPE_ID` (a `ColumnType` cast to `u8`).
///
/// `u64` and `bool` columns are cast directly, `i64` and `date` columns are mapped back to
/// `i64` first, and `f64` columns are mapped back to `f64`.
///
/// # Panics
/// Panics for any other column type id.
pub(crate) fn convert_to_f64<const COLUMN_TYPE_ID: u8>(val: u64) -> f64 {
    match COLUMN_TYPE_ID {
        id if id == ColumnType::U64 as u8 || id == ColumnType::Bool as u8 => val as f64,
        id if id == ColumnType::I64 as u8 || id == ColumnType::DateTime as u8 => {
            i64::from_u64(val) as f64
        }
        id if id == ColumnType::F64 as u8 => f64::from_u64(val),
        _ => panic!(
            "ColumnType ID {} cannot be converted to f64 metric",
            COLUMN_TYPE_ID
        ),
    }
}

/// Inverse of `to_fastfield_u64`. Used to convert to `f64` for metrics.
///
/// Dispatches on `field_type` to the matching `convert_to_f64` instantiation.
///
/// # Panics
/// Only `u64`, `i64`, `f64`, `bool` and `date` are supported; any other column type panics.
pub(crate) fn f64_from_fastfield_u64(val: u64, field_type: ColumnType) -> f64 {
    match field_type {
        ColumnType::U64 => convert_to_f64::<{ ColumnType::U64 as u8 }>(val),
        ColumnType::I64 => convert_to_f64::<{ ColumnType::I64 as u8 }>(val),
        ColumnType::F64 => convert_to_f64::<{ ColumnType::F64 as u8 }>(val),
        ColumnType::Bool => convert_to_f64::<{ ColumnType::Bool as u8 }>(val),
        ColumnType::DateTime => convert_to_f64::<{ ColumnType::DateTime as u8 }>(val),
        _ => panic!("unexpected type {field_type:?}. This should not happen"),
    }
}

/// Maps an `f64` into the value space of a fast field, which is always `u64`.
///
/// - `u64` and `bool` columns: the value is cast with `as u64`.
/// - `i64` and `date` columns: the value is cast to `i64` and then mapped to `u64`.
/// - `f64` columns: the value is mapped to `u64` using a monotonic mapping. A value of e.g.
///   `2.0` has to go through the same conversion as the stored values, so that it matches
///   the `u64` stored in the fast field.
///
/// Returns `None` for every other column type.
pub(crate) fn f64_to_fastfield_u64(val: f64, field_type: &ColumnType) -> Option<u64> {
    let mapped = match field_type {
        ColumnType::U64 | ColumnType::Bool => val as u64,
        ColumnType::I64 | ColumnType::DateTime => (val as i64).to_u64(),
        ColumnType::F64 => val.to_u64(),
        _ => return None,
    };
    Some(mapped)
}

#[cfg(test)]
mod tests {
    use std::net::Ipv6Addr;

    use columnar::DateTime;
    use serde_json::Value;
    use time::OffsetDateTime;

    use super::agg_req::Aggregations;
    use super::*;
    use crate::indexer::NoMergePolicy;
    use crate::query::{AllQuery, TermQuery};
    use crate::schema::{IndexRecordOption, Schema, TextFieldIndexing, FAST, STRING};
    use crate::{Index, IndexWriter, Term};

    /// Builds a test index from the values `0.0, 1.0, .., (num_docs - 1) as f64` by
    /// delegating to `get_test_index_from_values`.
    pub fn get_test_index_with_num_docs(
        merge_segments: bool,
        num_docs: usize,
    ) -> crate::Result<Index> {
        let values: Vec<f64> = (0..num_docs).map(|doc_idx| doc_idx as f64).collect();
        get_test_index_from_values(merge_segments, &values)
    }

    /// Runs `agg_req` against every document of `index` (no query filter) and returns
    /// the aggregation result as JSON.
    pub fn exec_request(agg_req: Aggregations, index: &Index) -> crate::Result<Value> {
        exec_request_with_query(agg_req, index, None)
    }
    /// Runs `agg_req` against `index` with default aggregation limits.
    ///
    /// `query` is an optional `(field_name, term)` pair; when it is `None` all documents
    /// are aggregated.
    pub fn exec_request_with_query(
        agg_req: Aggregations,
        index: &Index,
        query: Option<(&str, &str)>,
    ) -> crate::Result<Value> {
        exec_request_with_query_and_memory_limit(agg_req, index, query, Default::default())
    }

    /// Executes `agg_req` on `index` under the given `limits` and returns the result as
    /// JSON.
    ///
    /// With `query = Some((field, term))` only documents matching a term query on that
    /// field are aggregated; with `None` every document is. The result goes through a
    /// serialize/deserialize roundtrip so that serialization is exercised as well.
    ///
    /// # Panics
    /// Panics if the queried field does not exist in the schema.
    pub fn exec_request_with_query_and_memory_limit(
        agg_req: Aggregations,
        index: &Index,
        query: Option<(&str, &str)>,
        limits: AggregationLimitsGuard,
    ) -> crate::Result<Value> {
        let collector = AggregationCollector::from_aggs(
            agg_req,
            AggContextParams::new(limits, index.tokenizers().clone()),
        );

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let agg_res = match query {
            Some((field, term)) => {
                let text_field = reader.searcher().schema().get_field(field).unwrap();
                let term_query = TermQuery::new(
                    Term::from_field_text(text_field, term),
                    IndexRecordOption::Basic,
                );
                searcher.search(&term_query, &collector)?
            }
            None => searcher.search(&AllQuery, &collector)?,
        };

        // Test serialization/deserialization roundtrip
        let serialized = serde_json::to_string(&agg_res)?;
        let res: Value = serde_json::from_str(&serialized)?;
        Ok(res)
    }

    /// Builds a test index in which every entry of `values` is committed on its own,
    /// using the value's string form as its term.
    pub fn get_test_index_from_values(
        merge_segments: bool,
        values: &[f64],
    ) -> crate::Result<Index> {
        // One single-document batch per value.
        let segment_and_values: Vec<Vec<(f64, String)>> = values
            .iter()
            .map(|value| vec![(*value, value.to_string())])
            .collect();
        get_test_index_from_values_and_terms(merge_segments, &segment_and_values)
    }

    /// Builds a test index from lists of terms.
    ///
    /// Each inner list of `values` is passed on as one batch of documents; within a
    /// batch, the numeric value of a document is the position of its term in the list.
    pub fn get_test_index_from_terms(
        merge_segments: bool,
        values: &[Vec<&str>],
    ) -> crate::Result<Index> {
        // Every inner list of terms gets its own batch (committed separately downstream);
        // the term's index inside the list is used as the document's numeric value.
        let segment_and_values = values
            .iter()
            .map(|terms| {
                terms
                    .iter()
                    .enumerate()
                    .map(|(i, term)| (i as f64, term.to_string()))
                    .collect()
            })
            .collect::<Vec<_>>();
        get_test_index_from_values_and_terms(merge_segments, &segment_and_values)
    }

    /// Builds an in-RAM test index from batches of `(value, term)` pairs.
    ///
    /// Every document gets the constant text `"cool"`, the term in `text_id` and
    /// `string_id`, and the value in `score` (as `u64`), `score_f64`, `score_i64` and
    /// `fraction_f64` (value divided by 100). Each element of `segment_and_values` is
    /// committed separately. If `merge_segments` is set and more than one segment is
    /// searchable afterwards, all segments are merged.
    pub fn get_test_index_from_values_and_terms(
        merge_segments: bool,
        segment_and_values: &[Vec<(f64, String)>],
    ) -> crate::Result<Index> {
        let mut schema_builder = Schema::builder();
        let text_fieldtype = crate::schema::TextOptions::default()
            .set_indexing_options(
                TextFieldIndexing::default()
                    .set_index_option(IndexRecordOption::Basic)
                    .set_fieldnorms(false),
            )
            .set_fast(None)
            .set_stored();
        let text_field = schema_builder.add_text_field("text", text_fieldtype.clone());
        let text_field_id = schema_builder.add_text_field("text_id", text_fieldtype);
        let string_field_id = schema_builder.add_text_field("string_id", STRING | FAST);
        let score_fieldtype = crate::schema::NumericOptions::default().set_fast();
        let score_field = schema_builder.add_u64_field("score", score_fieldtype.clone());
        let score_field_f64 = schema_builder.add_f64_field("score_f64", score_fieldtype.clone());
        let score_field_i64 = schema_builder.add_i64_field("score_i64", score_fieldtype);
        let fraction_field = schema_builder.add_f64_field(
            "fraction_f64",
            crate::schema::NumericOptions::default().set_fast(),
        );
        let index = Index::create_in_ram(schema_builder.build());
        {
            // A single indexing thread is used, and `NoMergePolicy` is installed so that
            // (presumably) the per-commit segments are not merged in the background.
            let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
            index_writer.set_merge_policy(Box::new(NoMergePolicy));
            for values in segment_and_values {
                for (i, term) in values {
                    let i = *i;
                    // writing the segment
                    index_writer.add_document(doc!(
                        text_field => "cool",
                        text_field_id => term.to_string(),
                        string_field_id => term.to_string(),
                        score_field => i as u64,
                        score_field_f64 => i,
                        score_field_i64 => i as i64,
                        fraction_field => i/100.0,
                    ))?;
                }
                // One commit per batch.
                index_writer.commit()?;
            }
        }
        if merge_segments {
            let segment_ids = index
                .searchable_segment_ids()
                .expect("Searchable segments failed.");
            // Merging is only attempted when there is more than one segment.
            if segment_ids.len() > 1 {
                let mut index_writer: IndexWriter = index.writer_for_tests()?;
                index_writer.merge(&segment_ids).wait()?;
                index_writer.wait_merging_threads()?;
            }
        }

        Ok(index)
    }

    /// Builds an in-RAM test index with text, date, numeric and IP address fast fields.
    ///
    /// Documents are written in three commits: five documents, then three documents,
    /// then a single document whose text is `"nohit"`. Only the first two documents
    /// carry values for `scores_i64` (two values each), and only the first document has
    /// an `ip_addr`.
    ///
    /// If `merge_segments` is set, all searchable segments are merged afterwards.
    pub fn get_test_index_2_segments(merge_segments: bool) -> crate::Result<Index> {
        let mut schema_builder = Schema::builder();
        let text_fieldtype = crate::schema::TextOptions::default()
            .set_indexing_options(
                TextFieldIndexing::default().set_index_option(IndexRecordOption::WithFreqs),
            )
            .set_fast(Some("raw"))
            .set_stored();
        let text_field = schema_builder.add_text_field("text", text_fieldtype);
        let date_field = schema_builder.add_date_field("date", FAST);
        schema_builder.add_text_field("dummy_text", STRING);
        let score_fieldtype = crate::schema::NumericOptions::default().set_fast();
        let score_field = schema_builder.add_u64_field("score", score_fieldtype.clone());
        let score_field_f64 = schema_builder.add_f64_field("score_f64", score_fieldtype.clone());
        let ip_addr_field = schema_builder.add_ip_addr_field("ip_addr", FAST);

        // `scores_i64` receives several values per document below.
        let multivalue = crate::schema::NumericOptions::default().set_fast();
        let scores_field_i64 = schema_builder.add_i64_field("scores_i64", multivalue);

        let score_field_i64 = schema_builder.add_i64_field("score_i64", score_fieldtype);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut index_writer = index.writer_for_tests()?;
            // writing the segment
            index_writer.add_document(doc!(
                text_field => "cool",
                date_field => DateTime::from_utc(OffsetDateTime::from_unix_timestamp(1_546_300_800).unwrap()),
                score_field => 1u64,
                ip_addr_field => Ipv6Addr::from(1u128),
                score_field_f64 => 1f64,
                score_field_i64 => 1i64,
                scores_field_i64 => 1i64,
                scores_field_i64 => 2i64,
            ))?;
            index_writer.add_document(doc!(
                text_field => "cool",
                date_field => DateTime::from_utc(OffsetDateTime::from_unix_timestamp(1_546_300_800 + 86400).unwrap()),
                score_field => 3u64,
                score_field_f64 => 3f64,
                score_field_i64 => 3i64,
                scores_field_i64 => 5i64,
                scores_field_i64 => 5i64,
            ))?;
            index_writer.add_document(doc!(
                text_field => "cool",
                date_field => DateTime::from_utc(OffsetDateTime::from_unix_timestamp(1_546_300_800 + 86400).unwrap()),
                score_field => 5u64,
                score_field_f64 => 5f64,
                score_field_i64 => 5i64,
            ))?;
            index_writer.add_document(doc!(
                text_field => "nohit",
                date_field => DateTime::from_utc(OffsetDateTime::from_unix_timestamp(1_546_300_800 + 86400).unwrap()),
                score_field => 6u64,
                score_field_f64 => 6f64,
                score_field_i64 => 6i64,
            ))?;
            index_writer.add_document(doc!(
                text_field => "cool",
                date_field => DateTime::from_utc(OffsetDateTime::from_unix_timestamp(1_546_300_800 + 86400).unwrap()),
                score_field => 7u64,
                score_field_f64 => 7f64,
                score_field_i64 => 7i64,
            ))?;
            // End of the first batch.
            index_writer.commit()?;
            index_writer.add_document(doc!(
                text_field => "cool",
                date_field => DateTime::from_utc(OffsetDateTime::from_unix_timestamp(1_546_300_800 + 86400).unwrap()),
                score_field => 11u64,
                score_field_f64 => 11f64,
                score_field_i64 => 11i64,
            ))?;
            index_writer.add_document(doc!(
                text_field => "cool",
                date_field => DateTime::from_utc(OffsetDateTime::from_unix_timestamp(1_546_300_800 + 86400 + 86400).unwrap()),
                score_field => 14u64,
                score_field_f64 => 14f64,
                score_field_i64 => 14i64,
            ))?;

            index_writer.add_document(doc!(
                text_field => "cool",
                date_field => DateTime::from_utc(OffsetDateTime::from_unix_timestamp(1_546_300_800 + 86400 + 86400).unwrap()),
                score_field => 44u64,
                score_field_f64 => 44.5f64,
                score_field_i64 => 44i64,
            ))?;

            // End of the second batch.
            index_writer.commit()?;

            // no hits segment
            index_writer.add_document(doc!(
                text_field => "nohit",
                date_field => DateTime::from_utc(OffsetDateTime::from_unix_timestamp(1_546_300_800 + 86400 + 86400).unwrap()),
                score_field => 44u64,
                score_field_f64 => 44.5f64,
                score_field_i64 => 44i64,
            ))?;

            index_writer.commit()?;
        }
        if merge_segments {
            let segment_ids = index
                .searchable_segment_ids()
                .expect("Searchable segments failed.");
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            index_writer.merge(&segment_ids).wait()?;
            index_writer.wait_merging_threads()?;
        }

        Ok(index)
    }
}


================================================
FILE: src/aggregation/segment_agg_result.rs
================================================
//! Contains aggregation trees which are used during collection in a segment.
//! These trees contain data structures optimized for fast collection.
//! A tree can be converted to an intermediate tree, which contains data structures optimized for
//! merging.

use std::fmt::Debug;

pub(crate) use super::agg_limits::AggregationLimitsGuard;
use super::intermediate_agg_result::IntermediateAggregationResults;
use crate::aggregation::agg_data::AggregationsSegmentCtx;
use crate::aggregation::BucketId;

/// Hands out `BucketId`s in increasing order, starting at `0` for a default-constructed
/// provider.
#[derive(Debug, Clone, Default)]
pub struct BucketIdProvider(u32);
impl BucketIdProvider {
    /// Returns the current id and advances the provider by one.
    pub fn next_bucket_id(&mut self) -> BucketId {
        let following = self.0 + 1;
        std::mem::replace(&mut self.0, following)
    }
}

/// A SegmentAggregationCollector is used to collect aggregation results.
pub trait SegmentAggregationCollector: Debug {
    /// Adds what this collector gathered for `parent_bucket_id` to `results`.
    ///
    /// NOTE(review): contract inferred from the signature; confirm against implementors.
    fn add_intermediate_aggregation_result(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
        results: &mut IntermediateAggregationResults,
        parent_bucket_id: BucketId,
    ) -> crate::Result<()>;

    /// Collects `docs` into the bucket `parent_bucket_id`.
    ///
    /// Note: The caller needs to call `prepare_max_bucket` before calling `collect`.
    fn collect(
        &mut self,
        parent_bucket_id: BucketId,
        docs: &[crate::DocId],
        agg_data: &mut AggregationsSegmentCtx,
    ) -> crate::Result<()>;

    /// Collect docs for multiple buckets in one call.
    /// Minimizes dynamic dispatch overhead when collecting many buckets.
    ///
    /// `bucket_ids[i]` is the bucket of `docs[i]`. The default implementation issues one
    /// `collect` call per run of consecutive equal bucket ids.
    ///
    /// Note: The caller needs to call `prepare_max_bucket` before calling `collect`.
    fn collect_multiple(
        &mut self,
        bucket_ids: &[BucketId],
        docs: &[crate::DocId],
        agg_data: &mut AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        debug_assert_eq!(bucket_ids.len(), docs.len());
        let total = bucket_ids.len();
        let mut run_start = 0;
        while run_start < total {
            let run_bucket = bucket_ids[run_start];
            // Length of the run of identical bucket ids beginning at `run_start`; it is at
            // least 1 because the first element always matches itself.
            let run_len = bucket_ids[run_start..]
                .iter()
                .take_while(|&&candidate| candidate == run_bucket)
                .count();
            let run_end = run_start + run_len;
            self.collect(run_bucket, &docs[run_start..run_end], agg_data)?;
            run_start = run_end;
        }
        Ok(())
    }

    /// Prepare the collector for collecting up to BucketId `max_bucket`.
    /// This is useful so we can split allocation ahead of time of collecting.
    fn prepare_max_bucket(
        &mut self,
        max_bucket: BucketId,
        agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<()>;

    /// Finalize method. Some aggregators stage blocks of docs before collecting them.
    /// This method ensures those staged docs will be collected.
    ///
    /// The default implementation does nothing.
    fn flush(&mut self, _agg_data: &mut AggregationsSegmentCtx) -> crate::Result<()> {
        Ok(())
    }
}

#[derive(Default)]
/// The GenericSegmentAggregationResultsCollector is the generic version of the collector, which
/// can handle arbitrary complexity of sub-aggregations. Ideally we never have to pick this one
/// and can provide specialized versions instead, that remove some of its overhead.
pub(crate) struct GenericSegmentAggregationResultsCollector {
    // Child collectors; every trait call on this collector is forwarded to each of them
    // in order.
    pub(crate) aggs: Vec<Box<dyn SegmentAggregationCollector>>,
}

impl Debug for GenericSegmentAggregationResultsCollector {
    /// Formats the collector as a struct named `SegmentAggregationResultsCollector` with
    /// its `aggs` field.
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let mut builder = f.debug_struct("SegmentAggregationResultsCollector");
        builder.field("aggs", &self.aggs);
        builder.finish()
    }
}

impl SegmentAggregationCollector for GenericSegmentAggregationResultsCollector {
    /// Forwards to every child collector in order, stopping at the first error.
    fn add_intermediate_aggregation_result(
        &mut self,
        agg_data: &AggregationsSegmentCtx,
        results: &mut IntermediateAggregationResults,
        parent_bucket_id: BucketId,
    ) -> crate::Result<()> {
        self.aggs.iter_mut().try_for_each(|child| {
            child.add_intermediate_aggregation_result(agg_data, &mut *results, parent_bucket_id)
        })
    }

    /// Passes `docs` to every child collector in order, stopping at the first error.
    fn collect(
        &mut self,
        parent_bucket_id: BucketId,
        docs: &[crate::DocId],
        agg_data: &mut AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        self.aggs
            .iter_mut()
            .try_for_each(|child| child.collect(parent_bucket_id, docs, &mut *agg_data))
    }

    /// Flushes every child collector in order, stopping at the first error.
    fn flush(&mut self, agg_data: &mut AggregationsSegmentCtx) -> crate::Result<()> {
        self.aggs
            .iter_mut()
            .try_for_each(|child| child.flush(&mut *agg_data))
    }

    /// Prepares every child collector for `max_bucket`, stopping at the first error.
    fn prepare_max_bucket(
        &mut self,
        max_bucket: BucketId,
        agg_data: &AggregationsSegmentCtx,
    ) -> crate::Result<()> {
        self.aggs
            .iter_mut()
            .try_for_each(|child| child.prepare_max_bucket(max_bucket, agg_data))
    }
}


================================================
FILE: src/collector/count_collector.rs
================================================
use super::Collector;
use crate::collector::SegmentCollector;
use crate::{DocId, Score, SegmentOrdinal, SegmentReader};

/// The `Count` collector only counts how many
/// documents match the query.
///
/// Its fruit is a `usize`, and it does not require scoring.
///
/// ```rust
/// use tantivy::collector::Count;
/// use tantivy::query::QueryParser;
/// use tantivy::schema::{Schema, TEXT};
/// use tantivy::{doc, Index};
///
/// let mut schema_builder = Schema::builder();
/// let title = schema_builder.add_text_field("title", TEXT);
/// let schema = schema_builder.build();
/// let index = Index::create_in_ram(schema);
///
/// let mut index_writer = index.writer(15_000_000).unwrap();
/// index_writer.add_document(doc!(title => "The Name of the Wind")).unwrap();
/// index_writer.add_document(doc!(title => "The Diary of Muadib")).unwrap();
/// index_writer.add_document(doc!(title => "A Dairy Cow")).unwrap();
/// index_writer.add_document(doc!(title => "The Diary of a Young Girl")).unwrap();
/// assert!(index_writer.commit().is_ok());
///
/// let reader = index.reader().unwrap();
/// let searcher = reader.searcher();
///
/// // Here comes the important part
/// let query_parser = QueryParser::for_index(&index, vec![title]);
/// let query = query_parser.parse_query("diary").unwrap();
/// let count = searcher.search(&query, &Count).unwrap();
///
/// assert_eq!(count, 2);
/// ```
pub struct Count;

impl Collector for Count {
    type Fruit = usize;

    type Child = SegmentCountCollector;

    /// Creates a fresh per-segment counter starting at zero; the segment itself is not
    /// inspected.
    fn for_segment(
        &self,
        _: SegmentOrdinal,
        _: &SegmentReader,
    ) -> crate::Result<SegmentCountCollector> {
        let segment_collector = SegmentCountCollector::default();
        Ok(segment_collector)
    }

    /// Counting never needs scores.
    fn requires_scoring(&self) -> bool {
        false
    }

    /// Adds up the per-segment counts.
    fn merge_fruits(&self, segment_counts: Vec<usize>) -> crate::Result<usize> {
        let total: usize = segment_counts.iter().sum();
        Ok(total)
    }
}

/// Per-segment counter used by `Count`; starts at zero via `Default`.
#[derive(Default)]
pub struct SegmentCountCollector {
    // Number of documents collected so far in this segment.
    count: usize,
}

impl SegmentCollector for SegmentCountCollector {
    type Fruit = usize;

    /// Counts one more document; the doc id and score are ignored.
    fn collect(&mut self, _: DocId, _: Score) {
        self.count += 1;
    }

    /// Returns the number of documents collected in this segment.
    fn harvest(self) -> usize {
        self.count
    }
}

#[cfg(test)]
mod tests {
    use super::{Count, SegmentCountCollector};
    use crate::collector::{Collector, SegmentCollector};

    /// `Count` must report that it does not need scores.
    #[test]
    fn test_count_collect_does_not_requires_scoring() {
        assert!(!Count.requires_scoring());
    }

    /// The harvested count equals the number of `collect` calls.
    #[test]
    fn test_segment_count_collector() {
        // No document collected.
        {
            let count_collector = SegmentCountCollector::default();
            assert_eq!(count_collector.harvest(), 0);
        }
        // One document collected.
        {
            let mut count_collector = SegmentCountCollector::default();
            count_collector.collect(0u32, 1.0);
            assert_eq!(count_collector.harvest(), 1);
        }
        // NOTE(review): identical to the previous scenario; possibly a leftover duplicate.
        {
            let mut count_collector = SegmentCountCollector::default();
            count_collector.collect(0u32, 1.0);
            assert_eq!(count_collector.harvest(), 1);
        }
        // Two documents collected.
        {
            let mut count_collector = SegmentCountCollector::default();
            count_collector.collect(0u32, 1.0);
            count_collector.collect(1u32, 1.0);
            assert_eq!(count_collector.harvest(), 2);
        }
    }
}


================================================
FILE: src/collector/docset_collector.rs
================================================
use std::collections::HashSet;

use super::{Collector, SegmentCollector};
use crate::{DocAddress, DocId, Score};

/// Collector that returns the set of `DocAddress`es matching the query.
///
/// This collector is mostly useful for tests.
pub struct DocSetCollector;

impl Collector for DocSetCollector {
    type Fruit = HashSet<DocAddress>;
    type Child = DocSetChildCollector;

    /// Creates an empty per-segment collector that remembers the segment's ordinal.
    fn for_segment(
        &self,
        segment_local_id: crate::SegmentOrdinal,
        _segment: &crate::SegmentReader,
    ) -> crate::Result<Self::Child> {
        let docs = HashSet::new();
        Ok(DocSetChildCollector {
            segment_local_id,
            docs,
        })
    }

    /// Scores are never looked at.
    fn requires_scoring(&self) -> bool {
        false
    }

    /// Combines the per-segment doc id sets into a single set of `DocAddress`es, pairing
    /// every doc id with the ordinal of the segment it came from.
    fn merge_fruits(
        &self,
        segment_fruits: Vec<(u32, HashSet<DocId>)>,
    ) -> crate::Result<Self::Fruit> {
        // Size the result up front from the per-segment set sizes.
        let total_docs: usize = segment_fruits.iter().map(|(_, docs)| docs.len()).sum();
        let mut addresses = HashSet::with_capacity(total_docs);
        for (segment_ord, docs) in segment_fruits {
            addresses.extend(docs.into_iter().map(|doc| DocAddress::new(segment_ord, doc)));
        }
        Ok(addresses)
    }
}

/// Per-segment collector of `DocSetCollector`.
pub struct DocSetChildCollector {
    // Ordinal of the segment this collector was created for.
    segment_local_id: u32,
    // Doc ids collected so far in this segment.
    docs: HashSet<DocId>,
}

impl SegmentCollector for DocSetChildCollector {
    type Fruit = (u32, HashSet<DocId>);

    /// Records `doc`; the score is ignored.
    fn collect(&mut self, doc: crate::DocId, _score: Score) {
        self.docs.insert(doc);
    }

    /// Returns the segment ordinal together with the collected doc ids.
    fn harvest(self) -> (u32, HashSet<DocId>) {
        (self.segment_local_id, self.docs)
    }
}


================================================
FILE: src/collector/facet_collector.rs
================================================
use std::cmp::Ordering;
use std::collections::{btree_map, BTreeMap, BTreeSet, BinaryHeap};
use std::io;
use std::ops::Bound;

use crate::collector::{Collector, SegmentCollector};
use crate::fastfield::FacetReader;
use crate::schema::Facet;
use crate::{DocId, Score, SegmentOrdinal, SegmentReader};

/// A facet together with its document count.
///
/// Hits are ordered by *descending* count, ties being broken by ascending facet.
/// Equality follows the same key (count and facet), so that `==` agrees with `cmp`
/// as required by the `Ord`/`PartialEq` contract.
struct Hit<'a> {
    count: u64,
    facet: &'a Facet,
}

impl Eq for Hit<'_> {}

impl<'a> PartialEq<Hit<'a>> for Hit<'a> {
    /// Two hits are equal when both their count and their facet are equal.
    ///
    /// Comparing the count alone would make `a == b` hold for hits that `cmp` orders
    /// as different, which breaks the consistency `Ord` requires.
    fn eq(&self, other: &Hit<'_>) -> bool {
        self.count == other.count && self.facet == other.facet
    }
}

impl<'a> PartialOrd<Hit<'a>> for Hit<'a> {
    /// Delegates to the total order defined by `Ord`.
    fn partial_cmp(&self, other: &Hit<'_>) -> Option<Ordering> {
        Some(self.cmp(other))
    }
}

impl Ord for Hit<'_> {
    /// Higher counts sort first (the count comparison is reversed); equal counts are
    /// ordered by facet.
    fn cmp(&self, other: &Self) -> Ordering {
        other
            .count
            .cmp(&self.count)
            .then(self.facet.cmp(other.facet))
    }
}

/// Returns the number of segments in an encoded facet.
///
/// An empty byte string has depth `0`; otherwise the depth is the number of `0u8`
/// separator bytes plus one.
fn facet_depth(facet_bytes: &[u8]) -> usize {
    match facet_bytes {
        [] => 0,
        bytes => 1 + bytes.iter().filter(|&&byte| byte == 0u8).count(),
    }
}

/// Collector for faceting
///
/// The collector collects all facets. You need to configure it
/// beforehand with the facet you want to extract.
///
/// This is done by calling `.add_facet(...)` with the root of the
/// facet you want to extract as argument.
///
/// Facet counts will only be computed for the facet that are direct children
/// of such a root facet.
///
/// For instance, if your index represents books, your hierarchy of facets
/// may contain `category`, `language`.
///
/// The category facet may include `subcategories`. For instance, a book
/// could belong to `/category/fiction/fantasy`.
///
/// If you request the facet counts for `/category`, the result will be
/// the breakdown of counts for the direct children of `/category`
/// (e.g. `/category/fiction`, `/category/biography`, `/category/personal_development`).
///
/// Once collection is finished, you can harvest its results in the form
/// of a [`FacetCounts`] object, and extract your facet counts from it.
///
/// This implementation assumes you are working with a number of facets that
/// is many hundreds of times smaller than your number of documents.
///
///
/// ```rust
/// use tantivy::collector::FacetCollector;
/// use tantivy::query::AllQuery;
/// use tantivy::schema::{Facet, Schema, FacetOptions, TEXT};
/// use tantivy::{doc, Index};
///
/// fn example() -> tantivy::Result<()> {
///     let mut schema_builder = Schema::builder();
///
///     // Facet have their own specific type.
///     // It is not a bad practise to put all of your
///     // facet information in the same field.
///     let facet = schema_builder.add_facet_field("facet", FacetOptions::default());
///     let title = schema_builder.add_text_field("title", TEXT);
///     let schema = schema_builder.build();
///     let index = Index::create_in_ram(schema);
///     {
///         let mut index_writer = index.writer(15_000_000)?;
///         // a document can be associated with any number of facets
///         index_writer.add_document(doc!(
///             title => "The Name of the Wind",
///             facet => Facet::from("/lang/en"),
///             facet => Facet::from("/category/fiction/fantasy")
///         ))?;
///         index_writer.add_document(doc!(
///             title => "Dune",
///             facet => Facet::from("/lang/en"),
///             facet => Facet::from("/category/fiction/sci-fi")
///         ))?;
///         index_writer.add_document(doc!(
///             title => "La Vénus d'Ille",
///             facet => Facet::from("/lang/fr"),
///             facet => Facet::from("/category/fiction/fantasy"),
///             facet => Facet::from("/category/fiction/horror")
///         ))?;
///         index_writer.add_document(doc!(
///             title => "The Diary of a Young Girl",
///             facet => Facet::from("/lang/en"),
///             facet => Facet::from("/category/biography")
///         ))?;
///         index_writer.commit()?;
///     }
///     let reader = index.reader()?;
///     let searcher = reader.searcher();
///
///     {
///         let mut facet_collector = FacetCollector::for_field("facet");
///         facet_collector.add_facet("/lang");
///         facet_collector.add_facet("/category");
///         let facet_counts = searcher.search(&AllQuery, &facet_collector)?;
///
///         // This lists all of the facet counts
///         let facets: Vec<(&Facet, u64)> = facet_counts
///             .get("/category")
///             .collect();
///         assert_eq!(facets, vec![
///             (&Facet::from("/category/biography"), 1),
///             (&Facet::from("/category/fiction"), 3)
///         ]);
///     }
///
///     {
///         let mut facet_collector = FacetCollector::for_field("facet");
///         facet_collector.add_facet("/category/fiction");
///         let facet_counts = searcher.search(&AllQuery, &facet_collector)?;
///
///         // This lists all of the facet counts
///         let facets: Vec<(&Facet, u64)> = facet_counts
///             .get("/category/fiction")
///             .collect();
///         assert_eq!(facets, vec![
///             (&Facet::from("/category/fiction/fantasy"), 2),
///             (&Facet::from("/category/fiction/horror"), 1),
///             (&Facet::from("/category/fiction/sci-fi"), 1)
///         ]);
///     }
///
///     {
///         let mut facet_collector = FacetCollector::for_field("facet");
///         facet_collector.add_facet("/category/fiction");
///         let facet_counts = searcher.search(&AllQuery, &facet_collector)?;
///
///         // This lists all of the facet counts
///         let facets: Vec<(&Facet, u64)> = facet_counts.top_k("/category/fiction", 1);
///         assert_eq!(facets, vec![
///             (&Facet::from("/category/fiction/fantasy"), 2)
///         ]);
///     }
///
///     {
///         let mut facet_collector = FacetCollector::for_field("facet");
///         facet_collector.add_facet("/");
///         let facet_counts = searcher.search(&AllQuery, &facet_collector)?;
///
///         // This lists all of the facet counts
///         let facets: Vec<(&Facet, u64)> = facet_counts
///             .get("/")
///             .collect();
///         assert_eq!(facets, vec![
///             (&Facet::from("/category"), 4),
///             (&Facet::from("/lang"), 4)
///         ]);
///     }
///
///     Ok(())
/// }
/// # assert!(example().is_ok());
/// ```
pub struct FacetCollector {
    // Name of the field the facet reader is opened on for each segment.
    field_name: String,
    // Facets registered through `add_facet`; counts are recorded for their children.
    facets: BTreeSet<Facet>,
}

/// Per-segment state of a `FacetCollector`, built by `FacetCollector::for_segment`.
pub struct FacetSegmentCollector {
    // Facet reader of the segment for the collected field.
    reader: FacetReader,
    // collapse facet_id -> count
    // (one slot per entry of `unique_facet_ords`, initialized to zero)
    counts: Vec<u64>,
    // facet_ord -> compressed collapse facet_id
    compressed_collapse_mapping: Vec<usize>,
    // compressed collapse facet_id -> facet_ord
    unique_facet_ords: Vec<(u64, usize)>,
}

impl FacetCollector {
    /// Creates a facet collector reading the facets of the field named `field_name`.
    ///
    /// The collector starts without any registered facet. This function does not check
    /// whether the field is of the proper type.
    pub fn for_field(field_name: impl ToString) -> FacetCollector {
        let field_name = field_name.to_string();
        let facets = BTreeSet::new();
        FacetCollector { field_name, facets }
    }

    /// Registers a facet whose children should be counted.
    ///
    /// Adding facet `Facet::from("/country")` for instance,
    /// will record the counts of all of the direct children of the facet country
    /// (e.g. `/country/FR`, `/country/UK`).
    ///
    /// Adding two facets within which one is the prefix of the other is forbidden.
    /// If you need the correct number of unique documents for two such facets,
    /// just add them in a separate `FacetCollector`.
    ///
    /// # Panics
    /// Panics if the new facet is a prefix of an already added facet, or if an already
    /// added facet is a prefix of the new one.
    pub fn add_facet<T>(&mut self, facet_from: T)
    where Facet: From<T> {
        let new_facet = Facet::from(facet_from);
        self.facets.iter().for_each(|registered| {
            assert!(
                !registered.is_prefix_of(&new_facet),
                "Tried to add a facet which is a descendant of an already added facet."
            );
            assert!(
                !new_facet.is_prefix_of(registered),
                "Tried to add a facet which is an ancestor of an already added facet."
            );
        });
        self.facets.insert(new_facet);
    }
}

/// Compresses a `facet_ord -> collapse entry` mapping into dense ids.
///
/// Consecutive equal entries of `mapping` share one id; every change of entry starts
/// the next id (ids begin at `0`). Returns
/// - the id assigned to each position of `mapping`, and
/// - for each id, the entry it stands for.
///
/// Both vectors are empty when `mapping` is empty.
fn compress_mapping(mapping: &[(u64, usize)]) -> (Vec<usize>, Vec<(u64, usize)>) {
    let (first_entry, remaining) = match mapping.split_first() {
        Some((first, rest)) => (*first, rest),
        None => return (Vec::new(), Vec::new()),
    };
    // facet_ord -> collapse facet_id
    let mut compressed_ids: Vec<usize> = Vec::with_capacity(mapping.len());
    // collapse facet_id -> facet_ord
    let mut distinct_entries: Vec<(u64, usize)> = vec![first_entry];
    compressed_ids.push(0);
    let mut previous_entry = first_entry;
    for &entry in remaining {
        if entry != previous_entry {
            distinct_entries.push(entry);
            previous_entry = entry;
        }
        // The id of the current run is the index of the last distinct entry.
        compressed_ids.push(distinct_entries.len() - 1);
    }
    (compressed_ids, distinct_entries)
}

impl Collector for FacetCollector {
    type Fruit = FacetCounts;

    type Child = FacetSegmentCollector;

    /// Opens the segment's facet reader for the configured field and precomputes the
    /// collapse mappings for the registered facets. All counts start at zero.
    fn for_segment(
        &self,
        _: SegmentOrdinal,
        reader: &SegmentReader,
    ) -> crate::Result<FacetSegmentCollector> {
        let facet_reader = reader.facet_reader(&self.field_name)?;
        let collapse_mapping = compute_collapse_mapping(facet_reader.facet_dict(), &self.facets)?;
        let (compressed_collapse_mapping, unique_facet_ords) = compress_mapping(&collapse_mapping);
        Ok(FacetSegmentCollector {
            counts: vec![0u64; unique_facet_ords.len()],
            reader: facet_reader,
            compressed_collapse_mapping,
            unique_facet_ords,
        })
    }

    /// Facet counting does not use scores.
    fn requires_scoring(&self) -> bool {
        false
    }

    /// Sums the counts of each facet over all segments.
    fn merge_fruits(&self, segments_facet_counts: Vec<FacetCounts>) -> crate::Result<FacetCounts> {
        let mut facet_counts: BTreeMap<Facet, u64> = BTreeMap::new();
        let per_segment_entries = segments_facet_counts
            .into_iter()
            .flat_map(|segment| segment.facet_counts);
        for (facet, count) in per_segment_entries {
            *facet_counts.entry(facet).or_default() += count;
        }
        Ok(FacetCounts { facet_counts })
    }
}

/// Returns `true` if `possible_child_facet` lies below `parent_facet`.
///
/// Both arguments are encoded facets, in which path segments are separated by a `0` byte.
/// - An empty parent accepts every facet.
/// - Otherwise the candidate must start with the parent, immediately followed by
///   the `0` separator. A facet is therefore not considered a child of itself, and
///   `foobar` is not a child of `foo`.
fn is_child_facet(parent_facet: &[u8], possible_child_facet: &[u8]) -> bool {
    match possible_child_facet.strip_prefix(parent_facet) {
        None => false,
        Some(_) if parent_facet.is_empty() => true,
        Some(remainder) => remainder.first() == Some(&0u8),
    }
}

/// Fills `collapsed` for all the terms of `facet_terms` that are descendants of the
/// facet encoded as `facet_bytes`.
///
/// Every descendant term is mapped to `(term_ord, depth)` where `term_ord` is the
/// ordinal of the first term encountered under the same direct child of the facet,
/// and `depth` is `facet_depth(facet_bytes)`.
///
/// The streamer's current key is read before the streamer is advanced, so
/// `facet_terms` is expected to already be positioned on a term when this function
/// is called. Terms lower than or equal to `facet_bytes` are skipped.
///
/// Returns
/// - `Ok(true)` if the function stopped on a term that is greater than `facet_bytes`
///   but not one of its descendants (the streamer is left on that term),
/// - `Ok(false)` if the streamer was exhausted.
///
/// No code path in this function currently produces an `Err`.
fn compute_collapse_mapping_one(
    facet_terms: &mut columnar::Streamer,
    facet_bytes: &[u8],
    collapsed: &mut [(u64, usize)],
) -> io::Result<bool> {
    // Name of the direct child currently being collapsed (without the parent prefix).
    let mut facet_child: Vec<u8> = Vec::new();
    // Ordinal of the first term seen under `facet_child`.
    let mut term_ord = 0;
    // A non-empty parent is followed by a `0` separator byte that has to be skipped to
    // reach the child name. The empty (root) parent has no such separator: skipping a
    // byte there would drop the first byte of every key and could merge siblings that
    // only differ by that byte (e.g. `ab\0x` and `bb\0x`).
    let offset = if facet_bytes.is_empty() {
        0
    } else {
        facet_bytes.len() + 1
    };
    let depth = facet_depth(facet_bytes);
    loop {
        match facet_terms.key().cmp(facet_bytes) {
            // Not yet past the requested facet: nothing to record.
            Ordering::Less | Ordering::Equal => {}
            Ordering::Greater => {
                if !is_child_facet(facet_bytes, facet_terms.key()) {
                    // We left the subtree of `facet_bytes`; the caller may carry on
                    // with the next facet from the current position.
                    return Ok(true);
                }
                let suffix = &facet_terms.key()[offset..];
                if facet_child.is_empty() || !is_child_facet(&facet_child, suffix) {
                    // We entered a new direct child: remember its name and the
                    // ordinal of its first term.
                    facet_child.clear();
                    term_ord = facet_terms.term_ord();
                    let end = suffix
                        .iter()
                        .position(|b| *b == 0u8)
                        .unwrap_or(suffix.len());
                    facet_child.extend(&suffix[..end]);
                }
                collapsed[facet_terms.term_ord() as usize] = (term_ord, depth);
            }
        }
        if !facet_terms.advance() {
            return Ok(false);
        }
    }
}

/// Computes, for every term ordinal of `facet_dict`, the `(term ordinal, depth)` pair it
/// collapses to given the requested `facets`.
///
/// Terms that are not below any of the requested facets keep the initial value
/// `(u64::MAX, 0)`. The dictionary is streamed once; the requested facets are visited
/// in the order of the `BTreeSet`.
fn compute_collapse_mapping(
    facet_dict: &columnar::Dictionary,
    facets: &BTreeSet<Facet>,
) -> io::Result<Vec<(u64, usize)>> {
    let mut collapsed = vec![(u64::MAX, 0); facet_dict.num_terms()];
    if facets.is_empty() {
        return Ok(collapsed);
    }
    let mut facet_terms: columnar::Streamer = facet_dict.range().into_stream()?;
    // The per-facet routine reads the current key first, so the streamer has to be
    // positioned on the first term before entering the loop.
    if facet_terms.advance() {
        for facet in facets {
            let stream_has_more = compute_collapse_mapping_one(
                &mut facet_terms,
                facet.encoded_str().as_bytes(),
                &mut collapsed[..],
            )?;
            if !stream_has_more {
                // The dictionary is exhausted: the remaining facets cannot match.
                break;
            }
        }
    }
    Ok(collapsed)
}

impl SegmentCollector for FacetSegmentCollector {
    type Fruit = FacetCounts;

    /// Increments the counter of each collapsed facet of `doc`.
    ///
    /// Consecutive facet ordinals of the document that collapse to the same entry
    /// are only counted once.
    fn collect(&mut self, doc: DocId, _: Score) {
        let mut last_bucket: usize = usize::MAX;
        for facet_ord in self.reader.facet_ords(doc) {
            let bucket = self.compressed_collapse_mapping[facet_ord as usize];
            let counter = &mut self.counts[bucket];
            if bucket != last_bucket {
                *counter += 1;
            }
            last_bucket = bucket;
        }
    }

    /// Returns the results of the collection.
    ///
    /// Besides returning the counters, this resolves every collapsed ordinal back
    /// into a [`Facet`] through the facet dictionary of the segment, truncated at
    /// the depth recorded for that entry. Entries with a zero count are omitted.
    fn harvest(self) -> FacetCounts {
        let facet_dict = self.reader.facet_dict();
        let mut facet_counts = BTreeMap::new();
        for (collapsed_facet_ord, &count) in self.counts.iter().enumerate() {
            if count == 0 {
                continue;
            }
            let (facet_ord, facet_depth) = self.unique_facet_ords[collapsed_facet_ord];
            let mut encoded_facet = vec![];
            // TODO handle errors.
            if facet_dict.ord_to_term(facet_ord, &mut encoded_facet).is_err() {
                continue;
            }
            // Position of the separator that ends the collapsed facet, if any.
            let end_collapsed_facet = encoded_facet
                .iter()
                .enumerate()
                .filter_map(|(pos, &byte)| (byte == 0u8).then_some(pos))
                .nth(facet_depth);
            if let Some(end) = end_collapsed_facet {
                encoded_facet.truncate(end);
            }
            if let Ok(facet) = Facet::from_encoded(encoded_facet) {
                facet_counts.insert(facet, count);
            }
        }
        FacetCounts { facet_counts }
    }
}

/// Intermediary result of the `FacetCollector` that stores
/// the facet counts for all the segments.
///
/// It is produced per segment by the segment collector's `harvest` and
/// summed across segments by `merge_fruits`.
#[derive(Default, Clone)]
pub struct FacetCounts {
    // Count associated with each facet, ordered by facet.
    facet_counts: BTreeMap<Facet, u64>,
}

/// Iterator over `(facet, count)` pairs, as returned by [`FacetCounts::get`].
pub struct FacetChildIterator<'a> {
    // Range over the underlying `BTreeMap` of a `FacetCounts`.
    underlying: btree_map::Range<'a, Facet, u64>,
}

impl<'a> Iterator for FacetChildIterator<'a> {
    type Item = (&'a Facet, u64);

    /// Yields the next facet of the range along with a copy of its count.
    fn next(&mut self) -> Option<Self::Item> {
        let (facet, count) = self.underlying.next()?;
        Some((facet, *count))
    }
}

impl FacetCounts {
    /// Returns an iterator over all of the facet count pairs inside this result.
    ///
    /// The iteration covers the entries whose facet is strictly greater than the given
    /// facet and, unless the given facet is the root, strictly lower than its encoded
    /// string followed by `\u{1}`.
    ///
    /// See the documentation for [`FacetCollector`] for a usage example.
    pub fn get<T>(&self, facet_from: T) -> FacetChildIterator<'_>
    where Facet: From<T> {
        let facet = Facet::from(facet_from);
        let upper_bound = if facet.is_root() {
            Bound::Unbounded
        } else {
            let mut facet_after_bytes = String::from(facet.encoded_str());
            facet_after_bytes.push('\u{1}');
            Bound::Excluded(Facet::from_encoded_string(facet_after_bytes))
        };
        let lower_bound = Bound::Excluded(facet);
        FacetChildIterator {
            underlying: self.facet_counts.range((lower_bound, upper_bound)),
        }
    }

    /// Returns a vector of top `k` facets with their counts, sorted highest-to-lowest by counts.
    /// See the documentation for [`FacetCollector`] for a usage example.
    pub fn top_k<T>(&self, facet: T, k: usize) -> Vec<(&Facet, u64)>
    where Facet: From<T> {
        let mut children = self.get(facet);
        let mut heap = BinaryHeap::with_capacity(k);

        // Fill the heap up to its capacity with the first `k` entries.
        for (facet, count) in children.by_ref().take(k) {
            heap.push(Hit { count, facet });
        }

        // When the heap is empty the fallback value is harmless: no entry can be
        // swapped into an empty heap below.
        let mut lowest_count: u64 = heap.peek().map_or(u64::MIN, |hit| hit.count);

        for (facet, count) in children {
            if count <= lowest_count {
                continue;
            }
            if let Some(mut head) = heap.peek_mut() {
                *head = Hit { count, facet };
            }
            // The heap has been reordered once the `peek_mut` guard is dropped, so
            // the head may have changed.
            if let Some(head) = heap.peek() {
                lowest_count = head.count;
            }
        }

        let sorted_hits = heap.into_sorted_vec();
        sorted_hits
            .into_iter()
            .map(|hit| (hit.facet, hit.count))
            .collect()
    }
}

#[cfg(test)]
mod tests {
    use std::collections::BTreeSet;

    use columnar::Dictionary;
    use rand::distr::Uniform;
    use rand::prelude::SliceRandom;
    use rand::{rng, Rng};

    use super::{FacetCollector, FacetCounts};
    use crate::collector::facet_collector::compress_mapping;
    use crate::collector::Count;
    use crate::index::Index;
    use crate::query::{AllQuery, QueryParser, TermQuery};
    use crate::schema::{Facet, FacetOptions, IndexRecordOption, Schema, TantivyDocument};
    use crate::{IndexWriter, Term};

    // Builds a dictionary out of `facet_terms` (sorted), computes the collapse mapping
    // for the requested `facet_params` and compares it with the expected mapping.
    fn test_collapse_mapping_aux(
        facet_terms: &[&str],
        facet_params: &[&str],
        expected_collapsed_mapping: &[(u64, usize)],
    ) {
        let mut facets: Vec<Facet> = facet_terms.iter().map(Facet::from).collect();
        facets.sort();
        let facet_terms: Vec<&str> = facets.iter().map(|facet| facet.encoded_str()).collect();
        let dictionary = Dictionary::build_for_tests(&facet_terms);
        let facet_params: BTreeSet<Facet> = facet_params.iter().map(Facet::from).collect();
        let collapse_mapping = super::compute_collapse_mapping(&dictionary, &facet_params).unwrap();
        assert_eq!(&collapse_mapping[..], expected_collapsed_mapping);
    }

    // Terms sharing the same direct child of the requested facet must collapse to
    // the ordinal of the first term of that child.
    #[test]
    fn test_collapse_simple() {
        test_collapse_mapping_aux(&["/facet/a", "/facet/b"], &["/facet"], &[(0, 1), (1, 1)]);
        test_collapse_mapping_aux(
            &["/facet/a", "/facet/a2", "/facet/b"],
            &["/facet"],
            &[(0, 1), (1, 1), (2, 1)],
        );
        test_collapse_mapping_aux(&["/facet/a", "/facet/a/2"], &["/facet"], &[(0, 1), (0, 1)]);
        test_collapse_mapping_aux(
            &["/facet/a", "/facet/a/2", "/facet/b"],
            &["/facet"],
            &[(0, 1), (0, 1), (2, 1)],
        );
    }

    // Runs `compress_mapping` and checks both of its outputs.
    fn test_compress_mapping_aux(
        collapsed_mapping: &[(u64, usize)],
        expected_compressed_collapsed_mapping: &[usize],
        expected_unique_facet_ords: &[(u64, usize)],
    ) {
        let (compressed_collapsed_mapping, unique_facet_ords) = compress_mapping(collapsed_mapping);
        assert_eq!(
            compressed_collapsed_mapping,
            expected_compressed_collapsed_mapping
        );
        assert_eq!(unique_facet_ords, expected_unique_facet_ords);
    }

    // Covers the empty mapping, a single entry, consecutive duplicates and a mix.
    #[test]
    fn test_compress_mapping() {
        test_compress_mapping_aux(&[], &[], &[]);
        test_compress_mapping_aux(&[(1, 2)], &[0], &[(1, 2)]);
        test_compress_mapping_aux(&[(1, 2), (1, 2)], &[0, 0], &[(1, 2)]);
        test_compress_mapping_aux(
            &[(1, 2), (5, 2), (5, 2), (6, 3), (8, 3)],
            &[0, 1, 1, 2, 3],
            &[(1, 2), (5, 2), (6, 3), (8, 3)],
        );
    }

    // `/facet/b` appears in two documents and must be the single top facet.
    #[test]
    fn test_facet_collector_simple() {
        let mut schema_builder = Schema::builder();
        let facet_field = schema_builder.add_facet_field("facet", FacetOptions::default());
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        index_writer
            .add_document(doc!(facet_field=>Facet::from("/facet/a")))
            .unwrap();
        index_writer
            .add_document(doc!(facet_field=>Facet::from("/facet/b")))
            .unwrap();
        index_writer
            .add_document(doc!(facet_field=>Facet::from("/facet/b")))
            .unwrap();
        index_writer
            .add_document(doc!(facet_field=>Facet::from("/facet/c")))
            .unwrap();
        index_writer.commit().unwrap();
        let searcher = index.reader().unwrap().searcher();
        let mut facet_collector = FacetCollector::for_field("facet");
        facet_collector.add_facet("/facet");
        let counts: FacetCounts = searcher.search(&AllQuery, &facet_collector).unwrap();
        let facets: Vec<(&Facet, u64)> = counts.top_k("/facet", 1);
        assert_eq!(facets, vec![(&Facet::from("/facet/b"), 2)]);
    }

    // Indexes 600 documents spread evenly over 3 * 4 * 5 three-level facets and checks
    // that counting below `/top1` collapses the leaves into the four `mid` children.
    #[test]
    fn test_facet_collector_drilldown() {
        let mut schema_builder = Schema::builder();
        let facet_field = schema_builder.add_facet_field("facet", FacetOptions::default());
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);

        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        let num_facets: usize = 3 * 4 * 5;
        let facets: Vec<Facet> = (0..num_facets)
            .map(|mut n| {
                let top = n % 3;
                n /= 3;
                let mid = n % 4;
                n /= 4;
                let leaf = n % 5;
                Facet::from(&format!("/top{top}/mid{mid}/leaf{leaf}"))
            })
            .collect();
        for i in 0..num_facets * 10 {
            let mut doc = TantivyDocument::new();
            doc.add_facet(facet_field, facets[i % num_facets].clone());
            index_writer.add_document(doc).unwrap();
        }
        index_writer.commit().unwrap();
        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let mut facet_collector = FacetCollector::for_field("facet");
        facet_collector.add_facet(Facet::from("/top1"));
        let counts = searcher.search(&AllQuery, &facet_collector).unwrap();

        {
            let facets: Vec<(String, u64)> = counts
                .get("/top1")
                .map(|(facet, count)| (facet.to_string(), count))
                .collect();
            assert_eq!(
                facets,
                [
                    ("/top1/mid0", 50),
                    ("/top1/mid1", 50),
                    ("/top1/mid2", 50),
                    ("/top1/mid3", 50),
                ]
                .iter()
                .map(|&(facet_str, count)| (String::from(facet_str), count))
                .collect::<Vec<_>>()
            );
        }
    }

    // Registering a facet below an already registered facet must panic.
    #[test]
    #[should_panic(
        expected = "Tried to add a facet which is a descendant of an already added facet."
    )]
    fn test_misused_facet_collector() {
        let mut facet_collector = FacetCollector::for_field("facet");
        facet_collector.add_facet(Facet::from("/country"));
        facet_collector.add_facet(Facet::from("/country/europe"));
    }

    // A single document carrying several facets, added in a non-sorted order.
    #[test]
    fn test_doc_unsorted_multifacet() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let facet_field = schema_builder.add_facet_field("facets", FacetOptions::default());
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut index_writer = index.writer_for_tests()?;
        index_writer.add_document(doc!(
            facet_field => Facet::from_text(&"/subjects/A/a").unwrap(),
            facet_field => Facet::from_text(&"/subjects/B/a").unwrap(),
            facet_field => Facet::from_text(&"/subjects/A/b").unwrap(),
            facet_field => Facet::from_text(&"/subjects/B/b").unwrap(),
        ))?;
        index_writer.commit()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();
        assert_eq!(searcher.num_docs(), 1);
        let mut facet_collector = FacetCollector::for_field("facets");
        facet_collector.add_facet("/subjects");
        let counts = searcher.search(&AllQuery, &facet_collector)?;
        let facets: Vec<(&Facet, u64)> = counts.get("/subjects").collect();
        assert_eq!(facets[0].1, 1);
        Ok(())
    }

    // Searching by facet term, both through `TermQuery` and through the query parser.
    #[test]
    fn test_doc_search_by_facet() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let facet_field = schema_builder.add_facet_field("facet", FacetOptions::default());
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut index_writer = index.writer_for_tests()?;
        index_writer.add_document(doc!(
            facet_field => Facet::from_text(&"/A/A").unwrap(),
        ))?;
        index_writer.add_document(doc!(
            facet_field => Facet::from_text(&"/A/B").unwrap(),
        ))?;
        index_writer.add_document(doc!(
            facet_field => Facet::from_text(&"/A/C/A").unwrap(),
        ))?;
        index_writer.add_document(doc!(
            facet_field => Facet::from_text(&"/D/C/A").unwrap(),
        ))?;
        index_writer.commit()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();
        assert_eq!(searcher.num_docs(), 4);

        // Number of documents matching the given facet term.
        let count_facet = |facet_str: &str| {
            let term = Term::from_facet(facet_field, &Facet::from_text(facet_str).unwrap());
            searcher
                .search(&TermQuery::new(term, IndexRecordOption::Basic), &Count)
                .unwrap()
        };

        assert_eq!(count_facet("/"), 4);
        assert_eq!(count_facet("/A"), 3);
        assert_eq!(count_facet("/A/B"), 1);
        assert_eq!(count_facet("/A/C"), 1);
        assert_eq!(count_facet("/A/C/A"), 1);
        assert_eq!(count_facet("/C/A"), 0);

        let query_parser = QueryParser::for_index(&index, vec![]);
        {
            let query = query_parser.parse_query("facet:/A/B")?;
            assert_eq!(1, searcher.search(&query, &Count).unwrap());
        }
        {
            let query = query_parser.parse_query("facet:/A")?;
            assert_eq!(3, searcher.search(&query, &Count)?);
        }
        Ok(())
    }

    // `/countryeurope` shares a string prefix with `/country` but is not one of its
    // descendants, so registering both must not panic.
    #[test]
    fn test_non_used_facet_collector() {
        let mut facet_collector = FacetCollector::for_field("facet");
        facet_collector.add_facet(Facet::from("/country"));
        facet_collector.add_facet(Facet::from("/countryeurope"));
    }

    // Every document carries one of the facets `a`..`e` plus a random numeric facet;
    // the top 3 must be the three most frequent lettered facets.
    #[test]
    fn test_facet_collector_topk() {
        let mut schema_builder = Schema::builder();
        let facet_field = schema_builder.add_facet_field("facet", FacetOptions::default());
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);

        let uniform = Uniform::new_inclusive(1, 100_000).unwrap();
        let mut docs: Vec<TantivyDocument> =
            vec![("a", 10), ("b", 100), ("c", 7), ("d", 12), ("e", 21)]
                .into_iter()
                .flat_map(|(c, count)| {
                    let facet = Facet::from(&format!("/facet/{c}"));
                    let doc = doc!(facet_field => facet);
                    std::iter::repeat_n(doc, count)
                })
                .map(|mut doc| {
                    doc.add_facet(facet_field, &format!("/facet/{}", rng().sample(uniform)));
                    doc
                })
                .collect();
        docs[..].shuffle(&mut rng());

        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        for doc in docs {
            index_writer.add_document(doc).unwrap();
        }
        index_writer.commit().unwrap();
        let searcher = index.reader().unwrap().searcher();

        let mut facet_collector = FacetCollector::for_field("facet");
        facet_collector.add_facet("/facet");
        let counts: FacetCounts = searcher.search(&AllQuery, &facet_collector).unwrap();

        {
            let facets: Vec<(&Facet, u64)> = counts.top_k("/facet", 3);
            assert_eq!(
                facets,
                vec![
                    (&Facet::from("/facet/b"), 100),
                    (&Facet::from("/facet/e"), 21),
                    (&Facet::from("/facet/d"), 12),
                ]
            );
        }
    }

    // `a` and `b` have the same count: `top_k` is expected to keep `a`.
    #[test]
    fn test_facet_collector_topk_tie_break() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let facet_field = schema_builder.add_facet_field("facet", FacetOptions::default());
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);

        let docs: Vec<TantivyDocument> = vec![("b", 2), ("a", 2), ("c", 4)]
            .into_iter()
            .flat_map(|(c, count)| {
                let facet = Facet::from(&format!("/facet/{c}"));
                let doc = doc!(facet_field => facet);
                std::iter::repeat_n(doc, count)
            })
            .collect();

        let mut index_writer = index.writer_for_tests()?;
        for doc in docs {
            index_writer.add_document(doc)?;
        }
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();
        let mut facet_collector = FacetCollector::for_field("facet");
        facet_collector.add_facet("/facet");
        let counts: FacetCounts = searcher.search(&AllQuery, &facet_collector)?;

        let facets: Vec<(&Facet, u64)> = counts.top_k("/facet", 2);
        assert_eq!(
            facets,
            vec![(&Facet::from("/facet/c"), 4), (&Facet::from("/facet/a"), 2)]
        );
        Ok(())
    }

    // Checks the parent/child relation on encoded facets, including the empty parent
    // and a parent that is only a string prefix of the candidate.
    #[test]
    fn is_child_facet() {
        assert!(super::is_child_facet(&b"foo"[..], &b"foo\0bar"[..]));
        assert!(super::is_child_facet(&b""[..], &b"foo\0bar"[..]));
        assert!(super::is_child_facet(&b""[..], &b"foo"[..]));
        assert!(!super::is_child_facet(&b"foo\0bar"[..], &b"foo"[..]));
        assert!(!super::is_child_facet(&b"foo"[..], &b"foobar\0baz"[..]));
    }
}

#[cfg(all(test, feature = "unstable"))]
mod bench {

    use rand::rng;
    use rand::seq::SliceRandom;
    use test::Bencher;

    use crate::collector::FacetCollector;
    use crate::query::AllQuery;
    use crate::schema::{Facet, Schema, INDEXED};
    use crate::{Index, IndexWriter};

    // Benchmarks a `FacetCollector` search over all the documents of an index in which
    // the facet `/facet_{val}` is carried by `val * val` documents.
    //
    // Note that no facet is registered on the collector through `add_facet`.
    #[bench]
    fn bench_facet_collector(b: &mut Bencher) {
        let mut schema_builder = Schema::builder();
        let facet_field = schema_builder.add_facet_field("facet", INDEXED);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);

        let mut docs = vec![];
        for val in 0..50 {
            let facet = Facet::from(&format!("/facet_{val}"));
            for _ in 0..val * val {
                docs.push(doc!(facet_field=>facet.clone()));
            }
        }
        // 40425 docs
        docs[..].shuffle(&mut rng());

        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        for doc in docs {
            index_writer.add_document(doc).unwrap();
        }
        index_writer.commit().unwrap();
        let reader = index.reader().unwrap();
        // Only the search itself is measured; the index is built once beforehand.
        b.iter(|| {
            let searcher = reader.searcher();
            let facet_collector = FacetCollector::for_field("facet");
            searcher.search(&AllQuery, &facet_collector).unwrap();
        });
    }
}


================================================
FILE: src/collector/filter_collector_wrapper.rs
================================================
// # Custom collector example
//
// This example shows how you can implement your own
// collector. As an example, we will compute a collector
// that computes the standard deviation of a given fast field.
//
// Of course, you can have a look at tantivy's built-in collectors
// such as the `CountCollector` for more examples.
use std::fmt::Debug;
use std::marker::PhantomData;

use columnar::{BytesColumn, Column, DynamicColumn, HasAssociatedColumnType};

use crate::collector::{Collector, SegmentCollector};
use crate::schema::Schema;
use crate::{DocId, Score, SegmentReader};

/// The `FilterCollector` filters docs using a fast field value and a predicate.
///
/// Only the documents containing at least one value for which the predicate returns `true`
/// will be passed on to the next collector.
///
/// In other words,
/// - documents with no values are filtered out.
/// - documents with several values are accepted if at least one value matches the predicate.
///
///
/// ```rust
/// use tantivy::collector::{TopDocs, FilterCollector};
/// use tantivy::query::QueryParser;
/// use tantivy::schema::{Schema, TEXT, FAST};
/// use tantivy::{doc, DocAddress, Index};
///
/// # fn main() -> tantivy::Result<()> {
/// let mut schema_builder = Schema::builder();
/// let title = schema_builder.add_text_field("title", TEXT);
/// let price = schema_builder.add_u64_field("price", FAST);
/// let schema = schema_builder.build();
/// let index = Index::create_in_ram(schema);
///
/// let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
/// index_writer.add_document(doc!(title => "The Name of the Wind", price => 30_200u64))?;
/// index_writer.add_document(doc!(title => "The Diary of Muadib", price => 29_240u64))?;
/// index_writer.add_document(doc!(title => "A Dairy Cow", price => 21_240u64))?;
/// index_writer.add_document(doc!(title => "The Diary of a Young Girl", price => 20_120u64))?;
/// index_writer.commit()?;
///
/// let reader = index.reader()?;
/// let searcher = reader.searcher();
///
/// let query_parser = QueryParser::for_index(&index, vec![title]);
/// let query = query_parser.parse_query("diary")?;
/// let no_filter_collector = FilterCollector::new("price".to_string(), |value: u64| value > 20_120u64, TopDocs::with_limit(2).order_by_score());
/// let top_docs = searcher.search(&query, &no_filter_collector)?;
///
/// assert_eq!(top_docs.len(), 1);
/// assert_eq!(top_docs[0].1, DocAddress::new(0, 1));
///
/// let filter_all_collector: FilterCollector<_, _, u64> = FilterCollector::new("price".to_string(), |value| value < 5u64, TopDocs::with_limit(2).order_by_score());
/// let filtered_top_docs = searcher.search(&query, &filter_all_collector)?;
///
/// assert_eq!(filtered_top_docs.len(), 0);
/// # Ok(())
/// # }
/// ```
///
/// Note that this is limited to fast fields which implement the
/// [`FastValue`][crate::fastfield::FastValue] trait, e.g. `u64` but not `&[u8]`.
/// To filter based on a bytes fast field, use a [`BytesFilterCollector`] instead.
pub struct FilterCollector<TCollector, TPredicate, TPredicateValue>
where TPredicate: 'static + Clone
{
    // Name of the fast field the predicate is evaluated on.
    field: String,
    // Wrapped collector, which only receives the accepted documents.
    collector: TCollector,
    // Predicate applied to the fast field values; cloned for every segment.
    predicate: TPredicate,
    // Ties the value type of the predicate to the collector without storing a value.
    t_predicate_value: PhantomData<TPredicateValue>,
}

impl<TCollector, TPredicate, TPredicateValue>
    FilterCollector<TCollector, TPredicate, TPredicateValue>
where
    TCollector: Collector + Send + Sync,
    TPredicate: Fn(TPredicateValue) -> bool + Send + Sync + Clone,
{
    /// Create a new `FilterCollector`.
    pub fn new(field: String, predicate: TPredicate, collector: TCollector) -> Self {
        Self {
            field,
            predicate,
            collector,
            t_predicate_value: PhantomData,
        }
    }
}

impl<TCollector, TPredicate, TPredicateValue> Collector
    for FilterCollector<TCollector, TPredicate, TPredicateValue>
where
    TCollector: Collector + Send + Sync,
    TPredicate: 'static + Fn(TPredicateValue) -> bool + Send + Sync + Clone,
    TPredicateValue: HasAssociatedColumnType,
    DynamicColumn: Into<Option<columnar::Column<TPredicateValue>>>,
{
    type Fruit = TCollector::Fruit;

    type Child = FilterSegmentCollector<TCollector::Child, TPredicate, TPredicateValue>;

    /// Delegates the schema validation to the wrapped collector.
    fn check_schema(&self, schema: &Schema) -> crate::Result<()> {
        self.collector.check_schema(schema)
    }

    /// Opens the fast field column of the segment (if there is one) and wraps the
    /// segment collector of the inner collector.
    fn for_segment(
        &self,
        segment_local_id: u32,
        segment_reader: &SegmentReader,
    ) -> crate::Result<Self::Child> {
        // The fields are evaluated in order: the column is opened before the inner
        // segment collector is created.
        Ok(FilterSegmentCollector {
            column_opt: segment_reader.fast_fields().column_opt(&self.field)?,
            segment_collector: self
                .collector
                .for_segment(segment_local_id, segment_reader)?,
            predicate: self.predicate.clone(),
            t_predicate_value: PhantomData,
            filtered_docs: Vec::with_capacity(crate::COLLECT_BLOCK_BUFFER_LEN),
        })
    }

    /// Scoring is required if and only if the wrapped collector requires it.
    fn requires_scoring(&self) -> bool {
        self.collector.requires_scoring()
    }

    /// The fruits are those of the wrapped collector, which also merges them.
    fn merge_fruits(
        &self,
        segment_fruits: Vec<<TCollector::Child as SegmentCollector>::Fruit>,
    ) -> crate::Result<TCollector::Fruit> {
        self.collector.merge_fruits(segment_fruits)
    }
}

/// Segment-level counterpart of the [`FilterCollector`], created by its `for_segment`.
///
/// It forwards to the wrapped segment collector only the documents accepted by the predicate.
pub struct FilterSegmentCollector<TSegmentCollector, TPredicate, TPredicateValue> {
    // Fast field column of the segment. When `None`, no document is accepted.
    column_opt: Option<Column<TPredicateValue>>,
    // Wrapped segment collector receiving the accepted documents.
    segment_collector: TSegmentCollector,
    // Predicate evaluated on the values of the column.
    predicate: TPredicate,
    t_predicate_value: PhantomData<TPredicateValue>,
    // Scratch buffer reused by `collect_block` to hold the accepted doc ids.
    filtered_docs: Vec<DocId>,
}

impl<TSegmentCollector, TPredicate, TPredicateValue>
    FilterSegmentCollector<TSegmentCollector, TPredicate, TPredicateValue>
where
    TPredicateValue: PartialOrd + Copy + Debug + Send + Sync + 'static,
    TPredicate: 'static + Fn(TPredicateValue) -> bool + Send + Sync,
{
    /// Returns `true` if at least one value of the document satisfies the predicate.
    ///
    /// Documents are rejected when the segment has no column or when the document
    /// has no value.
    #[inline]
    fn accept_document(&self, doc_id: DocId) -> bool {
        self.column_opt.as_ref().is_some_and(|column| {
            column
                .values_for_doc(doc_id)
                .any(|value| (self.predicate)(value))
        })
    }
}

impl<TSegmentCollector, TPredicate, TPredicateValue> SegmentCollector
    for FilterSegmentCollector<TSegmentCollector, TPredicate, TPredicateValue>
where
    TSegmentCollector: SegmentCollector,
    TPredicateValue: HasAssociatedColumnType,
    TPredicate: 'static + Fn(TPredicateValue) -> bool + Send + Sync,
{
    type Fruit = TSegmentCollector::Fruit;

    /// Forwards the document to the wrapped collector if it passes the filter.
    fn collect(&mut self, doc: u32, score: Score) {
        if !self.accept_document(doc) {
            return;
        }
        self.segment_collector.collect(doc, score);
    }

    /// Filters the block and forwards the surviving documents, if any, as a single block.
    fn collect_block(&mut self, docs: &[DocId]) {
        self.filtered_docs.clear();
        for doc in docs.iter().copied() {
            // TODO: `accept_document` could be further optimized to do batch lookups of column
            // values for single-valued columns.
            if !self.accept_document(doc) {
                continue;
            }
            self.filtered_docs.push(doc);
        }
        if self.filtered_docs.is_empty() {
            return;
        }
        self.segment_collector.collect_block(&self.filtered_docs);
    }

    /// Returns the fruit of the wrapped segment collector.
    fn harvest(self) -> TSegmentCollector::Fruit {
        self.segment_collector.harvest()
    }
}

/// A variant of the [`FilterCollector`] specialized for bytes fast fields, i.e.
///
/// it transparently wraps an inner [`Collector`] but filters documents
/// based on the result of applying the predicate to the bytes fast field.
///
/// A document is accepted if and only if the predicate returns `true` for at least one value.
///
/// In other words,
/// - documents with no values are filtered out.
/// - documents with several values are accepted if at least one value matches the predicate.
///
/// ```rust
/// use tantivy::collector::{TopDocs, BytesFilterCollector};
/// use tantivy::query::QueryParser;
/// use tantivy::schema::{Schema, TEXT, FAST};
/// use tantivy::{doc, DocAddress, Index};
///
/// # fn main() -> tantivy::Result<()> {
/// let mut schema_builder = Schema::builder();
/// let title = schema_builder.add_text_field("title", TEXT);
/// let barcode = schema_builder.add_bytes_field("barcode", FAST);
/// let schema = schema_builder.build();
/// let index = Index::create_in_ram(schema);
///
/// let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
/// index_writer.add_document(doc!(title => "The Name of the Wind", barcode => &b"010101"[..]))?;
/// index_writer.add_document(doc!(title => "The Diary of Muadib", barcode => &b"110011"[..]))?;
/// index_writer.add_document(doc!(title => "A Dairy Cow", barcode => &b"110111"[..]))?;
/// index_writer.add_document(doc!(title => "The Diary of a Young Girl", barcode => &b"011101"[..]))?;
/// index_writer.add_document(doc!(title => "Bridget Jones's Diary"))?;
/// index_writer.commit()?;
///
/// let reader = index.reader()?;
/// let searcher = reader.searcher();
///
/// let query_parser = QueryParser::for_index(&index, vec![title]);
/// let query = query_parser.parse_query("diary")?;
/// let filter_collector = BytesFilterCollector::new("barcode".to_string(), |bytes: &[u8]| bytes.starts_with(b"01"), TopDocs::with_limit(2).order_by_score());
/// let top_docs = searcher.search(&query, &filter_collector)?;
///
/// assert_eq!(top_docs.len(), 1);
/// assert_eq!(top_docs[0].1, DocAddress::new(0, 3));
/// # Ok(())
/// # }
/// ```
pub struct BytesFilterCollector<TCollector, TPredicate>
where TPredicate: 'static + Clone
{
    /// Name of the bytes fast field whose values are handed to the predicate.
    field: String,
    /// Wrapped collector; it only receives the documents accepted by the predicate.
    collector: TCollector,
    /// Predicate applied to the field values. It is cloned once per segment.
    predicate: TPredicate,
}

impl<TCollector, TPredicate> BytesFilterCollector<TCollector, TPredicate>
where
    TCollector: Collector + Send + Sync,
    TPredicate: Fn(&[u8]) -> bool + Send + Sync + Clone,
{
    /// Create a new `BytesFilterCollector`.
    pub fn new(field: String, predicate: TPredicate, collector: TCollector) -> Self {
        Self {
            field,
            predicate,
            collector,
        }
    }
}

impl<TCollector, TPredicate> Collector for BytesFilterCollector<TCollector, TPredicate>
where
    TCollector: Collector + Send + Sync,
    TPredicate: 'static + Fn(&[u8]) -> bool + Send + Sync + Clone,
{
    type Fruit = TCollector::Fruit;

    type Child = BytesFilterSegmentCollector<TCollector::Child, TPredicate>;

    /// Schema validation is entirely delegated to the wrapped collector.
    fn check_schema(&self, schema: &Schema) -> crate::Result<()> {
        self.collector.check_schema(schema)
    }

    /// Opens the bytes column of the segment (if any), then creates the inner
    /// segment collector and wraps both into a filtering segment collector.
    fn for_segment(
        &self,
        segment_local_id: u32,
        segment_reader: &SegmentReader,
    ) -> crate::Result<Self::Child> {
        let bytes_column_opt = segment_reader.fast_fields().bytes(&self.field)?;
        let inner_segment_collector = self
            .collector
            .for_segment(segment_local_id, segment_reader)?;

        let filtering_segment_collector = BytesFilterSegmentCollector {
            column_opt: bytes_column_opt,
            segment_collector: inner_segment_collector,
            predicate: self.predicate.clone(),
            // Scratch buffers, reused across documents and blocks.
            buffer: Vec::new(),
            filtered_docs: Vec::with_capacity(crate::COLLECT_BLOCK_BUFFER_LEN),
        };
        Ok(filtering_segment_collector)
    }

    /// Scoring is required if and only if the wrapped collector requires it.
    fn requires_scoring(&self) -> bool {
        self.collector.requires_scoring()
    }

    /// Segment fruits are those of the wrapped collector, which is in charge of merging them.
    fn merge_fruits(
        &self,
        segment_fruits: Vec<<TCollector::Child as SegmentCollector>::Fruit>,
    ) -> crate::Result<TCollector::Fruit> {
        self.collector.merge_fruits(segment_fruits)
    }
}

/// Segment-level counterpart of `BytesFilterCollector`: forwards to the inner
/// segment collector only the documents accepted by the predicate.
pub struct BytesFilterSegmentCollector<TSegmentCollector, TPredicate>
where TPredicate: 'static
{
    /// Bytes column of the filtered field for this segment.
    /// When it is `None`, every document is rejected.
    column_opt: Option<BytesColumn>,
    /// Inner segment collector receiving the accepted documents.
    segment_collector: TSegmentCollector,
    /// Predicate applied to each value of a document.
    predicate: TPredicate,
    /// Scratch buffer holding the bytes of the value currently being tested.
    buffer: Vec<u8>,
    /// Scratch buffer holding the accepted documents of the block being collected.
    filtered_docs: Vec<DocId>,
}

impl<TSegmentCollector, TPredicate> BytesFilterSegmentCollector<TSegmentCollector, TPredicate>
where
    TSegmentCollector: SegmentCollector,
    TPredicate: 'static + Fn(&[u8]) -> bool + Send + Sync,
{
    /// Returns `true` iff at least one value of `doc_id` satisfies the predicate.
    ///
    /// Documents are rejected when the segment has no column for the field.
    /// A value whose bytes cannot be resolved (lookup error or unknown ordinal)
    /// is treated as not matching.
    #[inline]
    fn accept_document(&mut self, doc_id: DocId) -> bool {
        let column = match self.column_opt.as_ref() {
            Some(column) => column,
            None => return false,
        };
        for term_ord in column.term_ords(doc_id) {
            self.buffer.clear();
            let is_resolved = matches!(
                column.ord_to_bytes(term_ord, &mut self.buffer),
                Ok(true)
            );
            if is_resolved && (self.predicate)(&self.buffer) {
                return true;
            }
        }
        false
    }
}

impl<TSegmentCollector, TPredicate> SegmentCollector
    for BytesFilterSegmentCollector<TSegmentCollector, TPredicate>
where
    TSegmentCollector: SegmentCollector,
    TPredicate: 'static + Fn(&[u8]) -> bool + Send + Sync,
{
    type Fruit = TSegmentCollector::Fruit;

    /// Forwards `doc` to the inner segment collector if it passes the filter.
    fn collect(&mut self, doc: u32, score: Score) {
        if !self.accept_document(doc) {
            return;
        }
        self.segment_collector.collect(doc, score);
    }

    /// Filters `docs` and forwards the accepted ones, as a single block,
    /// to the inner segment collector. Nothing is forwarded if no document is accepted.
    fn collect_block(&mut self, docs: &[DocId]) {
        // Temporarily move the reusable buffer out of `self` so that it can be
        // filled while `accept_document` borrows `self` mutably.
        let mut accepted_docs = std::mem::take(&mut self.filtered_docs);
        accepted_docs.clear();
        // TODO: `accept_document` could be further optimized to do batch lookups of column
        // values for single-valued columns.
        accepted_docs.extend(
            docs.iter()
                .copied()
                .filter(|&doc| self.accept_document(doc)),
        );
        if !accepted_docs.is_empty() {
            self.segment_collector.collect_block(&accepted_docs);
        }
        self.filtered_docs = accepted_docs;
    }

    /// Returns the fruit of the inner segment collector.
    fn harvest(self) -> TSegmentCollector::Fruit {
        self.segment_collector.harvest()
    }
}


================================================
FILE: src/collector/histogram_collector.rs
================================================
use std::sync::Arc;

use columnar::ColumnValues;
use fastdivide::DividerU64;

use crate::collector::{Collector, SegmentCollector};
use crate::fastfield::{FastFieldNotAvailableError, FastValue};
use crate::schema::Type;
use crate::{DocId, Score};

/// Histogram builds a histogram of the values of a fastfield for the
/// collected DocSet.
///
/// At construction, it is given parameters that define a partition of an interval
/// [min_val, max_val) into N buckets with the same width.
/// The ith bucket is then defined by `[min_val + i * bucket_width, min_val + (i+1) * bucket_width)`
///
/// A histogram is then defined as a `Vec<u64>` of length `num_buckets`, that contains a count of
/// documents for each value bucket.
///
/// See also [`HistogramCollector::new()`].
///
/// # Warning
///
/// f64 fields are not supported.
#[derive(Clone)]
pub struct HistogramCollector {
    /// Inclusive lower bound of the first bucket, stored as the `u64` returned by
    /// `FastValue::to_u64()`.
    min_value: u64,
    /// Number of buckets of the histogram.
    num_buckets: usize,
    /// Divider built from the bucket width; maps `value - min_value` to a bucket index.
    divider: DividerU64,
    /// Name of the fast field the values are read from.
    field: String,
}

impl HistogramCollector {
    /// Builds a new HistogramCollector.
    ///
    /// The scale/range of the histogram is fixed at construction. It is
    /// defined by the following parameters:
    ///  - `min_value`: the minimum value that can be recorded in the histogram.
    ///  - `bucket_width`: the length of the interval associated with each bucket.
    ///  - `num_buckets`: the overall number of buckets.
    ///
    /// Together, these parameters define a partition of `[min_value, min_value + num_buckets *
    /// bucket_width)` into `num_buckets` intervals of width `bucket_width`, called buckets.
    ///
    /// # Panics
    ///
    /// Panics if `TFastValue` is not a u64, i64 or date type (f64 in particular is rejected).
    ///
    /// NOTE(review): `DividerU64::divide_by` presumably also panics when `bucket_width`
    /// is 0 -- confirm against the `fastdivide` crate.
    pub fn new<TFastValue: FastValue>(
        field: String,
        min_value: TFastValue,
        bucket_width: u64,
        num_buckets: usize,
    ) -> HistogramCollector {
        let fast_type = TFastValue::to_type();
        assert!(fast_type == Type::U64 || fast_type == Type::I64 || fast_type == Type::Date);
        // Values are bucketed in their `u64` representation.
        let min_value_u64 = min_value.to_u64();
        let divider = DividerU64::divide_by(bucket_width);
        HistogramCollector {
            min_value: min_value_u64,
            num_buckets,
            divider,
            field,
        }
    }
}

/// Accumulates the per-bucket counts of a fixed-width histogram.
struct HistogramComputer {
    /// Number of recorded values per bucket. Its length is the number of buckets.
    counts: Vec<u64>,
    /// Inclusive lower bound of the first bucket.
    min_value: u64,
    /// Divider by the bucket width, used to map a value offset to a bucket index.
    divider: DividerU64,
}

impl HistogramComputer {
    /// Records `value` into the bucket it belongs to.
    ///
    /// Values below `min_value`, or past the end of the last bucket, are ignored.
    #[inline]
    pub(crate) fn add_value(&mut self, value: u64) {
        if value < self.min_value {
            return;
        }
        let delta = value - self.min_value;
        // The range check is done on the `u64` bucket index. Casting to `usize`
        // first would truncate on targets where `usize` is narrower than 64 bits,
        // which could map a far out-of-range value onto a valid bucket.
        let bucket_id: u64 = self.divider.divide(delta);
        if bucket_id < self.counts.len() as u64 {
            // Lossless: `bucket_id` is smaller than a `usize` length.
            self.counts[bucket_id as usize] += 1;
        }
    }

    /// Consumes the computer and returns the per-bucket counts.
    fn harvest(self) -> Vec<u64> {
        self.counts
    }
}
/// Segment-level collector of `HistogramCollector`.
pub struct SegmentHistogramCollector {
    /// Accumulates the bucket counts for this segment.
    histogram_computer: HistogramComputer,
    /// Column giving, for each document, the `u64` value to record in the histogram.
    column_u64: Arc<dyn ColumnValues<u64>>,
}

impl SegmentCollector for SegmentHistogramCollector {
    type Fruit = Vec<u64>;

    fn collect(&mut self, doc: DocId, _score: Score) {
        let value = self.column_u64.get_val(doc);
        self.histogram_computer.add_value(value);
    }

    fn harvest(self) -> Self::Fruit {
        self.histogram_computer.harvest()
    }
}

impl Collector for HistogramCollector {
    type Fruit = Vec<u64>;
    type Child = SegmentHistogramCollector;

    /// Opens the `u64` column of the configured field for this segment.
    ///
    /// Returns a `FastFieldNotAvailableError` if the segment has no such column.
    fn for_segment(
        &self,
        _segment_local_id: crate::SegmentOrdinal,
        segment: &crate::SegmentReader,
    ) -> crate::Result<Self::Child> {
        let column = match segment.fast_fields().u64_lenient(&self.field)? {
            Some((column, _column_type)) => column,
            None => {
                let missing_field_error = FastFieldNotAvailableError {
                    field_name: self.field.clone(),
                };
                return Err(missing_field_error.into());
            }
        };
        // NOTE(review): `0u64` is presumably the value read for documents
        // without any value in the column -- confirm against `columnar`.
        let column_u64 = column.first_or_default_col(0u64);
        let histogram_computer = HistogramComputer {
            counts: vec![0; self.num_buckets],
            min_value: self.min_value,
            divider: self.divider,
        };
        Ok(SegmentHistogramCollector {
            histogram_computer,
            column_u64,
        })
    }

    /// Histograms only depend on fast field values: scores are never needed.
    fn requires_scoring(&self) -> bool {
        false
    }

    /// Sums the per-segment histograms bucket by bucket.
    fn merge_fruits(&self, child_histograms: Vec<Vec<u64>>) -> crate::Result<Vec<u64>> {
        let merged_histogram = add_vecs(child_histograms, self.num_buckets);
        Ok(merged_histogram)
    }
}

/// Adds each element of `add` to the element of `acc` at the same position.
///
/// # Panics
///
/// Panics if the two slices do not have the same length.
pub fn add_arrays_into(acc: &mut [u64], add: &[u64]) {
    assert_eq!(acc.len(), add.len());
    acc.iter_mut()
        .zip(add.iter())
        .for_each(|(total, &increment)| *total += increment);
}

/// Sums the given vectors element-wise into a single vector of length `len`.
///
/// An empty list yields a vector of `len` zeros.
///
/// # Panics
///
/// Panics if any of the vectors does not have exactly `len` elements.
fn add_vecs(mut vals_list: Vec<Vec<u64>>, len: usize) -> Vec<u64> {
    // The last vector is reused as the accumulator to avoid an allocation.
    let mut total = match vals_list.pop() {
        Some(last_vals) => last_vals,
        None => vec![0u64; len],
    };
    assert_eq!(total.len(), len);
    vals_list
        .iter()
        .for_each(|vals| add_arrays_into(&mut total, vals));
    total
}

// Unit tests for the histogram helpers and for `HistogramCollector` end-to-end searches.
#[cfg(test)]
mod tests {
    use fastdivide::DividerU64;
    use query::AllQuery;

    use super::{add_vecs, HistogramCollector, HistogramComputer};
    use crate::schema::{Schema, FAST};
    use crate::time::{Date, Month};
    use crate::{query, DateTime, Index};

    // Histograms are summed bucket by bucket.
    #[test]
    fn test_add_histograms_simple() {
        assert_eq!(
            add_vecs(vec![vec![1, 0, 3], vec![11, 2, 3], vec![0, 0, 1]], 3),
            vec![12, 2, 7]
        )
    }

    // Without any histogram to sum, the result is a zeroed histogram of the requested length.
    #[test]
    fn test_add_histograms_empty() {
        assert_eq!(add_vecs(vec![], 3), vec![0, 0, 0])
    }

    #[test]
    fn test_histogram_builder_simple() {
        // [1..3)
        // [3..5)
        // ..
        // [9..11)
        let mut histogram_computer = HistogramComputer {
            counts: vec![0; 5],
            min_value: 1,
            divider: DividerU64::divide_by(2),
        };
        histogram_computer.add_value(1);
        histogram_computer.add_value(7);
        assert_eq!(histogram_computer.harvest(), vec![1, 0, 0, 1, 0]);
    }

    // Values below `min_value` are not recorded.
    #[test]
    fn test_histogram_too_low_is_ignored() {
        let mut histogram_computer = HistogramComputer {
            counts: vec![0; 5],
            min_value: 2,
            divider: DividerU64::divide_by(2),
        };
        histogram_computer.add_value(0);
        assert_eq!(histogram_computer.harvest(), vec![0, 0, 0, 0, 0]);
    }

    // Values past the end of the last bucket ([8..10) here) are not recorded.
    #[test]
    fn test_histogram_too_high_is_ignored() {
        let mut histogram_computer = HistogramComputer {
            counts: vec![0u64; 5],
            min_value: 0,
            divider: DividerU64::divide_by(2),
        };
        histogram_computer.add_value(10);
        assert_eq!(histogram_computer.harvest(), vec![0, 0, 0, 0, 0]);
    }
    // Searching an index in which nothing was ever committed yields an all-zero histogram.
    #[test]
    fn test_no_segments() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        schema_builder.add_u64_field("val_field", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let reader = index.reader()?;
        let searcher = reader.searcher();
        let all_query = AllQuery;
        let histogram_collector = HistogramCollector::new("val_field".to_string(), 0u64, 2, 5);
        let histogram = searcher.search(&all_query, &histogram_collector)?;
        assert_eq!(histogram, vec![0; 5]);
        Ok(())
    }

    // Buckets are [-20..-10), [-10..0), [0..10), [10..20): -30 falls below the first bucket.
    #[test]
    fn test_histogram_i64() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let val_field = schema_builder.add_i64_field("val_field", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests()?;
        writer.add_document(doc!(val_field=>12i64))?;
        writer.add_document(doc!(val_field=>-30i64))?;
        writer.add_document(doc!(val_field=>-12i64))?;
        writer.add_document(doc!(val_field=>-10i64))?;
        writer.commit()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();
        let all_query = AllQuery;
        let histogram_collector =
            HistogramCollector::new("val_field".to_string(), -20i64, 10u64, 4);
        let histogram = searcher.search(&all_query, &histogram_collector)?;
        assert_eq!(histogram, vec![1, 1, 0, 1]);
        Ok(())
    }

    // Same data as `test_histogram_i64`, but with one commit per document, so that the
    // result goes through the merge of several per-segment histograms.
    #[test]
    fn test_histogram_merge() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let val_field = schema_builder.add_i64_field("val_field", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests()?;
        writer.add_document(doc!(val_field=>12i64))?;
        writer.commit()?;
        writer.add_document(doc!(val_field=>-30i64))?;
        writer.commit()?;
        writer.add_document(doc!(val_field=>-12i64))?;
        writer.commit()?;
        writer.add_document(doc!(val_field=>-10i64))?;
        writer.commit()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();
        let all_query = AllQuery;
        let histogram_collector =
            HistogramCollector::new("val_field".to_string(), -20i64, 10u64, 4);
        let histogram = searcher.search(&all_query, &histogram_collector)?;
        assert_eq!(histogram, vec![1, 1, 0, 1]);
        Ok(())
    }

    // Despite the `week_` prefix of the local names below, the buckets are 365 days wide
    // and start on 1980-01-01.
    #[test]
    fn test_histogram_dates() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let date_field = schema_builder.add_date_field("date_field", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests()?;
        writer.add_document(doc!(date_field=>DateTime::from_primitive(Date::from_calendar_date(1982, Month::September, 17)?.with_hms(0, 0, 0)?)))?;
        writer.add_document(
            doc!(date_field=>DateTime::from_primitive(Date::from_calendar_date(1986, Month::March, 9)?.with_hms(0, 0, 0)?)),
        )?;
        writer.add_document(doc!(date_field=>DateTime::from_primitive(Date::from_calendar_date(1983, Month::September, 27)?.with_hms(0, 0, 0)?)))?;
        writer.commit()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();
        let all_query = AllQuery;
        let week_histogram_collector = HistogramCollector::new(
            "date_field".to_string(),
            DateTime::from_primitive(
                Date::from_calendar_date(1980, Month::January, 1)?.with_hms(0, 0, 0)?,
            ),
            3_600_000_000_000 * 24 * 365, // it is just for a unit test... sorry leap years.
            10,
        );
        let week_histogram = searcher.search(&all_query, &week_histogram_collector)?;
        assert_eq!(week_histogram, vec![0, 0, 1, 1, 0, 0, 1, 0, 0, 0]);
        Ok(())
    }
}


================================================
FILE: src/collector/mod.rs
================================================
//! # Collectors
//!
//! Collectors define the information you want to extract from the documents matching the queries.
//! In tantivy jargon, we call this information your search "fruit".
//!
//! Your fruit could for instance be :
//! - [the count of matching documents](crate::collector::Count)
//! - [the top 10 documents, by relevancy or by a fast field](crate::collector::TopDocs)
//! - [facet counts](FacetCollector)
//!
//! At some point in your code, you will trigger the actual search operation by calling
//! [`Searcher::search()`](crate::Searcher::search).
//! This call will look like this:
//!
//! ```verbatim
//! let fruit = searcher.search(&query, &collector)?;
//! ```
//!
//! Here the type of fruit is actually determined as an associated type of the collector
//! (`Collector::Fruit`).
//!
//!
//! # Combining several collectors
//!
//! A rich search experience often requires running several collectors on your search query.
//! For instance,
//! - selecting the top-K products matching your query
//! - counting the matching documents
//! - computing several facets
//! - computing statistics about the matching product prices
//!
//! A simple and efficient way to do that is to pass your collectors as one tuple.
//! The resulting `Fruit` will then be a typed tuple with each collector's original fruits
//! in their respective position.
//!
//! ```rust
//! # use tantivy::schema::*;
//! # use tantivy::*;
//! # use tantivy::query::*;
//! use tantivy::collector::{Count, TopDocs};
//! #
//! # fn main() -> tantivy::Result<()> {
//! # let mut schema_builder = Schema::builder();
//! #     let title = schema_builder.add_text_field("title", TEXT);
//! #     let schema = schema_builder.build();
//! #     let index = Index::create_in_ram(schema);
//! #     let mut index_writer = index.writer(15_000_000)?;
//! #       index_writer.add_document(doc!(
//! #       title => "The Name of the Wind",
//! #      ))?;
//! #     index_writer.add_document(doc!(
//! #        title => "The Diary of Muadib",
//! #     ))?;
//! #     index_writer.commit()?;
//! #     let reader = index.reader()?;
//! #     let searcher = reader.searcher();
//! #     let query_parser = QueryParser::for_index(&index, vec![title]);
//! #     let query = query_parser.parse_query("diary")?;
//! let (doc_count, top_docs): (usize, Vec<(Score, DocAddress)>) =
//! searcher.search(&query, &(Count, TopDocs::with_limit(2).order_by_score()))?;
//! #     Ok(())
//! # }
//! ```
//!
//! The `Collector` trait is implemented for up to 4 collectors.
//! If you have more than 4 collectors, you can either group them into
//! tuples of tuples `(a,(b,(c,d)))`, or rely on [`MultiCollector`].
//!
//! # Combining several collectors dynamically
//!
//! Combining collectors into a tuple is a zero-cost abstraction: everything
//! happens as if you had manually implemented a single collector
//! combining all of our features.
//!
//! Unfortunately it requires you to know at compile time your collector types.
//! If on the other hand, the collectors depend on some query parameter,
//! you can rely on a [`MultiCollector`].
//!
//!
//! # Implementing your own collectors.
//!
//! See the `custom_collector` example.

use downcast_rs::impl_downcast;

use crate::schema::Schema;
use crate::{DocId, Score, SegmentOrdinal, SegmentReader};

mod count_collector;
pub use self::count_collector::Count;

/// Sort keys
pub mod sort_key;

mod histogram_collector;
pub use histogram_collector::HistogramCollector;

mod multi_collector;
pub use self::multi_collector::{FruitHandle, MultiCollector, MultiFruit};

mod top_collector;
pub use self::top_collector::ComparableDoc;

mod top_score_collector;
pub use self::top_score_collector::{TopDocs, TopNComputer};

mod sort_key_top_collector;
pub use self::sort_key::{SegmentSortKeyComputer, SortKeyComputer};
mod facet_collector;
pub use self::facet_collector::{FacetCollector, FacetCounts};
use crate::query::Weight;

mod docset_collector;
pub use self::docset_collector::DocSetCollector;

mod filter_collector_wrapper;
pub use self::filter_collector_wrapper::{BytesFilterCollector, FilterCollector};

/// `Fruit` is the type for the result of our collection.
/// e.g. `usize` for the `Count` collector.
///
/// It does not need to be implemented manually: a blanket implementation
/// covers every type that is `Send` and supports `downcast_rs::Downcast`.
pub trait Fruit: Send + downcast_rs::Downcast {}

// Blanket implementation: any `Send + Downcast` type is a `Fruit`.
impl<T> Fruit for T where T: Send + downcast_rs::Downcast {}

/// Collectors are in charge of collecting and retaining relevant
/// information from the documents found and scored by the query.
///
/// For instance,
///
/// - keeping track of the top 10 best documents
/// - computing a breakdown over a fast field
/// - computing the number of documents matching the query
///
/// Our search index is in fact a collection of segments, so
/// a `Collector` is actually more of a factory that instantiates
/// one `SegmentCollector` per segment.
///
/// The collection logic itself is in the `SegmentCollector`.
///
/// Segments are not guaranteed to be visited in any specific order.
pub trait Collector: Sync + Send {
    /// `Fruit` is the type for the result of our collection.
    /// e.g. `usize` for the `Count` collector.
    type Fruit: Fruit;

    /// Type of the `SegmentCollector` associated with this collector.
    type Child: SegmentCollector;

    /// Returns an error if the schema is not compatible with the collector.
    ///
    /// The default implementation accepts any schema.
    fn check_schema(&self, _schema: &Schema) -> crate::Result<()> {
        Ok(())
    }

    /// Creates the `SegmentCollector` in charge of the given segment.
    ///
    /// `for_segment` is called before beginning to enumerate
    /// the documents of this segment.
    fn for_segment(
        &self,
        segment_local_id: SegmentOrdinal,
        segment: &SegmentReader,
    ) -> crate::Result<Self::Child>;

    /// Returns true iff the collector requires to compute scores for documents.
    fn requires_scoring(&self) -> bool;

    /// Combines the fruits associated with the collection of each segment
    /// into one fruit.
    fn merge_fruits(
        &self,
        segment_fruits: Vec<<Self::Child as SegmentCollector>::Fruit>,
    ) -> crate::Result<Self::Fruit>;

    /// Creates a segment collector for the given segment, feeds it with the
    /// documents matched by `weight`, and returns its harvested fruit.
    ///
    /// Scores are only computed if `requires_scoring()` returns `true`.
    fn collect_segment(
        &self,
        weight: &dyn Weight,
        segment_ord: u32,
        reader: &SegmentReader,
    ) -> crate::Result<<Self::Child as SegmentCollector>::Fruit> {
        let with_scoring = self.requires_scoring();
        let mut segment_collector = self.for_segment(segment_ord, reader)?;
        default_collect_segment_impl(&mut segment_collector, weight, reader, with_scoring)?;
        Ok(segment_collector.harvest())
    }
}

/// Pushes the documents of `reader` matched by `weight` into `segment_collector`.
///
/// - With scoring, documents are pushed one by one along with their score.
/// - Without scoring, documents are enumerated by blocks. If the segment has
///   an alive bitset, the alive documents of each block are pushed one by one with
///   a score of `0.0`; otherwise each block is pushed as a whole.
///
/// Documents that are not alive according to the alive bitset are never collected.
pub(crate) fn default_collect_segment_impl<TSegmentCollector: SegmentCollector>(
    segment_collector: &mut TSegmentCollector,
    weight: &dyn Weight,
    reader: &SegmentReader,
    with_scoring: bool,
) -> crate::Result<()> {
    let alive_bitset_opt = reader.alive_bitset();
    if with_scoring {
        if let Some(alive_bitset) = alive_bitset_opt {
            weight.for_each(reader, &mut |doc, score| {
                if alive_bitset.is_alive(doc) {
                    segment_collector.collect(doc, score);
                }
            })?;
        } else {
            weight.for_each(reader, &mut |doc, score| {
                segment_collector.collect(doc, score);
            })?;
        }
    } else if let Some(alive_bitset) = alive_bitset_opt {
        weight.for_each_no_score(reader, &mut |docs| {
            for &doc in docs {
                if alive_bitset.is_alive(doc) {
                    segment_collector.collect(doc, 0.0);
                }
            }
        })?;
    } else {
        weight.for_each_no_score(reader, &mut |docs| {
            segment_collector.collect_block(docs);
        })?;
    }
    Ok(())
}

/// An optional segment collector: `None` ignores every document and harvests `None`,
/// `Some` forwards everything to the wrapped segment collector.
impl<TSegmentCollector: SegmentCollector> SegmentCollector for Option<TSegmentCollector> {
    type Fruit = Option<TSegmentCollector::Fruit>;

    fn collect(&mut self, doc: DocId, score: Score) {
        if let Some(inner) = self.as_mut() {
            inner.collect(doc, score);
        }
    }

    fn collect_block(&mut self, docs: &[DocId]) {
        if let Some(inner) = self.as_mut() {
            inner.collect_block(docs);
        }
    }

    fn harvest(self) -> Self::Fruit {
        self.map(TSegmentCollector::harvest)
    }
}

/// An optional collector: `None` collects nothing and yields `None`,
/// `Some` delegates everything to the wrapped collector.
impl<TCollector: Collector> Collector for Option<TCollector> {
    type Fruit = Option<TCollector::Fruit>;

    type Child = Option<<TCollector as Collector>::Child>;

    fn check_schema(&self, schema: &Schema) -> crate::Result<()> {
        match self {
            Some(inner) => inner.check_schema(schema),
            None => Ok(()),
        }
    }

    fn for_segment(
        &self,
        segment_local_id: SegmentOrdinal,
        segment: &SegmentReader,
    ) -> crate::Result<Self::Child> {
        self.as_ref()
            .map(|inner| inner.for_segment(segment_local_id, segment))
            .transpose()
    }

    fn requires_scoring(&self) -> bool {
        match self {
            Some(inner) => inner.requires_scoring(),
            None => false,
        }
    }

    fn merge_fruits(
        &self,
        segment_fruits: Vec<<Self::Child as SegmentCollector>::Fruit>,
    ) -> crate::Result<Self::Fruit> {
        let inner = match self {
            Some(inner) => inner,
            None => return Ok(None),
        };
        // Segment fruits that are `None` are skipped.
        let present_fruits: Vec<_> = segment_fruits.into_iter().flatten().collect();
        inner.merge_fruits(present_fruits).map(Some)
    }
}

/// A `SegmentCollector` defines the collect operation
/// at the scale of a single segment.
///
/// `.collect(doc, score)` is called for every document
/// matching the query.
pub trait SegmentCollector: 'static {
    /// Type of the result of the collection on one segment,
    /// e.g. `usize` for the `Count` collector.
    type Fruit: Fruit;

    /// The query pushes each matching document, with its score, via this method.
    fn collect(&mut self, doc: DocId, score: Score);

    /// The query pushes a block of matching documents via this method.
    /// This method is used when the collector does not require scoring.
    ///
    /// The default implementation forwards each document to
    /// [`collect`](Self::collect) with a score of `0.0`.
    ///
    /// See [`COLLECT_BLOCK_BUFFER_LEN`](crate::COLLECT_BLOCK_BUFFER_LEN) for the
    /// buffer size passed to the collector.
    fn collect_block(&mut self, docs: &[DocId]) {
        docs.iter().for_each(|&doc| self.collect(doc, 0.0));
    }

    /// Consumes the `SegmentCollector` and returns the fruit of the collection.
    fn harvest(self) -> Self::Fruit;
}

// -----------------------------------------------
// Tuple implementations.

/// A pair of collectors is itself a collector, whose fruit is the pair of their fruits.
impl<Left, Right> Collector for (Left, Right)
where
    Left: Collector,
    Right: Collector,
{
    type Fruit = (Left::Fruit, Right::Fruit);
    type Child = (Left::Child, Right::Child);

    fn check_schema(&self, schema: &Schema) -> crate::Result<()> {
        let (left, right) = self;
        left.check_schema(schema)?;
        right.check_schema(schema)
    }

    fn for_segment(
        &self,
        segment_local_id: u32,
        segment: &SegmentReader,
    ) -> crate::Result<Self::Child> {
        let (left, right) = self;
        Ok((
            left.for_segment(segment_local_id, segment)?,
            right.for_segment(segment_local_id, segment)?,
        ))
    }

    /// Scoring is required as soon as one of the two collectors requires it.
    fn requires_scoring(&self) -> bool {
        let (left, right) = self;
        left.requires_scoring() || right.requires_scoring()
    }

    fn merge_fruits(
        &self,
        segment_fruits: Vec<<Self::Child as SegmentCollector>::Fruit>,
    ) -> crate::Result<(Left::Fruit, Right::Fruit)> {
        // Split the per-segment pairs into one list of fruits per collector.
        let (left_fruits, right_fruits): (Vec<_>, Vec<_>) = segment_fruits.into_iter().unzip();
        let merged_left = self.0.merge_fruits(left_fruits)?;
        let merged_right = self.1.merge_fruits(right_fruits)?;
        Ok((merged_left, merged_right))
    }
}

/// A pair of segment collectors: every document (or block) is pushed to both,
/// left first, and the fruit is the pair of their fruits.
impl<Left, Right> SegmentCollector for (Left, Right)
where
    Left: SegmentCollector,
    Right: SegmentCollector,
{
    type Fruit = (Left::Fruit, Right::Fruit);

    fn collect(&mut self, doc: DocId, score: Score) {
        let (left, right) = self;
        left.collect(doc, score);
        right.collect(doc, score);
    }

    fn collect_block(&mut self, docs: &[DocId]) {
        let (left, right) = self;
        left.collect_block(docs);
        right.collect_block(docs);
    }

    fn harvest(self) -> <Self as SegmentCollector>::Fruit {
        let (left, right) = self;
        (left.harvest(), right.harvest())
    }
}

// 3-Tuple

/// A triple of collectors is itself a collector, whose fruit is the triple of their fruits.
impl<One, Two, Three> Collector for (One, Two, Three)
where
    One: Collector,
    Two: Collector,
    Three: Collector,
{
    type Fruit = (One::Fruit, Two::Fruit, Three::Fruit);
    type Child = (One::Child, Two::Child, Three::Child);

    fn check_schema(&self, schema: &Schema) -> crate::Result<()> {
        let (one, two, three) = self;
        one.check_schema(schema)?;
        two.check_schema(schema)?;
        three.check_schema(schema)
    }

    fn for_segment(
        &self,
        segment_local_id: u32,
        segment: &SegmentReader,
    ) -> crate::Result<Self::Child> {
        let (one, two, three) = self;
        Ok((
            one.for_segment(segment_local_id, segment)?,
            two.for_segment(segment_local_id, segment)?,
            three.for_segment(segment_local_id, segment)?,
        ))
    }

    /// Scoring is required as soon as one of the collectors requires it.
    fn requires_scoring(&self) -> bool {
        let (one, two, three) = self;
        one.requires_scoring() || two.requires_scoring() || three.requires_scoring()
    }

    fn merge_fruits(
        &self,
        children: Vec<<Self::Child as SegmentCollector>::Fruit>,
    ) -> crate::Result<Self::Fruit> {
        // Split the per-segment triples into one list of fruits per collector.
        let num_segments = children.len();
        let mut one_fruits = Vec::with_capacity(num_segments);
        let mut two_fruits = Vec::with_capacity(num_segments);
        let mut three_fruits = Vec::with_capacity(num_segments);
        for (one_fruit, two_fruit, three_fruit) in children {
            one_fruits.push(one_fruit);
            two_fruits.push(two_fruit);
            three_fruits.push(three_fruit);
        }
        let merged_one = self.0.merge_fruits(one_fruits)?;
        let merged_two = self.1.merge_fruits(two_fruits)?;
        let merged_three = self.2.merge_fruits(three_fruits)?;
        Ok((merged_one, merged_two, merged_three))
    }
}

/// A triple of segment collectors: every document (or block) is pushed to each of them,
/// in order, and the fruit is the triple of their fruits.
impl<One, Two, Three> SegmentCollector for (One, Two, Three)
where
    One: SegmentCollector,
    Two: SegmentCollector,
    Three: SegmentCollector,
{
    type Fruit = (One::Fruit, Two::Fruit, Three::Fruit);

    fn collect(&mut self, doc: DocId, score: Score) {
        let (one, two, three) = self;
        one.collect(doc, score);
        two.collect(doc, score);
        three.collect(doc, score);
    }

    fn collect_block(&mut self, docs: &[DocId]) {
        let (one, two, three) = self;
        one.collect_block(docs);
        two.collect_block(docs);
        three.collect_block(docs);
    }

    fn harvest(self) -> <Self as SegmentCollector>::Fruit {
        let (one, two, three) = self;
        (one.harvest(), two.harvest(), three.harvest())
    }
}

// 4-Tuple

/// A 4-tuple of collectors is itself a collector, whose fruit is the 4-tuple of their fruits.
impl<One, Two, Three, Four> Collector for (One, Two, Three, Four)
where
    One: Collector,
    Two: Collector,
    Three: Collector,
    Four: Collector,
{
    type Fruit = (One::Fruit, Two::Fruit, Three::Fruit, Four::Fruit);
    type Child = (One::Child, Two::Child, Three::Child, Four::Child);

    fn check_schema(&self, schema: &Schema) -> crate::Result<()> {
        let (one, two, three, four) = self;
        one.check_schema(schema)?;
        two.check_schema(schema)?;
        three.check_schema(schema)?;
        four.check_schema(schema)
    }

    fn for_segment(
        &self,
        segment_local_id: u32,
        segment: &SegmentReader,
    ) -> crate::Result<Self::Child> {
        let (one, two, three, four) = self;
        Ok((
            one.for_segment(segment_local_id, segment)?,
            two.for_segment(segment_local_id, segment)?,
            three.for_segment(segment_local_id, segment)?,
            four.for_segment(segment_local_id, segment)?,
        ))
    }

    /// Scoring is required as soon as one of the collectors requires it.
    fn requires_scoring(&self) -> bool {
        let (one, two, three, four) = self;
        one.requires_scoring()
            || two.requires_scoring()
            || three.requires_scoring()
            || four.requires_scoring()
    }

    fn merge_fruits(
        &self,
        children: Vec<<Self::Child as SegmentCollector>::Fruit>,
    ) -> crate::Result<Self::Fruit> {
        // Split the per-segment 4-tuples into one list of fruits per collector.
        let num_segments = children.len();
        let mut one_fruits = Vec::with_capacity(num_segments);
        let mut two_fruits = Vec::with_capacity(num_segments);
        let mut three_fruits = Vec::with_capacity(num_segments);
        let mut four_fruits = Vec::with_capacity(num_segments);
        for (one_fruit, two_fruit, three_fruit, four_fruit) in children {
            one_fruits.push(one_fruit);
            two_fruits.push(two_fruit);
            three_fruits.push(three_fruit);
            four_fruits.push(four_fruit);
        }
        let merged_one = self.0.merge_fruits(one_fruits)?;
        let merged_two = self.1.merge_fruits(two_fruits)?;
        let merged_three = self.2.merge_fruits(three_fruits)?;
        let merged_four = self.3.merge_fruits(four_fruits)?;
        Ok((merged_one, merged_two, merged_three, merged_four))
    }
}

/// A 4-tuple of segment collectors: every document (or block) is pushed to each of them,
/// in order, and the fruit is the 4-tuple of their fruits.
impl<One, Two, Three, Four> SegmentCollector for (One, Two, Three, Four)
where
    One: SegmentCollector,
    Two: SegmentCollector,
    Three: SegmentCollector,
    Four: SegmentCollector,
{
    type Fruit = (One::Fruit, Two::Fruit, Three::Fruit, Four::Fruit);

    fn collect(&mut self, doc: DocId, score: Score) {
        let (one, two, three, four) = self;
        one.collect(doc, score);
        two.collect(doc, score);
        three.collect(doc, score);
        four.collect(doc, score);
    }

    fn collect_block(&mut self, docs: &[DocId]) {
        let (one, two, three, four) = self;
        one.collect_block(docs);
        two.collect_block(docs);
        three.collect_block(docs);
        four.collect_block(docs);
    }

    fn harvest(self) -> <Self as SegmentCollector>::Fruit {
        let (one, two, three, four) = self;
        (
            one.harvest(),
            two.harvest(),
            three.harvest(),
            four.harvest(),
        )
    }
}

impl_downcast!(Fruit);

#[cfg(test)]
pub(crate) mod tests;


================================================
FILE: src/collector/multi_collector.rs
================================================
use std::marker::PhantomData;
use std::ops::Deref;

use super::{Collector, SegmentCollector};
use crate::collector::Fruit;
use crate::schema::Schema;
use crate::{DocId, Score, SegmentOrdinal, SegmentReader, TantivyError};

/// `MultiFruit` keeps the fruits of every collector nested in a `MultiCollector`.
///
/// Fruits are type-erased (`Box<dyn Fruit>`); a typed fruit is recovered through
/// `FruitHandle::extract`, which moves it out of its slot.
pub struct MultiFruit {
    // One slot per nested collector, in the order the collectors were added.
    // A slot becomes `None` once its fruit has been extracted.
    sub_fruits: Vec<Option<Box<dyn Fruit>>>,
}

/// Adapter that type-erases a `Collector`.
///
/// Its `Collector` implementation exposes `Box<dyn BoxableSegmentCollector>` as the
/// segment collector type and `Box<dyn Fruit>` as the fruit type, regardless of the
/// wrapped collector's own associated types.
pub struct CollectorWrapper<TCollector: Collector>(TCollector);

impl<TCollector: Collector> Collector for CollectorWrapper<TCollector> {
    type Fruit = Box<dyn Fruit>;
    type Child = Box<dyn BoxableSegmentCollector>;

    fn check_schema(&self, schema: &Schema) -> crate::Result<()> {
        self.0.check_schema(schema)
    }

    fn for_segment(
        &self,
        segment_local_id: u32,
        reader: &SegmentReader,
    ) -> crate::Result<Box<dyn BoxableSegmentCollector>> {
        let child = self.0.for_segment(segment_local_id, reader)?;
        Ok(Box::new(SegmentCollectorWrapper(child)))
    }

    fn requires_scoring(&self) -> bool {
        self.0.requires_scoring()
    }

    fn merge_fruits(
        &self,
        children: Vec<<Self::Child as SegmentCollector>::Fruit>,
    ) -> crate::Result<Box<dyn Fruit>> {
        let typed_fruit: Vec<<TCollector::Child as SegmentCollector>::Fruit> = children
            .into_iter()
            .map(|untyped_fruit| {
                untyped_fruit
                    .downcast::<<TCollector::Child as SegmentCollector>::Fruit>()
                    .map(|boxed_but_typed| *boxed_but_typed)
                    .map_err(|_| {
                        TantivyError::InvalidArgument("Failed to cast child fruit.".to_string())
                    })
            })
            .collect::<crate::Result<_>>()?;
        let merged_fruit = self.0.merge_fruits(typed_fruit)?;
        Ok(Box::new(merged_fruit))
    }
}

/// Lets a boxed, type-erased segment collector be used wherever a `SegmentCollector`
/// is expected, by forwarding to the `BoxableSegmentCollector` behind the box.
impl SegmentCollector for Box<dyn BoxableSegmentCollector> {
    type Fruit = Box<dyn Fruit>;

    #[inline]
    fn collect(&mut self, doc: u32, score: Score) {
        // Explicit trait dispatch on the boxed value: a plain `self.collect(..)` would
        // resolve to this very method.
        BoxableSegmentCollector::collect(&mut **self, doc, score);
    }

    #[inline]
    fn collect_block(&mut self, docs: &[DocId]) {
        BoxableSegmentCollector::collect_block(&mut **self, docs);
    }

    /// Consumes the box and returns the type-erased fruit of the inner collector.
    fn harvest(self) -> Box<dyn Fruit> {
        self.harvest_from_box()
    }
}

/// Object-safe counterpart of `SegmentCollector`, producing a type-erased fruit.
pub trait BoxableSegmentCollector {
    /// Collects a single document together with its score.
    fn collect(&mut self, doc: u32, score: Score);

    /// Collects a block of documents.
    ///
    /// The default implementation calls `collect` once per document, with a score of `0.0`.
    fn collect_block(&mut self, docs: &[DocId]) {
        docs.iter().copied().for_each(|doc| self.collect(doc, 0.0));
    }

    /// Consumes the boxed collector and returns its fruit, type-erased.
    fn harvest_from_box(self: Box<Self>) -> Box<dyn Fruit>;
}

/// Adapter that exposes a typed `SegmentCollector` through the object-safe
/// `BoxableSegmentCollector` trait, boxing its fruit on harvest.
pub struct SegmentCollectorWrapper<TSegmentCollector: SegmentCollector>(TSegmentCollector);

impl<TSegmentCollector: SegmentCollector> BoxableSegmentCollector
    for SegmentCollectorWrapper<TSegmentCollector>
{
    #[inline]
    fn collect(&mut self, doc: u32, score: Score) {
        self.0.collect(doc, score);
    }
    #[inline]
    fn collect_block(&mut self, docs: &[DocId]) {
        self.0.collect_block(docs);
    }

    fn harvest_from_box(self: Box<Self>) -> Box<dyn Fruit> {
        Box::new(self.0.harvest())
    }
}

/// `FruitHandle` identifies one collector registered in a `MultiCollector`.
///
/// It remembers the position of that collector and, through its type parameter, the
/// type of the fruit to recover from the resulting `MultiFruit`.
pub struct FruitHandle<TFruit: Fruit> {
    // Index of the collector (and therefore of its fruit) inside the multi collector.
    pos: usize,
    // Carries the fruit type without storing a value of it.
    _phantom: PhantomData<TFruit>,
}

impl<TFruit: Fruit> FruitHandle<TFruit> {
    /// Extract a typed fruit off a multifruit.
    ///
    /// The fruit is moved out of `fruits`: the slot associated with this handle is left
    /// empty afterwards.
    ///
    /// # Panics
    ///
    /// This function involves downcasting and can panic if the multifruit was
    /// created using faulty code. More precisely, it panics if:
    /// - `fruits` holds no fruit at the position of this handle (the position is out of
    ///   range, or the fruit was already taken out), which typically means the handle
    ///   and the multifruit do not come from the same `MultiCollector`;
    /// - the stored fruit is not of type `TFruit`.
    pub fn extract(self, fruits: &mut MultiFruit) -> TFruit {
        // `get_mut` + `take` instead of indexing, so that an out-of-range position and an
        // already emptied slot are both reported with the same explicit message.
        let boxed_fruit = fruits
            .sub_fruits
            .get_mut(self.pos)
            .and_then(Option::take)
            .expect(
                "No fruit available for this handle. Was the multifruit produced by the \
                 MultiCollector that created the handle?",
            );
        *boxed_fruit
            .downcast::<TFruit>()
            .map_err(|_| ())
            .expect("Failed to downcast collector fruit.")
    }
}

/// `MultiCollector` makes it possible to collect on more than one collector.
/// It should only be used for use cases where the types of the collectors are unknown
/// at compile time.
///
/// If the types of the collectors are known, you can just group your collectors
/// in a tuple. See the
/// [Combining several collectors section of the collector
/// documentation](./index.html#combining-several-collectors).
///
/// ```rust
/// use tantivy::collector::{Count, TopDocs, MultiCollector};
/// use tantivy::query::QueryParser;
/// use tantivy::schema::{Schema, TEXT};
/// use tantivy::{doc, Index};
///
/// # fn main() -> tantivy::Result<()> {
/// let mut schema_builder = Schema::builder();
/// let title = schema_builder.add_text_field("title", TEXT);
/// let schema = schema_builder.build();
/// let index = Index::create_in_ram(schema);
/// let mut index_writer = index.writer(15_000_000)?;
/// index_writer.add_document(doc!(title => "The Name of the Wind"))?;
/// index_writer.add_document(doc!(title => "The Diary of Muadib"))?;
/// index_writer.add_document(doc!(title => "A Dairy Cow"))?;
/// index_writer.add_document(doc!(title => "The Diary of a Young Girl"))?;
/// index_writer.commit()?;
///
/// let reader = index.reader()?;
/// let searcher = reader.searcher();
///
/// let mut collectors = MultiCollector::new();
/// let top_docs_handle = collectors.add_collector(TopDocs::with_limit(2).order_by_score());
/// let count_handle = collectors.add_collector(Count);
/// let query_parser = QueryParser::for_index(&index, vec![title]);
/// let query = query_parser.parse_query("diary").unwrap();
/// let mut multi_fruit = searcher.search(&query, &collectors).unwrap();
///
/// let count = count_handle.extract(&mut multi_fruit);
/// let top_docs = top_docs_handle.extract(&mut multi_fruit);
///
/// assert_eq!(count, 2);
/// assert_eq!(top_docs.len(), 2);
/// # Ok(())
/// # }
/// ```
#[expect(clippy::type_complexity)]
#[derive(Default)]
pub struct MultiCollector<'a> {
    // Type-erased collectors, in the order they were added. The position of a collector
    // in this vector is the position recorded in its `FruitHandle`.
    collector_wrappers: Vec<
        Box<dyn Collector<Child = Box<dyn BoxableSegmentCollector>, Fruit = Box<dyn Fruit>> + 'a>,
    >,
}

impl<'a> MultiCollector<'a> {
    /// Create a new, empty `MultiCollector`.
    pub fn new() -> Self {
        Self::default()
    }

    /// Add a new collector to our `MultiCollector`.
    ///
    /// The returned handle records the position of the collector and is used to extract
    /// the collector's fruit from the `MultiFruit` produced by the search.
    pub fn add_collector<'b: 'a, TCollector: Collector + 'b>(
        &mut self,
        collector: TCollector,
    ) -> FruitHandle<TCollector::Fruit> {
        // The handle points at the slot the collector is about to occupy.
        let handle = FruitHandle {
            pos: self.collector_wrappers.len(),
            _phantom: PhantomData,
        };
        let wrapper = Box::new(CollectorWrapper(collector));
        self.collector_wrappers.push(wrapper);
        handle
    }
}

impl Collector for MultiCollector<'_> {
    type Fruit = MultiFruit;
    type Child = MultiCollectorChild;

    /// Checks the schema against every nested collector, stopping at the first error.
    fn check_schema(&self, schema: &Schema) -> crate::Result<()> {
        self.collector_wrappers
            .iter()
            .try_for_each(|collector| collector.check_schema(schema))
    }

    /// Creates one segment collector per nested collector, in registration order.
    fn for_segment(
        &self,
        segment_local_id: SegmentOrdinal,
        segment: &SegmentReader,
    ) -> crate::Result<MultiCollectorChild> {
        let mut children = Vec::with_capacity(self.collector_wrappers.len());
        for collector_wrapper in &self.collector_wrappers {
            children.push(collector_wrapper.for_segment(segment_local_id, segment)?);
        }
        Ok(MultiCollectorChild { children })
    }

    /// Scoring is required as soon as one nested collector requires it.
    fn requires_scoring(&self) -> bool {
        self.collector_wrappers
            .iter()
            .any(|collector_wrapper| collector_wrapper.deref().requires_scoring())
    }

    /// Regroups the per-segment fruits by collector, then lets each nested collector
    /// merge its own fruits.
    fn merge_fruits(&self, segments_multifruits: Vec<MultiFruit>) -> crate::Result<MultiFruit> {
        let num_collectors = self.collector_wrappers.len();
        let num_segments = segments_multifruits.len();

        // `fruits_per_collector[i]` gathers the fruits of collector `i` over all segments.
        let mut fruits_per_collector: Vec<Vec<Box<dyn Fruit>>> =
            Vec::with_capacity(num_collectors);
        fruits_per_collector.resize_with(num_collectors, || Vec::with_capacity(num_segments));

        for MultiFruit { sub_fruits } in segments_multifruits {
            let present_fruits = sub_fruits
                .into_iter()
                .enumerate()
                .filter_map(|(idx, fruit_opt)| fruit_opt.map(|fruit| (idx, fruit)));
            for (idx, segment_fruit) in present_fruits {
                fruits_per_collector[idx].push(segment_fruit);
            }
        }

        let mut sub_fruits = Vec::with_capacity(num_collectors);
        for (child_collector, segment_fruits) in
            self.collector_wrappers.iter().zip(fruits_per_collector)
        {
            let merged_fruit = child_collector.merge_fruits(segment_fruits)?;
            sub_fruits.push(Some(merged_fruit));
        }
        Ok(MultiFruit { sub_fruits })
    }
}

/// Segment collector of a `MultiCollector`: holds one type-erased segment collector
/// per nested collector.
pub struct MultiCollectorChild {
    // Same order as the collectors registered in the parent `MultiCollector`.
    children: Vec<Box<dyn BoxableSegmentCollector>>,
}

impl SegmentCollector for MultiCollectorChild {
    type Fruit = MultiFruit;

    /// Forwards the scored document to every nested segment collector.
    fn collect(&mut self, doc: DocId, score: Score) {
        self.children
            .iter_mut()
            .for_each(|child| child.collect(doc, score));
    }

    /// Forwards the block of documents to every nested segment collector.
    fn collect_block(&mut self, docs: &[DocId]) {
        self.children
            .iter_mut()
            .for_each(|child| child.collect_block(docs));
    }

    /// Harvests every nested segment collector, keeping the fruits in collector order.
    fn harvest(self) -> MultiFruit {
        let mut sub_fruits = Vec::with_capacity(self.children.len());
        for child in self.children {
            sub_fruits.push(Some(child.harvest()));
        }
        MultiFruit { sub_fruits }
    }
}

#[cfg(test)]
mod tests {

    use super::*;
    use crate::collector::{Count, TopDocs};
    use crate::query::TermQuery;
    use crate::schema::{IndexRecordOption, Schema, TEXT};
    use crate::{Index, Term};

    // Runs a `TopDocs` and a `Count` collector through a single `MultiCollector` and
    // checks that both fruits can be extracted from the resulting multifruit.
    #[test]
    fn test_multi_collector() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text = schema_builder.add_text_field("text", TEXT);
        let schema = schema_builder.build();

        let index = Index::create_in_ram(schema);
        {
            // Documents are added in two separate commits. Six documents in total, one of
            // which has an empty text and therefore does not contain the term "abc".
            let mut index_writer = index.writer_for_tests()?;
            index_writer.add_document(doc!(text=>"abc"))?;
            index_writer.add_document(doc!(text=>"abc abc abc"))?;
            index_writer.add_document(doc!(text=>"abc abc"))?;
            index_writer.commit()?;
            index_writer.add_document(doc!(text=>""))?;
            index_writer.add_document(doc!(text=>"abc abc abc abc"))?;
            index_writer.add_document(doc!(text=>"abc"))?;
            index_writer.commit()?;
        }
        let searcher = index.reader()?.searcher();
        let term = Term::from_field_text(text, "abc");
        let query = TermQuery::new(term, IndexRecordOption::Basic);

        let mut collectors = MultiCollector::new();
        let topdocs_handler = collectors.add_collector(TopDocs::with_limit(2).order_by_score());
        let count_handler = collectors.add_collector(Count);
        let mut multifruits = searcher.search(&query, &collectors).unwrap();

        // Fruits are extracted in a different order than the collectors were added.
        assert_eq!(count_handler.extract(&mut multifruits), 5);
        assert_eq!(topdocs_handler.extract(&mut multifruits).len(), 2);
        Ok(())
    }
}


================================================
FILE: src/collector/sort_key/mod.rs
================================================
mod order;
mod sort_by_bytes;
mod sort_by_erased_type;
mod sort_by_score;
mod sort_by_static_fast_value;
mod sort_by_string;
mod sort_key_computer;

pub use order::*;
pub use sort_by_bytes::SortByBytes;
pub use sort_by_erased_type::SortByErasedType;
pub use sort_by_score::SortBySimilarityScore;
pub use sort_by_static_fast_value::SortByStaticFastValue;
pub use sort_by_string::SortByString;
pub use sort_key_computer::{SegmentSortKeyComputer, SortKeyComputer};

#[cfg(test)]
pub(crate) mod tests {

    // Reference ordering used by the tests: hits are ordered by sort key, in the requested
    // direction. By spec, ties are always broken by ascending doc id/doc address, whether
    // ascending or descending order was requested.
    pub(crate) fn sort_hits<TSortKey: Ord, D: Ord>(
        hits: &mut [ComparableDoc<TSortKey, D>],
        order: Order,
    ) {
        let ascending = order.is_asc();
        hits.sort_by(|left, right| {
            let natural_key_order = left.sort_key.cmp(&right.sort_key);
            let key_order = if ascending {
                natural_key_order
            } else {
                // Descending: flip the key comparison only, not the tie-break.
                natural_key_order.reverse()
            };
            key_order.then(left.doc.cmp(&right.doc))
        });
    }

    use std::collections::HashMap;
    use std::ops::Range;

    use crate::collector::sort_key::{
        SortByErasedType, SortBySimilarityScore, SortByStaticFastValue, SortByString,
    };
    use crate::collector::{ComparableDoc, DocSetCollector, TopDocs};
    use crate::indexer::NoMergePolicy;
    use crate::query::{AllQuery, QueryParser};
    use crate::schema::{OwnedValue, Schema, FAST, TEXT};
    use crate::{DocAddress, Document, Index, Order, Score, Searcher};

    // Builds the in-RAM index shared by the tests of this module.
    //
    // Four documents (ids 0 to 3) are written through three separate writers, each
    // committing once with merges disabled: ids 0 and 1 together, then id 2, then id 3.
    // The document with id 3 has no `city` value.
    fn make_index() -> crate::Result<Index> {
        let mut schema_builder = Schema::builder();
        let id = schema_builder.add_u64_field("id", FAST);
        let city = schema_builder.add_text_field("city", TEXT | FAST);
        let catchphrase = schema_builder.add_text_field("catchphrase", TEXT);
        let altitude = schema_builder.add_f64_field("altitude", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);

        // Writes `docs` with a fresh writer and a single commit. `NoMergePolicy` is set so
        // that the committed documents are not merged with previously written ones.
        fn create_segment(index: &Index, docs: Vec<impl Document>) -> crate::Result<()> {
            let mut index_writer = index.writer_for_tests()?;
            index_writer.set_merge_policy(Box::new(NoMergePolicy));
            for doc in docs {
                index_writer.add_document(doc)?;
            }
            index_writer.commit()?;
            Ok(())
        }

        create_segment(
            &index,
            vec![
                doc!(
                    id => 0_u64,
                    city => "austin",
                    catchphrase => "Hills, Barbeque, Glow",
                    altitude => 149.0,
                ),
                doc!(
                    id => 1_u64,
                    city => "greenville",
                    catchphrase => "Grow, Glow, Glow",
                    altitude => 27.0,
                ),
            ],
        )?;
        create_segment(
            &index,
            vec![doc!(
                id => 2_u64,
                city => "tokyo",
                catchphrase => "Glow, Glow, Glow",
                altitude => 40.0,
            )],
        )?;
        // No `city` for this document: it exercises the missing-value ordering.
        create_segment(
            &index,
            vec![doc!(
                id => 3_u64,
                catchphrase => "No, No, No",
                altitude => 0.0,
            )],
        )?;
        Ok(index)
    }

    // Maps the address of every document visible to `searcher` to the value of its `id`
    // fast field.
    //
    // NOTE: The SegmentIds that will be generated for Segments cannot be determined ahead
    // of time, so DocAddresses must be mapped back to a unique id for each Searcher.
    fn id_mapping(searcher: &Searcher) -> HashMap<DocAddress, u64> {
        let doc_addresses = searcher.search(&AllQuery, &DocSetCollector).unwrap();
        let mut ids_by_address = HashMap::new();
        for doc_address in doc_addresses {
            let segment_reader = &searcher.segment_readers()[doc_address.segment_ord as usize];
            let id_column = segment_reader.fast_fields().u64("id").unwrap();
            let id = id_column.first(doc_address.doc_id).unwrap();
            ids_by_address.insert(doc_address, id);
        }
        ids_by_address
    }

    // Orders the documents of `make_index()` by their `city` string fast field, for
    // several doc ranges and both orders. Results are expressed as
    // `(city, id)` pairs, where `id` is the value of the `id` fast field.
    #[test]
    fn test_order_by_string() -> crate::Result<()> {
        let index = make_index()?;

        // Runs an `AllQuery` with a `TopDocs` collector restricted to `doc_range` and
        // ordered by `city`, then compares the hits against `expected`.
        #[track_caller]
        fn assert_query(
            index: &Index,
            order: Order,
            doc_range: Range<usize>,
            expected: Vec<(Option<String>, u64)>,
        ) -> crate::Result<()> {
            let searcher = index.reader()?.searcher();
            let ids = id_mapping(&searcher);

            // Try as primitive.
            let top_collector = TopDocs::for_doc_range(doc_range)
                .order_by((SortByString::for_field("city"), order));
            let actual = searcher
                .search(&AllQuery, &top_collector)?
                .into_iter()
                .map(|(sort_key_opt, doc)| (sort_key_opt, ids[&doc]))
                .collect::<Vec<_>>();
            assert_eq!(actual, expected);
            Ok(())
        }

        // Ascending, all documents: the document without a city (id 3) comes last.
        assert_query(
            &index,
            Order::Asc,
            0..4,
            vec![
                (Some("austin".to_owned()), 0),
                (Some("greenville".to_owned()), 1),
                (Some("tokyo".to_owned()), 2),
                (None, 3),
            ],
        )?;

        assert_query(
            &index,
            Order::Asc,
            0..3,
            vec![
                (Some("austin".to_owned()), 0),
                (Some("greenville".to_owned()), 1),
                (Some("tokyo".to_owned()), 2),
            ],
        )?;

        assert_query(
            &index,
            Order::Asc,
            0..2,
            vec![
                (Some("austin".to_owned()), 0),
                (Some("greenville".to_owned()), 1),
            ],
        )?;

        assert_query(
            &index,
            Order::Asc,
            0..1,
            vec![(Some("austin".to_string()), 0)],
        )?;

        // A range that does not start at 0 skips the first hits.
        assert_query(
            &index,
            Order::Asc,
            1..3,
            vec![
                (Some("greenville".to_owned()), 1),
                (Some("tokyo".to_owned()), 2),
            ],
        )?;

        // Descending, all documents: the document without a city still comes last.
        assert_query(
            &index,
            Order::Desc,
            0..4,
            vec![
                (Some("tokyo".to_owned()), 2),
                (Some("greenville".to_owned()), 1),
                (Some("austin".to_owned()), 0),
                (None, 3),
            ],
        )?;

        assert_query(
            &index,
            Order::Desc,
            1..3,
            vec![
                (Some("greenville".to_owned()), 1),
                (Some("austin".to_owned()), 0),
            ],
        )?;

        assert_query(
            &index,
            Order::Desc,
            0..1,
            vec![(Some("tokyo".to_owned()), 2)],
        )?;

        Ok(())
    }

    // Orders the documents of `make_index()` by their `altitude` f64 fast field and
    // checks the top 3 hits in both orders. Results are `(altitude, id)` pairs.
    #[test]
    fn test_order_by_f64() -> crate::Result<()> {
        let index = make_index()?;

        // Runs an `AllQuery` with a `TopDocs` collector limited to 3 hits and ordered by
        // `altitude`, then compares the hits against `expected`.
        fn assert_query(
            index: &Index,
            order: Order,
            expected: Vec<(Option<f64>, u64)>,
        ) -> crate::Result<()> {
            let searcher = index.reader()?.searcher();
            let ids = id_mapping(&searcher);

            // Try as primitive.
            let top_collector = TopDocs::with_limit(3)
                .order_by((SortByStaticFastValue::<f64>::for_field("altitude"), order));
            let actual = searcher
                .search(&AllQuery, &top_collector)?
                .into_iter()
                .map(|(altitude_opt, doc)| (altitude_opt, ids[&doc]))
                .collect::<Vec<_>>();
            assert_eq!(actual, expected);

            Ok(())
        }

        // The three lowest altitudes, lowest first.
        assert_query(
            &index,
            Order::Asc,
            vec![(Some(0.0), 3), (Some(27.0), 1), (Some(40.0), 2)],
        )?;

        // The three highest altitudes, highest first.
        assert_query(
            &index,
            Order::Desc,
            vec![(Some(149.0), 0), (Some(40.0), 2), (Some(27.0), 1)],
        )?;

        Ok(())
    }

    // Orders the hits of the text query "glow" on `catchphrase` by similarity score, in
    // both orders. Only the three documents of `make_index()` whose catchphrase contains
    // "Glow" are expected.
    #[test]
    fn test_order_by_score() -> crate::Result<()> {
        let index = make_index()?;

        // Returns the `(score, id)` pairs of the hits of "glow", ordered by score in the
        // requested `order`.
        fn query(index: &Index, order: Order) -> crate::Result<Vec<(Score, u64)>> {
            let searcher = index.reader()?.searcher();
            let ids = id_mapping(&searcher);

            let top_collector = TopDocs::with_limit(4).order_by((SortBySimilarityScore, order));
            let field = index.schema().get_field("catchphrase").unwrap();
            let query_parser = QueryParser::for_index(index, vec![field]);
            let text_query = query_parser.parse_query("glow")?;

            Ok(searcher
                .search(&text_query, &top_collector)?
                .into_iter()
                .map(|(score, doc)| (score, ids[&doc]))
                .collect())
        }

        // Exact score values are pinned; the ascending result is the reverse of the
        // descending one.
        assert_eq!(
            &query(&index, Order::Desc)?,
            &[(0.5604893, 2), (0.4904281, 1), (0.35667497, 0),]
        );

        assert_eq!(
            &query(&index, Order::Asc)?,
            &[(0.35667497, 0), (0.4904281, 1), (0.5604893, 2),]
        );

        Ok(())
    }

    // Orders by a composite key: similarity score first, then the `city` string.
    // The expected values show every document with a score of 1.0 under `AllQuery`, so
    // the resulting order is decided by the `city` component.
    #[test]
    fn test_order_by_score_then_string() -> crate::Result<()> {
        let index = make_index()?;

        type SortKey = (Score, Option<String>);

        // Returns the `(sort key, id)` pairs of all documents, ordered by score in
        // `score_order`, then by city in `city_order`.
        fn query(
            index: &Index,
            score_order: Order,
            city_order: Order,
        ) -> crate::Result<Vec<(SortKey, u64)>> {
            let searcher = index.reader()?.searcher();
            let ids = id_mapping(&searcher);

            let top_collector = TopDocs::with_limit(4).order_by((
                (SortBySimilarityScore, score_order),
                (SortByString::for_field("city"), city_order),
            ));
            let results: Vec<((Score, Option<String>), DocAddress)> =
                searcher.search(&AllQuery, &top_collector)?;
            Ok(results.into_iter().map(|(f, doc)| (f, ids[&doc])).collect())
        }

        assert_eq!(
            &query(&index, Order::Asc, Order::Asc)?,
            &[
                ((1.0, Some("austin".to_owned())), 0),
                ((1.0, Some("greenville".to_owned())), 1),
                ((1.0, Some("tokyo".to_owned())), 2),
                ((1.0, None), 3),
            ]
        );

        // The document without a city is last for both city orders.
        assert_eq!(
            &query(&index, Order::Asc, Order::Desc)?,
            &[
                ((1.0, Some("tokyo".to_owned())), 2),
                ((1.0, Some("greenville".to_owned())), 1),
                ((1.0, Some("austin".to_owned())), 0),
                ((1.0, None), 3),
            ]
        );
        Ok(())
    }

    // Same scenario as the score-then-string ordering, but the `city` component goes
    // through `SortByErasedType`, so its sort key is an `OwnedValue` and the missing
    // city shows up as `OwnedValue::Null`.
    #[test]
    fn test_order_by_score_then_owned_value() -> crate::Result<()> {
        let index = make_index()?;

        type SortKey = (Score, OwnedValue);

        // Returns the `(sort key, id)` pairs of all documents, ordered by score in
        // `score_order`, then by city in `city_order`.
        fn query(
            index: &Index,
            score_order: Order,
            city_order: Order,
        ) -> crate::Result<Vec<(SortKey, u64)>> {
            let searcher = index.reader()?.searcher();
            let ids = id_mapping(&searcher);

            let top_collector = TopDocs::with_limit(4).order_by::<(Score, OwnedValue)>((
                (SortBySimilarityScore, score_order),
                (SortByErasedType::for_field("city"), city_order),
            ));
            let results: Vec<((Score, OwnedValue), DocAddress)> =
                searcher.search(&AllQuery, &top_collector)?;
            Ok(results.into_iter().map(|(f, doc)| (f, ids[&doc])).collect())
        }

        assert_eq!(
            &query(&index, Order::Asc, Order::Asc)?,
            &[
                ((1.0, OwnedValue::Str("austin".to_owned())), 0),
                ((1.0, OwnedValue::Str("greenville".to_owned())), 1),
                ((1.0, OwnedValue::Str("tokyo".to_owned())), 2),
                ((1.0, OwnedValue::Null), 3),
            ]
        );

        // The `Null` city is last for both city orders.
        assert_eq!(
            &query(&index, Order::Asc, Order::Desc)?,
            &[
                ((1.0, OwnedValue::Str("tokyo".to_owned())), 2),
                ((1.0, OwnedValue::Str("greenville".to_owned())), 1),
                ((1.0, OwnedValue::Str("austin".to_owned())), 0),
                ((1.0, OwnedValue::Null), 3),
            ]
        );
        Ok(())
    }

    use proptest::prelude::*;

    // Property test: for random orders, limits, offsets and per-commit term lists, a
    // `TopDocs` collector ordered by the `city` string fast field must return the same
    // hits as sorting all documents with `sort_hits` and then applying offset and limit.
    proptest! {
    #[test]
    fn test_order_by_string_prop(
          order in prop_oneof!(Just(Order::Desc), Just(Order::Asc)),
          limit in 1..64_usize,
          offset in 0..64_usize,
          segments_terms in
            proptest::collection::vec(
                proptest::collection::vec(0..32_u8, 1..32_usize),
                0..8_usize,
            )
        ) {
            let mut schema_builder = Schema::builder();
            let city = schema_builder.add_text_field("city", TEXT | FAST);
            let schema = schema_builder.build();
            let index = Index::create_in_ram(schema);
            let mut index_writer = index.writer_for_tests()?;

            // A Vec<Vec<u8>>, where the outer Vec represents segments, and the inner Vec
            // represents terms.
            for segment_terms in segments_terms.into_iter() {
                for term in segment_terms.into_iter() {
                    // Left-pad with zeros to a width of 3, so that all terms have the same
                    // length.
                    let term = format!("{term:0>3}");
                    index_writer.add_document(doc!(
                        city => term,
                    ))?;
                }
                // One commit per inner Vec.
                index_writer.commit()?;
            }

            let searcher = index.reader()?.searcher();
            let top_n_results = searcher.search(&AllQuery, &TopDocs::with_limit(limit)
                .and_offset(offset)
                .order_by_string_fast_field("city", order))?;
            // Reference data: every document address paired with its city, read back from
            // the string fast field column.
            let all_results = searcher.search(&AllQuery, &DocSetCollector)?.into_iter().map(|doc_address| {
                // Get the term for this address.
                let column = searcher.segment_readers()[doc_address.segment_ord as usize].fast_fields().str("city").unwrap().unwrap();
                let value = column.term_ords(doc_address.doc_id).next().map(|term_ord| {
                    let mut city = Vec::new();
                    column.dictionary().ord_to_term(term_ord, &mut city).unwrap();
                    String::try_from(city).unwrap()
                });
                (value, doc_address)
            });

            // Using the TopDocs collector should always be equivalent to sorting, skipping the
            // offset, and then taking the limit.
            let sorted_docs: Vec<_> = {
                let mut comparable_docs: Vec<ComparableDoc<_, _>> =
                    all_results.into_iter().map(|(sort_key, doc)| ComparableDoc { sort_key, doc}).collect();
                sort_hits(&mut comparable_docs, order);
                comparable_docs.into_iter().map(|cd| (cd.sort_key, cd.doc)).collect()
            };
            let expected_docs = sorted_docs.into_iter().skip(offset).take(limit).collect::<Vec<_>>();
            prop_assert_eq!(
                expected_docs,
                top_n_results
            );
        }
    }
}


================================================
FILE: src/collector/sort_key/order.rs
================================================
use std::cmp::Ordering;

use columnar::MonotonicallyMappableToU64;
use serde::{Deserialize, Serialize};

use crate::collector::{SegmentSortKeyComputer, SortKeyComputer};
use crate::schema::{OwnedValue, Schema};
use crate::{DocId, Order, Score};

/// Total order over `OwnedValue`s used by the `OwnedValue` comparators.
///
/// - `Null` is ordered before every other value when `NULLS_FIRST` is true, after every
///   other value otherwise. Two `Null`s are equal.
/// - Values of the same variant use the natural order of their payload; floats are
///   compared through their monotonic `u64` mapping.
/// - `U64`/`I64`/`F64` are compared numerically across variants (integers are converted
///   to `f64` when compared with a float).
/// - Any other pair of distinct variants is ordered by discriminant.
///
/// # Panics
///
/// Panics if both values share a variant that has no dedicated comparison in this function.
fn compare_owned_value<const NULLS_FIRST: bool>(lhs: &OwnedValue, rhs: &OwnedValue) -> Ordering {
    // Result of comparing a null (left) against a non-null value (right).
    let null_vs_value = if NULLS_FIRST {
        Ordering::Less
    } else {
        Ordering::Greater
    };
    match (lhs, rhs) {
        // Nulls.
        (OwnedValue::Null, OwnedValue::Null) => Ordering::Equal,
        (OwnedValue::Null, _) => null_vs_value,
        (_, OwnedValue::Null) => null_vs_value.reverse(),

        // Same variant on both sides.
        (OwnedValue::Str(a), OwnedValue::Str(b)) => a.cmp(b),
        (OwnedValue::PreTokStr(a), OwnedValue::PreTokStr(b)) => a.cmp(b),
        (OwnedValue::U64(a), OwnedValue::U64(b)) => a.cmp(b),
        (OwnedValue::I64(a), OwnedValue::I64(b)) => a.cmp(b),
        (OwnedValue::F64(a), OwnedValue::F64(b)) => a.to_u64().cmp(&b.to_u64()),
        (OwnedValue::Bool(a), OwnedValue::Bool(b)) => a.cmp(b),
        (OwnedValue::Date(a), OwnedValue::Date(b)) => a.cmp(b),
        (OwnedValue::Facet(a), OwnedValue::Facet(b)) => a.cmp(b),
        (OwnedValue::Bytes(a), OwnedValue::Bytes(b)) => a.cmp(b),
        (OwnedValue::IpAddr(a), OwnedValue::IpAddr(b)) => a.cmp(b),

        // Unsigned vs signed integers: a negative i64 is below any u64; otherwise the
        // i64 fits in a u64 and both can be compared as u64.
        (OwnedValue::U64(_), OwnedValue::I64(b)) if *b < 0 => Ordering::Greater,
        (OwnedValue::U64(a), OwnedValue::I64(b)) => a.cmp(&(*b as u64)),
        (OwnedValue::I64(a), OwnedValue::U64(_)) if *a < 0 => Ordering::Less,
        (OwnedValue::I64(a), OwnedValue::U64(b)) => (*a as u64).cmp(b),

        // Integers vs floats: the integer is converted to f64 first.
        (OwnedValue::U64(a), OwnedValue::F64(b)) => (*a as f64).to_u64().cmp(&b.to_u64()),
        (OwnedValue::F64(a), OwnedValue::U64(b)) => a.to_u64().cmp(&(*b as f64).to_u64()),
        (OwnedValue::I64(a), OwnedValue::F64(b)) => (*a as f64).to_u64().cmp(&b.to_u64()),
        (OwnedValue::F64(a), OwnedValue::I64(b)) => a.to_u64().cmp(&(*b as f64).to_u64()),

        // Everything else: fall back to the order of the variants themselves.
        (a, b) => {
            let discriminant_order = a.discriminant_value().cmp(&b.discriminant_value());
            // Equal discriminants here mean that a variant was added to `OwnedValue`
            // without a matching same-variant arm above.
            assert!(
                discriminant_order != Ordering::Equal,
                "Unimplemented comparison for type of {a:?}, {b:?}"
            );
            discriminant_order
        }
    }
}

/// Comparator trait defining the order in which documents should be ordered.
///
/// A comparator is a stateless-looking strategy object (it must be `Default`) that
/// compares two sort keys of type `T`.
pub trait Comparator<T>: Send + Sync + std::fmt::Debug + Default {
    /// Return the order between two values: `Ordering::Less` if `lhs` is ordered before
    /// `rhs` by this comparator, `Ordering::Greater` if it is ordered after, and
    /// `Ordering::Equal` otherwise.
    fn compare(&self, lhs: &T, rhs: &T) -> Ordering;
}

/// Compare values naturally (e.g. 1 < 2).
///
/// When used with `TopDocs`, which reverses the order, this results in a
/// "Descending" sort (Greatest values first).
///
/// `None` (or Null for `OwnedValue`) values are considered to be smaller than any other value,
/// and will therefore appear last in a descending sort (e.g. `[Some(20), Some(10), None]`).
///
/// For `PartialOrd` types, two values that cannot be ordered relative to each other
/// (for instance a float NaN and any other float) are treated as equal.
#[derive(Debug, Copy, Clone, Default, Serialize, Deserialize)]
pub struct NaturalComparator;

/// Natural comparison for any `PartialOrd` type.
impl<T: PartialOrd> Comparator<T> for NaturalComparator {
    #[inline(always)]
    fn compare(&self, lhs: &T, rhs: &T) -> Ordering {
        match lhs.partial_cmp(rhs) {
            Some(ordering) => ordering,
            // Values without a defined relative order are treated as equal.
            None => Ordering::Equal,
        }
    }
}

/// A (partial) implementation of comparison for OwnedValue.
///
/// Intended for use within columns of homogenous types. `Null` is ordered before every
/// other value, and `U64`/`I64`/`F64` values are compared numerically with each other.
/// Other values of mismatched types do not panic: `compare_owned_value` orders them by
/// their discriminant. A panic only happens when both values share a variant for which
/// `compare_owned_value` defines no comparison.
impl Comparator<OwnedValue> for NaturalComparator {
    #[inline(always)]
    fn compare(&self, lhs: &OwnedValue, rhs: &OwnedValue) -> Ordering {
        compare_owned_value::</* NULLS_FIRST= */ true>(lhs, rhs)
    }
}

/// Compare values in reverse (e.g. 2 < 1).
///
/// When used with `TopDocs`, which reverses the order, this results in an
/// "Ascending" sort (Smallest values first).
///
/// `None` is considered smaller than `Some` in the underlying comparator, but because the
/// comparison is reversed, `None` is effectively treated as the lowest value in the resulting
/// Ascending sort (e.g. `[None, Some(10), Some(20)]`).
///
/// The ReverseComparator does not necessarily imply that the sort order is reversed compared
/// to the NaturalComparator. In presence of a tie on the sort key, documents will always be
/// sorted by ascending `DocId`/`DocAddress` in TopN results, regardless of the sort key's order.
///
/// It is available for every type supported by `NaturalComparator`, and is implemented
/// by calling `NaturalComparator` with its two arguments swapped.
#[derive(Debug, Copy, Clone, Default, Serialize, Deserialize)]
pub struct ReverseComparator;

/// Reverse comparison for every type `NaturalComparator` can compare.
impl<T> Comparator<T> for ReverseComparator
where NaturalComparator: Comparator<T>
{
    #[inline(always)]
    fn compare(&self, lhs: &T, rhs: &T) -> Ordering {
        // Swapping the operands reverses the natural order.
        <NaturalComparator as Comparator<T>>::compare(&NaturalComparator, rhs, lhs)
    }
}

/// Compare values in reverse, but treating `None` as lower than `Some`.
///
/// When used with `TopDocs`, which reverses the order, this results in an
/// "Ascending" sort (Smallest values first), but with `None` values appearing last
/// (e.g. `[Some(10), Some(20), None]`).
///
/// This is usually what is wanted when sorting by a field in an ascending order.
/// For instance, in an e-commerce website, if sorting by price ascending,
/// the cheapest items would appear first, and items without a price would appear last.
///
/// For non-optional keys (`u32`, `u64`, `i64`, `f32`, `f64`, `String`) this comparator
/// behaves exactly like `ReverseComparator`.
// NOTE(review): unlike the sibling comparators, this type does not derive
// `Serialize`/`Deserialize` — confirm whether this is intentional.
#[derive(Debug, Copy, Clone, Default)]
pub struct ReverseNoneIsLowerComparator;

/// Optional keys: `None` is below every `Some`, and two `Some`s are compared in reverse.
impl<T> Comparator<Option<T>> for ReverseNoneIsLowerComparator
where ReverseComparator: Comparator<T>
{
    #[inline(always)]
    fn compare(&self, lhs_opt: &Option<T>, rhs_opt: &Option<T>) -> Ordering {
        let (Some(lhs), Some(rhs)) = (lhs_opt, rhs_opt) else {
            // At least one side is `None`. Comparing presence flags (`false < true`)
            // yields: None == None, None < Some, Some > None.
            return lhs_opt.is_some().cmp(&rhs_opt.is_some());
        };
        ReverseComparator.compare(lhs, rhs)
    }
}

impl Comparator<u32> for ReverseNoneIsLowerComparator {
    #[inline(always)]
    fn compare(&self, lhs: &u32, rhs: &u32) -> Ordering {
        ReverseComparator.compare(lhs, rhs)
    }
}

impl Comparator<u64> for ReverseNoneIsLowerComparator {
    #[inline(always)]
    fn compare(&self, lhs: &u64, rhs: &u64) -> Ordering {
        ReverseComparator.compare(lhs, rhs)
    }
}

impl Comparator<f64> for ReverseNoneIsLowerComparator {
    #[inline(always)]
    fn compare(&self, lhs: &f64, rhs: &f64) -> Ordering {
        ReverseComparator.compare(lhs, rhs)
    }
}

impl Comparator<f32> for ReverseNoneIsLowerComparator {
    #[inline(always)]
    fn compare(&self, lhs: &f32, rhs: &f32) -> Ordering {
        ReverseComparator.compare(lhs, rhs)
    }
}

impl Comparator<i64> for ReverseNoneIsLowerComparator {
    #[inline(always)]
    fn compare(&self, lhs: &i64, rhs: &i64) -> Ordering {
        ReverseComparator.compare(lhs, rhs)
    }
}

impl Comparator<String> for ReverseNoneIsLowerComparator {
    #[inline(always)]
    fn compare(&self, lhs: &String, rhs: &String) -> Ordering {
        ReverseComparator.compare(lhs, rhs)
    }
}

impl Comparator<OwnedValue> for ReverseNoneIsLowerComparator {
    /// Compares two [`OwnedValue`]s in reverse order by delegating to `compare_owned_value`
    /// with swapped operands.
    #[inline(always)]
    fn compare(&self, lhs: &OwnedValue, rhs: &OwnedValue) -> Ordering {
        // Flag forwarded to `compare_owned_value`; its exact effect on nulls is defined there.
        const NULLS_FIRST: bool = false;
        compare_owned_value::<{ NULLS_FIRST }>(rhs, lhs)
    }
}

/// Natural comparison in which `None` always ranks above `Some`.
///
/// `TopDocs` reverses the comparator order, so using this comparator yields a
/// "Descending" sort (greatest values first) in which the `None` values come first
/// (e.g. `[None, Some(20), Some(10)]`).
#[derive(Clone, Copy, Debug, Default, Deserialize, Serialize)]
pub struct NaturalNoneIsHigherComparator;

impl<T> Comparator<Option<T>> for NaturalNoneIsHigherComparator
where NaturalComparator: Comparator<T>
{
    /// Compares two optional values: present values are compared with [`NaturalComparator`],
    /// and `None` ranks above any `Some`.
    #[inline(always)]
    fn compare(&self, lhs_opt: &Option<T>, rhs_opt: &Option<T>) -> Ordering {
        if let (Some(lhs), Some(rhs)) = (lhs_opt, rhs_opt) {
            return NaturalComparator.compare(lhs, rhs);
        }
        // At least one side is `None`. Since `false < true`, comparing the absence flags makes
        // `None` higher than `Some`, and two `None`s equal.
        lhs_opt.is_none().cmp(&rhs_opt.is_none())
    }
}

impl Comparator<u32> for NaturalNoneIsHigherComparator {
    #[inline(always)]
    fn compare(&self, lhs: &u32, rhs: &u32) -> Ordering {
        NaturalComparator.compare(lhs, rhs)
    }
}

impl Comparator<u64> for NaturalNoneIsHigherComparator {
    #[inline(always)]
    fn compare(&self, lhs: &u64, rhs: &u64) -> Ordering {
        NaturalComparator.compare(lhs, rhs)
    }
}

impl Comparator<f64> for NaturalNoneIsHigherComparator {
    #[inline(always)]
    fn compare(&self, lhs: &f64, rhs: &f64) -> Ordering {
        NaturalComparator.compare(lhs, rhs)
    }
}

impl Comparator<f32> for NaturalNoneIsHigherComparator {
    #[inline(always)]
    fn compare(&self, lhs: &f32, rhs: &f32) -> Ordering {
        NaturalComparator.compare(lhs, rhs)
    }
}

impl Comparator<i64> for NaturalNoneIsHigherComparator {
    #[inline(always)]
    fn compare(&self, lhs: &i64, rhs: &i64) -> Ordering {
        NaturalComparator.compare(lhs, rhs)
    }
}

impl Comparator<String> for NaturalNoneIsHigherComparator {
    #[inline(always)]
    fn compare(&self, lhs: &String, rhs: &String) -> Ordering {
        NaturalComparator.compare(lhs, rhs)
    }
}

impl Comparator<OwnedValue> for NaturalNoneIsHigherComparator {
    /// Compares two [`OwnedValue`]s in natural order by delegating to `compare_owned_value`.
    #[inline(always)]
    fn compare(&self, lhs: &OwnedValue, rhs: &OwnedValue) -> Ordering {
        // Flag forwarded to `compare_owned_value`; its exact effect on nulls is defined there.
        const NULLS_FIRST: bool = false;
        compare_owned_value::<{ NULLS_FIRST }>(lhs, rhs)
    }
}

/// An enum representing the different sort orders.
///
/// Each variant dispatches to the comparator type of the matching name, which makes it possible
/// to pick the sort order at runtime. `Natural` is the default variant.
#[derive(Debug, Clone, Copy, Eq, PartialEq, Default)]
pub enum ComparatorEnum {
    /// Natural order (See [NaturalComparator])
    #[default]
    Natural,
    /// Reverse order (See [ReverseComparator])
    Reverse,
    /// Reverse order by treating None as the lowest value. (See [ReverseNoneIsLowerComparator])
    ReverseNoneLower,
    /// Natural order but treating None as the highest value. (See [NaturalNoneIsHigherComparator])
    NaturalNoneHigher,
}

impl From<Order> for ComparatorEnum {
    /// Maps a sort [`Order`] to the comparator implementing it: descending order uses the
    /// natural comparator, ascending order uses the reverse comparator treating `None` as the
    /// lowest value.
    fn from(order: Order) -> Self {
        match order {
            Order::Desc => Self::Natural,
            Order::Asc => Self::ReverseNoneLower,
        }
    }
}

impl<T> Comparator<T> for ComparatorEnum
where
    ReverseNoneIsLowerComparator: Comparator<T>,
    NaturalComparator: Comparator<T>,
    ReverseComparator: Comparator<T>,
    NaturalNoneIsHigherComparator: Comparator<T>,
{
    /// Compares `lhs` and `rhs` with the comparator designated by the current variant.
    #[inline(always)]
    fn compare(&self, lhs: &T, rhs: &T) -> Ordering {
        match *self {
            Self::Natural => NaturalComparator.compare(lhs, rhs),
            Self::NaturalNoneHigher => NaturalNoneIsHigherComparator.compare(lhs, rhs),
            Self::Reverse => ReverseComparator.compare(lhs, rhs),
            Self::ReverseNoneLower => ReverseNoneIsLowerComparator.compare(lhs, rhs),
        }
    }
}

impl<Head, Tail, LeftComparator, RightComparator> Comparator<(Head, Tail)>
    for (LeftComparator, RightComparator)
where
    LeftComparator: Comparator<Head>,
    RightComparator: Comparator<Tail>,
{
    /// Lexicographic comparison of pairs: the right comparator is only consulted when the left
    /// comparator reports a tie.
    #[inline(always)]
    fn compare(&self, lhs: &(Head, Tail), rhs: &(Head, Tail)) -> Ordering {
        let (left_comparator, right_comparator) = self;
        let (lhs_head, lhs_tail) = lhs;
        let (rhs_head, rhs_tail) = rhs;
        match left_comparator.compare(lhs_head, rhs_head) {
            Ordering::Equal => right_comparator.compare(lhs_tail, rhs_tail),
            decided => decided,
        }
    }
}

impl<Type1, Type2, Type3, Comparator1, Comparator2, Comparator3> Comparator<(Type1, (Type2, Type3))>
    for (Comparator1, Comparator2, Comparator3)
where
    Comparator1: Comparator<Type1>,
    Comparator2: Comparator<Type2>,
    Comparator3: Comparator<Type3>,
{
    /// Lexicographic comparison of right-nested triples `(a, (b, c))`: each comparator is only
    /// consulted when all the previous ones reported a tie.
    #[inline(always)]
    fn compare(&self, lhs: &(Type1, (Type2, Type3)), rhs: &(Type1, (Type2, Type3))) -> Ordering {
        let (comparator1, comparator2, comparator3) = self;
        let (lhs1, (lhs2, lhs3)) = lhs;
        let (rhs1, (rhs2, rhs3)) = rhs;

        let first = comparator1.compare(lhs1, rhs1);
        if first != Ordering::Equal {
            return first;
        }
        let second = comparator2.compare(lhs2, rhs2);
        if second != Ordering::Equal {
            return second;
        }
        comparator3.compare(lhs3, rhs3)
    }
}

impl<Type1, Type2, Type3, Comparator1, Comparator2, Comparator3> Comparator<(Type1, Type2, Type3)>
    for (Comparator1, Comparator2, Comparator3)
where
    Comparator1: Comparator<Type1>,
    Comparator2: Comparator<Type2>,
    Comparator3: Comparator<Type3>,
{
    /// Lexicographic comparison of flat triples `(a, b, c)`: each comparator is only consulted
    /// when all the previous ones reported a tie.
    #[inline(always)]
    fn compare(&self, lhs: &(Type1, Type2, Type3), rhs: &(Type1, Type2, Type3)) -> Ordering {
        match self.0.compare(&lhs.0, &rhs.0) {
            Ordering::Equal => match self.1.compare(&lhs.1, &rhs.1) {
                Ordering::Equal => self.2.compare(&lhs.2, &rhs.2),
                decided => decided,
            },
            decided => decided,
        }
    }
}

impl<Type1, Type2, Type3, Type4, Comparator1, Comparator2, Comparator3, Comparator4>
    Comparator<(Type1, (Type2, (Type3, Type4)))>
    for (Comparator1, Comparator2, Comparator3, Comparator4)
where
    Comparator1: Comparator<Type1>,
    Comparator2: Comparator<Type2>,
    Comparator3: Comparator<Type3>,
    Comparator4: Comparator<Type4>,
{
    /// Lexicographic comparison of right-nested quadruples `(a, (b, (c, d)))`: each comparator
    /// is only consulted when all the previous ones reported a tie.
    #[inline(always)]
    fn compare(
        &self,
        lhs: &(Type1, (Type2, (Type3, Type4))),
        rhs: &(Type1, (Type2, (Type3, Type4))),
    ) -> Ordering {
        let (comparator1, comparator2, comparator3, comparator4) = self;
        let (lhs1, (lhs2, (lhs3, lhs4))) = lhs;
        let (rhs1, (rhs2, (rhs3, rhs4))) = rhs;

        let first = comparator1.compare(lhs1, rhs1);
        if first != Ordering::Equal {
            return first;
        }
        let second = comparator2.compare(lhs2, rhs2);
        if second != Ordering::Equal {
            return second;
        }
        let third = comparator3.compare(lhs3, rhs3);
        if third != Ordering::Equal {
            return third;
        }
        comparator4.compare(lhs4, rhs4)
    }
}

impl<Type1, Type2, Type3, Type4, Comparator1, Comparator2, Comparator3, Comparator4>
    Comparator<(Type1, Type2, Type3, Type4)>
    for (Comparator1, Comparator2, Comparator3, Comparator4)
where
    Comparator1: Comparator<Type1>,
    Comparator2: Comparator<Type2>,
    Comparator3: Comparator<Type3>,
    Comparator4: Comparator<Type4>,
{
    /// Lexicographic comparison of flat quadruples `(a, b, c, d)`: each comparator is only
    /// consulted when all the previous ones reported a tie.
    #[inline(always)]
    fn compare(
        &self,
        lhs: &(Type1, Type2, Type3, Type4),
        rhs: &(Type1, Type2, Type3, Type4),
    ) -> Ordering {
        match self.0.compare(&lhs.0, &rhs.0) {
            Ordering::Equal => {}
            decided => return decided,
        }
        match self.1.compare(&lhs.1, &rhs.1) {
            Ordering::Equal => {}
            decided => return decided,
        }
        match self.2.compare(&lhs.2, &rhs.2) {
            Ordering::Equal => {}
            decided => return decided,
        }
        self.3.compare(&lhs.3, &rhs.3)
    }
}

/// A `(sort key computer, comparator)` pair is itself a sort key computer: keys are produced by
/// the wrapped computer and ordered by the given [`ComparatorEnum`].
impl<TSortKeyComputer> SortKeyComputer for (TSortKeyComputer, ComparatorEnum)
where
    TSortKeyComputer: SortKeyComputer,
    ComparatorEnum: Comparator<TSortKeyComputer::SortKey>,
    ComparatorEnum: Comparator<
        <<TSortKeyComputer as SortKeyComputer>::Child as SegmentSortKeyComputer>::SegmentSortKey,
    >,
{
    type SortKey = TSortKeyComputer::SortKey;

    type Child = SegmentSortKeyComputerWithComparator<TSortKeyComputer::Child, Self::Comparator>;

    type Comparator = ComparatorEnum;

    fn check_schema(&self, schema: &Schema) -> crate::Result<()> {
        let (sort_key_computer, _comparator) = self;
        sort_key_computer.check_schema(schema)
    }

    fn requires_scoring(&self) -> bool {
        let (sort_key_computer, _comparator) = self;
        sort_key_computer.requires_scoring()
    }

    fn comparator(&self) -> Self::Comparator {
        let (_sort_key_computer, comparator) = self;
        *comparator
    }

    fn segment_sort_key_computer(
        &self,
        segment_reader: &crate::SegmentReader,
    ) -> crate::Result<Self::Child> {
        // Build the wrapped segment computer first; the comparator is only attached on success.
        let segment_sort_key_computer = self.0.segment_sort_key_computer(segment_reader)?;
        let comparator = self.comparator();
        Ok(SegmentSortKeyComputerWithComparator {
            segment_sort_key_computer,
            comparator,
        })
    }
}

impl<TSortKeyComputer> SortKeyComputer for (TSortKeyComputer, Order)
where
    TSortKeyComputer: SortKeyComputer,
    ComparatorEnum: Comparator<TSortKeyComputer::SortKey>,
    ComparatorEnum: Comparator<
        <<TSortKeyComputer as SortKeyComputer>::Child as SegmentSortKeyComputer>::SegmentSortKey,
    >,
{
    type SortKey = TSortKeyComputer::SortKey;

    type Child = SegmentSortKeyComputerWithComparator<TSortKeyComputer::Child, Self::Comparator>;

    type Comparator = ComparatorEnum;

    fn check_schema(&self, schema: &Schema) -> crate::Result<()> {
        self.0.check_schema(schema)
    }

    fn requires_scoring(&self) -> bool {
        self.0.requires_scoring()
    }

    fn comparator(&self) -> Self::Comparator {
        self.1.into()
    }

    fn segment_sort_key_computer(
        &self,
        segment_reader: &crate::SegmentReader,
    ) -> crate::Result<Self::Child> {
        let child = self.0.segment_sort_key_computer(segment_reader)?;
        Ok(SegmentSortKeyComputerWithComparator {
            segment_sort_key_computer: child,
            comparator: self.comparator(),
        })
    }
}

/// A segment sort key computer with a custom ordering.
///
/// Sort key computation and conversion are delegated to the wrapped segment sort key computer,
/// while segment sort keys are compared with the attached comparator.
pub struct SegmentSortKeyComputerWithComparator<TSegmentSortKeyComputer, TComparator> {
    // Wrapped computer producing and converting the segment sort keys.
    segment_sort_key_computer: TSegmentSortKeyComputer,
    // Comparator used to order the segment sort keys.
    comparator: TComparator,
}

impl<TSegmentSortKeyComputer, TSegmentSortKey, TComparator> SegmentSortKeyComputer
    for SegmentSortKeyComputerWithComparator<TSegmentSortKeyComputer, TComparator>
where
    TSegmentSortKeyComputer: SegmentSortKeyComputer<SegmentSortKey = TSegmentSortKey>,
    TSegmentSortKey: Clone + 'static + Sync + Send,
    TComparator: Comparator<TSegmentSortKey> + 'static + Sync + Send,
{
    type SortKey = TSegmentSortKeyComputer::SortKey;
    type SegmentSortKey = TSegmentSortKey;
    type SegmentComparator = TComparator;

    /// Delegates the computation of the segment sort key to the wrapped computer.
    fn segment_sort_key(&mut self, doc: DocId, score: Score) -> Self::SegmentSortKey {
        let Self {
            segment_sort_key_computer,
            ..
        } = self;
        segment_sort_key_computer.segment_sort_key(doc, score)
    }

    /// Orders two segment sort keys with the attached comparator.
    #[inline(always)]
    fn compare_segment_sort_key(
        &self,
        left: &Self::SegmentSortKey,
        right: &Self::SegmentSortKey,
    ) -> Ordering {
        let Self { comparator, .. } = self;
        comparator.compare(left, right)
    }

    /// Delegates the conversion of the segment sort key to the wrapped computer.
    fn convert_segment_sort_key(&self, sort_key: Self::SegmentSortKey) -> Self::SortKey {
        let Self {
            segment_sort_key_computer,
            ..
        } = self;
        segment_sort_key_computer.convert_segment_sort_key(sort_key)
    }
}

// Unit tests for the comparators defined in this module.
#[cfg(test)]
mod tests {
    use super::*;
    use crate::schema::OwnedValue;

    // Checks the ordering of `Option<u64>` values under `NaturalNoneIsHigherComparator`.
    #[test]
    fn test_natural_none_is_higher() {
        let comp = NaturalNoneIsHigherComparator;
        let null = None;
        let v1 = Some(1_u64);
        let v2 = Some(2_u64);

        // NaturalNoneIsHigherComparator logic:
        // 1. Delegates to NaturalComparator for non-nulls.
        // NaturalComparator compare(2, 1) -> 2.cmp(1) -> Greater.
        assert_eq!(comp.compare(&v2, &v1), Ordering::Greater);

        // 2. Treats None (Null) as Greater than any value.
        // compare(None, Some(2)) should be Greater.
        assert_eq!(comp.compare(&null, &v2), Ordering::Greater);

        // compare(Some(1), None) should be Less.
        assert_eq!(comp.compare(&v1, &null), Ordering::Less);

        // compare(None, None) should be Equal.
        assert_eq!(comp.compare(&null, &null), Ordering::Equal);
    }

    // Checks that `NaturalComparator` compares `OwnedValue`s of different variants: numeric
    // variants holding the same number are equal, and strings sort below numbers.
    #[test]
    fn test_mixed_ownedvalue_compare() {
        let u = OwnedValue::U64(10);
        let i = OwnedValue::I64(10);
        let f = OwnedValue::F64(10.0);

        let nc = NaturalComparator;
        assert_eq!(nc.compare(&u, &i), Ordering::Equal);
        assert_eq!(nc.compare(&u, &f), Ordering::Equal);
        assert_eq!(nc.compare(&i, &f), Ordering::Equal);

        let u2 = OwnedValue::U64(11);
        assert_eq!(nc.compare(&u2, &f), Ordering::Greater);

        let s = OwnedValue::Str("a".to_string());
        // Str < U64
        assert_eq!(nc.compare(&s, &u), Ordering::Less);
        // Str < I64
        assert_eq!(nc.compare(&s, &i), Ordering::Less);
        // Str < F64
        assert_eq!(nc.compare(&s, &f), Ordering::Less);
    }
}


================================================
FILE: src/collector/sort_key/sort_by_bytes.rs
================================================
use columnar::BytesColumn;

use crate::collector::sort_key::NaturalComparator;
use crate::collector::{SegmentSortKeyComputer, SortKeyComputer};
use crate::termdict::TermOrdinal;
use crate::{DocId, Score};

/// Sort key computer ordering documents by the first value of a bytes column.
///
/// For a multivalued field, only the first value takes part in the sort.
///
/// Documents without a value for the column are not discarded:
/// their sort key is simply `None`.
#[derive(Clone, Debug)]
pub struct SortByBytes {
    // Name of the bytes fast field column to sort by.
    column_name: String,
}

impl SortByBytes {
    /// Creates a new sort by bytes sort key computer for the column named `column_name`.
    pub fn for_field(column_name: impl ToString) -> Self {
        let column_name = column_name.to_string();
        Self { column_name }
    }
}

impl SortKeyComputer for SortByBytes {
    type SortKey = Option<Vec<u8>>;
    type Child = ByBytesColumnSegmentSortKeyComputer;
    type Comparator = NaturalComparator;

    /// Opens the bytes column of the segment and wraps it in a segment-level computer.
    ///
    /// The column lookup may yield no column, in which case the child computer holds `None`.
    ///
    /// # Errors
    ///
    /// Propagates the error returned by the fast field reader when the column lookup fails.
    fn segment_sort_key_computer(
        &self,
        segment_reader: &crate::SegmentReader,
    ) -> crate::Result<Self::Child> {
        let fast_fields = segment_reader.fast_fields();
        let bytes_column_opt = fast_fields.bytes(&self.column_name)?;
        let segment_computer = ByBytesColumnSegmentSortKeyComputer { bytes_column_opt };
        Ok(segment_computer)
    }
}

/// Segment-level sort key computer for bytes columns.
///
/// Within a segment, documents are sorted by the term ordinal of their first value; the ordinal
/// is only resolved to the actual bytes when the segment sort key is converted.
pub struct ByBytesColumnSegmentSortKeyComputer {
    // Bytes column of the segment, or `None` if the lookup returned no column.
    bytes_column_opt: Option<BytesColumn>,
}

impl SegmentSortKeyComputer for ByBytesColumnSegmentSortKeyComputer {
    type SortKey = Option<Vec<u8>>;
    type SegmentSortKey = Option<TermOrdinal>;
    type SegmentComparator = NaturalComparator;

    /// Returns the term ordinal of the first value of `doc`, or `None` when the segment has no
    /// such column or the column yields no first value for `doc`.
    #[inline(always)]
    fn segment_sort_key(&mut self, doc: DocId, _score: Score) -> Option<TermOrdinal> {
        self.bytes_column_opt
            .as_ref()
            .and_then(|bytes_column| bytes_column.ords().first(doc))
    }

    /// Resolves a term ordinal to its bytes through the column dictionary.
    ///
    /// Returns `None` if there is no ordinal, no column, or if the dictionary lookup fails.
    fn convert_segment_sort_key(&self, term_ord_opt: Option<TermOrdinal>) -> Option<Vec<u8>> {
        // TODO: Individual lookups to the dictionary like this are very likely to repeatedly
        // decompress the same blocks. See https://github.com/quickwit-oss/tantivy/issues/2776
        match (term_ord_opt, self.bytes_column_opt.as_ref()) {
            (Some(term_ord), Some(bytes_column)) => {
                let mut term_bytes = Vec::new();
                let lookup = bytes_column
                    .dictionary()
                    .ord_to_term(term_ord, &mut term_bytes);
                // A failed lookup is reported as a missing value rather than as an error.
                lookup.ok().map(|_| term_bytes)
            }
            _ => None,
        }
    }
}

// End-to-end tests checking the order of the results returned by `TopDocs` when sorting with
// `SortByBytes`.
#[cfg(test)]
mod tests {
    use super::SortByBytes;
    use crate::collector::TopDocs;
    use crate::query::AllQuery;
    use crate::schema::{BytesOptions, Schema, FAST, INDEXED};
    use crate::{Index, IndexWriter, Order, TantivyDocument};

    // Sorting with `Order::Asc` must return the byte values from smallest to greatest.
    #[test]
    fn test_sort_by_bytes_asc() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let bytes_field = schema_builder
            .add_bytes_field("data", BytesOptions::default().set_fast().set_indexed());
        let id_field = schema_builder.add_u64_field("id", FAST | INDEXED);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut index_writer: IndexWriter = index.writer_for_tests()?;

        // Insert documents with byte values in non-sorted order
        let test_data: Vec<(u64, Vec<u8>)> = vec![
            (1, vec![0x02, 0x00]),
            (2, vec![0x00, 0x10]),
            (3, vec![0x01, 0x00]),
            (4, vec![0x00, 0x20]),
        ];

        for (id, bytes) in &test_data {
            let mut doc = TantivyDocument::new();
            doc.add_u64(id_field, *id);
            doc.add_bytes(bytes_field, bytes);
            index_writer.add_document(doc)?;
        }
        index_writer.commit()?;

        let reader = index.reader()?;
        let searcher = reader.searcher();

        // Sort ascending by bytes
        let top_docs =
            TopDocs::with_limit(10).order_by((SortByBytes::for_field("data"), Order::Asc));
        let results: Vec<(Option<Vec<u8>>, _)> = searcher.search(&AllQuery, &top_docs)?;

        // Expected order: [0x00,0x10], [0x00,0x20], [0x01,0x00], [0x02,0x00]
        let sorted_bytes: Vec<Option<Vec<u8>>> = results.into_iter().map(|(b, _)| b).collect();
        assert_eq!(
            sorted_bytes,
            vec![
                Some(vec![0x00, 0x10]),
                Some(vec![0x00, 0x20]),
                Some(vec![0x01, 0x00]),
                Some(vec![0x02, 0x00]),
            ]
        );

        Ok(())
    }

    // Sorting with `Order::Desc` must return the byte values from greatest to smallest.
    #[test]
    fn test_sort_by_bytes_desc() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let bytes_field = schema_builder
            .add_bytes_field("data", BytesOptions::default().set_fast().set_indexed());
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut index_writer: IndexWriter = index.writer_for_tests()?;

        // Byte values are inserted in non-sorted order.
        let test_data: Vec<Vec<u8>> = vec![vec![0x00, 0x10], vec![0x02, 0x00], vec![0x01, 0x00]];

        for bytes in &test_data {
            let mut doc = TantivyDocument::new();
            doc.add_bytes(bytes_field, bytes);
            index_writer.add_document(doc)?;
        }
        index_writer.commit()?;

        let reader = index.reader()?;
        let searcher = reader.searcher();

        // Sort descending by bytes
        let top_docs =
            TopDocs::with_limit(10).order_by((SortByBytes::for_field("data"), Order::Desc));
        let results: Vec<(Option<Vec<u8>>, _)> = searcher.search(&AllQuery, &top_docs)?;

        // Expected order (descending): [0x02,0x00], [0x01,0x00], [0x00,0x10]
        let sorted_bytes: Vec<Option<Vec<u8>>> = results.into_iter().map(|(b, _)| b).collect();
        assert_eq!(
            sorted_bytes,
            vec![
                Some(vec![0x02, 0x00]),
                Some(vec![0x01, 0x00]),
                Some(vec![0x00, 0x10]),
            ]
        );

        Ok(())
    }
}


================================================
FILE: src/collector/sort_key/sort_by_erased_type.rs
================================================
use columnar::{ColumnType, MonotonicallyMappableToU64};

use crate::collector::sort_key::{
    NaturalComparator, SortByBytes, SortBySimilarityScore, SortByStaticFastValue, SortByString,
};
use crate::collector::{SegmentSortKeyComputer, SortKeyComputer};
use crate::fastfield::FastFieldNotAvailableError;
use crate::schema::OwnedValue;
use crate::{DateTime, DocId, Score};

/// Sort by the boxed / OwnedValue representation of a fast field or of the score.
///
/// Going through the OwnedValue representation erases the type of the sort key, which is useful
/// when the sort order is only known at runtime. This flexibility has a performance cost:
/// whenever possible, prefer a SortKeyComputer implementation whose key type is known at compile
/// time.
#[derive(Clone, Debug)]
pub enum SortByErasedType {
    /// Sort by the fast field column with the given name
    Field(String),
    /// Sort by score
    Score,
}

impl SortByErasedType {
    /// Creates a new type-erased sort key computer sorting by the fast field column named
    /// `column_name`.
    pub fn for_field(column_name: impl ToString) -> Self {
        let column_name = column_name.to_string();
        SortByErasedType::Field(column_name)
    }

    /// Creates a new type-erased sort key computer sorting by score.
    pub fn for_score() -> Self {
        SortByErasedType::Score
    }
}

/// Internal trait used for type erasure: it is used as a boxed trait object so that segment
/// sort key computers with different key types can be handled uniformly.
///
/// Segment sort keys are exchanged as `Option<u64>` and final sort keys as [`OwnedValue`].
trait ErasedSegmentSortKeyComputer: Send + Sync {
    /// Computes the segment-level sort key of `doc`, given its `score`.
    fn segment_sort_key(&mut self, doc: DocId, score: Score) -> Option<u64>;
    /// Converts a segment-level sort key into its [`OwnedValue`] representation.
    fn convert_segment_sort_key(&self, sort_key: Option<u64>) -> OwnedValue;
}

/// Adapter pairing a typed segment sort key computer with a function converting its sort keys
/// into [`OwnedValue`]s.
struct ErasedSegmentSortKeyComputerWrapper<C, F> {
    // Typed segment sort key computer doing the actual work.
    inner: C,
    // Converts the typed sort key of `inner` into an `OwnedValue`.
    converter: F,
}

impl<C, F> ErasedSegmentSortKeyComputer for ErasedSegmentSortKeyComputerWrapper<C, F>
where
    C: SegmentSortKeyComputer<SegmentSortKey = Option<u64>> + Send + Sync,
    F: Fn(C::SortKey) -> OwnedValue + Send + Sync + 'static,
{
    fn segment_sort_key(&mut self, doc: DocId, score: Score) -> Option<u64> {
        self.inner.segment_sort_key(doc, score)
    }

    fn convert_segment_sort_key(&self, sort_key: Option<u64>) -> OwnedValue {
        let val = self.inner.convert_segment_sort_key(sort_key);
        (self.converter)(val)
    }
}

/// Type-erased segment sort key computer sorting by score.
struct ScoreSegmentSortKeyComputer {
    // Computer from which the score-based sort key is obtained.
    segment_computer: SortBySimilarityScore,
}

impl ErasedSegmentSortKeyComputer for ScoreSegmentSortKeyComputer {
    /// Encodes the score of `doc` as a `u64`: the sort key of the wrapped computer is converted
    /// to an `f64`, which is then mapped to a `u64` with `to_u64`.
    ///
    /// This implementation never returns `None`.
    fn segment_sort_key(&mut self, doc: DocId, score: Score) -> Option<u64> {
        let raw_score = self.segment_computer.segment_sort_key(doc, score);
        let widened_score = f64::from(raw_score);
        Some(widened_score.to_u64())
    }

    /// Decodes a `u64` produced by `segment_sort_key` back into an `OwnedValue::F64`.
    ///
    /// # Panics
    ///
    /// Panics if `sort_key` is `None`.
    fn convert_segment_sort_key(&self, sort_key: Option<u64>) -> OwnedValue {
        let encoded_score = sort_key.expect("This implementation always produces a score.");
        let decoded_score = f64::from_u64(encoded_score);
        OwnedValue::F64(decoded_score)
    }
}

impl SortKeyComputer for SortByErasedType {
    type SortKey = OwnedValue;
    type Child = ErasedColumnSegmentSortKeyComputer;
    type Comparator = NaturalComparator;

    fn requires_scoring(&self) -> bool {
        matches!(self, Self::Score)
    }

    fn segment_sort_key_computer(
        &self,
        segment_reader: &crate::SegmentReader,
    ) -> crate::Result<Self::Child> {
        let inner: Box<dyn ErasedSegmentSortKeyComputer> = match self {
            Self::Field(column_name) => {
                let fast_fields = segment_reader.fast_fields();
                // TODO: We currently double-open the column to avoid relying on the implementation
                // details of `SortByString` or `SortByStaticFastValue`. Once
                // https://github.com/quickwit-oss/tantivy/issues/2776 is resolved, we should
                // consider directly constructing the appropriate `SegmentSortKeyComputer` type for
                // the column that we open here.
                let (_column, column_type) =
                    fast_fields.u64_lenient(column_name)?.ok_or_else(|| {
                        FastFieldNotAvailableError {
                            field_name: column_name.to_owned(),
                        }
                    })?;

                match column_type {
                    ColumnType::Str => {
                        let computer = SortByString::for_field(column_name);
                        let inner = computer.segment_sort_key_computer(segment_reader)?;
                        Box::new(ErasedSegmentSortKeyComputerWrapper {
                            inner,
                            converter: |val: Option<String>| {
                                val.map(OwnedValue::Str).unwrap_or(OwnedValue::Null)
                            },
                        })
                    }
                    ColumnType::Bytes => {
                        let computer = SortByBytes::for_field(column_name);
                        let inner = computer.segment_sort_key_computer(segment_reader)?;
                        Box::new(ErasedSegmentSortKeyComputerWrapper {
                            inner,
                            converter: |val: Option<Vec<u8>>| {
                                val.map(OwnedValue::Bytes).unwrap_or(OwnedValue::Null)
                            },
                        })
                    }
                    ColumnType::U64 => {
                        let computer = SortByStaticFastValue::<u64>::for_field(column_name);
                        let inner = computer.segment_sort_key_computer(segment_reader)?;
                        Box::new(ErasedSegmentSortKeyComputerWrapper {
                            inner,
                            converter: |val: Option<u64>| {
                                val.map(OwnedValue::U64).unwrap_or(OwnedValue::Null)
                            },
                        })
                    }
                    ColumnType::I64 => {
                        let computer = SortByStaticFastValue::<i64>::for_field(column_name);
                        let inner = computer.segment_sort_key_computer(segment_reader)?;
                        Box::new(ErasedSegmentSortKeyComputerWrapper {
                            inner,
                            converter: |val: Option<i64>| {
                                val.map(OwnedValue::I64).unwrap_or(OwnedValue::Null)
                            },
                        })
                    }
                    ColumnType::F64 => {
                        let computer = SortByStaticFastValue::<f64>::for_field(column_name);
                        let inner = computer.segment_sort_key_computer(segment_reader)?;
                        Box::new(ErasedSegmentSortKeyComputerWrapper {
                            inner,
                            converter: |val: Option<f64>| {
                                val.map(OwnedValue::F64).unwrap_or(OwnedValue::Null)
                            },
                        })
                    }
                    ColumnType::Bool => {
                        let computer = SortByStaticFastValue::<bool>::for_field(column_name);
                        let inner = computer.segment_sort_key_computer(segment_reader)?;
                        Box::new(ErasedSegmentSortKeyComputerWrapper {
                            inner,
                            converter: |val: Option<bool>| {
                                val.map(OwnedValue::Bool).unwrap_or(OwnedValue::Null)
                            },
                        })
                    }
                    ColumnType::DateTime => {
                        let computer = SortByStaticFastValue::<DateTime>::for_field(column_name);
                        let inner = computer.segment_sort_key_computer(segment_reader)?;
                        Box::new(ErasedSegmentSortKeyComputerWrapper {
                            inner,
                            converter: |val: Option<DateTime>| {
                                val.map(OwnedValue::Date).unwrap_or(OwnedValue::Null)
                            },
                        })
                    }
                    column_type => {
                        return Err(crate::TantivyError::SchemaError(format!(
                            "Field `{}` is of type {column_type:?}, which is not supported for \
                             sorting by owned value yet.",
                            column_name
                        )))
                    }
                }
            }
            Self::Score => Box::new(ScoreSegmentSortKeyComputer {
                segment_computer: SortBySimilarityScore,
            }),
        };
        Ok(ErasedColumnSegmentSortKeyComputer { inner })
    }
}

/// Segment-level sort key computer of [`SortByErasedType`].
///
/// It delegates to a boxed, type-erased segment sort key computer.
pub struct ErasedColumnSegmentSortKeyComputer {
    // Type-erased computer chosen when the segment sort key computer was built.
    inner: Box<dyn ErasedSegmentSortKeyComputer>,
}

/// Both operations are forwarded verbatim to the boxed, type-erased computer.
impl SegmentSortKeyComputer for ErasedColumnSegmentSortKeyComputer {
    type SortKey = OwnedValue;
    type SegmentSortKey = Option<u64>;
    type SegmentComparator = NaturalComparator;

    /// Returns the segment-level key of `doc` as computed by the wrapped computer.
    #[inline(always)]
    fn segment_sort_key(&mut self, doc: DocId, score: Score) -> Self::SegmentSortKey {
        self.inner.segment_sort_key(doc, score)
    }

    /// Turns a segment-level key into its `OwnedValue` using the wrapped computer.
    fn convert_segment_sort_key(&self, key: Self::SegmentSortKey) -> Self::SortKey {
        self.inner.convert_segment_sort_key(key)
    }
}

#[cfg(test)]
mod tests {
    use crate::collector::sort_key::{ComparatorEnum, SortByErasedType};
    use crate::collector::TopDocs;
    use crate::query::AllQuery;
    use crate::schema::{OwnedValue, Schema, FAST, TEXT};
    use crate::Index;

    // Sorting a u64 fast field through the erased-type computer: checks both the
    // `Natural` and the `ReverseNoneLower` orderings, including a document
    // that has no value for the field.
    #[test]
    fn test_sort_by_owned_u64() {
        let mut schema_builder = Schema::builder();
        let id_field = schema_builder.add_u64_field("id", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests().unwrap();
        writer.add_document(doc!(id_field => 10u64)).unwrap();
        writer.add_document(doc!(id_field => 2u64)).unwrap();
        // This document has no `id` value: its sort key is expected to be `Null`.
        writer.add_document(doc!()).unwrap();
        writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();

        // Natural ordering: largest value first, missing value last.
        let collector = TopDocs::with_limit(10)
            .order_by((SortByErasedType::for_field("id"), ComparatorEnum::Natural));
        let top_docs = searcher.search(&AllQuery, &collector).unwrap();

        let values: Vec<OwnedValue> = top_docs.into_iter().map(|(key, _)| key).collect();

        assert_eq!(
            values,
            vec![OwnedValue::U64(10), OwnedValue::U64(2), OwnedValue::Null]
        );

        // ReverseNoneLower: smallest value first, missing value still last.
        let collector = TopDocs::with_limit(10).order_by((
            SortByErasedType::for_field("id"),
            ComparatorEnum::ReverseNoneLower,
        ));
        let top_docs = searcher.search(&AllQuery, &collector).unwrap();

        let values: Vec<OwnedValue> = top_docs.into_iter().map(|(key, _)| key).collect();

        assert_eq!(
            values,
            vec![OwnedValue::U64(2), OwnedValue::U64(10), OwnedValue::Null]
        );
    }

    // Sorting a text fast field through the erased-type computer with the
    // `ReverseNoneLower` ordering.
    #[test]
    fn test_sort_by_owned_string() {
        let mut schema_builder = Schema::builder();
        let city_field = schema_builder.add_text_field("city", FAST | TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests().unwrap();
        writer.add_document(doc!(city_field => "tokyo")).unwrap();
        writer.add_document(doc!(city_field => "austin")).unwrap();
        // Document without a `city`: expected to come back with a `Null` key.
        writer.add_document(doc!()).unwrap();
        writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();

        let collector = TopDocs::with_limit(10).order_by((
            SortByErasedType::for_field("city"),
            ComparatorEnum::ReverseNoneLower,
        ));
        let top_docs = searcher.search(&AllQuery, &collector).unwrap();

        let values: Vec<OwnedValue> = top_docs.into_iter().map(|(key, _)| key).collect();

        // Lexicographically smallest string first, missing value last.
        assert_eq!(
            values,
            vec![
                OwnedValue::Str("austin".to_string()),
                OwnedValue::Str("tokyo".to_string()),
                OwnedValue::Null
            ]
        );
    }

    // Sorting a bytes fast field through the erased-type computer, in both
    // directions, with one document that has no value.
    #[test]
    fn test_sort_by_owned_bytes() {
        let mut schema_builder = Schema::builder();
        let data_field = schema_builder.add_bytes_field("data", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests().unwrap();
        // Values are inserted out of order on purpose (3, 1, 2).
        writer
            .add_document(doc!(data_field => vec![0x03u8, 0x00]))
            .unwrap();
        writer
            .add_document(doc!(data_field => vec![0x01u8, 0x00]))
            .unwrap();
        writer
            .add_document(doc!(data_field => vec![0x02u8, 0x00]))
            .unwrap();
        // Document without a `data` value: expected to come back with a `Null` key.
        writer.add_document(doc!()).unwrap();
        writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();

        // Sort descending (Natural - highest first)
        let collector = TopDocs::with_limit(10)
            .order_by((SortByErasedType::for_field("data"), ComparatorEnum::Natural));
        let top_docs = searcher.search(&AllQuery, &collector).unwrap();

        let values: Vec<OwnedValue> = top_docs.into_iter().map(|(key, _)| key).collect();

        assert_eq!(
            values,
            vec![
                OwnedValue::Bytes(vec![0x03, 0x00]),
                OwnedValue::Bytes(vec![0x02, 0x00]),
                OwnedValue::Bytes(vec![0x01, 0x00]),
                OwnedValue::Null
            ]
        );

        // Sort ascending (ReverseNoneLower - lowest first, nulls last)
        let collector = TopDocs::with_limit(10).order_by((
            SortByErasedType::for_field("data"),
            ComparatorEnum::ReverseNoneLower,
        ));
        let top_docs = searcher.search(&AllQuery, &collector).unwrap();

        let values: Vec<OwnedValue> = top_docs.into_iter().map(|(key, _)| key).collect();

        assert_eq!(
            values,
            vec![
                OwnedValue::Bytes(vec![0x01, 0x00]),
                OwnedValue::Bytes(vec![0x02, 0x00]),
                OwnedValue::Bytes(vec![0x03, 0x00]),
                OwnedValue::Null
            ]
        );
    }

    // With the plain `Reverse` comparator (as opposed to `ReverseNoneLower`),
    // the document without a value is expected to come first.
    #[test]
    fn test_sort_by_owned_reverse() {
        let mut schema_builder = Schema::builder();
        let id_field = schema_builder.add_u64_field("id", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests().unwrap();
        writer.add_document(doc!(id_field => 10u64)).unwrap();
        writer.add_document(doc!(id_field => 2u64)).unwrap();
        // Document without an `id` value.
        writer.add_document(doc!()).unwrap();
        writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();

        let collector = TopDocs::with_limit(10)
            .order_by((SortByErasedType::for_field("id"), ComparatorEnum::Reverse));
        let top_docs = searcher.search(&AllQuery, &collector).unwrap();

        let values: Vec<OwnedValue> = top_docs.into_iter().map(|(key, _)| key).collect();

        // Missing value first, then the values in ascending order.
        assert_eq!(
            values,
            vec![OwnedValue::Null, OwnedValue::U64(2), OwnedValue::U64(10)]
        );
    }

    // Sorting by score through the erased-type computer: the keys must come back
    // as `OwnedValue::F64` and be ordered according to the chosen comparator.
    #[test]
    fn test_sort_by_owned_score() {
        let mut schema_builder = Schema::builder();
        let body_field = schema_builder.add_text_field("body", TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests().unwrap();
        // Two documents matching the query "a" with different term frequencies,
        // so that their scores are expected to differ.
        writer.add_document(doc!(body_field => "a a")).unwrap();
        writer.add_document(doc!(body_field => "a")).unwrap();
        writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let query_parser = crate::query::QueryParser::for_index(&index, vec![body_field]);
        let query = query_parser.parse_query("a").unwrap();

        // Sort by score descending (Natural)
        let collector = TopDocs::with_limit(10)
            .order_by((SortByErasedType::for_score(), ComparatorEnum::Natural));
        let top_docs = searcher.search(&query, &collector).unwrap();

        // Any key that is not an `F64` is a failure.
        let values: Vec<f64> = top_docs
            .into_iter()
            .map(|(key, _)| match key {
                OwnedValue::F64(val) => val,
                _ => panic!("Wrong type {key:?}"),
            })
            .collect();

        assert_eq!(values.len(), 2);
        assert!(values[0] > values[1]);

        // Sort by score ascending (ReverseNoneLower)
        let collector = TopDocs::with_limit(10).order_by((
            SortByErasedType::for_score(),
            ComparatorEnum::ReverseNoneLower,
        ));
        let top_docs = searcher.search(&query, &collector).unwrap();

        let values: Vec<f64> = top_docs
            .into_iter()
            .map(|(key, _)| match key {
                OwnedValue::F64(val) => val,
                _ => panic!("Wrong type {key:?}"),
            })
            .collect();

        assert_eq!(values.len(), 2);
        assert!(values[0] < values[1]);
    }
}


================================================
FILE: src/collector/sort_key/sort_by_score.rs
================================================
use crate::collector::sort_key::NaturalComparator;
use crate::collector::{SegmentSortKeyComputer, SortKeyComputer, TopNComputer};
use crate::{DocAddress, DocId, Score};

/// Sort by similarity score.
///
/// The sort key of a document is simply the `Score` handed over by the query.
/// This unit struct serves both as the index-level sort key computer and as
/// its own segment-level child.
#[derive(Clone, Debug, Copy)]
pub struct SortBySimilarityScore;

impl SortKeyComputer for SortBySimilarityScore {
    type SortKey = Score;

    // The computer is stateless, so it is its own segment-level child.
    type Child = SortBySimilarityScore;

    type Comparator = NaturalComparator;

    /// The score is the sort key, so scoring is always required.
    fn requires_scoring(&self) -> bool {
        true
    }

    /// Returns a fresh `SortBySimilarityScore`; the segment reader is not needed.
    fn segment_sort_key_computer(
        &self,
        _segment_reader: &crate::SegmentReader,
    ) -> crate::Result<Self::Child> {
        Ok(SortBySimilarityScore)
    }

    // Sorting by score is special in that it allows for the Block-Wand optimization.
    //
    // Instead of going through the default collection path, the documents are fed
    // through `Weight::for_each_pruning`. The callback returns the current
    // threshold of the top-k computer after each document.
    // NOTE(review): presumably `for_each_pruning` uses the returned threshold to skip
    // documents that cannot enter the top-k -- confirm against `Weight`.
    fn collect_segment_top_k(
        &self,
        k: usize,
        weight: &dyn crate::query::Weight,
        reader: &crate::SegmentReader,
        segment_ord: u32,
    ) -> crate::Result<Vec<(Self::SortKey, DocAddress)>> {
        let mut top_n: TopNComputer<Score, DocId, Self::Comparator> =
            TopNComputer::new_with_comparator(k, self.comparator());

        if let Some(alive_bitset) = reader.alive_bitset() {
            // The segment has deletes: deleted documents must not be pushed, yet the
            // callback still has to return a threshold, so the last one is cached here.
            let mut threshold = Score::MIN;
            top_n.threshold = Some(threshold);
            weight.for_each_pruning(Score::MIN, reader, &mut |doc, score| {
                if alive_bitset.is_deleted(doc) {
                    // Skip the deleted document and leave the threshold unchanged.
                    return threshold;
                }
                top_n.push(score, doc);
                threshold = top_n.threshold.unwrap_or(Score::MIN);
                threshold
            })?;
        } else {
            // No deletes: every visited document is pushed.
            weight.for_each_pruning(Score::MIN, reader, &mut |doc, score| {
                top_n.push(score, doc);
                top_n.threshold.unwrap_or(Score::MIN)
            })?;
        }

        // Turn the segment-local doc ids into `DocAddress`es.
        Ok(top_n
            .into_vec()
            .into_iter()
            .map(|cid| (cid.sort_key, DocAddress::new(segment_ord, cid.doc)))
            .collect())
    }
}

/// At the segment level the score is used as-is: it is both the segment sort key
/// and the final sort key.
impl SegmentSortKeyComputer for SortBySimilarityScore {
    type SortKey = Score;
    type SegmentSortKey = Score;
    type SegmentComparator = NaturalComparator;

    /// Returns `score` unchanged; the document id is irrelevant.
    #[inline(always)]
    fn segment_sort_key(&mut self, _doc: DocId, score: Score) -> Self::SegmentSortKey {
        score
    }

    /// Identity conversion: the segment sort key already is the final sort key.
    fn convert_segment_sort_key(&self, segment_sort_key: Self::SegmentSortKey) -> Self::SortKey {
        segment_sort_key
    }
}


================================================
FILE: src/collector/sort_key/sort_by_static_fast_value.rs
================================================
use std::marker::PhantomData;

use columnar::Column;

use crate::collector::sort_key::NaturalComparator;
use crate::collector::{SegmentSortKeyComputer, SortKeyComputer};
use crate::fastfield::{FastFieldNotAvailableError, FastValue};
use crate::{DocId, Score, SegmentReader};

/// Sorts by a fast value (e.g. u64, i64, f64, bool, DateTime).
///
/// The field must appear explicitly in the schema, with the right type, and be declared as
/// a fast field.
///
/// If the field is multivalued, only the first value is considered.
///
/// Documents that do not have this value are still considered.
/// Their sort key will simply be `None`.
#[derive(Debug, Clone)]
pub struct SortByStaticFastValue<T: FastValue> {
    // Name of the fast field to sort by.
    field: String,
    // Marker for the fast value type the column is interpreted as.
    typ: PhantomData<T>,
}

impl<T: FastValue> SortByStaticFastValue<T> {
    /// Creates a new `SortByStaticFastValue` instance for the given field.
    pub fn for_field(column_name: impl ToString) -> SortByStaticFastValue<T> {
        Self {
            field: column_name.to_string(),
            typ: PhantomData,
        }
    }
}

impl<T: FastValue> SortKeyComputer for SortByStaticFastValue<T> {
    type Child = SortByFastValueSegmentSortKeyComputer<T>;
    type SortKey = Option<T>;
    type Comparator = NaturalComparator;

    /// Verifies that the field exists in the schema, is a fast field, and has the
    /// value type `T`.
    ///
    /// # Errors
    ///
    /// Returns a `SchemaError` if the field is not fast or has another type, and
    /// forwards the error of `Schema::get_field` if the field is unknown.
    fn check_schema(&self, schema: &crate::schema::Schema) -> crate::Result<()> {
        // At the segment sort key computer level, we rely on the u64 representation.
        // The mapping is monotonic, so it is sufficient to compute our top-K docs.
        let field_entry = schema.get_field_entry(schema.get_field(&self.field)?);
        if !field_entry.is_fast() {
            let message = format!("Field `{}` is not a fast field.", self.field,);
            return Err(crate::TantivyError::SchemaError(message));
        }
        let schema_type = field_entry.field_type().value_type();
        let expected_type = T::to_type();
        if schema_type == expected_type {
            return Ok(());
        }
        let message = format!(
            "Field `{}` is of type {schema_type:?}, not of the type {:?}.",
            &self.field, expected_type
        );
        Err(crate::TantivyError::SchemaError(message))
    }

    /// Opens the column of the field in its u64 representation for the given segment.
    ///
    /// # Errors
    ///
    /// Fails with a `FastFieldNotAvailableError` if the segment has no such column.
    fn segment_sort_key_computer(
        &self,
        segment_reader: &SegmentReader,
    ) -> crate::Result<Self::Child> {
        let (sort_column, _column_type) = segment_reader
            .fast_fields()
            .u64_lenient(&self.field)?
            .ok_or_else(|| FastFieldNotAvailableError {
                field_name: self.field.clone(),
            })?;
        let child = SortByFastValueSegmentSortKeyComputer {
            sort_column,
            typ: PhantomData,
        };
        Ok(child)
    }
}

/// Segment-level sort key computer of `SortByStaticFastValue`.
///
/// It reads the sort column through its `u64` representation and only converts
/// the value to `T` when the final sort key is produced.
pub struct SortByFastValueSegmentSortKeyComputer<T> {
    // The column being sorted on, in its u64 representation.
    sort_column: Column<u64>,
    // Marker for the fast value type the u64 values are converted to.
    typ: PhantomData<T>,
}

impl<T: FastValue> SegmentSortKeyComputer for SortByFastValueSegmentSortKeyComputer<T> {
    type SortKey = Option<T>;
    type SegmentSortKey = Option<u64>;
    type SegmentComparator = NaturalComparator;

    /// Returns the first value of the column for `doc`, or `None` if there is none.
    #[inline(always)]
    fn segment_sort_key(&mut self, doc: DocId, _score: Score) -> Option<u64> {
        self.sort_column.first(doc)
    }

    /// Converts the u64 representation back to `T`; `None` stays `None`.
    fn convert_segment_sort_key(&self, sort_key: Option<u64>) -> Option<T> {
        let raw_value = sort_key?;
        Some(T::from_u64(raw_value))
    }
}


================================================
FILE: src/collector/sort_key/sort_by_string.rs
================================================
use columnar::StrColumn;

use crate::collector::sort_key::NaturalComparator;
use crate::collector::{SegmentSortKeyComputer, SortKeyComputer};
use crate::termdict::TermOrdinal;
use crate::{DocId, Score};

/// Sort by the first value of a string column.
///
/// The string can be dynamic (coming from a json field)
/// or static (being specifically defined in the configuration).
///
/// If the field is multivalued, only the first value is considered.
///
/// Documents that do not have this value are still considered.
/// Their sort key will simply be `None`.
#[derive(Debug, Clone)]
pub struct SortByString {
    // Name of the string column to sort by.
    column_name: String,
}

impl SortByString {
    /// Creates a new sort by string sort key computer.
    pub fn for_field(column_name: impl ToString) -> Self {
        SortByString {
            column_name: column_name.to_string(),
        }
    }
}

impl SortKeyComputer for SortByString {
    type SortKey = Option<String>;
    type Child = ByStringColumnSegmentSortKeyComputer;
    type Comparator = NaturalComparator;

    /// Looks up the string column in the segment's fast fields.
    ///
    /// A segment without that column is not an error: the child then simply holds
    /// no column.
    fn segment_sort_key_computer(
        &self,
        segment_reader: &crate::SegmentReader,
    ) -> crate::Result<Self::Child> {
        let fast_fields = segment_reader.fast_fields();
        let child = ByStringColumnSegmentSortKeyComputer {
            str_column_opt: fast_fields.str(&self.column_name)?,
        };
        Ok(child)
    }
}

/// Segment-level sort key computer of `SortByString`.
///
/// Documents are compared through the term ordinal of their first value; the
/// ordinal is resolved to a `String` only when the final sort key is produced.
pub struct ByStringColumnSegmentSortKeyComputer {
    // `None` when the segment has no string column with the requested name.
    str_column_opt: Option<StrColumn>,
}

impl SegmentSortKeyComputer for ByStringColumnSegmentSortKeyComputer {
    type SortKey = Option<String>;
    type SegmentSortKey = Option<TermOrdinal>;
    type SegmentComparator = NaturalComparator;

    /// Returns the term ordinal of the first value of `doc`.
    ///
    /// Yields `None` if the segment has no such column or the document has no value.
    #[inline(always)]
    fn segment_sort_key(&mut self, doc: DocId, _score: Score) -> Option<TermOrdinal> {
        self.str_column_opt
            .as_ref()
            .and_then(|str_column| str_column.ords().first(doc))
    }

    /// Resolves a term ordinal to its string through the column dictionary.
    ///
    /// Yields `None` if there is no ordinal, no column, if the dictionary lookup
    /// fails, or if the term is not valid UTF-8.
    fn convert_segment_sort_key(&self, term_ord_opt: Option<TermOrdinal>) -> Option<String> {
        // TODO: Individual lookups to the dictionary like this are very likely to repeatedly
        // decompress the same blocks. See https://github.com/quickwit-oss/tantivy/issues/2776
        let ordinal = term_ord_opt?;
        let dictionary = self.str_column_opt.as_ref()?.dictionary();
        let mut term_bytes = Vec::new();
        dictionary.ord_to_term(ordinal, &mut term_bytes).ok()?;
        String::from_utf8(term_bytes).ok()
    }
}


================================================
FILE: src/collector/sort_key/sort_key_computer.rs
================================================
use std::cmp::Ordering;

use crate::collector::sort_key::{Comparator, NaturalComparator};
use crate::collector::sort_key_top_collector::TopBySortKeySegmentCollector;
use crate::collector::{default_collect_segment_impl, SegmentCollector as _, TopNComputer};
use crate::schema::Schema;
use crate::{DocAddress, DocId, Result, Score, SegmentReader};

/// A `SegmentSortKeyComputer` makes it possible to modify the default score
/// for a given document belonging to a specific segment.
///
/// It is the segment local version of the [`SortKeyComputer`].
pub trait SegmentSortKeyComputer: 'static {
    /// The final score being emitted.
    type SortKey: 'static + Send + Sync + Clone;

    /// Sort key used at the segment level by the `SegmentSortKeyComputer`.
    ///
    /// It is typically small like a `u64`, and is meant to be converted
    /// to the final score at the end of the collection of the segment.
    type SegmentSortKey: 'static + Clone + Send + Sync;

    /// Comparator type.
    type SegmentComparator: Comparator<Self::SegmentSortKey> + 'static;

    /// Returns the segment sort key comparator.
    ///
    /// The default implementation builds it with `Default::default()`.
    fn segment_comparator(&self) -> Self::SegmentComparator {
        Self::SegmentComparator::default()
    }

    /// Computes the sort key for the given document and score.
    fn segment_sort_key(&mut self, doc: DocId, score: Score) -> Self::SegmentSortKey;

    /// Computes the sort key and pushes the document in a TopN Computer.
    ///
    /// When using a tuple as the sorting key, the sort key is evaluated in a lazy manner.
    #[inline(always)]
    fn compute_sort_key_and_collect<C: Comparator<Self::SegmentSortKey>>(
        &mut self,
        doc: DocId,
        score: Score,
        top_n_computer: &mut TopNComputer<Self::SegmentSortKey, DocId, C>,
    ) {
        let sort_key = self.segment_sort_key(doc, score);
        top_n_computer.push(sort_key, doc);
    }

    /// A SegmentSortKeyComputer maps to a SegmentSortKey, but it can also decide on
    /// its ordering.
    ///
    /// This method must be consistent with the `SortKey` ordering.
    #[inline(always)]
    fn compare_segment_sort_key(
        &self,
        left: &Self::SegmentSortKey,
        right: &Self::SegmentSortKey,
    ) -> Ordering {
        self.segment_comparator().compare(left, right)
    }

    /// Implementing this method makes it possible to avoid computing
    /// a sort_key entirely if we can assess that it won't pass a threshold
    /// with a partial computation.
    ///
    /// Returns `None` if the document compares as `Less` than `threshold`, and
    /// otherwise the result of the comparison along with the computed sort key.
    ///
    /// This is currently used for lexicographic sorting.
    fn accept_sort_key_lazy(
        &mut self,
        doc_id: DocId,
        score: Score,
        threshold: &Self::SegmentSortKey,
    ) -> Option<(Ordering, Self::SegmentSortKey)> {
        let sort_key = self.segment_sort_key(doc_id, score);
        let cmp = self.compare_segment_sort_key(&sort_key, threshold);
        if cmp == Ordering::Less {
            None
        } else {
            Some((cmp, sort_key))
        }
    }

    /// Convert a segment level sort key into the global sort key.
    fn convert_segment_sort_key(&self, sort_key: Self::SegmentSortKey) -> Self::SortKey;
}

/// `SortKeyComputer` defines the sort key to be used by a TopK Collector.
///
/// The `SortKeyComputer` itself does not do much of the computation.
/// Instead, it helps constructing `Self::Child` instances that will compute
/// the sort key at a segment scale.
pub trait SortKeyComputer: Sync {
    /// The sort key type.
    type SortKey: 'static + Send + Sync + Clone + std::fmt::Debug;
    /// Type of the associated [`SegmentSortKeyComputer`].
    type Child: SegmentSortKeyComputer<SortKey = Self::SortKey>;
    /// Comparator type.
    ///
    /// It must be able to compare both the final sort keys and the segment-level
    /// sort keys of the child.
    type Comparator: Comparator<Self::SortKey>
        + Comparator<<Self::Child as SegmentSortKeyComputer>::SegmentSortKey>
        + 'static;

    /// Checks whether the schema is compatible with the sort key computer.
    ///
    /// The default implementation accepts any schema.
    fn check_schema(&self, _schema: &Schema) -> crate::Result<()> {
        Ok(())
    }

    /// Returns the sort key comparator.
    fn comparator(&self) -> Self::Comparator {
        Self::Comparator::default()
    }

    /// Indicates whether the sort key actually uses the similarity score (by default BM25).
    /// If set to false, the similarity score might not be computed (as an optimization),
    /// and the score fed in the segment sort key computer could take any value.
    fn requires_scoring(&self) -> bool {
        false
    }

    /// Collects the top `k` documents of one segment, along with their sort keys.
    ///
    /// Sorting by score has an overriding implementation for BM25 scores, using Block-WAND.
    fn collect_segment_top_k(
        &self,
        k: usize,
        weight: &dyn crate::query::Weight,
        reader: &crate::SegmentReader,
        segment_ord: u32,
    ) -> crate::Result<Vec<(Self::SortKey, DocAddress)>> {
        let with_scoring = self.requires_scoring();
        let segment_sort_key_computer = self.segment_sort_key_computer(reader)?;
        let topn_computer = TopNComputer::new_with_comparator(k, self.comparator());
        // Generic path: a segment collector feeding the top-n computer, driven by
        // the default segment collection routine.
        let mut segment_top_key_collector = TopBySortKeySegmentCollector {
            topn_computer,
            segment_ord,
            segment_sort_key_computer,
        };
        default_collect_segment_impl(&mut segment_top_key_collector, weight, reader, with_scoring)?;
        Ok(segment_top_key_collector.harvest())
    }

    /// Builds a child sort key computer for a specific segment.
    fn segment_sort_key_computer(&self, segment_reader: &SegmentReader) -> Result<Self::Child>;
}

/// A pair of sort key computers sorts lexicographically: by the head key first,
/// then by the tail key.
impl<Head, Tail> SortKeyComputer for (Head, Tail)
where
    Head: SortKeyComputer,
    Tail: SortKeyComputer,
{
    type SortKey = (Head::SortKey, Tail::SortKey);
    type Child = (Head::Child, Tail::Child);
    type Comparator = (Head::Comparator, Tail::Comparator);

    /// Pairs up the comparators of both components.
    fn comparator(&self) -> Self::Comparator {
        let (head, tail) = self;
        (head.comparator(), tail.comparator())
    }

    /// Builds the segment-level computer of each component, head first.
    fn segment_sort_key_computer(&self, segment_reader: &SegmentReader) -> Result<Self::Child> {
        let head_child = self.0.segment_sort_key_computer(segment_reader)?;
        let tail_child = self.1.segment_sort_key_computer(segment_reader)?;
        Ok((head_child, tail_child))
    }

    /// Checks whether the schema is compatible with both components.
    fn check_schema(&self, schema: &Schema) -> crate::Result<()> {
        let (head, tail) = self;
        head.check_schema(schema)?;
        tail.check_schema(schema)
    }

    /// Indicates whether the sort key actually uses the similarity score (by default BM25).
    /// Scoring is required as soon as one of the two components requires it.
    fn requires_scoring(&self) -> bool {
        let (head, tail) = self;
        head.requires_scoring() || tail.requires_scoring()
    }
}

// Segment-level counterpart of the (head, tail) sort key computer.
//
// Keys are compared lexicographically, which makes it possible to evaluate the tail
// lazily: if the head alone already rules a document out, the tail is never computed.
impl<HeadSegmentSortKeyComputer, TailSegmentSortKeyComputer> SegmentSortKeyComputer
    for (HeadSegmentSortKeyComputer, TailSegmentSortKeyComputer)
where
    HeadSegmentSortKeyComputer: SegmentSortKeyComputer,
    TailSegmentSortKeyComputer: SegmentSortKeyComputer,
{
    type SortKey = (
        HeadSegmentSortKeyComputer::SortKey,
        TailSegmentSortKeyComputer::SortKey,
    );
    type SegmentSortKey = (
        HeadSegmentSortKeyComputer::SegmentSortKey,
        TailSegmentSortKeyComputer::SegmentSortKey,
    );

    type SegmentComparator = (
        HeadSegmentSortKeyComputer::SegmentComparator,
        TailSegmentSortKeyComputer::SegmentComparator,
    );

    /// A SegmentSortKeyComputer maps to a SegmentSortKey, but it can also decide on
    /// its ordering.
    ///
    /// Pairs are compared lexicographically: the head keys are compared with the head
    /// computer, and the tail keys are only compared with the tail computer on a tie.
    #[inline]
    fn compare_segment_sort_key(
        &self,
        left: &Self::SegmentSortKey,
        right: &Self::SegmentSortKey,
    ) -> Ordering {
        self.0
            .compare_segment_sort_key(&left.0, &right.0)
            .then_with(|| self.1.compare_segment_sort_key(&left.1, &right.1))
    }

    /// Computes the sort key of `doc` and appends it to the top-n computer, unless the
    /// lazy evaluation shows that it falls below the current threshold.
    #[inline(always)]
    fn compute_sort_key_and_collect<C: Comparator<Self::SegmentSortKey>>(
        &mut self,
        doc: DocId,
        score: Score,
        top_n_computer: &mut TopNComputer<Self::SegmentSortKey, DocId, C>,
    ) {
        let sort_key: Self::SegmentSortKey;
        if let Some(threshold) = &top_n_computer.threshold {
            // A threshold is known: try to reject the document as early as possible.
            if let Some((_cmp, lazy_sort_key)) = self.accept_sort_key_lazy(doc, score, threshold) {
                sort_key = lazy_sort_key;
            } else {
                return;
            }
        } else {
            // No threshold yet: the full key is needed anyway.
            sort_key = self.segment_sort_key(doc, score);
        };
        // NOTE(review): `append_doc` is used here instead of `push`; presumably it skips
        // the threshold check already performed above -- confirm against `TopNComputer`.
        top_n_computer.append_doc(doc, sort_key);
    }

    /// Computes both the head and the tail key, eagerly.
    #[inline(always)]
    fn segment_sort_key(&mut self, doc: DocId, score: Score) -> Self::SegmentSortKey {
        let head_sort_key = self.0.segment_sort_key(doc, score);
        let tail_sort_key = self.1.segment_sort_key(doc, score);
        (head_sort_key, tail_sort_key)
    }

    /// Lazy evaluation against `threshold`.
    ///
    /// The head is evaluated first. If it rejects the document, `None` is returned and
    /// the tail is never computed. If the head ties with the threshold, the tail decides.
    /// Otherwise the head comparison is the result, and the tail key is computed only to
    /// complete the sort key.
    fn accept_sort_key_lazy(
        &mut self,
        doc_id: DocId,
        score: Score,
        threshold: &Self::SegmentSortKey,
    ) -> Option<(Ordering, Self::SegmentSortKey)> {
        let (head_threshold, tail_threshold) = threshold;
        let (head_cmp, head_sort_key) =
            self.0.accept_sort_key_lazy(doc_id, score, head_threshold)?;
        if head_cmp == Ordering::Equal {
            let (tail_cmp, tail_sort_key) =
                self.1.accept_sort_key_lazy(doc_id, score, tail_threshold)?;
            Some((tail_cmp, (head_sort_key, tail_sort_key)))
        } else {
            let tail_sort_key = self.1.segment_sort_key(doc_id, score);
            Some((head_cmp, (head_sort_key, tail_sort_key)))
        }
    }

    /// Converts the head and the tail key with their respective computers.
    fn convert_segment_sort_key(&self, sort_key: Self::SegmentSortKey) -> Self::SortKey {
        let (head_sort_key, tail_sort_key) = sort_key;
        (
            self.0.convert_segment_sort_key(head_sort_key),
            self.1.convert_segment_sort_key(tail_sort_key),
        )
    }
}

/// This struct is used as an adapter to take a sort key computer and map its score to another
/// new sort key.
///
/// Only the final sort key is mapped: the segment-level sort key is the one of the
/// wrapped computer.
pub struct MappedSegmentSortKeyComputer<T, PreviousSortKey, NewSortKey> {
    // The wrapped segment sort key computer.
    sort_key_computer: T,
    // Conversion applied to the final sort key of the wrapped computer.
    map: fn(PreviousSortKey) -> NewSortKey,
}

// Every segment-level operation is forwarded to the wrapped computer, including the
// ones defining the ordering, so that a wrapped computer with a custom ordering keeps
// it when the adapter is itself nested in another computer. Only the final conversion
// differs: the converted sort key goes through `map`.
impl<T, PreviousScore, NewScore> SegmentSortKeyComputer
    for MappedSegmentSortKeyComputer<T, PreviousScore, NewScore>
where
    T: SegmentSortKeyComputer<SortKey = PreviousScore>,
    PreviousScore: 'static + Clone + Send + Sync,
    NewScore: 'static + Clone + Send + Sync,
{
    type SortKey = NewScore;
    type SegmentSortKey = T::SegmentSortKey;
    type SegmentComparator = T::SegmentComparator;

    /// Returns the segment comparator of the wrapped computer.
    fn segment_comparator(&self) -> Self::SegmentComparator {
        self.sort_key_computer.segment_comparator()
    }

    /// Computes the segment sort key with the wrapped computer.
    fn segment_sort_key(&mut self, doc: DocId, score: Score) -> Self::SegmentSortKey {
        self.sort_key_computer.segment_sort_key(doc, score)
    }

    /// Compares two segment sort keys with the ordering of the wrapped computer.
    #[inline(always)]
    fn compare_segment_sort_key(
        &self,
        left: &Self::SegmentSortKey,
        right: &Self::SegmentSortKey,
    ) -> Ordering {
        self.sort_key_computer.compare_segment_sort_key(left, right)
    }

    /// Forwards the lazy evaluation to the wrapped computer.
    fn accept_sort_key_lazy(
        &mut self,
        doc_id: DocId,
        score: Score,
        threshold: &Self::SegmentSortKey,
    ) -> Option<(Ordering, Self::SegmentSortKey)> {
        self.sort_key_computer
            .accept_sort_key_lazy(doc_id, score, threshold)
    }

    /// Forwards the collection to the wrapped computer, keeping its lazy evaluation.
    #[inline(always)]
    fn compute_sort_key_and_collect<C: Comparator<Self::SegmentSortKey>>(
        &mut self,
        doc: DocId,
        score: Score,
        top_n_computer: &mut TopNComputer<Self::SegmentSortKey, DocId, C>,
    ) {
        self.sort_key_computer
            .compute_sort_key_and_collect(doc, score, top_n_computer);
    }

    /// Converts the segment sort key with the wrapped computer, then applies `map`.
    fn convert_segment_sort_key(&self, segment_sort_key: Self::SegmentSortKey) -> Self::SortKey {
        (self.map)(
            self.sort_key_computer
                .convert_segment_sort_key(segment_sort_key),
        )
    }
}

// We then re-use our (head, tail) implementation and our mapper by viewing any tuple (a, b, c,
// ...) as the chain (a, (b, (c, ...)))

/// `SortKeyComputer` for a triple of sort key computers.
///
/// The triple `(a, b, c)` is evaluated as the nested pair `(a, (b, c))`; the nested sort key
/// is flattened back into a triple through a `MappedSegmentSortKeyComputer`.
impl<SortKeyComputer1, SortKeyComputer2, SortKeyComputer3> SortKeyComputer
    for (SortKeyComputer1, SortKeyComputer2, SortKeyComputer3)
where
    SortKeyComputer1: SortKeyComputer,
    SortKeyComputer2: SortKeyComputer,
    SortKeyComputer3: SortKeyComputer,
{
    type SortKey = (
        SortKeyComputer1::SortKey,
        SortKeyComputer2::SortKey,
        SortKeyComputer3::SortKey,
    );
    type Child = MappedSegmentSortKeyComputer<
        <(SortKeyComputer1, (SortKeyComputer2, SortKeyComputer3)) as SortKeyComputer>::Child,
        (
            SortKeyComputer1::SortKey,
            (SortKeyComputer2::SortKey, SortKeyComputer3::SortKey),
        ),
        Self::SortKey,
    >;

    type Comparator = (
        SortKeyComputer1::Comparator,
        SortKeyComputer2::Comparator,
        SortKeyComputer3::Comparator,
    );

    /// Assembles the comparator from the comparator of each component.
    fn comparator(&self) -> Self::Comparator {
        let (first, second, third) = self;
        (
            first.comparator(),
            second.comparator(),
            third.comparator(),
        )
    }

    /// Builds the per-segment computer of each component, nests them as `(a, (b, c))` and
    /// wraps the result so that the final sort key is the flat triple.
    fn segment_sort_key_computer(&self, segment_reader: &SegmentReader) -> Result<Self::Child> {
        let (first, second, third) = self;
        let head = first.segment_sort_key_computer(segment_reader)?;
        let middle = second.segment_sort_key_computer(segment_reader)?;
        let last = third.segment_sort_key_computer(segment_reader)?;
        Ok(MappedSegmentSortKeyComputer {
            sort_key_computer: (head, (middle, last)),
            map: |(key1, (key2, key3))| (key1, key2, key3),
        })
    }

    /// Validates the schema against each component, stopping at the first error.
    fn check_schema(&self, schema: &Schema) -> crate::Result<()> {
        let (first, second, third) = self;
        first.check_schema(schema)?;
        second.check_schema(schema)?;
        third.check_schema(schema)?;
        Ok(())
    }

    /// Scoring is required as soon as one component requires it.
    fn requires_scoring(&self) -> bool {
        let (first, second, third) = self;
        first.requires_scoring() || second.requires_scoring() || third.requires_scoring()
    }
}

/// `SortKeyComputer` for a 4-tuple of sort key computers.
///
/// The tuple `(a, b, c, d)` is evaluated as the nested chain `(a, (b, (c, d)))`; the nested
/// sort key is flattened back into a 4-tuple through a `MappedSegmentSortKeyComputer`.
impl<SortKeyComputer1, SortKeyComputer2, SortKeyComputer3, SortKeyComputer4> SortKeyComputer
    for (
        SortKeyComputer1,
        SortKeyComputer2,
        SortKeyComputer3,
        SortKeyComputer4,
    )
where
    SortKeyComputer1: SortKeyComputer,
    SortKeyComputer2: SortKeyComputer,
    SortKeyComputer3: SortKeyComputer,
    SortKeyComputer4: SortKeyComputer,
{
    type Child = MappedSegmentSortKeyComputer<
        <(
            SortKeyComputer1,
            (SortKeyComputer2, (SortKeyComputer3, SortKeyComputer4)),
        ) as SortKeyComputer>::Child,
        (
            SortKeyComputer1::SortKey,
            (
                SortKeyComputer2::SortKey,
                (SortKeyComputer3::SortKey, SortKeyComputer4::SortKey),
            ),
        ),
        Self::SortKey,
    >;
    type SortKey = (
        SortKeyComputer1::SortKey,
        SortKeyComputer2::SortKey,
        SortKeyComputer3::SortKey,
        SortKeyComputer4::SortKey,
    );
    type Comparator = (
        SortKeyComputer1::Comparator,
        SortKeyComputer2::Comparator,
        SortKeyComputer3::Comparator,
        SortKeyComputer4::Comparator,
    );

    /// Assembles the comparator from the comparator of each component.
    ///
    /// This mirrors the 3-tuple implementation: a comparator configured on a component
    /// (for instance through an explicit sort order) has to be forwarded explicitly,
    /// otherwise the tuple would not reflect it.
    fn comparator(&self) -> Self::Comparator {
        (
            self.0.comparator(),
            self.1.comparator(),
            self.2.comparator(),
            self.3.comparator(),
        )
    }

    /// Builds the per-segment computer of each component, nests them as `(a, (b, (c, d)))`
    /// and wraps the result so that the final sort key is the flat 4-tuple.
    fn segment_sort_key_computer(&self, segment_reader: &SegmentReader) -> Result<Self::Child> {
        let sort_key_computer1 = self.0.segment_sort_key_computer(segment_reader)?;
        let sort_key_computer2 = self.1.segment_sort_key_computer(segment_reader)?;
        let sort_key_computer3 = self.2.segment_sort_key_computer(segment_reader)?;
        let sort_key_computer4 = self.3.segment_sort_key_computer(segment_reader)?;
        Ok(MappedSegmentSortKeyComputer {
            sort_key_computer: (
                sort_key_computer1,
                (sort_key_computer2, (sort_key_computer3, sort_key_computer4)),
            ),
            // Non-capturing closure: it coerces to the `fn` pointer stored by the adapter.
            map: |(sort_key1, (sort_key2, (sort_key3, sort_key4)))| {
                (sort_key1, sort_key2, sort_key3, sort_key4)
            },
        })
    }

    /// Validates the schema against each component, stopping at the first error.
    fn check_schema(&self, schema: &Schema) -> crate::Result<()> {
        self.0.check_schema(schema)?;
        self.1.check_schema(schema)?;
        self.2.check_schema(schema)?;
        self.3.check_schema(schema)?;
        Ok(())
    }

    /// Scoring is required as soon as one component requires it.
    fn requires_scoring(&self) -> bool {
        self.0.requires_scoring()
            || self.1.requires_scoring()
            || self.2.requires_scoring()
            || self.3.requires_scoring()
    }
}

/// Lets a closure act as a `SortKeyComputer`.
///
/// The closure receives a segment reader and returns the per-segment closure, which in turn
/// maps a `DocId` to its sort key. Sort keys are compared with `NaturalComparator`.
impl<F, SegmentF, TSortKey> SortKeyComputer for F
where
    F: 'static + Send + Sync + Fn(&SegmentReader) -> SegmentF,
    SegmentF: 'static + FnMut(DocId) -> TSortKey,
    TSortKey: 'static + PartialOrd + Clone + Send + Sync + std::fmt::Debug,
{
    type SortKey = TSortKey;
    type Child = SegmentF;
    type Comparator = NaturalComparator;

    /// Invokes the closure on the segment reader. This never fails.
    fn segment_sort_key_computer(&self, segment_reader: &SegmentReader) -> Result<Self::Child> {
        let segment_closure = (*self)(segment_reader);
        Ok(segment_closure)
    }
}

/// Lets a per-segment closure `DocId -> sort key` act as a `SegmentSortKeyComputer`.
///
/// The segment-level sort key and the final sort key are the same type, so the conversion
/// is the identity.
impl<F, TSortKey> SegmentSortKeyComputer for F
where
    F: 'static + FnMut(DocId) -> TSortKey,
    TSortKey: 'static + PartialOrd + Clone + Send + Sync,
{
    type SortKey = TSortKey;
    type SegmentSortKey = TSortKey;
    type SegmentComparator = NaturalComparator;

    /// Calls the closure on the document. The score is ignored.
    fn segment_sort_key(&mut self, doc: DocId, _score: Score) -> TSortKey {
        (*self)(doc)
    }

    /// Converts a segment-level sort key into the global sort key (identity).
    fn convert_segment_sort_key(&self, segment_sort_key: Self::SegmentSortKey) -> Self::SortKey {
        segment_sort_key
    }
}

// Tests for the lazy evaluation performed by tuples of sort key computers.
//
// Both tests count how many times the secondary sort key closure is invoked, in order to
// check that it is skipped when the primary sort key is already below the threshold.
#[cfg(test)]
mod tests {
    use std::cmp::Ordering;
    use std::sync::atomic::{AtomicUsize, Ordering as AtomicOrdering};
    use std::sync::Arc;

    use crate::collector::{SegmentSortKeyComputer, SortKeyComputer};
    use crate::schema::Schema;
    use crate::{DocId, Index, Order, SegmentReader};

    /// Builds an in-RAM index with an empty schema and a single committed (empty) document.
    fn build_test_index() -> Index {
        let schema = Schema::builder().build();
        let index = Index::create_in_ram(schema);
        let mut index_writer = index.writer_for_tests().unwrap();
        index_writer
            .add_document(crate::TantivyDocument::default())
            .unwrap();
        index_writer.commit().unwrap();
        index
    }

    /// Pair of closures: the document always gets the sort key `(200, "b")`.
    #[test]
    fn test_lazy_score_computer() {
        let score_computer_primary = |_segment_reader: &SegmentReader| |_doc: DocId| 200u32;
        // Shared counter incremented each time the secondary sort key is computed.
        let call_count = Arc::new(AtomicUsize::new(0));
        let call_count_clone = call_count.clone();
        let score_computer_secondary = move |_segment_reader: &SegmentReader| {
            let call_count_new_clone = call_count_clone.clone();
            move |_doc: DocId| {
                call_count_new_clone.fetch_add(1, AtomicOrdering::SeqCst);
                "b"
            }
        };
        let lazy_score_computer = (score_computer_primary, score_computer_secondary);
        let index = build_test_index();
        let searcher = index.reader().unwrap().searcher();
        let mut segment_sort_key_computer = lazy_score_computer
            .segment_sort_key_computer(searcher.segment_reader(0))
            .unwrap();
        let expected_sort_key = (200, "b");
        {
            // Primary key above the threshold: accepted, secondary key computed once.
            let sort_key_opt =
                segment_sort_key_computer.accept_sort_key_lazy(0u32, 1f32, &(100u32, "a"));
            assert_eq!(sort_key_opt, Some((Ordering::Greater, expected_sort_key)));
            assert_eq!(call_count.load(AtomicOrdering::SeqCst), 1);
        }
        {
            // Primary key above the threshold: the secondary threshold does not matter.
            let sort_key_opt =
                segment_sort_key_computer.accept_sort_key_lazy(0u32, 1f32, &(100u32, "c"));
            assert_eq!(sort_key_opt, Some((Ordering::Greater, expected_sort_key)));
            assert_eq!(call_count.load(AtomicOrdering::SeqCst), 2);
        }
        {
            // Tie on the primary key: "b" > "a" decides in favor of the document.
            let sort_key_opt =
                segment_sort_key_computer.accept_sort_key_lazy(0u32, 1f32, &(200u32, "a"));
            assert_eq!(sort_key_opt, Some((Ordering::Greater, expected_sort_key)));
            assert_eq!(call_count.load(AtomicOrdering::SeqCst), 3);
        }
        {
            // Tie on the primary key: "b" < "c" rejects the document, but the secondary key
            // still had to be computed.
            let sort_key_opt =
                segment_sort_key_computer.accept_sort_key_lazy(0u32, 1f32, &(200u32, "c"));
            assert!(sort_key_opt.is_none());
            assert_eq!(call_count.load(AtomicOrdering::SeqCst), 4);
        }
        {
            // Primary key below the threshold: rejected without computing the secondary key
            // (the call count is unchanged).
            let sort_key_opt =
                segment_sort_key_computer.accept_sort_key_lazy(0u32, 1f32, &(300u32, "a"));
            assert_eq!(sort_key_opt, None);
            assert_eq!(call_count.load(AtomicOrdering::SeqCst), 4);
        }
        {
            // Same as above with a different secondary threshold.
            let sort_key_opt =
                segment_sort_key_computer.accept_sort_key_lazy(0u32, 1f32, &(300u32, "c"));
            assert_eq!(sort_key_opt, None);
            assert_eq!(call_count.load(AtomicOrdering::SeqCst), 4);
        }
        {
            // Sort key equal to the threshold: accepted with `Ordering::Equal`.
            let sort_key_opt =
                segment_sort_key_computer.accept_sort_key_lazy(0u32, 1f32, &expected_sort_key);
            assert_eq!(sort_key_opt, Some((Ordering::Equal, expected_sort_key)));
            assert_eq!(call_count.load(AtomicOrdering::SeqCst), 5);
        }
    }

    /// Same scenario with an explicit order per component: primary descending, secondary
    /// ascending. The document always gets the sort key `(200, 2)`.
    #[test]
    fn test_lazy_score_computer_dynamic_ordering() {
        let score_computer_primary = |_segment_reader: &SegmentReader| |_doc: DocId| 200u32;
        // Shared counter incremented each time the secondary sort key is computed.
        let call_count = Arc::new(AtomicUsize::new(0));
        let call_count_clone = call_count.clone();
        let score_computer_secondary = move |_segment_reader: &SegmentReader| {
            let call_count_new_clone = call_count_clone.clone();
            move |_doc: DocId| {
                call_count_new_clone.fetch_add(1, AtomicOrdering::SeqCst);
                2u32
            }
        };
        let lazy_score_computer = (
            (score_computer_primary, Order::Desc),
            (score_computer_secondary, Order::Asc),
        );
        let index = build_test_index();
        let searcher = index.reader().unwrap().searcher();
        let mut segment_sort_key_computer = lazy_score_computer
            .segment_sort_key_computer(searcher.segment_reader(0))
            .unwrap();
        let expected_sort_key = (200, 2u32);

        {
            // Primary key above the threshold: accepted.
            let sort_key_opt =
                segment_sort_key_computer.accept_sort_key_lazy(0u32, 1f32, &(100u32, 1u32));
            assert_eq!(sort_key_opt, Some((Ordering::Greater, expected_sort_key)));
            assert_eq!(call_count.load(AtomicOrdering::SeqCst), 1);
        }
        {
            // Primary key above the threshold: the secondary threshold does not matter.
            let sort_key_opt =
                segment_sort_key_computer.accept_sort_key_lazy(0u32, 1f32, &(100u32, 3u32));
            assert_eq!(sort_key_opt, Some((Ordering::Greater, expected_sort_key)));
            assert_eq!(call_count.load(AtomicOrdering::SeqCst), 2);
        }
        {
            // Tie on the primary key; the secondary order is ascending, so 2 ranks after 1
            // and the document is rejected.
            let sort_key_opt =
                segment_sort_key_computer.accept_sort_key_lazy(0u32, 1f32, &(200u32, 1u32));
            assert!(sort_key_opt.is_none());
            assert_eq!(call_count.load(AtomicOrdering::SeqCst), 3);
        }
        {
            // Tie on the primary key; with the ascending secondary order 2 ranks before 3,
            // so the document is accepted.
            let sort_key_opt =
                segment_sort_key_computer.accept_sort_key_lazy(0u32, 1f32, &(200u32, 3u32));
            assert_eq!(sort_key_opt, Some((Ordering::Greater, expected_sort_key)));
            assert_eq!(call_count.load(AtomicOrdering::SeqCst), 4);
        }
        {
            // Primary key below the threshold: rejected without computing the secondary key.
            let sort_key_opt =
                segment_sort_key_computer.accept_sort_key_lazy(0u32, 1f32, &(300u32, 1u32));
            assert_eq!(sort_key_opt, None);
            assert_eq!(call_count.load(AtomicOrdering::SeqCst), 4);
        }
        {
            // Same as above with a different secondary threshold.
            let sort_key_opt =
                segment_sort_key_computer.accept_sort_key_lazy(0u32, 1f32, &(300u32, 3u32));
            assert_eq!(sort_key_opt, None);
            assert_eq!(call_count.load(AtomicOrdering::SeqCst), 4);
        }
        {
            // Sort key equal to the threshold: accepted with `Ordering::Equal`.
            let sort_key_opt =
                segment_sort_key_computer.accept_sort_key_lazy(0u32, 1f32, &expected_sort_key);
            assert_eq!(sort_key_opt, Some((Ordering::Equal, expected_sort_key)));
            assert_eq!(call_count.load(AtomicOrdering::SeqCst), 5);
        }
        // The conversion to the final sort key leaves the values untouched.
        assert_eq!(
            segment_sort_key_computer.convert_segment_sort_key(expected_sort_key),
            (200u32, 2u32)
        );
    }
}


================================================
FILE: src/collector/sort_key_top_collector.rs
================================================
use std::ops::Range;

use crate::collector::sort_key::{Comparator, SegmentSortKeyComputer, SortKeyComputer};
use crate::collector::{Collector, SegmentCollector, TopNComputer};
use crate::query::Weight;
use crate::schema::Schema;
use crate::{DocAddress, DocId, Result, Score, SegmentReader};

/// Collector returning the documents of a given rank range, ranked by the sort key produced
/// by `sort_key_computer`.
pub(crate) struct TopBySortKeyCollector<TSortKeyComputer> {
    /// Computes the sort key of the documents and provides the comparator used to rank them.
    sort_key_computer: TSortKeyComputer,
    /// Range of ranks to return: `start` hits are skipped after the merge, and `end` is the
    /// number of hits that have to be tracked.
    doc_range: Range<usize>,
}

impl<TSortKeyComputer> TopBySortKeyCollector<TSortKeyComputer> {
    pub fn new(sort_key_computer: TSortKeyComputer, doc_range: Range<usize>) -> Self {
        TopBySortKeyCollector {
            sort_key_computer,
            doc_range,
        }
    }
}

/// `Collector` implementation: each segment keeps its best `doc_range.end` hits, and the
/// per-segment results are merged before the first `doc_range.start` hits are skipped.
impl<TSortKeyComputer> Collector for TopBySortKeyCollector<TSortKeyComputer>
where TSortKeyComputer: SortKeyComputer + Send + Sync + 'static
{
    type Fruit = Vec<(TSortKeyComputer::SortKey, DocAddress)>;

    type Child =
        TopBySortKeySegmentCollector<TSortKeyComputer::Child, TSortKeyComputer::Comparator>;

    /// Delegates the schema validation to the sort key computer.
    fn check_schema(&self, schema: &Schema) -> crate::Result<()> {
        let computer = &self.sort_key_computer;
        computer.check_schema(schema)
    }

    /// Creates the segment collector, tracking the best `doc_range.end` hits of the segment.
    fn for_segment(&self, segment_ord: u32, segment_reader: &SegmentReader) -> Result<Self::Child> {
        let computer = &self.sort_key_computer;
        let segment_sort_key_computer = computer.segment_sort_key_computer(segment_reader)?;
        let top_n = self.doc_range.end;
        let topn_computer = TopNComputer::new_with_comparator(top_n, computer.comparator());
        Ok(TopBySortKeySegmentCollector {
            topn_computer,
            segment_ord,
            segment_sort_key_computer,
        })
    }

    /// Scoring is required only if the sort key computer needs it.
    fn requires_scoring(&self) -> bool {
        let computer = &self.sort_key_computer;
        computer.requires_scoring()
    }

    /// Merges the hits of all segments and keeps those whose rank falls in `doc_range`.
    fn merge_fruits(&self, segment_fruits: Vec<Self::Fruit>) -> Result<Self::Fruit> {
        let all_hits = segment_fruits.into_iter().flatten();
        let doc_range = self.doc_range.clone();
        let comparator = self.sort_key_computer.comparator();
        Ok(merge_top_k(all_hits, doc_range, comparator))
    }

    /// Collects the best `doc_range.end` hits of a segment through the sort key computer.
    fn collect_segment(
        &self,
        weight: &dyn Weight,
        segment_ord: u32,
        reader: &SegmentReader,
    ) -> crate::Result<Vec<(TSortKeyComputer::SortKey, DocAddress)>> {
        let top_n = self.doc_range.end;
        let segment_hits = self
            .sort_key_computer
            .collect_segment_top_k(top_n, weight, reader, segment_ord)?;
        Ok(segment_hits)
    }
}

/// Merges `(sort key, doc)` pairs and returns those whose rank, according to `comparator`,
/// falls within `doc_range`.
///
/// The best `doc_range.end` pairs are retained, sorted, and the first `doc_range.start` of
/// them are dropped. An empty range yields an empty vector without consuming the iterator.
fn merge_top_k<D: Ord, TSortKey: Clone + std::fmt::Debug, C: Comparator<TSortKey>>(
    sort_key_docs: impl Iterator<Item = (TSortKey, D)>,
    doc_range: Range<usize>,
    comparator: C,
) -> Vec<(TSortKey, D)> {
    if doc_range.is_empty() {
        return Vec::new();
    }
    let Range { start, end } = doc_range;
    let mut top_n: TopNComputer<TSortKey, D, C> =
        TopNComputer::new_with_comparator(end, comparator);
    sort_key_docs.for_each(|(sort_key, doc)| top_n.push(sort_key, doc));
    let ranked_hits = top_n.into_sorted_vec();
    ranked_hits
        .into_iter()
        .skip(start)
        .map(|hit| (hit.sort_key, hit.doc))
        .collect()
}

/// Segment-level collector keeping the top documents of one segment, ranked by their
/// segment-level sort key.
pub struct TopBySortKeySegmentCollector<TSegmentSortKeyComputer, C>
where
    TSegmentSortKeyComputer: SegmentSortKeyComputer,
    C: Comparator<TSegmentSortKeyComputer::SegmentSortKey>,
{
    /// Tracks the best hits seen so far, keyed by segment-level sort key.
    pub(crate) topn_computer: TopNComputer<TSegmentSortKeyComputer::SegmentSortKey, DocId, C>,
    /// Ordinal of the segment, used to build the `DocAddress` of the hits on harvest.
    pub(crate) segment_ord: u32,
    /// Computes the sort keys and converts them into the final sort key on harvest.
    pub(crate) segment_sort_key_computer: TSegmentSortKeyComputer,
}

/// `SegmentCollector` implementation: documents are pushed through the sort key computer
/// into the top-n computer, and converted to `(final sort key, DocAddress)` on harvest.
impl<TSegmentSortKeyComputer, C> SegmentCollector
    for TopBySortKeySegmentCollector<TSegmentSortKeyComputer, C>
where
    TSegmentSortKeyComputer: 'static + SegmentSortKeyComputer,
    C: Comparator<TSegmentSortKeyComputer::SegmentSortKey> + 'static,
{
    type Fruit = Vec<(TSegmentSortKeyComputer::SortKey, DocAddress)>;

    /// Lets the sort key computer compute the key of `doc` and push it to the top-n computer.
    fn collect(&mut self, doc: DocId, score: Score) {
        let top_n = &mut self.topn_computer;
        self.segment_sort_key_computer
            .compute_sort_key_and_collect(doc, score, top_n);
    }

    /// Returns the retained hits (in the order given by `into_vec`, i.e. not sorted here),
    /// with their sort key converted and their doc id turned into a `DocAddress`.
    fn harvest(self) -> Self::Fruit {
        let Self {
            topn_computer,
            segment_ord,
            segment_sort_key_computer,
        } = self;
        topn_computer
            .into_vec()
            .into_iter()
            .map(|hit| {
                let sort_key = segment_sort_key_computer.convert_segment_sort_key(hit.sort_key);
                let doc_address = DocAddress {
                    segment_ord,
                    doc_id: hit.doc,
                };
                (sort_key, doc_address)
            })
            .collect()
    }
}

// Tests for `merge_top_k`.
#[cfg(test)]
mod tests {
    use std::ops::Range;

    use rand;
    use rand::seq::SliceRandom as _;

    use super::merge_top_k;
    use crate::collector::sort_key::ComparatorEnum;
    use crate::Order;

    /// Merges the pairs `(i as f32, i)` for `i` in `0..10`, in random order, and checks that
    /// the hits returned for `doc_range` under `order` are exactly `expected`.
    fn test_merge_top_k_aux(
        order: Order,
        doc_range: Range<usize>,
        expected: &[(crate::Score, usize)],
    ) {
        let mut vals: Vec<(crate::Score, usize)> = (0..10).map(|val| (val as f32, val)).collect();
        // Shuffling makes sure the result does not depend on the input order.
        vals.shuffle(&mut rand::rng());
        let vals_merged = merge_top_k(vals.into_iter(), doc_range, ComparatorEnum::from(order));
        assert_eq!(&vals_merged, expected);
    }

    #[test]
    fn test_merge_top_k() {
        // Empty ranges, with and without an offset.
        test_merge_top_k_aux(Order::Asc, 0..0, &[]);
        test_merge_top_k_aux(Order::Asc, 3..3, &[]);
        test_merge_top_k_aux(Order::Asc, 0..3, &[(0.0f32, 0), (1.0f32, 1), (2.0f32, 2)]);
        // Range larger than the number of available hits: everything is returned.
        test_merge_top_k_aux(
            Order::Asc,
            0..11,
            &[
                (0.0f32, 0),
                (1.0f32, 1),
                (2.0f32, 2),
                (3.0f32, 3),
                (4.0f32, 4),
                (5.0f32, 5),
                (6.0f32, 6),
                (7.0f32, 7),
                (8.0f32, 8),
                (9.0f32, 9),
            ],
        );
        // Non-zero offsets, in both orders.
        test_merge_top_k_aux(Order::Asc, 1..3, &[(1.0f32, 1), (2.0f32, 2)]);
        test_merge_top_k_aux(Order::Desc, 0..2, &[(9.0f32, 9), (8.0f32, 8)]);
        test_merge_top_k_aux(Order::Desc, 2..4, &[(7.0f32, 7), (6.0f32, 6)]);
    }
}


================================================
FILE: src/collector/tests.rs
================================================
use columnar::{BytesColumn, Column};

use super::*;
use crate::query::{AllQuery, QueryParser};
use crate::schema::{Schema, FAST, TEXT};
use crate::time::format_description::well_known::Rfc3339;
use crate::time::OffsetDateTime;
use crate::{DateTime, DocAddress, Index, Searcher, TantivyDocument};

/// Test collector that reports that it requires scoring.
pub const TEST_COLLECTOR_WITH_SCORE: TestCollector = TestCollector {
    compute_score: true,
};

/// Test collector that reports that it does not require scoring.
///
/// `compute_score` is what `TestCollector::requires_scoring` returns, so it has to be
/// `false` here; with `true` this constant was indistinguishable from
/// `TEST_COLLECTOR_WITH_SCORE` and the no-scoring path was never exercised.
pub const TEST_COLLECTOR_WITHOUT_SCORE: TestCollector = TestCollector {
    compute_score: false,
};

/// Checks `FilterCollector` with a `u64` fast field predicate and a date fast field
/// predicate, on top of a `TopDocs` collector.
#[test]
pub fn test_filter_collector() -> crate::Result<()> {
    let mut schema_builder = Schema::builder();
    let title = schema_builder.add_text_field("title", TEXT);
    let price = schema_builder.add_u64_field("price", FAST);
    let date = schema_builder.add_date_field("date", FAST);
    let schema = schema_builder.build();
    let index = Index::create_in_ram(schema);

    // Single indexing thread and a single commit.
    let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
    index_writer.add_document(doc!(title => "The Name of the Wind", price => 30_200u64, date => DateTime::from_utc(OffsetDateTime::parse("1898-04-09T00:00:00+00:00", &Rfc3339).unwrap())))?;
    index_writer.add_document(doc!(title => "The Diary of Muadib", price => 29_240u64, date => DateTime::from_utc(OffsetDateTime::parse("2020-04-09T00:00:00+00:00", &Rfc3339).unwrap())))?;
    index_writer.add_document(doc!(title => "The Diary of Anne Frank", price => 18_240u64, date => DateTime::from_utc(OffsetDateTime::parse("2019-04-20T00:00:00+00:00", &Rfc3339).unwrap())))?;
    index_writer.add_document(doc!(title => "A Dairy Cow", price => 21_240u64, date => DateTime::from_utc(OffsetDateTime::parse("2019-04-09T00:00:00+00:00", &Rfc3339).unwrap())))?;
    index_writer.add_document(doc!(title => "The Diary of a Young Girl", price => 20_120u64, date => DateTime::from_utc(OffsetDateTime::parse("2018-04-09T00:00:00+00:00", &Rfc3339).unwrap())))?;
    index_writer.commit()?;

    let reader = index.reader()?;
    let searcher = reader.searcher();

    // "diary" matches the three "The Diary of ..." titles.
    let query_parser = QueryParser::for_index(&index, vec![title]);
    let query = query_parser.parse_query("diary")?;
    // Among those, only "The Diary of Muadib" (29_240) has a price strictly above 20_120.
    let filter_some_collector = FilterCollector::new(
        "price".to_string(),
        &|value: u64| value > 20_120u64,
        TopDocs::with_limit(2).order_by_score(),
    );
    let top_docs = searcher.search(&query, &filter_some_collector)?;

    assert_eq!(top_docs.len(), 1);
    assert_eq!(top_docs[0].1, DocAddress::new(0, 1));

    // No document has a price below 5: everything is filtered out.
    let filter_all_collector: FilterCollector<_, _, u64> = FilterCollector::new(
        "price".to_string(),
        &|value| value < 5u64,
        TopDocs::with_limit(2).order_by_score(),
    );
    let filtered_top_docs = searcher.search(&query, &filter_all_collector).unwrap();

    assert_eq!(filtered_top_docs.len(), 0);

    // Keeps the dates that are at least one whole week after 2019-04-09.
    fn date_filter(value: DateTime) -> bool {
        (value.into_utc() - OffsetDateTime::parse("2019-04-09T00:00:00+00:00", &Rfc3339).unwrap())
            .whole_weeks()
            > 0
    }

    let filter_dates_collector = FilterCollector::new(
        "date".to_string(),
        &date_filter,
        TopDocs::with_limit(5).order_by_score(),
    );
    let filtered_date_docs = searcher.search(&query, &filter_dates_collector)?;

    // Matching documents dated 2020-04-09 and 2019-04-20 pass; the one dated 2018-04-09
    // does not.
    assert_eq!(filtered_date_docs.len(), 2);
    Ok(())
}

/// Stores the address and the score of every collected document.
///
/// This collector is only used for tests: it keeps every single hit in memory, which
/// makes it unusable in practice.
pub struct TestCollector {
    /// Value returned by `requires_scoring`.
    pub compute_score: bool,
}

/// Segment-level collector of `TestCollector`.
pub struct TestSegmentCollector {
    /// Ordinal of the segment, used to build the `DocAddress` of each collected document.
    segment_id: SegmentOrdinal,
    /// Documents and scores collected so far.
    fruit: TestFruit,
}

/// Result of a `TestCollector`: the collected documents and their scores, stored as two
/// parallel vectors (`scores[i]` is the score of `docs[i]`).
#[derive(Default)]
pub struct TestFruit {
    /// Addresses of the collected documents, in collection order.
    docs: Vec<DocAddress>,
    /// Scores of the collected documents, in collection order.
    scores: Vec<Score>,
}

impl TestFruit {
    /// Returns the addresses of all of the collected documents.
    pub fn docs(&self) -> &[DocAddress] {
        self.docs.as_slice()
    }

    /// Returns the scores of all of the collected documents.
    pub fn scores(&self) -> &[Score] {
        self.scores.as_slice()
    }
}

impl Collector for TestCollector {
    type Fruit = TestFruit;
    type Child = TestSegmentCollector;

    /// Creates an empty segment collector that remembers the segment ordinal.
    fn for_segment(
        &self,
        segment_id: SegmentOrdinal,
        _reader: &SegmentReader,
    ) -> crate::Result<TestSegmentCollector> {
        let fruit = TestFruit::default();
        Ok(TestSegmentCollector { segment_id, fruit })
    }

    fn requires_scoring(&self) -> bool {
        self.compute_score
    }

    /// Concatenates the segment fruits, ordered by the segment ordinal of their first
    /// document (empty fruits are sorted as segment 0).
    fn merge_fruits(&self, mut children: Vec<TestFruit>) -> crate::Result<TestFruit> {
        children.sort_by_key(|fruit| fruit.docs().first().map_or(0, |addr| addr.segment_ord));
        let mut merged = TestFruit::default();
        for TestFruit { docs, scores } in children {
            merged.docs.extend(docs);
            merged.scores.extend(scores);
        }
        Ok(merged)
    }
}

impl SegmentCollector for TestSegmentCollector {
    type Fruit = TestFruit;

    fn collect(&mut self, doc: DocId, score: Score) {
        self.fruit.docs.push(DocAddress::new(self.segment_id, doc));
        self.fruit.scores.push(score);
    }

    fn harvest(self) -> <Self as SegmentCollector>::Fruit {
        self.fruit
    }
}

/// Collects, in order, all of the values of a `u64` fast field for all of the
/// docs in the `DocSet`.
///
/// This collector is mainly useful for tests.
pub struct FastFieldTestCollector {
    /// Name of the fast field to read.
    field: String,
}

/// Segment-level collector of `FastFieldTestCollector`.
pub struct FastFieldSegmentCollector {
    /// Values collected so far, in collection order.
    vals: Vec<u64>,
    /// Column of the fast field for this segment.
    reader: Column,
}

impl FastFieldTestCollector {
    pub fn for_field(field: impl ToString) -> FastFieldTestCollector {
        FastFieldTestCollector {
            field: field.to_string(),
        }
    }
}

impl Collector for FastFieldTestCollector {
    type Fruit = Vec<u64>;
    type Child = FastFieldSegmentCollector;

    /// Opens the `u64` column of the field for the segment.
    ///
    /// # Panics
    /// Panics if the column cannot be opened as a `u64` fast field.
    fn for_segment(
        &self,
        _: SegmentOrdinal,
        segment_reader: &SegmentReader,
    ) -> crate::Result<FastFieldSegmentCollector> {
        let fast_fields = segment_reader.fast_fields();
        let reader = fast_fields
            .u64(&self.field)
            .expect("Requested field is not a fast field.");
        let vals = Vec::new();
        Ok(FastFieldSegmentCollector { vals, reader })
    }

    fn requires_scoring(&self) -> bool {
        false
    }

    /// Concatenates the values of all segments, in the order the fruits are given.
    fn merge_fruits(&self, children: Vec<Vec<u64>>) -> crate::Result<Vec<u64>> {
        let merged: Vec<u64> = children.into_iter().flatten().collect();
        Ok(merged)
    }
}

impl SegmentCollector for FastFieldSegmentCollector {
    type Fruit = Vec<u64>;

    fn collect(&mut self, doc: DocId, _score: Score) {
        self.vals.extend(self.reader.values_for_doc(doc));
    }

    fn harvest(self) -> Vec<u64> {
        self.vals
    }
}

/// Collects, in order, all of the bytes of a bytes fast field for all of the
/// docs in the `DocSet`. The values are concatenated without any separator.
///
/// This collector is mainly useful for tests.
/// It is very slow.
pub struct BytesFastFieldTestCollector {
    /// Name of the bytes fast field to read.
    field: String,
}

/// Segment-level collector of `BytesFastFieldTestCollector`.
pub struct BytesFastFieldSegmentCollector {
    /// Bytes collected so far, concatenated in collection order.
    vals: Vec<u8>,
    /// Bytes column of the field for this segment, if any; nothing is collected when `None`.
    column_opt: Option<BytesColumn>,
    /// Scratch buffer handed to `ord_to_bytes` for each term ordinal.
    buffer: Vec<u8>,
}

impl BytesFastFieldTestCollector {
    pub fn for_field(field: impl ToString) -> BytesFastFieldTestCollector {
        BytesFastFieldTestCollector {
            field: field.to_string(),
        }
    }
}

impl Collector for BytesFastFieldTestCollector {
    type Fruit = Vec<u8>;
    type Child = BytesFastFieldSegmentCollector;

    /// Opens the bytes column of the field for the segment; the column is optional.
    fn for_segment(
        &self,
        _segment_local_id: u32,
        segment_reader: &SegmentReader,
    ) -> crate::Result<BytesFastFieldSegmentCollector> {
        let fast_fields = segment_reader.fast_fields();
        let column_opt = fast_fields.bytes(&self.field)?;
        let segment_collector = BytesFastFieldSegmentCollector {
            vals: Vec::new(),
            column_opt,
            buffer: Vec::new(),
        };
        Ok(segment_collector)
    }

    fn requires_scoring(&self) -> bool {
        false
    }

    /// Concatenates the bytes of all segments, in the order the fruits are given.
    fn merge_fruits(&self, children: Vec<Vec<u8>>) -> crate::Result<Vec<u8>> {
        let merged: Vec<u8> = children.into_iter().flatten().collect();
        Ok(merged)
    }
}

impl SegmentCollector for BytesFastFieldSegmentCollector {
    type Fruit = Vec<u8>;

    fn collect(&mut self, doc: DocId, _score: Score) {
        if let Some(column) = self.column_opt.as_ref() {
            for term_ord in column.term_ords(doc) {
                let (vals, buffer) = (&mut self.vals, &mut self.buffer);
                if column.ord_to_bytes(term_ord, buffer).unwrap() {
                    vals.extend(&buffer[..]);
                }
            }
        }
    }

    fn harvest(self) -> <Self as SegmentCollector>::Fruit {
        self.vals
    }
}

/// Builds a searcher over an in-RAM index with an empty schema, containing two empty
/// documents added in a single commit.
fn make_test_searcher() -> crate::Result<Searcher> {
    let index = Index::create_in_ram(Schema::builder().build());
    let mut index_writer = index.writer_for_tests()?;
    for _ in 0..2 {
        index_writer.add_document(TantivyDocument::default())?;
    }
    index_writer.commit()?;
    let reader = index.reader()?;
    Ok(reader.searcher())
}

/// A `Some(collector)` behaves like the wrapped collector, with the fruit wrapped in `Some`.
#[test]
fn test_option_collector_some() -> crate::Result<()> {
    let searcher = make_test_searcher()?;
    let some_collector = Some(Count);
    let counts = searcher.search(&AllQuery, &some_collector)?;
    assert_eq!(counts, Some(2));
    Ok(())
}

/// A `None` collector yields a `None` fruit.
#[test]
fn test_option_collector_none() -> crate::Result<()> {
    let searcher = make_test_searcher()?;
    let counts = searcher.search(&AllQuery, &None::<Count>)?;
    assert_eq!(counts, None);
    Ok(())
}


================================================
FILE: src/collector/top_collector.rs
================================================
use serde::{Deserialize, Serialize};

/// Contains a feature (field, score, etc.) of a document along with the document address.
///
/// Used only by TopNComputer, which implements the actual comparison via a `Comparator`.
#[derive(Clone, Default, Eq, PartialEq, Serialize, Deserialize)]
pub struct ComparableDoc<T, D> {
    /// The feature of the document. In practice, this is
    /// a type which can be compared with a `Comparator<T>`.
    pub sort_key: T,
    /// The document address. In practice, this is either a `DocId` or `DocAddress`.
    pub doc: D,
}

/// Manual `Debug` implementation, printing the struct as
/// `ComparableDoc { feature: .., doc: .. }`.
impl<T: std::fmt::Debug, D: std::fmt::Debug> std::fmt::Debug for ComparableDoc<T, D> {
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        f.debug_struct("ComparableDoc")
            // NOTE(review): the `sort_key` field is printed under the label "feature";
            // confirm whether this label is intentional before renaming it, as it changes
            // the debug output.
            .field("feature", &self.sort_key)
            .field("doc", &self.doc)
            .finish()
    }
}


================================================
FILE: src/collector/top_score_collector.rs
================================================
use std::cmp::Ordering;
use std::fmt;
use std::ops::Range;

use serde::{Deserialize, Serialize};

use super::Collector;
use crate::collector::sort_key::{
    Comparator, ComparatorEnum, NaturalComparator, ReverseComparator, SortBySimilarityScore,
    SortByStaticFastValue, SortByString,
};
use crate::collector::sort_key_top_collector::TopBySortKeyCollector;
use crate::collector::top_collector::ComparableDoc;
use crate::collector::{SegmentSortKeyComputer, SortKeyComputer};
use crate::fastfield::FastValue;
use crate::{DocAddress, DocId, Order, Score, SegmentReader};

/// The `TopDocs` collector keeps track of the top `K` documents
/// sorted by their score.
///
/// The implementation is based on repeatedly truncating on the median after `K * 2`
/// documents, using pattern-defeating quicksort.
/// The theoretical complexity for collecting the top `K` out of `N` documents
/// is `O(N + K)`.
///
/// This collector guarantees a stable sorting in case of a tie on the
/// document score/sort key: The document address (`DocAddress`) is used as a tie breaker.
/// In case of a tie on the sort key, documents are always sorted by ascending `DocAddress`.
///
/// ```rust
/// use tantivy::collector::TopDocs;
/// use tantivy::query::QueryParser;
/// use tantivy::schema::{Schema, TEXT};
/// use tantivy::{doc, DocAddress, Index};
///
/// # fn main() -> tantivy::Result<()> {
/// let mut schema_builder = Schema::builder();
/// let title = schema_builder.add_text_field("title", TEXT);
/// let schema = schema_builder.build();
/// let index = Index::create_in_ram(schema);
///
/// let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
/// index_writer.add_document(doc!(title => "The Name of the Wind"))?;
/// index_writer.add_document(doc!(title => "The Diary of Muadib"))?;
/// index_writer.add_document(doc!(title => "A Dairy Cow"))?;
/// index_writer.add_document(doc!(title => "The Diary of a Young Girl"))?;
/// index_writer.commit()?;
///
/// let reader = index.reader()?;
/// let searcher = reader.searcher();
///
/// let query_parser = QueryParser::for_index(&index, vec![title]);
/// let query = query_parser.parse_query("diary")?;
/// let top_docs = searcher.search(&query, &TopDocs::with_limit(2).order_by_score())?;
///
/// assert_eq!(top_docs[0].1, DocAddress::new(0, 1));
/// assert_eq!(top_docs[1].1, DocAddress::new(0, 3));
/// # Ok(())
/// # }
/// ```
pub struct TopDocs {
    /// Maximum number of documents to return.
    limit: usize,
    /// Number of top documents to skip before the returned ones.
    offset: usize,
}

impl fmt::Debug for TopDocs {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        write!(f, "TopDocs(limit={}, offset={})", self.limit, self.offset)
    }
}

impl TopDocs {
    /// Builds a `TopDocs` capturing a given document range.
    ///
    /// The range start..end translates in a limit of `end - start`
    /// and an offset of start.
    pub fn for_doc_range(doc_range: Range<usize>) -> Self {
        TopDocs {
            limit: doc_range.end.saturating_sub(doc_range.start),
            offset: doc_range.start,
        }
    }

    /// Returns the doc range we are trying to capture, i.e. `offset..offset + limit`.
    ///
    /// The end of the range saturates at `usize::MAX` instead of overflowing when
    /// `offset + limit` does not fit in a `usize`.
    pub fn doc_range(&self) -> Range<usize> {
        let end = self.offset.saturating_add(self.limit);
        self.offset..end
    }

    /// Creates a top score collector, with a number of documents equal to "limit".
    ///
    /// # Panics
    /// The method panics if limit is 0
    pub fn with_limit(limit: usize) -> TopDocs {
        assert_ne!(limit, 0, "Limit must be greater than 0");
        TopDocs { limit, offset: 0 }
    }

    /// Skip the first "offset" documents when collecting.
    ///
    /// This is equivalent to `OFFSET` in MySQL or PostgreSQL and `start` in
    /// Lucene's TopDocsCollector.
    ///
    /// The limit of the collector is left untouched.
    ///
    /// # Example
    ///
    /// ```rust
    /// use tantivy::collector::TopDocs;
    /// use tantivy::query::QueryParser;
    /// use tantivy::schema::{Schema, TEXT};
    /// use tantivy::{doc, DocAddress, Index};
    ///
    /// # fn main() -> tantivy::Result<()> {
    /// let mut schema_builder = Schema::builder();
    /// let title = schema_builder.add_text_field("title", TEXT);
    /// let schema = schema_builder.build();
    /// let index = Index::create_in_ram(schema);
    ///
    /// let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
    /// index_writer.add_document(doc!(title => "The Name of the Wind"))?;
    /// index_writer.add_document(doc!(title => "The Diary of Muadib"))?;
    /// index_writer.add_document(doc!(title => "A Dairy Cow"))?;
    /// index_writer.add_document(doc!(title => "The Diary of a Young Girl"))?;
    /// index_writer.add_document(doc!(title => "The Diary of Lena Mukhina"))?;
    /// index_writer.commit()?;
    ///
    /// let reader = index.reader()?;
    /// let searcher = reader.searcher();
    ///
    /// let query_parser = QueryParser::for_index(&index, vec![title]);
    /// let query = query_parser.parse_query("diary")?;
    /// let top_docs = searcher.search(&query, &TopDocs::with_limit(2).and_offset(1).order_by_score())?;
    ///
    /// assert_eq!(top_docs.len(), 2);
    /// assert_eq!(top_docs[0].1, DocAddress::new(0, 4));
    /// assert_eq!(top_docs[1].1, DocAddress::new(0, 3));
    /// # Ok(())
    /// # }
    /// ```
    #[must_use]
    pub fn and_offset(self, offset: usize) -> TopDocs {
        TopDocs { offset, ..self }
    }

    /// Set top-K to rank documents by a given fast field.
    ///
    /// If the field is not a fast field or does not exist, this method returns successfully (it
    /// is not aware of any schema). An error will be returned at the moment of search.
    ///
    /// If the field is a FAST field but not a u64 field, search will return successfully but it
    /// will return a monotonic u64-representation (ie. the order is still correct) of
    /// the requested field type.
    ///
    /// # Example
    ///
    /// ```rust
    /// # use tantivy::schema::{Schema, FAST, TEXT};
    /// # use tantivy::{doc, Index, DocAddress, Order};
    /// # use tantivy::query::{Query, QueryParser};
    /// use tantivy::Searcher;
    /// use tantivy::collector::TopDocs;
    ///
    /// # fn main() -> tantivy::Result<()> {
    /// #   let mut schema_builder = Schema::builder();
    /// #   let title = schema_builder.add_text_field("title", TEXT);
    /// #   let rating = schema_builder.add_u64_field("rating", FAST);
    /// #   let schema = schema_builder.build();
    /// #
    /// #   let index = Index::create_in_ram(schema);
    /// #   let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
    /// #   index_writer.add_document(doc!(title => "The Name of the Wind", rating => 92u64))?;
    /// #   index_writer.add_document(doc!(title => "The Diary of Muadib", rating => 97u64))?;
    /// #   index_writer.add_document(doc!(title => "A Dairy Cow", rating => 63u64))?;
    /// #   index_writer.add_document(doc!(title => "The Diary of a Young Girl", rating => 80u64))?;
    /// #   index_writer.commit()?;
    /// #   let reader = index.reader()?;
    /// #   let query = QueryParser::for_index(&index, vec![title]).parse_query("diary")?;
    /// #   let top_docs = docs_sorted_by_rating(&reader.searcher(), &query)?;
    /// #   assert_eq!(top_docs,
    /// #            vec![(Some(97u64), DocAddress::new(0u32, 1)),
    /// #                 (Some(80u64), DocAddress::new(0u32, 3))]);
    /// #   Ok(())
    /// # }
    /// /// Searches the document matching the given query, and
    /// /// collects the top 10 documents, ordered by the u64
    /// /// `rating` fast field.
    /// fn docs_sorted_by_rating(searcher: &Searcher,
    ///                          query: &dyn Query)
    ///     -> tantivy::Result<Vec<(Option<u64>, DocAddress)>> {
    ///
    ///     // This is where we build our topdocs collector
    ///     //
    ///     // Note the `rating` field needs to be a FAST field here.
    ///     let top_books_by_rating = TopDocs
    ///                 ::with_limit(10)
    ///                  .order_by_u64_field("rating", Order::Desc);
    ///
    ///     // ... and here are our documents. Note this is a simple vec.
    ///     // The `u64` in the pair is the value of our fast field for
    ///     // each documents.
    ///     //
    ///     // The vec is sorted decreasingly by the `rating` value, and has a
    ///     // length of 10, or less if not enough documents matched the
    ///     // query.
    ///     let resulting_docs: Vec<(Option<u64>, DocAddress)> =
    ///          searcher.search(query, &top_books_by_rating)?;
    ///
    ///     Ok(resulting_docs)
    /// }
    /// ```
    ///
    /// # See also
    ///
    /// To comfortably work with `u64`s, `i64`s, `f64`s, or `date`s, please refer to
    /// the [.order_by_fast_field(...)](TopDocs::order_by_fast_field) method.
    pub fn order_by_u64_field(
        self,
        field: impl ToString,
        order: Order,
    ) -> impl Collector<Fruit = Vec<(Option<u64>, DocAddress)>> {
        self.order_by((SortByStaticFastValue::for_field(field), order))
    }

    /// Order docs by decreasing BM25 similarity score.
    ///
    /// The returned collector yields `(Score, DocAddress)` pairs for the doc range
    /// captured by this `TopDocs`.
    pub fn order_by_score(self) -> impl Collector<Fruit = Vec<(Score, DocAddress)>> {
        let doc_range = self.doc_range();
        TopBySortKeyCollector::new(SortBySimilarityScore, doc_range)
    }

    /// Set top-K to rank documents by a given fast field.
    ///
    /// If the field is not a fast field, or its field type does not match the generic type, this
    /// method does not panic, but an explicit error will be returned at the moment of
    /// collection.
    ///
    /// Note that this method is generic. The requested fast field type will often be
    /// inferred in your code by the rust compiler.
    ///
    /// Implementation-wise, for performance reason, tantivy will manipulate the u64 representation
    /// of your fast field until the last moment.
    ///
    /// # Example
    ///
    /// ```rust
    /// # use tantivy::schema::{Schema, FAST, TEXT};
    /// # use tantivy::{doc, Index, DocAddress,Order};
    /// # use tantivy::query::{Query, AllQuery};
    /// use tantivy::Searcher;
    /// use tantivy::collector::TopDocs;
    ///
    /// # fn main() -> tantivy::Result<()> {
    /// #   let mut schema_builder = Schema::builder();
    /// #   let title = schema_builder.add_text_field("company", TEXT);
    /// #   let revenue = schema_builder.add_i64_field("revenue", FAST);
    /// #   let schema = schema_builder.build();
    /// #
    /// #   let index = Index::create_in_ram(schema);
    /// #   let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
    /// #   index_writer.add_document(doc!(title => "MadCow Inc.", revenue => 92_000_000i64))?;
    /// #   index_writer.add_document(doc!(title => "Zozo Cow KKK", revenue => 119_000_000i64))?;
    /// #   index_writer.add_document(doc!(title => "Declining Cow", revenue => -63_000_000i64))?;
    /// #   assert!(index_writer.commit().is_ok());
    /// #   let reader = index.reader()?;
    /// #   let top_docs = docs_sorted_by_revenue(&reader.searcher(), &AllQuery, "revenue")?;
    /// #   assert_eq!(top_docs,
    /// #            vec![(Some(119_000_000i64), DocAddress::new(0, 1)),
    /// #                 (Some(92_000_000i64), DocAddress::new(0, 0))]);
    /// #   Ok(())
    /// # }
    /// /// Searches the document matching the given query, and
    /// /// collects the top 2 documents, ordered by the i64 fast field
    /// /// `revenue_field` given in argument.
    /// fn docs_sorted_by_revenue(searcher: &Searcher,
    ///                          query: &dyn Query,
    ///                          revenue_field: &str)
    ///     -> tantivy::Result<Vec<(Option<i64>, DocAddress)>> {
    ///
    ///     // This is where we build our topdocs collector
    ///     //
    ///     // Note the generic parameter (inferred here from the type of
    ///     // `resulting_docs` below) needs to match the type of the fast
    ///     // field. `revenue_field` here is a FAST i64 field.
    ///     let top_company_by_revenue = TopDocs
    ///                 ::with_limit(2)
    ///                  .order_by_fast_field(revenue_field, Order::Desc);
    ///
    ///     // ... and here are our documents. Note this is a simple vec.
    ///     // The `i64` in the pair is the value of our fast field for
    ///     // each documents.
    ///     //
    ///     // The vec is sorted decreasingly by the fast field value, and has a
    ///     // length of 2, or less if not enough documents matched the
    ///     // query.
    ///     let resulting_docs: Vec<(Option<i64>, DocAddress)> =
    ///          searcher.search(query, &top_company_by_revenue)?;
    ///
    ///     Ok(resulting_docs)
    /// }
    /// ```
    pub fn order_by_fast_field<TFastValue>(
        self,
        fast_field: impl ToString,
        order: Order,
    ) -> impl Collector<Fruit = Vec<(Option<TFastValue>, DocAddress)>>
    where
        TFastValue: FastValue,
        ComparatorEnum: Comparator<Option<TFastValue>>,
    {
        self.order_by((SortByStaticFastValue::for_field(fast_field), order))
    }

    /// Like `order_by_fast_field`, but for a `String` fast field.
    ///
    /// The sort key returned alongside each `DocAddress` is an `Option<String>`.
    pub fn order_by_string_fast_field(
        self,
        fast_field: impl ToString,
        order: Order,
    ) -> impl Collector<Fruit = Vec<(Option<String>, DocAddress)>> {
        let field_name = fast_field.to_string();
        self.order_by((SortByString::for_field(field_name), order))
    }

    /// Ranks the documents using the sort key produced by `sort_key_computer`.
    ///
    /// The returned collector yields `(sort key, DocAddress)` pairs for the doc
    /// range captured by this `TopDocs`.
    pub fn order_by<TSortKey>(
        self,
        sort_key_computer: impl SortKeyComputer<SortKey = TSortKey> + Send + 'static,
    ) -> impl Collector<Fruit = Vec<(TSortKey, DocAddress)>>
    where
        TSortKey: 'static + Clone + Send + Sync + std::fmt::Debug,
    {
        let doc_range = self.doc_range();
        TopBySortKeyCollector::new(sort_key_computer, doc_range)
    }

    /// Helper function to tweak the similarity score of documents using a function.
    /// (usually a closure).
    ///
    /// This method offers a convenient way to tweak or replace
    /// the documents score. As suggested by the prototype you can
    /// manually define your own [`SortKeyComputer`]
    /// and pass it as an argument, but there is a much simpler way to
    /// tweak your score: you can use a closure as in the following
    /// example.
    ///
    /// # Example
    ///
    /// Typically, you will want to rely on one or more fast fields,
    /// to alter the original relevance `Score`.
    ///
    /// For instance, in the following, we assume that we are implementing
    /// an e-commerce website that has a fast field called `popularity`
    /// that rates whether a product is typically often bought by users.
    ///
    /// In the following example we will tweak our ranking a bit by
    /// boosting popular products a notch.
    ///
    /// In a more serious application, this tweaking could involve running a
    /// learning-to-rank model over various features
    ///
    /// ```rust
    /// # use tantivy::schema::{Schema, FAST, TEXT};
    /// # use tantivy::{doc, Index, DocAddress, DocId, Score};
    /// # use tantivy::query::QueryParser;
    /// use tantivy::SegmentReader;
    /// use tantivy::collector::TopDocs;
    /// use tantivy::schema::Field;
    ///
    /// fn create_schema() -> Schema {
    ///    let mut schema_builder = Schema::builder();
    ///    schema_builder.add_text_field("product_name", TEXT);
    ///    schema_builder.add_u64_field("popularity", FAST);
    ///    schema_builder.build()
    /// }
    ///
    /// fn create_index() -> tantivy::Result<Index> {
    ///   let schema = create_schema();
    ///   let index = Index::create_in_ram(schema);
    ///   let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
    ///   let product_name = index.schema().get_field("product_name").unwrap();
    ///   let popularity: Field = index.schema().get_field("popularity").unwrap();
    ///   index_writer.add_document(doc!(product_name => "The Diary of Muadib", popularity => 1u64))?;
    ///   index_writer.add_document(doc!(product_name => "A Dairy Cow", popularity => 10u64))?;
    ///   index_writer.add_document(doc!(product_name => "The Diary of a Young Girl", popularity => 15u64))?;
    ///   index_writer.commit()?;
    ///   Ok(index)
    /// }
    ///
    /// let index = create_index().unwrap();
    /// let product_name = index.schema().get_field("product_name").unwrap();
    /// let popularity: Field = index.schema().get_field("popularity").unwrap();
    ///
    /// let user_query_str = "diary";
    /// let query_parser = QueryParser::for_index(&index, vec![product_name]);
    /// let query = query_parser.parse_query(user_query_str).unwrap();
    ///
    /// // This is where we build our collector with our custom score.
    /// let top_docs_by_custom_score = TopDocs
    ///         ::with_limit(10)
    ///          .tweak_score(move |segment_reader: &SegmentReader| {
    ///             // The argument is a function that returns our scoring
    ///             // function.
    ///             //
    ///             // The point of this "mother" function is to gather all
    ///             // of the segment level information we need for scoring.
    ///             // Typically, fast_fields.
    ///             //
    ///             // In our case, we will get a reader for the popularity
    ///             // fast field. For simplicity we read the first or default value in the fast
    ///             // field.
    ///             let popularity_reader =
    ///                 segment_reader.fast_fields().u64("popularity").unwrap().first_or_default_col(0);
    ///
    ///             // We can now define our actual scoring function
    ///             move |doc: DocId, original_score: Score| {
    ///                 let popularity: u64 = popularity_reader.get_val(doc);
    ///                 // Well.. For the sake of the example we use a simple logarithm
    ///                 // function.
    ///                 let popularity_boost_score = ((2u64 + popularity) as Score).log2();
    ///                 popularity_boost_score * original_score
    ///             }
    ///           });
    /// let reader = index.reader().unwrap();
    /// let searcher = reader.searcher();
    /// // ... and here are our documents. Note this is a simple vec.
    /// // The `Score` in the pair is our tweaked score.
    /// let resulting_docs: Vec<(Score, DocAddress)> =
    ///      searcher.search(&query, &top_docs_by_custom_score).unwrap();
    /// ```
    pub fn tweak_score<F, TSortKey>(
        self,
        sort_key_fn: F,
    ) -> impl Collector<Fruit = Vec<(TSortKey, DocAddress)>>
    where
        F: 'static + Send + Sync,
        TSortKey: 'static + PartialOrd + Clone + Send + Sync + std::fmt::Debug,
        TweakScoreFn<F>: SortKeyComputer<SortKey = TSortKey>,
    {
        self.order_by(TweakScoreFn(sort_key_fn))
    }
}

/// Helper struct that makes it possible to define a sort key computer from a
/// simple function (usually a closure).
///
/// The wrapped function is called with a `SegmentReader` and returns the
/// per-document function mapping a `(DocId, Score)` pair to a sort key.
pub struct TweakScoreFn<F>(F);

impl<F, TTweakScoreSortKeyFn, TSortKey> SortKeyComputer for TweakScoreFn<F>
where
    F: 'static + Send + Sync + Fn(&SegmentReader) -> TTweakScoreSortKeyFn,
    TTweakScoreSortKeyFn: 'static + Fn(DocId, Score) -> TSortKey,
    TweakScoreSegmentSortKeyComputer<TTweakScoreSortKeyFn>:
        SegmentSortKeyComputer<SortKey = TSortKey, SegmentSortKey = TSortKey>,
    TSortKey: 'static + PartialOrd + Clone + Send + Sync + std::fmt::Debug,
{
    type SortKey = TSortKey;
    type Child = TweakScoreSegmentSortKeyComputer<TTweakScoreSortKeyFn>;
    type Comparator = NaturalComparator;

    fn requires_scoring(&self) -> bool {
        true
    }

    fn segment_sort_key_computer(
        &self,
        segment_reader: &SegmentReader,
    ) -> crate::Result<Self::Child> {
        Ok({
            TweakScoreSegmentSortKeyComputer {
                sort_key_fn: (self.0)(segment_reader),
            }
        })
    }
}

/// Segment-level sort key computer produced by [`TweakScoreFn`].
///
/// It holds the per-document function, which maps a `(DocId, Score)` pair to a sort key.
pub struct TweakScoreSegmentSortKeyComputer<TTweakScoreSortKeyFn> {
    // Function invoked for every collected document.
    sort_key_fn: TTweakScoreSortKeyFn,
}

impl<TTweakScoreSortKeyFn, TSortKey> SegmentSortKeyComputer
    for TweakScoreSegmentSortKeyComputer<TTweakScoreSortKeyFn>
where
    TTweakScoreSortKeyFn: 'static + Fn(DocId, Score) -> TSortKey,
    TSortKey: 'static + PartialOrd + Clone + Send + Sync,
{
    type SortKey = TSortKey;
    type SegmentSortKey = TSortKey;
    type SegmentComparator = NaturalComparator;

    /// Computes the sort key of `doc` by handing it, together with its similarity
    /// `score`, to the wrapped function.
    fn segment_sort_key(&mut self, doc: DocId, score: Score) -> TSortKey {
        let tweak = &self.sort_key_fn;
        tweak(doc, score)
    }

    /// Convert a segment level score into the global level score.
    ///
    /// Both levels use the same type here, so the key is returned untouched.
    fn convert_segment_sort_key(&self, segment_sort_key: Self::SegmentSortKey) -> Self::SortKey {
        segment_sort_key
    }
}

/// Fast TopN Computation
///
/// Capacity of the vec is 2 * top_n.
/// The buffer is truncated to the top_n elements when it reaches the capacity of the Vec.
/// That means capacity has special meaning and should be carried over when cloning or serializing.
///
/// For TopN == 0, it will be relatively expensive.
///
/// The TopNComputer will tiebreak by using ascending `D` (DocId or DocAddress):
/// i.e., in case of a tie on the sort key, the `DocId|DocAddress` are always sorted in
/// ascending order, regardless of the `Comparator` used for the `Score` type.
///
/// NOTE: Items must be `push`ed to the TopNComputer in ascending `DocId|DocAddress` order, as the
/// threshold used to eliminate docs does not include the `DocId` or `DocAddress`: this provides
/// the ascending `DocId|DocAddress` tie-breaking behavior without additional comparisons.
#[derive(Serialize, Deserialize)]
#[serde(from = "TopNComputerDeser<Score, D, C>")]
pub struct TopNComputer<Score, D, C> {
    /// The buffer reverses sort order to get top-semantics instead of bottom-semantics
    buffer: Vec<ComparableDoc<Score, D>>,
    /// Number of elements kept by each truncation and returned at the end.
    top_n: usize,
    /// Sort key recorded by the last truncation, if any. `push` ignores documents
    /// whose sort key does not compare strictly greater than it.
    pub(crate) threshold: Option<Score>,
    /// Comparator used to order the sort keys.
    comparator: C,
}

// Intermediate struct for TopNComputer for deserialization, to keep vec capacity.
//
// It mirrors the fields of `TopNComputer`. `TopNComputer` is deserialized through
// it (see the `#[serde(from = ...)]` attribute) so that the `From` conversion gets
// a chance to restore the capacity of the buffer.
#[derive(Deserialize)]
struct TopNComputerDeser<Score, D, C> {
    buffer: Vec<ComparableDoc<Score, D>>,
    top_n: usize,
    threshold: Option<Score>,
    comparator: C,
}

impl<Score, D, C> From<TopNComputerDeser<Score, D, C>> for TopNComputer<Score, D, C> {
    /// Rebuilds a `TopNComputer` from its deserialized form, restoring the buffer
    /// capacity of `2 * max(top_n, 1)` that `TopNComputer` relies on to decide when
    /// to truncate.
    fn from(mut value: TopNComputerDeser<Score, D, C>) -> Self {
        let expected_cap = value.top_n.max(1) * 2;
        if value.buffer.capacity() < expected_cap {
            // `reserve_exact` takes the number of elements to make room for *on top
            // of the current length*, not on top of the current capacity.
            // `len <= capacity < expected_cap`, so the subtraction cannot underflow.
            let additional = expected_cap - value.buffer.len();
            value.buffer.reserve_exact(additional);
        } else {
            value.buffer.shrink_to(expected_cap);
        }

        TopNComputer {
            buffer: value.buffer,
            top_n: value.top_n,
            threshold: value.threshold,
            comparator: value.comparator,
        }
    }
}

impl<Score: std::fmt::Debug, D, C> std::fmt::Debug for TopNComputer<Score, D, C>
where C: Comparator<Score>
{
    /// Debug output summarizes the buffer by its length instead of listing its
    /// elements.
    fn fmt(&self, f: &mut fmt::Formatter) -> std::fmt::Result {
        let mut debug_struct = f.debug_struct("TopNComputer");
        debug_struct.field("buffer_len", &self.buffer.len());
        debug_struct.field("top_n", &self.top_n);
        debug_struct.field("current_threshold", &self.threshold);
        debug_struct.field("comparator", &self.comparator);
        debug_struct.finish()
    }
}

// Custom clone to keep capacity
impl<Score: Clone, D: Clone, C: Clone> Clone for TopNComputer<Score, D, C> {
    fn clone(&self) -> Self {
        let mut buffer_clone = Vec::with_capacity(self.buffer.capacity());
        buffer_clone.extend(self.buffer.iter().cloned());
        TopNComputer {
            buffer: buffer_clone,
            top_n: self.top_n,
            threshold: self.threshold.clone(),
            comparator: self.comparator.clone(),
        }
    }
}

impl<TSortKey, D> TopNComputer<TSortKey, D, ReverseComparator>
where
    D: Ord,
    TSortKey: Clone,
    NaturalComparator: Comparator<TSortKey>,
{
    /// Create a new `TopNComputer` ordering its sort keys with `ReverseComparator`.
    /// Internally it will allocate a buffer of size `2 * top_n`.
    pub fn new(top_n: usize) -> Self {
        let comparator = ReverseComparator;
        Self::new_with_comparator(top_n, comparator)
    }
}

/// Total order used to select and sort the top K hits.
///
/// Hits are ordered by sort key first, the comparator's verdict being reversed
/// because we want the top K to come first. Regardless of asc/desc, in presence
/// of a tie on the sort key, hits are ordered by ascending doc.
#[inline(always)]
fn compare_for_top_k<TSortKey, D: Ord, C: Comparator<TSortKey>>(
    c: &C,
    lhs: &ComparableDoc<TSortKey, D>,
    rhs: &ComparableDoc<TSortKey, D>,
) -> std::cmp::Ordering {
    match c.compare(&lhs.sort_key, &rhs.sort_key) {
        std::cmp::Ordering::Equal => lhs.doc.cmp(&rhs.doc),
        by_sort_key => by_sort_key.reverse(),
    }
}

impl<TSortKey, D, C> TopNComputer<TSortKey, D, C>
where
    D: Ord,
    TSortKey: Clone,
    C: Comparator<TSortKey>,
{
    /// Create a new `TopNComputer` ordering its sort keys with `comparator`.
    /// Internally it will allocate a buffer of size `2 * top_n`
    /// (or 2 when `top_n` is 0).
    pub fn new_with_comparator(top_n: usize, comparator: C) -> Self {
        let buffer = Vec::with_capacity(top_n.max(1) * 2);
        Self {
            buffer,
            top_n,
            threshold: None,
            comparator,
        }
    }

    /// Push a new document to the top n.
    /// If the document is not strictly above the current threshold, it will be ignored.
    ///
    /// NOTE: `push` must be called in ascending `DocId`/`DocAddress` order.
    #[inline]
    pub fn push(&mut self, sort_key: TSortKey, doc: D) {
        // See the struct docs for an explanation of why this comparison is strict.
        let is_rejected = match &self.threshold {
            Some(last_median) => {
                self.comparator.compare(&sort_key, last_median) != Ordering::Greater
            }
            None => false,
        };
        if !is_rejected {
            self.append_doc(doc, sort_key);
        }
    }

    // Append a document to the top n.
    //
    // At this point, we need to have established that the doc is above the threshold.
    #[inline(always)]
    pub(crate) fn append_doc(&mut self, doc: D, sort_key: TSortKey) {
        let is_full = self.buffer.len() == self.buffer.capacity();
        if is_full {
            self.threshold = Some(self.truncate_top_n());
        }
        // This cannot panic, because `truncate_top_n` will at least remove one element, since
        // the min capacity is 2.
        push_assuming_capacity(ComparableDoc { doc, sort_key }, &mut self.buffer);
    }

    // Keeps only the `top_n` best elements of the buffer and returns the sort key
    // of the element that was ranked at index `top_n`.
    #[inline(never)]
    fn truncate_top_n(&mut self) -> TSortKey {
        let comparator = &self.comparator;
        // Use select_nth_unstable to find the top nth score
        let (_, nth_best, _) = self
            .buffer
            .select_nth_unstable_by(self.top_n, |lhs, rhs| compare_for_top_k(comparator, lhs, rhs));
        let new_threshold = nth_best.sort_key.clone();

        // Remove all elements below the top_n
        self.buffer.truncate(self.top_n);
        new_threshold
    }

    /// Returns the top n elements in sorted order.
    pub fn into_sorted_vec(mut self) -> Vec<ComparableDoc<TSortKey, D>> {
        let has_excess = self.buffer.len() > self.top_n;
        if has_excess {
            self.truncate_top_n();
        }
        let Self {
            mut buffer,
            comparator,
            ..
        } = self;
        buffer.sort_unstable_by(|lhs, rhs| compare_for_top_k(&comparator, lhs, rhs));
        buffer
    }

    /// Returns the top n elements in stored order.
    /// Useful if you do not need the elements in sorted order,
    /// for example when merging the results of multiple segments.
    pub fn into_vec(mut self) -> Vec<ComparableDoc<TSortKey, D>> {
        let has_excess = self.buffer.len() > self.top_n;
        if has_excess {
            self.truncate_top_n();
        }
        self.buffer
    }
}

// Appends `el` to `buf` without ever growing the vec.
//
// Panics if there is not enough capacity to add an element.
#[inline(always)]
fn push_assuming_capacity<T>(el: T, buf: &mut Vec<T>) {
    let len = buf.len();
    assert!(len < buf.capacity());
    // This is mimicking the current (non-stabilized) implementation in std.
    // SAFETY: the assert above guarantees that the slot at index `len` lies within
    // the allocation. The slot is written before the length is bumped to cover it.
    unsafe {
        buf.as_mut_ptr().add(len).write(el);
        buf.set_len(len + 1);
    }
}

#[cfg(test)]
mod tests {
    use proptest::prelude::*;

    use super::{TopDocs, TopNComputer};
    use crate::collector::sort_key::{ComparatorEnum, NaturalComparator, ReverseComparator};
    use crate::collector::top_collector::ComparableDoc;
    use crate::collector::{Collector, DocSetCollector};
    use crate::query::{AllQuery, Query, QueryParser};
    use crate::schema::{Field, Schema, FAST, STORED, TEXT};
    use crate::time::format_description::well_known::Rfc3339;
    use crate::time::OffsetDateTime;
    use crate::{
        assert_nearly_equals, DateTime, DocAddress, DocId, Index, IndexWriter, Order, Score,
        SegmentReader,
    };

    // Builds an in-RAM index with a single `text` field holding three short documents.
    fn make_index() -> crate::Result<Index> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        // writing the segment
        let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
        for text in [
            "Hello happy tax payer.",
            "Droopy says hello happy tax payer",
            "I like Droopy",
        ] {
            index_writer.add_document(doc!(text_field => text))?;
        }
        index_writer.commit()?;
        Ok(index)
    }

    // Asserts that `results` and `expected` hold the same hits in the same order:
    // doc addresses must be equal and scores nearly equal.
    fn assert_results_equals(results: &[(Score, DocAddress)], expected: &[(Score, DocAddress)]) {
        // `zip` stops at the shorter slice, so the lengths have to be compared
        // explicitly for missing or extra results to be detected.
        assert_eq!(
            results.len(),
            expected.len(),
            "unexpected number of results"
        );
        for (result, expected) in results.iter().zip(expected.iter()) {
            assert_eq!(result.1, expected.1);
            crate::assert_nearly_equals!(result.0, expected.0);
        }
    }

    // A computer built with `top_n == 0` must not return any document.
    #[test]
    fn test_empty_topn_computer() {
        let mut computer: TopNComputer<u32, u32, NaturalComparator> =
            TopNComputer::new_with_comparator(0, NaturalComparator);

        for doc in 1u32..=3u32 {
            computer.push(1u32, doc);
        }
        assert!(computer.into_vec().is_empty());
    }

    // The two highest sort keys are returned, best first. The tie on sort key 2
    // is resolved in favor of the lowest doc.
    #[test]
    fn test_topn_computer() {
        let mut computer: TopNComputer<u32, u32, NaturalComparator> =
            TopNComputer::new_with_comparator(2, NaturalComparator);

        for (sort_key, doc) in [(1u32, 1u32), (2u32, 2u32), (3u32, 3u32), (2u32, 4u32), (1u32, 5u32)]
        {
            computer.push(sort_key, doc);
        }

        let expected = vec![
            ComparableDoc {
                sort_key: 3u32,
                doc: 3u32,
            },
            ComparableDoc {
                sort_key: 2u32,
                doc: 2u32,
            },
        ];
        assert_eq!(computer.into_sorted_vec(), expected);
    }

    #[test]
    fn test_topn_computer_duplicates() {
        let mut computer: TopNComputer<u32, u32, NaturalComparator> =
            TopNComputer::new_with_comparator(2, NaturalComparator);

        // Every document gets the same sort key.
        for doc in 1u32..=5u32 {
            computer.push(1u32, doc);
        }

        // In the presence of duplicates, DocIds are always ascending order.
        let expected = vec![
            ComparableDoc {
                sort_key: 1u32,
                doc: 1u32,
            },
            ComparableDoc {
                sort_key: 1u32,
                doc: 2u32,
            },
        ];
        assert_eq!(computer.into_sorted_vec(), expected);
    }

    // Pushing one document more than twice `top_n` must not panic, whatever the
    // value of `top_n`.
    #[test]
    fn test_topn_computer_no_panic() {
        for top_n in 0..10 {
            let mut computer: TopNComputer<u32, u32, NaturalComparator> =
                TopNComputer::new_with_comparator(top_n, NaturalComparator);

            let num_pushes = 1 + top_n * 2;
            (0..num_pushes).for_each(|_| computer.push(1u32, 1u32));
            let _vals = computer.into_sorted_vec();
        }
    }

    // Property test: for arbitrary `(sort_key, doc)` pairs and an arbitrary limit, a
    // `TopNComputer` using `ReverseComparator` must return the same hits as a
    // reference built by `sort_hits` with `Order::Asc` followed by a truncation to
    // `limit`.
    proptest! {
        #[test]
        fn test_topn_computer_asc_prop(
          limit in 0..10_usize,
          mut docs in proptest::collection::vec((0..100_u64, 0..100_u64), 0..100_usize),
        ) {
            // NB: TopNComputer must receive inputs in ascending DocId order.
            docs.sort_by_key(|(_, doc_id)| *doc_id);
            let mut computer: TopNComputer<_, _, ReverseComparator> = TopNComputer::new_with_comparator(limit, ReverseComparator);
            for (feature, doc) in &docs {
                computer.push(*feature, *doc);
            }
            // Reference result: every pushed hit, sorted and cut down to `limit`.
            // NOTE(review): `sort_hits` is defined in another module; presumably it
            // breaks ties by ascending doc -- confirm.
            let mut comparable_docs: Vec<ComparableDoc<u64, u64>> =
                docs.into_iter().map(|(sort_key, doc)| ComparableDoc { sort_key, doc }).collect();
            crate::collector::sort_key::tests::sort_hits(&mut comparable_docs, Order::Asc);
            comparable_docs.truncate(limit);
            prop_assert_eq!(
                computer.into_sorted_vec(),
                comparable_docs,
            );
        }
    }

    // The limit (4) exceeds the number of matching documents: all three hits are
    // returned, best score first.
    #[test]
    fn test_top_collector_not_at_capacity_without_offset() -> crate::Result<()> {
        let index = make_index()?;
        let field = index.schema().get_field("text").unwrap();
        let text_query = QueryParser::for_index(&index, vec![field]).parse_query("droopy tax")?;
        let searcher = index.reader()?.searcher();
        let collector = TopDocs::with_limit(4).order_by_score();
        let score_docs: Vec<(Score, DocAddress)> = searcher.search(&text_query, &collector)?;
        let expected = [
            (0.81221175, DocAddress::new(0u32, 1)),
            (0.5376842, DocAddress::new(0u32, 2)),
            (0.48527452, DocAddress::new(0, 0)),
        ];
        assert_results_equals(&score_docs, &expected);
        Ok(())
    }

    // Skipping the two best hits leaves only the lowest-scoring document.
    #[test]
    fn test_top_collector_not_at_capacity_with_offset() {
        let index = make_index().unwrap();
        let field = index.schema().get_field("text").unwrap();
        let text_query = QueryParser::for_index(&index, vec![field])
            .parse_query("droopy tax")
            .unwrap();
        let searcher = index.reader().unwrap().searcher();
        let collector = TopDocs::with_limit(4).and_offset(2).order_by_score();
        let score_docs: Vec<(Score, DocAddress)> =
            searcher.search(&text_query, &collector).unwrap();
        assert_results_equals(&score_docs[..], &[(0.48527452, DocAddress::new(0, 0))]);
    }

    // With a limit of 2, only the two best-scoring documents are returned.
    #[test]
    fn test_top_collector_at_capacity() {
        let index = make_index().unwrap();
        let field = index.schema().get_field("text").unwrap();
        let text_query = QueryParser::for_index(&index, vec![field])
            .parse_query("droopy tax")
            .unwrap();
        let searcher = index.reader().unwrap().searcher();
        let collector = TopDocs::with_limit(2).order_by_score();
        let score_docs: Vec<(Score, DocAddress)> =
            searcher.search(&text_query, &collector).unwrap();
        let expected = [
            (0.81221175, DocAddress::new(0u32, 1)),
            (0.5376842, DocAddress::new(0u32, 2)),
        ];
        assert_results_equals(&score_docs, &expected);
    }

    /// With limit 2 and offset 1, the second- and third-ranked hits for
    /// "droopy tax" are expected back.
    #[test]
    fn test_top_collector_at_capacity_with_offset() {
        let index = make_index().unwrap();
        let text_field = index.schema().get_field("text").unwrap();
        let parser = QueryParser::for_index(&index, vec![text_field]);
        let query = parser.parse_query("droopy tax").unwrap();
        let searcher = index.reader().unwrap().searcher();
        let collector = TopDocs::with_limit(2).and_offset(1).order_by_score();
        let hits: Vec<(Score, DocAddress)> = searcher.search(&query, &collector).unwrap();
        let expected: [(Score, DocAddress); 2] = [
            (0.5376842, DocAddress::new(0u32, 2)),
            (0.48527452, DocAddress::new(0, 0)),
        ];
        assert_results_equals(&hits[..], &expected);
    }

    /// Checks that equal-scoring documents come back in a stable order: the
    /// results for a smaller limit must be a prefix of the results for a larger
    /// limit.
    #[test]
    fn test_top_collector_stable_sorting() {
        let index = make_index().unwrap();

        // using AllQuery to get a constant score
        let searcher = index.reader().unwrap().searcher();

        let page_0 = searcher
            .search(&AllQuery, &TopDocs::with_limit(1).order_by_score())
            .unwrap();

        let page_1 = searcher
            .search(&AllQuery, &TopDocs::with_limit(2).order_by_score())
            .unwrap();

        let page_2 = searcher
            .search(&AllQuery, &TopDocs::with_limit(3).order_by_score())
            .unwrap();

        // sanity check since we're relying on make_index(); done before any
        // indexing so that a short page fails with a clear assertion message
        // rather than an out-of-bounds panic.
        assert_eq!(page_0.len(), 1);
        assert_eq!(page_1.len(), 2);
        assert_eq!(page_2.len(), 3);

        // precondition for the test to be meaningful: we did get documents
        // with the same score, on every page.
        let reference_score = page_2[0].0;
        for page in [&page_0, &page_1, &page_2] {
            assert!(page.iter().all(|hit| hit.0 == reference_score));
        }

        assert_eq!(page_1, &page_2[..page_1.len()]);
        assert_eq!(page_0, &page_2[..page_0.len()]);
    }

    proptest! {
        #![proptest_config(ProptestConfig::with_cases(20))]
        /// Spreads equal-scoring documents over several commits and checks that
        /// score-ordered results stay stable: growing the limit, shifting the offset
        /// or stitching pages together must always agree with the full ranking.
        #[test]
        fn proptest_stable_ordering_across_segments_with_pagination(
            docs_per_segment in proptest::collection::vec(1usize..50, 2..5)
        ) {
            use crate::indexer::NoMergePolicy;

            /// Drops the scores and keeps the document addresses, in order.
            fn addresses(hits: Vec<(Score, DocAddress)>) -> Vec<DocAddress> {
                hits.into_iter().map(|(_score, addr)| addr).collect()
            }

            // One commit per entry of `docs_per_segment`, with `NoMergePolicy` installed
            // so that the index ends up with multiple segments. Every search below uses
            // `AllQuery`, so all documents are expected to share the same score.
            let mut schema_builder = Schema::builder();
            let text = schema_builder.add_text_field("text", TEXT);
            let index = Index::create_in_ram(schema_builder.build());
            let mut writer = index.writer_for_tests().unwrap();
            writer.set_merge_policy(Box::new(NoMergePolicy));
            for &segment_len in &docs_per_segment {
                for _ in 0..segment_len {
                    writer.add_document(doc!(text => "x")).unwrap();
                }
                writer.commit().unwrap();
            }

            let index_reader = index.reader().unwrap();
            let searcher = index_reader.searcher();
            let total_docs: usize = docs_per_segment.iter().sum();

            // Reference ranking: every document in one page. Scores must all be equal
            // for the ordering checks to be meaningful.
            let full_with_scores: Vec<(Score, DocAddress)> = searcher
                .search(&AllQuery, &TopDocs::with_limit(total_docs).order_by_score())
                .unwrap();
            prop_assert!(!full_with_scores.is_empty());
            let reference_score = full_with_scores[0].0;
            prop_assert!(full_with_scores.iter().all(|hit| hit.0 == reference_score));
            let full = addresses(full_with_scores);

            // Sanity: the generated input really describes several commits and documents.
            prop_assert!(docs_per_segment.len() >= 2);
            prop_assert!(total_docs >= 2);

            // 1) A page of size `k` must be the first `k` entries of the full ranking.
            for k in 1..=total_docs {
                let page = addresses(
                    searcher
                        .search(&AllQuery, &TopDocs::with_limit(k).order_by_score())
                        .unwrap(),
                );
                prop_assert_eq!(&page[..], &full[..k]);
            }

            // 2) For every offset, pages of size 1, about half of what remains, and
            //    everything that remains must match the same slice of the full ranking.
            for offset in 0..total_docs {
                let remaining = total_docs - offset;

                let check_page = |limit: usize| -> proptest::test_runner::TestCaseResult {
                    let collector = TopDocs::with_limit(limit).and_offset(offset).order_by_score();
                    let page = addresses(searcher.search(&AllQuery, &collector).unwrap());
                    prop_assert_eq!(&page[..], &full[offset..offset + limit]);
                    Ok(())
                };

                for limit in [1, (remaining / 2).max(1), remaining] {
                    check_page(limit)?;
                }
            }

            // 3) Walking the results in fixed-size pages and concatenating them must
            //    reproduce the full ranking.
            for page_size in 1..=total_docs.min(5) {
                let mut stitched: Vec<DocAddress> = Vec::new();
                for offset in (0..total_docs).step_by(page_size) {
                    // The last page may be shorter than `page_size`.
                    let size = page_size.min(total_docs - offset);
                    let collector = TopDocs::with_limit(size).and_offset(offset).order_by_score();
                    stitched.extend(addresses(searcher.search(&AllQuery, &collector).unwrap()));
                }
                prop_assert_eq!(&stitched, &full);
            }
        }
    }

    proptest! {
        #![proptest_config(ProptestConfig::with_cases(20))]
        /// Same stability checks as the `AllQuery` variant, but driven by a real
        /// scoring query: a `TermQuery` on "x" over documents that each contain
        /// exactly that one token, so every match is expected to score the same.
        #[test]
        fn proptest_stable_ordering_across_segments_with_term_query_and_pagination(
            docs_per_segment in proptest::collection::vec(1usize..50, 2..5)
        ) {
            use crate::indexer::NoMergePolicy;
            use crate::schema::IndexRecordOption;
            use crate::query::TermQuery;
            use crate::Term;

            /// Drops the scores and keeps the document addresses, in order.
            fn addresses(hits: Vec<(Score, DocAddress)>) -> Vec<DocAddress> {
                hits.into_iter().map(|(_score, addr)| addr).collect()
            }

            // One commit per entry of `docs_per_segment`, with `NoMergePolicy` installed
            // so that the index ends up with multiple segments. Each document holds the
            // single token "x".
            let mut schema_builder = Schema::builder();
            let text = schema_builder.add_text_field("text", TEXT);
            let index = Index::create_in_ram(schema_builder.build());
            let mut writer = index.writer_for_tests().unwrap();
            writer.set_merge_policy(Box::new(NoMergePolicy));
            for &segment_len in &docs_per_segment {
                for _ in 0..segment_len {
                    writer.add_document(doc!(text => "x")).unwrap();
                }
                writer.commit().unwrap();
            }

            let index_reader = index.reader().unwrap();
            let searcher = index_reader.searcher();
            let total_docs: usize = docs_per_segment.iter().sum();
            let tq = TermQuery::new(Term::from_field_text(text, "x"), IndexRecordOption::WithFreqs);

            // Reference ranking: every match in one page. Scores must all be equal
            // for the ordering checks to be meaningful.
            let full_with_scores: Vec<(Score, DocAddress)> = searcher
                .search(&tq, &TopDocs::with_limit(total_docs).order_by_score())
                .unwrap();
            prop_assert!(!full_with_scores.is_empty());
            let reference_score = full_with_scores[0].0;
            prop_assert!(full_with_scores.iter().all(|hit| hit.0 == reference_score));
            let full = addresses(full_with_scores);

            // Sanity: the generated input really describes several commits and documents.
            prop_assert!(docs_per_segment.len() >= 2);
            prop_assert!(total_docs >= 2);

            // 1) A page of size `k` must be the first `k` entries of the full ranking.
            for k in 1..=total_docs {
                let page = addresses(
                    searcher
                        .search(&tq, &TopDocs::with_limit(k).order_by_score())
                        .unwrap(),
                );
                prop_assert_eq!(&page[..], &full[..k]);
            }

            // 2) For every offset, pages of size 1, about half of what remains, and
            //    everything that remains must match the same slice of the full ranking.
            for offset in 0..total_docs {
                let remaining = total_docs - offset;

                let check_page = |limit: usize| -> proptest::test_runner::TestCaseResult {
                    let collector = TopDocs::with_limit(limit).and_offset(offset).order_by_score();
                    let page = addresses(searcher.search(&tq, &collector).unwrap());
                    prop_assert_eq!(&page[..], &full[offset..offset + limit]);
                    Ok(())
                };

                for limit in [1, (remaining / 2).max(1), remaining] {
                    check_page(limit)?;
                }
            }

            // 3) Walking the results in fixed-size pages and concatenating them must
            //    reproduce the full ranking.
            for page_size in 1..=total_docs.min(5) {
                let mut stitched: Vec<DocAddress> = Vec::new();
                for offset in (0..total_docs).step_by(page_size) {
                    // The last page may be shorter than `page_size`.
                    let size = page_size.min(total_docs - offset);
                    let collector = TopDocs::with_limit(size).and_offset(offset).order_by_score();
                    stitched.extend(addresses(searcher.search(&tq, &collector).unwrap()));
                }
                prop_assert_eq!(&stitched, &full);
            }
        }
    }

    /// Building a `TopDocs` collector with a limit of 0 is expected to panic.
    #[test]
    #[should_panic]
    fn test_top_0() {
        let _ = TopDocs::with_limit(0);
    }

    // Field names shared by the fast-field collector tests in this module:
    // `TITLE` names a text field and `SIZE` a u64 field.
    const TITLE: &str = "title";
    const SIZE: &str = "size";

    /// Orders the three "beer" documents by their `size` fast field, descending,
    /// with a limit (4) larger than the number of hits.
    #[test]
    fn test_top_field_collector_not_at_capacity() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let title = schema_builder.add_text_field(TITLE, TEXT);
        let size = schema_builder.add_u64_field(SIZE, FAST);
        let (beer_index, beer_query) =
            index("beer", title, schema_builder.build(), |index_writer| {
                // Doc ids follow insertion order: bottle = 0, growler = 1, pint = 2.
                for (label, ounces) in [
                    ("bottle of beer", 12u64),
                    ("growler of beer", 64u64),
                    ("pint of beer", 16u64),
                ] {
                    index_writer
                        .add_document(doc!(
                            title => label,
                            size => ounces,
                        ))
                        .unwrap();
                }
            });
        let searcher = beer_index.reader()?.searcher();

        let by_size_desc = TopDocs::with_limit(4).order_by_u64_field(SIZE, Order::Desc);
        let top_docs: Vec<(Option<u64>, DocAddress)> =
            searcher.search(&beer_query, &by_size_desc)?;
        assert_eq!(
            top_docs,
            vec![
                (Some(64), DocAddress::new(0, 1)),
                (Some(16), DocAddress::new(0, 2)),
                (Some(12), DocAddress::new(0, 0)),
            ]
        );
        Ok(())
    }

    /// Orders two documents by a date fast field, descending: the later
    /// birthday must come first.
    #[test]
    fn test_top_field_collector_datetime() -> crate::Result<()> {
        // Parses an RFC 3339 timestamp into the crate's `DateTime`.
        let parse_utc = |rfc3339: &str| -> crate::Result<DateTime> {
            Ok(DateTime::from_utc(OffsetDateTime::parse(rfc3339, &Rfc3339)?))
        };

        let mut schema_builder = Schema::builder();
        let name = schema_builder.add_text_field("name", TEXT);
        let birthday = schema_builder.add_date_field("birthday", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer = index.writer_for_tests()?;

        let pr_birthday = parse_utc("1898-04-09T00:00:00+00:00")?;
        index_writer.add_document(doc!(
            name => "Paul Robeson",
            birthday => pr_birthday,
        ))?;
        let mr_birthday = parse_utc("1947-11-08T00:00:00+00:00")?;
        index_writer.add_document(doc!(
            name => "Minnie Riperton",
            birthday => mr_birthday,
        ))?;
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();
        let by_birthday_desc =
            TopDocs::with_limit(3).order_by_fast_field("birthday", Order::Desc);
        let top_docs: Vec<(Option<DateTime>, DocAddress)> =
            searcher.search(&AllQuery, &by_birthday_desc)?;
        assert_eq!(
            top_docs,
            vec![
                (Some(mr_birthday), DocAddress::new(0, 1)),
                (Some(pr_birthday), DocAddress::new(0, 0)),
            ]
        );
        Ok(())
    }

    /// Orders two documents by an i64 fast field, descending, including a
    /// negative value.
    #[test]
    fn test_top_field_collector_i64() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let city = schema_builder.add_text_field("city", TEXT);
        let altitude = schema_builder.add_i64_field("altitude", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer = index.writer_for_tests()?;
        // Doc ids follow insertion order: georgetown = 0, tokyo = 1.
        for (city_name, meters) in [("georgetown", -1i64), ("tokyo", 40i64)] {
            index_writer.add_document(doc!(
                city => city_name,
                altitude => meters,
            ))?;
        }
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();
        let by_altitude_desc =
            TopDocs::with_limit(3).order_by_fast_field("altitude", Order::Desc);
        let top_docs: Vec<(Option<i64>, DocAddress)> =
            searcher.search(&AllQuery, &by_altitude_desc)?;
        assert_eq!(
            top_docs,
            vec![
                (Some(40i64), DocAddress::new(0, 1)),
                (Some(-1i64), DocAddress::new(0, 0)),
            ]
        );
        Ok(())
    }

    /// Orders two documents by an f64 fast field, descending, including a
    /// negative value.
    #[test]
    fn test_top_field_collector_f64() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let city = schema_builder.add_text_field("city", TEXT);
        let altitude = schema_builder.add_f64_field("altitude", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer = index.writer_for_tests()?;
        // Doc ids follow insertion order: georgetown = 0, tokyo = 1.
        for (city_name, meters) in [("georgetown", -1.0f64), ("tokyo", 40f64)] {
            index_writer.add_document(doc!(
                city => city_name,
                altitude => meters,
            ))?;
        }
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();
        let by_altitude_desc =
            TopDocs::with_limit(3).order_by_fast_field("altitude", Order::Desc);
        let top_docs: Vec<(Option<f64>, DocAddress)> =
            searcher.search(&AllQuery, &by_altitude_desc)?;
        assert_eq!(
            top_docs,
            vec![
                (Some(40f64), DocAddress::new(0, 1)),
                (Some(-1.0f64), DocAddress::new(0, 0)),
            ]
        );
        Ok(())
    }

    /// Orders three documents by a string fast field and checks both sort
    /// directions with several limit/offset combinations, including an offset
    /// that skips every hit.
    #[test]
    fn test_top_field_collector_string() -> crate::Result<()> {
        /// Runs `AllQuery` ordered by the `city` string fast field with the
        /// given direction, limit and offset.
        fn sorted_cities(
            index: &Index,
            order: Order,
            limit: usize,
            offset: usize,
        ) -> crate::Result<Vec<(Option<String>, DocAddress)>> {
            let collector = TopDocs::with_limit(limit)
                .and_offset(offset)
                .order_by_string_fast_field("city", order);
            index.reader()?.searcher().search(&AllQuery, &collector)
        }

        // Expected hit for the city `name` stored at `doc_id` of segment 0.
        let hit = |name: &str, doc_id: DocId| (Some(name.to_owned()), DocAddress::new(0, doc_id));

        let mut schema_builder = Schema::builder();
        let city = schema_builder.add_text_field("city", TEXT | FAST);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer = index.writer_for_tests()?;
        // Doc ids follow insertion order: austin = 0, greenville = 1, tokyo = 2.
        for city_name in ["austin", "greenville", "tokyo"] {
            index_writer.add_document(doc!(
                city => city_name,
            ))?;
        }
        index_writer.commit()?;

        // Descending order.
        assert_eq!(
            sorted_cities(&index, Order::Desc, 3, 0)?,
            vec![hit("tokyo", 2), hit("greenville", 1), hit("austin", 0)]
        );
        assert_eq!(
            sorted_cities(&index, Order::Desc, 2, 0)?,
            vec![hit("tokyo", 2), hit("greenville", 1)]
        );
        assert_eq!(&sorted_cities(&index, Order::Desc, 3, 3)?, &[]);
        assert_eq!(
            sorted_cities(&index, Order::Desc, 2, 1)?,
            vec![hit("greenville", 1), hit("austin", 0)]
        );

        // Ascending order.
        assert_eq!(
            sorted_cities(&index, Order::Asc, 3, 0)?,
            vec![hit("austin", 0), hit("greenville", 1), hit("tokyo", 2)]
        );
        assert_eq!(
            sorted_cities(&index, Order::Asc, 2, 1)?,
            vec![hit("greenville", 1), hit("tokyo", 2)]
        );
        assert_eq!(
            sorted_cities(&index, Order::Asc, 2, 0)?,
            vec![hit("austin", 0), hit("greenville", 1)]
        );
        assert_eq!(&sorted_cities(&index, Order::Asc, 3, 3)?, &[]);

        Ok(())
    }

    proptest! {
        /// For random terms spread over random commits, collecting with `TopDocs`
        /// ordered by the `city` string fast field must give the same result as
        /// sorting every hit, skipping `offset` and taking `limit`.
        #[test]
        fn test_top_field_collect_string_prop(
          order in prop_oneof!(Just(Order::Desc), Just(Order::Asc)),
          limit in 1..256_usize,
          offset in 0..256_usize,
          segments_terms in
            proptest::collection::vec(
                proptest::collection::vec(0..32_u8, 1..32_usize),
                0..8_usize,
            )
        ) {
            let mut schema_builder = Schema::builder();
            let city = schema_builder.add_text_field("city", TEXT | FAST);
            let index = Index::create_in_ram(schema_builder.build());
            let mut index_writer = index.writer_for_tests()?;

            // The outer Vec represents segments (one commit each) and the inner Vec
            // the terms of that segment; each term is indexed zero-padded to width 3.
            for segment_terms in segments_terms {
                for term in segment_terms {
                    index_writer.add_document(doc!(
                        city => format!("{term:0>3}"),
                    ))?;
                }
                index_writer.commit()?;
            }

            let searcher = index.reader()?.searcher();
            let collector = TopDocs::with_limit(limit)
                .and_offset(offset)
                .order_by_string_fast_field("city", order);
            let top_n_results = searcher.search(&AllQuery, &collector)?;

            // Reference data: look up the term of every matching document.
            // NOTE: We can't determine the SegmentIds that will be generated for Segments
            // ahead of time, so we can't pre-compute the expected `DocAddress`es.
            let mut comparable_docs: Vec<ComparableDoc<_, _>> = Vec::new();
            for doc_address in searcher.search(&AllQuery, &DocSetCollector)? {
                let column = searcher.segment_readers()[doc_address.segment_ord as usize]
                    .fast_fields()
                    .str("city")
                    .unwrap()
                    .unwrap();
                let term_ord = column.term_ords(doc_address.doc_id).next().unwrap();
                let mut term_bytes = Vec::new();
                column.dictionary().ord_to_term(term_ord, &mut term_bytes).unwrap();
                comparable_docs.push(ComparableDoc {
                    sort_key: Some(String::try_from(term_bytes).unwrap()),
                    doc: doc_address,
                });
            }

            // Using the TopDocs collector should always be equivalent to sorting, skipping
            // the offset, and then taking the limit.
            crate::collector::sort_key::tests::sort_hits(&mut comparable_docs, order);
            let expected_docs: Vec<_> = comparable_docs
                .into_iter()
                .map(|cd| (cd.sort_key, cd.doc))
                .skip(offset)
                .take(limit)
                .collect();
            prop_assert_eq!(
                expected_docs,
                top_n_results
            );
        }
    }

    /// Creating a segment collector that sorts on a field name absent from the
    /// schema is expected to fail; the `expect` then triggers the panic that
    /// `should_panic` is waiting for.
    #[test]
    #[should_panic]
    fn test_field_does_not_exist() {
        let mut schema_builder = Schema::builder();
        let title = schema_builder.add_text_field(TITLE, TEXT);
        let size = schema_builder.add_u64_field(SIZE, FAST);
        let (beer_index, _) = index("beer", title, schema_builder.build(), |index_writer| {
            index_writer
                .add_document(doc!(
                    title => "bottle of beer",
                    size => 12u64,
                ))
                .unwrap();
        });
        let searcher = beer_index.reader().unwrap().searcher();
        let by_missing_field =
            TopDocs::with_limit(4).order_by_u64_field("missing_field", Order::Desc);
        let first_segment = searcher.segment_reader(0u32);
        by_missing_field
            .for_segment(0, first_segment)
            .expect("should panic");
    }

    /// Sorting on a u64 field that is only `STORED` must make `for_segment`
    /// return an `InvalidArgument` error.
    #[test]
    fn test_field_not_fast_field() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let size = schema_builder.add_u64_field(SIZE, STORED);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer = index.writer_for_tests()?;
        index_writer.add_document(doc!(size=>1u64))?;
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();
        let first_segment = searcher.segment_reader(0);
        let by_size_desc = TopDocs::with_limit(4).order_by_u64_field(SIZE, Order::Desc);
        let outcome = by_size_desc.for_segment(0, first_segment);
        let err = outcome.err().unwrap();
        assert!(matches!(err, crate::TantivyError::InvalidArgument(_)));
        Ok(())
    }

    /// `check_schema` must reject a collector that sorts on `size` as an i64
    /// fast field when the schema only declares it as a `STORED` u64 field; the
    /// reported error is the "not a fast field" schema error.
    #[test]
    fn test_field_wrong_type() {
        let mut schema_builder = Schema::builder();
        let _size = schema_builder.add_u64_field(SIZE, STORED);
        let schema = schema_builder.build();
        let by_size_as_i64 =
            TopDocs::with_limit(4).order_by_fast_field::<i64>(SIZE, Order::Desc);
        let validation = by_size_as_i64.check_schema(&schema);
        let err = validation.err().unwrap();
        assert!(
            matches!(err, crate::TantivyError::SchemaError(msg) if msg == "Field `size` is not a fast field.")
        );
    }

    /// Uses the doc id itself as the sort key via `order_by`, with limit 2 and
    /// offset 1, and expects doc 1 followed by doc 0.
    #[test]
    fn test_sort_key_top_collector_with_offset() -> crate::Result<()> {
        let index = make_index()?;
        let text_field = index.schema().get_field("text").unwrap();
        let parser = QueryParser::for_index(&index, vec![text_field]);
        let query = parser.parse_query("droopy tax")?;
        let by_doc_id = TopDocs::with_limit(2)
            .and_offset(1)
            .order_by(move |_segment_reader: &SegmentReader| move |doc: DocId| doc);
        let searcher = index.reader()?.searcher();
        let keyed_docs: Vec<(u32, DocAddress)> = searcher.search(&query, &by_doc_id)?;
        let expected = vec![(1, DocAddress::new(0, 1)), (0, DocAddress::new(0, 0))];
        assert_eq!(keyed_docs, expected);
        Ok(())
    }

    /// Same scenario as the sort-key variant, written with `unwrap`: the doc id
    /// is the sort key, and limit 2 with offset 1 must yield doc 1 then doc 0.
    #[test]
    fn test_custom_score_top_collector_with_offset() {
        let index = make_index().unwrap();
        let text_field = index.schema().get_field("text").unwrap();
        let parser = QueryParser::for_index(&index, vec![text_field]);
        let query = parser.parse_query("droopy tax").unwrap();
        let by_doc_id = TopDocs::with_limit(2)
            .and_offset(1)
            .order_by(move |_segment_reader: &SegmentReader| move |doc: DocId| doc);
        let searcher = index.reader().unwrap().searcher();
        let keyed_docs: Vec<(u32, DocAddress)> = searcher.search(&query, &by_doc_id).unwrap();

        let expected = vec![(1, DocAddress::new(0, 1)), (0, DocAddress::new(0, 0))];
        assert_eq!(keyed_docs, expected);
    }

    /// Test helper: creates an in-RAM index for `schema`, lets `doc_adder`
    /// add documents through a single-threaded writer, commits once, and parses
    /// `query` against `query_field`.
    ///
    /// Returns the index together with the parsed query. Panics if the writer
    /// cannot be created, the commit fails, or the query does not parse.
    fn index(
        query: &str,
        query_field: Field,
        schema: Schema,
        mut doc_adder: impl FnMut(&mut IndexWriter),
    ) -> (Index, Box<dyn Query>) {
        let index = Index::create_in_ram(schema);

        let mut writer = index.writer_with_num_threads(1, 15_000_000).unwrap();
        doc_adder(&mut writer);
        writer.commit().unwrap();

        let parsed_query = QueryParser::for_index(&index, vec![query_field])
            .parse_query(query)
            .unwrap();
        (index, parsed_query)
    }
    /// Orders "beer" documents by `size` ascending; the document without a
    /// `size` value must come last, with a `None` sort key.
    #[test]
    fn test_fast_field_ascending_order() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let title = schema_builder.add_text_field(TITLE, TEXT);
        let size = schema_builder.add_u64_field(SIZE, FAST);
        let (beer_index, beer_query) =
            index("beer", title, schema_builder.build(), |index_writer| {
                // Doc ids follow insertion order: bottle = 0, growler = 1, pint = 2.
                for (label, ounces) in [
                    ("bottle of beer", 12u64),
                    ("growler of beer", 64u64),
                    ("pint of beer", 16u64),
                ] {
                    index_writer
                        .add_document(doc!(
                            title => label,
                            size => ounces,
                        ))
                        .unwrap();
                }
                // Doc id 3 deliberately has no `size` value.
                index_writer
                    .add_document(doc!(
                        title => "empty beer",
                    ))
                    .unwrap();
            });
        let searcher = beer_index.reader()?.searcher();

        let by_size_asc = TopDocs::with_limit(4).order_by_fast_field(SIZE, Order::Asc);
        let top_docs: Vec<(Option<u64>, DocAddress)> =
            searcher.search(&beer_query, &by_size_asc)?;
        assert_eq!(
            top_docs,
            vec![
                (Some(12), DocAddress::new(0, 0)),
                (Some(16), DocAddress::new(0, 2)),
                (Some(64), DocAddress::new(0, 1)),
                (None, DocAddress::new(0, 3)),
            ]
        );
        Ok(())
    }

    /// A top-2 computer with the `Order::Desc` comparator must keep the two
    /// largest sort keys, largest first.
    #[test]
    fn test_topn_computer_desc() {
        let mut computer: TopNComputer<u32, u32, _> =
            TopNComputer::new_with_comparator(2, ComparatorEnum::from(Order::Desc));

        // (sort_key, doc) pairs, pushed in this order.
        for (sort_key, doc) in [(1u32, 1u32), (2, 2), (3, 3), (2, 4), (4, 5), (1, 6)] {
            computer.push(sort_key, doc);
        }

        let expected = [
            ComparableDoc {
                sort_key: 4u32,
                doc: 5u32,
            },
            ComparableDoc {
                sort_key: 3u32,
                doc: 3u32,
            },
        ];
        assert_eq!(computer.into_sorted_vec(), &expected);
    }

    /// A top-2 computer with the `Order::Asc` comparator must keep the two
    /// smallest sort keys; here both have key 1 and are expected as doc 1 then
    /// doc 6.
    #[test]
    fn test_topn_computer_asc() {
        let mut computer: TopNComputer<u32, u32, _> =
            TopNComputer::new_with_comparator(2, ComparatorEnum::from(Order::Asc));

        // (sort_key, doc) pairs, pushed in this order.
        for (sort_key, doc) in [(1u32, 1u32), (2, 2), (3, 3), (2, 4), (4, 5), (1, 6)] {
            computer.push(sort_key, doc);
        }

        let expected = [
            ComparableDoc {
                sort_key: 1u32,
                doc: 1u32,
            },
            ComparableDoc {
                sort_key: 1u32,
                doc: 6u32,
            },
        ];
        assert_eq!(computer.into_sorted_vec(), &expected);
    }

    /// With `ComparatorEnum::ReverseNoneLower`, a top-2 computer fed
    /// `Some(1)`, `Some(2)` and `None` must return the two `Some` keys in
    /// ascending order and leave the `None` key out.
    #[test]
    fn test_topn_computer_option_asc_null_at_the_end() {
        let mut computer: TopNComputer<Option<u32>, u32, _> =
            TopNComputer::new_with_comparator(2, ComparatorEnum::ReverseNoneLower);

        // (sort_key, doc) pairs, pushed in this order.
        for (sort_key, doc) in [(Some(1u32), 1u32), (Some(2u32), 2u32), (None, 3u32)] {
            computer.push(sort_key, doc);
        }

        let expected = [
            ComparableDoc {
                sort_key: Some(1u32),
                doc: 1u32,
            },
            ComparableDoc {
                sort_key: Some(2u32),
                doc: 2u32,
            },
        ];
        assert_eq!(computer.into_sorted_vec(), &expected);
    }

    /// With `ComparatorEnum::Reverse`, a top-2 computer fed `Some(1)`,
    /// `Some(2)` and `None` must return the `None` key first, followed by
    /// `Some(1)`.
    #[test]
    fn test_topn_computer_option_asc_null_at_the_begining() {
        let mut computer: TopNComputer<Option<u32>, u32, _> =
            TopNComputer::new_with_comparator(2, ComparatorEnum::Reverse);

        // (sort_key, doc) pairs, pushed in this order.
        for (sort_key, doc) in [(Some(1u32), 1u32), (Some(2u32), 2u32), (None, 3u32)] {
            computer.push(sort_key, doc);
        }

        let expected = [
            ComparableDoc {
                sort_key: None,
                doc: 3u32,
            },
            ComparableDoc {
                sort_key: Some(1u32),
                doc: 1u32,
            },
        ];
        assert_eq!(computer.into_sorted_vec(), &expected);
    }

    #[test]
    fn test_push_assuming_capacity() {
        // Two slots are reserved up front, so both pushes stay within capacity.
        let mut buffer = Vec::with_capacity(2);
        super::push_assuming_capacity(1, &mut buffer);
        assert_eq!(buffer.as_slice(), &[1]);
        super::push_assuming_capacity(2, &mut buffer);
        assert_eq!(buffer.as_slice(), &[1, 2]);
    }

    #[test]
    #[should_panic]
    fn test_push_assuming_capacity_panics_when_no_cap() {
        let mut buffer = Vec::with_capacity(1);
        super::push_assuming_capacity(1, &mut buffer);
        assert_eq!(buffer.as_slice(), &[1]);
        // Only one slot was reserved: this second push is the call expected to panic.
        super::push_assuming_capacity(2, &mut buffer);
    }

    #[test]
    fn test_top_n_computer_not_at_capacity() {
        // Fewer docs (3) than the limit (4) are appended: all of them are expected
        // back, ordered by decreasing score.
        let mut top_n = TopNComputer::new_with_comparator(4, NaturalComparator);
        for (doc, score) in [(1, 0.8), (3, 0.2), (5, 0.3)] {
            top_n.append_doc(doc, score);
        }
        let sorted_docs = top_n.into_sorted_vec();
        let expected = [
            ComparableDoc {
                sort_key: 0.8,
                doc: 1,
            },
            ComparableDoc {
                sort_key: 0.3,
                doc: 5,
            },
            ComparableDoc {
                sort_key: 0.2,
                doc: 3,
            },
        ];
        assert_eq!(&sorted_docs, &expected);
    }

    #[test]
    fn test_top_n_computer_at_capacity() {
        // Five docs are appended for a limit of four: the lowest score (-0.2) is
        // expected to be left out, the rest ordered by decreasing score.
        let mut top_n = TopNComputer::new_with_comparator(4, NaturalComparator);
        for (doc, score) in [(1, 0.8), (3, 0.2), (5, 0.3), (7, 0.9), (9, -0.2)] {
            top_n.append_doc(doc, score);
        }
        let sorted_docs = top_n.into_sorted_vec();
        let expected = [
            ComparableDoc {
                sort_key: 0.9,
                doc: 7,
            },
            ComparableDoc {
                sort_key: 0.8,
                doc: 1,
            },
            ComparableDoc {
                sort_key: 0.3,
                doc: 5,
            },
            ComparableDoc {
                sort_key: 0.2,
                doc: 3,
            },
        ];
        assert_eq!(&sorted_docs, &expected);
    }

    #[test]
    fn test_top_segment_collector_stable_ordering_for_equal_feature() {
        // Documents are collected in ascending doc id order and all share the same
        // score. Harvesting has to break that tie in a stable way: the top 2 must be
        // exactly the first two entries of the top 3.
        let doc_ids = [4, 5, 6];
        let tied_score = 3.3f32;

        // Feeds every doc into a fresh computer with the given limit and harvests it.
        let harvest = |limit| {
            let mut top_n = TopNComputer::new_with_comparator(limit, NaturalComparator);
            for &doc_id in &doc_ids {
                top_n.append_doc(doc_id, tied_score);
            }
            top_n.into_sorted_vec()
        };

        let top_2 = harvest(2);
        let top_3 = harvest(3);

        assert_eq!(&top_2, &top_3[..2]);
    }
}

#[cfg(all(test, feature = "unstable"))]
mod bench {
    use test::Bencher;

    use super::TopNComputer;
    use crate::collector::sort_key::NaturalComparator;

    /// Benchmarks appending 100 docs to a top-100 computer that was already fed
    /// 100 docs before the measurement starts.
    #[bench]
    fn bench_top_segment_collector_collect_at_capacity(b: &mut Bencher) {
        let mut top_n = TopNComputer::new_with_comparator(100, NaturalComparator);

        // Pre-fill outside of the measured section.
        (0..100).for_each(|doc| {
            top_n.append_doc(doc, 0.8);
        });

        b.iter(|| {
            (0..100).for_each(|doc| {
                top_n.append_doc(doc, 0.8);
            });
        });
    }
}


================================================
FILE: src/compat_tests.rs
================================================
use std::path::PathBuf;

use schema::*;

use crate::*;

/// Creates an index in the directory `path` (creating the directory if needed)
/// and commits a single document with a `label` text field and a `date` field.
///
/// Panics if any step fails.
fn create_index(path: &str) {
    let mut builder = Schema::builder();
    let label_field = builder.add_text_field("label", TEXT | STORED);
    let date_field = builder.add_date_field("date", INDEXED | STORED);
    let schema = builder.build();

    std::fs::create_dir_all(path).unwrap();
    let index = Index::create_in_dir(path, schema).unwrap();

    let document = doc!(
        label_field => "dateformat",
        date_field => DateTime::from_timestamp_nanos(123456)
    );
    let mut writer = index.writer_with_num_threads(1, 20_000_000).unwrap();
    writer.add_document(document).unwrap();
    writer.commit().unwrap();
}

/// Writes an Index for the current INDEX_FORMAT_VERSION to disk.
///
/// Nothing is written if the directory for that version already exists.
#[test]
fn create_format() {
    let index_dir = path_for_version(&INDEX_FORMAT_VERSION.to_string());
    let already_created = PathBuf::from(&index_dir).exists();
    if !already_created {
        create_index(&index_dir);
    }
}

/// Returns the relative directory holding the compatibility test index written
/// with format version `version`.
fn path_for_version(version: &str) -> String {
    let mut index_dir = String::from("./tests/compat_tests_data/index_v");
    index_dir.push_str(version);
    index_dir.push('/');
    index_dir
}

/// Opens the index stored under the version 6 compat test data directory.
///
/// Disabled under the `quickwit` feature flag, which uses a different dictionary type.
#[test]
#[cfg(not(feature = "quickwit"))]
fn test_format_6() {
    let index = Index::open_in_dir(path_for_version("6")).expect("Failed to open index");
    // dates are truncated to Microseconds in v6
    assert_date_time_precision(&index, DateTimePrecision::Microseconds);
}

/// Opens the index stored under the version 7 compat test data directory.
///
/// Disabled under the `quickwit` feature flag, which uses a different dictionary type.
#[test]
#[cfg(not(feature = "quickwit"))]
fn test_format_7() {
    let index = Index::open_in_dir(path_for_version("7")).expect("Failed to open index");
    // dates are not truncated in v7 in the docstore
    assert_date_time_precision(&index, DateTimePrecision::Nanoseconds);
}

/// Searches `index` for the document whose `label` matches `dateformat`, loads it
/// from the doc store, and checks that its `date` value equals the reference
/// timestamp (123456 ns) truncated to `doc_store_precision`.
///
/// Panics if any step fails or if the stored date differs from the expectation.
#[cfg(not(feature = "quickwit"))]
fn assert_date_time_precision(index: &Index, doc_store_precision: DateTimePrecision) {
    use collector::TopDocs;

    let index_reader = index.reader().expect("Failed to create reader");
    let searcher = index_reader.searcher();

    let schema = index.schema();
    let label_field = schema.get_field("label").expect("Field 'label' not found");
    let query = query::QueryParser::for_index(index, vec![label_field])
        .parse_query("dateformat")
        .expect("Failed to parse query");

    let top_one_by_score = TopDocs::with_limit(1).order_by_score();
    let hits = searcher
        .search(&query, &top_one_by_score)
        .expect("Search failed");
    assert_eq!(hits.len(), 1, "Expected 1 search result");

    let hit_address = hits[0].1;
    let stored_doc: TantivyDocument = searcher
        .doc(hit_address)
        .expect("Failed to retrieve document");

    let date_field = schema.get_field("date").expect("Field 'date' not found");
    let stored_date = stored_doc
        .get_first(date_field)
        .expect("Date field not found in document")
        .as_datetime()
        .unwrap();

    let expected_date = DateTime::from_timestamp_nanos(123456).truncate(doc_store_precision);
    assert_eq!(stored_date, expected_date);
}


================================================
FILE: src/core/executor.rs
================================================
use std::sync::Arc;

#[cfg(feature = "quickwit")]
use futures_util::{future::Either, FutureExt};

use crate::TantivyError;

/// Executor makes it possible to run tasks in a single thread or
/// in a thread pool.
///
/// The thread pool is held behind an `Arc`, so cloning an `Executor::ThreadPool`
/// yields another handle to the same rayon pool.
#[derive(Clone)]
pub enum Executor {
    /// Single thread variant of an Executor: tasks run in the caller thread.
    SingleThread,
    /// Thread pool variant of an Executor: tasks are dispatched to the wrapped rayon pool.
    ThreadPool(Arc<rayon::ThreadPool>),
}

/// Wraps an already shared rayon thread pool into an [`Executor::ThreadPool`].
#[cfg(feature = "quickwit")]
impl From<Arc<rayon::ThreadPool>> for Executor {
    fn from(thread_pool: Arc<rayon::ThreadPool>) -> Self {
        Self::ThreadPool(thread_pool)
    }
}

impl Executor {
    /// Creates an Executor that performs all task in the caller thread.
    pub fn single_thread() -> Executor {
        Executor::SingleThread
    }

    /// Creates an Executor that dispatches the tasks in a thread pool.
    pub fn multi_thread(num_threads: usize, prefix: &'static str) -> crate::Result<Executor> {
        let pool = rayon::ThreadPoolBuilder::new()
            .num_threads(num_threads)
            .thread_name(move |num| format!("{prefix}{num}"))
            .build()?;
        Ok(Executor::ThreadPool(Arc::new(pool)))
    }

    /// Perform a map in the thread pool.
    ///
    /// Regardless of the executor (`SingleThread` or `ThreadPool`), panics in the task
    /// will propagate to the caller.
    pub fn map<A, R, F>(&self, f: F, args: impl Iterator<Item = A>) -> crate::Result<Vec<R>>
    where
        A: Send,
        R: Send,
        F: Sized + Sync + Fn(A) -> crate::Result<R>,
    {
        match self {
            Executor::SingleThread => {
                // Avoid `collect`, since the stacktrace is blown up by it, which makes profiling
                // harder.
                let mut result = Vec::with_capacity(args.size_hint().0);
                for arg in args {
                    result.push(f(arg)?);
                }
                Ok(result)
            }
            Executor::ThreadPool(pool) => {
                let args: Vec<A> = args.collect();
                let num_fruits = args.len();
                let fruit_receiver = {
                    let (fruit_sender, fruit_receiver) = crossbeam_channel::unbounded();
                    pool.scope(|scope| {
                        for (idx, arg) in args.into_iter().enumerate() {
                            // We name references for f and fruit_sender_ref because we do not
                            // want these two to be moved into the closure.
                            let f_ref = &f;
                            let fruit_sender_ref = &fruit_sender;
                            scope.spawn(move |_| {
                                let fruit = f_ref(arg);
                                if let Err(err) = fruit_sender_ref.send((idx, fruit)) {
                                    error!(
                                        "Failed to send search task. It probably means all search \
                                         threads have panicked. {err:?}"
                                    );
                                }
                            });
                        }
                    });
                    fruit_receiver
                    // This ends the scope of fruit_sender.
                    // This is important as it makes it possible for the fruit_receiver iteration to
                    // terminate.
                };
                let mut result_placeholders: Vec<Option<R>> =
                    std::iter::repeat_with(|| None).take(num_fruits).collect();
                for (pos, fruit_res) in fruit_receiver {
                    let fruit = fruit_res?;
                    result_placeholders[pos] = Some(fruit);
                }
                let results: Vec<R> = result_placeholders.into_iter().flatten().collect();
                if results.len() != num_fruits {
                    return Err(TantivyError::InternalError(
                        "One of the mapped execution failed.".to_string(),
                    ));
                }
                Ok(results)
            }
        }
    }

    /// Spawn a task on the pool, returning a future completing on task success.
    ///
    /// If the task panics, returns `Err(())`.
    #[cfg(feature = "quickwit")]
    pub fn spawn_blocking<T: Send + 'static>(
        &self,
        cpu_intensive_task: impl FnOnce() -> T + Send + 'static,
    ) -> impl std::future::Future<Output = Result<T, ()>> {
        match self {
            Executor::SingleThread => Either::Left(std::future::ready(Ok(cpu_intensive_task()))),
            Executor::ThreadPool(pool) => {
                let (sender, receiver) = oneshot::channel();
                pool.spawn(|| {
                    if sender.is_closed() {
                        return;
                    }
                    let task_result = cpu_intensive_task();
                    let _ = sender.send(task_result);
                });

                let res = receiver.map(|res| res.map_err(|_| ()));
                Either::Right(res)
            }
        }
    }
}

#[cfg(test)]
mod tests {
    use super::Executor;

    // A panic raised by the mapped closure must reach the caller of `map`,
    // message included, when running in the caller thread.
    #[test]
    #[should_panic(expected = "panic should propagate")]
    fn test_panic_propagates_single_thread() {
        let _result: Vec<usize> = Executor::single_thread()
            .map(
                |_| {
                    panic!("panic should propagate");
                },
                vec![0].into_iter(),
            )
            .unwrap();
    }

    // Same as above with a thread pool: the caller still panics, but no
    // expectation is put on the message.
    #[test]
    #[should_panic] //< unfortunately the panic message is not propagated
    fn test_panic_propagates_multi_thread() {
        let _result: Vec<usize> = Executor::multi_thread(1, "search-test")
            .unwrap()
            .map(
                |_| {
                    panic!("panic should propagate");
                },
                vec![0].into_iter(),
            )
            .unwrap();
    }

    // `map` returns one output per input, in input order.
    #[test]
    fn test_map_singlethread() {
        let result: Vec<usize> = Executor::single_thread()
            .map(|i| Ok(i * 2), 0..1_000)
            .unwrap();
        assert_eq!(result.len(), 1_000);
        for i in 0..1_000 {
            assert_eq!(result[i], i * 2);
        }
    }

    // Input order must be preserved even though tasks run on several threads.
    #[test]
    fn test_map_multithread() {
        let result: Vec<usize> = Executor::multi_thread(3, "search-test")
            .unwrap()
            .map(|i| Ok(i * 2), 0..10)
            .unwrap();
        assert_eq!(result.len(), 10);
        for i in 0..10 {
            assert_eq!(result[i], i * 2);
        }
    }

    // Checks that tasks whose future was dropped are (mostly) not executed.
    //
    // Two families of 1000 tasks are spawned. Each task bumps its family counter and
    // then blocks on `recv`, so the number of tasks that can make progress is driven
    // by the number of `tx.send(())` calls below.
    #[cfg(feature = "quickwit")]
    #[test]
    fn test_cancel_cpu_intensive_tasks() {
        use std::sync::atomic::{AtomicU64, Ordering};
        use std::sync::Arc;

        let counter: Arc<AtomicU64> = Default::default();

        let other_counter: Arc<AtomicU64> = Default::default();

        let mut futures = Vec::new();
        let mut other_futures = Vec::new();

        // Zero-capacity channel used to release the blocked tasks one send at a time.
        let (tx, rx) = crossbeam_channel::bounded::<()>(0);
        let rx = Arc::new(rx);
        let executor = Executor::multi_thread(3, "search-test").unwrap();
        for _ in 0..1000 {
            let counter_clone: Arc<AtomicU64> = counter.clone();
            let other_counter_clone: Arc<AtomicU64> = other_counter.clone();

            let rx_clone = rx.clone();
            let rx_clone2 = rx.clone();
            let fut = executor.spawn_blocking(move || {
                counter_clone.fetch_add(1, Ordering::SeqCst);
                let _ = rx_clone.recv();
            });
            futures.push(fut);
            let other_fut = executor.spawn_blocking(move || {
                other_counter_clone.fetch_add(1, Ordering::SeqCst);
                let _ = rx_clone2.recv();
            });
            other_futures.push(other_fut);
        }

        // We execute 100 futures.
        for _ in 0..100 {
            tx.send(()).unwrap();
        }

        // Both families are expected to have had a fair share of those executions.
        let counter_val = counter.load(Ordering::SeqCst);
        let other_counter_val = other_counter.load(Ordering::SeqCst);
        assert!(counter_val >= 30);
        assert!(other_counter_val >= 30);

        // Dropping these futures is what should cancel the not-yet-started tasks
        // of the second family.
        drop(other_futures);

        // We execute 100 futures.
        for _ in 0..100 {
            tx.send(()).unwrap();
        }

        // Nearly all of the new executions must belong to the first family; a small
        // slack (6) is tolerated on both sides.
        let counter_val2 = counter.load(Ordering::SeqCst);
        assert!(counter_val2 >= counter_val + 100 - 6);

        let other_counter_val2 = other_counter.load(Ordering::SeqCst);
        assert!(other_counter_val2 <= other_counter_val + 6);
    }
}


================================================
FILE: src/core/json_utils.rs
================================================
use columnar::NumericalValue;
use common::json_path_writer::{JSON_END_OF_PATH, JSON_PATH_SEGMENT_SEP};
use common::{replace_in_place, JsonPathWriter};
use rustc_hash::FxHashMap;

use crate::indexer::indexing_term::IndexingTerm;
use crate::postings::{IndexingContext, IndexingPosition, PostingsWriter};
use crate::schema::document::{ReferenceValue, ReferenceValueLeaf, Value};
use crate::schema::{Type, DATE_TIME_PRECISION_INDEXED};
use crate::time::format_description::well_known::Rfc3339;
use crate::time::{OffsetDateTime, UtcOffset};
use crate::tokenizer::TextAnalyzer;
use crate::{DateTime, DocId, Term};

/// This object is a map storing the last position for a given path for the current document
/// being indexed.
///
/// It is key to solving the following problem:
/// If we index a JsonObject emitting several terms with the same path
/// we do not want to create false positives in phrase queries.
///
/// For instance:
///
/// ```json
/// {"bands": [
///     {"band_name": "Elliot Smith"},
///     {"band_name": "The Who"},
/// ]}
/// ```
///
/// If we are careless and index each band name independently,
/// `Elliot` and `The` will end up indexed at position 0, and `Smith` and `Who` will be indexed at
/// position 1.
/// As a result, with lemmatization, "The Smiths" will match our object.
///
/// Worse, if the same term appears in the second object, a non-increasing value would be pushed
/// to the position recorder, probably provoking a panic.
///
/// This problem is solved for regular multivalued objects by offsetting the position
/// of values, with a position gap. Here we would like `The` and `Who` to get indexed at
/// position 2 and 3 respectively.
///
/// With regular fields, we sort the fields beforehand, so that all terms with the same
/// path are indexed consecutively.
///
/// In JSON objects, we do not have this comfort, so we need to record these position offsets in
/// a map.
///
/// Note that using a single position for the entire object would not hurt correctness.
/// It would however hurt compression.
///
/// We can therefore afford working with a map that is not perfect. It is fine if several
/// paths map to the same index position as long as the probability is relatively low.
#[derive(Default)]
pub(crate) struct IndexingPositionsPerPath {
    // Keyed by the `u32` id passed to `get_position_from_id`.
    positions_per_path: FxHashMap<u32, IndexingPosition>,
}

impl IndexingPositionsPerPath {
    /// Returns the position tracked for the path identified by `id`, inserting a
    /// default position the first time this id is seen.
    fn get_position_from_id(&mut self, id: u32) -> &mut IndexingPosition {
        let positions = &mut self.positions_per_path;
        positions.entry(id).or_default()
    }

    /// Forgets every tracked position.
    pub fn clear(&mut self) {
        let positions = &mut self.positions_per_path;
        positions.clear();
    }
}

/// Replaces, in place, every JSON_PATH_SEGMENT_SEP found in `path` with a dot.
pub fn json_path_sep_to_dot(path: &mut str) {
    // SAFETY: we are replacing an ASCII character by another ASCII character, so the
    // buffer remains valid UTF-8.
    unsafe {
        let raw_bytes = path.as_bytes_mut();
        replace_in_place(JSON_PATH_SEGMENT_SEP, b'.', raw_bytes);
    }
}

/// Indexes every entry of a JSON object.
///
/// For each `(key, value)` pair, the key is pushed onto `json_path_writer`, the value is
/// indexed through [`index_json_value`], and the key is popped again. Entries whose key
/// contains the `JSON_END_OF_PATH` byte are skipped entirely.
#[expect(clippy::too_many_arguments)]
fn index_json_object<'a, V: Value<'a>>(
    doc: DocId,
    json_visitor: V::ObjectIter,
    text_analyzer: &mut TextAnalyzer,
    term_buffer: &mut IndexingTerm,
    json_path_writer: &mut JsonPathWriter,
    postings_writer: &mut dyn PostingsWriter,
    ctx: &mut IndexingContext,
    positions_per_path: &mut IndexingPositionsPerPath,
) {
    for (key, value) in json_visitor {
        let key_has_end_of_path_byte = key.as_bytes().contains(&JSON_END_OF_PATH);
        if !key_has_end_of_path_byte {
            json_path_writer.push(key);
            index_json_value(
                doc,
                value,
                text_analyzer,
                term_buffer,
                json_path_writer,
                postings_writer,
                ctx,
                positions_per_path,
            );
            json_path_writer.pop();
        }
    }
}

/// Indexes a JSON value located at the path currently held by `json_path_writer`.
///
/// - Leaves: `term_buffer` is rewritten with the unordered id of the current path followed
///   by the typed value, and the resulting term is recorded in `postings_writer` for `doc`.
///   Strings go through `text_analyzer`; `Null` values and non-finite floats are ignored.
/// - Arrays: each element is indexed recursively under the same path.
/// - Objects: delegated to `index_json_object`.
///
/// # Panics
///
/// Panics (`unimplemented!`) on pre-tokenized string, bytes, facet and IP address leaves.
#[expect(clippy::too_many_arguments)]
pub(crate) fn index_json_value<'a, V: Value<'a>>(
    doc: DocId,
    json_value: V,
    text_analyzer: &mut TextAnalyzer,
    term_buffer: &mut IndexingTerm,
    json_path_writer: &mut JsonPathWriter,
    postings_writer: &mut dyn PostingsWriter,
    ctx: &mut IndexingContext,
    positions_per_path: &mut IndexingPositionsPerPath,
) {
    // Resets the value part of the term and writes the path id (big endian) in its place.
    let set_path_id = |term_buffer: &mut IndexingTerm, unordered_id: u32| {
        term_buffer.truncate_value_bytes(0);
        term_buffer.append_bytes(&unordered_id.to_be_bytes());
    };
    // Appends the one-byte type code after the path id.
    let set_type = |term_buffer: &mut IndexingTerm, typ: Type| {
        term_buffer.append_bytes(&[typ.to_code()]);
    };

    match json_value.as_value() {
        ReferenceValue::Leaf(leaf) => match leaf {
            // Nothing is indexed for null values.
            ReferenceValueLeaf::Null => {}
            ReferenceValueLeaf::Str(val) => {
                let mut token_stream = text_analyzer.token_stream(val);
                let unordered_id = ctx
                    .path_to_unordered_id
                    .get_or_allocate_unordered_id(json_path_writer.as_str());

                // TODO: make sure the chain position works out.
                set_path_id(term_buffer, unordered_id);
                set_type(term_buffer, Type::Str);
                // Positions are tracked per path, see `IndexingPositionsPerPath`.
                let indexing_position = positions_per_path.get_position_from_id(unordered_id);
                postings_writer.index_text(
                    doc,
                    &mut *token_stream,
                    term_buffer,
                    ctx,
                    indexing_position,
                );
            }
            ReferenceValueLeaf::U64(val) => {
                // try to parse to i64, since when querying we will apply the same logic and prefer
                // i64 values
                set_path_id(
                    term_buffer,
                    ctx.path_to_unordered_id
                        .get_or_allocate_unordered_id(json_path_writer.as_str()),
                );
                if let Ok(i64_val) = val.try_into() {
                    term_buffer.append_type_and_fast_value::<i64>(i64_val);
                } else {
                    term_buffer.append_type_and_fast_value::<u64>(val);
                }
                postings_writer.subscribe(doc, 0u32, term_buffer, ctx);
            }
            ReferenceValueLeaf::I64(val) => {
                set_path_id(
                    term_buffer,
                    ctx.path_to_unordered_id
                        .get_or_allocate_unordered_id(json_path_writer.as_str()),
                );
                term_buffer.append_type_and_fast_value(val);
                postings_writer.subscribe(doc, 0u32, term_buffer, ctx);
            }
            ReferenceValueLeaf::F64(val) => {
                // NaN and infinities are not indexed.
                if !val.is_finite() {
                    return;
                };
                set_path_id(
                    term_buffer,
                    ctx.path_to_unordered_id
                        .get_or_allocate_unordered_id(json_path_writer.as_str()),
                );
                // Normalize here is important.
                // In the inverted index, we coerce all numerical values to their canonical
                // representation.
                //
                // (We do the same thing on the query side)
                match NumericalValue::F64(val).normalize() {
                    NumericalValue::I64(val_i64) => {
                        term_buffer.append_type_and_fast_value::<i64>(val_i64);
                    }
                    NumericalValue::U64(val_u64) => {
                        term_buffer.append_type_and_fast_value::<u64>(val_u64);
                    }
                    NumericalValue::F64(val_f64) => {
                        term_buffer.append_type_and_fast_value::<f64>(val_f64);
                    }
                }
                postings_writer.subscribe(doc, 0u32, term_buffer, ctx);
            }
            ReferenceValueLeaf::Bool(val) => {
                set_path_id(
                    term_buffer,
                    ctx.path_to_unordered_id
                        .get_or_allocate_unordered_id(json_path_writer.as_str()),
                );
                term_buffer.append_type_and_fast_value(val);
                postings_writer.subscribe(doc, 0u32, term_buffer, ctx);
            }
            ReferenceValueLeaf::Date(val) => {
                set_path_id(
                    term_buffer,
                    ctx.path_to_unordered_id
                        .get_or_allocate_unordered_id(json_path_writer.as_str()),
                );
                // Dates are indexed with the `DATE_TIME_PRECISION_INDEXED` precision.
                let val = val.truncate(DATE_TIME_PRECISION_INDEXED);
                term_buffer.append_type_and_fast_value(val);
                postings_writer.subscribe(doc, 0u32, term_buffer, ctx);
            }
            ReferenceValueLeaf::PreTokStr(_) => {
                unimplemented!(
                    "Pre-tokenized string support in dynamic fields is not yet implemented"
                )
            }
            ReferenceValueLeaf::Bytes(_) => {
                unimplemented!("Bytes support in dynamic fields is not yet implemented")
            }
            ReferenceValueLeaf::Facet(_) => {
                unimplemented!("Facet support in dynamic fields is not yet implemented")
            }
            ReferenceValueLeaf::IpAddr(_) => {
                unimplemented!("IP address support in dynamic fields is not yet implemented")
            }
        },
        ReferenceValue::Array(elements) => {
            // Array elements share the path of the array itself: nothing is pushed
            // onto `json_path_writer`.
            for val in elements {
                index_json_value(
                    doc,
                    val,
                    text_analyzer,
                    term_buffer,
                    json_path_writer,
                    postings_writer,
                    ctx,
                    positions_per_path,
                );
            }
        }
        ReferenceValue::Object(object) => {
            index_json_object::<V>(
                doc,
                object,
                text_analyzer,
                term_buffer,
                json_path_writer,
                postings_writer,
                ctx,
                positions_per_path,
            );
        }
    }
}

/// Tries to infer a JSON type from a string and append it to the term.
///
/// The interpretations are attempted in this order: RFC 3339 date, number, boolean.
/// Returns `None` if `text` matches none of them.
///
/// The term must be json + JSON path.
///
/// # Panics
///
/// Panics if `term` is not a JSON term, or if it already carries value bytes after its path.
pub fn convert_to_fast_value_and_append_to_json_term(
    term: &Term,
    text: &str,
    truncate_date_for_search: bool,
) -> Option<Term> {
    let json_value_len = term
        .value()
        .as_json_value_bytes()
        .expect("expecting a Term with a json type and json path")
        .as_serialized()
        .len();
    assert_eq!(json_value_len, 0, "JSON value bytes should be empty");

    if let Some(date_term) =
        try_convert_to_datetime_and_append_to_json_term(term, text, truncate_date_for_search)
    {
        return Some(date_term);
    }
    if let Some(number_term) = try_convert_to_number_and_append_to_json_term(term, text) {
        return Some(number_term);
    }
    try_convert_to_bool_and_append_to_json_term_typed(term, text)
}

/// Parses `text` as an RFC 3339 date, converts it to UTC, and returns a copy of `term`
/// with that date appended. Returns `None` if `text` is not a valid RFC 3339 date.
///
/// When `truncate_date_for_search` is set, the date is truncated to
/// `DATE_TIME_PRECISION_INDEXED` before being appended.
fn try_convert_to_datetime_and_append_to_json_term(
    term: &Term,
    text: &str,
    truncate_date_for_search: bool,
) -> Option<Term> {
    let parsed = OffsetDateTime::parse(text, &Rfc3339).ok()?;
    let utc_date_time = DateTime::from_utc(parsed.to_offset(UtcOffset::UTC));
    let date_time = if truncate_date_for_search {
        utc_date_time.truncate(DATE_TIME_PRECISION_INDEXED)
    } else {
        utc_date_time
    };
    let mut json_term = term.clone();
    json_term.append_type_and_fast_value(date_time);
    Some(json_term)
}

/// Parses `text` as a number and returns a copy of `term` with the normalized numerical
/// value appended. Returns `None` if `text` is not a number.
fn try_convert_to_number_and_append_to_json_term(term: &Term, text: &str) -> Option<Term> {
    let parsed: NumericalValue = text.parse().ok()?;
    let mut json_term = term.clone();
    // Parse is actually returning normalized values already today, but let's
    // not rely on that hidden contract.
    match parsed.normalize() {
        NumericalValue::I64(as_i64) => {
            json_term.append_type_and_fast_value::<i64>(as_i64);
        }
        NumericalValue::U64(as_u64) => {
            json_term.append_type_and_fast_value::<u64>(as_u64);
        }
        NumericalValue::F64(as_f64) => {
            json_term.append_type_and_fast_value::<f64>(as_f64);
        }
    }
    Some(json_term)
}

/// Parses `text` as a boolean (`true` / `false`) and returns a copy of `term` with that
/// boolean appended. Returns `None` if `text` is not a boolean.
fn try_convert_to_bool_and_append_to_json_term_typed(term: &Term, text: &str) -> Option<Term> {
    let parsed: bool = text.parse().ok()?;
    let mut json_term = term.clone();
    json_term.append_type_and_fast_value(parsed);
    Some(json_term)
}

/// Splits a json path supplied to the query parser into its segments, in such a way
/// that `.` can be escaped with a backslash.
///
/// In other words,
/// - `k8s.node` ends up as `["k8s", "node"]`.
/// - `k8s\.node` ends up as `["k8s.node"]`.
///
/// A backslash makes the following character literal, whatever it is, and is itself
/// dropped from the output. A trailing backslash with nothing to escape is ignored.
/// The result always contains at least one (possibly empty) segment.
pub fn split_json_path(json_path: &str) -> Vec<String> {
    let mut segments: Vec<String> = Vec::new();
    let mut current_segment = String::new();
    let mut chars = json_path.chars();
    while let Some(ch) = chars.next() {
        match ch {
            '\\' => {
                // Consume the escaped character right away and take it verbatim.
                if let Some(escaped) = chars.next() {
                    current_segment.push(escaped);
                }
            }
            '.' => segments.push(std::mem::take(&mut current_segment)),
            other => current_segment.push(other),
        }
    }
    segments.push(current_segment);
    segments
}

/// Takes a field name, a json path as supplied by a user, and whether we should expand dots,
/// and returns a column key, as expected by the columnar crate.
///
/// This function will detect unescaped dots in the path, and split over them.
/// If expand_dots is enabled, then even escaped dots will be split over.
///
/// The resulting list of segments then gets stitched together, joined by the \1 separator,
/// as defined in the columnar crate.
pub(crate) fn encode_column_name(
    field_name: &str,
    json_path: &str,
    expand_dots_enabled: bool,
) -> String {
    let mut column_path = JsonPathWriter::default();
    // The field name is pushed before the dot expansion setting is applied.
    // NOTE(review): presumably so that dots in the field name are never expanded — confirm.
    column_path.push(field_name);
    column_path.set_expand_dots(expand_dots_enabled);
    split_json_path(json_path).iter().for_each(|segment| {
        column_path.push(segment);
    });
    column_path.into()
}

#[cfg(test)]
mod tests {
    use super::split_json_path;
    use crate::schema::Field;
    use crate::Term;

    /// Builds a JSON term for field 1 at `json_path` (dot expansion disabled), with no
    /// value appended yet.
    fn json_term(json_path: &str) -> Term {
        Term::from_field_json_path(Field::from_field_id(1), json_path, false)
    }

    #[test]
    fn test_json_writer() {
        let mut color_term = json_term("attributes.color");
        color_term.append_type_and_str("red");
        assert_eq!(
            format!("{color_term:?}"),
            "Term(field=1, type=Json, path=attributes.color, type=Str, \"red\")"
        );

        let mut width_term = json_term("attributes.dimensions.width");
        width_term.append_type_and_fast_value(400i64);
        assert_eq!(
            format!("{width_term:?}"),
            "Term(field=1, type=Json, path=attributes.dimensions.width, type=I64, 400)"
        );
    }

    #[test]
    fn test_string_term() {
        let mut term = json_term("color");
        term.append_type_and_str("red");

        let expected = b"color\x00sred".to_vec();
        assert_eq!(term.serialized_value_bytes(), expected);
    }

    #[test]
    fn test_i64_term() {
        let mut term = json_term("color");
        term.append_type_and_fast_value(-4i64);

        let expected = b"color\x00i\x7f\xff\xff\xff\xff\xff\xff\xfc".to_vec();
        assert_eq!(term.serialized_value_bytes(), expected);
    }

    #[test]
    fn test_u64_term() {
        let mut term = json_term("color");
        term.append_type_and_fast_value(4u64);

        let expected = b"color\x00u\x00\x00\x00\x00\x00\x00\x00\x04".to_vec();
        assert_eq!(term.serialized_value_bytes(), expected);
    }

    #[test]
    fn test_f64_term() {
        let mut term = json_term("color");
        term.append_type_and_fast_value(4.0f64);

        let expected = b"color\x00f\xc0\x10\x00\x00\x00\x00\x00\x00".to_vec();
        assert_eq!(term.serialized_value_bytes(), expected);
    }

    #[test]
    fn test_bool_term() {
        let mut term = json_term("color");
        term.append_type_and_fast_value(true);

        let expected = b"color\x00o\x00\x00\x00\x00\x00\x00\x00\x01".to_vec();
        assert_eq!(term.serialized_value_bytes(), expected);
    }

    #[test]
    fn test_split_json_path_simple() {
        assert_eq!(split_json_path("titi.toto"), ["titi", "toto"]);
    }

    #[test]
    fn test_split_json_path_single_segment() {
        assert_eq!(split_json_path("toto"), ["toto"]);
    }

    #[test]
    fn test_split_json_path_trailing_dot() {
        assert_eq!(split_json_path("toto."), ["toto", ""]);
    }

    #[test]
    fn test_split_json_path_heading_dot() {
        assert_eq!(split_json_path(".toto"), ["", "toto"]);
    }

    #[test]
    fn test_split_json_path_escaped_dot() {
        assert_eq!(split_json_path(r"toto\.titi"), ["toto.titi"]);
        assert_eq!(
            split_json_path(r"k8s\.container\.name"),
            ["k8s.container.name"]
        );
    }

    #[test]
    fn test_split_json_path_escaped_backslash() {
        assert_eq!(split_json_path(r"toto\\titi"), [r"toto\titi"]);
    }

    #[test]
    fn test_split_json_path_escaped_normal_letter() {
        // Escaping a regular character simply yields that character.
        assert_eq!(split_json_path(r"toto\titi"), ["tototiti"]);
    }
}


================================================
FILE: src/core/mod.rs
================================================
mod executor;
#[doc(hidden)]
pub mod json_utils;
pub mod searcher;

use std::path::Path;

use once_cell::sync::Lazy;

pub use self::executor::Executor;
pub use self::searcher::{Searcher, SearcherGeneration};

/// The meta file contains all the information about the list of segments and the schema
/// of the index.
///
/// The path is the bare file name `meta.json`; it is lazily initialized on first access.
pub static META_FILEPATH: Lazy<&'static Path> = Lazy::new(|| Path::new("meta.json"));

/// The managed file contains the list of files that were created by tantivy
/// and will therefore be garbage collected once tantivy deems them useless.
///
/// Removing this file is safe, but will prevent the garbage collection of all of the files
/// that are currently in the directory.
///
/// The path is the bare file name `.managed.json`; it is lazily initialized on first access.
pub static MANAGED_FILEPATH: Lazy<&'static Path> = Lazy::new(|| Path::new(".managed.json"));

#[cfg(test)]
mod tests;


================================================
FILE: src/core/searcher.rs
================================================
use std::collections::BTreeMap;
use std::sync::Arc;
use std::{fmt, io};

use crate::collector::Collector;
use crate::core::Executor;
use crate::index::{SegmentId, SegmentReader};
use crate::query::{Bm25StatisticsProvider, EnableScoring, Query};
use crate::schema::document::DocumentDeserialize;
use crate::schema::{Schema, Term};
use crate::space_usage::SearcherSpaceUsage;
use crate::store::{CacheStats, StoreReader};
use crate::{DocAddress, Index, Opstamp, TrackedObject};

/// Identifies the searcher generation accessed by a [`Searcher`].
///
/// While this might seem redundant, a [`SearcherGeneration`] contains
/// both a `generation_id` AND a list of `(SegmentId, DeleteOpstamp)`.
///
/// This is on purpose. This object is used by the [`Warmer`](crate::reader::Warmer) API.
/// Having both pieces of information makes it possible to identify which
/// artifact should be refreshed or garbage collected.
///
/// Depending on the use case, `Warmer`'s implementers can decide to
/// produce artifacts per:
/// - `generation_id` (e.g. some searcher level aggregates)
/// - `(segment_id, delete_opstamp)` (e.g. segment level aggregates)
/// - `segment_id` (e.g. for immutable document level information)
/// - `(generation_id, segment_id)` (e.g. for consistent dynamic column)
/// - ...
#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash)]
pub struct SearcherGeneration {
    /// Delete opstamp (if any) of every segment, keyed by segment id.
    segments: BTreeMap<SegmentId, Option<Opstamp>>,
    /// Identifier of the generation itself.
    generation_id: u64,
}

impl SearcherGeneration {
    /// Builds a generation from the given segment readers.
    ///
    /// Each reader contributes one `(segment id, delete opstamp)` entry.
    pub(crate) fn from_segment_readers(
        segment_readers: &[SegmentReader],
        generation_id: u64,
    ) -> Self {
        let segments: BTreeMap<SegmentId, Option<Opstamp>> = segment_readers
            .iter()
            .map(|reader| (reader.segment_id(), reader.delete_opstamp()))
            .collect();
        Self {
            segments,
            generation_id,
        }
    }

    /// Identifier of this searcher generation.
    pub fn generation_id(&self) -> u64 {
        self.generation_id
    }

    /// The `(SegmentId -> DeleteOpstamp)` mapping of this generation.
    pub fn segments(&self) -> &BTreeMap<SegmentId, Option<Opstamp>> {
        &self.segments
    }
}

/// Holds a list of `SegmentReader`s ready for search.
///
/// It guarantees that the `Segment` will not be removed before
/// the destruction of the `Searcher`.
///
/// The state lives behind an `Arc`, so cloning a `Searcher` only clones that `Arc`.
#[derive(Clone)]
pub struct Searcher {
    /// Shared state backing this searcher.
    inner: Arc<SearcherInner>,
}

impl Searcher {
    /// Returns the `Index` associated with the `Searcher`
    pub fn index(&self) -> &Index {
        &self.inner.index
    }

    /// [`SearcherGeneration`] which identifies the version of the snapshot held by this `Searcher`.
    pub fn generation(&self) -> &SearcherGeneration {
        self.inner.generation.as_ref()
    }

    /// Fetches a document from tantivy's store given a [`DocAddress`].
    ///
    /// The searcher uses the segment ordinal to route the
    /// request to the right `Segment`.
    pub fn doc<D: DocumentDeserialize>(&self, doc_address: DocAddress) -> crate::Result<D> {
        let store_reader = &self.inner.store_readers[doc_address.segment_ord as usize];
        store_reader.get(doc_address.doc_id)
    }

    /// The cache stats for the underlying store reader.
    ///
    /// Aggregates the sum for each segment store reader.
    pub fn doc_store_cache_stats(&self) -> CacheStats {
        let cache_stats: CacheStats = self
            .inner
            .store_readers
            .iter()
            .map(|reader| reader.cache_stats())
            .sum();
        cache_stats
    }

    /// Fetches a document in an asynchronous manner.
    #[cfg(feature = "quickwit")]
    pub async fn doc_async<D: DocumentDeserialize>(
        &self,
        doc_address: DocAddress,
    ) -> crate::Result<D> {
        let executor = self.inner.index.search_executor();
        let store_reader = &self.inner.store_readers[doc_address.segment_ord as usize];
        store_reader.get_async(doc_address.doc_id, executor).await
    }

    /// Access the schema associated with the index of this searcher.
    pub fn schema(&self) -> &Schema {
        &self.inner.schema
    }

    /// Returns the overall number of documents in the index.
    pub fn num_docs(&self) -> u64 {
        self.inner
            .segment_readers
            .iter()
            .map(|segment_reader| u64::from(segment_reader.num_docs()))
            .sum::<u64>()
    }

    /// Return the overall number of documents containing
    /// the given term.
    pub fn doc_freq(&self, term: &Term) -> crate::Result<u64> {
        let mut total_doc_freq = 0;
        for segment_reader in &self.inner.segment_readers {
            let inverted_index = segment_reader.inverted_index(term.field())?;
            let doc_freq = inverted_index.doc_freq(term)?;
            total_doc_freq += u64::from(doc_freq);
        }
        Ok(total_doc_freq)
    }

    /// Return the overall number of documents containing
    /// the given term in an asynchronous manner.
    #[cfg(feature = "quickwit")]
    pub async fn doc_freq_async(&self, term: &Term) -> crate::Result<u64> {
        let mut total_doc_freq = 0;
        for segment_reader in &self.inner.segment_readers {
            let inverted_index = segment_reader.inverted_index(term.field())?;
            let doc_freq = inverted_index.doc_freq_async(term).await?;
            total_doc_freq += u64::from(doc_freq);
        }
        Ok(total_doc_freq)
    }

    /// Return the list of segment readers
    pub fn segment_readers(&self) -> &[SegmentReader] {
        &self.inner.segment_readers
    }

    /// Returns the segment_reader associated with the given segment_ord
    pub fn segment_reader(&self, segment_ord: u32) -> &SegmentReader {
        &self.inner.segment_readers[segment_ord as usize]
    }

    /// Runs a query on the segment readers wrapped by the searcher.
    ///
    /// Search works as follows :
    ///
    ///  First the weight object associated with the query is created.
    ///
    ///  Then, the query loops over the segments and for each segment :
    ///  - setup the collector and informs it that the segment being processed has changed.
    ///  - creates a SegmentCollector for collecting documents associated with the segment
    ///  - creates a `Scorer` object associated for this segment
    ///  - iterate through the matched documents and push them to the segment collector.
    ///
    ///  Finally, the Collector merges each of the child collectors into itself for result usability
    ///  by the caller.
    pub fn search<C: Collector>(
        &self,
        query: &dyn Query,
        collector: &C,
    ) -> crate::Result<C::Fruit> {
        self.search_with_statistics_provider(query, collector, self)
    }

    /// Same as [`search(...)`](Searcher::search) but allows specifying
    /// a [Bm25StatisticsProvider].
    ///
    /// This can be used to adjust the statistics used in computing BM25
    /// scores.
    pub fn search_with_statistics_provider<C: Collector>(
        &self,
        query: &dyn Query,
        collector: &C,
        statistics_provider: &dyn Bm25StatisticsProvider,
    ) -> crate::Result<C::Fruit> {
        let enabled_scoring = if collector.requires_scoring() {
            EnableScoring::enabled_from_statistics_provider(statistics_provider, self)
        } else {
            EnableScoring::disabled_from_searcher(self)
        };
        let executor = self.inner.index.search_executor();
        self.search_with_executor(query, collector, executor, enabled_scoring)
    }

    /// Same as [`search(...)`](Searcher::search) but multithreaded.
    ///
    /// The current implementation is rather naive :
    /// multithreading is by splitting search into as many task
    /// as there are segments.
    ///
    /// It is powerless at making search faster if your index consists in
    /// one large segment.
    ///
    /// Also, keep in mind multithreading a single query on several
    /// threads will not improve your throughput. It can actually
    /// hurt it. It will however, decrease the average response time.
    pub fn search_with_executor<C: Collector>(
        &self,
        query: &dyn Query,
        collector: &C,
        executor: &Executor,
        enabled_scoring: EnableScoring,
    ) -> crate::Result<C::Fruit> {
        let weight = query.weight(enabled_scoring)?;
        collector.check_schema(self.schema())?;
        let segment_readers = self.segment_readers();
        let fruits = executor.map(
            |(segment_ord, segment_reader)| {
                collector.collect_segment(weight.as_ref(), segment_ord as u32, segment_reader)
            },
            segment_readers.iter().enumerate(),
        )?;
        collector.merge_fruits(fruits)
    }

    /// Summarize total space usage of this searcher.
    pub fn space_usage(&self) -> io::Result<SearcherSpaceUsage> {
        let mut space_usage = SearcherSpaceUsage::new();
        for segment_reader in self.segment_readers() {
            space_usage.add_segment(segment_reader.space_usage()?);
        }
        Ok(space_usage)
    }
}

impl From<Arc<SearcherInner>> for Searcher {
    fn from(inner: Arc<SearcherInner>) -> Self {
        Searcher { inner }
    }
}

/// Holds a list of `SegmentReader`s ready for search.
///
/// It guarantees that the `Segment` will not be removed before
/// the destruction of the `Searcher`.
///
/// This is the state shared (behind an `Arc`) by all clones of a `Searcher`.
pub(crate) struct SearcherInner {
    /// Schema returned by `Searcher::schema`.
    schema: Schema,
    /// Index returned by `Searcher::index`.
    index: Index,
    /// Segment readers, addressed by segment ordinal.
    segment_readers: Vec<SegmentReader>,
    /// One store reader per segment reader, in the same order.
    store_readers: Vec<StoreReader>,
    /// Generation describing the set of segments held by this searcher.
    generation: TrackedObject<SearcherGeneration>,
}

impl SearcherInner {
    /// Creates a new `SearcherInner`.
    ///
    /// One store reader is opened per segment reader, using
    /// `doc_store_cache_num_blocks` as its cache size.
    ///
    /// # Panics
    ///
    /// Panics if the `(segment id, delete opstamp)` pairs of `segment_readers`
    /// do not match the segments recorded in `generation`.
    pub(crate) fn new(
        schema: Schema,
        index: Index,
        segment_readers: Vec<SegmentReader>,
        generation: TrackedObject<SearcherGeneration>,
        doc_store_cache_num_blocks: usize,
    ) -> io::Result<SearcherInner> {
        let segments_from_readers: BTreeMap<_, _> = segment_readers
            .iter()
            .map(|reader| (reader.segment_id(), reader.delete_opstamp()))
            .collect();
        assert_eq!(
            &segments_from_readers,
            generation.segments(),
            "Set of segments referenced by this Searcher and its SearcherGeneration must match"
        );

        // Stops at the first store reader that fails to open.
        let mut store_readers: Vec<StoreReader> = Vec::with_capacity(segment_readers.len());
        for reader in &segment_readers {
            store_readers.push(reader.get_store_reader(doc_store_cache_num_blocks)?);
        }

        Ok(SearcherInner {
            schema,
            index,
            segment_readers,
            store_readers,
            generation,
        })
    }
}

impl fmt::Debug for Searcher {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        let segment_ids = self
            .segment_readers()
            .iter()
            .map(SegmentReader::segment_id)
            .collect::<Vec<_>>();
        write!(f, "Searcher({segment_ids:?})")
    }
}


================================================
FILE: src/core/tests.rs
================================================
use crate::collector::Count;
use crate::directory::{RamDirectory, WatchCallback};
use crate::index::SegmentId;
use crate::indexer::{LogMergePolicy, NoMergePolicy};
use crate::postings::Postings;
use crate::query::TermQuery;
use crate::schema::{Field, IndexRecordOption, Schema, INDEXED, STRING, TEXT};
use crate::tokenizer::TokenizerManager;
use crate::{
    Directory, DocSet, Index, IndexBuilder, IndexReader, IndexSettings, IndexWriter, ReloadPolicy,
    TantivyDocument, Term,
};

#[test]
fn test_indexer_for_field() {
    let mut builder = Schema::builder();
    let likes = builder.add_u64_field("num_likes", INDEXED);
    let body = builder.add_text_field("body", TEXT);
    let index = Index::create_in_ram(builder.build());

    // A text field resolves to a tokenizer...
    assert!(index.tokenizer_for_field(body).is_ok());

    // ...whereas asking for the tokenizer of a u64 field is a schema error.
    let likes_error = format!("{:?}", index.tokenizer_for_field(likes).err());
    assert_eq!(
        likes_error,
        "Some(SchemaError(\"\\\"num_likes\\\" is not a text field.\"))"
    );
}

#[test]
fn test_set_tokenizer_manager() {
    let schema = {
        let mut builder = Schema::builder();
        builder.add_u64_field("num_likes", INDEXED);
        builder.add_text_field("body", TEXT);
        builder.build()
    };
    // Install an empty tokenizer manager on the index.
    let empty_manager = TokenizerManager::new();
    let index = IndexBuilder::new()
        .tokenizers(empty_manager)
        .schema(schema)
        .create_in_ram()
        .unwrap();
    let raw_tokenizer = index.tokenizers().get("raw");
    assert!(raw_tokenizer.is_none());
}

#[test]
fn test_index_exists() {
    let directory: Box<dyn Directory> = Box::new(RamDirectory::create());

    // Nothing has been created yet.
    let exists_before = Index::exists(directory.as_ref()).unwrap();
    assert!(!exists_before);

    let creation_succeeded = Index::create(
        directory.clone(),
        throw_away_schema(),
        IndexSettings::default(),
    )
    .is_ok();
    assert!(creation_succeeded);

    let exists_after = Index::exists(directory.as_ref()).unwrap();
    assert!(exists_after);
}

#[test]
fn open_or_create_should_create() {
    let directory = RamDirectory::create();

    let exists_before = Index::exists(&directory).unwrap();
    assert!(!exists_before);

    // With no index present, `open_or_create` has to create one.
    let outcome_is_ok = Index::open_or_create(directory.clone(), throw_away_schema()).is_ok();
    assert!(outcome_is_ok);

    let exists_after = Index::exists(&directory).unwrap();
    assert!(exists_after);
}

#[test]
fn open_or_create_should_open() {
    let directory: Box<dyn Directory> = Box::new(RamDirectory::create());

    let creation_succeeded = Index::create(
        directory.clone(),
        throw_away_schema(),
        IndexSettings::default(),
    )
    .is_ok();
    assert!(creation_succeeded);
    assert!(Index::exists(directory.as_ref()).unwrap());

    // The index already exists with the same schema: it must simply be opened.
    let opening_succeeded = Index::open_or_create(directory, throw_away_schema()).is_ok();
    assert!(opening_succeeded);
}

#[test]
fn create_should_wipeoff_existing() {
    let directory: Box<dyn Directory> = Box::new(RamDirectory::create());

    let first_creation_succeeded = Index::create(
        directory.clone(),
        throw_away_schema(),
        IndexSettings::default(),
    )
    .is_ok();
    assert!(first_creation_succeeded);
    assert!(Index::exists(directory.as_ref()).unwrap());

    // Creating again in the same directory, with a different (empty) schema, must succeed.
    let empty_schema = Schema::builder().build();
    let second_creation_succeeded =
        Index::create(directory, empty_schema, IndexSettings::default()).is_ok();
    assert!(second_creation_succeeded);
}

#[test]
fn open_or_create_exists_but_schema_does_not_match() {
    let directory = RamDirectory::create();

    let creation_succeeded = Index::create(
        directory.clone(),
        throw_away_schema(),
        IndexSettings::default(),
    )
    .is_ok();
    assert!(creation_succeeded);
    assert!(Index::exists(&directory).unwrap());

    // Same schema: opening works.
    let same_schema_is_ok = Index::open_or_create(directory.clone(), throw_away_schema()).is_ok();
    assert!(same_schema_is_ok);

    // Different schema: opening is rejected with a schema error.
    let mismatch = Index::open_or_create(directory, Schema::builder().build());
    let mismatch_debug = format!("{:?}", mismatch.unwrap_err());
    assert_eq!(
        mismatch_debug,
        "SchemaError(\"An index exists but the schema does not match.\")"
    );
}

/// Builds a minimal schema made of a single indexed u64 field named `num_likes`.
fn throw_away_schema() -> Schema {
    let mut builder = Schema::builder();
    builder.add_u64_field("num_likes", INDEXED);
    builder.build()
}

#[test]
fn test_index_on_commit_reload_policy() -> crate::Result<()> {
    let schema = throw_away_schema();
    let num_likes = schema.get_field("num_likes").unwrap();
    let index = Index::create_in_ram(schema);
    let reader: IndexReader = index
        .reader_builder()
        .reload_policy(ReloadPolicy::OnCommitWithDelay)
        .try_into()
        .unwrap();
    // The freshly created index holds no document.
    let initial_num_docs = reader.searcher().num_docs();
    assert_eq!(initial_num_docs, 0);
    test_index_on_commit_reload_policy_aux(num_likes, &index, &reader)
}

#[cfg(feature = "mmap")]
mod mmap_specific {

    use std::path::PathBuf;

    use tempfile::TempDir;

    use super::*;

    /// Same scenario as the in-RAM reload test, on an index created in a temporary directory.
    #[test]
    fn test_index_on_commit_reload_policy_mmap() -> crate::Result<()> {
        let schema = throw_away_schema();
        let num_likes = schema.get_field("num_likes").unwrap();
        let tempdir = TempDir::new().unwrap();
        let index_path = PathBuf::from(tempdir.path());
        let index = Index::create_in_dir(index_path, schema).unwrap();
        let reader: IndexReader = index
            .reader_builder()
            .reload_policy(ReloadPolicy::OnCommitWithDelay)
            .try_into()
            .unwrap();
        let initial_num_docs = reader.searcher().num_docs();
        assert_eq!(initial_num_docs, 0);
        test_index_on_commit_reload_policy_aux(num_likes, &index, &reader)
    }

    /// With the manual policy, a commit is only visible after an explicit `reload()`.
    #[test]
    fn test_index_manual_policy_mmap() -> crate::Result<()> {
        let schema = throw_away_schema();
        let num_likes = schema.get_field("num_likes").unwrap();
        let mut index = Index::create_from_tempdir(schema)?;
        let mut writer: IndexWriter = index.writer_for_tests()?;
        writer.commit()?;
        let reader: IndexReader = index
            .reader_builder()
            .reload_policy(ReloadPolicy::Manual)
            .try_into()?;
        assert_eq!(reader.searcher().num_docs(), 0);

        writer.add_document(doc!(num_likes=>1u64))?;
        // Get notified through the channel whenever the directory watcher fires.
        let (notifier, notifications) = crossbeam_channel::unbounded();
        let _handle = index.directory_mut().watch(WatchCallback::new(move || {
            let _ = notifier.send(());
        }));
        writer.commit()?;
        assert!(notifications.recv().is_ok());

        // The commit happened, but the reader has not been reloaded yet.
        assert_eq!(reader.searcher().num_docs(), 0);
        reader.reload()?;
        assert_eq!(reader.searcher().num_docs(), 1);
        Ok(())
    }

    /// Writes through one `Index` and reads through another one opened on the same directory.
    #[test]
    fn test_index_on_commit_reload_policy_different_directories() -> crate::Result<()> {
        let schema = throw_away_schema();
        let num_likes = schema.get_field("num_likes").unwrap();
        let tempdir = TempDir::new().unwrap();
        let index_path = PathBuf::from(tempdir.path());
        let write_index = Index::create_in_dir(&index_path, schema).unwrap();
        let read_index = Index::open_in_dir(&index_path).unwrap();
        let reader: IndexReader = read_index
            .reader_builder()
            .reload_policy(ReloadPolicy::OnCommitWithDelay)
            .try_into()
            .unwrap();
        let initial_num_docs = reader.searcher().num_docs();
        assert_eq!(initial_num_docs, 0);
        test_index_on_commit_reload_policy_aux(num_likes, &write_index, &reader)
    }
}
/// Shared body of the reload-policy tests.
///
/// Commits two documents one after the other through `index`, and after each
/// commit waits until `reader` exposes the expected number of documents.
fn test_index_on_commit_reload_policy_aux(
    field: Field,
    index: &Index,
    reader: &IndexReader,
) -> crate::Result<()> {
    let mut watched_index = reader.index();
    let (notifier, notifications) = crossbeam_channel::unbounded();
    let _watch_handle = watched_index
        .directory_mut()
        .watch(WatchCallback::new(move || {
            let _ = notifier.send(());
        }));

    // Blocks on watcher notifications until the reader sees `expected` documents.
    // A loop is needed because it is possible for notify to send more than
    // one modify event. It was observed on CI on MacOS.
    let wait_for_num_docs = |expected: u64| loop {
        assert!(notifications.recv().is_ok());
        if reader.searcher().num_docs() == expected {
            break;
        }
    };

    let mut writer: IndexWriter = index.writer_for_tests()?;
    assert_eq!(reader.searcher().num_docs(), 0);

    writer.add_document(doc!(field=>1u64))?;
    writer.commit().unwrap();
    wait_for_num_docs(1);

    writer.add_document(doc!(field=>2u64))?;
    writer.commit().unwrap();
    wait_for_num_docs(2);

    Ok(())
}

// This test will not pass on Windows, because Windows
// prevents deleting files that are memory-mapped.
#[cfg(not(target_os = "windows"))]
#[test]
fn garbage_collect_works_as_intended() -> crate::Result<()> {
    let directory = RamDirectory::create();
    let schema = throw_away_schema();
    let num_likes = schema.get_field("num_likes").unwrap();
    let index = Index::create(directory.clone(), schema, IndexSettings::default())?;

    // Eight commits of 1_000 documents each.
    let mut writer: IndexWriter = index.writer_with_num_threads(1, 32_000_000).unwrap();
    for _commit in 0..8 {
        for value in 0u64..1_000u64 {
            writer.add_document(doc!(num_likes => value))?;
        }
        writer.commit()?;
    }

    let mem_right_after_commit = directory.total_mem_usage();

    let reader: IndexReader = index
        .reader_builder()
        .reload_policy(ReloadPolicy::Manual)
        .try_into()?;
    {
        let searcher_before_merge = reader.searcher();
        assert_eq!(searcher_before_merge.num_docs(), 8_000);
    }
    assert_eq!(reader.searcher().segment_readers().len(), 8);

    writer.wait_merging_threads()?;

    let mem_right_after_merge_finished = directory.total_mem_usage();

    // After reloading, a single merged segment holding all the documents is expected.
    reader.reload().unwrap();
    let searcher_after_merge = reader.searcher();
    assert_eq!(searcher_after_merge.segment_readers().len(), 1);
    assert_eq!(searcher_after_merge.num_docs(), 8_000);
    assert!(
        mem_right_after_merge_finished < mem_right_after_commit,
        "(mem after merge){mem_right_after_merge_finished} is expected < (mem before \
         merge){mem_right_after_commit}"
    );
    Ok(())
}

#[test]
fn test_single_segment_index_writer() -> crate::Result<()> {
    let mut builder = Schema::builder();
    let text = builder.add_text_field("text", TEXT);
    let schema = builder.build();

    // Index ten identical documents through the single-segment writer.
    let mut segment_writer = Index::builder()
        .schema(schema)
        .single_segment_index_writer(RamDirectory::default(), 15_000_000)?;
    for _ in 0..10 {
        segment_writer.add_document(doc!(text=>"hello"))?;
    }
    let index = segment_writer.finalize()?;

    // All ten documents must match the term query.
    let hello_term = Term::from_field_text(text, "hello");
    let hello_query = TermQuery::new(hello_term, IndexRecordOption::Basic);
    let searcher = index.reader()?.searcher();
    let num_hits = searcher.search(&hello_query, &Count)?;
    assert_eq!(num_hits, 10);
    Ok(())
}

#[test]
fn test_merging_segment_update_docfreq() {
    let mut builder = Schema::builder();
    let text = builder.add_text_field("text", TEXT);
    let id = builder.add_text_field("id", STRING);
    let index = Index::create_in_ram(builder.build());
    let mut writer: IndexWriter = index.writer_for_tests().unwrap();
    writer.set_merge_policy(Box::new(NoMergePolicy));

    // First commit: 5 "hello" docs, 2 "hello" docs flagged for deletion, 1 empty doc.
    for _ in 0..5 {
        writer.add_document(doc!(text=>"hello")).unwrap();
    }
    for _ in 0..2 {
        writer
            .add_document(doc!(text=>"hello", id=>"TO_BE_DELETED"))
            .unwrap();
    }
    writer.add_document(TantivyDocument::default()).unwrap();
    writer.commit().unwrap();

    // Second commit: 7 "hello" docs, 2 empty docs, and the deletion of the flagged docs.
    for _ in 0..7 {
        writer.add_document(doc!(text=>"hello")).unwrap();
    }
    for _ in 0..2 {
        writer.add_document(TantivyDocument::default()).unwrap();
    }
    writer.delete_term(Term::from_field_text(id, "TO_BE_DELETED"));
    writer.commit().unwrap();

    // Merge every segment explicitly.
    let all_segment_ids: Vec<SegmentId> = index
        .list_all_segment_metas()
        .into_iter()
        .map(|segment_meta| segment_meta.id())
        .collect();
    writer.merge(&all_segment_ids[..]).wait().unwrap();

    let reader = index.reader().unwrap();
    let searcher = reader.searcher();
    assert_eq!(searcher.segment_readers().len(), 1);
    assert_eq!(searcher.num_docs(), 15);
    let merged_segment = searcher.segment_reader(0);
    assert_eq!(merged_segment.max_doc(), 15);

    // The doc freq of "hello" must no longer count the deleted documents.
    let hello = Term::from_field_text(text, "hello");
    let hello_info = merged_segment
        .inverted_index(text)
        .unwrap()
        .get_term_info(&hello)
        .unwrap()
        .unwrap();
    assert_eq!(hello_info.doc_freq, 12);
}

// Motivated by https://github.com/quickwit-oss/quickwit/issues/4130
#[test]
fn test_positions_merge_bug_non_text_json_vint() {
    let mut builder = Schema::builder();
    let json_field = builder.add_json_field("dynamic", TEXT);
    let index = Index::create_in_ram(builder.build());
    let mut writer: IndexWriter = index.writer_for_tests().unwrap();

    // Merge as soon as two segments are available.
    let mut policy = LogMergePolicy::default();
    policy.set_min_num_segments(2);
    writer.set_merge_policy(Box::new(policy));

    // Note: with a string value instead of a number, this would work.
    let object = serde_json::from_str(r#"{"tenant_id":75}"#).unwrap();
    let mut doc = TantivyDocument::default();
    doc.add_object(json_field, object);

    // Two commits of a single document each, i.e. two segments to merge.
    for _ in 0..2 {
        writer.add_document(doc.clone()).unwrap();
        writer.commit().unwrap();
    }
    writer.wait_merging_threads().unwrap();

    let reader = index.reader().unwrap();
    let num_segments = reader.searcher().segment_readers().len();
    assert_eq!(num_segments, 1);
}

// Same scenario as the vint variant of this test, but with bitpacked blocks:
// the first segment receives 128 documents.
#[test]
fn test_positions_merge_bug_non_text_json_bitpacked_block() {
    let mut builder = Schema::builder();
    let json_field = builder.add_json_field("dynamic", TEXT);
    let index = Index::create_in_ram(builder.build());
    let mut writer: IndexWriter = index.writer_for_tests().unwrap();

    // Merge as soon as two segments are available.
    let mut policy = LogMergePolicy::default();
    policy.set_min_num_segments(2);
    writer.set_merge_policy(Box::new(policy));

    // Note: with a string value instead of a number, this would work.
    let object = serde_json::from_str(r#"{"tenant_id":75}"#).unwrap();
    let mut doc = TantivyDocument::default();
    doc.add_object(json_field, object);

    // First segment: 128 documents.
    for _ in 0..128 {
        writer.add_document(doc.clone()).unwrap();
    }
    writer.commit().unwrap();
    // Second segment: a single document.
    writer.add_document(doc.clone()).unwrap();
    writer.commit().unwrap();
    writer.wait_merging_threads().unwrap();

    let reader = index.reader().unwrap();
    let num_segments = reader.searcher().segment_readers().len();
    assert_eq!(num_segments, 1);
}

#[test]
fn test_non_text_json_term_freq() {
    let mut builder = Schema::builder();
    let json_field = builder.add_json_field("dynamic", TEXT);
    let index = Index::create_in_ram(builder.build());
    let mut writer: IndexWriter = index.writer_for_tests().unwrap();

    // Note: with a string value instead of a number, this would work.
    let object = serde_json::from_str(r#"{"tenant_id":75}"#).unwrap();
    let mut doc = TantivyDocument::default();
    doc.add_object(json_field, object);
    writer.add_document(doc.clone()).unwrap();
    writer.commit().unwrap();

    let reader = index.reader().unwrap();
    assert_eq!(reader.searcher().segment_readers().len(), 1);
    let searcher = reader.searcher();
    let inverted_index = searcher
        .segment_reader(0u32)
        .inverted_index(json_field)
        .unwrap();

    // Term for the i64 value 75 stored under the `tenant_id` path.
    let mut tenant_term = Term::from_field_json_path(json_field, "tenant_id", false);
    tenant_term.append_type_and_fast_value(75i64);

    let postings = inverted_index
        .read_postings(&tenant_term, IndexRecordOption::WithFreqsAndPositions)
        .unwrap()
        .unwrap();
    assert_eq!(postings.doc(), 0);
    assert_eq!(postings.term_freq(), 1u32);
}

#[test]
fn test_non_text_json_term_freq_bitpacked() {
    let mut builder = Schema::builder();
    let json_field = builder.add_json_field("dynamic", TEXT);
    let index = Index::create_in_ram(builder.build());
    let mut writer: IndexWriter = index.writer_for_tests().unwrap();

    // Note: with a string value instead of a number, this would work.
    let object = serde_json::from_str(r#"{"tenant_id":75}"#).unwrap();
    let mut doc = TantivyDocument::default();
    doc.add_object(json_field, object);
    let num_docs = 132;
    for _ in 0..num_docs {
        writer.add_document(doc.clone()).unwrap();
    }
    writer.commit().unwrap();

    let reader = index.reader().unwrap();
    assert_eq!(reader.searcher().segment_readers().len(), 1);
    let searcher = reader.searcher();
    let inverted_index = searcher
        .segment_reader(0u32)
        .inverted_index(json_field)
        .unwrap();

    // Term for the i64 value 75 stored under the `tenant_id` path.
    let mut tenant_term = Term::from_field_json_path(json_field, "tenant_id", false);
    tenant_term.append_type_and_fast_value(75i64);

    let mut postings = inverted_index
        .read_postings(&tenant_term, IndexRecordOption::WithFreqsAndPositions)
        .unwrap()
        .unwrap();
    // The postings start on doc 0; every following doc must show up with a term freq of 1.
    assert_eq!(postings.doc(), 0);
    assert_eq!(postings.term_freq(), 1u32);
    for expected_doc in 1..num_docs {
        assert_eq!(postings.advance(), expected_doc);
        assert_eq!(postings.term_freq(), 1u32);
    }
}


================================================
FILE: src/directory/composite_file.rs
================================================
use std::collections::HashMap;
use std::io::{self, Read, Write};
use std::ops::Range;

use common::{BinarySerializable, CountingWriter, HasLen, VInt};

use crate::directory::{FileSlice, TerminatingWrite, WritePtr};
use crate::schema::{Field, Schema};
use crate::space_usage::{FieldUsage, PerFieldSpaceUsage};

/// Address of one section of a composite file: a `Field` together with an index.
///
/// It is the key under which the byte range of a section is recorded.
#[derive(Eq, PartialEq, Hash, Copy, Ord, PartialOrd, Clone, Debug)]
pub struct FileAddr {
    /// Field the section belongs to.
    field: Field,
    /// Index of the section within the field (`for_field` uses 0).
    idx: usize,
}

impl FileAddr {
    fn new(field: Field, idx: usize) -> FileAddr {
        FileAddr { field, idx }
    }
}

impl BinarySerializable for FileAddr {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        self.field.serialize(writer)?;
        VInt(self.idx as u64).serialize(writer)?;
        Ok(())
    }

    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        let field = Field::deserialize(reader)?;
        let idx = VInt::deserialize(reader)?.0 as usize;
        Ok(FileAddr { field, idx })
    }
}

/// A `CompositeWrite` is used to write a `CompositeFile`.
pub struct CompositeWrite<W = WritePtr> {
    /// Underlying writer, wrapped to keep track of the number of bytes written.
    write: CountingWriter<W>,
    /// Start offset of every section, in the order in which the sections were started.
    offsets: Vec<(FileAddr, u64)>,
}

impl<W: TerminatingWrite + Write> CompositeWrite<W> {
    /// Creates a new writer that writes a composite file
    /// into the given `write`.
    pub fn wrap(w: W) -> CompositeWrite<W> {
        CompositeWrite {
            write: CountingWriter::wrap(w),
            offsets: Vec::new(),
        }
    }

    /// Start writing a new field.
    ///
    /// Shorthand for [`for_field_with_idx`](Self::for_field_with_idx) with index 0.
    ///
    /// # Panics
    ///
    /// Panics if a section was already started for this field with index 0.
    pub fn for_field(&mut self, field: Field) -> &mut CountingWriter<W> {
        self.for_field_with_idx(field, 0)
    }

    /// Start writing a new section for `field`, identified by `idx`.
    ///
    /// The current write position is recorded as the start offset of the section,
    /// and the underlying writer is returned so that the payload can be written.
    ///
    /// # Panics
    ///
    /// Panics if a section was already started for the same `(field, idx)` pair.
    pub fn for_field_with_idx(&mut self, field: Field, idx: usize) -> &mut CountingWriter<W> {
        let offset = self.write.written_bytes();
        let file_addr = FileAddr::new(field, idx);
        assert!(!self.offsets.iter().any(|el| el.0 == file_addr));
        self.offsets.push((file_addr, offset));
        &mut self.write
    }

    /// Close the composite file
    ///
    /// An index of the different field offsets
    /// will be written as a footer. The footer is made of the number of sections,
    /// then for each section its start offset (delta-encoded against the previous
    /// one) and its address, and finally the length of the footer as a `u32`.
    ///
    /// # Errors
    ///
    /// Returns an error if writing fails, or if the footer is too large for its
    /// length to be stored in a `u32`.
    pub fn close(mut self) -> io::Result<()> {
        let footer_offset = self.write.written_bytes();
        VInt(self.offsets.len() as u64).serialize(&mut self.write)?;

        let mut prev_offset = 0;
        for (file_addr, offset) in self.offsets {
            VInt(offset - prev_offset).serialize(&mut self.write)?;
            file_addr.serialize(&mut self.write)?;
            prev_offset = offset;
        }

        // A plain `as u32` cast would silently truncate the length and
        // produce a footer that cannot be read back.
        let footer_len = u32::try_from(self.write.written_bytes() - footer_offset).map_err(|_| {
            io::Error::new(
                io::ErrorKind::InvalidData,
                "composite file footer is too large: its length does not fit in a u32",
            )
        })?;
        footer_len.serialize(&mut self.write)?;
        self.write.terminate()
    }
}

/// A composite file is an abstraction to store a
/// file partitioned by field.
///
/// The file needs to be written field by field.
/// A footer describes the start and stop offsets
/// for each field.
#[derive(Clone)]
pub struct CompositeFile {
    /// Payload of the file; `open` strips the footer from it.
    data: FileSlice,
    /// Byte range of every section, keyed by its address.
    offsets_index: HashMap<FileAddr, Range<usize>>,
}

impl std::fmt::Debug for CompositeFile {
    /// Only the offsets index is displayed; the data itself is left out.
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let mut debug_struct = f.debug_struct("CompositeFile");
        debug_struct.field("offsets_index", &self.offsets_index);
        debug_struct.finish()
    }
}

impl CompositeFile {
    /// Opens a composite file stored in a given
    /// `FileSlice`.
    pub fn open(data: &FileSlice) -> io::Result<CompositeFile> {
        let end = data.len();
        let footer_len_data = data.slice_from(end - 4).read_bytes()?;
        let footer_len = u32::deserialize(&mut footer_len_data.as_slice())? as usize;
        let footer_start = end - 4 - footer_len;
        let footer_data = data
            .slice(footer_start..footer_start + footer_len)
            .read_bytes()?;
        let mut footer_buffer = footer_data.as_slice();
        let num_fields = VInt::deserialize(&mut footer_buffer)?.0 as usize;

        let mut file_addrs = vec![];
        let mut offsets = vec![];
        let mut field_index = HashMap::new();

        let mut offset = 0;
        for _ in 0..num_fields {
            offset += VInt::deserialize(&mut footer_buffer)?.0 as usize;
            let file_addr = FileAddr::deserialize(&mut footer_buffer)?;
            offsets.push(offset);
            file_addrs.push(file_addr);
        }
        offsets.push(footer_start);
        for i in 0..num_fields {
            let file_addr = file_addrs[i];
            let start_offset = offsets[i];
            let end_offset = offsets[i + 1];
            field_index.insert(file_addr, start_offset..end_offset);
        }

        Ok(CompositeFile {
            data: data.slice_to(footer_start),
            offsets_index: field_index,
        })
    }

    /// Returns a composite file that stores
    /// no fields.
    pub fn empty() -> CompositeFile {
        CompositeFile {
            offsets_index: HashMap::new(),
            data: FileSlice::empty(),
        }
    }

    /// Returns the `FileSlice` associated with
    /// a given `Field` and stored in a `CompositeFile`.
    pub fn open_read(&self, field: Field) -> Option<FileSlice> {
        self.open_read_with_idx(field, 0)
    }

    /// Returns the `FileSlice` associated with
    /// a given `Field` and stored in a `CompositeFile`.
    pub fn open_read_with_idx(&self, field: Field, idx: usize) -> Option<FileSlice> {
        self.offsets_index
            .get(&FileAddr { field, idx })
            .map(|byte_range| self.data.slice(byte_range.clone()))
    }

    /// Returns the space usage per field in this composite file.
    pub fn space_usage(&self, schema: &Schema) -> PerFieldSpaceUsage {
        let mut fields = Vec::new();
        for (&field_addr, byte_range) in &self.offsets_index {
            let field_name = schema.get_field_name(field_addr.field).to_string();
            let mut field_usage = FieldUsage::empty(field_name);
            field_usage.add_field_idx(field_addr.idx, byte_range.len().into());
            fields.push(field_usage);
        }
        PerFieldSpaceUsage::new(fields)
    }
}

#[cfg(test)]
mod test {

    use std::io::Write;
    use std::path::Path;

    use common::{BinarySerializable, VInt};

    use super::{CompositeFile, CompositeWrite};
    use crate::directory::{Directory, RamDirectory};
    use crate::schema::Field;

    /// Writes one `VInt` for each of two fields and checks that each
    /// section reads back exactly the value that was written.
    #[test]
    fn test_composite_file() -> crate::Result<()> {
        let path = Path::new("test_path");
        let directory = RamDirectory::create();
        {
            let w = directory.open_write(path).unwrap();
            let mut composite_write = CompositeWrite::wrap(w);
            let mut write_0 = composite_write.for_field(Field::from_field_id(0u32));
            VInt(32431123u64).serialize(&mut write_0)?;
            write_0.flush()?;
            let mut write_4 = composite_write.for_field(Field::from_field_id(4u32));
            VInt(2).serialize(&mut write_4)?;
            write_4.flush()?;
            composite_write.close()?;
        }
        {
            let r = directory.open_read(path)?;
            let composite_file = CompositeFile::open(&r)?;
            {
                let file0 = composite_file
                    .open_read(Field::from_field_id(0u32))
                    .unwrap()
                    .read_bytes()?;
                let mut file0_buf = file0.as_slice();
                let payload_0 = VInt::deserialize(&mut file0_buf)?.0;
                // The section must contain the `VInt` and nothing else.
                assert_eq!(file0_buf.len(), 0);
                assert_eq!(payload_0, 32431123u64);
            }
            {
                let file4 = composite_file
                    .open_read(Field::from_field_id(4u32))
                    .unwrap()
                    .read_bytes()?;
                let mut file4_buf = file4.as_slice();
                let payload_4 = VInt::deserialize(&mut file4_buf)?.0;
                assert_eq!(file4_buf.len(), 0);
                assert_eq!(payload_4, 2u64);
            }
        }
        Ok(())
    }

    /// Exercises sections addressed by `(field, idx)`, including an empty
    /// section and fields written in a non-increasing field id order.
    #[test]
    fn test_composite_file_bug() -> crate::Result<()> {
        let path = Path::new("test_path");
        let directory = RamDirectory::create();
        {
            let w = directory.open_write(path).unwrap();
            let mut composite_write = CompositeWrite::wrap(w);
            let mut write = composite_write.for_field_with_idx(Field::from_field_id(1u32), 0);
            VInt(32431123u64).serialize(&mut write)?;
            write.flush()?;
            // Nothing is written in this section: it is expected to be empty.
            let write = composite_write.for_field_with_idx(Field::from_field_id(1u32), 1);
            write.flush()?;

            let mut write = composite_write.for_field_with_idx(Field::from_field_id(0u32), 0);
            VInt(1_000_000).serialize(&mut write)?;
            write.flush()?;

            composite_write.close()?;
        }
        {
            let r = directory.open_read(path)?;
            let composite_file = CompositeFile::open(&r)?;
            {
                let file = composite_file
                    .open_read_with_idx(Field::from_field_id(1u32), 0)
                    .unwrap()
                    .read_bytes()?;
                let mut file0_buf = file.as_slice();
                let payload_0 = VInt::deserialize(&mut file0_buf)?.0;
                assert_eq!(file0_buf.len(), 0);
                assert_eq!(payload_0, 32431123u64);
            }
            {
                let file = composite_file
                    .open_read_with_idx(Field::from_field_id(1u32), 1)
                    .unwrap()
                    .read_bytes()?;
                let file = file.as_slice();
                assert_eq!(file.len(), 0);
            }
            {
                let file = composite_file
                    .open_read_with_idx(Field::from_field_id(0u32), 0)
                    .unwrap()
                    .read_bytes()?;
                let file = file.as_slice();
                // Length in bytes of the serialized `VInt(1_000_000)`.
                assert_eq!(file.len(), 3);
            }
        }
        Ok(())
    }
}


================================================
FILE: src/directory/directory.rs
================================================
use std::io::Write;
use std::path::{Path, PathBuf};
use std::sync::Arc;
use std::time::Duration;
use std::{fmt, io, thread};

use crate::directory::directory_lock::Lock;
use crate::directory::error::{DeleteError, LockError, OpenReadError, OpenWriteError};
use crate::directory::{FileHandle, FileSlice, WatchCallback, WatchHandle, WritePtr};

/// The retry logic used when acquiring locks is pretty simple.
/// We just retry `num_retries` times, waiting `wait_in_ms` milliseconds
/// before each retry. Both values depend on the type of lock.
struct RetryPolicy {
    num_retries: usize,
    wait_in_ms: u64,
}

impl RetryPolicy {
    /// Policy that never retries.
    fn no_retry() -> RetryPolicy {
        let (num_retries, wait_in_ms) = (0, 0);
        RetryPolicy {
            num_retries,
            wait_in_ms,
        }
    }

    /// Consumes one retry, if any is left.
    ///
    /// Returns `false` right away when no retry is left. Otherwise, sleeps
    /// for `wait_in_ms` milliseconds and returns `true`.
    fn wait_and_retry(&mut self) -> bool {
        match self.num_retries.checked_sub(1) {
            None => false,
            Some(remaining_retries) => {
                self.num_retries = remaining_retries;
                thread::sleep(Duration::from_millis(self.wait_in_ms));
                true
            }
        }
    }
}

/// The `DirectoryLock` is an object that represents a file lock.
///
/// It is associated with a lock file, that gets deleted on `Drop`.
// The boxed value is never read: it is only held so that it gets dropped
// together with the `DirectoryLock`, hence the `dead_code` expectation.
#[expect(dead_code)]
pub struct DirectoryLock(Box<dyn Send + Sync + 'static>);

/// Guard that deletes the lock file `path` from `directory` when dropped.
struct DirectoryLockGuard {
    // Directory in which the lock file lives.
    directory: Box<dyn Directory>,
    // Path of the lock file.
    path: PathBuf,
}

impl<T: Send + Sync + 'static> From<Box<T>> for DirectoryLock {
    fn from(underlying: Box<T>) -> Self {
        DirectoryLock(underlying)
    }
}

impl Drop for DirectoryLockGuard {
    /// Deletes the lock file. A failure is logged and otherwise ignored.
    fn drop(&mut self) {
        let deletion = self.directory.delete(&self.path);
        if let Err(e) = deletion {
            error!("Failed to remove the lock file. {e:?}");
        }
    }
}

/// Outcome of a single failed attempt at acquiring a lock.
enum TryAcquireLockError {
    /// The lock file already exists.
    FileExists,
    /// An io error occurred while creating the lock file.
    IoError(Arc<io::Error>),
}

impl From<io::Error> for TryAcquireLockError {
    fn from(source: io::Error) -> Self {
        let shared_error = Arc::new(source);
        TryAcquireLockError::IoError(shared_error)
    }
}

/// Makes a single attempt at acquiring the lock associated with `filepath`.
///
/// The lock is taken by creating the file in `directory`. The returned
/// `DirectoryLock` wraps a guard that deletes the file when dropped.
fn try_acquire_lock(
    filepath: &Path,
    directory: &dyn Directory,
) -> Result<DirectoryLock, TryAcquireLockError> {
    let mut lock_file = match directory.open_write(filepath) {
        Ok(lock_file) => lock_file,
        Err(OpenWriteError::FileAlreadyExists(_)) => {
            return Err(TryAcquireLockError::FileExists);
        }
        Err(OpenWriteError::IoError { io_error, .. }) => {
            return Err(TryAcquireLockError::IoError(io_error));
        }
    };
    // `?` converts the `io::Error` through `From<io::Error>`.
    lock_file.flush()?;
    let guard = DirectoryLockGuard {
        directory: directory.box_clone(),
        path: filepath.to_owned(),
    };
    Ok(DirectoryLock::from(Box::new(guard)))
}

/// Returns the retry policy to apply to a lock.
///
/// A blocking lock is retried up to 100 times, waiting 100 ms before each
/// retry. A non-blocking lock is never retried.
fn retry_policy(is_blocking: bool) -> RetryPolicy {
    if !is_blocking {
        return RetryPolicy::no_retry();
    }
    RetryPolicy {
        num_retries: 100,
        wait_in_ms: 100,
    }
}

/// Write-once read many (WORM) abstraction for where
/// tantivy's data should be stored.
///
/// There are currently two implementations of `Directory`
///
/// - The [`MmapDirectory`][crate::directory::MmapDirectory], this should be your default choice.
/// - The [`RamDirectory`][crate::directory::RamDirectory], which should be used mostly for tests.
pub trait Directory: DirectoryClone + fmt::Debug + Send + Sync + 'static {
    /// Opens a file and returns a boxed `FileHandle`.
    ///
    /// Users of `Directory` should typically call `Directory::open_read(...)`,
    /// while `Directory` implementers should implement `get_file_handle()`.
    fn get_file_handle(&self, path: &Path) -> Result<Arc<dyn FileHandle>, OpenReadError>;

    /// Once a virtual file is open, its data may not
    /// change.
    ///
    /// Specifically, subsequent writes or flushes should
    /// have no effect on the returned [`FileSlice`] object.
    ///
    /// You should only use this to read files created with [`Directory::open_write()`].
    fn open_read(&self, path: &Path) -> Result<FileSlice, OpenReadError> {
        let file_handle = self.get_file_handle(path)?;
        Ok(FileSlice::new(file_handle))
    }

    /// Removes a file
    ///
    /// Removing a file will not affect an eventual
    /// existing [`FileSlice`] pointing to it.
    ///
    /// Removing a nonexistent file returns a
    /// [`DeleteError::FileDoesNotExist`].
    fn delete(&self, path: &Path) -> Result<(), DeleteError>;

    /// Returns true if and only if the file exists
    fn exists(&self, path: &Path) -> Result<bool, OpenReadError>;

    /// Opens a writer for the *virtual file* associated with
    /// a [`Path`].
    ///
    /// Right after this call, for the span of the execution of the program
    /// the file should be created and any subsequent call to
    /// [`Directory::open_read()`] for the same path should return
    /// a [`FileSlice`].
    ///
    /// However, depending on the directory implementation,
    /// it might be required to call [`Directory::sync_directory()`] to ensure
    /// that the file is durably created.
    /// (The semantics here are the same when dealing with
    /// a POSIX filesystem.)
    ///
    /// Write operations may be aggressively buffered.
    /// The client of this trait is responsible for calling flush
    /// to ensure that subsequent `read` operations
    /// will take into account preceding `write` operations.
    ///
    /// Flush operation should also be persistent.
    ///
    /// The user shall not rely on [`Drop`] triggering `flush`.
    /// Note that [`RamDirectory`][crate::directory::RamDirectory] will
    /// panic! if `flush` was not called.
    ///
    /// The file may not previously exist.
    fn open_write(&self, path: &Path) -> Result<WritePtr, OpenWriteError>;

    /// Reads the full content of a file that has been written using
    /// [`Directory::atomic_write()`].
    ///
    /// This should only be used for small files.
    ///
    /// You should only use this to read files created with [`Directory::atomic_write()`].
    fn atomic_read(&self, path: &Path) -> Result<Vec<u8>, OpenReadError>;

    /// Atomically replace the content of a file with data.
    ///
    /// This call ensures that reads can never *observe*
    /// a partially written file.
    ///
    /// The file may or may not previously exist.
    fn atomic_write(&self, path: &Path, data: &[u8]) -> io::Result<()>;

    /// Sync the directory.
    ///
    /// This call is required to ensure that newly created files are
    /// effectively stored durably.
    fn sync_directory(&self) -> io::Result<()>;

    /// Acquire a lock in the directory given in the [`Lock`].
    ///
    /// The method is blocking or not depending on the [`Lock`] object.
    ///
    /// Returns [`LockError::LockBusy`] if the lock file still exists once the
    /// retries allowed for this lock are exhausted, and [`LockError::IoError`]
    /// as soon as an io error is hit.
    fn acquire_lock(&self, lock: &Lock) -> Result<DirectoryLock, LockError> {
        let box_directory = self.box_clone();
        let mut retry_policy = retry_policy(lock.is_blocking);
        loop {
            match try_acquire_lock(&lock.filepath, &*box_directory) {
                Ok(result) => {
                    return Ok(result);
                }
                Err(TryAcquireLockError::FileExists) => {
                    // The lock is held: wait and loop again if retries are left.
                    if !retry_policy.wait_and_retry() {
                        return Err(LockError::LockBusy);
                    }
                }
                Err(TryAcquireLockError::IoError(io_error)) => {
                    // Io errors are never retried.
                    return Err(LockError::IoError(io_error));
                }
            }
        }
    }

    /// Registers a callback that will be called whenever a change on the `meta.json`
    /// using the [`Directory::atomic_write()`] API is detected.
    ///
    /// The behavior when using `.watch()` on a file using [`Directory::open_write()`] is, on the
    /// other hand, undefined.
    ///
    /// The file will be watched for the lifetime of the returned `WatchHandle`. The caller is
    /// required to keep it.
    /// It does not override previous callbacks. When the file is modified, all callbacks that are
    /// registered (and whose [`WatchHandle`] is still alive) are triggered.
    ///
    /// Internally, tantivy only uses this API to detect new commits to implement the
    /// `OnCommitWithDelay` `ReloadPolicy`. Not implementing watch in a `Directory` only prevents
    /// the `OnCommitWithDelay` `ReloadPolicy` from working properly.
    fn watch(&self, watch_callback: WatchCallback) -> crate::Result<WatchHandle>;
}

/// Helper trait making it possible to clone a `Directory`
/// as a boxed trait object.
pub trait DirectoryClone {
    /// Clones the directory and boxes the clone
    fn box_clone(&self) -> Box<dyn Directory>;
}

impl<T> DirectoryClone for T
where T: 'static + Directory + Clone
{
    /// Clones the directory through its `Clone` implementation and boxes the result.
    fn box_clone(&self) -> Box<dyn Directory> {
        let cloned: T = T::clone(self);
        Box::new(cloned)
    }
}

/// Boxed directories are cloned by delegating to `box_clone`.
impl Clone for Box<dyn Directory> {
    fn clone(&self) -> Self {
        self.box_clone()
    }
}

impl<T: Directory + 'static> From<T> for Box<dyn Directory> {
    /// Boxes a concrete directory as a `Directory` trait object.
    fn from(directory: T) -> Self {
        Box::new(directory)
    }
}


================================================
FILE: src/directory/directory_lock.rs
================================================
use std::path::PathBuf;

use once_cell::sync::Lazy;

/// A directory lock.
///
/// A lock is associated with a specific path.
///
/// The lock will be passed to [`Directory::acquire_lock`](crate::Directory::acquire_lock).
///
/// Tantivy itself uses only two locks, but client applications
/// can use the directory facility to define their own locks.
/// - [`INDEX_WRITER_LOCK`]
/// - [`META_LOCK`]
///
/// Check out the documentation of these locks for more information.
#[derive(Debug)]
pub struct Lock {
    /// The lock needs to be associated with its own file `path`.
    /// Depending on the platform, the lock might rely on the creation
    /// and deletion of this filepath.
    pub filepath: PathBuf,
    /// `is_blocking` describes whether acquiring the lock is meant
    /// to be a blocking operation or a non-blocking one.
    ///
    /// Acquiring a blocking lock blocks until the lock is
    /// available.
    ///
    /// Acquiring a non-blocking lock returns rapidly, either successfully
    /// or with an error signifying that someone is already holding
    /// the lock.
    pub is_blocking: bool,
}

/// Only one process should be able to write tantivy's index at a time.
/// This lock file, when present, is in charge of preventing other processes from opening an
/// `IndexWriter`.
///
/// If the process is killed and this file remains, it is safe to remove it manually.
///
/// Failing to acquire this lock usually means a misuse of tantivy's API
/// (creating more than one instance of the `IndexWriter`), or a spurious
/// lock file remaining after a crash. In the latter case, removing the file after
/// checking that no process using tantivy is running is safe.
///
/// This lock is non-blocking.
pub static INDEX_WRITER_LOCK: Lazy<Lock> = Lazy::new(|| Lock {
    filepath: PathBuf::from(".tantivy-writer.lock"),
    is_blocking: false,
});
/// The meta lock file is here to protect the segment files being opened by
/// `IndexReader::reload()` from being garbage collected.
///
/// It makes it possible for another process to safely consume
/// our index in-writing. Ideally, we may have preferred `RWLock` semantics
/// here, but it is difficult to achieve on Windows.
///
/// Opening segment readers is a very fast process.
///
/// This lock is blocking.
pub static META_LOCK: Lazy<Lock> = Lazy::new(|| Lock {
    filepath: PathBuf::from(".tantivy-meta.lock"),
    is_blocking: true,
});


================================================
FILE: src/directory/error.rs
================================================
use std::path::PathBuf;
use std::sync::Arc;
use std::{fmt, io};

use crate::Version;

/// Error while trying to acquire a directory [lock](crate::directory::Lock).
///
/// This is returned from [`Directory::acquire_lock`](crate::Directory::acquire_lock).
#[derive(Debug, Clone, Error)]
pub enum LockError {
    /// Failed to acquire a lock as it is already held by another
    /// client.
    /// - In the context of a blocking lock, this means the lock was not released within some
    ///   `timeout` period.
    /// - In the context of a non-blocking lock, this means the lock was busy at the moment of the
    ///   call.
    #[error("Could not acquire lock as it is already held, possibly by a different process.")]
    LockBusy,
    /// Trying to acquire a lock failed with an `IoError`.
    ///
    /// The `io::Error` is wrapped in an `Arc`.
    #[error("Failed to acquire the lock due to an io:Error.")]
    IoError(Arc<io::Error>),
}

impl LockError {
    /// Wraps an io error.
    pub fn wrap_io_error(io_error: io::Error) -> Self {
        Self::IoError(Arc::new(io_error))
    }
}

/// Error that may occur when opening a directory
#[derive(Debug, Clone, Error)]
pub enum OpenDirectoryError {
    /// The underlying directory does not exist.
    #[error("Directory does not exist: '{0}'.")]
    DoesNotExist(PathBuf),
    /// The path exists but is not a directory.
    #[error("Path exists but is not a directory: '{0}'.")]
    NotADirectory(PathBuf),
    /// Failed to create a temp directory.
    #[error("Failed to create a temporary directory: '{0}'.")]
    FailedToCreateTempDir(Arc<io::Error>),
    /// An io error, along with the path of the directory involved.
    #[error("IoError '{io_error:?}' while create directory in: '{directory_path:?}'.")]
    IoError {
        /// The underlying `io::Error`.
        io_error: Arc<io::Error>,
        /// Path of the directory we tried to open.
        directory_path: PathBuf,
    },
}

impl OpenDirectoryError {
    /// Wraps an io error.
    pub fn wrap_io_error(io_error: io::Error, directory_path: PathBuf) -> Self {
        Self::IoError {
            io_error: Arc::new(io_error),
            directory_path,
        }
    }
}

/// Error that may occur when starting to write in a file
#[derive(Debug, Clone, Error)]
pub enum OpenWriteError {
    /// Our directory is WORM: writing to an existing file is forbidden.
    /// Check out the `Directory` documentation.
    #[error("File already exists: '{0}'")]
    FileAlreadyExists(PathBuf),
    /// Any kind of IO error that happens when
    /// writing in the underlying IO device.
    #[error("IoError '{io_error:?}' while opening file for write: '{filepath}'.")]
    IoError {
        /// The underlying `io::Error`.
        io_error: Arc<io::Error>,
        /// File path of the file that tantivy failed to open for write.
        filepath: PathBuf,
    },
}

impl OpenWriteError {
    /// Wraps an io error.
    pub fn wrap_io_error(io_error: io::Error, filepath: PathBuf) -> Self {
        Self::IoError {
            io_error: Arc::new(io_error),
            filepath,
        }
    }
}
/// Type of index incompatibility between the library and the index found on disk.
///
/// Used to catch this incompatibility and provide a hint on how to solve it.
#[derive(Clone)]
pub enum Incompatibility {
    /// This library cannot decompress the index found on disk
    CompressionMismatch {
        /// Compression algorithm used by the current version of tantivy
        library_compression_format: String,
        /// Compression algorithm that was used to serialise the index
        index_compression_format: String,
    },
    /// The index format found on disk isn't supported by this version of the library
    IndexMismatch {
        /// Version used by the library
        library_version: Version,
        /// Version the index was built with
        index_version: Version,
    },
}

impl fmt::Debug for Incompatibility {
    /// Formats the incompatibility as a description of the mismatch,
    /// followed by an advice on how to solve it.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> Result<(), fmt::Error> {
        let (err, advice) = match self {
            Incompatibility::CompressionMismatch {
                library_compression_format,
                index_compression_format,
            } => (
                format!(
                    "Library was compiled with {library_compression_format:?} compression, index \
                     was compressed with {index_compression_format:?}"
                ),
                format!(
                    "Change the feature flag to {index_compression_format:?} and rebuild the \
                     library"
                ),
            ),
            Incompatibility::IndexMismatch {
                library_version,
                index_version,
            } => (
                format!(
                    "Library version: {}, index version: {}",
                    library_version.index_format_version, index_version.index_format_version
                ),
                // TODO make a more useful error message
                // include the version range that supports this index_format_version
                format!(
                    "Change tantivy to a version compatible with index format {} (e.g. {}.{}.x) \
                     and rebuild your project.",
                    index_version.index_format_version, index_version.major, index_version.minor
                ),
            ),
        };
        write!(f, "{err}. {advice}")
    }
}

/// Error that may occur when opening a file for read
#[derive(Debug, Clone, Error)]
pub enum OpenReadError {
    /// The file does not exist.
    #[error("Files does not exist: {0:?}")]
    FileDoesNotExist(PathBuf),
    /// Any kind of io::Error.
    #[error(
        "IoError: '{io_error:?}' happened while opening the following file for Read: {filepath}."
    )]
    IoError {
        /// The underlying `io::Error`.
        io_error: Arc<io::Error>,
        /// File path of the file that tantivy failed to open for read.
        filepath: PathBuf,
    },
    /// This library does not support the index version found in file footer.
    #[error("Index version unsupported: {0:?}")]
    IncompatibleIndex(Incompatibility),
}

impl OpenReadError {
    /// Wraps an io error.
    pub fn wrap_io_error(io_error: io::Error, filepath: PathBuf) -> Self {
        Self::IoError {
            io_error: Arc::new(io_error),
            filepath,
        }
    }
}
/// Error that may occur when trying to delete a file
#[derive(Debug, Clone, Error)]
pub enum DeleteError {
    /// The file does not exist.
    #[error("File does not exist: '{0}'.")]
    FileDoesNotExist(PathBuf),
    /// Any kind of IO error that happens when
    /// interacting with the underlying IO device.
    #[error("The following IO error happened while deleting file '{filepath}': '{io_error:?}'.")]
    IoError {
        /// The underlying `io::Error`.
        io_error: Arc<io::Error>,
        /// File path of the file that tantivy failed to delete.
        filepath: PathBuf,
    },
}

impl From<Incompatibility> for OpenReadError {
    fn from(incompatibility: Incompatibility) -> Self {
        OpenReadError::IncompatibleIndex(incompatibility)
    }
}


================================================
FILE: src/directory/footer.rs
================================================
//! The footer is a small metadata structure that is appended at the end of every file.
//!
//! The footer is used to store a checksum of the file content.
//! The footer also stores the version of the index format.
//! This version is used to detect incompatibility between the index and the library version.

use std::io;
use std::io::Write;

use common::{BinarySerializable, CountingWriter, DeserializeFrom, FixedSize, HasLen};
use crc32fast::Hasher;
use serde::{Deserialize, Serialize};

use crate::directory::error::Incompatibility;
use crate::directory::{AntiCallToken, FileSlice, TerminatingWrite};
use crate::{Version, INDEX_FORMAT_OLDEST_SUPPORTED_VERSION, INDEX_FORMAT_VERSION};

/// Largest footer length accepted when extracting a footer.
/// A file declaring a longer footer is reported as invalid.
const FOOTER_MAX_LEN: u32 = 50_000;

/// The magic number of the footer, used to identify corruption
/// or an old version of the footer.
const FOOTER_MAGIC_NUMBER: u32 = 1337;

/// Type of the crc32 hash stored in the footer.
type CrcHashU32 = u32;

/// A Footer is appended to every file.
///
/// It is serialized as JSON.
#[derive(Debug, Clone, PartialEq, Serialize, Deserialize)]
pub struct Footer {
    /// The version of the index format
    pub version: Version,
    /// The crc32 hash of the body
    pub crc: CrcHashU32,
}

impl Footer {
    /// Creates a footer holding the given checksum and the version of the library.
    pub(crate) fn new(crc: CrcHashU32) -> Self {
        let version = crate::VERSION.clone();
        Footer { version, crc }
    }

    /// Returns the crc32 hash of the body.
    pub(crate) fn crc(&self) -> CrcHashU32 {
        self.crc
    }

    /// Appends the footer to `write`.
    ///
    /// The layout is: the footer serialized as JSON, the length of that JSON
    /// payload as a `u32`, and finally the footer magic number as a `u32`.
    pub(crate) fn append_footer<W: io::Write>(&self, mut write: &mut W) -> io::Result<()> {
        let mut counting_write = CountingWriter::wrap(&mut write);
        counting_write.write_all(serde_json::to_string(&self)?.as_ref())?;
        let footer_payload_len = counting_write.written_bytes();
        BinarySerializable::serialize(&(footer_payload_len as u32), write)?;
        BinarySerializable::serialize(&FOOTER_MAGIC_NUMBER, write)?;
        Ok(())
    }

    /// Extracts the tantivy Footer from the file and returns the footer and the rest of the file
    ///
    /// # Errors
    ///
    /// Returns an error of kind `UnexpectedEof` if the file is too short to hold
    /// the footer it declares, and an error of kind `InvalidData` if the magic
    /// number does not match or if the declared footer length is too large.
    pub fn extract_footer(file: FileSlice) -> io::Result<(Footer, FileSlice)> {
        // The file ends with two `u32`: the footer length and the magic number.
        // Both are read below, so the file has to be at least that long.
        let footer_metadata_len = <(u32, u32)>::SIZE_IN_BYTES;
        if file.len() < footer_metadata_len {
            return Err(io::Error::new(
                io::ErrorKind::UnexpectedEof,
                format!(
                    "File corrupted. The file is smaller than {footer_metadata_len} bytes \
                     (len={}).",
                    file.len()
                ),
            ));
        }

        let (footer_len, footer_magic_byte): (u32, u32) = file
            .slice_from_end(footer_metadata_len)
            .read_bytes()?
            .as_ref()
            .deserialize()?;

        if footer_magic_byte != FOOTER_MAGIC_NUMBER {
            return Err(io::Error::new(
                io::ErrorKind::InvalidData,
                "Footer magic byte mismatch. File corrupted or index was created using old an \
                 tantivy version which is not supported anymore. Please use tantivy 0.15 or above \
                 to recreate the index.",
            ));
        }

        if footer_len > FOOTER_MAX_LEN {
            return Err(io::Error::new(
                io::ErrorKind::InvalidData,
                format!(
                    "Footer seems invalid as it suggests a footer len of {footer_len}. File is \
                     corrupted, or the index was created with a different & old version of \
                     tantivy."
                ),
            ));
        }
        let total_footer_size = footer_len as usize + footer_metadata_len;
        if file.len() < total_footer_size {
            return Err(io::Error::new(
                io::ErrorKind::UnexpectedEof,
                format!(
                    "File corrupted. The file is smaller than it's footer bytes \
                     (len={total_footer_size})."
                ),
            ));
        }

        // The JSON payload sits right before the footer length and the magic number.
        let footer: Footer =
            serde_json::from_slice(&file.read_bytes_slice(
                file.len() - total_footer_size..file.len() - footer_metadata_len,
            )?)?;

        let body = file.slice_to(file.len() - total_footer_size);
        Ok((footer, body))
    }

    /// Confirms that the index will be read correctly by this version of tantivy.
    ///
    /// Returns an [`Incompatibility::IndexMismatch`] if the index format version
    /// of this footer lies outside of the range supported by the library.
    pub fn is_compatible(&self) -> Result<(), Incompatibility> {
        const SUPPORTED_INDEX_FORMAT_VERSION_RANGE: std::ops::RangeInclusive<u32> =
            INDEX_FORMAT_OLDEST_SUPPORTED_VERSION..=INDEX_FORMAT_VERSION;

        let library_version = crate::version();
        if !SUPPORTED_INDEX_FORMAT_VERSION_RANGE.contains(&self.version.index_format_version) {
            return Err(Incompatibility::IndexMismatch {
                library_version: library_version.clone(),
                index_version: self.version.clone(),
            });
        }
        Ok(())
    }
}

/// Writer that hashes everything written through it and
/// appends a `Footer` holding that hash when terminated.
pub(crate) struct FooterProxy<W: TerminatingWrite> {
    /// always Some except after terminate call
    hasher: Option<Hasher>,
    /// always Some except after terminate call
    writer: Option<W>,
}

impl<W: TerminatingWrite> FooterProxy<W> {
    /// Wraps `writer`, starting from a fresh hasher.
    pub fn new(writer: W) -> Self {
        let hasher = Hasher::new();
        FooterProxy {
            hasher: Some(hasher),
            writer: Some(writer),
        }
    }
}

impl<W: TerminatingWrite> Write for FooterProxy<W> {
    /// Forwards the write to the underlying writer, and feeds the hasher
    /// with the bytes that were actually written.
    fn write(&mut self, buf: &[u8]) -> io::Result<usize> {
        let underlying = self.writer.as_mut().unwrap();
        let num_written = underlying.write(buf)?;
        let hasher = self.hasher.as_mut().unwrap();
        hasher.update(&buf[..num_written]);
        Ok(num_written)
    }

    /// Flushes the underlying writer.
    fn flush(&mut self) -> io::Result<()> {
        let underlying = self.writer.as_mut().unwrap();
        underlying.flush()
    }
}

impl<W: TerminatingWrite> TerminatingWrite for FooterProxy<W> {
    /// Appends a footer holding the checksum of the written bytes,
    /// then terminates the underlying writer.
    fn terminate_ref(&mut self, _: AntiCallToken) -> io::Result<()> {
        let hasher = self.hasher.take().unwrap();
        let footer = Footer::new(hasher.finalize());
        let mut underlying = self.writer.take().unwrap();
        footer.append_footer(&mut underlying)?;
        underlying.terminate()
    }
}

#[cfg(test)]
mod tests {

    use std::io;
    use std::sync::Arc;

    use common::BinarySerializable;

    use crate::directory::footer::{Footer, FOOTER_MAGIC_NUMBER};
    use crate::directory::{FileSlice, OwnedBytes};

    /// A footer that was appended can be extracted back.
    #[test]
    fn test_deserialize_footer() {
        let mut buf: Vec<u8> = vec![];
        let footer = Footer::new(123);
        footer.append_footer(&mut buf).unwrap();
        let owned_bytes = OwnedBytes::new(buf);
        let fileslice = FileSlice::new(Arc::new(owned_bytes));
        let (footer_deser, _body) = Footer::extract_footer(fileslice).unwrap();
        assert_eq!(footer_deser.crc(), footer.crc());
    }
    /// A wrong magic number is reported as an error.
    #[test]
    fn test_deserialize_footer_missing_magic_byte() {
        let mut buf: Vec<u8> = vec![];
        BinarySerializable::serialize(&0_u32, &mut buf).unwrap();
        let wrong_magic_byte: u32 = 5555;
        BinarySerializable::serialize(&wrong_magic_byte, &mut buf).unwrap();

        let owned_bytes = OwnedBytes::new(buf);

        let fileslice = FileSlice::new(Arc::new(owned_bytes));
        let err = Footer::extract_footer(fileslice).unwrap_err();
        assert_eq!(
            err.to_string(),
            "Footer magic byte mismatch. File corrupted or index was created using old an tantivy \
             version which is not supported anymore. Please use tantivy 0.15 or above to recreate \
             the index."
        );
    }
    /// A declared footer length larger than the file is reported as an error.
    #[test]
    fn test_deserialize_footer_wrong_filesize() {
        let mut buf: Vec<u8> = vec![];
        BinarySerializable::serialize(&100_u32, &mut buf).unwrap();
        BinarySerializable::serialize(&FOOTER_MAGIC_NUMBER, &mut buf).unwrap();

        let owned_bytes = OwnedBytes::new(buf);

        let fileslice = FileSlice::new(Arc::new(owned_bytes));
        let err = Footer::extract_footer(fileslice).unwrap_err();
        assert_eq!(err.kind(), io::ErrorKind::UnexpectedEof);
        // 108 = the 100 bytes declared + the 8 bytes of footer length and magic number.
        assert_eq!(
            err.to_string(),
            "File corrupted. The file is smaller than it\'s footer bytes (len=108)."
        );
    }

    /// A declared footer length above `FOOTER_MAX_LEN` is reported as an error.
    #[test]
    fn test_deserialize_too_large_footer() {
        let mut buf: Vec<u8> = vec![];

        let footer_length = super::FOOTER_MAX_LEN + 1;
        BinarySerializable::serialize(&footer_length, &mut buf).unwrap();
        BinarySerializable::serialize(&FOOTER_MAGIC_NUMBER, &mut buf).unwrap();

        let owned_bytes = OwnedBytes::new(buf);

        let fileslice = FileSlice::new(Arc::new(owned_bytes));
        let err = Footer::extract_footer(fileslice).unwrap_err();
        assert_eq!(err.kind(), io::ErrorKind::InvalidData);
        assert_eq!(
            err.to_string(),
            "Footer seems invalid as it suggests a footer len of 50001. File is corrupted, or the \
             index was created with a different & old version of tantivy."
        );
    }
}


================================================
FILE: src/directory/managed_directory.rs
================================================
use std::collections::HashSet;
use std::io::Write;
use std::path::{Path, PathBuf};
use std::sync::{Arc, RwLock, RwLockWriteGuard};
use std::{io, result};

use crc32fast::Hasher;

use crate::core::MANAGED_FILEPATH;
use crate::directory::error::{DeleteError, LockError, OpenReadError, OpenWriteError};
use crate::directory::footer::{Footer, FooterProxy};
use crate::directory::{
    DirectoryLock, FileHandle, FileSlice, GarbageCollectionResult, Lock, WatchCallback,
    WatchHandle, WritePtr, META_LOCK,
};
use crate::error::DataCorruption;
use crate::Directory;

/// Tells whether `path` designates a "managed" file.
///
/// Only managed files are subject to garbage collection. A path whose
/// textual form starts with a "." (typically a lock file) is not managed.
/// A path that cannot be represented as UTF-8 is considered managed.
fn is_managed(path: &Path) -> bool {
    match path.to_str() {
        Some(path_str) => !path_str.starts_with('.'),
        None => true,
    }
}

/// Wrapper of directories that keeps track of files created by Tantivy.
///
/// A managed directory is just a wrapper of a directory
/// that keeps a (persisted) list of the files that
/// have been created (and not deleted) by tantivy so far.
///
/// Thanks to this list, it implements a `garbage_collect` method
/// that removes the files that were created by tantivy and are not
/// useful anymore.
#[derive(Debug)]
pub struct ManagedDirectory {
    /// The wrapped directory, to which file operations are delegated.
    directory: Box<dyn Directory>,
    /// In-memory list of managed files. It sits behind an `Arc`, so clones of
    /// a `ManagedDirectory` share the same list.
    meta_informations: Arc<RwLock<MetaInformation>>,
}

/// State of a `ManagedDirectory` that is guarded by its `RwLock`.
#[derive(Debug, Default)]
struct MetaInformation {
    /// Paths of the files currently registered as managed.
    managed_paths: HashSet<PathBuf>,
}

/// Persists the list of files created by tantivy.
///
/// The managed paths are serialized as JSON, terminated by a newline, and
/// written atomically to `MANAGED_FILEPATH` in `directory`.
///
/// Taking the write guard as argument forces the caller to hold the write
/// lock on the meta information while the list is saved.
fn save_managed_paths(
    directory: &dyn Directory,
    wlock: &RwLockWriteGuard<'_, MetaInformation>,
) -> io::Result<()> {
    let mut serialized = serde_json::to_vec(&wlock.managed_paths)?;
    serialized.write_all(b"\n")?;
    directory.atomic_write(&MANAGED_FILEPATH, serialized.as_slice())
}

impl ManagedDirectory {
    /// Wraps a directory as managed directory.
    ///
    /// The list of managed files is loaded from the managed file
    /// (`MANAGED_FILEPATH`) of `directory`. If that file does not exist,
    /// the list starts empty.
    ///
    /// # Errors
    ///
    /// Returns an error if the managed file cannot be read, or if its content
    /// cannot be deserialized (reported as a data corruption).
    pub fn wrap(directory: Box<dyn Directory>) -> crate::Result<ManagedDirectory> {
        let managed_paths: HashSet<PathBuf> = match directory.atomic_read(&MANAGED_FILEPATH) {
            Ok(data) => {
                let managed_files_json = String::from_utf8_lossy(&data);
                serde_json::from_str::<HashSet<PathBuf>>(&managed_files_json).map_err(|e| {
                    DataCorruption::new(
                        MANAGED_FILEPATH.to_path_buf(),
                        format!("Managed file cannot be deserialized: {e:?}. "),
                    )
                })?
            }
            // No managed file yet: nothing has been registered so far.
            Err(OpenReadError::FileDoesNotExist(_)) => HashSet::new(),
            Err(io_err @ OpenReadError::IoError { .. }) => return Err(io_err.into()),
            Err(OpenReadError::IncompatibleIndex(incompatibility)) => {
                // For the moment, this should never happen: the managed file
                // is read with `atomic_read`, which does not go through any
                // footer, so no incompatibility can be detected.
                return Err(crate::TantivyError::IncompatibleIndex(incompatibility));
            }
        };
        Ok(ManagedDirectory {
            directory,
            meta_informations: Arc::new(RwLock::new(MetaInformation { managed_paths })),
        })
    }

    /// Garbage collect unused files.
    ///
    /// Removes the files that were created by `tantivy` and are not
    /// used by any segment anymore.
    ///
    /// * `get_living_files` - Callback returning the list of files that are still used by the
    ///   index.
    ///
    /// The use of a callback ensures that the list of living files is computed
    /// while we hold the lock on meta.
    ///
    /// If a file cannot be deleted (for permission reasons for instance)
    /// this is not treated as an error: the failure is logged (except on
    /// Windows), the file is reported in `failed_to_delete_files` and it
    /// remains in the list of managed files.
    ///
    /// # Errors
    ///
    /// Returns an error if the meta lock cannot be acquired, or if syncing the
    /// directory or saving the updated list of managed files fails.
    ///
    /// # Panics
    ///
    /// Panics if the lock protecting the list of managed files is poisoned.
    pub fn garbage_collect<L: FnOnce() -> HashSet<PathBuf>>(
        &mut self,
        get_living_files: L,
    ) -> crate::Result<GarbageCollectionResult> {
        info!("Garbage collect");
        let mut files_to_delete = vec![];

        // It is crucial to get the living files after acquiring the
        // read lock of meta information. That way, we
        // avoid the following scenario.
        //
        // 1) we get the list of living files.
        // 2) someone creates a new file.
        // 3) we start garbage collection and remove this file
        // even though it is a living file.
        //
        // The read lock is released at the end of this scope, before the
        // files are deleted and the write lock is taken further below.
        {
            let meta_informations_rlock = self
                .meta_informations
                .read()
                .expect("Managed directory rlock poisoned in garbage collect.");

            // The point of this second "file" lock is to prevent the following scenario
            // 1) process B tries to load a new set of searcher.
            // The list of segments is loaded
            // 2) writer change meta.json (for instance after a merge or a commit)
            // 3) gc kicks in.
            // 4) gc removes a file that was useful for process B, before process B opened it.
            //
            // NOTE(review): the `_meta_lock` guard is dropped at the end of the
            // `Ok` arm, i.e. before the files are actually deleted below —
            // confirm this is intended.
            match self.acquire_lock(&META_LOCK) {
                Ok(_meta_lock) => {
                    let living_files = get_living_files();
                    for managed_path in &meta_informations_rlock.managed_paths {
                        if !living_files.contains(managed_path) {
                            files_to_delete.push(managed_path.clone());
                        }
                    }
                }
                Err(err) => {
                    error!("Failed to acquire lock for GC");
                    return Err(crate::TantivyError::from(err));
                }
            }
        }

        let mut failed_to_delete_files = vec![];
        let mut deleted_files = vec![];

        for file_to_delete in files_to_delete {
            match self.delete(&file_to_delete) {
                Ok(_) => {
                    info!("Deleted {file_to_delete:?}");
                    deleted_files.push(file_to_delete);
                }
                Err(file_error) => {
                    match file_error {
                        // The file is already gone: it is counted as deleted so
                        // that it gets removed from the list of managed files.
                        DeleteError::FileDoesNotExist(_) => {
                            deleted_files.push(file_to_delete.clone());
                        }
                        DeleteError::IoError { .. } => {
                            failed_to_delete_files.push(file_to_delete.clone());
                            if !cfg!(target_os = "windows") {
                                // On windows, delete is expected to fail if the file
                                // is mmapped.
                                error!("Failed to delete {file_to_delete:?}");
                            }
                        }
                    }
                }
            }
        }

        if !deleted_files.is_empty() {
            // update the list of managed files by removing
            // the file that were removed.
            let mut meta_informations_wlock = self
                .meta_informations
                .write()
                .expect("Managed directory wlock poisoned (2).");
            let managed_paths_write = &mut meta_informations_wlock.managed_paths;
            for delete_file in &deleted_files {
                managed_paths_write.remove(delete_file);
            }
            // The directory is synced before the shortened list is persisted.
            self.directory.sync_directory()?;
            save_managed_paths(self.directory.as_mut(), &meta_informations_wlock)?;
        }

        Ok(GarbageCollectionResult {
            deleted_files,
            failed_to_delete_files,
        })
    }

    /// Adds `filepath` to the persisted list of managed files.
    ///
    /// This method must be called before the file is actually created:
    /// that way, a failure happening between the registration and the
    /// creation of the file cannot leave behind a garbage file that
    /// would never get removed.
    ///
    /// Files starting by "." are reserved to locks. They are not managed
    /// and are never subjected to garbage collection, so registering
    /// them is a no-op.
    fn register_file_as_managed(&self, filepath: &Path) -> io::Result<()> {
        if !is_managed(filepath) {
            // Lock files and other "." files are left alone.
            return Ok(());
        }
        let mut meta_wlock = self
            .meta_informations
            .write()
            .expect("Managed file lock poisoned");
        let newly_registered = meta_wlock.managed_paths.insert(filepath.to_owned());
        if !newly_registered {
            // Already in the list: nothing to persist.
            return Ok(());
        }
        save_managed_paths(self.directory.as_ref(), &meta_wlock)?;
        // When this is not the first file we add, `.managed.json` has
        // already been properly created and there is no need to sync its
        // parent directory.
        //
        // (It might seem like a nicer solution to create the managed_json on the
        // creation of the ManagedDirectory instance but it would actually
        // prevent the use of read-only directories..)
        let is_first_managed_file = meta_wlock.managed_paths.len() <= 1;
        if is_first_managed_file {
            self.directory.sync_directory()?;
        }
        Ok(())
    }

    /// Verifies the checksum of a managed file.
    ///
    /// The file is opened through the wrapped directory, its footer is
    /// extracted, and the CRC32 of the remaining bytes is compared with the
    /// CRC recorded in the footer.
    ///
    /// Returns `Ok(true)` if both values match, `Ok(false)` otherwise, and an
    /// `OpenReadError` if the file cannot be opened or read.
    pub fn validate_checksum(&self, path: &Path) -> result::Result<bool, OpenReadError> {
        let file_slice = self.directory.open_read(path)?;
        let (footer, body) = match Footer::extract_footer(file_slice) {
            Ok(footer_and_body) => footer_and_body,
            Err(io_error) => {
                return Err(OpenReadError::wrap_io_error(io_error, path.to_path_buf()));
            }
        };
        let body_bytes = match body.read_bytes() {
            Ok(body_bytes) => body_bytes,
            Err(io_error) => {
                return Err(OpenReadError::IoError {
                    io_error: Arc::new(io_error),
                    filepath: path.to_path_buf(),
                });
            }
        };
        let mut hasher = Hasher::new();
        hasher.update(body_bytes.as_slice());
        let computed_crc = hasher.finalize();
        Ok(footer.crc() == computed_crc)
    }

    /// Returns a copy of the set of all managed files.
    pub fn list_managed_files(&self) -> HashSet<PathBuf> {
        let meta_rlock = self
            .meta_informations
            .read()
            .expect("Managed directory rlock poisoned in list damaged.");
        meta_rlock.managed_paths.clone()
    }
}

impl Directory for ManagedDirectory {
    /// Opens `path` for reading (see `open_read`) and returns it as a file handle.
    fn get_file_handle(&self, path: &Path) -> Result<Arc<dyn FileHandle>, OpenReadError> {
        let handle: Arc<dyn FileHandle> = Arc::new(self.open_read(path)?);
        Ok(handle)
    }

    /// Opens `path` in the wrapped directory, strips its footer, checks that
    /// the footer is compatible, and returns the remaining slice.
    fn open_read(&self, path: &Path) -> result::Result<FileSlice, OpenReadError> {
        let raw_slice = self.directory.open_read(path)?;
        let (footer, body) = match Footer::extract_footer(raw_slice) {
            Ok(footer_and_body) => footer_and_body,
            Err(io_error) => {
                return Err(OpenReadError::wrap_io_error(io_error, path.to_path_buf()));
            }
        };
        footer.is_compatible()?;
        Ok(body)
    }

    /// Registers `path` as managed, then opens it for writing in the wrapped
    /// directory. The returned writer goes through a `FooterProxy`.
    fn open_write(&self, path: &Path) -> result::Result<WritePtr, OpenWriteError> {
        if let Err(io_error) = self.register_file_as_managed(path) {
            return Err(OpenWriteError::wrap_io_error(io_error, path.to_path_buf()));
        }
        let buffered_writer = self.directory.open_write(path)?;
        // The writer was just created, so unwrapping the buffer is not
        // expected to fail.
        let underlying_writer = buffered_writer
            .into_inner()
            .map_err(|_| ())
            .expect("buffer should be empty");
        let footer_writer = FooterProxy::new(underlying_writer);
        Ok(io::BufWriter::new(Box::new(footer_writer)))
    }

    /// Registers `path` as managed, then writes `data` atomically in the
    /// wrapped directory.
    fn atomic_write(&self, path: &Path, data: &[u8]) -> io::Result<()> {
        self.register_file_as_managed(path)?;
        self.directory.atomic_write(path, data)
    }

    /// Delegates to the wrapped directory.
    fn atomic_read(&self, path: &Path) -> result::Result<Vec<u8>, OpenReadError> {
        self.directory.atomic_read(path)
    }

    /// Delegates to the wrapped directory. The list of managed files is not
    /// updated here.
    fn delete(&self, path: &Path) -> result::Result<(), DeleteError> {
        self.directory.delete(path)
    }

    /// Delegates to the wrapped directory.
    fn exists(&self, path: &Path) -> Result<bool, OpenReadError> {
        self.directory.exists(path)
    }

    /// Delegates to the wrapped directory.
    fn acquire_lock(&self, lock: &Lock) -> result::Result<DirectoryLock, LockError> {
        self.directory.acquire_lock(lock)
    }

    /// Delegates to the wrapped directory.
    fn watch(&self, watch_callback: WatchCallback) -> crate::Result<WatchHandle> {
        self.directory.watch(watch_callback)
    }

    /// Delegates to the wrapped directory.
    fn sync_directory(&self) -> io::Result<()> {
        self.directory.sync_directory()
    }
}

impl Clone for ManagedDirectory {
    fn clone(&self) -> ManagedDirectory {
        ManagedDirectory {
            directory: self.directory.box_clone(),
            meta_informations: Arc::clone(&self.meta_informations),
        }
    }
}

// Tests of `ManagedDirectory` on top of a `MmapDirectory` living in a
// temporary directory. Only compiled when the `mmap` feature is enabled.
#[cfg(feature = "mmap")]
#[cfg(test)]
mod tests_mmap_specific {

    use std::collections::HashSet;
    use std::io::Write;
    use std::path::{Path, PathBuf};

    use tempfile::TempDir;

    use crate::directory::{Directory, ManagedDirectory, MmapDirectory, TerminatingWrite};

    /// Garbage collection removes exactly the managed files that are not
    /// living, and the list of managed files survives re-opening the directory.
    #[test]
    fn test_managed_directory() {
        let tempdir = TempDir::new().unwrap();
        let tempdir_path = PathBuf::from(tempdir.path());

        let test_path1: &'static Path = Path::new("some_path_for_test");
        let test_path2: &'static Path = Path::new("some_path_for_test_2");
        {
            // First session: create two files, keep only `test_path1` alive.
            let mmap_directory = MmapDirectory::open(&tempdir_path).unwrap();
            let mut managed_directory = ManagedDirectory::wrap(Box::new(mmap_directory)).unwrap();
            let write_file = managed_directory.open_write(test_path1).unwrap();
            write_file.terminate().unwrap();
            managed_directory
                .atomic_write(test_path2, &[0u8, 1u8])
                .unwrap();
            assert!(managed_directory.exists(test_path1).unwrap());
            assert!(managed_directory.exists(test_path2).unwrap());
            let living_files: HashSet<PathBuf> = [test_path1.to_owned()].iter().cloned().collect();
            assert!(managed_directory.garbage_collect(|| living_files).is_ok());
            assert!(managed_directory.exists(test_path1).unwrap());
            assert!(!managed_directory.exists(test_path2).unwrap());
        }
        {
            // Second session: re-open the same directory. With no living file,
            // `test_path1` must be collected as well, which requires the list
            // of managed files to have been reloaded from disk.
            let mmap_directory = MmapDirectory::open(&tempdir_path).unwrap();
            let mut managed_directory = ManagedDirectory::wrap(Box::new(mmap_directory)).unwrap();
            assert!(managed_directory.exists(test_path1).unwrap());
            assert!(!managed_directory.exists(test_path2).unwrap());
            let living_files: HashSet<PathBuf> = HashSet::new();
            assert!(managed_directory.garbage_collect(|| living_files).is_ok());
            assert!(!managed_directory.exists(test_path1).unwrap());
            assert!(!managed_directory.exists(test_path2).unwrap());
        }
    }

    /// Garbage collection of a file that is still open for reading: the test
    /// expects it to be deleted right away, except on Windows where deletion
    /// is expected to succeed only once the reader has been dropped.
    #[test]
    fn test_managed_directory_gc_while_mmapped() {
        let test_path1: &'static Path = Path::new("some_path_for_test");

        let tempdir = TempDir::new().unwrap();
        let tempdir_path = PathBuf::from(tempdir.path());
        let living_files = HashSet::new();

        let mmap_directory = MmapDirectory::open(tempdir_path).unwrap();
        let mut managed_directory = ManagedDirectory::wrap(Box::new(mmap_directory)).unwrap();
        let mut write = managed_directory.open_write(test_path1).unwrap();
        write.write_all(&[0u8, 1u8]).unwrap();
        write.terminate().unwrap();
        assert!(managed_directory.exists(test_path1).unwrap());

        // Keep a reader alive while the garbage collection runs.
        let _mmap_read = managed_directory.open_read(test_path1).unwrap();
        assert!(managed_directory
            .garbage_collect(|| living_files.clone())
            .is_ok());
        if cfg!(target_os = "windows") {
            // On Windows, gc should try and fail the file as it is mmapped.
            assert!(managed_directory.exists(test_path1).unwrap());
            // unmap should happen here.
            drop(_mmap_read);
            // The file should still be in the list of managed file and
            // eventually be deleted once mmap is released.
            assert!(managed_directory.garbage_collect(|| living_files).is_ok());
        }
        assert!(!managed_directory.exists(test_path1).unwrap());
    }
}


================================================
FILE: src/directory/mmap_directory/file_watcher.rs
================================================
use std::io::BufRead;
use std::path::Path;
use std::sync::atomic::{AtomicUsize, Ordering};
use std::sync::Arc;
use std::time::Duration;
use std::{fs, io, thread};

use crc32fast::Hasher;

use crate::directory::{WatchCallback, WatchCallbackList, WatchHandle};

/// Time the watcher thread sleeps between two checks of the watched file:
/// 1 ms when compiled for tests, 500 ms otherwise.
const POLLING_INTERVAL: Duration = Duration::from_millis(if cfg!(test) { 1 } else { 500 });

/// Watches a file and executes registered callbacks when the file is modified.
///
/// Modifications are detected by a background thread that periodically
/// recomputes a checksum of the file content.
pub struct FileWatcher {
    /// Path of the watched file.
    path: Arc<Path>,
    /// Callbacks that are broadcast to when a modification is detected.
    callbacks: Arc<WatchCallbackList>,
    /// Lifecycle of the polling thread.
    state: Arc<AtomicUsize>, // 0: new, 1: runnable, 2: terminated
}

impl FileWatcher {
    pub fn new(path: &Path) -> FileWatcher {
        FileWatcher {
            path: Arc::from(path),
            callbacks: Default::default(),
            state: Default::default(),
        }
    }

    pub fn spawn(&self) {
        if self
            .state
            .compare_exchange(0, 1, Ordering::SeqCst, Ordering::SeqCst)
            .is_err()
        {
            return;
        }

        let path = self.path.clone();
        let callbacks = self.callbacks.clone();
        let state = self.state.clone();

        thread::Builder::new()
            .name("thread-tantivy-meta-file-watcher".to_string())
            .spawn(move || {
                let mut current_checksum_opt = None;

                while state.load(Ordering::SeqCst) == 1 {
                    if let Ok(checksum) = FileWatcher::compute_checksum(&path) {
                        let metafile_has_changed = current_checksum_opt
                            .map(|current_checksum| current_checksum != checksum)
                            .unwrap_or(true);
                        if metafile_has_changed {
                            info!("Meta file {path:?} was modified");
                            current_checksum_opt = Some(checksum);
                            // We actually ignore callbacks failing here.
                            // We just wait for the end of their execution.
                            let _ = callbacks.broadcast().wait();
                        }
                    }

                    thread::sleep(POLLING_INTERVAL);
                }
            })
            .expect("Failed to spawn meta file watcher thread");
    }

    /// Registers `callback` and makes sure the polling thread is running.
    ///
    /// The callback is subscribed before `spawn` is called. Calling `spawn`
    /// again on an already started watcher is a no-op.
    ///
    /// Returns the handle produced by the subscription.
    pub fn watch(&self, callback: WatchCallback) -> WatchHandle {
        let handle = self.callbacks.subscribe(callback);
        self.spawn();
        handle
    }

    /// Computes the CRC32 checksum of the raw content of the file at `path`.
    ///
    /// The file is hashed byte for byte, so any change of content (including
    /// a change limited to line terminators, or content that is not valid
    /// UTF-8) yields a different input to the hasher.
    ///
    /// # Errors
    ///
    /// Returns the underlying I/O error if the file cannot be opened (a
    /// warning is logged in that case) or read.
    fn compute_checksum(path: &Path) -> Result<u32, io::Error> {
        let mut reader = match fs::File::open(path) {
            Ok(f) => io::BufReader::new(f),
            Err(e) => {
                warn!("Failed to open meta file {path:?}: {e:?}");
                return Err(e);
            }
        };

        let mut hasher = Hasher::new();

        loop {
            let chunk = match reader.fill_buf() {
                Ok(chunk) => chunk,
                // An interrupted read is not a failure: simply retry.
                Err(e) if e.kind() == io::ErrorKind::Interrupted => continue,
                Err(e) => return Err(e),
            };
            if chunk.is_empty() {
                // End of file.
                break;
            }
            hasher.update(chunk);
            let consumed = chunk.len();
            reader.consume(consumed);
        }

        Ok(hasher.finalize())
    }
}

impl Drop for FileWatcher {
    /// Marks the watcher as terminated (state `2`). The polling loop only
    /// keeps running while the state is `1`, so it exits at its next check.
    fn drop(&mut self) {
        self.state.store(2, Ordering::SeqCst);
    }
}

#[cfg(test)]
mod tests {

    use std::mem;

    use super::*;
    use crate::directory::mmap_directory::atomic_write;

    /// Callbacks fire once per content change, and no longer fire once the
    /// watcher has been dropped.
    #[test]
    fn test_file_watcher_drop_watcher() -> crate::Result<()> {
        let tmp_dir = tempfile::TempDir::new()?;
        let tmp_file = tmp_dir.path().join("watched.txt");

        let counter: Arc<AtomicUsize> = Default::default();
        let (tx, rx) = crossbeam_channel::unbounded();
        let timeout = Duration::from_millis(100);

        let watcher = FileWatcher::new(&tmp_file);

        let state = watcher.state.clone();
        assert_eq!(state.load(Ordering::SeqCst), 0);

        let counter_clone = counter.clone();

        // The callback counts its invocations and reports the new count.
        let _handle = watcher.watch(WatchCallback::new(move || {
            let val = counter_clone.fetch_add(1, Ordering::SeqCst);
            tx.send(val + 1).unwrap();
        }));

        assert_eq!(counter.load(Ordering::SeqCst), 0);
        assert_eq!(state.load(Ordering::SeqCst), 1);

        atomic_write(&tmp_file, b"foo")?;
        assert_eq!(rx.recv_timeout(timeout), Ok(1));

        // Rewriting the same content must not trigger the callback.
        atomic_write(&tmp_file, b"foo")?;
        assert!(rx.recv_timeout(timeout).is_err());

        atomic_write(&tmp_file, b"bar")?;
        assert_eq!(rx.recv_timeout(timeout), Ok(2));

        mem::drop(watcher);

        // After the watcher is dropped, further changes go unnoticed.
        atomic_write(&tmp_file, b"qux")?;
        thread::sleep(Duration::from_millis(10));
        assert_eq!(counter.load(Ordering::SeqCst), 2);
        assert_eq!(state.load(Ordering::SeqCst), 2);

        Ok(())
    }

    /// Dropping the watch handle leaves the watcher itself in the
    /// "runnable" state; the counter is checked right after the write.
    #[test]
    fn test_file_watcher_drop_handle() -> crate::Result<()> {
        let tmp_dir = tempfile::TempDir::new()?;
        let tmp_file = tmp_dir.path().join("watched.txt");

        let counter: Arc<AtomicUsize> = Default::default();
        let (tx, rx) = crossbeam_channel::unbounded();
        let timeout = Duration::from_millis(100);

        let watcher = FileWatcher::new(&tmp_file);

        let state = watcher.state.clone();
        assert_eq!(state.load(Ordering::SeqCst), 0);

        let counter_clone = counter.clone();

        let handle = watcher.watch(WatchCallback::new(move || {
            let val = counter_clone.fetch_add(1, Ordering::SeqCst);
            tx.send(val + 1).unwrap();
        }));

        assert_eq!(counter.load(Ordering::SeqCst), 0);
        assert_eq!(state.load(Ordering::SeqCst), 1);

        atomic_write(&tmp_file, b"foo")?;
        assert_eq!(rx.recv_timeout(timeout), Ok(1));

        mem::drop(handle);

        // NOTE(review): the counter is read immediately after the write,
        // without waiting for a polling cycle — confirm this is enough to
        // observe that the dropped callback is not invoked.
        atomic_write(&tmp_file, b"qux")?;
        assert_eq!(counter.load(Ordering::SeqCst), 1);
        assert_eq!(state.load(Ordering::SeqCst), 1);

        Ok(())
    }
}


================================================
FILE: src/directory/mmap_directory/mod.rs
================================================
mod file_watcher;

use std::collections::HashMap;
use std::fmt;
use std::fs::{self, File, OpenOptions};
use std::io::{self, BufWriter, Read, Write};
use std::ops::Deref;
use std::path::{Path, PathBuf};
use std::sync::{Arc, RwLock, Weak};

use common::StableDeref;
use file_watcher::FileWatcher;
use fs4::fs_std::FileExt;
#[cfg(all(feature = "mmap", unix))]
pub use memmap2::Advice;
use memmap2::Mmap;
use serde::{Deserialize, Serialize};
use tempfile::TempDir;

use crate::core::META_FILEPATH;
use crate::directory::error::{
    DeleteError, LockError, OpenDirectoryError, OpenReadError, OpenWriteError,
};
use crate::directory::{
    AntiCallToken, Directory, DirectoryLock, FileHandle, Lock, OwnedBytes, TerminatingWrite,
    WatchCallback, WatchHandle, WritePtr,
};

/// Shared, reference-counted handle to a value that dereferences to a byte slice.
pub type ArcBytes = Arc<dyn Deref<Target = [u8]> + Send + Sync + 'static>;
/// Weak counterpart of [`ArcBytes`]: it does not keep the underlying value alive.
pub type WeakArcBytes = Weak<dyn Deref<Target = [u8]> + Send + Sync + 'static>;

/// Creates an `io::Error` carrying `msg` as its payload.
///
/// The error is built with `io::Error::other`, i.e. it is not tied to any
/// specific error kind.
pub(crate) fn make_io_err(msg: String) -> io::Error {
    io::Error::other(msg)
}

/// Memory-maps the file located at `full_path`.
///
/// Returns `None` iff the file exists, can be read, but is empty (and hence
/// cannot be mmapped).
///
/// # Errors
///
/// Returns `OpenReadError::FileDoesNotExist` if the file is not found, and
/// an I/O error wrapped with the path for any other failure (opening the
/// file, reading its metadata or mapping it).
fn open_mmap(full_path: &Path) -> Result<Option<Mmap>, OpenReadError> {
    let file = match File::open(full_path) {
        Ok(file) => file,
        Err(io_err) if io_err.kind() == io::ErrorKind::NotFound => {
            return Err(OpenReadError::FileDoesNotExist(full_path.to_path_buf()));
        }
        Err(io_err) => {
            return Err(OpenReadError::wrap_io_error(
                io_err,
                full_path.to_path_buf(),
            ));
        }
    };

    let file_len = file
        .metadata()
        .map_err(|io_err| OpenReadError::wrap_io_error(io_err, full_path.to_owned()))?
        .len();
    if file_len == 0 {
        // A file of size 0 cannot be mmapped: report it as `None` instead.
        return Ok(None);
    }

    // NOTE(review): `Mmap::map` is unsafe; presumably this relies on the
    // file not being truncated or rewritten in place while it is mapped —
    // confirm against the memmap2 documentation.
    let mmap_res = unsafe { memmap2::Mmap::map(&file) };
    match mmap_res {
        Ok(mmap) => Ok(Some(mmap)),
        Err(io_err) => Err(OpenReadError::wrap_io_error(
            io_err,
            full_path.to_path_buf(),
        )),
    }
}

/// Hit / miss counters of the mmap cache.
#[derive(Default, Clone, Debug, Serialize, Deserialize)]
pub struct CacheCounters {
    /// Number of times the cache avoided a call to `mmap`.
    pub hit: usize,
    /// Number of times tantivy had to call `mmap`
    /// as no usable entry was in the cache.
    pub miss: usize,
}

/// Snapshot of the state of the mmap cache.
#[derive(Clone, Debug, Serialize, Deserialize)]
pub struct CacheInfo {
    /// Hit / miss counters at the time of the snapshot.
    pub counters: CacheCounters,
    /// Paths that had an entry in the cache at the time of the snapshot.
    pub mmapped: Vec<PathBuf>,
}

/// Cache of the mmaps that were opened, keyed by file path.
struct MmapCache {
    /// Hit / miss statistics.
    counters: CacheCounters,
    /// Weak references to the mmaps: the cache itself does not keep a mmap
    /// alive.
    cache: HashMap<PathBuf, WeakArcBytes>,
    /// Advice applied to every newly opened mmap, if any (unix only).
    #[cfg(unix)]
    madvice_opt: Option<Advice>,
}

impl MmapCache {
    fn new() -> MmapCache {
        MmapCache {
            counters: CacheCounters::default(),
            cache: HashMap::default(),
            #[cfg(unix)]
            madvice_opt: None,
        }
    }

    /// Sets the advice that will be applied to the mmaps opened from now on.
    ///
    /// Entries already present in the cache are not touched.
    #[cfg(unix)]
    fn set_advice(&mut self, madvice: Advice) {
        self.madvice_opt = Some(madvice);
    }

    /// Returns a snapshot of the counters and of the paths that currently
    /// have an entry in the cache.
    fn get_info(&self) -> CacheInfo {
        CacheInfo {
            counters: self.counters.clone(),
            mmapped: self.cache.keys().cloned().collect(),
        }
    }

    fn remove_weak_ref(&mut self) {
        let keys_to_remove: Vec<PathBuf> = self
            .cache
            .iter()
            .filter(|(_, mmap_weakref)| mmap_weakref.upgrade().is_none())
            .map(|(key, _)| key.clone())
            .collect();
        for key in keys_to_remove {
            self.cache.remove(&key);
        }
    }

    /// Opens a mmap for `full_path` and, on unix, applies the configured
    /// advice to it (if any).
    ///
    /// Returns `Ok(None)` when `open_mmap` does, i.e. for an empty file.
    fn open_mmap_impl(&self, full_path: &Path) -> Result<Option<Mmap>, OpenReadError> {
        let mmap_opt = open_mmap(full_path)?;
        #[cfg(unix)]
        if let (Some(mmap), Some(madvice)) = (mmap_opt.as_ref(), self.madvice_opt) {
            // We ignore madvise errors.
            let _ = mmap.advise(madvice);
        }
        Ok(mmap_opt)
    }

    /// Returns the mmap of `full_path`, reusing the cached one when it is
    /// still alive and opening a new one otherwise.
    ///
    /// Returns `None` if the file exists but has a len of 0 (and hence is not
    /// mmappable). Such a file gets no cache entry.
    fn get_mmap(&mut self, full_path: &Path) -> Result<Option<ArcBytes>, OpenReadError> {
        let cached_mmap = self
            .cache
            .get(full_path)
            .and_then(|mmap_weak| mmap_weak.upgrade());
        if let Some(mmap_arc) = cached_mmap {
            self.counters.hit += 1;
            return Ok(Some(mmap_arc));
        }

        // Either there was no entry, or its mmap has been released.
        self.cache.remove(full_path);
        self.counters.miss += 1;

        let Some(mmap) = self.open_mmap_impl(full_path)? else {
            return Ok(None);
        };
        let mmap_arc: ArcBytes = Arc::new(mmap);
        self.cache
            .insert(full_path.to_owned(), Arc::downgrade(&mmap_arc));
        Ok(Some(mmap_arc))
    }
}

/// Directory storing data in files, read via mmap.
///
/// The Mmap objects are cached to limit the
/// system calls.
///
/// In the `MmapDirectory`, locks are implemented using the `fs4` crate definition of locks.
///
/// On MacOS & linux, it relies on `flock` (aka `BSD Lock`). These locks solve most of the
/// problems related to POSIX Locks, but their contract may not be respected on `NFS`
/// depending on the implementation.
///
/// On Windows the semantics are again different.
///
/// Cloning a `MmapDirectory` is cheap: all clones share the same inner state.
#[derive(Clone)]
pub struct MmapDirectory {
    inner: Arc<MmapDirectoryInner>,
}

/// State shared by all the clones of a `MmapDirectory`.
struct MmapDirectoryInner {
    /// Directory that relative paths are resolved against.
    root_path: PathBuf,
    /// Cache of the mmaps opened so far.
    mmap_cache: RwLock<MmapCache>,
    /// Set when the directory was created from a temporary directory; the
    /// field is only held, never read.
    _temp_directory: Option<TempDir>,
    /// Watcher of the meta file located in `root_path`.
    watcher: FileWatcher,
}

impl MmapDirectoryInner {
    /// Builds the inner state for a directory rooted at `root_path`, with an
    /// empty mmap cache and a watcher on the meta file of that directory.
    fn new(root_path: PathBuf, temp_directory: Option<TempDir>) -> MmapDirectoryInner {
        let meta_file_path = root_path.join(*META_FILEPATH);
        MmapDirectoryInner {
            root_path,
            mmap_cache: RwLock::new(MmapCache::new()),
            _temp_directory: temp_directory,
            watcher: FileWatcher::new(&meta_file_path),
        }
    }

    /// Registers `callback` on the meta file watcher.
    fn watch(&self, callback: WatchCallback) -> WatchHandle {
        let watcher = &self.watcher;
        watcher.watch(callback)
    }
}

impl fmt::Debug for MmapDirectory {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        write!(f, "MmapDirectory({:?})", self.inner.root_path)
    }
}

impl MmapDirectory {
    /// Creates a `MmapDirectory` rooted at `root_path`. `temp_directory`, if
    /// any, is stored alongside the directory state.
    fn new(root_path: PathBuf, temp_directory: Option<TempDir>) -> MmapDirectory {
        MmapDirectory {
            inner: Arc::new(MmapDirectoryInner::new(root_path, temp_directory)),
        }
    }

    /// Creates a new MmapDirectory in a temporary directory.
    ///
    /// This is mostly useful to test the MmapDirectory itself.
    /// For your unit tests, prefer the RamDirectory.
    ///
    /// # Errors
    ///
    /// Returns `OpenDirectoryError::FailedToCreateTempDir` if the temporary
    /// directory cannot be created.
    pub fn create_from_tempdir() -> Result<MmapDirectory, OpenDirectoryError> {
        let tempdir = match TempDir::new() {
            Ok(tempdir) => tempdir,
            Err(io_err) => {
                return Err(OpenDirectoryError::FailedToCreateTempDir(Arc::new(io_err)));
            }
        };
        let root_path = tempdir.path().to_path_buf();
        Ok(MmapDirectory::new(root_path, Some(tempdir)))
    }

    /// Opens a MmapDirectory in a directory, with a given access pattern.
    ///
    /// The advice is recorded in the mmap cache and applied to the mmaps
    /// opened afterwards.
    ///
    /// This is only supported on unix platforms.
    #[cfg(unix)]
    pub fn open_with_madvice(
        directory_path: impl AsRef<Path>,
        madvice: Advice,
    ) -> Result<MmapDirectory, OpenDirectoryError> {
        let dir = Self::open_impl_to_avoid_monomorphization(directory_path.as_ref())?;
        {
            let mut mmap_cache = dir.inner.mmap_cache.write().unwrap();
            mmap_cache.set_advice(madvice);
        }
        Ok(dir)
    }

    /// Opens a MmapDirectory in a directory.
    ///
    /// Returns an error if the `directory_path` does not
    /// exist or if it is not a directory.
    ///
    /// This generic entry point only converts its argument to a `&Path` and
    /// delegates to a non-generic implementation.
    pub fn open(directory_path: impl AsRef<Path>) -> Result<MmapDirectory, OpenDirectoryError> {
        Self::open_impl_to_avoid_monomorphization(directory_path.as_ref())
    }

    /// Non-generic implementation of `open`.
    ///
    /// Checks that `directory_path` exists, canonicalizes it, checks that the
    /// result is a directory, and builds the `MmapDirectory` rooted at the
    /// canonical path.
    ///
    /// # Errors
    ///
    /// * `OpenDirectoryError::DoesNotExist` if the path does not exist.
    /// * `OpenDirectoryError::NotADirectory` if the canonical path is not a directory.
    /// * A wrapped I/O error if canonicalization fails (see the Windows exception below).
    #[inline(never)]
    fn open_impl_to_avoid_monomorphization(
        directory_path: &Path,
    ) -> Result<MmapDirectory, OpenDirectoryError> {
        if !directory_path.exists() {
            return Err(OpenDirectoryError::DoesNotExist(PathBuf::from(
                directory_path,
            )));
        }
        // The closure only returns `Ok` on Windows; on other platforms clippy
        // would suggest `map_err`, hence the lint expectation.
        #[expect(clippy::bind_instead_of_map)]
        let canonical_path: PathBuf = directory_path.canonicalize().or_else(|io_err| {
            let directory_path = directory_path.to_owned();

            #[cfg(windows)]
            {
                // `canonicalize` returns "Incorrect function" (error code 1)
                // for virtual drives (network drives, ramdisk, etc.).
                if io_err.raw_os_error() == Some(1) && directory_path.exists() {
                    // Should call `std::path::absolute` when it is stabilised.
                    return Ok(directory_path);
                }
            }

            Err(OpenDirectoryError::wrap_io_error(io_err, directory_path))
        })?;
        if !canonical_path.is_dir() {
            return Err(OpenDirectoryError::NotADirectory(PathBuf::from(
                directory_path,
            )));
        }
        Ok(MmapDirectory::new(canonical_path, None))
    }

    /// Joins a `relative_path` to the directory `root_path`
    /// to create a proper complete `filepath`.
    ///
    /// The join is done with `Path::join`.
    fn resolve_path(&self, relative_path: &Path) -> PathBuf {
        self.inner.root_path.join(relative_path)
    }

    /// Returns some statistical information
    /// about the Mmap cache.
    ///
    /// The `MmapDirectory` embeds a `MmapCache`
    /// to avoid multiplying the `mmap` system calls.
    ///
    /// Entries whose mmap has been released are purged from the cache before
    /// the snapshot is taken, so the returned paths only list live mmaps.
    ///
    /// # Panics
    ///
    /// Panics if the lock of the mmap cache is poisoned.
    pub fn get_cache_info(&self) -> CacheInfo {
        // A single write guard covers both the purge and the snapshot, so no
        // other thread can modify the cache in between.
        let mut mmap_cache = self
            .inner
            .mmap_cache
            .write()
            .expect("mmap cache lock is poisoned");
        mmap_cache.remove_weak_ref();
        mmap_cache.get_info()
    }
}

/// Guard of a file lock.
///
/// We rely on the `fs4` crate for file locking. On Linux & MacOS this
/// uses BSD locks (`flock`). The lock is actually released when
/// the `File` object is dropped and its associated file descriptor
/// is closed.
struct ReleaseLockFile {
    /// The locked file. It is only held so that it is closed when the guard
    /// is dropped.
    _file: File,
    /// Path of the lock file, used for logging.
    path: PathBuf,
}

impl Drop for ReleaseLockFile {
    /// Only logs the release. No explicit unlock is performed here: the
    /// `_file` field is dropped right after this method returns.
    fn drop(&mut self) {
        debug!("Releasing lock {:?}", self.path);
    }
}

/// A `Write` implementation wrapping a `File`.
///
/// Writes are forwarded to the file as is, and `flush` deliberately does
/// nothing. The file is flushed and synced in `terminate_ref`.
struct SafeFileWriter(File);

impl SafeFileWriter {
    /// Wraps `file`.
    fn new(file: File) -> SafeFileWriter {
        Self(file)
    }
}

impl Write for SafeFileWriter {
    /// Forwards `buf` to the underlying file.
    fn write(&mut self, buf: &[u8]) -> io::Result<usize> {
        let SafeFileWriter(file) = self;
        file.write(buf)
    }

    /// No-op: always succeeds without touching the file.
    fn flush(&mut self) -> io::Result<()> {
        Ok(())
    }
}

impl TerminatingWrite for SafeFileWriter {
    /// Flushes the wrapped file, then calls `sync_data` on it.
    ///
    /// The first failing step is returned as the error.
    fn terminate_ref(&mut self, _: AntiCallToken) -> io::Result<()> {
        let file = &mut self.0;
        file.flush()?;
        file.sync_data()
    }
}

/// Cheaply cloneable, shared handle over anything that dereferences to a
/// byte slice and can be shared across threads.
#[derive(Clone)]
struct MmapArc(Arc<dyn Deref<Target = [u8]> + Send + Sync>);

impl Deref for MmapArc {
    type Target = [u8];

    /// Exposes the bytes of the wrapped object.
    fn deref(&self) -> &[u8] {
        // First `*` goes through the `Arc`, the second one through the inner `Deref`.
        &**self.0
    }
}
// SAFETY: NOTE(review): this assumes the bytes exposed by the wrapped `Deref` object keep a
// stable address when the `MmapArc` (i.e. the `Arc`) is moved or cloned. Confirm that this holds
// for every type that gets stored in a `MmapArc`.
unsafe impl StableDeref for MmapArc {}

/// Writes a file in an atomic manner.
///
/// The content is first written to a temporary file, which is then
/// persisted (renamed) onto `path`.
///
/// # Errors
///
/// Returns an `InvalidInput` error mentioning `path` if it has no parent
/// directory, and forwards any I/O error hit while creating, writing,
/// syncing or persisting the temporary file.
pub(crate) fn atomic_write(path: &Path, content: &[u8]) -> io::Result<()> {
    // We create the temporary file in the same directory as the target file.
    // Indeed the canonical temp directory and the target file might sit in different
    // filesystem, in which case the atomic write may actually not work.
    let parent_path = path.parent().ok_or_else(|| {
        io::Error::new(
            io::ErrorKind::InvalidInput,
            // The message has to be formatted: a plain literal would display `{:?}` verbatim.
            format!("Path {path:?} does not have parent directory."),
        )
    })?;
    let mut tempfile = tempfile::Builder::new().tempfile_in(parent_path)?;
    tempfile.write_all(content)?;
    tempfile.flush()?;
    // Make sure the data reached the disk before the file becomes visible under `path`.
    tempfile.as_file_mut().sync_data()?;
    tempfile.into_temp_path().persist(path)?;
    Ok(())
}

impl Directory for MmapDirectory {
    /// Returns a handle over the content of `path`, going through the mmap cache.
    ///
    /// When the cache yields no mapping for the file, empty bytes are returned.
    fn get_file_handle(&self, path: &Path) -> Result<Arc<dyn FileHandle>, OpenReadError> {
        debug!("Open Read {path:?}");
        let full_path = self.resolve_path(path);

        let mut cache_guard = match self.inner.mmap_cache.write() {
            Ok(guard) => guard,
            Err(_) => {
                let msg =
                    format!("Failed to acquired write lock on mmap cache while reading {path:?}");
                let io_err = make_io_err(msg);
                return Err(OpenReadError::wrap_io_error(io_err, path.to_path_buf()));
            }
        };

        let owned_bytes = match cache_guard.get_mmap(&full_path)? {
            Some(mmap_arc) => OwnedBytes::new(MmapArc(mmap_arc)),
            None => OwnedBytes::empty(),
        };

        Ok(Arc::new(owned_bytes))
    }

    /// Removes the file at `path` (relative to the directory root) from disk.
    ///
    /// A missing file is reported as `DeleteError::FileDoesNotExist`;
    /// any other I/O failure is returned as `DeleteError::IoError`.
    fn delete(&self, path: &Path) -> Result<(), DeleteError> {
        let full_path = self.resolve_path(path);
        match fs::remove_file(full_path) {
            Ok(()) => Ok(()),
            Err(io_err) if io_err.kind() == io::ErrorKind::NotFound => {
                Err(DeleteError::FileDoesNotExist(path.to_owned()))
            }
            Err(io_err) => Err(DeleteError::IoError {
                io_error: Arc::new(io_err),
                filepath: path.to_path_buf(),
            }),
        }
    }

    /// Tells whether `path` exists within the directory.
    ///
    /// I/O errors raised by the existence check are wrapped in an `OpenReadError`.
    fn exists(&self, path: &Path) -> Result<bool, OpenReadError> {
        match self.resolve_path(path).try_exists() {
            Ok(found) => Ok(found),
            Err(io_err) => Err(OpenReadError::wrap_io_error(io_err, path.to_path_buf())),
        }
    }

    /// Creates the file at `path` and returns a buffered writer over it.
    ///
    /// Fails with `OpenWriteError::FileAlreadyExists` if the file is already there.
    fn open_write(&self, path: &Path) -> Result<WritePtr, OpenWriteError> {
        debug!("Open Write {path:?}");
        let full_path = self.resolve_path(path);

        // `create_new` makes the creation fail if the file already exists.
        let mut file = match OpenOptions::new().write(true).create_new(true).open(full_path) {
            Ok(file) => file,
            Err(io_err) if io_err.kind() == io::ErrorKind::AlreadyExists => {
                return Err(OpenWriteError::FileAlreadyExists(path.to_path_buf()));
            }
            Err(io_err) => {
                return Err(OpenWriteError::wrap_io_error(io_err, path.to_path_buf()));
            }
        };

        // making sure the file is created.
        if let Err(io_error) = file.flush() {
            return Err(OpenWriteError::wrap_io_error(io_error, path.to_path_buf()));
        }

        // Note we actually do not sync the parent directory here.
        //
        // A newly created file, may, in some case, be created and even flushed to disk.
        // and then lost...
        //
        // The file will only be durably written after we terminate AND
        // sync_directory() is called.

        Ok(BufWriter::new(Box::new(SafeFileWriter::new(file))))
    }

    /// Reads the whole content of the file at `path`.
    ///
    /// A file that cannot be found is reported as `OpenReadError::FileDoesNotExist`;
    /// other failures to open or read it are wrapped I/O errors.
    fn atomic_read(&self, path: &Path) -> Result<Vec<u8>, OpenReadError> {
        let full_path = self.resolve_path(path);
        let mut file = File::open(full_path).map_err(|io_error| {
            if io_error.kind() == io::ErrorKind::NotFound {
                OpenReadError::FileDoesNotExist(path.to_owned())
            } else {
                OpenReadError::wrap_io_error(io_error, path.to_path_buf())
            }
        })?;
        let mut buffer = Vec::new();
        if let Err(io_error) = file.read_to_end(&mut buffer) {
            return Err(OpenReadError::wrap_io_error(io_error, path.to_path_buf()));
        }
        Ok(buffer)
    }

    /// Atomically writes `content` to `path` (relative to the directory root)
    /// by delegating to the free function `atomic_write`.
    fn atomic_write(&self, path: &Path, content: &[u8]) -> io::Result<()> {
        debug!("Atomic Write {path:?}");
        atomic_write(&self.resolve_path(path), content)
    }

    /// Acquires an exclusive lock on the lock file described by `lock`.
    ///
    /// A blocking lock waits for the lock to become available, while a
    /// non-blocking one returns `LockError::LockBusy` when it cannot be taken.
    fn acquire_lock(&self, lock: &Lock) -> Result<DirectoryLock, LockError> {
        let full_path = self.resolve_path(&lock.filepath);
        // We make sure that the file exists: it is created if missing,
        // and never truncated.
        let mut open_options = OpenOptions::new();
        open_options.write(true).create(true).truncate(false);
        let file: File = open_options
            .open(full_path)
            .map_err(LockError::wrap_io_error)?;
        if lock.is_blocking {
            file.lock_exclusive().map_err(LockError::wrap_io_error)?;
        } else {
            let acquired = file.try_lock_exclusive().map_err(|_| LockError::LockBusy)?;
            if !acquired {
                return Err(LockError::LockBusy);
            }
        }
        // dropping the file handle will release the lock.
        let release_guard = ReleaseLockFile {
            _file: file,
            path: lock.filepath.clone(),
        };
        Ok(DirectoryLock::from(Box::new(release_guard)))
    }

    /// Registers `watch_callback` on the inner directory and returns the
    /// handle of the subscription.
    fn watch(&self, watch_callback: WatchCallback) -> crate::Result<WatchHandle> {
        let watch_handle = self.inner.watch(watch_callback);
        Ok(watch_handle)
    }

    /// Windows flavor of `sync_directory`: does nothing and always succeeds.
    #[cfg(windows)]
    fn sync_directory(&self) -> Result<(), io::Error> {
        // On Windows, it is not necessary to fsync the parent directory to
        // ensure that the directory entry containing the file has also reached
        // disk, and calling sync_data on a handle to directory is a no-op on
        // local disks, but will return an error on virtual drives.
        Ok(())
    }

    /// Non-Windows flavor of `sync_directory`: opens the root directory
    /// read-only and calls `sync_data` on it.
    #[cfg(not(windows))]
    fn sync_directory(&self) -> Result<(), io::Error> {
        // Linux needs read to be set, otherwise returns EINVAL
        // write must not be set, or it fails with EISDIR
        let root_dir = OpenOptions::new()
            .read(true)
            .open(&self.inner.root_path)?;
        root_dir.sync_data()
    }
}

#[cfg(test)]
mod tests {

    // There are more tests in directory/mod.rs
    // The following tests are specific to the MmapDirectory

    use std::time::Duration;

    use common::HasLen;

    use super::*;
    use crate::indexer::LogMergePolicy;
    use crate::schema::{Schema, SchemaBuilder, TEXT};
    use crate::{Index, IndexSettings, IndexWriter, ReloadPolicy};

    /// Opening a directory that does not exist must fail.
    #[test]
    fn test_open_non_existent_path() {
        let open_result = MmapDirectory::open(PathBuf::from("./nowhere"));
        assert!(open_result.is_err());
    }

    /// Reading back a file in which nothing was written yields zero bytes.
    #[test]
    fn test_open_empty() {
        // empty file is actually an edge case because those
        // cannot be mmapped.
        let mmap_directory = MmapDirectory::create_from_tempdir().unwrap();
        let path = PathBuf::from("test");

        let mut writer = mmap_directory.open_write(&path).unwrap();
        writer.flush().unwrap();
        drop(writer);

        let readonlymap = mmap_directory.open_read(&path).unwrap();
        assert_eq!(readonlymap.len(), 0);
    }

    /// Walks the mmap cache through its life cycle and checks the hit/miss
    /// counters and the number of live mappings after every phase.
    #[test]
    fn test_cache() {
        let content = b"abc";

        // here we test if the cache releases
        // mmaps correctly.
        let mmap_directory = MmapDirectory::create_from_tempdir().unwrap();
        let num_paths = 10;
        let paths: Vec<PathBuf> = (0..num_paths)
            .map(|i| PathBuf::from(&*format!("file_{i}")))
            .collect();
        {
            // Create the ten (non-empty) files.
            for path in &paths {
                let mut w = mmap_directory.open_write(path).unwrap();
                w.write_all(content).unwrap();
                w.flush().unwrap();
            }
        }

        // Phase 1: first read of every file. The handles are kept alive in `keep`,
        // so the number of mappings grows by one at each step and every read is a miss.
        let mut keep = vec![];
        for (i, path) in paths.iter().enumerate() {
            keep.push(mmap_directory.open_read(path).unwrap());
            assert_eq!(mmap_directory.get_cache_info().mmapped.len(), i + 1);
        }
        assert_eq!(mmap_directory.get_cache_info().counters.hit, 0);
        assert_eq!(mmap_directory.get_cache_info().counters.miss, 10);
        assert_eq!(mmap_directory.get_cache_info().mmapped.len(), 10);
        // Phase 2: reading again while `keep` is alive only produces hits.
        for path in paths.iter() {
            let _r = mmap_directory.open_read(path).unwrap();
            assert_eq!(mmap_directory.get_cache_info().mmapped.len(), num_paths);
        }
        assert_eq!(mmap_directory.get_cache_info().counters.hit, 10);
        assert_eq!(mmap_directory.get_cache_info().counters.miss, 10);
        assert_eq!(mmap_directory.get_cache_info().mmapped.len(), 10);

        // Phase 3: same as phase 2, ten more hits.
        for path in paths.iter() {
            let _r = mmap_directory.open_read(path).unwrap();
            assert_eq!(mmap_directory.get_cache_info().mmapped.len(), 10);
        }

        assert_eq!(mmap_directory.get_cache_info().counters.hit, 20);
        assert_eq!(mmap_directory.get_cache_info().counters.miss, 10);
        assert_eq!(mmap_directory.get_cache_info().mmapped.len(), 10);
        // Phase 4: once the handles are dropped, each read is a miss again and
        // only the mapping held by `_r` is alive at any time.
        drop(keep);
        for path in paths.iter() {
            let _r = mmap_directory.open_read(path).unwrap();
            assert_eq!(mmap_directory.get_cache_info().mmapped.len(), 1);
        }
        assert_eq!(mmap_directory.get_cache_info().counters.hit, 20);
        assert_eq!(mmap_directory.get_cache_info().counters.miss, 20);
        assert_eq!(mmap_directory.get_cache_info().mmapped.len(), 0);

        // Phase 5: deleting the files does not touch the counters.
        for path in &paths {
            mmap_directory.delete(path).unwrap();
        }
        assert_eq!(mmap_directory.get_cache_info().counters.hit, 20);
        assert_eq!(mmap_directory.get_cache_info().counters.miss, 20);
        assert_eq!(mmap_directory.get_cache_info().mmapped.len(), 0);
        // Phase 6: reading a deleted file fails, and is accounted for as a miss.
        for path in paths.iter() {
            assert!(mmap_directory.open_read(path).is_err());
        }
        assert_eq!(mmap_directory.get_cache_info().counters.hit, 20);
        assert_eq!(mmap_directory.get_cache_info().counters.miss, 30);
        assert_eq!(mmap_directory.get_cache_info().mmapped.len(), 0);
    }

    /// Polls `predicate` until it stops reporting an error (i.e. returns `None`).
    ///
    /// At most 30 attempts are made, 200ms apart. The predicate is then
    /// evaluated one last time and, if it still returns an error message,
    /// the function panics with that message.
    fn assert_eventually<P: Fn() -> Option<String>>(predicate: P) {
        let mut remaining_attempts = 30;
        while remaining_attempts > 0 && predicate().is_some() {
            std::thread::sleep(Duration::from_millis(200));
            remaining_attempts -= 1;
        }
        if let Some(error_msg) = predicate() {
            panic!("{}", error_msg);
        }
    }

    /// Checks that mmaps are released once the segments they belong to
    /// are no longer in use, and that none is left after the index is dropped.
    #[test]
    fn test_mmap_released() {
        let mmap_directory = MmapDirectory::create_from_tempdir().unwrap();
        let mut schema_builder: SchemaBuilder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let schema = schema_builder.build();

        {
            let index =
                Index::create(mmap_directory.clone(), schema, IndexSettings::default()).unwrap();

            let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
            let mut log_merge_policy = LogMergePolicy::default();
            log_merge_policy.set_min_num_segments(3);
            index_writer.set_merge_policy(Box::new(log_merge_policy));
            for _num_commits in 0..10 {
                for _ in 0..10 {
                    index_writer.add_document(doc!(text_field=>"abc")).unwrap();
                }
                index_writer.commit().unwrap();
            }

            let reader = index
                .reader_builder()
                .reload_policy(ReloadPolicy::Manual)
                .try_into()
                .unwrap();

            for _ in 0..4 {
                index_writer.add_document(doc!(text_field=>"abc")).unwrap();
                index_writer.commit().unwrap();
                reader.reload().unwrap();
            }
            index_writer.wait_merging_threads().unwrap();

            reader.reload().unwrap();
            let num_segments = reader.searcher().segment_readers().len();
            assert!(num_segments <= 4);
            // Two components (deletes and temp store) are excluded from the count,
            // hence the `- 2`.
            let num_components_except_deletes_and_tempstore =
                crate::index::SegmentComponent::iterator().len() - 2;
            let max_num_mmapped = num_components_except_deletes_and_tempstore * num_segments;
            assert_eventually(|| {
                let num_mmapped = mmap_directory.get_cache_info().mmapped.len();
                if num_mmapped > max_num_mmapped {
                    Some(format!(
                        "Expected at most {max_num_mmapped} mmapped files, got {num_mmapped}"
                    ))
                } else {
                    None
                }
            });
        }
        // This test failed on CI. The last Mmap is dropped from the merging thread so there might
        // be a race condition indeed.
        assert_eventually(|| {
            let num_mmapped = mmap_directory.get_cache_info().mmapped.len();
            if num_mmapped > 0 {
                Some(format!("Expected no mmapped files, got {num_mmapped}"))
            } else {
                None
            }
        });
    }
}


================================================
FILE: src/directory/mod.rs
================================================
//! WORM (Write Once Read Many) directory abstraction.

#[cfg(feature = "mmap")]
mod mmap_directory;

mod directory;
mod directory_lock;
pub mod footer;
mod managed_directory;
mod ram_directory;
mod watch_event_router;

/// Errors specific to the directory module.
pub mod error;

mod composite_file;

use std::io::BufWriter;
use std::path::PathBuf;

pub use common::file_slice::{FileHandle, FileSlice};
pub use common::{AntiCallToken, OwnedBytes, TerminatingWrite};

pub use self::composite_file::{CompositeFile, CompositeWrite};
pub use self::directory::{Directory, DirectoryClone, DirectoryLock};
pub use self::directory_lock::{Lock, INDEX_WRITER_LOCK, META_LOCK};
pub use self::ram_directory::RamDirectory;
pub use self::watch_event_router::{WatchCallback, WatchCallbackList, WatchHandle};

/// Outcome of the garbage collection.
pub struct GarbageCollectionResult {
    /// List of files that were deleted in this cycle.
    pub deleted_files: Vec<PathBuf>,
    /// List of files that were scheduled to be deleted in this cycle,
    /// but whose deletion did not work. This typically happens on Windows,
    /// as deleting a memory mapped file is forbidden.
    ///
    /// If a searcher is still held, a file cannot be deleted.
    /// This is not considered a bug, the file will simply be deleted
    /// in the next GC.
    pub failed_to_delete_files: Vec<PathBuf>,
}

#[cfg(all(feature = "mmap", unix))]
pub use memmap2::Advice;

pub use self::managed_directory::ManagedDirectory;
#[cfg(feature = "mmap")]
pub use self::mmap_directory::MmapDirectory;

/// Write object for Directory.
///
/// A `WritePtr` is a [`BufWriter`] wrapping a boxed [`TerminatingWrite`]
/// that is also `Send + Sync`.
///
/// NOTE(review): this documentation used to state that `Seek` was required
/// too; the alias itself carries no `Seek` bound.
pub type WritePtr = BufWriter<Box<dyn TerminatingWrite + Send + Sync>>;

#[cfg(test)]
mod tests;


================================================
FILE: src/directory/ram_directory.rs
================================================
use std::collections::HashMap;
use std::io::{self, BufWriter, Cursor, Write};
use std::path::{Path, PathBuf};
use std::sync::{Arc, RwLock};
use std::{fmt, result};

use common::HasLen;

use super::FileHandle;
use crate::core::META_FILEPATH;
use crate::directory::error::{DeleteError, OpenReadError, OpenWriteError};
use crate::directory::{
    AntiCallToken, Directory, FileSlice, TerminatingWrite, WatchCallback, WatchCallbackList,
    WatchHandle, WritePtr,
};

/// Writer associated with the [`RamDirectory`].
///
/// Written bytes are accumulated in an in-memory buffer, which is copied
/// into the shared directory whenever the writer is flushed.
struct VecWriter {
    path: PathBuf,
    shared_directory: RamDirectory,
    data: Cursor<Vec<u8>>,
    is_flushed: bool,
}

impl VecWriter {
    /// Creates a writer for `path_buf` with an empty buffer.
    ///
    /// A fresh writer counts as flushed, since nothing is pending yet.
    fn new(path_buf: PathBuf, shared_directory: RamDirectory) -> VecWriter {
        let data = Cursor::new(Vec::new());
        Self {
            path: path_buf,
            shared_directory,
            data,
            is_flushed: true,
        }
    }
}

impl Drop for VecWriter {
    /// Logs a warning if the writer is dropped while some written data
    /// has not been flushed.
    fn drop(&mut self) {
        if self.is_flushed {
            return;
        }
        warn!(
            "You forgot to flush {:?} before its writer got Drop. Do not rely on drop. This \
             also occurs when the indexer crashed, so you may want to check the logs for the \
             root cause.",
            self.path
        );
    }
}

impl Write for VecWriter {
    /// Appends `buf` to the in-memory buffer and marks the writer as dirty.
    fn write(&mut self, buf: &[u8]) -> io::Result<usize> {
        self.is_flushed = false;
        self.data.write_all(buf).map(|()| buf.len())
    }

    /// Publishes a copy of everything written so far into the shared
    /// directory, under the writer's path.
    fn flush(&mut self) -> io::Result<()> {
        self.is_flushed = true;
        let written_so_far: &[u8] = self.data.get_ref();
        self.shared_directory
            .fs
            .write()
            .unwrap()
            .write(self.path.clone(), written_so_far);
        Ok(())
    }
}

impl TerminatingWrite for VecWriter {
    /// Terminating the writer is the same as flushing it.
    fn terminate_ref(&mut self, _: AntiCallToken) -> io::Result<()> {
        Write::flush(self)
    }
}

/// State shared by all the clones of a `RamDirectory`:
/// the files, keyed by path, and the list of watch callbacks.
#[derive(Default)]
struct InnerDirectory {
    fs: HashMap<PathBuf, FileSlice>,
    watch_router: WatchCallbackList,
}

impl InnerDirectory {
    /// Stores a copy of `data` under `path`.
    ///
    /// Returns `true` if a file was already stored under that path.
    fn write(&mut self, path: PathBuf, data: &[u8]) -> bool {
        let previous = self.fs.insert(path, FileSlice::from(data.to_vec()));
        previous.is_some()
    }

    /// Returns a clone of the file slice stored under `path`.
    fn open_read(&self, path: &Path) -> Result<FileSlice, OpenReadError> {
        match self.fs.get(path) {
            Some(file_slice) => Ok(file_slice.clone()),
            None => Err(OpenReadError::FileDoesNotExist(PathBuf::from(path))),
        }
    }

    /// Removes the file stored under `path`, failing if there is none.
    fn delete(&mut self, path: &Path) -> result::Result<(), DeleteError> {
        if self.fs.remove(path).is_some() {
            Ok(())
        } else {
            Err(DeleteError::FileDoesNotExist(PathBuf::from(path)))
        }
    }

    /// Tells whether a file is stored under `path`.
    fn exists(&self, path: &Path) -> bool {
        let files = &self.fs;
        files.contains_key(path)
    }

    /// Subscribes `watch_handle` to the watch router.
    fn watch(&mut self, watch_handle: WatchCallback) -> WatchHandle {
        let router = &self.watch_router;
        router.subscribe(watch_handle)
    }

    /// Sums the lengths of all the stored files.
    fn total_mem_usage(&self) -> usize {
        self.fs.values().fold(0, |total, file| total + file.len())
    }
}

impl fmt::Debug for RamDirectory {
    /// Prints the type name only; the files are not listed.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        f.write_str("RamDirectory")
    }
}

/// A Directory storing everything in anonymous memory.
///
/// It is mainly meant for unit testing.
/// Writes are only made visible upon flushing.
#[derive(Clone, Default)]
pub struct RamDirectory {
    fs: Arc<RwLock<InnerDirectory>>,
}

impl RamDirectory {
    /// Creates an empty [`RamDirectory`].
    pub fn create() -> RamDirectory {
        Self::default()
    }

    /// Deep clones the directory.
    ///
    /// Subsequent writes on one of the copies
    /// will not affect the other copy.
    /// Watch callbacks are not carried over to the clone.
    pub fn deep_clone(&self) -> RamDirectory {
        let inner_clone = InnerDirectory {
            fs: self.fs.read().unwrap().fs.clone(),
            watch_router: Default::default(),
        };
        RamDirectory {
            fs: Arc::new(RwLock::new(inner_clone)),
        }
    }

    /// Returns the sum of the size of the different files
    /// in the [`RamDirectory`].
    pub fn total_mem_usage(&self) -> usize {
        self.fs.read().unwrap().total_mem_usage()
    }

    /// Write a copy of all of the files saved in the [`RamDirectory`] in the target [`Directory`].
    ///
    /// Files are all written using the [`Directory::open_write()`] method, even if they were
    /// written using the [`Directory::atomic_write()`] api.
    ///
    /// If an error is encountered, files may be persisted partially.
    pub fn persist(&self, dest: &dyn Directory) -> crate::Result<()> {
        // The files are only read here, so a shared lock is sufficient: it
        // keeps writers out without blocking the other readers.
        let inner = self.fs.read().unwrap();
        for (path, file) in &inner.fs {
            let mut dest_wrt = dest.open_write(path)?;
            dest_wrt.write_all(file.read_bytes()?.as_slice())?;
            dest_wrt.terminate()?;
        }
        Ok(())
    }
}

impl Directory for RamDirectory {
    /// Returns the file slice stored under `path`, as a file handle.
    fn get_file_handle(&self, path: &Path) -> Result<Arc<dyn FileHandle>, OpenReadError> {
        self.open_read(path)
            .map(|file_slice| Arc::new(file_slice) as Arc<dyn FileHandle>)
    }

    /// Returns the file slice stored under `path`, under a read lock.
    fn open_read(&self, path: &Path) -> result::Result<FileSlice, OpenReadError> {
        let inner = self.fs.read().unwrap();
        inner.open_read(path)
    }

    /// Removes the file stored under `path`.
    ///
    /// The `RamDirectory::delete` fail point allows tests to simulate an I/O error.
    fn delete(&self, path: &Path) -> result::Result<(), DeleteError> {
        crate::fail_point!("RamDirectory::delete", |_| {
            let io_error = Arc::new(io::Error::from(io::ErrorKind::Other));
            Err(DeleteError::IoError {
                io_error,
                filepath: path.to_path_buf(),
            })
        });
        let mut inner = self.fs.write().unwrap();
        inner.delete(path)
    }

    /// Tells whether a file is stored under `path`.
    ///
    /// A poisoned lock is reported as an `OpenReadError::IoError`.
    fn exists(&self, path: &Path) -> Result<bool, OpenReadError> {
        match self.fs.read() {
            Ok(inner) => Ok(inner.exists(path)),
            Err(poison_err) => Err(OpenReadError::IoError {
                io_error: Arc::new(io::Error::other(poison_err.to_string())),
                filepath: path.to_path_buf(),
            }),
        }
    }

    /// Creates an empty file under `path` and returns a buffered writer for it.
    ///
    /// # Errors
    ///
    /// Returns `OpenWriteError::FileAlreadyExists` if a file is already stored
    /// under `path`. In that case the existing file is left untouched.
    fn open_write(&self, path: &Path) -> Result<WritePtr, OpenWriteError> {
        let mut fs = self.fs.write().unwrap();
        let path_buf = PathBuf::from(path);
        // The check has to come before the write: writing first would replace
        // the content of an existing file by an empty one.
        if fs.exists(path) {
            return Err(OpenWriteError::FileAlreadyExists(path_buf));
        }
        // force the creation of the file to mimic the MMap directory.
        fs.write(path_buf.clone(), &[]);
        let vec_writer = VecWriter::new(path_buf, self.clone());
        Ok(BufWriter::new(Box::new(vec_writer)))
    }

    /// Returns an owned copy of the bytes stored under `path`.
    fn atomic_read(&self, path: &Path) -> Result<Vec<u8>, OpenReadError> {
        let file_slice = self.open_read(path)?;
        match file_slice.read_bytes() {
            Ok(bytes) => Ok(bytes.as_slice().to_owned()),
            Err(io_error) => Err(OpenReadError::IoError {
                io_error: Arc::new(io_error),
                filepath: path.to_path_buf(),
            }),
        }
    }

    /// Stores `data` under `path`, replacing any previous content.
    ///
    /// Writing to the meta file additionally broadcasts to the watch callbacks.
    fn atomic_write(&self, path: &Path, data: &[u8]) -> io::Result<()> {
        {
            let mut inner = self.fs.write().unwrap();
            inner.write(PathBuf::from(path), data);
        }
        let is_meta_file = path == *META_FILEPATH;
        if is_meta_file {
            drop(self.fs.write().unwrap().watch_router.broadcast());
        }
        Ok(())
    }

    /// Registers `watch_callback` and returns the handle of the subscription.
    fn watch(&self, watch_callback: WatchCallback) -> crate::Result<WatchHandle> {
        let mut inner = self.fs.write().unwrap();
        Ok(inner.watch(watch_callback))
    }

    /// No-op: this implementation does nothing and always succeeds.
    fn sync_directory(&self) -> io::Result<()> {
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use std::io::Write;
    use std::path::Path;

    use super::RamDirectory;
    use crate::Directory;

    /// Files written atomically and sequentially must both be copied by `persist`.
    #[test]
    fn test_persist() {
        let path_atomic: &'static Path = Path::new("atomic");
        let path_seq: &'static Path = Path::new("seq");
        let msg_atomic: &'static [u8] = b"atomic is the way";
        let msg_seq: &'static [u8] = b"sequential is the way";

        let directory = RamDirectory::create();
        let atomic_write_res = directory.atomic_write(path_atomic, msg_atomic);
        assert!(atomic_write_res.is_ok());
        let mut wrt = directory.open_write(path_seq).unwrap();
        assert!(wrt.write_all(msg_seq).is_ok());
        assert!(wrt.flush().is_ok());

        let directory_copy = RamDirectory::create();
        let persist_res = directory.persist(&directory_copy);
        assert!(persist_res.is_ok());
        assert_eq!(directory_copy.atomic_read(path_atomic).unwrap(), msg_atomic);
        assert_eq!(directory_copy.atomic_read(path_seq).unwrap(), msg_seq);
    }

    /// A deep clone starts with the same content as the original,
    /// and the two copies then evolve independently.
    #[test]
    fn test_ram_directory_deep_clone() {
        let first_path = Path::new("test");
        let second_path = Path::new("test2");
        let original = RamDirectory::default();
        original.atomic_write(first_path, b"firstwrite").unwrap();

        let cloned = original.deep_clone();
        let content_in_clone = cloned.atomic_read(first_path).unwrap();
        let content_in_original = original.atomic_read(first_path).unwrap();
        assert_eq!(content_in_clone, content_in_original);

        original.atomic_write(first_path, b"original").unwrap();
        cloned.atomic_write(first_path, b"clone").unwrap();
        cloned.atomic_write(second_path, b"clone2").unwrap();
        assert_eq!(original.atomic_read(first_path).unwrap(), b"original");
        assert_eq!(&cloned.atomic_read(first_path).unwrap(), b"clone");
        assert_eq!(&cloned.atomic_read(second_path).unwrap(), b"clone2");
    }
}


================================================
FILE: src/directory/tests.rs
================================================
use std::io::Write;
use std::mem;
use std::path::Path;
use std::sync::atomic::Ordering::SeqCst;
use std::sync::atomic::{AtomicBool, AtomicUsize};
use std::sync::Arc;
use std::time::Duration;

use super::*;

/// Runs the generic directory test-suite against a `MmapDirectory`.
#[cfg(feature = "mmap")]
mod mmap_directory_tests {
    use crate::directory::MmapDirectory;

    type DirectoryImpl = MmapDirectory;

    /// Each test gets its own directory, backed by a temporary directory.
    fn make_directory() -> DirectoryImpl {
        let tempdir_res = MmapDirectory::create_from_tempdir();
        tempdir_res.unwrap()
    }

    #[test]
    fn test_simple() -> crate::Result<()> {
        let dir = make_directory();
        super::test_simple(&dir)
    }

    #[test]
    fn test_write_create_the_file() {
        let dir = make_directory();
        super::test_write_create_the_file(&dir);
    }

    #[test]
    fn test_rewrite_forbidden() -> crate::Result<()> {
        let dir = make_directory();
        super::test_rewrite_forbidden(&dir)
    }

    #[test]
    fn test_directory_delete() -> crate::Result<()> {
        let dir = make_directory();
        super::test_directory_delete(&dir)
    }

    #[test]
    fn test_lock_non_blocking() {
        let dir = make_directory();
        super::test_lock_non_blocking(&dir);
    }

    #[test]
    fn test_lock_blocking() {
        let dir = make_directory();
        super::test_lock_blocking(&dir);
    }

    #[test]
    fn test_watch() {
        let dir = make_directory();
        super::test_watch(&dir);
    }
}

/// Runs the generic directory test-suite against a `RamDirectory`.
mod ram_directory_tests {
    use crate::directory::RamDirectory;

    type DirectoryImpl = RamDirectory;

    /// Each test gets its own empty directory.
    fn make_directory() -> DirectoryImpl {
        DirectoryImpl::default()
    }

    #[test]
    fn test_simple() -> crate::Result<()> {
        let dir = make_directory();
        super::test_simple(&dir)
    }

    #[test]
    fn test_write_create_the_file() {
        let dir = make_directory();
        super::test_write_create_the_file(&dir);
    }

    #[test]
    fn test_rewrite_forbidden() -> crate::Result<()> {
        let dir = make_directory();
        super::test_rewrite_forbidden(&dir)
    }

    #[test]
    fn test_directory_delete() -> crate::Result<()> {
        let dir = make_directory();
        super::test_directory_delete(&dir)
    }

    #[test]
    fn test_lock_non_blocking() {
        let dir = make_directory();
        super::test_lock_non_blocking(&dir);
    }

    #[test]
    fn test_lock_blocking() {
        let dir = make_directory();
        super::test_lock_blocking(&dir);
    }

    #[test]
    fn test_watch() {
        let dir = make_directory();
        super::test_watch(&dir);
    }
}

/// Writes a file in several chunks, reads it back and deletes it.
fn test_simple(directory: &dyn Directory) -> crate::Result<()> {
    let test_path: &'static Path = Path::new("some_path_for_test");
    let mut write_file = directory.open_write(test_path)?;
    // The file exists as soon as it is opened for write.
    assert!(directory.exists(test_path).unwrap());
    let chunks: [&[u8]; 3] = [&[4], &[3], &[7, 3, 5]];
    for chunk in chunks {
        write_file.write_all(chunk)?;
    }
    write_file.flush()?;
    let read_file = directory.open_read(test_path)?.read_bytes()?;
    assert_eq!(read_file.as_slice(), &[4u8, 3u8, 7u8, 3u8, 5u8]);
    mem::drop(read_file);
    let delete_res = directory.delete(test_path);
    assert!(delete_res.is_ok());
    let still_exists = directory.exists(test_path).unwrap();
    assert!(!still_exists);
    Ok(())
}

/// Opening an already existing file for write must fail.
fn test_rewrite_forbidden(directory: &dyn Directory) -> crate::Result<()> {
    let test_path: &'static Path = Path::new("some_path_for_test");
    // The writer is dropped right away, only the creation of the file matters.
    directory.open_write(test_path)?;
    assert!(directory.exists(test_path).unwrap());
    let second_attempt = directory.open_write(test_path);
    assert!(second_attempt.is_err());
    let delete_res = directory.delete(test_path);
    assert!(delete_res.is_ok());
    Ok(())
}

/// A file must exist, and be readable, as soon as it is opened for write.
fn test_write_create_the_file(directory: &dyn Directory) {
    let test_path: &'static Path = Path::new("some_path_for_test");
    assert!(directory.open_read(test_path).is_err());
    // The writer is kept alive until the end of the test.
    let _writer = directory.open_write(test_path).unwrap();
    let exists = directory.exists(test_path).unwrap();
    assert!(exists);
    assert!(directory.open_read(test_path).is_ok());
    assert!(directory.delete(test_path).is_ok());
}

fn test_directory_delete(directory: &dyn Directory) -> crate::Result<()> {
    let test_path: &'static Path = Path::new("some_path_for_test");
    assert!(directory.open_read(test_path).is_err());
    let mut write_file = directory.open_write(test_path)?;
    write_file.write_all(&[1, 2, 3, 4])?;
    write_file.flush()?;
    {
        let read_handle = directory.open_read(test_path)?.read_bytes()?;
        assert_eq!(read_handle.as_slice(), &[1u8, 2u8, 3u8, 4u8]);
        // Mapped files can't be deleted on Windows
        if !cfg!(windows) {
            assert!(directory.delete(test_path).is_ok());
            assert_eq!(read_handle.as_slice(), &[1u8, 2u8, 3u8, 4u8]);
        }
        assert!(directory.delete(Path::new("SomeOtherPath")).is_err());
    }

    if cfg!(windows) {
        assert!(directory.delete(test_path).is_ok());
    }

    assert!(directory.open_read(test_path).is_err());
    assert!(directory.delete(test_path).is_err());
    Ok(())
}

/// The watch callback must fire on every write of `meta.json` for as long
/// as the watch handle is alive, and no longer afterwards.
fn test_watch(directory: &dyn Directory) {
    let timeout = Duration::from_millis(500);
    let (tx, rx) = crossbeam_channel::unbounded();
    let counter: Arc<AtomicUsize> = Arc::new(AtomicUsize::new(0));
    let meta_path = Path::new("meta.json");

    let callback = WatchCallback::new(move || {
        let previous = counter.fetch_add(1, SeqCst);
        tx.send(previous + 1).unwrap();
    });
    let handle = directory.watch(callback).unwrap();

    let writes: [(usize, &[u8]); 2] = [(1, b"foo"), (2, b"bar")];
    for (expected_count, payload) in writes {
        assert!(directory.atomic_write(meta_path, payload).is_ok());
        assert_eq!(rx.recv_timeout(timeout), Ok(expected_count));
    }

    // Once the handle is dropped, writes are not notified anymore.
    mem::drop(handle);

    assert!(directory.atomic_write(meta_path, b"qux").is_ok());
    assert!(rx.recv_timeout(timeout).is_err());
}

/// A non-blocking lock cannot be acquired twice, but can be acquired again
/// once it has been released. Locks on different files are independent.
fn test_lock_non_blocking(directory: &dyn Directory) {
    let try_acquire = |lock_name: &str| {
        directory.acquire_lock(&Lock {
            filepath: PathBuf::from(lock_name),
            is_blocking: false,
        })
    };
    {
        let first_a = try_acquire("a.lock");
        assert!(first_a.is_ok());
        let first_b = try_acquire("b.lock");
        assert!(first_b.is_ok());
        // `a.lock` is still held by `first_a`.
        let second_a = try_acquire("a.lock");
        assert!(second_a.is_err());
    }
    // All the locks above have been released at the end of the block.
    let reacquired_a = try_acquire("a.lock");
    assert!(reacquired_a.is_ok());
}

/// Checks blocking lock acquisition.
///
/// A first lock on `a.lock` is acquired and moved into a helper thread, which only
/// drops it after receiving a signal. A second thread then requests the same lock with
/// `is_blocking: true`; the helper thread is signalled only after that second thread
/// has started.
fn test_lock_blocking(directory: &dyn Directory) {
    let lock_a_res = directory.acquire_lock(&Lock {
        filepath: PathBuf::from("a.lock"),
        is_blocking: true,
    });
    assert!(lock_a_res.is_ok());
    let in_thread = Arc::new(AtomicBool::default());
    let in_thread_clone = in_thread.clone();
    let (sender, receiver) = oneshot::channel();
    std::thread::spawn(move || {
        // `lock_a_res` is moved into this thread, which now owns it.
        in_thread_clone.store(true, SeqCst);
        // Wait for the main thread's signal (or for the sender to be dropped).
        let _just_sync = receiver.recv();
        // explicitly dropping lock_a_res. It would have been sufficient to just force it
        // to be part of the move, but the intent seems clearer that way.
        drop(lock_a_res);
    });
    {
        // A non-blocking call should fail, as the thread is running and holding the lock.
        let lock_a_res = directory.acquire_lock(&Lock {
            filepath: PathBuf::from("a.lock"),
            is_blocking: false,
        });
        assert!(lock_a_res.is_err());
    }
    let directory_clone = directory.box_clone();
    let (sender2, receiver2) = oneshot::channel();
    let join_handle = std::thread::spawn(move || {
        // Tell the main thread that this thread has started.
        assert!(sender2.send(()).is_ok());
        let lock_a_res = directory_clone.acquire_lock(&Lock {
            filepath: PathBuf::from("a.lock"),
            is_blocking: true,
        });
        // By the time the lock is obtained, the first thread must have run.
        assert!(in_thread.load(SeqCst));
        assert!(lock_a_res.is_ok());
    });
    // Only let the first thread release the lock once the second thread is running.
    assert!(receiver2.recv().is_ok());
    assert!(sender.send(()).is_ok());
    assert!(join_handle.join().is_ok());
}


================================================
FILE: src/directory/watch_event_router.rs
================================================
use std::sync::{Arc, RwLock, Weak};

use crate::FutureResult;

/// Cloneable wrapper for callbacks registered when watching files of a `Directory`.
///
/// The closure is stored behind an `Arc`, so all the clones share the same closure.
#[derive(Clone)]
pub struct WatchCallback(Arc<dyn Fn() + Sync + Send>);

impl WatchCallback {
    /// Builds a `WatchCallback` out of a `Fn()` closure.
    pub fn new<F>(op: F) -> Self
    where
        F: Fn() + Sync + Send + 'static,
    {
        Self(Arc::new(op))
    }

    /// Invokes the wrapped closure.
    fn call(&self) {
        (self.0)()
    }
}

/// Helper struct to implement the watch method in `Directory` implementations.
///
/// It registers callbacks (See `.subscribe(...)`) and
/// calls them upon calls to `.broadcast(...)`.
#[derive(Default)]
pub struct WatchCallbackList {
    // Registered callbacks, held as weak references: the list itself does not keep a
    // callback alive.
    router: RwLock<Vec<Weak<WatchCallback>>>,
}

/// Controls how long a directory should watch for a file change.
///
/// After all the clones of `WatchHandle` are dropped, the associated callback will not be
/// called when a file change is detected.
#[must_use = "This `WatchHandle` controls the lifetime of the watch and should therefore be used."]
#[derive(Clone)]
#[expect(dead_code)]
pub struct WatchHandle(Arc<WatchCallback>);

impl WatchHandle {
    /// Wraps the given callback into a `WatchHandle`.
    pub fn new(watch_callback: Arc<WatchCallback>) -> WatchHandle {
        Self(watch_callback)
    }

    /// Returns a watch handle wrapping a callback that does nothing.
    ///
    /// This function is only useful when implementing a readonly directory.
    pub fn empty() -> WatchHandle {
        let noop_callback = WatchCallback::new(|| {});
        Self::new(Arc::new(noop_callback))
    }
}

impl WatchCallbackList {
    /// Subscribes a new callback and returns a handle that controls the lifetime of the callback.
    pub fn subscribe(&self, watch_callback: WatchCallback) -> WatchHandle {
        let watch_callback_arc = Arc::new(watch_callback);
        let watch_callback_weak = Arc::downgrade(&watch_callback_arc);
        self.router.write().unwrap().push(watch_callback_weak);
        WatchHandle::new(watch_callback_arc)
    }

    fn list_callback(&self) -> Vec<WatchCallback> {
        let mut callbacks: Vec<WatchCallback> = vec![];
        let mut router_wlock = self.router.write().unwrap();
        let mut i = 0;
        while i < router_wlock.len() {
            if let Some(watch) = router_wlock[i].upgrade() {
                callbacks.push(watch.as_ref().clone());
                i += 1;
            } else {
                router_wlock.swap_remove(i);
            }
        }
        callbacks
    }

    /// Triggers all callbacks
    pub fn broadcast(&self) -> FutureResult<()> {
        let callbacks = self.list_callback();
        let (result, sender) = FutureResult::create("One of the callback panicked.");
        if callbacks.is_empty() {
            let _ = sender.send(Ok(()));
            return result;
        }
        let spawn_res = std::thread::Builder::new()
            .name("watch-callbacks".to_string())
            .spawn(move || {
                for callback in callbacks {
                    callback.call();
                }
                let _ = sender.send(Ok(()));
            });
        if let Err(err) = spawn_res {
            error!("Failed to spawn thread to call watch callbacks. Cause: {err:?}");
        }
        result
    }
}

#[cfg(test)]
mod tests {
    use std::mem;
    use std::sync::atomic::{AtomicUsize, Ordering};
    use std::sync::Arc;

    use crate::directory::{WatchCallback, WatchCallbackList};

    /// A single subscribed callback is called once per broadcast, and is no longer
    /// called after its handle has been dropped.
    #[test]
    fn test_watch_event_router_simple() {
        let watch_event_router = WatchCallbackList::default();
        let counter: Arc<AtomicUsize> = Default::default();
        let counter_clone = counter.clone();
        let inc_callback = WatchCallback::new(move || {
            counter_clone.fetch_add(1, Ordering::SeqCst);
        });
        // Broadcasting before any subscription must not call anything.
        watch_event_router.broadcast().wait().unwrap();
        assert_eq!(0, counter.load(Ordering::SeqCst));
        let handle_a = watch_event_router.subscribe(inc_callback);
        // Subscribing alone does not trigger the callback.
        assert_eq!(0, counter.load(Ordering::SeqCst));
        watch_event_router.broadcast().wait().unwrap();
        assert_eq!(1, counter.load(Ordering::SeqCst));
        watch_event_router.broadcast().wait().unwrap();
        watch_event_router.broadcast().wait().unwrap();
        watch_event_router.broadcast().wait().unwrap();
        assert_eq!(4, counter.load(Ordering::SeqCst));
        mem::drop(handle_a);
        // The handle is gone: the counter must stay unchanged.
        watch_event_router.broadcast().wait().unwrap();
        assert_eq!(4, counter.load(Ordering::SeqCst));
    }

    /// Two callbacks (incrementing by 1 and by 10) are both called on broadcast, and
    /// each one stops being called when its own handle is dropped.
    #[test]
    fn test_watch_event_router_multiple_callback_same_key() {
        let watch_event_router = WatchCallbackList::default();
        let counter: Arc<AtomicUsize> = Default::default();
        let inc_callback = |inc: usize| {
            let counter_clone = counter.clone();
            WatchCallback::new(move || {
                counter_clone.fetch_add(inc, Ordering::SeqCst);
            })
        };
        let handle_a = watch_event_router.subscribe(inc_callback(1));
        let handle_a2 = watch_event_router.subscribe(inc_callback(10));
        assert_eq!(0, counter.load(Ordering::SeqCst));
        // Two broadcasts, each adding 1 + 10.
        watch_event_router.broadcast().wait().unwrap();
        watch_event_router.broadcast().wait().unwrap();
        assert_eq!(22, counter.load(Ordering::SeqCst));
        mem::drop(handle_a);
        // Only the `+10` callback is left.
        watch_event_router.broadcast().wait().unwrap();
        assert_eq!(32, counter.load(Ordering::SeqCst));
        mem::drop(handle_a2);
        watch_event_router.broadcast().wait().unwrap();
        watch_event_router.broadcast().wait().unwrap();
        assert_eq!(32, counter.load(Ordering::SeqCst));
    }

    /// Same scenario as the simple test, with one broadcast whose result is dropped
    /// without being waited on.
    #[test]
    fn test_watch_event_router_multiple_callback_different_key() {
        let watch_event_router = WatchCallbackList::default();
        let counter: Arc<AtomicUsize> = Default::default();
        let counter_clone = counter.clone();
        let inc_callback = WatchCallback::new(move || {
            counter_clone.fetch_add(1, Ordering::SeqCst);
        });
        let handle_a = watch_event_router.subscribe(inc_callback);
        assert_eq!(0, counter.load(Ordering::SeqCst));
        watch_event_router.broadcast().wait().unwrap();
        watch_event_router.broadcast().wait().unwrap();
        assert_eq!(2, counter.load(Ordering::SeqCst));
        mem::drop(handle_a);
        // The result of this broadcast is dropped without calling `.wait()`.
        drop(watch_event_router.broadcast());
        watch_event_router.broadcast().wait().unwrap();
        assert_eq!(2, counter.load(Ordering::SeqCst));
    }
}


================================================
FILE: src/docset.rs
================================================
use std::borrow::{Borrow, BorrowMut};

use crate::fastfield::AliveBitSet;
use crate::DocId;

/// Sentinel value returned when a [`DocSet`] has been entirely consumed.
///
/// This is not `u32::MAX` as one would have expected, due to the lack of SSE2 instructions
/// to compare `[u32; 4]`. The value is `i32::MAX` instead.
pub const TERMINATED: DocId = i32::MAX as u32;

/// The collect_block method on `SegmentCollector` uses a buffer of this size.
/// Passed results to `collect_block` will not exceed this size and will be
/// exactly this size as long as we can fill the buffer.
///
/// This is also the length of the buffer taken by [`DocSet::fill_buffer`].
pub const COLLECT_BLOCK_BUFFER_LEN: usize = 64;

/// Represents an iterable set of sorted doc ids.
pub trait DocSet: Send {
    /// Goes to the next element.
    ///
    /// The DocId of the next element is returned.
    /// In other words we should always have :
    /// ```compile_fail
    /// let doc = docset.advance();
    /// assert_eq!(doc, docset.doc());
    /// ```
    ///
    /// If we reached the end of the `DocSet`, [`TERMINATED`] should be returned.
    ///
    /// Calling `.advance()` on a terminated `DocSet` should be supported, and [`TERMINATED`] should
    /// be returned.
    fn advance(&mut self) -> DocId;

    /// Advances the `DocSet` forward until reaching the target, or going to the
    /// lowest [`DocId`] greater than the target.
    ///
    /// If the end of the `DocSet` is reached, [`TERMINATED`] is returned.
    ///
    /// Calling `.seek(target)` on a terminated `DocSet` is legal. Implementation
    /// of `DocSet` should support it.
    ///
    /// Calling `seek(TERMINATED)` is also legal and is the normal way to consume a `DocSet`.
    ///
    /// `target` has to be larger or equal to `.doc()` when calling `seek`.
    ///
    /// The default implementation calls `.advance()` repeatedly until the target is
    /// reached or passed.
    fn seek(&mut self, target: DocId) -> DocId {
        let mut doc = self.doc();
        debug_assert!(doc <= target);
        while doc < target {
            doc = self.advance();
        }
        doc
    }

    /// !!!Dragons ahead!!!
    /// In spirit, this is an approximate and dangerous version of `seek`.
    ///
    /// It can leave the DocSet in an `invalid` state and might return a
    /// lower bound of what the result of Seek would have been.
    ///
    ///
    /// More accurately it returns either:
    /// - Found if the target is in the docset. In that case, the DocSet is left in a valid state.
    /// - SeekLowerBound(seek_lower_bound) if the target is not in the docset. In that case, the
    ///   DocSet can be left in an invalid state. The DocSet should then only receive calls to
    ///   `seek_danger(..)` until it returns `Found`, and gets back to a valid state.
    ///
    /// `seek_lower_bound` can be any `DocId` (in the docset or not) as long as it is in
    /// `(target .. seek_result] U {TERMINATED}` where `seek_result` is the first document in the
    /// docset greater than `target`.
    ///
    /// `seek_danger` may return `SeekLowerBound(TERMINATED)`.
    ///
    /// Calling `seek_danger` with TERMINATED as a target is allowed,
    /// and should always return SeekLowerBound(TERMINATED) or anything larger as TERMINATED is
    /// NOT in the DocSet.
    ///
    /// DocSets that already have an efficient `seek` method don't need to implement
    /// `seek_danger`.
    ///
    /// Consecutive calls to seek_danger are guaranteed to have strictly increasing `target`
    /// values.
    fn seek_danger(&mut self, target: DocId) -> SeekDangerResult {
        if target >= TERMINATED {
            debug_assert!(target == TERMINATED);
            // No need to advance.
            return SeekDangerResult::SeekLowerBound(target);
        }

        // The default implementation does not include any
        // `danger zone` behavior.
        //
        // It does not leave the scorer in an invalid state.
        // For this reason, we can safely call `self.doc()`.
        let mut doc = self.doc();
        if doc < target {
            doc = self.seek(target);
        }
        if doc == target {
            SeekDangerResult::Found
        } else {
            SeekDangerResult::SeekLowerBound(doc)
        }
    }

    /// Fills a given mutable buffer with the next doc ids from the
    /// `DocSet`
    ///
    /// If that many `DocId`s are available, the method should
    /// fill the entire buffer and return the length of the buffer.
    ///
    /// If we reach the end of the `DocSet` before filling
    /// it entirely, then the buffer is filled up to this point, and
    /// return value is the number of elements that were filled.
    ///
    /// # Warning
    ///
    /// This method is only here for specific high-performance
    /// use cases that rely on batching. The normal way to
    /// go through the `DocId`'s is to call `.advance()`.
    fn fill_buffer(&mut self, buffer: &mut [DocId; COLLECT_BLOCK_BUFFER_LEN]) -> usize {
        if self.doc() == TERMINATED {
            return 0;
        }
        for (i, buffer_val) in buffer.iter_mut().enumerate() {
            // Record the current doc first, then move on to the next one.
            *buffer_val = self.doc();
            if self.advance() == TERMINATED {
                return i + 1;
            }
        }
        buffer.len()
    }

    /// Returns the current document
    /// Right after creating a new `DocSet`, the docset points to the first document.
    ///
    /// If the `DocSet` is empty, `.doc()` should return [`TERMINATED`].
    fn doc(&self) -> DocId;

    /// Returns a best-effort hint of the
    /// length of the docset.
    fn size_hint(&self) -> u32;

    /// Returns a best-effort hint of the cost to consume the entire docset.
    ///
    /// Consuming means calling advance until [`TERMINATED`] is returned.
    /// The cost should be relative to the cost of driving a Term query,
    /// which would be the number of documents in the DocSet.
    ///
    /// By default this returns `size_hint()`.
    ///
    /// DocSets may have vastly different cost depending on their type,
    /// e.g. an intersection with 10 hits is much cheaper than
    /// a phrase search with 10 hits, since it needs to load positions.
    ///
    /// ### Future Work
    /// We may want to differentiate `DocSet` costs in a more granular way, e.g.
    /// creation_cost, advance_cost, seek_cost, in order to get a good estimation of
    /// what query types to choose.
    fn cost(&self) -> u64 {
        self.size_hint() as u64
    }

    /// Returns the number of matching documents that are alive according to `alive_bitset`.
    /// Calling this method consumes the `DocSet`.
    fn count(&mut self, alive_bitset: &AliveBitSet) -> u32 {
        let mut count = 0u32;
        let mut doc = self.doc();
        while doc != TERMINATED {
            if alive_bitset.is_alive(doc) {
                count += 1u32;
            }
            doc = self.advance();
        }
        count
    }

    /// Returns the count of documents, deleted or not.
    /// Calling this method consumes the `DocSet`.
    ///
    /// Of course, the result is an upper bound of the result
    /// given by `count()`.
    fn count_including_deleted(&mut self) -> u32 {
        let mut count = 0u32;
        let mut doc = self.doc();
        while doc != TERMINATED {
            count += 1u32;
            doc = self.advance();
        }
        count
    }
}

/// Result of a call to [`DocSet::seek_danger`].
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
pub enum SeekDangerResult {
    /// The target was found in the DocSet.
    Found,
    /// The target was not found in the DocSet.
    /// The wrapped `DocId` is a lower bound of the position at which a `seek` would
    /// have ended up: it can be any DocId that is <= the first document
    /// in the docset after the target.
    SeekLowerBound(DocId),
}

impl DocSet for &mut dyn DocSet {
    fn advance(&mut self) -> u32 {
        (**self).advance()
    }

    fn seek(&mut self, target: DocId) -> DocId {
        (**self).seek(target)
    }

    fn seek_danger(&mut self, target: DocId) -> SeekDangerResult {
        (**self).seek_danger(target)
    }

    fn doc(&self) -> u32 {
        (**self).doc()
    }

    fn size_hint(&self) -> u32 {
        (**self).size_hint()
    }

    fn cost(&self) -> u64 {
        (**self).cost()
    }

    fn count(&mut self, alive_bitset: &AliveBitSet) -> u32 {
        (**self).count(alive_bitset)
    }

    fn count_including_deleted(&mut self) -> u32 {
        (**self).count_including_deleted()
    }
}

/// Forwards every `DocSet` method to the boxed `DocSet`.
impl<TDocSet: DocSet + ?Sized> DocSet for Box<TDocSet> {
    fn advance(&mut self) -> DocId {
        BorrowMut::<TDocSet>::borrow_mut(self).advance()
    }

    fn seek(&mut self, target: DocId) -> DocId {
        BorrowMut::<TDocSet>::borrow_mut(self).seek(target)
    }

    fn seek_danger(&mut self, target: DocId) -> SeekDangerResult {
        BorrowMut::<TDocSet>::borrow_mut(self).seek_danger(target)
    }

    fn fill_buffer(&mut self, buffer: &mut [DocId; COLLECT_BLOCK_BUFFER_LEN]) -> usize {
        BorrowMut::<TDocSet>::borrow_mut(self).fill_buffer(buffer)
    }

    fn doc(&self) -> DocId {
        Borrow::<TDocSet>::borrow(self).doc()
    }

    fn size_hint(&self) -> u32 {
        Borrow::<TDocSet>::borrow(self).size_hint()
    }

    fn cost(&self) -> u64 {
        Borrow::<TDocSet>::borrow(self).cost()
    }

    fn count(&mut self, alive_bitset: &AliveBitSet) -> u32 {
        BorrowMut::<TDocSet>::borrow_mut(self).count(alive_bitset)
    }

    fn count_including_deleted(&mut self) -> u32 {
        BorrowMut::<TDocSet>::borrow_mut(self).count_including_deleted()
    }
}


================================================
FILE: src/error.rs
================================================
//! Definition of Tantivy's errors and results.

use std::path::PathBuf;
use std::sync::{Arc, PoisonError};
use std::{fmt, io};

use thiserror::Error;

use crate::aggregation::AggregationError;
use crate::directory::error::{
    Incompatibility, LockError, OpenDirectoryError, OpenReadError, OpenWriteError,
};
use crate::fastfield::FastFieldNotAvailableError;
use crate::schema::document::DeserializeError;
use crate::{query, schema};

/// Represents a `DataCorruption` error.
///
/// When facing data corruption, tantivy actually panics or returns this error.
#[derive(Clone)]
pub struct DataCorruption {
    // File in which the corruption was detected, when relevant.
    filepath: Option<PathBuf>,
    // Free-form description of the corruption.
    comment: String,
}

impl DataCorruption {
    /// Creates a `DataCorruption` Error attached to the file `filepath`.
    pub fn new(filepath: PathBuf, comment: String) -> DataCorruption {
        Self {
            filepath: Some(filepath),
            comment,
        }
    }

    /// Creates a `DataCorruption` Error, when the filepath is irrelevant.
    pub fn comment_only<TStr: ToString>(comment: TStr) -> DataCorruption {
        let comment = comment.to_string();
        Self {
            filepath: None,
            comment,
        }
    }
}

/// Formats the error as `Data corruption (in file `<path>`): <comment>.`, the file
/// part being omitted when no filepath is attached.
impl fmt::Debug for DataCorruption {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> Result<(), fmt::Error> {
        f.write_str("Data corruption")?;
        if let Some(filepath) = self.filepath.as_ref() {
            write!(f, " (in file `{filepath:?}`)")?;
        }
        write!(f, ": {}.", self.comment)
    }
}

/// The library's error enum
#[derive(Debug, Clone, Error)]
pub enum TantivyError {
    /// Error when handling aggregations.
    #[error(transparent)]
    AggregationError(#[from] AggregationError),
    /// Failed to open the directory.
    #[error("Failed to open the directory: '{0:?}'")]
    OpenDirectoryError(#[from] OpenDirectoryError),
    /// Failed to open a file for read.
    #[error("Failed to open file for read: '{0:?}'")]
    OpenReadError(#[from] OpenReadError),
    /// Failed to open a file for write.
    #[error("Failed to open file for write: '{0:?}'")]
    OpenWriteError(#[from] OpenWriteError),
    /// Index already exists in this directory.
    #[error("Index already exists")]
    IndexAlreadyExists,
    /// Failed to acquire file lock.
    #[error("Failed to acquire Lockfile: {0:?}. {1:?}")]
    LockFailure(LockError, Option<String>),
    /// IO Error.
    #[error("An IO error occurred: '{0}'")]
    IoError(Arc<io::Error>),
    /// Data corruption.
    #[error("Data corrupted: '{0:?}'")]
    DataCorruption(DataCorruption),
    /// A thread holding the lock panicked and poisoned the lock.
    #[error("A thread holding the locked panicked and poisoned the lock")]
    Poisoned,
    /// The provided field name does not exist.
    #[error("The field does not exist: '{0}'")]
    FieldNotFound(String),
    /// Invalid argument was passed by the user.
    #[error("An invalid argument was passed: '{0}'")]
    InvalidArgument(String),
    /// An Error occurred in one of the threads.
    #[error("An error occurred in a thread: '{0}'")]
    ErrorInThread(String),
    /// An Error occurred related to opening or creating an index.
    #[error("Missing required index builder argument when open/create index: '{0}'")]
    IndexBuilderMissingArgument(&'static str),
    /// An Error occurred related to the schema.
    #[error("Schema error: '{0}'")]
    SchemaError(String),
    /// System error. (e.g.: We failed spawning a new thread).
    #[error("System error.'{0}'")]
    SystemError(String),
    /// Index incompatible with current version of Tantivy.
    #[error("{0:?}")]
    IncompatibleIndex(Incompatibility),
    /// An internal error occurred. These are internal states that should not be reached.
    /// e.g. a datastructure is incorrectly initialized.
    #[error("Internal error: '{0}'")]
    InternalError(String),
    #[error("Deserialize error: {0}")]
    /// An error occurred while attempting to deserialize a document.
    DeserializeError(DeserializeError),
}

impl From<io::Error> for TantivyError {
    fn from(io_err: io::Error) -> TantivyError {
        TantivyError::IoError(Arc::new(io_err))
    }
}
impl From<DataCorruption> for TantivyError {
    fn from(data_corruption: DataCorruption) -> TantivyError {
        TantivyError::DataCorruption(data_corruption)
    }
}
impl From<FastFieldNotAvailableError> for TantivyError {
    fn from(fastfield_error: FastFieldNotAvailableError) -> TantivyError {
        TantivyError::SchemaError(format!("{fastfield_error}"))
    }
}
impl From<LockError> for TantivyError {
    fn from(lock_error: LockError) -> TantivyError {
        TantivyError::LockFailure(lock_error, None)
    }
}

/// Reports a query parsing error as an `InvalidArgument`.
impl From<query::QueryParserError> for TantivyError {
    fn from(parsing_error: query::QueryParserError) -> Self {
        let message = format!("Query is invalid. {parsing_error:?}");
        Self::InvalidArgument(message)
    }
}

impl<Guard> From<PoisonError<Guard>> for TantivyError {
    fn from(_: PoisonError<Guard>) -> TantivyError {
        TantivyError::Poisoned
    }
}

impl From<time::error::Format> for TantivyError {
    fn from(err: time::error::Format) -> TantivyError {
        TantivyError::InvalidArgument(format!("Date formatting error: {err}"))
    }
}

impl From<time::error::Parse> for TantivyError {
    fn from(err: time::error::Parse) -> TantivyError {
        TantivyError::InvalidArgument(format!("Date parsing error: {err}"))
    }
}

impl From<time::error::ComponentRange> for TantivyError {
    fn from(err: time::error::ComponentRange) -> TantivyError {
        TantivyError::InvalidArgument(format!("Date range error: {err}"))
    }
}

impl From<schema::DocParsingError> for TantivyError {
    fn from(error: schema::DocParsingError) -> TantivyError {
        TantivyError::InvalidArgument(format!("Failed to parse document {error:?}"))
    }
}

impl From<serde_json::Error> for TantivyError {
    fn from(error: serde_json::Error) -> TantivyError {
        TantivyError::IoError(Arc::new(error.into()))
    }
}

impl From<rayon::ThreadPoolBuildError> for TantivyError {
    fn from(error: rayon::ThreadPoolBuildError) -> TantivyError {
        TantivyError::SystemError(error.to_string())
    }
}

impl From<DeserializeError> for TantivyError {
    fn from(error: DeserializeError) -> TantivyError {
        TantivyError::DeserializeError(error)
    }
}


================================================
FILE: src/fastfield/alive_bitset.rs
================================================
use std::io;
use std::io::Write;

use common::{intersect_bitsets, BitSet, ByteCount, OwnedBytes, ReadOnlyBitSet};

use crate::DocId;

/// Serializes an alive `BitSet` into `writer`,
///
/// where `alive_bitset` is the set of alive `DocId`.
/// Warning: this function does not call terminate. The caller is in charge of
/// closing the writer properly.
pub fn write_alive_bitset<T: Write>(alive_bitset: &BitSet, writer: &mut T) -> io::Result<()> {
    alive_bitset.serialize(writer)
}

/// Set of alive `DocId`s.
#[derive(Clone)]
pub struct AliveBitSet {
    // Number of elements of `bitset`, computed once when the `AliveBitSet` is built.
    num_alive_docs: usize,
    // A document is alive if and only if it is contained in this bitset.
    bitset: ReadOnlyBitSet,
}

/// Intersects two AliveBitSets in a new one.
/// The two bitsets need to have the same max_value.
pub fn intersect_alive_bitsets(left: AliveBitSet, right: AliveBitSet) -> AliveBitSet {
    assert_eq!(left.bitset().max_value(), right.bitset().max_value());
    let bitset = intersect_bitsets(left.bitset(), right.bitset());
    let num_alive_docs = bitset.len();
    AliveBitSet {
        num_alive_docs,
        bitset,
    }
}

impl AliveBitSet {
    /// Test helper building the alive bitset of `max_doc` documents, out of which
    /// `deleted_docs` have been deleted.
    ///
    /// Panics if one of the deleted docs is not lower than `max_doc`.
    #[cfg(test)]
    pub(crate) fn for_test_from_deleted_docs(deleted_docs: &[DocId], max_doc: u32) -> AliveBitSet {
        assert!(deleted_docs.iter().all(|&doc| doc < max_doc));
        // Start with all documents alive, then remove the deleted ones.
        let mut alive_docs = BitSet::with_max_value_and_full(max_doc);
        for doc in deleted_docs.iter().copied() {
            alive_docs.remove(doc);
        }
        // Go through the serialized form, which is what `open` takes as an input.
        let mut serialized = Vec::new();
        write_alive_bitset(&alive_docs, &mut serialized).unwrap();
        Self::open(OwnedBytes::new(serialized))
    }

    /// Opens an alive bitset given its file.
    pub fn open(bytes: OwnedBytes) -> AliveBitSet {
        AliveBitSet::from(ReadOnlyBitSet::open(bytes))
    }

    /// Returns true if the document is still "alive". In other words, if it has not been deleted.
    #[inline]
    pub fn is_alive(&self, doc: DocId) -> bool {
        let alive_docs = &self.bitset;
        alive_docs.contains(doc)
    }

    /// Returns true if the document has been marked as deleted.
    #[inline]
    pub fn is_deleted(&self, doc: DocId) -> bool {
        let alive = self.is_alive(doc);
        !alive
    }

    /// Iterate over the alive doc_ids.
    #[inline]
    pub fn iter_alive(&self) -> impl Iterator<Item = DocId> + '_ {
        let alive_docs = &self.bitset;
        alive_docs.iter()
    }

    /// Get underlying bitset.
    #[inline]
    pub fn bitset(&self) -> &ReadOnlyBitSet {
        &self.bitset
    }

    /// The number of alive documents.
    pub fn num_alive_docs(&self) -> usize {
        self.num_alive_docs
    }

    /// Summarize total space usage of this bitset.
    pub fn space_usage(&self) -> ByteCount {
        self.bitset.num_bytes()
    }
}

impl From<ReadOnlyBitSet> for AliveBitSet {
    fn from(bitset: ReadOnlyBitSet) -> AliveBitSet {
        let num_alive_docs = bitset.len();
        AliveBitSet {
            num_alive_docs,
            bitset,
        }
    }
}

#[cfg(test)]
mod tests {

    use super::AliveBitSet;

    /// Without any deleted document, every document is alive.
    #[test]
    fn test_alive_bitset_empty() {
        let alive_bitset = AliveBitSet::for_test_from_deleted_docs(&[], 10);
        assert!((0..10).all(|doc| alive_bitset.is_alive(doc) && !alive_bitset.is_deleted(doc)));
        assert_eq!(alive_bitset.num_alive_docs(), 10);
    }

    /// Only the documents passed as deleted (1 and 9) are reported as deleted.
    #[test]
    fn test_alive_bitset() {
        let alive_bitset = AliveBitSet::for_test_from_deleted_docs(&[1, 9], 10);
        for doc in 0..10u32 {
            let expected_deleted = matches!(doc, 1 | 9);
            assert_eq!(alive_bitset.is_deleted(doc), expected_deleted);
            assert_eq!(alive_bitset.is_alive(doc), !expected_deleted);
        }
        assert_eq!(alive_bitset.num_alive_docs(), 8);
    }

    #[test]
    fn test_alive_bitset_iter_minimal() {
        let alive_bitset = AliveBitSet::for_test_from_deleted_docs(&[7], 8);

        let alive_docs = alive_bitset.iter_alive().collect::<Vec<_>>();
        assert_eq!(alive_docs, vec![0, 1, 2, 3, 4, 5, 6]);
    }

    #[test]
    fn test_alive_bitset_iter_small() {
        let alive_bitset = AliveBitSet::for_test_from_deleted_docs(&[0, 2, 3, 6], 7);

        let alive_docs = alive_bitset.iter_alive().collect::<Vec<_>>();
        assert_eq!(alive_docs, vec![1, 4, 5]);
    }

    #[test]
    fn test_alive_bitset_iter() {
        let alive_bitset = AliveBitSet::for_test_from_deleted_docs(&[0, 1, 1000], 1001);

        let alive_docs = alive_bitset.iter_alive().collect::<Vec<_>>();
        assert_eq!(alive_docs, (2..=999).collect::<Vec<_>>());
    }
}

// Benchmarks, only compiled for tests when the `unstable` feature is enabled.
#[cfg(all(test, feature = "unstable"))]
mod bench {

    use rand::prelude::IteratorRandom;
    use rand::rng;
    use test::Bencher;

    use super::AliveBitSet;

    // Returns the doc ids of `0..1_000_000` that are left after removing one eighth of
    // them at random.
    //
    // Note that the benches below pass the returned ids as *deleted* docs, which
    // leaves about one eighth of the documents alive.
    fn get_alive() -> Vec<u32> {
        let mut data = (0..1_000_000_u32).collect::<Vec<u32>>();
        for _ in 0..1_000_000 / 8 {
            remove_rand(&mut data);
        }
        data
    }

    // Removes one element of `raw`, picked at random. Panics if `raw` is empty.
    fn remove_rand(raw: &mut Vec<u32>) {
        let i = (0..raw.len()).choose(&mut rng()).unwrap();
        raw.remove(i);
    }

    // Iterates over the alive docs when almost all the docs are alive.
    #[bench]
    fn bench_alive_bitset_iter_deser_on_fly(bench: &mut Bencher) {
        let alive_bitset = AliveBitSet::for_test_from_deleted_docs(&[0, 1, 1000, 10000], 1_000_000);

        bench.iter(|| alive_bitset.iter_alive().collect::<Vec<_>>());
    }

    // Checks each doc one by one with `is_alive` when almost all the docs are alive.
    #[bench]
    fn bench_alive_bitset_access(bench: &mut Bencher) {
        let alive_bitset = AliveBitSet::for_test_from_deleted_docs(&[0, 1, 1000, 10000], 1_000_000);

        bench.iter(|| {
            (0..1_000_000_u32)
                .filter(|doc| alive_bitset.is_alive(*doc))
                .collect::<Vec<_>>()
        });
    }

    // Iterates over the alive docs when about one eighth of the docs are alive.
    #[bench]
    fn bench_alive_bitset_iter_deser_on_fly_1_8_alive(bench: &mut Bencher) {
        let alive_bitset = AliveBitSet::for_test_from_deleted_docs(&get_alive(), 1_000_000);

        bench.iter(|| alive_bitset.iter_alive().collect::<Vec<_>>());
    }

    // Checks each doc one by one with `is_alive` when about one eighth of the docs are alive.
    #[bench]
    fn bench_alive_bitset_access_1_8_alive(bench: &mut Bencher) {
        let alive_bitset = AliveBitSet::for_test_from_deleted_docs(&get_alive(), 1_000_000);

        bench.iter(|| {
            (0..1_000_000_u32)
                .filter(|doc| alive_bitset.is_alive(*doc))
                .collect::<Vec<_>>()
        });
    }
}


================================================
FILE: src/fastfield/error.rs
================================================
use std::result;

use crate::schema::FieldEntry;

/// `FastFieldNotAvailableError` is returned when the
/// user requested a fast field reader, and the field was not
/// defined in the schema as a fast field.
#[derive(Debug, Error)]
#[error("Fast field not available: '{field_name:?}'")]
pub struct FastFieldNotAvailableError {
    // Name of the field for which a fast field reader was requested.
    pub(crate) field_name: String,
}

impl FastFieldNotAvailableError {
    /// Creates a `FastFieldNotAvailable` error.
    /// `field_entry` is the configuration of the field
    /// for which fast fields are not available. Only its name is retained.
    pub fn new(field_entry: &FieldEntry) -> FastFieldNotAvailableError {
        let field_name = field_entry.name().to_string();
        Self { field_name }
    }
}

/// Result when trying to access a fast field reader.
///
/// The error type is always [`FastFieldNotAvailableError`].
pub type Result<R> = result::Result<R, FastFieldNotAvailableError>;


================================================
FILE: src/fastfield/facet_reader.rs
================================================
use columnar::StrColumn;

use crate::schema::Facet;
use crate::termdict::TermOrdinal;
use crate::DocId;

/// The facet reader makes it possible to access the list of
/// facets associated with a given document in a specific
/// segment.
///
/// Rather than manipulating `Facet` objects directly, the API
/// exposes them as a list of `Facet` ordinals.
///
/// A facet ordinal can then be translated into a facet via
/// `.facet_from_ord(...)`.
///
/// Facet ordinals are defined as their position in the sorted
/// list of facets. This ordinal is segment local and
/// only makes sense for a given segment.
pub struct FacetReader {
    // String column that provides both the per-document ordinals
    // (`ords()`) and the facet dictionary (`dictionary()`).
    facet_column: StrColumn,
}

impl FacetReader {
    /// Creates a new `FacetReader`.
    ///
    /// A facet reader just wraps a `StrColumn`, which provides:
    /// - the list of facet ordinals associated with a given document,
    /// - the dictionary that associates a facet with an ordinal.
    pub fn new(facet_column: StrColumn) -> FacetReader {
        FacetReader { facet_column }
    }

    /// Returns the size of the sets of facets in the segment.
    /// This does not take into account the documents that may be marked
    /// as deleted.
    ///
    /// `Facet` ordinals range from `0` to `num_facets() - 1`.
    pub fn num_facets(&self) -> usize {
        self.facet_column.num_terms()
    }

    /// Given a term ordinal, writes the facet associated with it into `output`.
    ///
    /// # Errors
    ///
    /// Propagates any error returned by the underlying column lookup.
    ///
    /// # Panics
    ///
    /// Panics if the lookup reports that `facet_ord` was not found.
    pub fn facet_from_ord(&self, facet_ord: TermOrdinal, output: &mut Facet) -> crate::Result<()> {
        let found_term = self.facet_column.ord_to_str(facet_ord, &mut output.0)?;
        assert!(found_term, "Term ordinal {facet_ord} not found.");
        Ok(())
    }

    /// Returns the list of facet ordinals associated with a document.
    pub fn facet_ords(&self, doc: DocId) -> impl Iterator<Item = u64> + '_ {
        self.facet_column.ords().values_for_doc(doc)
    }

    /// Accessor to the facet dictionary.
    pub fn facet_dict(&self) -> &columnar::Dictionary {
        self.facet_column.dictionary()
    }
}

#[cfg(test)]
mod tests {
    use crate::schema::{Facet, FacetOptions, SchemaBuilder, Value, STORED};
    use crate::{DocAddress, Index, IndexWriter, TantivyDocument};

    /// A facet field with default options is readable through the facet
    /// reader, but no facet value comes back with the fetched document.
    #[test]
    fn test_facet_only_indexed() {
        let mut builder = SchemaBuilder::default();
        let facet_field = builder.add_facet_field("facet", FacetOptions::default());
        let index = Index::create_in_ram(builder.build());
        let mut writer: IndexWriter = index.writer_for_tests().unwrap();
        writer
            .add_document(doc!(facet_field=>Facet::from_text("/a/b").unwrap()))
            .unwrap();
        writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let facet_reader = searcher.segment_reader(0u32).facet_reader("facet").unwrap();
        let ords: Vec<u64> = facet_reader.facet_ords(0u32).collect();
        assert_eq!(&ords, &[0u64]);
        assert_eq!(facet_reader.num_facets(), 1);

        let mut resolved = Facet::default();
        facet_reader.facet_from_ord(0, &mut resolved).unwrap();
        assert_eq!(resolved.to_path_string(), "/a/b");

        let fetched_doc = searcher
            .doc::<TantivyDocument>(DocAddress::new(0u32, 0u32))
            .unwrap();
        let fetched_facet = fetched_doc
            .get_first(facet_field)
            .and_then(|v| v.as_value().as_facet());
        assert_eq!(fetched_facet, None);
    }

    /// Facet ordinals follow the sorted order of the facets, regardless of
    /// the order in which the facets were added.
    #[test]
    fn test_facet_several_facets_sorted() {
        let mut builder = SchemaBuilder::default();
        let facet_field = builder.add_facet_field("facet", FacetOptions::default());
        let index = Index::create_in_ram(builder.build());
        let mut writer: IndexWriter = index.writer_for_tests().unwrap();
        writer
            .add_document(doc!(facet_field=>Facet::from_text("/parent/child1").unwrap()))
            .unwrap();
        writer
            .add_document(doc!(
                facet_field=>Facet::from_text("/parent/child2").unwrap(),
                facet_field=>Facet::from_text("/parent/child1/blop").unwrap(),
            ))
            .unwrap();
        writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let facet_reader = searcher.segment_reader(0u32).facet_reader("facet").unwrap();

        let first_doc_ords: Vec<u64> = facet_reader.facet_ords(0u32).collect();
        assert_eq!(&first_doc_ords, &[0u64]);

        let second_doc_ords: Vec<u64> = facet_reader.facet_ords(1u32).collect();
        assert_eq!(&second_doc_ords, &[1u64, 2u64]);

        assert_eq!(facet_reader.num_facets(), 3);

        // Expected facet path for each ordinal, in ordinal order.
        let expected = [
            (0, "/parent/child1"),
            (1, "/parent/child1/blop"),
            (2, "/parent/child2"),
        ];
        let mut facet = Facet::default();
        for (ord, path) in expected {
            facet_reader.facet_from_ord(ord, &mut facet).unwrap();
            assert_eq!(facet.to_path_string(), path);
        }
    }

    /// A `STORED` facet field is readable through the facet reader and is
    /// also returned with the fetched document.
    #[test]
    fn test_facet_stored_and_indexed() -> crate::Result<()> {
        let mut builder = SchemaBuilder::default();
        let facet_field = builder.add_facet_field("facet", STORED);
        let index = Index::create_in_ram(builder.build());
        let mut writer = index.writer_for_tests()?;
        writer.add_document(doc!(facet_field=>Facet::from_text("/a/b").unwrap()))?;
        writer.commit()?;

        let searcher = index.reader()?.searcher();
        let facet_reader = searcher.segment_reader(0u32).facet_reader("facet").unwrap();
        let ords: Vec<u64> = facet_reader.facet_ords(0u32).collect();
        assert_eq!(&ords, &[0u64]);

        let fetched_doc = searcher.doc::<TantivyDocument>(DocAddress::new(0u32, 0u32))?;
        let fetched_facet: Option<Facet> = fetched_doc
            .get_first(facet_field)
            .and_then(|v| v.as_facet())
            .map(|encoded| Facet::from_encoded_string(encoded.to_string()));
        assert_eq!(fetched_facet, Facet::from_text("/a/b").ok());
        Ok(())
    }

    /// A document without any facet yields an empty list of facet ordinals.
    #[test]
    fn test_facet_not_populated_for_all_docs() -> crate::Result<()> {
        let mut builder = SchemaBuilder::default();
        let facet_field = builder.add_facet_field("facet", FacetOptions::default());
        let index = Index::create_in_ram(builder.build());
        let mut writer = index.writer_for_tests()?;
        writer.add_document(doc!(facet_field=>Facet::from_text("/a/b").unwrap()))?;
        writer.add_document(TantivyDocument::default())?;
        writer.commit()?;

        let searcher = index.reader()?.searcher();
        let facet_reader = searcher.segment_reader(0u32).facet_reader("facet").unwrap();

        let populated_doc_ords: Vec<u64> = facet_reader.facet_ords(0u32).collect();
        assert_eq!(&populated_doc_ords, &[0u64]);

        let empty_doc_ords: Vec<u64> = facet_reader.facet_ords(1u32).collect();
        assert!(empty_doc_ords.is_empty());
        Ok(())
    }

    /// The facet reader can still be opened when no document carries a facet,
    /// and it yields no ordinal for any document.
    #[test]
    fn test_facet_not_populated_for_any_docs() -> crate::Result<()> {
        let mut builder = SchemaBuilder::default();
        builder.add_facet_field("facet", FacetOptions::default());
        let index = Index::create_in_ram(builder.build());
        let mut writer = index.writer_for_tests()?;
        for _ in 0..2 {
            writer.add_document(TantivyDocument::default())?;
        }
        writer.commit()?;

        let searcher = index.reader()?.searcher();
        let facet_reader = searcher.segment_reader(0u32).facet_reader("facet").unwrap();
        for doc in 0u32..2u32 {
            assert!(facet_reader.facet_ords(doc).next().is_none());
        }
        Ok(())
    }
}


================================================
FILE: src/fastfield/mod.rs
================================================
//! Column oriented field storage for tantivy.
//!
//! It is the equivalent of `Lucene`'s `DocValues`.
//!
//! Fast fields provide column-oriented storage for `tantivy`.
//!
//! It is designed for the fast random access of some document
//! fields given a document id.
//!
//! Fast fields are useful when a field is required for all or most of
//! the `DocSet`: for instance for scoring, grouping, aggregation, filtering, or faceting.
//!
//!
//! Fields have to be declared as `FAST` in the schema.
//! Currently supported fields are: u64, i64, f64, bytes, ip and text.
//!
//! Fast fields are stored with [different codecs](columnar). The best codec is detected
//! automatically when serializing.
//!
//! Read access performance is comparable to that of an array lookup.

pub use columnar::Column;
use columnar::MonotonicallyMappableToU64;

pub use self::alive_bitset::{intersect_alive_bitsets, write_alive_bitset, AliveBitSet};
pub use self::error::{FastFieldNotAvailableError, Result};
pub use self::facet_reader::FacetReader;
pub use self::readers::FastFieldReaders;
pub use self::writer::FastFieldsWriter;
use crate::schema::Type;
use crate::DateTime;

mod alive_bitset;
mod error;
mod facet_reader;
mod readers;
mod writer;

/// Trait for types that are allowed for fast fields
/// (`u64`, `i64`, `f64`, `bool` and `DateTime`).
pub trait FastValue: MonotonicallyMappableToU64 {
    /// Returns the `schema::Type` for this FastValue.
    fn to_type() -> Type;
}

// `u64` fast values map to `Type::U64`.
impl FastValue for u64 {
    fn to_type() -> Type {
        Type::U64
    }
}

// `i64` fast values map to `Type::I64`.
impl FastValue for i64 {
    fn to_type() -> Type {
        Type::I64
    }
}

// `f64` fast values map to `Type::F64`.
impl FastValue for f64 {
    fn to_type() -> Type {
        Type::F64
    }
}

// `bool` fast values map to `Type::Bool`.
impl FastValue for bool {
    fn to_type() -> Type {
        Type::Bool
    }
}
// `DateTime` fast values map to `Type::Date`.
impl FastValue for DateTime {
    fn to_type() -> Type {
        Type::Date
    }
}

#[cfg(test)]
mod tests {

    use std::net::Ipv6Addr;
    use std::ops::{Range, RangeInclusive};
    use std::path::Path;

    use columnar::StrColumn;
    use common::{ByteCount, DateTimePrecision, HasLen, TerminatingWrite};
    use once_cell::sync::Lazy;
    use rand::prelude::SliceRandom;
    use rand::rngs::StdRng;
    use rand::{Rng, SeedableRng};

    use super::*;
    use crate::directory::{Directory, RamDirectory, WritePtr};
    use crate::index::SegmentId;
    use crate::merge_policy::NoMergePolicy;
    use crate::schema::{
        DateOptions, Facet, FacetOptions, Field, JsonObjectOptions, Schema, SchemaBuilder,
        TantivyDocument, TextOptions, FAST, INDEXED, STORED, STRING, TEXT,
    };
    use crate::time::OffsetDateTime;
    use crate::tokenizer::{LowerCaser, RawTokenizer, TextAnalyzer, TokenizerManager};
    use crate::{Index, IndexWriter, SegmentReader};

    // Lazily-built schema shared by the tests below: a single u64 field
    // named "field", declared `FAST`.
    pub static SCHEMA: Lazy<Schema> = Lazy::new(|| {
        let mut builder = Schema::builder();
        builder.add_u64_field("field", FAST);
        builder.build()
    });
    // Handle of the "field" field of `SCHEMA`, resolved lazily on first use.
    pub static FIELD: Lazy<Field> = Lazy::new(|| SCHEMA.get_field("field").unwrap());

    /// The Unix epoch, mapped to u64 and read back as an i64, is `0`.
    #[test]
    pub fn test_convert_i64_u64() {
        let epoch = DateTime::from_utc(OffsetDateTime::UNIX_EPOCH);
        let epoch_as_u64 = epoch.to_u64();
        assert_eq!(i64::from_u64(epoch_as_u64), 0i64);
    }

    /// Round-trips three small u64 values through the fast field writer and
    /// reader, and pins the size of the serialized file.
    #[test]
    fn test_intfastfield_small() -> crate::Result<()> {
        let values = [13u64, 14u64, 2u64];
        let path = Path::new("test");
        let directory: RamDirectory = RamDirectory::create();
        {
            let mut write: WritePtr = directory.open_write(path).unwrap();
            let mut writers = FastFieldsWriter::from_schema(&SCHEMA).unwrap();
            for &val in &values {
                writers.add_document(&doc!(*FIELD=>val)).unwrap();
            }
            writers.serialize(&mut write).unwrap();
            write.terminate().unwrap();
        }
        let file = directory.open_read(path).unwrap();

        assert_eq!(file.len(), 80);
        let readers = FastFieldReaders::open(file, SCHEMA.clone()).unwrap();
        let column = readers.u64("field").unwrap().first_or_default_col(0);
        for (doc, &expected) in values.iter().enumerate() {
            assert_eq!(column.get_val(doc as u32), expected);
        }
        Ok(())
    }

    /// Round-trips nine u64 values of varying magnitude through the fast
    /// field writer and reader, and pins the size of the serialized file.
    #[test]
    fn test_intfastfield_large() {
        let values = [
            4u64,
            14_082_001u64,
            3_052u64,
            9_002u64,
            15_001u64,
            777u64,
            1_002u64,
            1_501u64,
            215u64,
        ];
        let path = Path::new("test");
        let directory: RamDirectory = RamDirectory::create();
        {
            let mut write: WritePtr = directory.open_write(path).unwrap();
            let mut writers = FastFieldsWriter::from_schema(&SCHEMA).unwrap();
            for &val in &values {
                writers.add_document(&doc!(*FIELD=>val)).unwrap();
            }
            writers.serialize(&mut write).unwrap();
            write.terminate().unwrap();
        }
        let file = directory.open_read(path).unwrap();
        assert_eq!(file.len(), 108);
        let readers = FastFieldReaders::open(file, SCHEMA.clone()).unwrap();
        let col = readers.u64("field").unwrap().first_or_default_col(0);
        for (doc, &expected) in values.iter().enumerate() {
            assert_eq!(col.get_val(doc as u32), expected);
        }
    }

    /// Round-trips 10_000 documents that all hold the same value (zero
    /// amplitude), and pins the size of the serialized file.
    #[test]
    fn test_intfastfield_null_amplitude() {
        let path = Path::new("test");
        let directory: RamDirectory = RamDirectory::create();
        {
            let mut write: WritePtr = directory.open_write(path).unwrap();
            let mut writers = FastFieldsWriter::from_schema(&SCHEMA).unwrap();
            let constant_doc = doc!(*FIELD=>100_000u64);
            for _ in 0..10_000 {
                writers.add_document(&constant_doc).unwrap();
            }
            writers.serialize(&mut write).unwrap();
            write.terminate().unwrap();
        }
        let file = directory.open_read(path).unwrap();
        assert_eq!(file.len(), 81);
        let readers = FastFieldReaders::open(file, SCHEMA.clone()).unwrap();
        let column = readers.u64("field").unwrap().first_or_default_col(0);
        for doc in 0..10_000 {
            assert_eq!(column.get_val(doc), 100_000u64);
        }
    }

    /// Round-trips u64 values that span a very wide range (a single `0`
    /// followed by values around 5 * 10^18), and pins the size of the
    /// serialized file.
    #[test]
    fn test_intfastfield_large_numbers() {
        let path = Path::new("test");
        let directory: RamDirectory = RamDirectory::create();

        {
            let mut write: WritePtr = directory.open_write(path).unwrap();
            let mut fast_field_writers = FastFieldsWriter::from_schema(&SCHEMA).unwrap();
            // forcing the amplitude to be high
            fast_field_writers
                .add_document(&doc!(*FIELD=>0u64))
                .unwrap();
            for doc_id in 1u64..10_000u64 {
                fast_field_writers
                    .add_document(&doc!(*FIELD=>5_000_000_000_000_000_000u64 + doc_id))
                    .unwrap();
            }
            fast_field_writers.serialize(&mut write).unwrap();
            write.terminate().unwrap();
        }
        let file = directory.open_read(path).unwrap();
        assert_eq!(file.len(), 4476);
        {
            let fast_field_readers = FastFieldReaders::open(file, SCHEMA.clone()).unwrap();
            let col = fast_field_readers
                .u64("field")
                .unwrap()
                .first_or_default_col(0);
            // Doc 0 holds the low outlier that forces the high amplitude;
            // it must round-trip as well.
            assert_eq!(col.get_val(0), 0u64);
            for doc in 1..10_000 {
                assert_eq!(col.get_val(doc), 5_000_000_000_000_000_000u64 + doc as u64);
            }
        }
    }

    /// Round-trips the i64 range `-100..10_000` and checks min/max, per-doc
    /// access and ranged access on the resulting column.
    #[test]
    fn test_signed_intfastfield_normal() -> crate::Result<()> {
        let path = Path::new("test");
        let directory: RamDirectory = RamDirectory::create();
        let mut schema_builder = Schema::builder();

        let i64_field = schema_builder.add_i64_field("field", FAST);
        let schema = schema_builder.build();
        {
            let mut write: WritePtr = directory.open_write(path).unwrap();
            let mut writers = FastFieldsWriter::from_schema(&schema).unwrap();
            for val in -100i64..10_000i64 {
                let mut document = TantivyDocument::default();
                document.add_i64(i64_field, val);
                writers.add_document(&document).unwrap();
            }
            writers.serialize(&mut write).unwrap();
            write.terminate().unwrap();
        }
        let file = directory.open_read(path).unwrap();
        assert_eq!(file.len(), 252);

        {
            let readers = FastFieldReaders::open(file, schema).unwrap();
            let col = readers.i64("field").unwrap().first_or_default_col(0);
            assert_eq!(col.min_value(), -100i64);
            assert_eq!(col.max_value(), 9_999i64);
            for (doc, expected) in (0u32..).zip(-100i64..10_000i64) {
                assert_eq!(col.get_val(doc), expected);
            }
            // Read 100 consecutive values starting at row 53.
            let mut buffer = vec![0i64; 100];
            col.get_range(53, &mut buffer[..]);
            for (offset, &val) in buffer.iter().enumerate() {
                assert_eq!(val, -100i64 + 53i64 + offset as i64);
            }
        }
        Ok(())
    }

    /// A document with no value reads as `None` through `first`, and as the
    /// supplied default through `first_or_default_col`.
    #[test]
    fn test_signed_intfastfield_default_val() {
        let path = Path::new("test");
        let directory: RamDirectory = RamDirectory::create();
        let schema = {
            let mut schema_builder = Schema::builder();
            schema_builder.add_i64_field("field", FAST);
            schema_builder.build()
        };

        {
            let mut write: WritePtr = directory.open_write(path).unwrap();
            let mut writers = FastFieldsWriter::from_schema(&schema).unwrap();
            let empty_doc = TantivyDocument::default();
            writers.add_document(&empty_doc).unwrap();
            writers.serialize(&mut write).unwrap();
            write.terminate().unwrap();
        }

        let file = directory.open_read(path).unwrap();
        let readers = FastFieldReaders::open(file, schema).unwrap();

        let optional_col = readers.i64("field").unwrap();
        assert_eq!(optional_col.first(0), None);

        let zero_default_col = readers.i64("field").unwrap().first_or_default_col(0);
        assert_eq!(zero_default_col.get_val(0), 0);

        let negative_default_col = readers.i64("field").unwrap().first_or_default_col(-100);
        assert_eq!(negative_default_col.get_val(0), -100);
    }

    /// A document with no date reads as the supplied default through
    /// `first_or_default_col`.
    #[test]
    fn test_date_fastfield_default() {
        let path = Path::new("test");
        let directory: RamDirectory = RamDirectory::create();
        let schema = {
            let mut schema_builder = Schema::builder();
            schema_builder.add_date_field("date", FAST);
            schema_builder.build()
        };
        {
            let mut write: WritePtr = directory.open_write(path).unwrap();
            let mut writers = FastFieldsWriter::from_schema(&schema).unwrap();
            let empty_doc = TantivyDocument::default();
            writers.add_document(&empty_doc).unwrap();
            writers.serialize(&mut write).unwrap();
            write.terminate().unwrap();
        }

        let file = directory.open_read(path).unwrap();
        let readers = FastFieldReaders::open(file, schema).unwrap();
        let date_col = readers
            .date("date")
            .unwrap()
            .first_or_default_col(DateTime::default());
        assert_eq!(date_col.get_val(0), DateTime::default());
    }

    // Warning: the RNG seed is fixed, so every call returns the same
    // permutation of `0..100_000`.
    pub fn generate_permutation() -> Vec<u64> {
        let mut rng = StdRng::from_seed([1u8; 32]);
        let mut values: Vec<u64> = (0u64..100_000u64).collect();
        values.shuffle(&mut rng);
        values
    }

    // Warning: the RNG seed is fixed, so every call returns the same
    // permutation. All values are multiples of 1000.
    pub fn generate_permutation_gcd() -> Vec<u64> {
        let mut rng = StdRng::from_seed([1u8; 32]);
        let mut values: Vec<u64> = (1u64..100_000u64).map(|el| el * 1000).collect();
        values.shuffle(&mut rng);
        values
    }

    // Writes one document per value of `permutation`, reopens the fast
    // fields and checks that every value reads back at its position.
    fn test_intfastfield_permutation_with_data(permutation: Vec<u64>) {
        let path = Path::new("test");
        let directory = RamDirectory::create();
        {
            let mut write: WritePtr = directory.open_write(path).unwrap();
            let mut writers = FastFieldsWriter::from_schema(&SCHEMA).unwrap();
            for &val in &permutation {
                writers.add_document(&doc!(*FIELD=>val)).unwrap();
            }
            writers.serialize(&mut write).unwrap();
            write.terminate().unwrap();
        }
        let file = directory.open_read(path).unwrap();
        let readers = FastFieldReaders::open(file, SCHEMA.clone()).unwrap();
        let col = readers.u64("field").unwrap().first_or_default_col(0);
        for (doc, &expected) in permutation.iter().enumerate() {
            assert_eq!(col.get_val(doc as u32), expected);
        }
    }

    /// Round-trips the shuffled multiples of 1000 from
    /// `generate_permutation_gcd`.
    #[test]
    fn test_intfastfield_permutation_gcd() {
        test_intfastfield_permutation_with_data(generate_permutation_gcd());
    }

    /// Round-trips the shuffled values from `generate_permutation`.
    #[test]
    fn test_intfastfield_permutation() {
        test_intfastfield_permutation_with_data(generate_permutation());
    }

    /// Merges a segment whose document has a date with a segment whose
    /// document has none, and checks that a single segment remains.
    #[test]
    fn test_merge_missing_date_fast_field() {
        let mut schema_builder = Schema::builder();
        let date_field = schema_builder.add_date_field("date", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        let mut writer: IndexWriter = index.writer_for_tests().unwrap();
        writer.set_merge_policy(Box::new(NoMergePolicy));

        // First segment: one document carrying a date.
        writer
            .add_document(doc!(date_field => DateTime::from_utc(OffsetDateTime::now_utc())))
            .unwrap();
        writer.commit().unwrap();

        // Second segment: one document without any date.
        writer.add_document(doc!()).unwrap();
        writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let segment_ids: Vec<SegmentId> = reader
            .searcher()
            .segment_readers()
            .iter()
            .map(|segment_reader| segment_reader.segment_id())
            .collect();
        assert_eq!(segment_ids.len(), 2);

        writer.merge(&segment_ids[..]).wait().unwrap();
        reader.reload().unwrap();
        assert_eq!(reader.searcher().segment_readers().len(), 1);
    }

    // Concatenates, in doc order, the values that `column` holds for each
    // doc of `docs`. Docs without values contribute nothing.
    fn get_vals_for_docs(column: &Column<u64>, docs: Range<u32>) -> Vec<u64> {
        let mut vals = Vec::new();
        for doc in docs {
            vals.extend(column.values_for_doc(doc));
        }
        vals
    }

    /// Checks the term ordinals of a `TEXT | FAST` field within two separate
    /// segments, then after merging both segments into one.
    #[test]
    fn test_text_fastfield() {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT | FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);

        {
            // first segment
            let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
            index_writer.set_merge_policy(Box::new(NoMergePolicy));
            index_writer
                .add_document(doc!(
                text_field => "BBBBB", // term ord 1
                text_field => "AAAAA", // term ord 0
                ))
                .unwrap();
            index_writer.add_document(doc!()).unwrap();
            index_writer
                .add_document(doc!(
                text_field => "AAAAA", // term_ord 0
                ))
                .unwrap();
            index_writer
                .add_document(doc!(
                    text_field => "AAAAA",
                    text_field => "BBBBB",
                ))
                .unwrap();
            index_writer
                .add_document(doc!(
                text_field => "zumberthree", // term_ord 2, after merge term_ord 3
                ))
                .unwrap();

            index_writer.add_document(doc!()).unwrap();
            index_writer.commit().unwrap();

            let reader = index.reader().unwrap();
            let searcher = reader.searcher();
            assert_eq!(searcher.segment_readers().len(), 1);
            let segment_reader = searcher.segment_reader(0);
            let fast_fields = segment_reader.fast_fields();
            let str_column = fast_fields.str("text").unwrap().unwrap();
            // Ordinals come back in the order the values were added to each doc.
            assert!(str_column.ords().values_for_doc(0u32).eq([1, 0]),);
            assert!(str_column.ords().values_for_doc(1u32).next().is_none());
            assert!(str_column.ords().values_for_doc(2u32).eq([0]),);
            assert!(str_column.ords().values_for_doc(3u32).eq([0, 1]),);
            assert!(str_column.ords().values_for_doc(4u32).eq([2]),);

            // The fast field dictionary holds the text as it was added ("AAAAA")...
            let mut str_term = String::default();
            assert!(str_column.ord_to_str(0, &mut str_term).unwrap());
            assert_eq!("AAAAA", &str_term);

            // ...whereas the inverted index holds the lowercased term ("aaaaa").
            let inverted_index = segment_reader.inverted_index(text_field).unwrap();
            assert_eq!(inverted_index.terms().num_terms(), 3);
            let mut bytes = vec![];
            assert!(inverted_index.terms().ord_to_term(0, &mut bytes).unwrap());
            assert_eq!(bytes, "aaaaa".as_bytes());
        }

        {
            // second segment
            let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();

            index_writer
                .add_document(doc!(
                text_field => "AAAAA", // term_ord 0
                ))
                .unwrap();

            index_writer
                .add_document(doc!(
                text_field => "CCCCC AAAAA", // term_ord 1, after merge 2
                ))
                .unwrap();

            index_writer.add_document(doc!()).unwrap();
            index_writer.commit().unwrap();

            let reader = index.reader().unwrap();
            let searcher = reader.searcher();
            assert_eq!(searcher.segment_readers().len(), 2);
            let segment_reader = searcher.segment_reader(1);
            let fast_fields = segment_reader.fast_fields();
            let text_fast_field = fast_fields.str("text").unwrap().unwrap();

            assert_eq!(&get_vals_for_docs(text_fast_field.ords(), 0..2), &[0, 1]);
        }

        // Merging the segments
        {
            let segment_ids = index.searchable_segment_ids().unwrap();
            let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
            index_writer.merge(&segment_ids).wait().unwrap();
            index_writer.wait_merging_threads().unwrap();
        }

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let segment_reader = searcher.segment_reader(0);
        let fast_fields = segment_reader.fast_fields();
        let text_column = fast_fields.str("text").unwrap().unwrap();

        // Ordinals of the merged segment, using the "after merge" numbering
        // noted on the documents above.
        assert_eq!(
            get_vals_for_docs(text_column.ords(), 0..8),
            vec![1, 0, 0, 0, 1, 3 /* next segment */, 0, 2]
        );
    }

    /// Term ordinals of a text fast field are returned in insertion order,
    /// not sorted.
    #[test]
    fn test_string_fastfield_simple() {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT | FAST);
        let index = Index::create_in_ram(schema_builder.build());
        let mut writer = index.writer_for_tests().unwrap();
        writer
            .add_document(doc!(
                text_field=>"hello happy tax payer",
                text_field=>"aaa this string comes lexicographically before the other one."
            ))
            .unwrap();
        writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let segment_reader = searcher.segment_reader(0);
        let str_column = segment_reader.fast_fields().str("text").unwrap().unwrap();
        // The string values are not sorted here.
        let ords: Vec<u64> = str_column.term_ords(0u32).collect();
        assert_eq!(&ords, &[1, 0]);
    }

    /// Facet ordinals of a document are returned sorted, regardless of the
    /// order in which the facets were added.
    #[test]
    fn test_facet_fastfield_simple() {
        let mut schema_builder = Schema::builder();
        let facet_field = schema_builder.add_facet_field("facet", FacetOptions::default());
        let index = Index::create_in_ram(schema_builder.build());
        let mut writer = index.writer_for_tests().unwrap();
        writer
            .add_document(doc!(facet_field=>Facet::from("/a/2"), facet_field=>Facet::from("/a/1")))
            .unwrap();
        writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let segment_reader = searcher.segment_reader(0);
        let facet_reader = segment_reader.facet_reader("facet").unwrap();
        // facets, contrary to strings are sorted.
        let ords: Vec<u64> = facet_reader.facet_ords(0u32).collect();
        assert_eq!(&ords, &[0, 1]);
    }

    /// Checks the term ordinals of a string fast field in two separate segments,
    /// then once more after both segments have been merged.
    #[test]
    fn test_string_fastfield() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", STRING | FAST);
        let index = Index::create_in_ram(schema_builder.build());

        // First segment: six documents, two of them without any value.
        {
            let mut writer = index.writer_for_tests()?;
            writer.set_merge_policy(Box::new(NoMergePolicy));
            writer.add_document(doc!(text_field => "BBBBB"))?; // term_ord 1
            writer.add_document(doc!())?;
            writer.add_document(doc!(text_field => "AAAAA"))?; // term_ord 0
            writer.add_document(doc!(text_field => "AAAAA"))?; // term_ord 0
            // term_ord 2, after merge term_ord 3
            writer.add_document(doc!(text_field => "zumberthree"))?;
            writer.add_document(doc!())?;
            writer.commit()?;

            let searcher = index.reader()?.searcher();
            assert_eq!(searcher.segment_readers().len(), 1);
            let segment_reader = searcher.segment_reader(0);
            let text_col = segment_reader.fast_fields().str("text").unwrap().unwrap();

            assert_eq!(get_vals_for_docs(text_col.ords(), 0..6), vec![1, 0, 0, 2]);

            // The term dictionary of the inverted index holds the three distinct terms.
            let inverted_index = segment_reader.inverted_index(text_field)?;
            let term_dict = inverted_index.terms();
            assert_eq!(term_dict.num_terms(), 3);
            let mut term_bytes = vec![];
            assert!(term_dict.ord_to_term(0, &mut term_bytes)?);
            assert_eq!(term_bytes, "AAAAA".as_bytes());
        }

        // Second segment: two values followed by an empty document.
        {
            let mut writer = index.writer_for_tests()?;
            writer.add_document(doc!(text_field => "AAAAA"))?; // term_ord 0
            writer.add_document(doc!(text_field => "CCCCC"))?; // term_ord 1, after merge 2
            writer.add_document(doc!())?;
            writer.commit()?;

            let searcher = index.reader()?.searcher();
            assert_eq!(searcher.segment_readers().len(), 2);
            let second_segment = searcher.segment_reader(1);
            let text_col = second_segment.fast_fields().str("text").unwrap().unwrap();

            assert_eq!(&get_vals_for_docs(text_col.ords(), 0..2), &[0, 1]);
        }

        // Merging the segments
        {
            let segment_ids = index.searchable_segment_ids()?;
            let mut merging_writer: IndexWriter = index.writer_for_tests()?;
            merging_writer.merge(&segment_ids).wait()?;
            merging_writer.wait_merging_threads()?;
        }

        let searcher = index.reader()?.searcher();
        let merged_segment = searcher.segment_reader(0);
        let merged_text_col = merged_segment.fast_fields().str("text").unwrap().unwrap();

        assert_eq!(
            get_vals_for_docs(merged_text_col.ords(), 0..9),
            vec![1, 0, 0, 3 /* next segment */, 0, 2]
        );

        Ok(())
    }

    /// Exercises a single-valued and a multi-valued date fast field with nanosecond
    /// precision, including documents that miss one of the two fields.
    #[test]
    fn test_datefastfield() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let single_opts = DateOptions::from(FAST).set_precision(DateTimePrecision::Nanoseconds);
        let date_field = schema_builder.add_date_field("date", single_opts);
        let multi_opts = DateOptions::default()
            .set_precision(DateTimePrecision::Nanoseconds)
            .set_fast();
        let multi_date_field = schema_builder.add_date_field("multi_date", multi_opts);
        let index = Index::create_in_ram(schema_builder.build());

        // Dates are built from a raw i64; the assertions below read the same number
        // back as a nanosecond timestamp.
        let date = |raw: i64| DateTime::from_u64(raw.to_u64());

        let mut index_writer = index.writer_for_tests()?;
        index_writer.set_merge_policy(Box::new(NoMergePolicy));
        index_writer.add_document(doc!(
            date_field => date(1),
            multi_date_field => date(2),
            multi_date_field => date(3)
        ))?;
        index_writer.add_document(doc!(date_field => date(4)))?;
        index_writer.add_document(doc!(
            multi_date_field => date(5),
            multi_date_field => date(6)
        ))?;
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();
        assert_eq!(searcher.segment_readers().len(), 1);
        let fast_fields = searcher.segment_reader(0).fast_fields();
        let single_date_col = fast_fields
            .column_opt::<DateTime>("date")
            .unwrap()
            .unwrap()
            .first_or_default_col(Default::default());
        let multi_date_col = fast_fields
            .column_opt::<DateTime>("multi_date")
            .unwrap()
            .unwrap();
        // Collects the nanosecond timestamps of all `multi_date` values of a document.
        let multi_nanos = |doc: u32| -> Vec<i64> {
            multi_date_col
                .values_for_doc(doc)
                .map(|value| value.into_timestamp_nanos())
                .collect()
        };

        // Doc 0 has both fields.
        assert_eq!(single_date_col.get_val(0).into_timestamp_nanos(), 1i64);
        assert_eq!(multi_nanos(0), vec![2i64, 3i64]);

        // Doc 1 only has the single-valued field.
        assert_eq!(single_date_col.get_val(1).into_timestamp_nanos(), 4i64);
        assert!(multi_nanos(1).is_empty());

        // Doc 2 only has the multi-valued field: the single-valued column falls back
        // to the default value.
        assert_eq!(single_date_col.get_val(2).into_timestamp_nanos(), 0i64);
        assert_eq!(multi_nanos(2), vec![5i64, 6i64]);
        Ok(())
    }

    /// Serializes four bool values and reads them back, also pinning the file size.
    #[test]
    pub fn test_fastfield_bool_small() {
        let path = Path::new("test_bool");
        let directory: RamDirectory = RamDirectory::create();

        let mut schema_builder = Schema::builder();
        schema_builder.add_bool_field("field_bool", FAST);
        let schema = schema_builder.build();
        let field = schema.get_field("field_bool").unwrap();

        // One value per document, in doc id order.
        let values = [true, false, true, false];
        {
            let mut write: WritePtr = directory.open_write(path).unwrap();
            let mut fast_field_writers = FastFieldsWriter::from_schema(&schema).unwrap();
            for value in values {
                fast_field_writers
                    .add_document(&doc!(field => value))
                    .unwrap();
            }
            fast_field_writers.serialize(&mut write).unwrap();
            write.terminate().unwrap();
        }

        let file = directory.open_read(path).unwrap();
        assert_eq!(file.len(), 84);
        let fast_field_readers = FastFieldReaders::open(file, schema).unwrap();
        let bool_col = fast_field_readers.bool("field_bool").unwrap();
        for (doc_id, expected) in (0u32..).zip(values) {
            assert_eq!(bool_col.first(doc_id), Some(expected));
        }
    }

    /// Serializes 50 `(true, false)` pairs (100 documents) and checks that every value
    /// can be read back, also pinning the file size.
    #[test]
    pub fn test_fastfield_bool_large() {
        // Number of `(true, false)` document pairs; shared by the write and the read
        // loops so that the whole column is verified.
        const NUM_PAIRS: u32 = 50;

        let path = Path::new("test_bool");
        let directory: RamDirectory = RamDirectory::create();

        let mut schema_builder = Schema::builder();
        schema_builder.add_bool_field("field_bool", FAST);
        let schema = schema_builder.build();
        let field = schema.get_field("field_bool").unwrap();

        {
            let mut write: WritePtr = directory.open_write(path).unwrap();
            let mut fast_field_writers = FastFieldsWriter::from_schema(&schema).unwrap();
            for _ in 0..NUM_PAIRS {
                fast_field_writers.add_document(&doc!(field=>true)).unwrap();
                fast_field_writers
                    .add_document(&doc!(field=>false))
                    .unwrap();
            }
            fast_field_writers.serialize(&mut write).unwrap();
            write.terminate().unwrap();
        }
        let file = directory.open_read(path).unwrap();
        assert_eq!(file.len(), 96);
        let readers = FastFieldReaders::open(file, schema).unwrap();
        let bool_col = readers.bool("field_bool").unwrap();
        // Check every written pair, not only the first half of the documents.
        for pair in 0..NUM_PAIRS {
            assert_eq!(bool_col.first(pair * 2), Some(true));
            assert_eq!(bool_col.first(pair * 2 + 1), Some(false));
        }
    }

    /// A document without any bool value yields `None` from the optional column and
    /// the requested fallback from `first_or_default_col`.
    #[test]
    pub fn test_fastfield_bool_default_value() {
        let path = Path::new("test_bool");
        let directory: RamDirectory = RamDirectory::create();
        let mut schema_builder = Schema::builder();
        schema_builder.add_bool_field("field_bool", FAST);
        let schema = schema_builder.build();
        {
            let mut write: WritePtr = directory.open_write(path).unwrap();
            let mut fast_field_writers = FastFieldsWriter::from_schema(&schema).unwrap();
            // The only document carries no value for `field_bool`.
            let doc = TantivyDocument::default();
            fast_field_writers.add_document(&doc).unwrap();
            fast_field_writers.serialize(&mut write).unwrap();
            write.terminate().unwrap();
        }
        let file = directory.open_read(path).unwrap();
        assert_eq!(file.len(), 86);
        let fastfield_readers = FastFieldReaders::open(file, schema).unwrap();
        let col = fastfield_readers.bool("field_bool").unwrap();
        assert_eq!(col.first(0), None);
        // The default handed to `first_or_default_col` is what `get_val` reports for
        // the value-less document.
        let col = fastfield_readers
            .bool("field_bool")
            .unwrap()
            .first_or_default_col(false);
        assert!(!col.get_val(0));
        let col = fastfield_readers
            .bool("field_bool")
            .unwrap()
            .first_or_default_col(true);
        assert!(col.get_val(0));
    }

    /// Serializes the fast fields of `docs` into the file `test` of a fresh
    /// `RamDirectory` and returns that directory.
    ///
    /// # Errors
    /// Failures while opening the file, recording a document, serializing or
    /// terminating the write are returned to the caller instead of panicking here.
    fn get_index(docs: &[crate::TantivyDocument], schema: &Schema) -> crate::Result<RamDirectory> {
        let directory: RamDirectory = RamDirectory::create();
        let mut write: WritePtr = directory.open_write(Path::new("test"))?;
        let mut fast_field_writers = FastFieldsWriter::from_schema(schema)?;
        for doc in docs {
            fast_field_writers.add_document(doc)?;
        }
        fast_field_writers.serialize(&mut write)?;
        write.terminate()?;
        Ok(directory)
    }

    /// Checks that the size of a date column holding 1_000 values spread over a two
    /// hour window matches the number of bits needed at each precision, with up to
    /// 100 bytes of slack.
    #[test]
    pub fn test_gcd_date() {
        // 13 bits per val = ceil(log_2(number of seconds in 2 hours)).
        let size_prec_sec = test_gcd_date_with_codec(DateTimePrecision::Seconds);
        let secs_min_bytes = 1000 * 13 / 8;
        assert!((secs_min_bytes..100 + secs_min_bytes).contains(&size_prec_sec.get_bytes()));

        // 33 bits per val = ceil(log_2(number of microseconds in 2 hours)).
        let size_prec_micros = test_gcd_date_with_codec(DateTimePrecision::Microseconds);
        let micros_min_bytes = 1000 * 33 / 8;
        assert!(
            (micros_min_bytes..100 + micros_min_bytes).contains(&size_prec_micros.get_bytes())
        );
    }

    /// Writes 1_000 pseudo-random dates within one hour of a fixed instant into a date
    /// fast field using `precision`, checks that each value reads back truncated to
    /// that precision, and returns the number of bytes used by the column.
    fn test_gcd_date_with_codec(precision: DateTimePrecision) -> ByteCount {
        const T0: i64 = 1_662_345_825_012_529i64;
        const ONE_HOUR_IN_MICROSECS: i64 = 3_600 * 1_000_000;

        // Fixed seed: the generated timestamps are the same on every run.
        let mut rng = StdRng::seed_from_u64(2u64);
        let times: Vec<DateTime> = (0..1_000)
            .map(|_| {
                // +- One hour.
                let offset = rng.random_range(-ONE_HOUR_IN_MICROSECS..ONE_HOUR_IN_MICROSECS);
                DateTime::from_timestamp_micros(T0 + offset)
            })
            .collect();

        let mut schema_builder = SchemaBuilder::default();
        let date_options = DateOptions::default().set_fast().set_precision(precision);
        let field = schema_builder.add_date_field("field", date_options);
        let schema = schema_builder.build();

        let docs: Vec<TantivyDocument> = times
            .iter()
            .copied()
            .map(|time| doc!(field => time))
            .collect();

        let directory = get_index(&docs, &schema).unwrap();
        let file = directory.open_read(Path::new("test")).unwrap();
        let readers = FastFieldReaders::open(file, schema).unwrap();
        let col = readers.date("field").unwrap();

        for (doc_id, time) in (0u32..).zip(&times) {
            let dt: DateTime = col.first(doc_id).unwrap();
            assert_eq!(dt, time.truncate(precision));
        }
        readers.column_num_bytes("field").unwrap()
    }

    /// Regression test (1757): value-range lookups on a column whose values are all
    /// multiples of 100 must return the right number of rows.
    #[test]
    fn test_gcd_bug_regression_1757() {
        let mut schema_builder = Schema::builder();
        let num_field = schema_builder.add_u64_field("url_norm_hash", FAST | INDEXED);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut writer = index.writer_for_tests().unwrap();
            for value in [100u64, 200u64, 300u64] {
                writer.add_document(doc! { num_field => value }).unwrap();
            }
            writer.commit().unwrap();
        }

        let searcher = index.reader().unwrap().searcher();
        let segment = &searcher.segment_readers()[0];
        let field = segment
            .fast_fields()
            .u64("url_norm_hash")
            .unwrap()
            .first_or_default_col(0);

        let numbers = [100, 200, 300];
        // Compares the number of row ids returned for `range` with a brute-force count.
        let test_range = |range: RangeInclusive<u64>| {
            let expected_count = numbers.iter().filter(|num| range.contains(*num)).count();
            let mut row_ids = vec![];
            field.get_row_ids_for_value_range(range, 0..u32::MAX, &mut row_ids);
            assert_eq!(row_ids.len(), expected_count);
        };
        let ranges = [
            50..=50,
            150..=150,
            350..=350,
            100..=250,
            101..=200,
            101..=199,
            100..=300,
            100..=299,
        ];
        for range in ranges {
            test_range(range);
        }
    }

    /// Stores a single `Ipv6Addr` between two empty documents and reads the column back.
    #[test]
    fn test_ip_addr_columnar_simple() {
        let mut schema_builder = Schema::builder();
        // NOTE(review): the field is declared as a u64 field although the document
        // stores an `Ipv6Addr` in it - confirm this is intentional.
        let ip_field = schema_builder.add_u64_field("ip", FAST);
        let index = Index::create_in_ram(schema_builder.build());

        let ip_addr = Ipv6Addr::new(1, 2, 3, 4, 5, 1, 2, 3);
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        let docs = [
            TantivyDocument::default(),
            doc!(ip_field => ip_addr),
            TantivyDocument::default(),
        ];
        for document in docs {
            index_writer.add_document(document).unwrap();
        }
        index_writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let fastfields = searcher.segment_reader(0u32).fast_fields();
        let column: Column<Ipv6Addr> = fastfields.column_opt("ip").unwrap().unwrap();
        assert_eq!(column.num_docs(), 3);
        // Only the middle document holds a value.
        assert_eq!(column.first(0), None);
        assert_eq!(column.first(1), Some(ip_addr));
        assert_eq!(column.first(2), None);
    }

    /// Value-range lookups on a column with a minimum value but no common divisor
    /// must return the right number of rows for many slightly shifted ranges.
    #[test]
    fn test_mapping_bug_docids_for_value_range() {
        let mut schema_builder = Schema::builder();
        let num_field = schema_builder.add_u64_field("url_norm_hash", FAST | INDEXED);
        let index = Index::create_in_ram(schema_builder.build());
        {
            // Values without gcd, but with min_value
            let mut writer = index.writer_for_tests().unwrap();
            for value in [1000u64, 1001u64, 1003u64] {
                writer.add_document(doc! { num_field => value }).unwrap();
            }
            writer.commit().unwrap();
        }

        let searcher = index.reader().unwrap().searcher();
        let segment = &searcher.segment_readers()[0];
        let field = segment
            .fast_fields()
            .u64("url_norm_hash")
            .unwrap()
            .first_or_default_col(0);

        let numbers = [1000, 1001, 1003];
        // Compares the number of row ids returned for `range` with a brute-force count.
        let test_range = |range: RangeInclusive<u64>| {
            let expected_count = numbers.iter().filter(|num| range.contains(*num)).count();
            let mut row_ids = vec![];
            field.get_row_ids_for_value_range(range, 0..u32::MAX, &mut row_ids);
            assert_eq!(row_ids.len(), expected_count);
        };
        // Tests the 3x3 grid of ranges obtained by shifting each bound by -1, 0 or +1.
        let test_range_variant = |start: u64, stop: u64| {
            for range_start in [start, start - 1, start + 1] {
                for range_stop in [stop, stop - 1, stop + 1] {
                    test_range(range_start..=range_stop);
                }
            }
        };
        test_range_variant(50, 50);
        test_range_variant(1000, 1000);
        test_range_variant(1000, 1002);
    }

    /// Only the JSON field declared as FAST exposes a string column for its sub-path.
    #[test]
    fn test_json_object_fast_field() {
        let mut schema_builder = Schema::builder();
        let without_fast_field = schema_builder.add_json_field("without", STORED);
        let with_fast_field = schema_builder.add_json_field("with", STORED | FAST);
        let index = Index::create_in_ram(schema_builder.build());

        let mut writer = index.writer_for_tests().unwrap();
        // Doc 0 only fills the JSON field that is not a fast field.
        writer
            .add_document(doc!(without_fast_field => json!({"hello": "without"})))
            .unwrap();
        // Docs 1 to 3 fill the fast JSON field.
        for hello in ["with", "with2", "with1"] {
            writer
                .add_document(doc!(with_fast_field => json!({"hello": hello})))
                .unwrap();
        }
        writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let fast_fields = searcher.segment_reader(0u32).fast_fields();
        assert!(fast_fields.str("without.hello").is_err());

        let column_with: StrColumn = fast_fields.str("with.hello").unwrap().unwrap();
        // Doc 0 has no value; the other ordinals follow the sorted order of the terms
        // ("with" < "with1" < "with2").
        assert!(column_with.term_ords(0).next().is_none());
        assert!(column_with.term_ords(1).eq([0]));
        assert!(column_with.term_ords(2).eq([2]));
        assert!(column_with.term_ords(3).eq([1]));
    }

    /// Without `expand_dots`, a JSON key containing a dot is only reachable by
    /// escaping that dot in the column name.
    #[test]
    fn test_fast_field_in_json_field_expand_dots_disabled() {
        let mut schema_builder = Schema::builder();
        let json_option = JsonObjectOptions::default().set_fast(None);
        let json = schema_builder.add_json_field("json", json_option);
        let index = Index::create_in_ram(schema_builder.build());

        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        let document = doc!(json => json!({"attr.age": 32}));
        index_writer.add_document(document).unwrap();
        index_writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let fast_field_reader = searcher.segment_reader(0u32).fast_fields();

        // The unescaped path does not resolve to any column.
        let unescaped_column = fast_field_reader
            .column_opt::<i64>("json.attr.age")
            .unwrap();
        assert!(unescaped_column.is_none());

        // The escaped path resolves to the stored value.
        let escaped_column = fast_field_reader
            .column_opt::<i64>(r"json.attr\.age")
            .unwrap()
            .unwrap();
        let vals: Vec<i64> = escaped_column.values_for_doc(0u32).collect();
        assert_eq!(&vals, &[32])
    }

    /// With the "default" fast field tokenizer, the text value "NEW" stored in a JSON
    /// field is read back as "new".
    #[test]
    fn test_fast_field_in_json_field_with_tokenizer() {
        let mut schema_builder = Schema::builder();
        let json_option = JsonObjectOptions::default().set_fast(Some("default"));
        let json = schema_builder.add_json_field("json", json_option);
        let index = Index::create_in_ram(schema_builder.build());

        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        // The same key holds a number in the first document and a string in the second.
        let numeric_doc = doc!(json => json!({"age": 32}));
        let text_doc = doc!(json => json!({"age": "NEW"}));
        index_writer.add_document(numeric_doc).unwrap();
        index_writer.add_document(text_doc).unwrap();
        index_writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let fast_fields = searcher.segment_reader(0u32).fast_fields();

        let str_column = fast_fields.str("json.age").unwrap().unwrap();
        let mut first_term = String::new();
        str_column.ord_to_str(0, &mut first_term).unwrap();
        assert_eq!(first_term, "new");
    }

    /// With `expand_dots` enabled, a JSON key containing a dot is reachable both with
    /// and without escaping the dot in the column name.
    #[test]
    fn test_fast_field_in_json_field_expand_dots_enabled() {
        let mut schema_builder = Schema::builder();
        let json_option = JsonObjectOptions::default()
            .set_fast(None)
            .set_expand_dots_enabled();
        let json = schema_builder.add_json_field("json", json_option);
        let index = Index::create_in_ram(schema_builder.build());

        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        let document = doc!(json => json!({"attr.age": 32}));
        index_writer.add_document(document).unwrap();
        index_writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let fast_field_reader = searcher.segment_reader(0u32).fast_fields();
        for column_name in ["json.attr.age", "json.attr\\.age"] {
            let column = fast_field_reader
                .column_opt::<i64>(column_name)
                .unwrap()
                .unwrap();
            let vals: Vec<i64> = column.values_for_doc(0u32).collect();
            assert_eq!(&vals, &[32]);
        }
    }

    /// A schema field whose name contains dots can be looked up by that exact name.
    #[test]
    fn test_fast_field_dot_in_schema_field_name() {
        let mut schema_builder = Schema::builder();
        let field_with_dot = schema_builder.add_i64_field("field.with.dot", FAST);
        let index = Index::create_in_ram(schema_builder.build());

        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        let document = doc!(field_with_dot => 32i64);
        index_writer.add_document(document).unwrap();
        index_writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let fast_field_reader = searcher.segment_reader(0u32).fast_fields();
        let column = fast_field_reader
            .column_opt::<i64>("field.with.dot")
            .unwrap()
            .unwrap();
        let vals: Vec<i64> = column.values_for_doc(0u32).collect();
        assert_eq!(&vals, &[32]);
    }

    /// When `jsonfield.attr` is itself a schema field, the path `jsonfield.attr.age`
    /// resolves to that field rather than to the `attr` object inside `jsonfield`.
    #[test]
    fn test_shadowing_fast_field() {
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("jsonfield", FAST);
        let shadowing_json_field = schema_builder.add_json_field("jsonfield.attr", FAST);
        let index = Index::create_in_ram(schema_builder.build());

        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        // Both fields provide a candidate value for the same user-facing path.
        let document = doc!(
            json_field => json!({"attr": {"age": 32}}),
            shadowing_json_field => json!({"age": 33})
        );
        index_writer.add_document(document).unwrap();
        index_writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let fast_field_reader = searcher.segment_reader(0u32).fast_fields();
        let column = fast_field_reader
            .column_opt::<i64>("jsonfield.attr.age")
            .unwrap()
            .unwrap();
        let vals: Vec<i64> = column.values_for_doc(0u32).collect();
        // The value of the shadowing field wins.
        assert_eq!(&vals, &[33]);
    }

    /// A custom fast field tokenizer registered on the index is applied to the values
    /// of a text fast field.
    #[test]
    fn test_fast_field_tokenizer() {
        let mut schema_builder = Schema::builder();
        let text_options = TextOptions::default().set_fast(Some("custom_lowercase"));
        let text_field = schema_builder.add_text_field("text", text_options);
        let schema = schema_builder.build();

        // Raw tokenizer followed by a lowercasing filter.
        let custom_lowercase = TextAnalyzer::builder(RawTokenizer::default())
            .filter(LowerCaser)
            .build();
        let ff_tokenizer_manager = TokenizerManager::default();
        ff_tokenizer_manager.register("custom_lowercase", custom_lowercase);

        let mut index = Index::create_in_ram(schema);
        index.set_fast_field_tokenizers(ff_tokenizer_manager);

        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        let document = doc!(text_field => "Test1 test2");
        index_writer.add_document(document).unwrap();
        index_writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let fast_field_reader = searcher.segment_reader(0u32).fast_fields();
        let column = fast_field_reader.str("text").unwrap().unwrap();
        let mut first_term = String::new();
        column.ord_to_str(0u64, &mut first_term).unwrap();
        // The value is kept whole and lowercased.
        assert_eq!(&first_term, "test1 test2");
    }

    /// A text field indexed with the "raw" tokenizer but using the "default" fast
    /// field tokenizer stores "info" and "INFO" under a single fast field term.
    #[test]
    fn test_text_fast_field_tokenizer() {
        let mut schema_builder = Schema::builder();

        let indexing_options = crate::schema::TextFieldIndexing::default()
            .set_index_option(crate::schema::IndexRecordOption::WithFreqs)
            .set_tokenizer("raw");
        let text_fieldtype = crate::schema::TextOptions::default()
            .set_indexing_options(indexing_options)
            .set_fast(Some("default"))
            .set_stored();

        let log_field = schema_builder.add_text_field("log_level", text_fieldtype);
        let index = Index::create_in_ram(schema_builder.build());

        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        for log_level in ["info", "INFO"] {
            index_writer
                .add_document(doc!(log_field => log_level))
                .unwrap();
        }
        index_writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let fast_field_reader = searcher.segment_reader(0u32).fast_fields();
        let text_fast_field = fast_field_reader.str("log_level").unwrap().unwrap();

        // Ordinal 0 is "info" and there is no ordinal 1.
        let mut buffer = String::new();
        assert!(text_fast_field.ord_to_str(0, &mut buffer).unwrap());
        assert_eq!(buffer, "info");
        assert!(!text_fast_field.ord_to_str(1, &mut buffer).unwrap());

        // Both documents point to that single term, through either accessor.
        for doc_id in [0u32, 1u32] {
            assert!(text_fast_field.term_ords(doc_id).eq([0]));
        }
        for doc_id in [0u32, 1u32] {
            assert!(text_fast_field.ords().values_for_doc(doc_id).eq([0]));
        }
    }

    /// Same shadowing scenario as with nested objects, but with `expand_dots` enabled
    /// and a dotted key inside `jsonfield`.
    #[test]
    fn test_shadowing_fast_field_with_expand_dots() {
        let mut schema_builder = Schema::builder();
        let json_option = JsonObjectOptions::default()
            .set_fast(None)
            .set_expand_dots_enabled();
        let json_field = schema_builder.add_json_field("jsonfield", json_option.clone());
        let shadowing_json_field = schema_builder.add_json_field("jsonfield.attr", json_option);
        let index = Index::create_in_ram(schema_builder.build());

        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        let document = doc!(
            json_field => json!({"attr.age": 32}),
            shadowing_json_field => json!({"age": 33})
        );
        index_writer.add_document(document).unwrap();
        index_writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let fast_field_reader = searcher.segment_reader(0u32).fast_fields();
        // Supported for now, maybe dropped in the future.
        // Both spellings resolve to the value of the shadowing field.
        for column_name in ["jsonfield.attr.age", "jsonfield\\.attr.age"] {
            let column = fast_field_reader
                .column_opt::<i64>(column_name)
                .unwrap()
                .unwrap();
            let vals: Vec<i64> = column.values_for_doc(0u32).collect();
            assert_eq!(&vals, &[33]);
        }
    }
}


================================================
FILE: src/fastfield/readers.rs
================================================
use std::io;
use std::net::Ipv6Addr;
use std::sync::Arc;

use columnar::{
    BytesColumn, Column, ColumnType, ColumnValues, ColumnarReader, DynamicColumn,
    DynamicColumnHandle, HasAssociatedColumnType, StrColumn,
};
use common::ByteCount;

use crate::core::json_utils::{encode_column_name, json_path_sep_to_dot};
use crate::directory::FileSlice;
use crate::schema::{Field, FieldEntry, FieldType, Schema};
use crate::space_usage::{FieldUsage, PerFieldSpaceUsage};
use crate::TantivyError;

/// Provides access to the fast field columns stored in a fast field file.
///
/// Internally, `FastFieldReaders` wraps a shared `ColumnarReader` opened over that
/// file, together with the `Schema` used to resolve field names.
#[derive(Clone)]
pub struct FastFieldReaders {
    // Columnar reader over the fast field file; held in an `Arc` so that clones of
    // `FastFieldReaders` share the same reader.
    columnar: Arc<ColumnarReader>,
    // Schema supplied when the readers were opened; used for field lookups.
    schema: Schema,
}

impl FastFieldReaders {
    /// Opens the columnar data stored in `fast_field_file` and pairs it with `schema`.
    ///
    /// # Errors
    /// Forwards the `io::Error` reported by `ColumnarReader::open`.
    pub(crate) fn open(fast_field_file: FileSlice, schema: Schema) -> io::Result<FastFieldReaders> {
        let columnar_reader = ColumnarReader::open(fast_field_file)?;
        Ok(FastFieldReaders {
            columnar: Arc::new(columnar_reader),
            schema,
        })
    }

    /// Resolves a user-supplied field name into a column name.
    ///
    /// When the `quickwit` feature is enabled, the schema field named `_dynamic` (if it
    /// exists) is used as the default field. Otherwise no default field is used.
    fn resolve_field(&self, column_name: &str) -> crate::Result<Option<String>> {
        let dynamic_field: Option<Field> = cfg!(feature = "quickwit")
            .then(|| self.schema.get_field("_dynamic").ok())
            .flatten();
        self.resolve_column_name_given_default_field(column_name, dynamic_field)
    }

    /// Computes the space usage of every column in the columnar.
    ///
    /// Column names are rewritten with `json_path_sep_to_dot` before being reported.
    ///
    /// # Errors
    /// Returns the first `io::Error` hit while listing columns or reading a column's usage.
    pub(crate) fn space_usage(&self) -> io::Result<PerFieldSpaceUsage> {
        let usages = self
            .columnar
            .iter_columns()?
            .into_iter()
            .map(|(mut column_name, handle)| -> io::Result<FieldUsage> {
                json_path_sep_to_dot(&mut column_name);
                let column_usage = handle.space_usage()?;
                let mut usage = FieldUsage::empty(column_name);
                usage.set_column_usage(column_usage);
                Ok(usage)
            })
            .collect::<io::Result<Vec<FieldUsage>>>()?;
        Ok(PerFieldSpaceUsage::new(usages))
    }

    /// Returns a reference to the underlying `ColumnarReader`.
    pub(crate) fn columnar(&self) -> &ColumnarReader {
        &self.columnar
    }

    /// Transforms a user-supplied fast field name into a column name.
    ///
    /// A user-supplied fast field name is not necessarily a schema field name, because a
    /// JSON fast field can be addressed by path.
    ///
    /// For instance, if the documents look like `{.., "attributes": {"color": "red"}}` and
    /// `attributes` is a json fast field, a user could want to run a term aggregation over
    /// colors, by referring to the field as `attributes.color`.
    ///
    /// This function transforms `attributes.color` into a column key to be used in the
    /// `columnar`.
    ///
    /// The logic works as follows. First we identify which field is targeted by calling
    /// `schema.find_field_with_default(..)`, which yields the matching schema field and the
    /// remaining path. In our example it would return `(attributes_field, "color")`.
    ///
    /// If no field is found, but a default (dynamic) field is supplied, the lookup is
    /// delegated to that default field. (This feature is used in Quickwit.)
    ///
    /// We then encode the `(field, path)` pair into the right columnar key:
    /// - an empty path maps to the field name itself,
    /// - a non-empty path on a JSON field is encoded with `encode_column_name`,
    /// - a non-empty path on any other field type resolves to `None`.
    ///
    /// # Errors
    /// Returns `TantivyError::InvalidArgument` if the targeted field is not a fast field.
    fn resolve_column_name_given_default_field<'a>(
        &'a self,
        field_name: &'a str,
        default_field_opt: Option<Field>,
    ) -> crate::Result<Option<String>> {
        let resolved: Option<(Field, &str)> = self
            .schema
            .find_field_with_default(field_name, default_field_opt);
        let (field, path) = match resolved {
            Some(field_and_path) => field_and_path,
            None => return Ok(None),
        };
        let field_entry: &FieldEntry = self.schema.get_field_entry(field);
        if !field_entry.is_fast() {
            return Err(TantivyError::InvalidArgument(format!(
                "Field {field_name:?} is not configured as fast field"
            )));
        }
        // Without a sub-path, the column is simply named after the schema field.
        if path.is_empty() {
            return Ok(Some(field_entry.name().to_string()));
        }
        // Only JSON fields can be addressed with a sub-path.
        let column_name = match field_entry.field_type() {
            FieldType::JsonObject(json_options) => Some(encode_column_name(
                field_entry.name(),
                path,
                json_options.is_expand_dots_enabled(),
            )),
            _ => None,
        };
        Ok(column_name)
    }

    /// Returns the typed column associated with a given field name.
    ///
    /// Returns `Ok(None)` if the field name cannot be resolved, or if none of the columns
    /// stored under that name has the column type associated with `T`.
    pub fn column_opt<T>(&self, field_name: &str) -> crate::Result<Option<Column<T>>>
    where
        T: HasAssociatedColumnType,
        DynamicColumn: Into<Option<Column<T>>>,
    {
        match self.dynamic_column_handle(field_name, T::column_type())? {
            Some(handle) => {
                let dynamic_column = handle.open()?;
                Ok(dynamic_column.into())
            }
            None => Ok(None),
        }
    }

    /// Returns the total number of bytes used by the columns stored under `field`.
    ///
    /// Returns 0 if the field name cannot be resolved to a column name.
    pub fn column_num_bytes(&self, field: &str) -> crate::Result<ByteCount> {
        let column_name = match self.resolve_field(field)? {
            Some(name) => name,
            None => return Ok(0u64.into()),
        };
        let handles = self.columnar.read_columns(&column_name)?;
        let total: ByteCount = handles
            .into_iter()
            .map(|handle| handle.num_bytes())
            .sum();
        Ok(total)
    }

    /// Returns a typed column value object with exactly one value per row.
    ///
    /// In that column value:
    /// - Rows with no value are associated with `T::default_value()`.
    /// - Rows with several values are associated with the first value.
    ///
    /// # Errors
    /// Returns an error if no column of type `T` can be found for `field`.
    pub fn column_first_or_default<T>(&self, field: &str) -> crate::Result<Arc<dyn ColumnValues<T>>>
    where
        T: PartialOrd + Copy + HasAssociatedColumnType + Send + Sync + 'static,
        DynamicColumn: Into<Option<Column<T>>>,
    {
        self.column::<T>(field)
            .map(|column| column.first_or_default_col(T::default_value()))
    }

    /// Returns the typed column associated with a given field name.
    ///
    /// # Errors
    /// Returns a `SchemaError` if `column_opt` finds no column of type `T` for that field.
    fn column<T>(&self, field: &str) -> crate::Result<Column<T>>
    where
        T: PartialOrd + Copy + HasAssociatedColumnType + Send + Sync + 'static,
        DynamicColumn: Into<Option<Column<T>>>,
    {
        match self.column_opt::<T>(field)? {
            Some(column) => Ok(column),
            None => Err(crate::TantivyError::SchemaError(format!(
                "Field `{field}` is missing or is not configured as a fast field."
            ))),
        }
    }

    /// Returns the `u64` fast field column associated with `field`.
    ///
    /// # Errors
    /// Returns an error if no `u64` fast field column can be found for `field`.
    pub fn u64(&self, field: &str) -> crate::Result<Column<u64>> {
        self.column::<u64>(field)
    }

    /// Returns the `date` fast field column associated with `field`.
    ///
    /// # Errors
    /// Returns an error if no date fast field column can be found for `field`.
    pub fn date(&self, field: &str) -> crate::Result<Column<common::DateTime>> {
        self.column::<common::DateTime>(field)
    }

    /// Returns the `ip` fast field column associated with `field`.
    ///
    /// # Errors
    /// Returns an error if no `Ipv6Addr` fast field column can be found for `field`.
    pub fn ip_addr(&self, field: &str) -> crate::Result<Column<Ipv6Addr>> {
        self.column::<Ipv6Addr>(field)
    }

    /// Returns the `str` column stored under `field_name`.
    ///
    /// Returns `Ok(None)` if no column of type `ColumnType::Str` can be found.
    pub fn str(&self, field_name: &str) -> crate::Result<Option<StrColumn>> {
        match self.dynamic_column_handle(field_name, ColumnType::Str)? {
            Some(handle) => {
                let dynamic_column = handle.open()?;
                Ok(dynamic_column.into())
            }
            None => Ok(None),
        }
    }

    /// Returns the `bytes` column stored under `field_name`.
    ///
    /// Returns `Ok(None)` if no column of type `ColumnType::Bytes` can be found.
    pub fn bytes(&self, field_name: &str) -> crate::Result<Option<BytesColumn>> {
        match self.dynamic_column_handle(field_name, ColumnType::Bytes)? {
            Some(handle) => {
                let dynamic_column = handle.open()?;
                Ok(dynamic_column.into())
            }
            None => Ok(None),
        }
    }

    /// Returns the first column handle stored under `field_name` whose type is `column_type`.
    ///
    /// Returns `Ok(None)` if the field name cannot be resolved or if no column has the
    /// requested type.
    pub fn dynamic_column_handle(
        &self,
        field_name: &str,
        column_type: ColumnType,
    ) -> crate::Result<Option<DynamicColumnHandle>> {
        let column_name = match self.resolve_field(field_name)? {
            Some(name) => name,
            None => return Ok(None),
        };
        for handle in self.columnar.read_columns(&column_name)? {
            if handle.column_type() == column_type {
                return Ok(Some(handle));
            }
        }
        Ok(None)
    }

    /// Returns every column handle stored under the given field name.
    ///
    /// Returns an empty `Vec` if the field name cannot be resolved.
    pub fn dynamic_column_handles(
        &self,
        field_name: &str,
    ) -> crate::Result<Vec<DynamicColumnHandle>> {
        match self.resolve_field(field_name)? {
            None => Ok(Vec::new()),
            Some(column_name) => {
                let handles: Vec<DynamicColumnHandle> = self
                    .columnar
                    .read_columns(&column_name)?
                    .into_iter()
                    .collect();
                Ok(handles)
            }
        }
    }

    /// Returns every column handle that is an inner field of the provided JSON path.
    ///
    /// Returns an empty `Vec` if `root_path` cannot be resolved.
    pub fn dynamic_subpath_column_handles(
        &self,
        root_path: &str,
    ) -> crate::Result<Vec<DynamicColumnHandle>> {
        match self.resolve_field(root_path)? {
            None => Ok(Vec::new()),
            Some(column_name) => {
                let handles: Vec<DynamicColumnHandle> = self
                    .columnar
                    .read_subpath_columns(&column_name)?
                    .into_iter()
                    .collect();
                Ok(handles)
            }
        }
    }

    /// Async variant of listing the column handles stored under `field_name`.
    ///
    /// Returns an empty `Vec` if the field name cannot be resolved.
    #[doc(hidden)]
    pub async fn list_dynamic_column_handles(
        &self,
        field_name: &str,
    ) -> crate::Result<Vec<DynamicColumnHandle>> {
        match self.resolve_field(field_name)? {
            Some(column_name) => {
                let handles = self.columnar.read_columns_async(&column_name).await?;
                Ok(handles)
            }
            None => Ok(Vec::new()),
        }
    }

    /// Async variant of listing the column handles that are inner fields of `root_path`.
    ///
    /// Returns an empty `Vec` if `root_path` cannot be resolved.
    #[doc(hidden)]
    pub async fn list_subpath_dynamic_column_handles(
        &self,
        root_path: &str,
    ) -> crate::Result<Vec<DynamicColumnHandle>> {
        match self.resolve_field(root_path)? {
            Some(column_name) => {
                let handles = self
                    .columnar
                    .read_subpath_columns_async(&column_name)
                    .await?;
                Ok(handles)
            }
            None => Ok(Vec::new()),
        }
    }

    /// Returns the `u64` column used to represent any `u64`-mapped typed (String/Bytes term ids,
    /// i64, u64, f64, DateTime).
    ///
    /// Returns Ok(None) for empty columns
    #[doc(hidden)]
    pub fn u64_lenient_for_type(
        &self,
        type_white_list_opt: Option<&[ColumnType]>,
        field_name: &str,
    ) -> crate::Result<Option<(Column<u64>, ColumnType)>> {
        let Some(resolved_field_name) = self.resolve_field(field_name)? else {
            return Ok(None);
        };
        for col in self.columnar.read_columns(&resolved_field_name)? {
            if let Some(type_white_list) = type_white_list_opt {
                if !type_white_list.contains(&col.column_type()) {
                    continue;
                }
            }
            if let Some(col_u64) = col.open_u64_lenient()? {
                return Ok(Some((col_u64, col.column_type())));
            }
        }
        Ok(None)
    }

    /// Returns the all `u64` column used to represent any `u64`-mapped typed (String/Bytes term
    /// ids, i64, u64, f64, bool, DateTime).
    ///
    /// In case of JSON, there may be two columns. One for term and one for numerical types. (This
    /// may change later to 3 types if JSON handles DateTime)
    #[doc(hidden)]
    pub fn u64_lenient_for_type_all(
        &self,
        type_white_list_opt: Option<&[ColumnType]>,
        field_name: &str,
    ) -> crate::Result<Vec<(Column<u64>, ColumnType)>> {
        let mut columns_and_types = Vec::new();
        let Some(resolved_field_name) = self.resolve_field(field_name)? else {
            return Ok(columns_and_types);
        };
        for col in self.columnar.read_columns(&resolved_field_name)? {
            if let Some(type_white_list) = type_white_list_opt {
                if !type_white_list.contains(&col.column_type()) {
                    continue;
                }
            }
            if let Some(col_u64) = col.open_u64_lenient()? {
                columns_and_types.push((col_u64, col.column_type()));
            }
        }
        Ok(columns_and_types)
    }

    /// Returns the first column of `field_name` that can be opened as a lenient `u64`
    /// column, without any restriction on the column type.
    ///
    /// Returns `Ok(None)` if the field name cannot be resolved or no column qualifies.
    #[doc(hidden)]
    pub fn u64_lenient(
        &self,
        field_name: &str,
    ) -> crate::Result<Option<(Column<u64>, ColumnType)>> {
        let no_type_filter: Option<&[ColumnType]> = None;
        self.u64_lenient_for_type(no_type_filter, field_name)
    }

    /// Returns the `i64` fast field column associated with `field_name`.
    ///
    /// # Errors
    /// Returns an error if no `i64` fast field column can be found for `field_name`.
    pub fn i64(&self, field_name: &str) -> crate::Result<Column<i64>> {
        self.column::<i64>(field_name)
    }

    /// Returns the `f64` fast field column associated with `field_name`.
    ///
    /// # Errors
    /// Returns an error if no `f64` fast field column can be found for `field_name`.
    pub fn f64(&self, field_name: &str) -> crate::Result<Column<f64>> {
        self.column::<f64>(field_name)
    }

    /// Returns the `bool` fast field column associated with `field_name`.
    ///
    /// # Errors
    /// Returns an error if no `bool` fast field column can be found for `field_name`.
    pub fn bool(&self, field_name: &str) -> crate::Result<Column<bool>> {
        self.column::<bool>(field_name)
    }
}

#[cfg(test)]
mod tests {
    use columnar::ColumnType;

    use crate::schema::{JsonObjectOptions, Schema, FAST};
    use crate::{Index, IndexWriter, TantivyDocument};

    /// Checks how field names are resolved into column names, with and without a default
    /// (dynamic) field, for plain fields and for JSON fields with dots expansion on or off.
    #[test]
    fn test_fast_field_reader_resolve_with_dynamic_internal() {
        let mut schema_builder = Schema::builder();
        schema_builder.add_i64_field("age", FAST);
        schema_builder.add_json_field("json_expand_dots_disabled", FAST);
        let expand_dots_options = JsonObjectOptions::default()
            .set_fast(None)
            .set_expand_dots_enabled();
        schema_builder.add_json_field("json_expand_dots_enabled", expand_dots_options);
        let dynamic_field = schema_builder.add_json_field("_dyna", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        index_writer
            .add_document(TantivyDocument::default())
            .unwrap();
        index_writer.commit().unwrap();
        let searcher = index.reader().unwrap().searcher();
        let fast_field_readers = searcher.segment_reader(0u32).fast_fields();

        // (user-supplied field name, default field, expected column name)
        let cases = [
            ("age", None, Some("age")),
            ("age", Some(dynamic_field), Some("age")),
            (
                "json_expand_dots_disabled.attr.color",
                None,
                Some("json_expand_dots_disabled\u{1}attr\u{1}color"),
            ),
            (
                "json_expand_dots_disabled.attr\\.color",
                Some(dynamic_field),
                Some("json_expand_dots_disabled\u{1}attr.color"),
            ),
            (
                "json_expand_dots_enabled.attr\\.color",
                Some(dynamic_field),
                Some("json_expand_dots_enabled\u{1}attr\u{1}color"),
            ),
            ("notinschema.attr.color", None, None),
            (
                "notinschema.attr.color",
                Some(dynamic_field),
                Some("_dyna\u{1}notinschema\u{1}attr\u{1}color"),
            ),
        ];
        for &(field_name, default_field, expected) in &cases {
            let resolved = fast_field_readers
                .resolve_column_name_given_default_field(field_name, default_field)
                .unwrap();
            assert_eq!(resolved.as_deref(), expected);
        }
    }

    /// Checks which column handles are returned for a plain field, a JSON leaf path holding
    /// values of several types, and a JSON root path.
    #[test]
    fn test_fast_field_reader_dynamic_column_handles() {
        let mut schema_builder = Schema::builder();
        let id = schema_builder.add_u64_field("id", FAST);
        let json = schema_builder.add_json_field("json", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        // The same JSON path receives an integer, a boolean and a string.
        index_writer
            .add_document(doc!(id=> 1u64, json => json!({"foo": 42})))
            .unwrap();
        index_writer
            .add_document(doc!(id=> 2u64, json => json!({"foo": true})))
            .unwrap();
        index_writer
            .add_document(doc!(id=> 3u64, json => json!({"foo": "bar"})))
            .unwrap();
        index_writer.commit().unwrap();
        let searcher = index.reader().unwrap().searcher();
        let fast_fields = searcher.segment_reader(0u32).fast_fields();

        let id_columns = fast_fields.dynamic_column_handles("id").unwrap();
        assert_eq!(id_columns.len(), 1);
        assert_eq!(id_columns.first().unwrap().column_type(), ColumnType::U64);

        let foo_columns = fast_fields.dynamic_column_handles("json.foo").unwrap();
        assert_eq!(foo_columns.len(), 3);
        let foo_has_type = |expected: ColumnType| {
            foo_columns
                .iter()
                .any(|column| column.column_type() == expected)
        };
        assert!(foo_has_type(ColumnType::I64));
        assert!(foo_has_type(ColumnType::Bool));
        assert!(foo_has_type(ColumnType::Str));

        // The JSON root itself holds no column, only its sub-paths do.
        let json_columns = fast_fields.dynamic_column_handles("json").unwrap();
        assert_eq!(json_columns.len(), 0);

        let json_subcolumns = fast_fields.dynamic_subpath_column_handles("json").unwrap();
        assert_eq!(json_subcolumns.len(), 3);

        let foo_subcolumns = fast_fields
            .dynamic_subpath_column_handles("json.foo")
            .unwrap();
        assert_eq!(foo_subcolumns.len(), 0);
    }
}


================================================
FILE: src/fastfield/writer.rs
================================================
use std::io;

use columnar::{ColumnarWriter, NumericalValue};
use common::{DateTimePrecision, JsonPathWriter};
use tokenizer_api::Token;

use crate::schema::document::{Document, ReferenceValue, ReferenceValueLeaf, Value};
use crate::schema::{value_type_to_column_type, Field, FieldType, Schema, Type};
use crate::tokenizer::{TextAnalyzer, TokenizerManager};
use crate::{DocId, TantivyError};

/// Only index JSON down to a depth of 20.
/// This is mostly to guard us from a stack overflow triggered by malicious input.
///
/// It is passed as the initial remaining depth when a JSON object value is recorded.
const JSON_DEPTH_LIMIT: usize = 20;

/// The `FastFieldsWriter` groups all of the fast field writers.
///
/// The per-field vectors below are indexed by field id and hold one entry per schema field.
pub struct FastFieldsWriter {
    // Columnar writer that receives every recorded value.
    columnar_writer: ColumnarWriter,
    // Name of each fast field; `None` for fields that are not fast fields.
    fast_field_names: Vec<Option<String>>, //< TODO see if we can hash the field name hash too.
    // Fast field tokenizer of each field; only set for text and JSON fields configuring one.
    per_field_tokenizer: Vec<Option<TextAnalyzer>>,
    // Precision used to truncate date values; left at the default for non-date fields.
    date_precisions: Vec<DateTimePrecision>,
    // Whether dots in JSON keys are expanded; only ever set for JSON fields.
    expand_dots: Vec<bool>,
    // Number of documents added so far; also the doc id given to the next document.
    num_docs: DocId,
    // Buffer that we recycle to avoid allocation.
    json_path_buffer: JsonPathWriter,
}

impl FastFieldsWriter {
    /// Creates the `FastFieldsWriter` required by the schema, using a freshly created
    /// `TokenizerManager`.
    #[cfg(test)]
    pub fn from_schema(schema: &Schema) -> crate::Result<FastFieldsWriter> {
        let tokenizer_manager = TokenizerManager::new();
        Self::from_schema_and_tokenizer_manager(schema, tokenizer_manager)
    }

    /// Creates the `FastFieldsWriter` required by the schema.
    ///
    /// For every fast field of the schema, this records its name, its date precision (date
    /// fields), its fast field tokenizer (text and JSON fields) and whether dots are
    /// expanded (JSON fields). It also declares the column type to the columnar writer
    /// when the value type maps to one.
    ///
    /// # Errors
    /// Returns `TantivyError::InvalidArgument` if a configured fast field tokenizer is not
    /// registered in `tokenizer_manager`.
    pub fn from_schema_and_tokenizer_manager(
        schema: &Schema,
        tokenizer_manager: TokenizerManager,
    ) -> crate::Result<FastFieldsWriter> {
        let num_fields = schema.num_fields();
        let mut columnar_writer = ColumnarWriter::default();
        let mut fast_field_names: Vec<Option<String>> = vec![None; num_fields];
        let mut per_field_tokenizer: Vec<Option<TextAnalyzer>> = vec![None; num_fields];
        let mut date_precisions: Vec<DateTimePrecision> = (0..num_fields)
            .map(|_| DateTimePrecision::default())
            .collect();
        let mut expand_dots = vec![false; num_fields];

        // Shared lookup for the text and JSON cases below.
        let find_tokenizer = |tokenizer_name: &str| -> crate::Result<TextAnalyzer> {
            tokenizer_manager.get(tokenizer_name).ok_or_else(|| {
                TantivyError::InvalidArgument(format!("Tokenizer {tokenizer_name:?} not found"))
            })
        };

        // TODO see other types
        for (field, field_entry) in schema.fields() {
            let field_type = field_entry.field_type();
            if !field_type.is_fast() {
                continue;
            }
            let field_idx = field.field_id() as usize;
            fast_field_names[field_idx] = Some(field_entry.name().to_string());

            match field_type {
                FieldType::Date(date_options) => {
                    date_precisions[field_idx] = date_options.get_precision();
                }
                FieldType::JsonObject(json_object_options) => {
                    if let Some(tokenizer_name) =
                        json_object_options.get_fast_field_tokenizer_name()
                    {
                        per_field_tokenizer[field_idx] = Some(find_tokenizer(tokenizer_name)?);
                    }
                    expand_dots[field_idx] = json_object_options.is_expand_dots_enabled();
                }
                FieldType::Str(text_options) => {
                    if let Some(tokenizer_name) = text_options.get_fast_field_tokenizer_name() {
                        per_field_tokenizer[field_idx] = Some(find_tokenizer(tokenizer_name)?);
                    }
                }
                _ => {}
            }

            let value_type = field_type.value_type();
            // Only facet values are sorted within a row.
            let sort_values_within_row = value_type == Type::Facet;
            if let Some(column_type) = value_type_to_column_type(value_type) {
                columnar_writer.record_column_type(
                    field_entry.name(),
                    column_type,
                    sort_values_within_row,
                );
            }
        }

        Ok(FastFieldsWriter {
            columnar_writer,
            fast_field_names,
            per_field_tokenizer,
            date_precisions,
            expand_dots,
            num_docs: 0u32,
            json_path_buffer: JsonPathWriter::default(),
        })
    }

    /// Returns the memory usage reported by the underlying columnar writer.
    pub fn mem_usage(&self) -> usize {
        let columnar_writer = &self.columnar_writer;
        columnar_writer.mem_usage()
    }

    /// Records all of the fast field values of a new document.
    ///
    /// The document receives the current document count as its doc id. The count is only
    /// incremented once every value has been recorded successfully.
    pub fn add_document<D: Document>(&mut self, doc: &D) -> crate::Result<()> {
        let new_doc_id = self.num_docs;
        for (field, raw_value) in doc.iter_fields_and_values() {
            self.add_doc_value(new_doc_id, field, raw_value as D::Value<'_>)?;
        }
        self.num_docs += 1;
        Ok(())
    }

    /// Records `value` for `field` of document `doc_id` into the columnar writer.
    ///
    /// Values of fields that are not fast fields are ignored. Arrays are recorded element
    /// by element under the same field, and objects are handed over to
    /// `record_json_obj_to_columnar_writer` with the field name as the root of the path.
    fn add_doc_value<'a, V: Value<'a>>(
        &mut self,
        doc_id: DocId,
        field: Field,
        value: V,
    ) -> crate::Result<()> {
        let field_idx = field.field_id() as usize;
        let Some(field_name) = &self.fast_field_names[field_idx] else {
            // Not a fast field: nothing to record.
            return Ok(());
        };

        match value.as_value() {
            ReferenceValue::Leaf(ReferenceValueLeaf::Null) => {}
            ReferenceValue::Leaf(ReferenceValueLeaf::Str(text)) => {
                match self.per_field_tokenizer[field_idx].as_mut() {
                    Some(tokenizer) => {
                        // With a tokenizer, each token is recorded as its own value.
                        let mut token_stream = tokenizer.token_stream(text);
                        token_stream.process(&mut |token: &Token| {
                            self.columnar_writer
                                .record_str(doc_id, field_name, &token.text);
                        });
                    }
                    None => {
                        self.columnar_writer.record_str(doc_id, field_name, text);
                    }
                }
            }
            ReferenceValue::Leaf(ReferenceValueLeaf::U64(number)) => {
                self.columnar_writer.record_numerical(
                    doc_id,
                    field_name,
                    NumericalValue::from(number),
                );
            }
            ReferenceValue::Leaf(ReferenceValueLeaf::I64(number)) => {
                self.columnar_writer.record_numerical(
                    doc_id,
                    field_name,
                    NumericalValue::from(number),
                );
            }
            ReferenceValue::Leaf(ReferenceValueLeaf::F64(number)) => {
                self.columnar_writer.record_numerical(
                    doc_id,
                    field_name,
                    NumericalValue::from(number),
                );
            }
            ReferenceValue::Leaf(ReferenceValueLeaf::Date(datetime)) => {
                // Dates are truncated to the precision configured for the field.
                let precision = self.date_precisions[field_idx];
                self.columnar_writer.record_datetime(
                    doc_id,
                    field_name,
                    datetime.truncate(precision),
                );
            }
            ReferenceValue::Leaf(ReferenceValueLeaf::Facet(facet)) => {
                self.columnar_writer.record_str(doc_id, field_name, facet);
            }
            ReferenceValue::Leaf(ReferenceValueLeaf::Bytes(bytes)) => {
                self.columnar_writer.record_bytes(doc_id, field_name, bytes);
            }
            ReferenceValue::Leaf(ReferenceValueLeaf::IpAddr(ip_addr)) => {
                self.columnar_writer
                    .record_ip_addr(doc_id, field_name, ip_addr);
            }
            ReferenceValue::Leaf(ReferenceValueLeaf::Bool(flag)) => {
                self.columnar_writer.record_bool(doc_id, field_name, flag);
            }
            ReferenceValue::Leaf(ReferenceValueLeaf::PreTokStr(pre_tokenized)) => {
                for token in &pre_tokenized.tokens {
                    self.columnar_writer
                        .record_str(doc_id, field_name, &token.text);
                }
            }
            ReferenceValue::Array(elements) => {
                // TODO: Check this is the correct behaviour we want.
                for element in elements {
                    self.add_doc_value(doc_id, field, element)?;
                }
            }
            ReferenceValue::Object(object_iter) => {
                let expand_dots = self.expand_dots[field_idx];
                self.json_path_buffer.clear();
                // First field should not be expanded.
                self.json_path_buffer.set_expand_dots(false);
                self.json_path_buffer.push(field_name);
                self.json_path_buffer.set_expand_dots(expand_dots);

                let text_analyzer = &mut self.per_field_tokenizer[field_idx];

                record_json_obj_to_columnar_writer::<V>(
                    doc_id,
                    object_iter,
                    JSON_DEPTH_LIMIT,
                    &mut self.json_path_buffer,
                    &mut self.columnar_writer,
                    text_analyzer,
                );
            }
        }

        Ok(())
    }

    /// Serializes all of the `FastFieldWriter`s by pushing them in
    /// order to the fast field serializer.
    pub fn serialize(mut self, wrt: &mut dyn io::Write) -> io::Result<()> {
        let num_docs = self.num_docs;
        self.columnar_writer.serialize(num_docs, wrt)?;
        Ok(())
    }
}

/// Records every entry of a JSON object into the columnar writer.
///
/// For each `(key, value)` pair, the key is pushed onto `json_path_buffer`, the value is
/// recorded under the resulting path, and the key is popped again so that the buffer is
/// left as it was found.
fn record_json_obj_to_columnar_writer<'a, V: Value<'a>>(
    doc: DocId,
    json_visitor: V::ObjectIter,
    remaining_depth_limit: usize,
    json_path_buffer: &mut JsonPathWriter,
    columnar_writer: &mut columnar::ColumnarWriter,
    tokenizer: &mut Option<TextAnalyzer>,
) {
    for (entry_key, entry_value) in json_visitor {
        json_path_buffer.push(entry_key);
        record_json_value_to_columnar_writer(
            doc,
            entry_value,
            remaining_depth_limit,
            json_path_buffer,
            columnar_writer,
            tokenizer,
        );
        json_path_buffer.pop();
    }
}

fn record_json_value_to_columnar_writer<'a, V: Value<'a>>(
    doc: DocId,
    json_val: V,
    mut remaining_depth_limit: usize,
    json_path_writer: &mut JsonPathWriter,
    columnar_writer: &mut columnar::ColumnarWriter,
    tokenizer: &mut Option<TextAnalyzer>,
) {
    if remaining_depth_limit == 0 {
        return;
    }
    remaining_depth_limit -= 1;

    match json_val.as_value() {
        ReferenceValue::Leaf(leaf) => match leaf {
            ReferenceValueLeaf::Null => {} // TODO: Handle null
            ReferenceValueLeaf::Str(val) => {
                if let Some(text_analyzer) = tokenizer.as_mut() {
                    let mut token_stream = text_analyzer.token_stream(val);
                    token_stream.process(&mut |token| {
                        columnar_writer.record_str(doc, json_path_writer.as_str(), &token.text);
                    })
                } else {
                    columnar_writer.record_str(doc, json_path_writer.as_str(), val);
                }
            }
            ReferenceValueLeaf::U64(val) => {
                columnar_writer.record_numerical(
                    doc,
                    json_path_writer.as_str(),
                    NumericalValue::from(val),
                );
            }
            ReferenceValueLeaf::I64(val) => {
                columnar_writer.record_numerical(
                    doc,
                    json_path_writer.as_str(),
                    NumericalValue::from(val),
                );
            }
            ReferenceValueLeaf::F64(val) => {
                columnar_writer.record_numerical(
                    doc,
                    json_path_writer.as_str(),
                    NumericalValue::from(val),
                );
            }
            ReferenceValueLeaf::Bool(val) => {
                columnar_writer.record_bool(doc, json_path_writer.as_str(), val);
            }
            ReferenceValueLeaf::Date(val) => {
                columnar_writer.record_datetime(doc, json_path_writer.as_str(), val);
            }
            ReferenceValueLeaf::Facet(_) => {
                unimplemented!("Facet support in dynamic fields is not yet implemented")
            }
            ReferenceValueLeaf::Bytes(_) => {
                // TODO: This can be re added once it is added to the JSON Utils section as well.
                // columnar_writer.record_bytes(doc, json_path_writer.as_str(), val);
                unimplemented!("Bytes support in dynamic fields is not yet implemented")
            }
            ReferenceValueLeaf::IpAddr(_) => {
                unimplemented!("IP address support in dynamic fields is not yet implemented")
            }
            ReferenceValueLeaf::PreTokStr(_) => {
                unimplemented!(
                    "Pre-tokenized string support in dynamic fields is not yet implemented"
                )
            }
        },
        ReferenceValue::Array(elements) => {
            for el in elements {
                record_json_value_to_columnar_writer(
                    doc,
                    el,
                    remaining_depth_limit,
                    json_path_writer,
                    columnar_writer,
                    tokenizer,
                );
            }
        }
        ReferenceValue::Object(object) => {
            record_json_obj_to_columnar_writer::<V>(
                doc,
                object,
                remaining_depth_limit,
                json_path_writer,
                columnar_writer,
                tokenizer,
            );
        }
    }
}

// Tests for recording JSON values into a columnar writer and reading the
// resulting columns back.
#[cfg(test)]
mod tests {
    use columnar::{Column, ColumnarReader, ColumnarWriter, StrColumn};
    use common::JsonPathWriter;

    use super::record_json_value_to_columnar_writer;
    use crate::fastfield::writer::JSON_DEPTH_LIMIT;
    use crate::DocId;

    /// Records each JSON document (doc id = position in `json_docs`) into a fresh
    /// `ColumnarWriter` without any tokenizer, serializes it into an in-memory
    /// buffer and opens a `ColumnarReader` on that buffer.
    fn test_columnar_from_jsons_aux(
        json_docs: &[serde_json::Value],
        expand_dots: bool,
    ) -> ColumnarReader {
        let mut columnar_writer = ColumnarWriter::default();
        let mut json_path = JsonPathWriter::default();
        json_path.set_expand_dots(expand_dots);
        for (doc, json_doc) in json_docs.iter().enumerate() {
            record_json_value_to_columnar_writer(
                doc as u32,
                json_doc,
                JSON_DEPTH_LIMIT,
                &mut json_path,
                &mut columnar_writer,
                &mut None,
            );
        }
        let mut buffer = Vec::new();
        columnar_writer
            .serialize(json_docs.len() as DocId, &mut buffer)
            .unwrap();
        ColumnarReader::open(buffer).unwrap()
    }

    /// Checks the columns produced for a small document mixing a float, a text,
    /// a nested object and an array of strings.
    #[test]
    fn test_json_fastfield_record_simple() {
        let json_doc = serde_json::json!({
            "float": 1.02,
            "text": "hello happy tax payer",
            "nested": {"child": 3, "child2": 5},
            "arr": ["hello", "happy", "tax", "payer"]
        });
        let columnar_reader = test_columnar_from_jsons_aux(&[json_doc], false);
        let columns = columnar_reader.list_columns().unwrap();
        {
            // The array elements all land in the single "arr" column.
            assert_eq!(columns[0].0, "arr");
            let column_arr_opt: Option<StrColumn> = columns[0].1.open().unwrap().into();
            assert!(column_arr_opt
                .unwrap()
                .term_ords(0)
                .eq([1, 0, 3, 2].into_iter()));
        }
        {
            assert_eq!(columns[1].0, "float");
            let column_float_opt: Option<Column<f64>> = columns[1].1.open().unwrap().into();
            assert!(column_float_opt
                .unwrap()
                .values_for_doc(0)
                .eq([1.02f64].into_iter()));
        }
        {
            // Nested keys are joined with the `\u{1}` separator.
            assert_eq!(columns[2].0, "nested\u{1}child");
            let column_nest_child_opt: Option<Column<i64>> = columns[2].1.open().unwrap().into();
            assert!(column_nest_child_opt
                .unwrap()
                .values_for_doc(0)
                .eq([3].into_iter()));
        }
        {
            assert_eq!(columns[3].0, "nested\u{1}child2");
            let column_nest_child2_opt: Option<Column<i64>> = columns[3].1.open().unwrap().into();
            assert!(column_nest_child2_opt
                .unwrap()
                .values_for_doc(0)
                .eq([5].into_iter()));
        }
        {
            // No tokenizer is used here: the whole text is a single term.
            assert_eq!(columns[4].0, "text");
            let column_text_opt: Option<StrColumn> = columns[4].1.open().unwrap().into();
            assert!(column_text_opt.unwrap().term_ords(0).eq([0].into_iter()));
        }
    }

    /// With deeply nested objects, only the value within the depth limit
    /// ("depth_accepted") yields a column; the one nested one level deeper does not.
    #[test]
    fn test_json_fastfield_deep_obj() {
        let json_doc = serde_json::json!(
            {"a": {"a": {"a": {"a": {"a":
            {"a": {"a": {"a": {"a": {"a":
            {"a": {"a": {"a": {"a": {"a":
            {"a": {"a": {"a": {"depth_accepted": 19, "a": {  "depth_truncated": 20}
        }}}}}}}}}}}}}}}}}}});
        let columnar_reader = test_columnar_from_jsons_aux(&[json_doc], false);
        let columns = columnar_reader.list_columns().unwrap();
        assert_eq!(columns.len(), 1);
        assert!(columns[0].0.ends_with("a\u{1}a\u{1}a\u{1}depth_accepted"));
    }

    /// With deeply nested arrays, only the values within the depth limit (18 and 19)
    /// are recorded; the value nested one level deeper (20) is dropped.
    #[test]
    fn test_json_fastfield_deep_arr() {
        let json_doc = json!(
        {"obj":
        [[[[[,
        [[[[[,
        [[[[[,
        [[18, [19, //< within limits
        [20]]]]]]]]]]]]]]]]]]]});
        let columnar_reader = test_columnar_from_jsons_aux(&[json_doc], false);
        let columns = columnar_reader.list_columns().unwrap();
        assert_eq!(columns.len(), 1);
        assert_eq!(columns[0].0, "obj");
        let dynamic_column = columns[0].1.open().unwrap();
        let col: Option<Column<i64>> = dynamic_column.into();
        let vals: Vec<i64> = col.unwrap().values_for_doc(0).collect();
        assert_eq!(&vals, &[18, 19])
    }

    /// With `expand_dots` disabled, dots inside keys are kept verbatim in the column name.
    #[test]
    fn test_json_fast_field_do_not_expand_dots() {
        let json_doc = json!({"field.with.dots": {"child.with.dot": "hello"}});
        let columnar_reader = test_columnar_from_jsons_aux(&[json_doc], false);
        let columns = columnar_reader.list_columns().unwrap();
        assert_eq!(columns.len(), 1);
        assert_eq!(columns[0].0, "field.with.dots\u{1}child.with.dot");
    }

    /// With `expand_dots` enabled, every dot inside a key becomes a path separator.
    #[test]
    fn test_json_fast_field_expand_dots() {
        let json_doc = json!({"field.with.dots": {"child.with.dot": "hello"}});
        let columnar_reader = test_columnar_from_jsons_aux(&[json_doc], true);
        let columns = columnar_reader.list_columns().unwrap();
        assert_eq!(columns.len(), 1);
        assert_eq!(
            columns[0].0,
            "field\u{1}with\u{1}dots\u{1}child\u{1}with\u{1}dot"
        );
    }
}


================================================
FILE: src/fieldnorm/code.rs
================================================
/// Decodes a `fieldnorm_id` into its fieldnorm through a lookup in
/// `FIELD_NORMS_TABLE`.
#[inline]
pub fn id_to_fieldnorm(id: u8) -> u32 {
    let table_idx = usize::from(id);
    FIELD_NORMS_TABLE[table_idx]
}

/// Encodes a fieldnorm as the largest `fieldnorm_id` whose table value is
/// lower than or equal to `fieldnorm`.
#[inline]
pub fn fieldnorm_to_id(fieldnorm: u32) -> u8 {
    // The table is sorted and starts at 0, so at least one entry is always
    // `<= fieldnorm` and the subtraction cannot underflow.
    let num_entries_le = FIELD_NORMS_TABLE.partition_point(|&entry| entry <= fieldnorm);
    (num_entries_le - 1) as u8
}

/// Lookup table giving, for each `fieldnorm_id` (the index), the fieldnorm it decodes to.
///
/// The values are strictly increasing, which `fieldnorm_to_id` relies on to search the
/// table. Ids `0..=40` decode to themselves; above that the step between two
/// consecutive entries grows progressively.
///
/// The `test_fieldnorm_byte` unit test checks every entry against a reference decoder.
pub const FIELD_NORMS_TABLE: [u32; 256] = [
    0,
    1,
    2,
    3,
    4,
    5,
    6,
    7,
    8,
    9,
    10,
    11,
    12,
    13,
    14,
    15,
    16,
    17,
    18,
    19,
    20,
    21,
    22,
    23,
    24,
    25,
    26,
    27,
    28,
    29,
    30,
    31,
    32,
    33,
    34,
    35,
    36,
    37,
    38,
    39,
    40,
    42,
    44,
    46,
    48,
    50,
    52,
    54,
    56,
    60,
    64,
    68,
    72,
    76,
    80,
    84,
    88,
    96,
    104,
    112,
    120,
    128,
    136,
    144,
    152,
    168,
    184,
    200,
    216,
    232,
    248,
    264,
    280,
    312,
    344,
    376,
    408,
    440,
    472,
    504,
    536,
    600,
    664,
    728,
    792,
    856,
    920,
    984,
    1_048,
    1_176,
    1_304,
    1_432,
    1_560,
    1_688,
    1_816,
    1_944,
    2_072,
    2_328,
    2_584,
    2_840,
    3_096,
    3_352,
    3_608,
    3_864,
    4_120,
    4_632,
    5_144,
    5_656,
    6_168,
    6_680,
    7_192,
    7_704,
    8_216,
    9_240,
    10_264,
    11_288,
    12_312,
    13_336,
    14_360,
    15_384,
    16_408,
    18_456,
    20_504,
    22_552,
    24_600,
    26_648,
    28_696,
    30_744,
    32_792,
    36_888,
    40_984,
    45_080,
    49_176,
    53_272,
    57_368,
    61_464,
    65_560,
    73_752,
    81_944,
    90_136,
    98_328,
    106_520,
    114_712,
    122_904,
    131_096,
    147_480,
    163_864,
    180_248,
    196_632,
    213_016,
    229_400,
    245_784,
    262_168,
    294_936,
    327_704,
    360_472,
    393_240,
    426_008,
    458_776,
    491_544,
    524_312,
    589_848,
    655_384,
    720_920,
    786_456,
    851_992,
    917_528,
    983_064,
    1_048_600,
    1_179_672,
    1_310_744,
    1_441_816,
    1_572_888,
    1_703_960,
    1_835_032,
    1_966_104,
    2_097_176,
    2_359_320,
    2_621_464,
    2_883_608,
    3_145_752,
    3_407_896,
    3_670_040,
    3_932_184,
    4_194_328,
    4_718_616,
    5_242_904,
    5_767_192,
    6_291_480,
    6_815_768,
    7_340_056,
    7_864_344,
    8_388_632,
    9_437_208,
    10_485_784,
    11_534_360,
    12_582_936,
    13_631_512,
    14_680_088,
    15_728_664,
    16_777_240,
    18_874_392,
    20_971_544,
    23_068_696,
    25_165_848,
    27_263_000,
    29_360_152,
    31_457_304,
    33_554_456,
    37_748_760,
    41_943_064,
    46_137_368,
    50_331_672,
    54_525_976,
    58_720_280,
    62_914_584,
    67_108_888,
    75_497_496,
    83_886_104,
    92_274_712,
    100_663_320,
    109_051_928,
    117_440_536,
    125_829_144,
    134_217_752,
    150_994_968,
    167_772_184,
    184_549_400,
    201_326_616,
    218_103_832,
    234_881_048,
    251_658_264,
    268_435_480,
    301_989_912,
    335_544_344,
    369_098_776,
    402_653_208,
    436_207_640,
    469_762_072,
    503_316_504,
    536_870_936,
    603_979_800,
    671_088_664,
    738_197_528,
    805_306_392,
    872_415_256,
    939_524_120,
    1_006_632_984,
    1_073_741_848,
    1_207_959_576,
    1_342_177_304,
    1_476_395_032,
    1_610_612_760,
    1_744_830_488,
    1_879_048_216,
    2_013_265_944,
];

// Tests for the fieldnorm <-> fieldnorm_id conversion functions and table.
#[cfg(test)]
mod tests {

    use super::{fieldnorm_to_id, id_to_fieldnorm, FIELD_NORMS_TABLE};

    /// Checks the encoding on the identity range, and that for larger ids a
    /// fieldnorm falling between two table entries is rounded down.
    #[test]
    fn test_decode_code() {
        assert_eq!(fieldnorm_to_id(0), 0);
        assert_eq!(fieldnorm_to_id(1), 1);
        for i in 0..41 {
            assert_eq!(fieldnorm_to_id(i), i as u8);
        }
        // 41 is not in the table: it is encoded as the id of 40.
        assert_eq!(fieldnorm_to_id(41), 40);
        assert_eq!(fieldnorm_to_id(42), 41);
        for id in 43..256 {
            let field_norm = FIELD_NORMS_TABLE[id];
            assert_eq!(id_to_fieldnorm(id as u8), field_norm);
            assert_eq!(fieldnorm_to_id(field_norm), id as u8);
            assert_eq!(fieldnorm_to_id(field_norm - 1), id as u8 - 1);
            assert_eq!(fieldnorm_to_id(field_norm + 1), id as u8);
        }
    }

    /// The largest possible fieldnorm maps to the largest id.
    #[test]
    fn test_u32_max() {
        assert_eq!(fieldnorm_to_id(u32::MAX), u8::MAX);
    }

    /// Checks every entry of `FIELD_NORMS_TABLE` against a reference decoder.
    #[test]
    fn test_fieldnorm_byte() {
        // const expression are not really a thing
        // yet... Therefore we do things the other way around.

        // The array is defined as a const,
        // and we check in the unit test that the const
        // value is matching the logic.
        const IDENTITY_PART: u8 = 24u8;
        // The low 3 bits of `b` are the mantissa and the remaining high bits the shift.
        fn decode_field_norm_exp_part(b: u8) -> u32 {
            let bits = (b & 0b00000111) as u32;
            let shift = b >> 3;
            if shift == 0 {
                bits
            } else {
                (bits | 8u32) << ((shift - 1u8) as u32)
            }
        }
        // Bytes below `IDENTITY_PART` decode to themselves; the others are decoded
        // by `decode_field_norm_exp_part`, offset by `IDENTITY_PART`.
        fn decode_fieldnorm_byte(b: u8) -> u32 {
            if b < IDENTITY_PART {
                b as u32
            } else {
                (IDENTITY_PART as u32) + decode_field_norm_exp_part(b - IDENTITY_PART)
            }
        }
        for i in 0..256 {
            assert_eq!(FIELD_NORMS_TABLE[i], decode_fieldnorm_byte(i as u8));
        }
    }
}


================================================
FILE: src/fieldnorm/mod.rs
================================================
//! The fieldnorm represents the length associated with
//! a given Field of a given document.
//!
//! This metric is important to compute the score of a
//! document: a document having a query word in one of its short fields
//! (e.g. title) is likely to be more relevant than one having it in one of
//! its longer fields (e.g. body).
//!
//! It encodes `fieldnorm` on one byte with some precision loss,
//! using the exact same scheme as Lucene. Each value is placed on a log-scale
//! that takes values from `0` to `255`.
//!
//! A value on this scale is identified by a `fieldnorm_id`.
//! Apart from compression, this scale also makes it possible to
//! precompute computationally expensive functions of the fieldnorm
//! in a very short array.
//!
//! This trick is used by the Bm25 similarity.
mod code;
mod reader;
mod serializer;
mod writer;

use self::code::{fieldnorm_to_id, id_to_fieldnorm};
pub use self::reader::{FieldNormReader, FieldNormReaders};
pub use self::serializer::FieldNormsSerializer;
pub use self::writer::FieldNormsWriter;

// Tests for writing, serializing and reading fieldnorms, and for their effect on scoring.
#[cfg(test)]
mod tests {
    use std::path::Path;

    use once_cell::sync::Lazy;

    use crate::directory::{CompositeFile, Directory, RamDirectory, WritePtr};
    use crate::fieldnorm::{FieldNormReader, FieldNormsSerializer, FieldNormsWriter};
    use crate::query::{EnableScoring, Query, TermQuery};
    use crate::schema::{
        Field, IndexRecordOption, Schema, TextFieldIndexing, TextOptions, STORED, TEXT,
    };
    use crate::{Index, Term, TERMINATED};

    /// Shared schema with three text fields:
    /// - `field`: `STORED` only,
    /// - `txt_field`: `TEXT`,
    /// - `str_field`: indexed with fieldnorms explicitly disabled.
    pub static SCHEMA: Lazy<Schema> = Lazy::new(|| {
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("field", STORED);
        schema_builder.add_text_field("txt_field", TEXT);
        schema_builder.add_text_field(
            "str_field",
            TextOptions::default().set_indexing_options(
                TextFieldIndexing::default()
                    .set_index_option(IndexRecordOption::Basic)
                    .set_fieldnorms(false),
            ),
        );
        schema_builder.build()
    });

    // Handles to the fields of `SCHEMA`.
    pub static FIELD: Lazy<Field> = Lazy::new(|| SCHEMA.get_field("field").unwrap());
    pub static TXT_FIELD: Lazy<Field> = Lazy::new(|| SCHEMA.get_field("txt_field").unwrap());
    pub static STR_FIELD: Lazy<Field> = Lazy::new(|| SCHEMA.get_field("str_field").unwrap());

    /// Recording a fieldnorm twice for the same `(doc, field)` pair must panic.
    #[test]
    #[should_panic(expected = "Cannot register a given fieldnorm twice")]
    pub fn test_should_panic_when_recording_fieldnorm_twice_for_same_doc() {
        let mut fieldnorm_writers = FieldNormsWriter::for_schema(&SCHEMA);
        fieldnorm_writers.record(0u32, *TXT_FIELD, 5);
        fieldnorm_writers.record(0u32, *TXT_FIELD, 3);
    }

    /// Round-trips fieldnorms through the writer, the serializer and the reader.
    #[test]
    pub fn test_fieldnorm() -> crate::Result<()> {
        let path = Path::new("test");
        let directory: RamDirectory = RamDirectory::create();
        {
            let write: WritePtr = directory.open_write(Path::new("test"))?;
            let serializer = FieldNormsSerializer::from_write(write)?;
            let mut fieldnorm_writers = FieldNormsWriter::for_schema(&SCHEMA);
            // Docs 0 and 1 are never recorded.
            fieldnorm_writers.record(2u32, *TXT_FIELD, 5);
            fieldnorm_writers.record(3u32, *TXT_FIELD, 3);
            fieldnorm_writers.serialize(serializer)?;
        }
        let file = directory.open_read(path)?;
        {
            let fields_composite = CompositeFile::open(&file)?;
            // Only `txt_field` has fieldnorm data.
            assert!(fields_composite.open_read(*FIELD).is_none());
            assert!(fields_composite.open_read(*STR_FIELD).is_none());
            let data = fields_composite.open_read(*TXT_FIELD).unwrap();
            let fieldnorm_reader = FieldNormReader::open(data)?;
            // The skipped docs read back with a fieldnorm of 0.
            assert_eq!(fieldnorm_reader.fieldnorm(0u32), 0u32);
            assert_eq!(fieldnorm_reader.fieldnorm(1u32), 0u32);
            assert_eq!(fieldnorm_reader.fieldnorm(2u32), 5u32);
            assert_eq!(fieldnorm_reader.fieldnorm(3u32), 3u32);
        }
        Ok(())
    }

    /// With fieldnorms disabled, the one-token and the three-token documents
    /// are expected to get the same score.
    #[test]
    fn test_fieldnorm_disabled() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_options = TextOptions::default()
            .set_indexing_options(TextFieldIndexing::default().set_fieldnorms(false));
        let text = schema_builder.add_text_field("text", text_options);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests()?;
        writer.add_document(doc!(text=>"hello"))?;
        writer.add_document(doc!(text=>"hello hello hello"))?;
        writer.commit()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();
        let query = TermQuery::new(
            Term::from_field_text(text, "hello"),
            IndexRecordOption::WithFreqs,
        );
        let weight = query.weight(EnableScoring::enabled_from_searcher(&searcher))?;
        let mut scorer = weight.scorer(searcher.segment_reader(0), 1.0f32)?;
        assert_eq!(scorer.doc(), 0);
        assert!((scorer.score() - 0.22920431).abs() < 0.001f32);
        assert_eq!(scorer.advance(), 1);
        assert_eq!(scorer.doc(), 1);
        assert!((scorer.score() - 0.22920431).abs() < 0.001f32);
        assert_eq!(scorer.advance(), TERMINATED);
        Ok(())
    }

    /// With fieldnorms enabled, the three-token document is expected to score
    /// lower than the one-token document.
    #[test]
    fn test_fieldnorm_enabled() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_options = TextOptions::default()
            .set_indexing_options(TextFieldIndexing::default().set_fieldnorms(true));
        let text = schema_builder.add_text_field("text", text_options);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests()?;
        writer.add_document(doc!(text=>"hello"))?;
        writer.add_document(doc!(text=>"hello hello hello"))?;
        writer.commit()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();
        let query = TermQuery::new(
            Term::from_field_text(text, "hello"),
            IndexRecordOption::WithFreqs,
        );
        let weight = query.weight(EnableScoring::enabled_from_searcher(&searcher))?;
        let mut scorer = weight.scorer(searcher.segment_reader(0), 1.0f32)?;
        assert_eq!(scorer.doc(), 0);
        assert!((scorer.score() - 0.22920431).abs() < 0.001f32);
        assert_eq!(scorer.advance(), 1);
        assert_eq!(scorer.doc(), 1);
        assert!((scorer.score() - 0.15136132).abs() < 0.001f32);
        assert_eq!(scorer.advance(), TERMINATED);
        Ok(())
    }
}


================================================
FILE: src/fieldnorm/reader.rs
================================================
use std::sync::Arc;

use super::{fieldnorm_to_id, id_to_fieldnorm};
use crate::directory::{CompositeFile, FileSlice, OwnedBytes};
use crate::schema::{Field, Schema};
use crate::space_usage::PerFieldSpaceUsage;
use crate::DocId;

/// Reader for the fieldnorm (for each document, the number of tokens indexed in the
/// field) of all indexed fields in the index.
///
/// Each fieldnorm is approximately compressed over one byte. We refer to this byte as
/// `fieldnorm_id`.
/// The mapping from `fieldnorm` to `fieldnorm_id` is monotonic.
#[derive(Clone)]
pub struct FieldNormReaders {
    // Composite file holding the fieldnorm data, looked up per field.
    data: Arc<CompositeFile>,
}

impl FieldNormReaders {
    /// Opens the composite fieldnorm file and wraps it into a `FieldNormReaders`.
    pub fn open(file: FileSlice) -> crate::Result<FieldNormReaders> {
        let composite_file = CompositeFile::open(&file)?;
        let data = Arc::new(composite_file);
        Ok(FieldNormReaders { data })
    }

    /// Returns the `FieldNormReader` of `field`, or `Ok(None)` when the composite
    /// file holds no data for that field.
    pub fn get_field(&self, field: Field) -> crate::Result<Option<FieldNormReader>> {
        self.data
            .open_read(field)
            .map(FieldNormReader::open)
            .transpose()
    }

    /// Returns a breakdown of the space usage per field.
    pub fn space_usage(&self, schema: &Schema) -> PerFieldSpaceUsage {
        let composite_file: &CompositeFile = &self.data;
        composite_file.space_usage(schema)
    }

    /// Returns a shared handle to the underlying composite file.
    pub fn get_inner_file(&self) -> Arc<CompositeFile> {
        Arc::clone(&self.data)
    }
}

/// Reads the fieldnorm associated with a document.
///
/// The [fieldnorm](FieldNormReader::fieldnorm) represents the length associated with
/// a given Field of a given document.
///
/// The reader is either backed by a byte array holding one `fieldnorm_id` per
/// document, or by a single constant value shared by all documents.
#[derive(Clone)]
pub struct FieldNormReader(ReaderImplEnum);

impl From<ReaderImplEnum> for FieldNormReader {
    fn from(reader_enum: ReaderImplEnum) -> FieldNormReader {
        FieldNormReader(reader_enum)
    }
}

/// Backing implementation of a `FieldNormReader`.
#[derive(Clone)]
enum ReaderImplEnum {
    /// Array-backed: the byte at index `doc_id` is the `fieldnorm_id` of that document.
    FromData(OwnedBytes),
    /// Every document shares the same fieldnorm.
    Const {
        // Number of documents reported by `num_docs()`.
        num_docs: u32,
        // The shared `fieldnorm_id`.
        fieldnorm_id: u8,
        // The fieldnorm returned for every document; `FieldNormReader::constant`
        // sets it to the decoded value of `fieldnorm_id`.
        fieldnorm: u32,
    },
}

impl FieldNormReader {
    /// Creates a `FieldNormReader` with a constant fieldnorm.
    ///
    /// The fieldnorm will be subjected to compression as if it was coming
    /// from an array-backed fieldnorm reader.
    pub fn constant(num_docs: u32, fieldnorm: u32) -> FieldNormReader {
        let fieldnorm_id = fieldnorm_to_id(fieldnorm);
        let fieldnorm = id_to_fieldnorm(fieldnorm_id);
        ReaderImplEnum::Const {
            num_docs,
            fieldnorm_id,
            fieldnorm,
        }
        .into()
    }

    /// Opens a field norm reader given its file.
    pub fn open(fieldnorm_file: FileSlice) -> crate::Result<Self> {
        let data = fieldnorm_file.read_bytes()?;
        Ok(FieldNormReader::new(data))
    }

    fn new(data: OwnedBytes) -> Self {
        ReaderImplEnum::FromData(data).into()
    }

    /// Returns the number of documents in this segment.
    pub fn num_docs(&self) -> u32 {
        match &self.0 {
            ReaderImplEnum::FromData(data) => data.len() as u32,
            ReaderImplEnum::Const { num_docs, .. } => *num_docs,
        }
    }

    /// Returns the `fieldnorm` associated with a doc id.
    /// The fieldnorm is a value approximating the number
    /// of tokens in a given field of the `doc_id`.
    ///
    /// It is imprecise, and equal or lower than
    /// the actual number of tokens.
    ///
    /// The fieldnorm is effectively decoded from the
    /// `fieldnorm_id` by doing a simple table lookup.
    pub fn fieldnorm(&self, doc_id: DocId) -> u32 {
        match &self.0 {
            ReaderImplEnum::FromData(data) => {
                let fieldnorm_id = data.as_slice()[doc_id as usize];
                id_to_fieldnorm(fieldnorm_id)
            }
            ReaderImplEnum::Const { fieldnorm, .. } => *fieldnorm,
        }
    }

    /// Returns the `fieldnorm_id` associated with a document.
    #[inline]
    pub fn fieldnorm_id(&self, doc_id: DocId) -> u8 {
        match &self.0 {
            ReaderImplEnum::FromData(data) => {
                let fieldnorm_id = data.as_slice()[doc_id as usize];
                fieldnorm_id
            }
            ReaderImplEnum::Const { fieldnorm_id, .. } => *fieldnorm_id,
        }
    }

    /// Converts a `fieldnorm_id` into a fieldnorm.
    #[inline]
    pub fn id_to_fieldnorm(id: u8) -> u32 {
        id_to_fieldnorm(id)
    }

    /// Converts a `fieldnorm` into a `fieldnorm_id`.
    /// (This function is not injective).
    #[inline]
    pub fn fieldnorm_to_id(fieldnorm: u32) -> u8 {
        fieldnorm_to_id(fieldnorm)
    }

    #[cfg(test)]
    pub(crate) fn for_test(field_norms: &[u32]) -> FieldNormReader {
        let field_norms_id = field_norms
            .iter()
            .cloned()
            .map(FieldNormReader::fieldnorm_to_id)
            .collect::<Vec<u8>>();
        let field_norms_data = OwnedBytes::new(field_norms_id);
        FieldNormReader::new(field_norms_data)
    }
}

// Tests for the array-backed and the constant `FieldNormReader`.
#[cfg(test)]
mod tests {
    use crate::fieldnorm::FieldNormReader;

    /// Small fieldnorms are read back exactly, while a large one is rounded down
    /// to the closest representable value.
    #[test]
    fn test_from_fieldnorms_array() {
        let fieldnorms = &[1, 2, 3, 4, 1_000_000];
        let fieldnorm_reader = FieldNormReader::for_test(fieldnorms);
        assert_eq!(fieldnorm_reader.num_docs(), 5);
        assert_eq!(fieldnorm_reader.fieldnorm(0), 1);
        assert_eq!(fieldnorm_reader.fieldnorm(1), 2);
        assert_eq!(fieldnorm_reader.fieldnorm(2), 3);
        assert_eq!(fieldnorm_reader.fieldnorm(3), 4);
        assert_eq!(fieldnorm_reader.fieldnorm(4), 983_064);
    }

    /// A constant reader built from a small fieldnorm reports it unchanged.
    #[test]
    fn test_const_fieldnorm_reader_small_fieldnorm_id() {
        let fieldnorm_reader = FieldNormReader::constant(1_000_000u32, 10u32);
        assert_eq!(fieldnorm_reader.num_docs(), 1_000_000u32);
        assert_eq!(fieldnorm_reader.fieldnorm(0u32), 10u32);
        assert_eq!(fieldnorm_reader.fieldnorm_id(0u32), 10u8);
    }

    /// A constant reader built from a fieldnorm that is not representable
    /// reports the rounded-down value (300 -> 280).
    #[test]
    fn test_const_fieldnorm_reader_large_fieldnorm_id() {
        let fieldnorm_reader = FieldNormReader::constant(1_000_000u32, 300u32);
        assert_eq!(fieldnorm_reader.num_docs(), 1_000_000u32);
        assert_eq!(fieldnorm_reader.fieldnorm(0u32), 280u32);
        assert_eq!(fieldnorm_reader.fieldnorm_id(0u32), 72u8);
    }
}


================================================
FILE: src/fieldnorm/serializer.rs
================================================
use std::io;
use std::io::Write;

use crate::directory::{CompositeWrite, WritePtr};
use crate::schema::Field;

/// The fieldnorms serializer is in charge of
/// the serialization of field norms for all fields.
///
/// The data of each field is written through its own section of a `CompositeWrite`.
pub struct FieldNormsSerializer {
    // Composite writer handing out one writer per field.
    composite_write: CompositeWrite,
}

impl FieldNormsSerializer {
    /// Creates a serializer writing into `write`, wrapped in a `CompositeWrite`.
    pub fn from_write(write: WritePtr) -> io::Result<FieldNormsSerializer> {
        Ok(FieldNormsSerializer {
            composite_write: CompositeWrite::wrap(write),
        })
    }

    /// Writes the fieldnorm bytes of `field` into its section of the composite
    /// file, then flushes that section.
    pub fn serialize_field(&mut self, field: Field, fieldnorms_data: &[u8]) -> io::Result<()> {
        let field_write = self.composite_write.for_field(field);
        field_write.write_all(fieldnorms_data)?;
        field_write.flush()?;
        Ok(())
    }

    /// Consumes the serializer and closes the underlying composite writer.
    pub fn close(self) -> io::Result<()> {
        let FieldNormsSerializer { composite_write } = self;
        composite_write.close()?;
        Ok(())
    }
}


================================================
FILE: src/fieldnorm/writer.rs
================================================
use std::cmp::Ordering;
use std::{io, iter};

use super::{fieldnorm_to_id, FieldNormsSerializer};
use crate::schema::{Field, Schema};
use crate::DocId;

/// The `FieldNormsWriter` is in charge of tracking the fieldnorm byte
/// of each document for each field with field norms.
///
/// `FieldNormsWriter` stores a `Vec<u8>` for each tracked field, using a
/// byte per document per field.
pub struct FieldNormsWriter {
    // Indexed by field id. `None` for fields without fieldnorms; otherwise the
    // byte at index `doc` is the `fieldnorm_id` of that document.
    fieldnorms_buffers: Vec<Option<Vec<u8>>>,
}

impl FieldNormsWriter {
    /// Lists the fields of `schema` that are both indexed and configured to
    /// have fieldnorms.
    pub(crate) fn fields_with_fieldnorm(schema: &Schema) -> Vec<Field> {
        schema
            .fields()
            .filter(|(_, field_entry)| field_entry.is_indexed() && field_entry.has_fieldnorms())
            .map(|(field, _)| field)
            .collect()
    }

    /// Creates a writer with one slot per field of `schema`; only the fields
    /// returned by `fields_with_fieldnorm` get a buffer allocated.
    pub fn for_schema(schema: &Schema) -> FieldNormsWriter {
        let num_fields = schema.num_fields();
        let mut fieldnorms_buffers: Vec<Option<Vec<u8>>> =
            iter::repeat_with(|| None).take(num_fields).collect();
        for tracked_field in Self::fields_with_fieldnorm(schema) {
            let slot = tracked_field.field_id() as usize;
            fieldnorms_buffers[slot] = Some(Vec::with_capacity(1_000));
        }
        FieldNormsWriter { fieldnorms_buffers }
    }

    /// Returns the memory used, computed as the sum of the capacities of the
    /// allocated fieldnorm buffers.
    pub fn mem_usage(&self) -> usize {
        self.fieldnorms_buffers
            .iter()
            .flatten()
            .map(Vec::capacity)
            .sum()
    }

    /// Ensure that all documents in 0..max_doc have a byte associated with them
    /// in each of the fieldnorm vectors.
    ///
    /// Will extend with 0-bytes for documents that have not been seen.
    pub fn fill_up_to_max_doc(&mut self, max_doc: DocId) {
        let target_len = max_doc as usize;
        for fieldnorms_buffer in self.fieldnorms_buffers.iter_mut().flatten() {
            fieldnorms_buffer.resize(target_len, 0u8);
        }
    }

    /// Set the fieldnorm byte for the given document for the given field.
    ///
    /// Will internally convert the u32 `fieldnorm` value to the appropriate byte
    /// to approximate the field norm in less space. Fields without a fieldnorm
    /// buffer are silently ignored.
    ///
    /// * doc       - the document id
    /// * field     - the field being set
    /// * fieldnorm - the number of terms present in document `doc` in field `field`
    ///
    /// # Panics
    /// Panics if a fieldnorm was already recorded for `doc` (or a later document)
    /// in this field.
    pub fn record(&mut self, doc: DocId, field: Field, fieldnorm: u32) {
        let buffer_opt = self
            .fieldnorms_buffers
            .get_mut(field.field_id() as usize)
            .and_then(Option::as_mut);
        let fieldnorm_buffer = match buffer_opt {
            Some(buffer) => buffer,
            None => return,
        };
        let doc_idx = doc as usize;
        match doc_idx.cmp(&fieldnorm_buffer.len()) {
            Ordering::Greater => {
                // The documents skipped in between get a fieldnorm of 0.
                fieldnorm_buffer.resize(doc_idx, 0u8);
            }
            Ordering::Equal => {}
            Ordering::Less => {
                panic!("Cannot register a given fieldnorm twice")
            }
        }
        fieldnorm_buffer.push(fieldnorm_to_id(fieldnorm));
    }

    /// Serialize the seen fieldnorm values to the serializer for all fields,
    /// in increasing field id order, then close the serializer.
    pub fn serialize(&self, mut fieldnorms_serializer: FieldNormsSerializer) -> io::Result<()> {
        for (field_id, fieldnorms_buffer_opt) in self.fieldnorms_buffers.iter().enumerate() {
            if let Some(fieldnorms_buffer) = fieldnorms_buffer_opt {
                let field = Field::from_field_id(field_id as u32);
                fieldnorms_serializer.serialize_field(field, fieldnorms_buffer)?;
            }
        }
        fieldnorms_serializer.close()
    }
}


================================================
FILE: src/functional_test.rs
================================================
use std::collections::HashSet;

use rand::{rng, Rng};

use crate::indexer::index_writer::MEMORY_BUDGET_NUM_BYTES_MIN;
use crate::schema::*;
use crate::{doc, schema, Index, IndexWriter, Searcher};

/// Sanity-checks the searcher against the expected set of live documents.
///
/// Asserts that there are fewer than 20 segments and that the number of
/// documents matches `vals.len()`, then loads every doc id of every segment
/// from the doc store to make sure it can be read.
fn check_index_content(searcher: &Searcher, vals: &[u64]) -> crate::Result<()> {
    let segment_readers = searcher.segment_readers();
    assert!(segment_readers.len() < 20);
    assert_eq!(searcher.num_docs() as usize, vals.len());
    for reader in segment_readers {
        let store = reader.get_store_reader(1)?;
        let max_doc = reader.max_doc();
        for doc_id in 0..max_doc {
            // Only the ability to deserialize the document is checked.
            let _doc: TantivyDocument = store.get(doc_id)?;
        }
    }
    Ok(())
}

/// Long-running randomized test of the doc store (ignored by default).
///
/// Each iteration deletes one random previously added document (if any), adds
/// between 0 and 3 new documents, commits, reloads the reader, and checks the
/// index content against the expected set of live ids.
#[test]
#[ignore]
fn test_functional_store() -> crate::Result<()> {
    let mut schema_builder = Schema::builder();

    let id_field = schema_builder.add_u64_field("id", INDEXED | STORED);
    let schema = schema_builder.build();

    let index = Index::create_in_ram(schema);
    let reader = index.reader()?;

    let mut rng = rng();

    let mut index_writer: IndexWriter =
        index.writer_with_num_threads(3, 3 * MEMORY_BUDGET_NUM_BYTES_MIN)?;

    // Ids of the documents expected to be alive after the next commit.
    let mut doc_set: Vec<u64> = Vec::new();

    // Monotonically increasing id, so every added document has a unique id.
    let mut doc_id = 0u64;
    for _iteration in 0..get_num_iterations() {
        let num_docs: usize = rng.random_range(0..4);
        if !doc_set.is_empty() {
            // Delete one random live document.
            let doc_to_remove_id = rng.random_range(0..doc_set.len());
            let removed_doc_id = doc_set.swap_remove(doc_to_remove_id);
            index_writer.delete_term(Term::from_field_u64(id_field, removed_doc_id));
        }
        for _ in 0..num_docs {
            doc_set.push(doc_id);
            index_writer.add_document(doc!(id_field=>doc_id))?;
            doc_id += 1;
        }
        index_writer.commit()?;
        reader.reload()?;
        let searcher = reader.searcher();
        check_index_content(&searcher, &doc_set)?;
    }
    Ok(())
}

/// Returns the number of iterations the functional tests should run.
///
/// The value is read from the `NUM_FUNCTIONAL_TEST_ITERATIONS` environment
/// variable and defaults to 2000 when the variable cannot be read.
///
/// # Panics
///
/// Panics with a message naming the variable and the offending value if the
/// variable is set but is not a valid `usize`.
fn get_num_iterations() -> usize {
    const ENV_VAR: &str = "NUM_FUNCTIONAL_TEST_ITERATIONS";
    match std::env::var(ENV_VAR) {
        Ok(raw) => raw.parse::<usize>().unwrap_or_else(|err| {
            panic!(
                "{} must be a non-negative integer, got {:?}: {}",
                ENV_VAR, raw, err
            )
        }),
        Err(_) => 2000,
    }
}

/// Sample text whose space-separated words are used by `get_text` to build random
/// field values.
const LOREM: &str = "Doc Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod \
                     tempor incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, \
                     quis nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo \
                     consequat. Duis aute irure dolor in reprehenderit in voluptate velit esse \
                     cillum dolore eu fugiat nulla pariatur. Excepteur sint occaecat cupidatat \
                     non proident, sunt in culpa qui officia deserunt mollit anim id est laborum.";
/// Builds a random text made of 0 to 19 words picked (with repetition) from `LOREM`,
/// joined by single spaces.
fn get_text() -> String {
    use rand::seq::IndexedRandom;
    let mut rng = rng();
    let tokens: Vec<_> = LOREM.split(' ').collect();
    let word_count = rng.random_range(0..20);

    let mut words = Vec::new();
    for _ in 0..word_count {
        words.push(tokens.choose(&mut rng).copied().unwrap());
    }
    words.join(" ")
}

/// Long-running randomized indexing test (ignored by default).
///
/// On every iteration a random value in `0..20` is drawn:
/// - `0` commits, reloads the reader and checks the index content against the
///   committed ids;
/// - a value currently tracked (committed or not) is deleted from the index;
/// - any other value is added as a new document.
#[test]
#[ignore]
fn test_functional_indexing_unsorted() -> crate::Result<()> {
    let mut schema_builder = Schema::builder();

    let id_field = schema_builder.add_u64_field("id", INDEXED);
    let multiples_field = schema_builder.add_u64_field("multiples", INDEXED);
    let text_field_options = TextOptions::default()
        .set_indexing_options(
            TextFieldIndexing::default()
                .set_index_option(schema::IndexRecordOption::WithFreqsAndPositions),
        )
        .set_stored();
    let text_field = schema_builder.add_text_field("text_field", text_field_options);
    let schema = schema_builder.build();

    let index = Index::create_from_tempdir(schema)?;
    let reader = index.reader()?;

    let mut rng = rng();

    let mut index_writer: IndexWriter =
        index.writer_with_num_threads(3, 3 * MEMORY_BUDGET_NUM_BYTES_MIN)?;

    // Ids expected to be visible after the last commit, and ids added since then.
    let mut committed_docs: HashSet<u64> = HashSet::new();
    let mut uncommitted_docs: HashSet<u64> = HashSet::new();

    for _ in 0..get_num_iterations() {
        let random_val = rng.random_range(0..20);
        if random_val == 0 {
            index_writer.commit()?;
            committed_docs.extend(&uncommitted_docs);
            uncommitted_docs.clear();
            reader.reload()?;
            let searcher = reader.searcher();
            // check that everything is correct.
            check_index_content(
                &searcher,
                &committed_docs.iter().cloned().collect::<Vec<u64>>(),
            )?;
        } else if committed_docs.remove(&random_val) || uncommitted_docs.remove(&random_val) {
            // The id was tracked: stop tracking it and delete it from the index.
            let doc_id_term = Term::from_field_u64(id_field, random_val);
            index_writer.delete_term(doc_id_term);
        } else {
            // The id is unknown: add a document with its multiples and a random text.
            uncommitted_docs.insert(random_val);
            let mut doc = TantivyDocument::new();
            doc.add_u64(id_field, random_val);
            for i in 1u64..10u64 {
                doc.add_u64(multiples_field, random_val * i);
            }
            doc.add_text(text_field, get_text());
            index_writer.add_document(doc)?;
        }
    }
    Ok(())
}


================================================
FILE: src/future_result.rs
================================================
use std::future::Future;
use std::pin::Pin;
use std::task::Poll;

use crate::TantivyError;

/// `FutureResult` is a handle that makes it possible to wait for the completion
/// of an ongoing task.
///
/// Contrary to some `Future`, it does not need to be polled for the task to
/// progress. Dropping the `FutureResult` does not cancel the task being executed
/// either.
///
/// - In a sync context, you can call `FutureResult::wait()`. The function does not rely on
///   `block_on`.
/// - In an async context, you can simply use `FutureResult` as a future.
pub struct FutureResult<T> {
    // Either an error known up front, or the receiving end of the task's result.
    inner: Inner<T>,
}

/// Internal state of a `FutureResult`.
enum Inner<T> {
    /// An error was already known when the `FutureResult` was built.
    ///
    /// The error is wrapped in an `Option` so that `poll` can move it out through
    /// a mutable reference.
    FailedBeforeStart(Option<TantivyError>),
    /// The result will be delivered through a oneshot channel.
    InProgress {
        /// Receiving end of the channel carrying the result.
        receiver: oneshot::Receiver<crate::Result<T>>,
        /// Message of the `SystemError` returned when receiving from the channel fails.
        error_msg_if_failure: &'static str,
    },
}

/// Builds a `FutureResult` that resolves to `err`.
impl<T> From<TantivyError> for FutureResult<T> {
    fn from(err: TantivyError) -> Self {
        let inner = Inner::FailedBeforeStart(Some(err));
        FutureResult { inner }
    }
}

impl<T> FutureResult<T> {
    /// Creates an in-progress `FutureResult` together with the sender used to
    /// deliver its result.
    ///
    /// `error_msg_if_failure` is the message of the `SystemError` returned if no
    /// result can be received from the sender.
    pub(crate) fn create(
        error_msg_if_failure: &'static str,
    ) -> (Self, oneshot::Sender<crate::Result<T>>) {
        let (sender, receiver) = oneshot::channel();
        let future_result = FutureResult {
            inner: Inner::InProgress {
                receiver,
                error_msg_if_failure,
            },
        };
        (future_result, sender)
    }

    /// Blocks until the result is available.
    ///
    /// In an async context, you should simply use `FutureResult` as a future.
    pub fn wait(self) -> crate::Result<T> {
        let (receiver, error_msg_if_failure) = match self.inner {
            Inner::FailedBeforeStart(err) => return Err(err.unwrap()),
            Inner::InProgress {
                receiver,
                error_msg_if_failure,
            } => (receiver, error_msg_if_failure),
        };
        match receiver.recv() {
            Ok(result) => result,
            // Nothing could be received: report the configured message.
            Err(_) => Err(crate::TantivyError::SystemError(
                error_msg_if_failure.to_string(),
            )),
        }
    }
}

/// Lets a `FutureResult` be awaited: it resolves to the stored error, to the
/// result received from the channel, or to a `SystemError` if receiving fails.
impl<T> Future for FutureResult<T> {
    type Output = crate::Result<T>;

    fn poll(self: Pin<&mut Self>, cx: &mut std::task::Context<'_>) -> Poll<Self::Output> {
        // SAFETY: the mutable reference obtained from the pin is only used to
        // `take()` the stored error and to re-pin `receiver` in place; `receiver`
        // itself is never moved out of `self`.
        unsafe {
            match &mut Pin::get_unchecked_mut(self).inner {
                // The error is moved out on the first poll; polling again after
                // completion panics on the `unwrap()`.
                Inner::FailedBeforeStart(err) => Poll::Ready(Err(err.take().unwrap())),
                Inner::InProgress {
                    receiver,
                    error_msg_if_failure,
                } => match Future::poll(Pin::new_unchecked(receiver), cx) {
                    Poll::Ready(oneshot_res) => {
                        // A receive error is surfaced as a `SystemError` carrying
                        // the message given at creation.
                        let res = oneshot_res.unwrap_or_else(|_| {
                            Err(crate::TantivyError::SystemError(
                                error_msg_if_failure.to_string(),
                            ))
                        });
                        Poll::Ready(res)
                    }
                    Poll::Pending => Poll::Pending,
                },
            }
        }
    }
}

#[cfg(test)]
mod tests {
    use futures::executor::block_on;

    use super::FutureResult;
    use crate::TantivyError;

    /// A `FutureResult` built from an error resolves to that error.
    #[test]
    fn test_scheduled_result_failed_to_schedule() {
        let future_result: FutureResult<()> = FutureResult::from(TantivyError::Poisoned);
        let outcome = block_on(future_result);
        assert!(matches!(outcome, Err(TantivyError::Poisoned)));
    }

    /// Dropping the sender without sending anything yields a `SystemError`.
    #[test]
    fn test_scheduled_result_error() {
        let (future_result, sender): (FutureResult<()>, _) = FutureResult::create("failed");
        drop(sender);
        let outcome = block_on(future_result);
        assert!(matches!(outcome, Err(TantivyError::SystemError(_))));
    }

    /// A value sent through the sender is returned as is.
    #[test]
    fn test_scheduled_result_sent_success() {
        let (future_result, sender): (FutureResult<u64>, _) = FutureResult::create("failed");
        sender.send(Ok(2u64)).unwrap();
        let value = block_on(future_result).unwrap();
        assert_eq!(value, 2u64);
    }

    /// An error sent through the sender is returned as is.
    #[test]
    fn test_scheduled_result_sent_error() {
        let (future_result, sender): (FutureResult<u64>, _) = FutureResult::create("failed");
        sender.send(Err(TantivyError::Poisoned)).unwrap();
        let outcome = block_on(future_result);
        assert!(matches!(outcome, Err(TantivyError::Poisoned)));
    }
}


================================================
FILE: src/index/index.rs
================================================
use std::collections::HashSet;
use std::fmt;
#[cfg(feature = "mmap")]
use std::path::Path;
use std::path::PathBuf;
use std::thread::available_parallelism;

use super::segment::Segment;
use super::segment_reader::merge_field_meta_data;
use super::{FieldMetadata, IndexSettings};
use crate::core::{Executor, META_FILEPATH};
use crate::directory::error::OpenReadError;
#[cfg(feature = "mmap")]
use crate::directory::MmapDirectory;
use crate::directory::{Directory, ManagedDirectory, RamDirectory, INDEX_WRITER_LOCK};
use crate::error::{DataCorruption, TantivyError};
use crate::index::{IndexMeta, SegmentId, SegmentMeta, SegmentMetaInventory};
use crate::indexer::index_writer::{
    IndexWriterOptions, MAX_NUM_THREAD, MEMORY_BUDGET_NUM_BYTES_MIN,
};
use crate::indexer::segment_updater::save_metas;
use crate::indexer::{IndexWriter, SingleSegmentIndexWriter};
use crate::reader::{IndexReader, IndexReaderBuilder};
use crate::schema::document::Document;
use crate::schema::{Field, FieldType, Schema};
use crate::tokenizer::{TextAnalyzer, TokenizerManager};
use crate::SegmentReader;

/// Reads and deserializes the index meta file from `directory`.
///
/// Returns a `DataCorruption` error (converted into the crate error type) if the
/// file is not valid utf8 or cannot be deserialized.
fn load_metas(
    directory: &dyn Directory,
    inventory: &SegmentMetaInventory,
) -> crate::Result<IndexMeta> {
    let meta_bytes = directory.atomic_read(&META_FILEPATH)?;
    let meta_string = match String::from_utf8(meta_bytes) {
        Ok(meta_string) => meta_string,
        Err(_utf8_err) => {
            error!("Meta data is not valid utf8.");
            let corruption = DataCorruption::new(
                META_FILEPATH.to_path_buf(),
                "Meta file does not contain valid utf8 file.".to_string(),
            );
            return Err(corruption.into());
        }
    };
    match IndexMeta::deserialize(&meta_string, inventory) {
        Ok(index_meta) => Ok(index_meta),
        Err(e) => {
            let corruption = DataCorruption::new(
                META_FILEPATH.to_path_buf(),
                format!("Meta file cannot be deserialized. {e:?}. Content: {meta_string:?}"),
            );
            Err(corruption.into())
        }
    }
}

/// Writes the meta file of a brand new index (no segments, opstamp 0, no payload)
/// and then syncs the directory.
///
/// This operation is atomic:
/// Either
/// - it fails, in which case an error is returned, and the `meta.json` remains untouched,
/// - it succeeds, and `meta.json` is written and flushed.
///
/// This method is not part of tantivy's public API
fn save_new_metas(
    schema: Schema,
    index_settings: IndexSettings,
    directory: &dyn Directory,
) -> crate::Result<()> {
    let empty_index_meta = IndexMeta {
        index_settings,
        segments: Vec::new(),
        schema,
        opstamp: 0u64,
        payload: None,
    };
    save_metas(&empty_index_meta, directory)?;
    directory.sync_directory()?;
    Ok(())
}

/// IndexBuilder can be used to create an index.
///
/// Use in conjunction with [`SchemaBuilder`][crate::schema::SchemaBuilder].
/// Global index settings can be configured with [`IndexSettings`].
///
/// # Examples
///
/// ```
/// use tantivy::schema::*;
/// use tantivy::{Index, IndexSettings};
///
/// let mut schema_builder = Schema::builder();
/// let id_field = schema_builder.add_text_field("id", STRING);
/// let title_field = schema_builder.add_text_field("title", TEXT);
/// let body_field = schema_builder.add_text_field("body", TEXT);
/// let number_field = schema_builder.add_u64_field(
///     "number",
///     NumericOptions::default().set_fast(),
/// );
///
/// let schema = schema_builder.build();
/// let settings = IndexSettings{
///     docstore_blocksize: 100_000,
///     ..Default::default()
/// };
/// let index = Index::builder().schema(schema).settings(settings).create_in_ram();
/// ```
pub struct IndexBuilder {
    // Schema of the index to build; it must be set before the index is created.
    schema: Option<Schema>,
    // Settings stored in the meta file of the created index.
    index_settings: IndexSettings,
    // Tokenizer manager installed on the resulting `Index`.
    tokenizer_manager: TokenizerManager,
    // Fast field tokenizer manager installed on the resulting `Index`.
    fast_field_tokenizer_manager: TokenizerManager,
}
impl Default for IndexBuilder {
    fn default() -> Self {
        IndexBuilder::new()
    }
}
impl IndexBuilder {
    /// Creates a new `IndexBuilder` with no schema, default settings and default
    /// tokenizer managers.
    pub fn new() -> Self {
        Self {
            schema: None,
            index_settings: IndexSettings::default(),
            tokenizer_manager: TokenizerManager::default(),
            fast_field_tokenizer_manager: TokenizerManager::default(),
        }
    }

    /// Set the settings
    #[must_use]
    pub fn settings(mut self, settings: IndexSettings) -> Self {
        self.index_settings = settings;
        self
    }

    /// Set the schema
    #[must_use]
    pub fn schema(mut self, schema: Schema) -> Self {
        self.schema = Some(schema);
        self
    }

    /// Set the tokenizers.
    #[must_use]
    pub fn tokenizers(mut self, tokenizers: TokenizerManager) -> Self {
        self.tokenizer_manager = tokenizers;
        self
    }

    /// Set the fast field tokenizers.
    #[must_use]
    pub fn fast_field_tokenizers(mut self, tokenizers: TokenizerManager) -> Self {
        self.fast_field_tokenizer_manager = tokenizers;
        self
    }

    /// Creates a new index using the [`RamDirectory`].
    ///
    /// The index will be allocated in anonymous memory.
    /// This is useful for indexing small set of documents
    /// for instances like unit test or temporary in memory index.
    pub fn create_in_ram(self) -> Result<Index, TantivyError> {
        let ram_directory = RamDirectory::create();
        self.create(ram_directory)
    }

    /// Creates a new index in a given filepath.
    /// The index will use the [`MmapDirectory`].
    ///
    /// If a previous index was in this directory, it returns an
    /// [`TantivyError::IndexAlreadyExists`] error.
    #[cfg(feature = "mmap")]
    pub fn create_in_dir<P: AsRef<Path>>(self, directory_path: P) -> crate::Result<Index> {
        let mmap_directory: Box<dyn Directory> = Box::new(MmapDirectory::open(directory_path)?);
        if Index::exists(&*mmap_directory)? {
            return Err(TantivyError::IndexAlreadyExists);
        }
        self.create(mmap_directory)
    }

    /// Dragons ahead!!!
    ///
    /// The point of this API is to let users create a simple index with a single segment
    /// and without starting any thread.
    ///
    /// Do not use this method if you are not sure what you are doing.
    ///
    /// It expects an originally empty directory, and will not run any GC operation.
    #[doc(hidden)]
    pub fn single_segment_index_writer<D: Document>(
        self,
        dir: impl Into<Box<dyn Directory>>,
        mem_budget: usize,
    ) -> crate::Result<SingleSegmentIndexWriter<D>> {
        let index = self.create(dir)?;
        let index_simple_writer = SingleSegmentIndexWriter::new(index, mem_budget)?;
        Ok(index_simple_writer)
    }

    /// Creates a new index in a temp directory.
    ///
    /// The index will use the [`MmapDirectory`] in a newly created directory.
    /// The temp directory will be destroyed automatically when the [`Index`] object
    /// is destroyed.
    ///
    /// The temp directory is only used for testing the [`MmapDirectory`].
    /// For other unit tests, prefer the [`RamDirectory`], see:
    /// [`IndexBuilder::create_in_ram()`].
    #[cfg(feature = "mmap")]
    pub fn create_from_tempdir(self) -> crate::Result<Index> {
        let mmap_directory: Box<dyn Directory> = Box::new(MmapDirectory::create_from_tempdir()?);
        self.create(mmap_directory)
    }

    /// Returns a clone of the configured schema, or an
    /// `IndexBuilderMissingArgument` error if no schema was set.
    fn get_expect_schema(&self) -> crate::Result<Schema> {
        self.schema
            .as_ref()
            .cloned()
            .ok_or(TantivyError::IndexBuilderMissingArgument("schema"))
    }

    /// Opens or creates a new index in the provided directory
    ///
    /// If the directory already contains an index, it is opened and both the
    /// tokenizer manager and the fast field tokenizer manager of the builder are
    /// installed on it, exactly as `create` does for a new index.
    ///
    /// # Errors
    /// Returns a [`TantivyError::SchemaError`] if an index exists but its schema
    /// differs from the schema of the builder.
    pub fn open_or_create<T: Into<Box<dyn Directory>>>(self, dir: T) -> crate::Result<Index> {
        let dir: Box<dyn Directory> = dir.into();
        if !Index::exists(&*dir)? {
            return self.create(dir);
        }
        let mut index = Index::open(dir)?;
        if index.schema() != self.get_expect_schema()? {
            return Err(TantivyError::SchemaError(
                "An index exists but the schema does not match.".to_string(),
            ));
        }
        // The builder is consumed here, so the managers can be moved rather than cloned.
        index.set_tokenizers(self.tokenizer_manager);
        index.set_fast_field_tokenizers(self.fast_field_tokenizer_manager);
        Ok(index)
    }

    /// Checks that the builder holds everything required to create an index,
    /// i.e. that a schema was provided.
    fn validate(&self) -> crate::Result<()> {
        if self.schema.is_some() {
            Ok(())
        } else {
            Err(TantivyError::InvalidArgument(
                "no schema passed".to_string(),
            ))
        }
    }

    /// Creates a new index given an implementation of the trait `Directory`.
    ///
    /// If a directory previously existed, it will be erased.
    fn create<T: Into<Box<dyn Directory>>>(self, dir: T) -> crate::Result<Index> {
        self.validate()?;
        let dir = dir.into();
        let directory = ManagedDirectory::wrap(dir)?;
        let schema = self.get_expect_schema()?;
        save_new_metas(schema.clone(), self.index_settings.clone(), &directory)?;
        let mut metas = IndexMeta::with_schema(schema);
        metas.index_settings = self.index_settings;
        let mut index = Index::open_from_metas(directory, &metas, SegmentMetaInventory::default());
        index.set_tokenizers(self.tokenizer_manager);
        index.set_fast_field_tokenizers(self.fast_field_tokenizer_manager);
        Ok(index)
    }
}

/// Search Index
#[derive(Clone)]
pub struct Index {
    // Directory holding the index files.
    directory: ManagedDirectory,
    // Schema of the index, as found in its metas.
    schema: Schema,
    // Settings of the index, as found in its metas.
    settings: IndexSettings,
    // Executor exposed through `search_executor()`.
    executor: Executor,
    // Tokenizer manager used to resolve the tokenizer of a field.
    tokenizers: TokenizerManager,
    // Tokenizer manager dedicated to fast fields.
    fast_field_tokenizers: TokenizerManager,
    // Inventory used to create and list the `SegmentMeta` of this index.
    inventory: SegmentMetaInventory,
}

impl Index {
    /// Creates a new builder.
    pub fn builder() -> IndexBuilder {
        IndexBuilder::new()
    }

    /// Examines the directory to see if it contains an index.
    ///
    /// Effectively, it only checks for the presence of the `meta.json` file.
    pub fn exists(dir: &dyn Directory) -> Result<bool, OpenReadError> {
        dir.exists(&META_FILEPATH)
    }

    /// Accessor to the search executor.
    ///
    /// This pool is used by default when calling `searcher.search(...)`
    /// to perform search on the individual segments.
    ///
    /// By default the executor is single thread, and simply runs in the calling thread.
    pub fn search_executor(&self) -> &Executor {
        &self.executor
    }

    /// Replace the default single thread search executor pool
    /// by a thread pool with a given number of threads.
    pub fn set_multithread_executor(&mut self, num_threads: usize) -> crate::Result<()> {
        self.executor = Executor::multi_thread(num_threads, "tantivy-search-")?;
        Ok(())
    }

    /// Replace the search executor by a custom one, for instance one backed by
    /// a thread pool managed outside of the index.
    pub fn set_executor(&mut self, executor: Executor) {
        self.executor = executor;
    }

    /// Replace the default single thread search executor pool
    /// by a thread pool with as many threads as there are CPUs on the system.
    pub fn set_default_multithread_executor(&mut self) -> crate::Result<()> {
        let default_num_threads = available_parallelism()?.get();
        self.set_multithread_executor(default_num_threads)
    }

    /// Creates a new index using the [`RamDirectory`].
    ///
    /// The index will be allocated in anonymous memory.
    /// This is useful for indexing small set of documents
    /// for instances like unit test or temporary in memory index.
    pub fn create_in_ram(schema: Schema) -> Index {
        IndexBuilder::new().schema(schema).create_in_ram().unwrap()
    }

    /// Creates a new index in a given filepath.
    /// The index will use the [`MmapDirectory`].
    ///
    /// If a previous index was in this directory, then it returns
    /// a [`TantivyError::IndexAlreadyExists`] error.
    #[cfg(feature = "mmap")]
    pub fn create_in_dir<P: AsRef<Path>>(
        directory_path: P,
        schema: Schema,
    ) -> crate::Result<Index> {
        IndexBuilder::new()
            .schema(schema)
            .create_in_dir(directory_path)
    }

    /// Opens or creates a new index in the provided directory
    pub fn open_or_create<T: Into<Box<dyn Directory>>>(
        dir: T,
        schema: Schema,
    ) -> crate::Result<Index> {
        let dir = dir.into();
        IndexBuilder::new().schema(schema).open_or_create(dir)
    }

    /// Creates a new index in a temp directory.
    ///
    /// The index will use the [`MmapDirectory`] in a newly created directory.
    /// The temp directory will be destroyed automatically when the [`Index`] object
    /// is destroyed.
    ///
    /// The temp directory is only used for testing the [`MmapDirectory`].
    /// For other unit tests, prefer the [`RamDirectory`],
    /// see: [`IndexBuilder::create_in_ram()`].
    #[cfg(feature = "mmap")]
    pub fn create_from_tempdir(schema: Schema) -> crate::Result<Index> {
        IndexBuilder::new().schema(schema).create_from_tempdir()
    }

    /// Creates a new index given an implementation of the trait `Directory`.
    ///
    /// If a directory previously existed, it will be erased.
    pub fn create<T: Into<Box<dyn Directory>>>(
        dir: T,
        schema: Schema,
        settings: IndexSettings,
    ) -> crate::Result<Index> {
        let dir: Box<dyn Directory> = dir.into();
        IndexBuilder::new()
            .schema(schema)
            .settings(settings)
            .create(dir)
    }

    /// Creates a new index given a directory and an [`IndexMeta`].
    ///
    /// The index starts with default tokenizer managers and a single thread executor.
    fn open_from_metas(
        directory: ManagedDirectory,
        metas: &IndexMeta,
        inventory: SegmentMetaInventory,
    ) -> Index {
        let schema = metas.schema.clone();
        Index {
            settings: metas.index_settings.clone(),
            directory,
            schema,
            tokenizers: TokenizerManager::default(),
            fast_field_tokenizers: TokenizerManager::default(),
            executor: Executor::single_thread(),
            inventory,
        }
    }

    /// Setter for the tokenizer manager.
    pub fn set_tokenizers(&mut self, tokenizers: TokenizerManager) {
        self.tokenizers = tokenizers;
    }

    /// Accessor for the tokenizer manager.
    pub fn tokenizers(&self) -> &TokenizerManager {
        &self.tokenizers
    }

    /// Setter for the fast field tokenizer manager.
    pub fn set_fast_field_tokenizers(&mut self, tokenizers: TokenizerManager) {
        self.fast_field_tokenizers = tokenizers;
    }

    /// Accessor for the fast field tokenizer manager.
    pub fn fast_field_tokenizer(&self) -> &TokenizerManager {
        &self.fast_field_tokenizers
    }

    /// Get the tokenizer associated with a specific field.
    ///
    /// # Errors
    /// Returns a `TantivyError::SchemaError` if the field is neither a text nor a
    /// JSON field, and a `TantivyError::InvalidArgument` if the field has no
    /// indexing options or if its tokenizer is not registered.
    pub fn tokenizer_for_field(&self, field: Field) -> crate::Result<TextAnalyzer> {
        let field_entry = self.schema.get_field_entry(field);
        let field_type = field_entry.field_type();
        let tokenizer_manager: &TokenizerManager = self.tokenizers();
        let indexing_options_opt = match field_type {
            FieldType::JsonObject(options) => options.get_text_indexing_options(),
            FieldType::Str(options) => options.get_indexing_options(),
            _ => {
                return Err(TantivyError::SchemaError(format!(
                    "{:?} is not a text field.",
                    field_entry.name()
                )))
            }
        };
        let indexing_options = indexing_options_opt.ok_or_else(|| {
            TantivyError::InvalidArgument(format!(
                "No indexing options set for field {field_entry:?}"
            ))
        })?;

        tokenizer_manager
            .get(indexing_options.tokenizer())
            .ok_or_else(|| {
                TantivyError::InvalidArgument(format!(
                    "No Tokenizer found for field {field_entry:?}"
                ))
            })
    }

    /// Create a default [`IndexReader`] for the given index.
    ///
    /// See [`Index.reader_builder()`].
    pub fn reader(&self) -> crate::Result<IndexReader> {
        self.reader_builder().try_into()
    }

    /// Create a [`IndexReader`] for the given index.
    ///
    /// Most project should create at most one reader for a given index.
    /// This method is typically called only once per `Index` instance.
    pub fn reader_builder(&self) -> IndexReaderBuilder {
        IndexReaderBuilder::new(self.clone())
    }

    /// Opens the index stored in the directory at the given path.
    ///
    /// The index will use the [`MmapDirectory`].
    #[cfg(feature = "mmap")]
    pub fn open_in_dir<P: AsRef<Path>>(directory_path: P) -> crate::Result<Index> {
        let mmap_directory = MmapDirectory::open(directory_path)?;
        Index::open(mmap_directory)
    }

    /// Returns the list of the segment metas tracked by the index.
    ///
    /// Such segments can of course be part of the index,
    /// but also they could be segments being currently built or in the middle of a merge
    /// operation.
    pub(crate) fn list_all_segment_metas(&self) -> Vec<SegmentMeta> {
        self.inventory.all()
    }

    /// Returns the list of fields that have been indexed in the Index.
    /// The field list includes the field defined in the schema as well as the fields
    /// that have been indexed as a part of a JSON field.
    /// The returned field name is the full field name, including the name of the JSON field.
    ///
    /// The returned field names can be used in queries.
    ///
    /// Notice: If your data contains JSON fields this is **very expensive**, as it requires
    /// browsing through the inverted index term dictionary and the columnar field dictionary.
    ///
    /// Disclaimer: Some fields may not be listed here. For instance, if the schema contains a json
    /// field that is not indexed nor a fast field but is stored, it is possible for the field
    /// to not be listed.
    pub fn fields_metadata(&self) -> crate::Result<Vec<FieldMetadata>> {
        let segments = self.searchable_segments()?;
        let fields_metadata: Vec<Vec<FieldMetadata>> = segments
            .into_iter()
            .map(|segment| SegmentReader::open(&segment)?.fields_metadata())
            .collect::<Result<_, _>>()?;
        Ok(merge_field_meta_data(fields_metadata))
    }

    /// Creates a new segment_meta (Advanced user only).
    ///
    /// As long as the `SegmentMeta` lives, the files associated with the
    /// `SegmentMeta` are guaranteed to not be garbage collected, regardless of
    /// whether the segment is recorded as part of the index or not.
    pub fn new_segment_meta(&self, segment_id: SegmentId, max_doc: u32) -> SegmentMeta {
        self.inventory.new_segment_meta(segment_id, max_doc)
    }

    /// Open the index using the provided directory
    pub fn open<T: Into<Box<dyn Directory>>>(directory: T) -> crate::Result<Index> {
        let directory = directory.into();
        let directory = ManagedDirectory::wrap(directory)?;
        let inventory = SegmentMetaInventory::default();
        let metas = load_metas(&directory, &inventory)?;
        let index = Index::open_from_metas(directory, &metas, inventory);
        Ok(index)
    }

    /// Reads the index meta file from the directory.
    pub fn load_metas(&self) -> crate::Result<IndexMeta> {
        load_metas(self.directory(), &self.inventory)
    }

    /// Open a new index writer with the given options. Attempts to acquire a lockfile.
    ///
    /// The lockfile should be deleted on drop, but it is possible
    /// that due to a panic or other error, a stale lockfile will be
    /// left in the index directory. If you are sure that no other
    /// `IndexWriter` on the system is accessing the index directory,
    /// it is safe to manually delete the lockfile.
    ///
    /// - `options` defines the writer configuration which includes things like buffer sizes,
    ///   indexer threads, etc...
    ///
    /// # Errors
    /// If the lockfile already exists, returns `TantivyError::LockFailure`.
    /// If the memory arena per thread is too small or too big, returns
    /// `TantivyError::InvalidArgument`
    pub fn writer_with_options<D: Document>(
        &self,
        options: IndexWriterOptions,
    ) -> crate::Result<IndexWriter<D>> {
        let directory_lock = self
            .directory
            .acquire_lock(&INDEX_WRITER_LOCK)
            .map_err(|err| {
                TantivyError::LockFailure(
                    err,
                    Some(
                        "Failed to acquire index lock. If you are using a regular directory, this \
                         means there is already an `IndexWriter` working on this `Directory`, in \
                         this process or in a different process."
                            .to_string(),
                    ),
                )
            })?;

        IndexWriter::new(self, options, directory_lock)
    }

    /// Open a new index writer. Attempts to acquire a lockfile.
    ///
    /// The lockfile should be deleted on drop, but it is possible
    /// that due to a panic or other error, a stale lockfile will be
    /// left in the index directory. If you are sure that no other
    /// `IndexWriter` on the system is accessing the index directory,
    /// it is safe to manually delete the lockfile.
    ///
    /// - `num_threads` defines the number of indexing workers that should work at the same time.
    ///   It must be at least 1.
    ///
    /// - `overall_memory_budget_in_bytes` sets the amount of memory allocated for all indexing
    ///   thread.
    ///
    /// Each thread will receive a budget of `overall_memory_budget_in_bytes / num_threads`.
    ///
    /// # Errors
    /// If `num_threads` is 0, returns `TantivyError::InvalidArgument`.
    /// If the lockfile cannot be acquired, returns `TantivyError::LockFailure`.
    /// If the memory arena per thread is too small or too big, returns
    /// `TantivyError::InvalidArgument`
    pub fn writer_with_num_threads<D: Document>(
        &self,
        num_threads: usize,
        overall_memory_budget_in_bytes: usize,
    ) -> crate::Result<IndexWriter<D>> {
        // Guard the division below: a zero thread count would otherwise panic.
        if num_threads == 0 {
            return Err(TantivyError::InvalidArgument(
                "The number of indexing threads must be at least 1.".to_string(),
            ));
        }
        let memory_arena_in_bytes_per_thread = overall_memory_budget_in_bytes / num_threads;
        let options = IndexWriterOptions::builder()
            .num_worker_threads(num_threads)
            .memory_budget_per_thread(memory_arena_in_bytes_per_thread)
            .build();
        self.writer_with_options(options)
    }

    /// Helper to create an index writer for tests.
    ///
    /// That index writer has a single thread and the minimum memory budget
    /// (`MEMORY_BUDGET_NUM_BYTES_MIN`).
    /// Using a single thread gives us a deterministic allocation of DocId.
    #[cfg(test)]
    pub fn writer_for_tests<D: Document>(&self) -> crate::Result<IndexWriter<D>> {
        self.writer_with_num_threads(1, MEMORY_BUDGET_NUM_BYTES_MIN)
    }

    /// Creates a multithreaded writer
    ///
    /// Tantivy will automatically define the number of threads to use, but
    /// no more than `MAX_NUM_THREAD` threads.
    /// `memory_budget_in_bytes` is the total target memory usage that will be split
    /// between a given number of threads. If the budget per thread would fall below
    /// `MEMORY_BUDGET_NUM_BYTES_MIN`, the number of threads is reduced (down to 1).
    ///
    /// # Errors
    /// If the lockfile cannot be acquired, returns `TantivyError::LockFailure`.
    /// If the memory arena per thread is too small or too big, returns
    /// `TantivyError::InvalidArgument`
    pub fn writer<D: Document>(
        &self,
        memory_budget_in_bytes: usize,
    ) -> crate::Result<IndexWriter<D>> {
        let mut num_threads = std::cmp::min(available_parallelism()?.get(), MAX_NUM_THREAD);
        let memory_budget_num_bytes_per_thread = memory_budget_in_bytes / num_threads;
        if memory_budget_num_bytes_per_thread < MEMORY_BUDGET_NUM_BYTES_MIN {
            num_threads = (memory_budget_in_bytes / MEMORY_BUDGET_NUM_BYTES_MIN).max(1);
        }
        self.writer_with_num_threads(num_threads, memory_budget_in_bytes)
    }

    /// Accessor to the index settings
    pub fn settings(&self) -> &IndexSettings {
        &self.settings
    }

    /// Mutable accessor to the index settings
    pub fn settings_mut(&mut self) -> &mut IndexSettings {
        &mut self.settings
    }

    /// Accessor to the index schema
    ///
    /// The schema is actually cloned.
    pub fn schema(&self) -> Schema {
        self.schema.clone()
    }

    /// Returns the list of segments that are searchable
    pub fn searchable_segments(&self) -> crate::Result<Vec<Segment>> {
        Ok(self
            .searchable_segment_metas()?
            .into_iter()
            .map(|segment_meta| self.segment(segment_meta))
            .collect())
    }

    #[doc(hidden)]
    pub fn segment(&self, segment_meta: SegmentMeta) -> Segment {
        Segment::for_index(self.clone(), segment_meta)
    }

    /// Creates a new segment.
    ///
    /// The segment gets a randomly generated id and a `max_doc` of 0.
    pub fn new_segment(&self) -> Segment {
        let segment_meta = self
            .inventory
            .new_segment_meta(SegmentId::generate_random(), 0);
        self.segment(segment_meta)
    }

    /// Return a reference to the index directory.
    pub fn directory(&self) -> &ManagedDirectory {
        &self.directory
    }

    /// Return a mutable reference to the index directory.
    pub fn directory_mut(&mut self) -> &mut ManagedDirectory {
        &mut self.directory
    }

    /// Reads the meta.json and returns the list of
    /// `SegmentMeta` from the last commit.
    pub fn searchable_segment_metas(&self) -> crate::Result<Vec<SegmentMeta>> {
        Ok(self.load_metas()?.segments)
    }

    /// Returns the list of segment ids that are searchable.
    pub fn searchable_segment_ids(&self) -> crate::Result<Vec<SegmentId>> {
        Ok(self
            .searchable_segment_metas()?
            .iter()
            .map(SegmentMeta::id)
            .collect())
    }

    /// Returns the set of corrupted files
    ///
    /// Only the files that belong to a searchable segment and that are managed by
    /// the directory are checked.
    pub fn validate_checksum(&self) -> crate::Result<HashSet<PathBuf>> {
        let managed_files = self.directory.list_managed_files();
        let active_segments_files: HashSet<PathBuf> = self
            .searchable_segment_metas()?
            .iter()
            .flat_map(|segment_meta| segment_meta.list_files())
            .collect();
        let active_existing_files: HashSet<&PathBuf> =
            active_segments_files.intersection(&managed_files).collect();

        let mut damaged_files = HashSet::new();
        for path in active_existing_files {
            if !self.directory.validate_checksum(path)? {
                damaged_files.insert((*path).clone());
            }
        }
        Ok(damaged_files)
    }
}

/// Debug output of an `Index`: the debug representation of its directory,
/// wrapped in `Index(..)`.
impl fmt::Debug for Index {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        let directory = &self.directory;
        write!(f, "Index({directory:?})")
    }
}


================================================
FILE: src/index/index_meta.rs
================================================
use std::collections::HashSet;
use std::fmt;
use std::path::PathBuf;

use serde::{Deserialize, Serialize};

use super::SegmentComponent;
use crate::index::SegmentId;
use crate::schema::Schema;
use crate::store::Compressor;
use crate::{Inventory, Opstamp, TrackedObject};

/// Delete information attached to a segment.
#[derive(Clone, Debug, Serialize, Deserialize)]
pub struct DeleteMeta {
    /// Number of documents of the segment that are deleted.
    num_deleted_docs: u32,
    /// `Opstamp` of the last delete operation taken in account.
    pub opstamp: Opstamp,
}

/// Inventory in which every `SegmentMeta` handed out by the index is tracked.
///
/// It makes it possible to list all the `SegmentMeta` objects that are
/// still alive (see `SegmentMetaInventory::all`).
#[derive(Clone, Default)]
pub(crate) struct SegmentMetaInventory {
    // Underlying inventory of the tracked inner metas.
    inventory: Inventory<InnerSegmentMeta>,
}

impl SegmentMetaInventory {
    /// Lists all living `SegmentMeta` object at the time of the call.
    pub fn all(&self) -> Vec<SegmentMeta> {
        self.inventory
            .list()
            .into_iter()
            .map(SegmentMeta::from)
            .collect::<Vec<_>>()
    }

    pub fn new_segment_meta(&self, segment_id: SegmentId, max_doc: u32) -> SegmentMeta {
        let inner = InnerSegmentMeta {
            segment_id,
            max_doc,
            deletes: None,
        };
        SegmentMeta::from(self.inventory.track(inner))
    }
}

/// `SegmentMeta` contains simple meta information about a segment.
///
/// For instance the number of docs it contains,
/// how many are deleted, etc.
///
/// The actual data lives in an inner meta registered in the
/// segment meta inventory; this type is a handle on it.
#[derive(Clone)]
pub struct SegmentMeta {
    // Handle on the inner meta tracked by the inventory.
    tracked: TrackedObject<InnerSegmentMeta>,
}

/// The debug output is delegated to the tracked inner meta.
impl fmt::Debug for SegmentMeta {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        self.tracked.fmt(f)
    }
}

impl serde::Serialize for SegmentMeta {
    fn serialize<S>(
        &self,
        serializer: S,
    ) -> Result<<S as serde::Serializer>::Ok, <S as serde::Serializer>::Error>
    where
        S: serde::Serializer,
    {
        self.tracked.serialize(serializer)
    }
}

impl From<TrackedObject<InnerSegmentMeta>> for SegmentMeta {
    fn from(tracked: TrackedObject<InnerSegmentMeta>) -> SegmentMeta {
        SegmentMeta { tracked }
    }
}

impl SegmentMeta {
    /// Returns the segment id.
    pub fn id(&self) -> SegmentId {
        self.tracked.segment_id
    }

    /// Returns the number of deleted documents.
    ///
    /// This is `0` when no delete information is attached to the segment.
    pub fn num_deleted_docs(&self) -> u32 {
        self.tracked
            .deletes
            .as_ref()
            .map(|delete_meta| delete_meta.num_deleted_docs)
            .unwrap_or(0u32)
    }

    /// Returns the list of files that
    /// are required for the segment meta.
    /// Note: Some of the returned files may not exist depending on the state of the segment.
    ///
    /// This is useful as the way tantivy removes files
    /// is by removing all files that have been created by tantivy
    /// and are not used by any segment anymore.
    pub fn list_files(&self) -> HashSet<PathBuf> {
        SegmentComponent::iterator()
            .map(|component| self.relative_path(*component))
            .collect::<HashSet<PathBuf>>()
    }

    /// Returns the relative path of a component of our segment.
    ///
    /// It just joins the segment id with the extension
    /// associated with a segment component.
    ///
    /// The extension of the delete component embeds the delete opstamp
    /// (`0` when the segment has no delete information).
    pub fn relative_path(&self, component: SegmentComponent) -> PathBuf {
        let mut path = self.id().uuid_string();
        // Static extensions are appended directly: no temporary `String` is needed for them.
        match component {
            SegmentComponent::Postings => path.push_str(".idx"),
            SegmentComponent::Positions => path.push_str(".pos"),
            SegmentComponent::Terms => path.push_str(".term"),
            SegmentComponent::Store => path.push_str(".store"),
            SegmentComponent::FastFields => path.push_str(".fast"),
            SegmentComponent::FieldNorms => path.push_str(".fieldnorm"),
            SegmentComponent::Delete => {
                path.push_str(&format!(".{}.del", self.delete_opstamp().unwrap_or(0)));
            }
        }
        PathBuf::from(path)
    }

    /// Return the highest doc id + 1
    ///
    /// If there are no deletes, then num_docs = max_docs
    /// and all the doc ids contains in this segment
    /// are exactly (0..max_doc).
    pub fn max_doc(&self) -> u32 {
        self.tracked.max_doc
    }

    /// Return the number of documents in the segment.
    ///
    /// This is `max_doc` minus the number of deleted documents.
    pub fn num_docs(&self) -> u32 {
        self.max_doc() - self.num_deleted_docs()
    }

    /// Returns the `Opstamp` of the last delete operation
    /// taken in account in this segment.
    ///
    /// Returns `None` if no delete information is attached to the segment.
    pub fn delete_opstamp(&self) -> Option<Opstamp> {
        self.tracked
            .deletes
            .as_ref()
            .map(|delete_meta| delete_meta.opstamp)
    }

    /// Returns true iff the segment has at least one deleted document.
    ///
    /// A segment carrying delete information that accounts for
    /// zero deleted documents is reported as having no deletes.
    pub fn has_deletes(&self) -> bool {
        self.num_deleted_docs() > 0
    }

    /// Updates the max_doc value from the `SegmentMeta`.
    ///
    /// # Panics
    ///
    /// Panics if the current `max_doc` is not `0` or if delete
    /// information is already attached to the segment.
    #[must_use]
    pub fn with_max_doc(self, max_doc: u32) -> SegmentMeta {
        assert_eq!(self.tracked.max_doc, 0);
        assert!(self.tracked.deletes.is_none());
        let tracked = self.tracked.map(move |inner_meta| InnerSegmentMeta {
            segment_id: inner_meta.segment_id,
            max_doc,
            deletes: None,
        });
        SegmentMeta { tracked }
    }

    /// Returns a `SegmentMeta` for the same segment, with the given
    /// delete information attached. Any previous delete information is replaced.
    ///
    /// # Panics
    ///
    /// Panics if `num_deleted_docs` is greater than `max_doc`.
    #[doc(hidden)]
    #[must_use]
    pub fn with_delete_meta(self, num_deleted_docs: u32, opstamp: Opstamp) -> SegmentMeta {
        assert!(
            num_deleted_docs <= self.max_doc(),
            "There cannot be more deleted docs than there are docs."
        );
        let delete_meta = DeleteMeta {
            num_deleted_docs,
            opstamp,
        };
        let tracked = self.tracked.map(move |inner_meta| InnerSegmentMeta {
            segment_id: inner_meta.segment_id,
            max_doc: inner_meta.max_doc,
            deletes: Some(delete_meta),
        });
        SegmentMeta { tracked }
    }
}

/// Plain (untracked) content of a `SegmentMeta`.
///
/// This is the part of a segment meta that gets (de)serialized.
#[derive(Debug, Clone, Serialize, Deserialize)]
struct InnerSegmentMeta {
    // Id of the segment.
    segment_id: SegmentId,
    // Highest doc id + 1.
    max_doc: u32,
    // Delete information, or `None` if there is none for this segment.
    pub deletes: Option<DeleteMeta>,
}

impl InnerSegmentMeta {
    /// Registers this meta in `inventory` and returns the tracked `SegmentMeta`.
    pub fn track(self, inventory: &SegmentMetaInventory) -> SegmentMeta {
        let tracked = inventory.inventory.track(self);
        SegmentMeta { tracked }
    }
}

/// Always returns `true`.
///
/// Must be a function to be usable as a serde `default`.
fn return_true() -> bool {
    true
}

/// Returns the boolean behind `val`.
///
/// Takes a reference because serde's `skip_serializing_if` passes the field by reference.
fn is_true(val: &bool) -> bool {
    *val
}

/// Search Index Settings.
///
/// Contains settings which are applied on the whole
/// index, like presort documents.
///
/// Every field has a serde default, so a field missing from the
/// serialized settings falls back to its default value.
#[derive(Clone, Debug, Serialize, Deserialize, Eq, PartialEq)]
pub struct IndexSettings {
    /// The `Compressor` used to compress the doc store.
    #[serde(default)]
    pub docstore_compression: Compressor,
    /// If set to true, docstore compression will happen on a dedicated thread.
    /// (defaults: true)
    ///
    /// The field is only serialized when it is `false`.
    #[doc(hidden)]
    #[serde(default = "return_true")]
    #[serde(skip_serializing_if = "is_true")]
    pub docstore_compress_dedicated_thread: bool,
    #[serde(default = "default_docstore_blocksize")]
    /// The size of each block that will be compressed and written to disk
    /// (defaults: 16_384)
    pub docstore_blocksize: usize,
}

/// Default value of `IndexSettings::docstore_blocksize`.
///
/// Must be a function to be compatible with serde defaults
fn default_docstore_blocksize() -> usize {
    16 * 1024
}

impl Default for IndexSettings {
    fn default() -> Self {
        Self {
            docstore_compression: Compressor::default(),
            docstore_blocksize: default_docstore_blocksize(),
            docstore_compress_dedicated_thread: true,
        }
    }
}

/// The order to sort by
///
/// See [`Order::is_asc`] and [`Order::is_desc`] for convenience checks.
#[derive(Clone, Copy, Debug, Serialize, Deserialize, Eq, PartialEq)]
pub enum Order {
    /// Ascending Order
    Asc,
    /// Descending Order
    Desc,
}

impl Order {
    /// Returns `true` iff the order is [`Order::Asc`].
    pub fn is_asc(&self) -> bool {
        matches!(self, Order::Asc)
    }
    /// Returns `true` iff the order is [`Order::Desc`].
    pub fn is_desc(&self) -> bool {
        matches!(self, Order::Desc)
    }
}

/// Meta information about the `Index`.
///
/// This object is serialized on disk in the `meta.json` file.
/// It keeps information about
/// * the index settings,
/// * the searchable segments,
/// * the index `opstamp`
/// * the schema
/// * an optional commit payload
///
/// Deserialization goes through `IndexMeta::deserialize`, as the segment
/// metas need to be registered in an inventory.
#[derive(Clone, Serialize)]
pub struct IndexMeta {
    /// `IndexSettings` to configure index options.
    #[serde(default)]
    pub index_settings: IndexSettings,
    /// List of `SegmentMeta` information associated with each finalized segment of the index.
    pub segments: Vec<SegmentMeta>,
    /// Index `Schema`
    pub schema: Schema,
    /// Opstamp associated with the last `commit` operation.
    pub opstamp: Opstamp,
    /// Payload associated with the last commit.
    ///
    /// Upon commit, clients can optionally add a small `String` payload to their commit
    /// to help identify this commit.
    /// This payload is entirely unused by tantivy.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub payload: Option<String>,
}

/// Deserialization counterpart of `IndexMeta`.
///
/// It holds the same fields, except that the segment metas are plain
/// `InnerSegmentMeta` values that are not registered in any inventory yet.
/// Call `UntrackedIndexMeta::track` to obtain an `IndexMeta`.
#[derive(Deserialize, Debug)]
struct UntrackedIndexMeta {
    // Segment metas, not tracked yet.
    pub segments: Vec<InnerSegmentMeta>,
    // Falls back to the default settings when absent from the JSON.
    #[serde(default)]
    pub index_settings: IndexSettings,
    pub schema: Schema,
    pub opstamp: Opstamp,
    // NOTE(review): this struct only derives `Deserialize`, so the
    // `skip_serializing_if` attribute below looks like it has no effect — confirm.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub payload: Option<String>,
}

impl UntrackedIndexMeta {
    pub fn track(self, inventory: &SegmentMetaInventory) -> IndexMeta {
        IndexMeta {
            index_settings: self.index_settings,
            segments: self
                .segments
                .into_iter()
                .map(|inner_seg_meta| inner_seg_meta.track(inventory))
                .collect::<Vec<SegmentMeta>>(),
            schema: self.schema,
            opstamp: self.opstamp,
            payload: self.payload,
        }
    }
}

impl IndexMeta {
    /// Create an `IndexMeta` object representing a brand new `Index`
    /// with the given schema.
    ///
    /// The new index uses the default `IndexSettings`, does not contain
    /// any segment, and has no payload. Its opstamp is `0u64`.
    pub fn with_schema(schema: Schema) -> IndexMeta {
        IndexMeta {
            index_settings: Default::default(),
            segments: Vec::new(),
            schema,
            opstamp: 0,
            payload: None,
        }
    }

    /// Parses the JSON content of a meta file and registers the
    /// segment metas it lists in `inventory`.
    ///
    /// # Errors
    ///
    /// Returns the `serde_json` error if `meta_json` cannot be deserialized.
    pub(crate) fn deserialize(
        meta_json: &str,
        inventory: &SegmentMetaInventory,
    ) -> serde_json::Result<IndexMeta> {
        serde_json::from_str::<UntrackedIndexMeta>(meta_json)
            .map(|untracked_meta| untracked_meta.track(inventory))
    }
}

/// The debug output of an `IndexMeta` is its JSON serialization.
impl fmt::Debug for IndexMeta {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        let meta_json = serde_json::ser::to_string(self)
            .expect("JSON serialization for IndexMeta should never fail.");
        f.write_str(&meta_json)
    }
}

// Serialization / deserialization tests for `IndexMeta` and `IndexSettings`.
#[cfg(test)]
mod tests {

    use super::IndexMeta;
    use crate::index::index_meta::UntrackedIndexMeta;
    use crate::schema::{Schema, TEXT};
    use crate::store::Compressor;
    #[cfg(feature = "zstd-compression")]
    use crate::store::ZstdCompressor;
    use crate::IndexSettings;

    // Pins the exact JSON produced for an index meta without compression,
    // and checks that it deserializes back to the same values.
    #[test]
    fn test_serialize_metas() {
        let schema = {
            let mut schema_builder = Schema::builder();
            schema_builder.add_text_field("text", TEXT);
            schema_builder.build()
        };
        let index_metas = IndexMeta {
            index_settings: IndexSettings {
                docstore_compression: Compressor::None,
                ..Default::default()
            },
            segments: Vec::new(),
            schema,
            opstamp: 0u64,
            payload: None,
        };
        let json = serde_json::ser::to_string(&index_metas).expect("serialization failed");
        // Neither `payload` (None) nor `docstore_compress_dedicated_thread` (true) is emitted.
        assert_eq!(
            json,
            r#"{"index_settings":{"docstore_compression":"none","docstore_blocksize":16384},"segments":[],"schema":[{"name":"text","type":"text","options":{"indexing":{"record":"position","fieldnorms":true,"tokenizer":"default"},"stored":false,"fast":false}}],"opstamp":0}"#
        );

        let deser_meta: UntrackedIndexMeta = serde_json::from_str(&json).unwrap();
        assert_eq!(index_metas.index_settings, deser_meta.index_settings);
        assert_eq!(index_metas.schema, deser_meta.schema);
        assert_eq!(index_metas.opstamp, deser_meta.opstamp);
    }

    // Same round trip, with a zstd compressor carrying an explicit compression level
    // and a non-default block size.
    #[test]
    #[cfg(feature = "zstd-compression")]
    fn test_serialize_metas_zstd_compressor() {
        let schema = {
            let mut schema_builder = Schema::builder();
            schema_builder.add_text_field("text", TEXT);
            schema_builder.build()
        };
        let index_metas = IndexMeta {
            index_settings: IndexSettings {
                docstore_compression: crate::store::Compressor::Zstd(ZstdCompressor {
                    compression_level: Some(4),
                }),
                docstore_blocksize: 1_000_000,
                docstore_compress_dedicated_thread: true,
            },
            segments: Vec::new(),
            schema,
            opstamp: 0u64,
            payload: None,
        };
        let json = serde_json::ser::to_string(&index_metas).expect("serialization failed");
        assert_eq!(
            json,
            r#"{"index_settings":{"docstore_compression":"zstd(compression_level=4)","docstore_blocksize":1000000},"segments":[],"schema":[{"name":"text","type":"text","options":{"indexing":{"record":"position","fieldnorms":true,"tokenizer":"default"},"stored":false,"fast":false}}],"opstamp":0}"#
        );

        let deser_meta: UntrackedIndexMeta = serde_json::from_str(&json).unwrap();
        assert_eq!(index_metas.index_settings, deser_meta.index_settings);
        assert_eq!(index_metas.schema, deser_meta.schema);
        assert_eq!(index_metas.opstamp, deser_meta.opstamp);
    }

    // Pins the error messages reported for an unknown compressor name
    // and for an unknown zstd option.
    #[test]
    #[cfg(all(feature = "lz4-compression", feature = "zstd-compression"))]
    fn test_serialize_metas_invalid_comp() {
        let json = r#"{"index_settings":{"docstore_compression":"zsstd","docstore_blocksize":1000000},"segments":[],"schema":[{"name":"text","type":"text","options":{"indexing":{"record":"position","fieldnorms":true,"tokenizer":"default"},"stored":false,"fast":false}}],"opstamp":0}"#;

        let err = serde_json::from_str::<UntrackedIndexMeta>(json).unwrap_err();
        assert_eq!(
            err.to_string(),
            "unknown variant `zsstd`, expected one of `none`, `lz4`, `zstd`, \
             `zstd(compression_level=5)` at line 1 column 49"
                .to_string()
        );

        let json = r#"{"index_settings":{"docstore_compression":"zstd(bla=10)","docstore_blocksize":1000000},"segments":[],"schema":[{"name":"text","type":"text","options":{"indexing":{"record":"position","fieldnorms":true,"tokenizer":"default"},"stored":false,"fast":false}}],"opstamp":0}"#;

        let err = serde_json::from_str::<UntrackedIndexMeta>(json).unwrap_err();
        assert_eq!(
            err.to_string(),
            "unknown zstd option \"bla\" at line 1 column 56".to_string()
        );
    }

    // Pins the error message reported when the meta requests zstd
    // while the `zstd-compression` feature is disabled.
    #[test]
    #[cfg(not(feature = "zstd-compression"))]
    fn test_serialize_metas_unsupported_comp() {
        let json = r#"{"index_settings":{"docstore_compression":"zstd","docstore_blocksize":1000000},"segments":[],"schema":[{"name":"text","type":"text","options":{"indexing":{"record":"position","fieldnorms":true,"tokenizer":"default"},"stored":false,"fast":false}}],"opstamp":0}"#;

        let err = serde_json::from_str::<UntrackedIndexMeta>(json).unwrap_err();
        assert_eq!(
            err.to_string(),
            "unsupported variant `zstd`, please enable Tantivy's `zstd-compression` feature at \
             line 1 column 48"
                .to_string()
        );
    }

    // Checks the default settings and their JSON round trip, including the fact that
    // `docstore_compress_dedicated_thread` is only serialized when it is `false`.
    #[test]
    #[cfg(feature = "lz4-compression")]
    fn test_index_settings_default() {
        use crate::store::Compressor;

        let mut index_settings = IndexSettings::default();
        assert_eq!(
            index_settings,
            IndexSettings {
                docstore_compression: Compressor::default(),
                docstore_compress_dedicated_thread: true,
                docstore_blocksize: 16_384
            }
        );
        {
            // Default value (`true`): the field is skipped.
            let index_settings_json = serde_json::to_value(&index_settings).unwrap();
            assert_eq!(
                index_settings_json,
                serde_json::json!({
                    "docstore_compression": "lz4",
                    "docstore_blocksize": 16384
                })
            );
            let index_settings_deser: IndexSettings =
                serde_json::from_value(index_settings_json).unwrap();
            assert_eq!(index_settings_deser, index_settings);
        }
        {
            // Non-default value (`false`): the field is emitted.
            index_settings.docstore_compress_dedicated_thread = false;
            let index_settings_json = serde_json::to_value(&index_settings).unwrap();
            assert_eq!(
                index_settings_json,
                serde_json::json!({
                    "docstore_compression": "lz4",
                    "docstore_blocksize": 16384,
                    "docstore_compress_dedicated_thread": false,
                })
            );
            let index_settings_deser: IndexSettings =
                serde_json::from_value(index_settings_json).unwrap();
            assert_eq!(index_settings_deser, index_settings);
        }
    }
}


================================================
FILE: src/index/inverted_index_reader.rs
================================================
use std::io;

use common::json_path_writer::JSON_END_OF_PATH;
use common::{BinarySerializable, ByteCount};
#[cfg(feature = "quickwit")]
use futures_util::{FutureExt, StreamExt, TryStreamExt};
#[cfg(feature = "quickwit")]
use itertools::Itertools;
#[cfg(feature = "quickwit")]
use tantivy_fst::automaton::{AlwaysMatch, Automaton};

use crate::directory::FileSlice;
use crate::positions::PositionReader;
use crate::postings::{BlockSegmentPostings, SegmentPostings, TermInfo};
use crate::schema::{IndexRecordOption, Term, Type};
use crate::termdict::TermDictionary;

/// The inverted index reader is in charge of accessing
/// the inverted index associated with a specific field.
///
/// # Note
///
/// It is safe to delete the segment associated with
/// an `InvertedIndexReader`. As long as it is open,
/// the [`FileSlice`] it is relying on should
/// stay available.
///
/// `InvertedIndexReader` are created by calling
/// [`SegmentReader::inverted_index()`](crate::SegmentReader::inverted_index).
pub struct InvertedIndexReader {
    // Term dictionary of the field.
    termdict: TermDictionary,
    // Postings data. When built through `new`, the leading header holding
    // the total number of tokens has already been split off.
    postings_file_slice: FileSlice,
    // Positions data.
    positions_file_slice: FileSlice,
    // Record option of the reader; requested options are downgraded to it
    // when reading postings.
    record_option: IndexRecordOption,
    // Total number of tokens, as returned by `total_num_tokens()`.
    total_num_tokens: u64,
}

/// Object that records the amount of space used by a field in an inverted index.
///
/// The counters are accumulated one term at a time.
pub(crate) struct InvertedIndexFieldSpace {
    /// Name of the field (for JSON fields, the path extracted from the terms).
    pub field_name: String,
    /// Type of the values of the field.
    pub field_type: Type,
    /// Cumulated size of the postings of the recorded terms.
    pub postings_size: ByteCount,
    /// Cumulated size of the positions of the recorded terms.
    pub positions_size: ByteCount,
    /// Number of terms recorded.
    pub num_terms: u64,
}

/// Splits the bytes of a JSON term into its path (the field name) and its value type.
///
/// The term is expected to start with the path bytes, followed by
/// `JSON_END_OF_PATH` and by a type code byte.
///
/// Returns None if the term is not a valid JSON path, i.e. if the
/// end-of-path marker is missing, if no byte follows it, or if that byte
/// is not a known type code.
fn extract_field_name_and_field_type_from_json_path(term: &[u8]) -> Option<(String, Type)> {
    let index = term.iter().position(|&byte| byte == JSON_END_OF_PATH)?;
    let field_type_code = term.get(index + 1).copied()?;
    let field_type = Type::from_code(field_type_code)?;
    // Invalid UTF-8 sequences are replaced rather than rejected.
    // `into_owned` avoids a second copy when a replacement had to be allocated.
    let field_name = String::from_utf8_lossy(&term[..index]).into_owned();
    Some((field_name, field_type))
}

impl InvertedIndexFieldSpace {
    /// Accounts for one more term: adds the sizes of its postings and
    /// positions to the counters and bumps the number of terms.
    fn record(&mut self, term_info: &TermInfo) {
        let postings_num_bytes = term_info.posting_num_bytes() as u64;
        let positions_num_bytes = term_info.positions_num_bytes() as u64;
        self.postings_size += ByteCount::from(postings_num_bytes);
        self.positions_size += ByteCount::from(positions_num_bytes);
        self.num_terms += 1;
    }
}

impl InvertedIndexReader {
    pub(crate) fn new(
        termdict: TermDictionary,
        postings_file_slice: FileSlice,
        positions_file_slice: FileSlice,
        record_option: IndexRecordOption,
    ) -> io::Result<InvertedIndexReader> {
        let (total_num_tokens_slice, postings_body) = postings_file_slice.split(8);
        let total_num_tokens = u64::deserialize(&mut total_num_tokens_slice.read_bytes()?)?;
        Ok(InvertedIndexReader {
            termdict,
            postings_file_slice: postings_body,
            positions_file_slice,
            record_option,
            total_num_tokens,
        })
    }

    /// Creates an empty `InvertedIndexReader` object, which
    /// contains no terms at all.
    pub fn empty(record_option: IndexRecordOption) -> InvertedIndexReader {
        InvertedIndexReader {
            termdict: TermDictionary::empty(),
            postings_file_slice: FileSlice::empty(),
            positions_file_slice: FileSlice::empty(),
            record_option,
            total_num_tokens: 0u64,
        }
    }

    /// Returns the term info associated with the term.
    pub fn get_term_info(&self, term: &Term) -> io::Result<Option<TermInfo>> {
        self.termdict.get(term.serialized_value_bytes())
    }

    /// Return the term dictionary datastructure.
    pub fn terms(&self) -> &TermDictionary {
        &self.termdict
    }

    /// Return the fields and types encoded in the dictionary in lexicographic order.
    /// Only valid on JSON fields.
    ///
    /// Notice: This requires a full scan and therefore **very expensive**.
    /// TODO: Move to sstable to use the index.
    pub(crate) fn list_encoded_json_fields(&self) -> io::Result<Vec<InvertedIndexFieldSpace>> {
        let mut stream = self.termdict.stream()?;
        let mut fields: Vec<InvertedIndexFieldSpace> = Vec::new();

        let mut current_field_opt: Option<InvertedIndexFieldSpace> = None;
        // Current field bytes, including the JSON_END_OF_PATH.
        let mut current_field_bytes: Vec<u8> = Vec::new();

        while let Some((term, term_info)) = stream.next() {
            if let Some(current_field) = &mut current_field_opt {
                if term.starts_with(&current_field_bytes) {
                    // We are still in the same field.
                    current_field.record(term_info);
                    continue;
                }
            }

            // This is a new field!
            // Let's flush the current field.
            fields.extend(current_field_opt.take());
            current_field_bytes.clear();

            // And create a new one.
            let Some((field_name, field_type)) =
                extract_field_name_and_field_type_from_json_path(term)
            else {
                error!(
                    "invalid term bytes encountered {term:?}. this only happens if the term \
                     dictionary is corrupted. please report"
                );
                continue;
            };
            let mut field_space = InvertedIndexFieldSpace {
                field_name,
                field_type,
                postings_size: ByteCount::default(),
                positions_size: ByteCount::default(),
                num_terms: 0u64,
            };
            field_space.record(term_info);

            // We include the json type and the json end of path to make sure the prefix check
            // is meaningful.
            current_field_bytes.extend_from_slice(&term[..field_space.field_name.len() + 2]);
            current_field_opt = Some(field_space);
        }

        // We need to flush the last field as well.
        fields.extend(current_field_opt.take());

        Ok(fields)
    }

    /// Resets the block segment to another position of the postings
    /// file.
    ///
    /// This is useful for enumerating through a list of terms,
    /// and consuming the associated posting lists while avoiding
    /// reallocating a [`BlockSegmentPostings`].
    ///
    /// # Warning
    ///
    /// This does not reset the positions list.
    pub fn reset_block_postings_from_terminfo(
        &self,
        term_info: &TermInfo,
        block_postings: &mut BlockSegmentPostings,
    ) -> io::Result<()> {
        let postings_slice = self
            .postings_file_slice
            .slice(term_info.postings_range.clone());
        let postings_bytes = postings_slice.read_bytes()?;
        block_postings.reset(term_info.doc_freq, postings_bytes)?;
        Ok(())
    }

    /// Returns a block postings given a `Term`.
    /// This method is for an advanced usage only.
    ///
    /// Most users should prefer using [`Self::read_postings()`] instead.
    pub fn read_block_postings(
        &self,
        term: &Term,
        option: IndexRecordOption,
    ) -> io::Result<Option<BlockSegmentPostings>> {
        self.get_term_info(term)?
            .map(move |term_info| self.read_block_postings_from_terminfo(&term_info, option))
            .transpose()
    }

    /// Returns a block postings given a `term_info`.
    /// This method is for an advanced usage only.
    ///
    /// Most users should prefer using [`Self::read_postings()`] instead.
    pub fn read_block_postings_from_terminfo(
        &self,
        term_info: &TermInfo,
        requested_option: IndexRecordOption,
    ) -> io::Result<BlockSegmentPostings> {
        let postings_data = self
            .postings_file_slice
            .slice(term_info.postings_range.clone());
        BlockSegmentPostings::open(
            term_info.doc_freq,
            postings_data,
            self.record_option,
            requested_option,
        )
    }

    /// Returns a posting object given a `term_info`.
    /// This method is for an advanced usage only.
    ///
    /// Most users should prefer using [`Self::read_postings()`] instead.
    pub fn read_postings_from_terminfo(
        &self,
        term_info: &TermInfo,
        option: IndexRecordOption,
    ) -> io::Result<SegmentPostings> {
        let option = option.downgrade(self.record_option);

        let block_postings = self.read_block_postings_from_terminfo(term_info, option)?;
        let position_reader = {
            if option.has_positions() {
                let positions_data = self
                    .positions_file_slice
                    .read_bytes_slice(term_info.positions_range.clone())?;
                let position_reader = PositionReader::open(positions_data)?;
                Some(position_reader)
            } else {
                None
            }
        };
        Ok(SegmentPostings::from_block_postings(
            block_postings,
            position_reader,
        ))
    }

    /// Returns the total number of tokens recorded for all documents
    /// (including deleted documents).
    pub fn total_num_tokens(&self) -> u64 {
        self.total_num_tokens
    }

    /// Returns the segment postings associated with the term, and with the given option,
    /// or `None` if the term has never been encountered and indexed.
    ///
    /// If the field was not indexed with the indexing options that cover
    /// the requested options, the returned [`SegmentPostings`] the method does not fail
    /// and returns a `SegmentPostings` with as much information as possible.
    ///
    /// For instance, requesting [`IndexRecordOption::WithFreqs`] for a
    /// [`TextOptions`](crate::schema::TextOptions) that does not index position
    /// will return a [`SegmentPostings`] with `DocId`s and frequencies.
    pub fn read_postings(
        &self,
        term: &Term,
        option: IndexRecordOption,
    ) -> io::Result<Option<SegmentPostings>> {
        self.get_term_info(term)?
            .map(move |term_info| self.read_postings_from_terminfo(&term_info, option))
            .transpose()
    }

    /// Returns the number of documents containing the term.
    pub fn doc_freq(&self, term: &Term) -> io::Result<u32> {
        Ok(self
            .get_term_info(term)?
            .map(|term_info| term_info.doc_freq)
            .unwrap_or(0u32))
    }
}

#[cfg(feature = "quickwit")]
impl InvertedIndexReader {
    /// Asynchronously looks up `term` in the term dictionary.
    ///
    /// The lookup key is the term's serialized value bytes; the result is whatever the
    /// dictionary's `get_async` yields for that key.
    pub(crate) async fn get_term_info_async(&self, term: &Term) -> io::Result<Option<TermInfo>> {
        self.termdict.get_async(term.serialized_value_bytes()).await
    }

    /// Returns an iterator over the [`TermInfo`]s of the terms that lie within `terms`
    /// and are matched by `automaton`.
    ///
    /// - `terms`: bounds applied on the serialized value bytes of the terms.
    /// - `automaton`: automaton handed to the term dictionary search.
    /// - `limit`: optional maximum number of `TermInfo`s yielded by the returned iterator.
    /// - `merge_holes_under_bytes`: forwarded to `into_stream_async_merging_holes` when
    ///   the underlying stream is built.
    ///
    /// # Errors
    /// Propagates the I/O error raised while building the asynchronous stream.
    async fn get_term_range_async<'a, A: Automaton + 'a>(
        &'a self,
        terms: impl std::ops::RangeBounds<Term>,
        automaton: A,
        limit: Option<u64>,
        merge_holes_under_bytes: usize,
    ) -> io::Result<impl Iterator<Item = TermInfo> + 'a>
    where
        A::State: Clone,
    {
        use std::ops::Bound;
        let range_builder = self.termdict.search(automaton);
        let range_builder = match terms.start_bound() {
            Bound::Included(bound) => range_builder.ge(bound.serialized_value_bytes()),
            Bound::Excluded(bound) => range_builder.gt(bound.serialized_value_bytes()),
            Bound::Unbounded => range_builder,
        };
        let range_builder = match terms.end_bound() {
            Bound::Included(bound) => range_builder.le(bound.serialized_value_bytes()),
            Bound::Excluded(bound) => range_builder.lt(bound.serialized_value_bytes()),
            Bound::Unbounded => range_builder,
        };
        let range_builder = if let Some(limit) = limit {
            range_builder.limit(limit)
        } else {
            range_builder
        };

        let mut stream = range_builder
            .into_stream_async_merging_holes(merge_holes_under_bytes)
            .await?;

        let iter = std::iter::from_fn(move || stream.next().map(|(_k, v)| v.clone()));

        // limit on stream is only an optimization to load less data, the stream may still return
        // more than limit elements.
        //
        // A limit that does not fit in a `usize` saturates to `usize::MAX` rather than being
        // truncated: an `as` cast would silently turn e.g. `1 << 32` into `0` on 32-bit targets.
        let limit = limit.map_or(usize::MAX, |limit| {
            usize::try_from(limit).unwrap_or(usize::MAX)
        });
        let iter = iter.take(limit);

        Ok(iter)
    }

    /// Warms up the postings of a single `Term`.
    /// This method is for an advanced usage only.
    ///
    /// The postings byte range of the term is read asynchronously; when `with_positions`
    /// is set, the read of its positions byte range is joined with it.
    ///
    /// Returns a boolean: whether the term was found in the dictionary.
    pub async fn warm_postings(&self, term: &Term, with_positions: bool) -> io::Result<bool> {
        let Some(term_info) = self.get_term_info_async(term).await? else {
            // Unknown term: there is nothing to load.
            return Ok(false);
        };
        let postings_fut = self
            .postings_file_slice
            .read_bytes_slice_async(term_info.postings_range.clone());
        if !with_positions {
            postings_fut.await?;
            return Ok(true);
        }
        let positions_fut = self
            .positions_file_slice
            .read_bytes_slice_async(term_info.positions_range.clone());
        futures_util::future::try_join(postings_fut, positions_fut).await?;
        Ok(true)
    }

    /// Warms up the postings of all the terms within a range of `Term`s.
    /// This method is for an advanced usage only.
    ///
    /// A single byte range, spanning from the start of the first matching term's data to
    /// the end of the last matching term's data, is read from the postings file (and from
    /// the positions file when `with_positions` is set).
    ///
    /// Returns a boolean: whether a term matching the range was found in the dictionary.
    pub async fn warm_postings_range(
        &self,
        terms: impl std::ops::RangeBounds<Term>,
        limit: Option<u64>,
        with_positions: bool,
    ) -> io::Result<bool> {
        let mut matching_term_infos = self
            .get_term_range_async(terms, AlwaysMatch, limit, 0)
            .await?;

        let first = match matching_term_infos.next() {
            Some(term_info) => term_info,
            // no key matches, nothing more to load
            None => return Ok(false),
        };
        // With a single match, the first term info is also the last one.
        let last = matching_term_infos
            .last()
            .unwrap_or_else(|| first.clone());

        let postings_fut = self
            .postings_file_slice
            .read_bytes_slice_async(first.postings_range.start..last.postings_range.end);
        if with_positions {
            let positions_fut = self
                .positions_file_slice
                .read_bytes_slice_async(first.positions_range.start..last.positions_range.end);
            futures_util::future::try_join(postings_fut, positions_fut).await?;
        } else {
            postings_fut.await?;
        }
        Ok(true)
    }

    /// Warmup the block postings of all the terms matched by an `Automaton`.
    /// This method is for an advanced usage only.
    ///
    /// `executor` receives the CPU-bound part of the work (walking the term dictionary and
    /// computing the merged posting ranges to load) as a boxed closure, and returns a future
    /// yielding an `io::Result<()>`. That future is awaited together with the downloads of
    /// the posting ranges.
    ///
    /// returns a boolean, whether at least one range of postings was loaded
    pub async fn warm_postings_automaton<
        A: Automaton + Clone + Send + 'static,
        E: FnOnce(Box<dyn FnOnce() -> io::Result<()> + Send>) -> F,
        F: std::future::Future<Output = io::Result<()>>,
    >(
        &self,
        automaton: A,
        // with_positions: bool, at the moment we have no use for it, and supporting it would add
        // complexity to the coalesce
        executor: E,
    ) -> io::Result<bool>
    where
        A::State: Clone,
    {
        // merge holes under 4MiB, that's how many bytes we can hope to receive during a TTFB from
        // S3 (~80MiB/s, and 50ms latency)
        const MERGE_HOLES_UNDER_BYTES: usize = (80 * 1024 * 1024 * 50) / 1000;
        // we build a first iterator to download everything. Simply calling the function already
        // downloads everything we need from the sstable, but doesn't start iterating over it.
        let _term_info_iter = self
            .get_term_range_async(.., automaton.clone(), None, MERGE_HOLES_UNDER_BYTES)
            .await?;

        // Channel carrying the merged posting ranges from the CPU-bound task to the downloader.
        let (sender, posting_ranges_to_load_stream) = futures_channel::mpsc::unbounded();
        let termdict = self.termdict.clone();
        let cpu_bound_task = move || {
            // then we build a 2nd iterator, this one with no holes, so we don't go through blocks
            // we can't match.
            // This makes the assumption there is a caching layer below us, which gives sync read
            // for free after the initial async access. This might not always be true, but is in
            // Quickwit.
            // We build things from this closure otherwise we get into lifetime issues that can only
            // be solved with self referential structs. Returning an io::Result from here is a bit
            // more leaky abstraction-wise, but a lot better than the alternative
            let mut stream = termdict.search(automaton).into_stream()?;

            // we could do without an iterator, but this allows us access to coalesce which
            // simplifies things
            let posting_ranges_iter =
                std::iter::from_fn(move || stream.next().map(|(_k, v)| v.postings_range.clone()));

            // Two consecutive ranges are merged when the hole between them is at most
            // MERGE_HOLES_UNDER_BYTES bytes long.
            let merged_posting_ranges_iter = posting_ranges_iter.coalesce(|range1, range2| {
                if range1.end + MERGE_HOLES_UNDER_BYTES >= range2.start {
                    Ok(range1.start..range2.end)
                } else {
                    Err((range1, range2))
                }
            });

            for posting_range in merged_posting_ranges_iter {
                if let Err(_) = sender.unbounded_send(posting_range) {
                    // this should happen only when search is cancelled
                    return Err(io::Error::other("failed to send posting range back"));
                }
            }
            Ok(())
        };
        let task_handle = executor(Box::new(cpu_bound_task));

        // Each received range is read from the postings file, with up to 5 reads in flight;
        // the bytes themselves are discarded, only the completion of each read is collected.
        let posting_downloader = posting_ranges_to_load_stream
            .map(|posting_slice| {
                self.postings_file_slice
                    .read_bytes_slice_async(posting_slice)
                    .map(|result| result.map(|_slice| ()))
            })
            .buffer_unordered(5)
            .try_collect::<Vec<()>>();

        let (_, slices_downloaded) =
            futures_util::future::try_join(task_handle, posting_downloader).await?;

        Ok(!slices_downloaded.is_empty())
    }

    /// Warmup the block postings for all terms.
    /// This method is for an advanced usage only.
    ///
    /// The whole postings file is read and, when `with_positions` is set, the whole
    /// positions file as well.
    ///
    /// If you know which terms to pre-load, prefer using [`Self::warm_postings`] or
    /// [`Self::warm_postings_range`] instead.
    pub async fn warm_postings_full(&self, with_positions: bool) -> io::Result<()> {
        self.postings_file_slice.read_bytes_async().await?;
        if with_positions {
            self.positions_file_slice.read_bytes_async().await?;
        }
        Ok(())
    }

    /// Returns the number of documents containing the term asynchronously.
    ///
    /// A term that is absent from the term dictionary has a document frequency of `0`.
    pub async fn doc_freq_async(&self, term: &Term) -> io::Result<u32> {
        let term_info_opt = self.get_term_info_async(term).await?;
        Ok(term_info_opt.map_or(0u32, |term_info| term_info.doc_freq))
    }
}


================================================
FILE: src/index/mod.rs
================================================
//! The `index` module in Tantivy contains core components to read and write indexes.
//!
//! It contains `Index` and `Segment`, where an `Index` consists of one or more `Segment`s.

mod index;
mod index_meta;
mod inverted_index_reader;
mod segment;
mod segment_component;
mod segment_id;
mod segment_reader;

pub use self::index::{Index, IndexBuilder};
pub(crate) use self::index_meta::SegmentMetaInventory;
pub use self::index_meta::{IndexMeta, IndexSettings, Order, SegmentMeta};
pub use self::inverted_index_reader::InvertedIndexReader;
pub use self::segment::Segment;
pub use self::segment_component::SegmentComponent;
pub use self::segment_id::SegmentId;
pub use self::segment_reader::{FieldMetadata, SegmentReader};


================================================
FILE: src/index/segment.rs
================================================
use std::fmt;
use std::path::PathBuf;

use super::SegmentComponent;
use crate::directory::error::{OpenReadError, OpenWriteError};
use crate::directory::{Directory, FileSlice, WritePtr};
use crate::index::{Index, SegmentId, SegmentMeta};
use crate::schema::Schema;
use crate::Opstamp;

/// A segment is a piece of the index.
///
/// It pairs the [`Index`] it belongs to with the [`SegmentMeta`] describing it.
#[derive(Clone)]
pub struct Segment {
    // Index this segment belongs to.
    index: Index,
    // Meta-information of the segment (id, `max_doc`, delete information).
    meta: SegmentMeta,
}

impl fmt::Debug for Segment {
    /// Formats the segment as `Segment("<uuid>")`, using the full uuid string of its id.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        let uuid = self.id().uuid_string();
        write!(f, "Segment({:?})", uuid)
    }
}

impl Segment {
    /// Creates a new segment given an `Index` and a `SegmentId`
    pub(crate) fn for_index(index: Index, meta: SegmentMeta) -> Segment {
        Segment { index, meta }
    }

    /// Returns the index the segment belongs to.
    pub fn index(&self) -> &Index {
        &self.index
    }

    /// Returns our index's schema.
    pub fn schema(&self) -> Schema {
        self.index.schema()
    }

    /// Returns the segment meta-information
    pub fn meta(&self) -> &SegmentMeta {
        &self.meta
    }

    /// Updates the max_doc value from the `SegmentMeta`.
    ///
    /// This method is only used when updating `max_doc` from 0
    /// as we finalize a fresh new segment.
    pub fn with_max_doc(self, max_doc: u32) -> Segment {
        Segment {
            index: self.index,
            meta: self.meta.with_max_doc(max_doc),
        }
    }

    #[doc(hidden)]
    #[must_use]
    pub fn with_delete_meta(self, num_deleted_docs: u32, opstamp: Opstamp) -> Segment {
        Segment {
            index: self.index,
            meta: self.meta.with_delete_meta(num_deleted_docs, opstamp),
        }
    }

    /// Returns the segment's id.
    pub fn id(&self) -> SegmentId {
        self.meta.id()
    }

    /// Returns the relative path of a component of our segment.
    ///
    /// It just joins the segment id with the extension
    /// associated with a segment component.
    pub fn relative_path(&self, component: SegmentComponent) -> PathBuf {
        self.meta.relative_path(component)
    }

    /// Open one of the component file for a *regular* read.
    pub fn open_read(&self, component: SegmentComponent) -> Result<FileSlice, OpenReadError> {
        let path = self.relative_path(component);
        self.index.directory().open_read(&path)
    }

    /// Open one of the component file for *regular* write.
    pub fn open_write(&mut self, component: SegmentComponent) -> Result<WritePtr, OpenWriteError> {
        let path = self.relative_path(component);
        let write = self.index.directory_mut().open_write(&path)?;
        Ok(write)
    }
}


================================================
FILE: src/index/segment_component.rs
================================================
use std::slice;

/// Enum describing each component of a tantivy segment.
///
/// Each component is stored in its own file,
/// using the pattern `segment_uuid`.`component_extension`,
/// except the delete component that takes a `segment_uuid`.`delete_opstamp`.`component_extension`
#[derive(Copy, Clone, Eq, PartialEq)]
pub enum SegmentComponent {
    /// Postings (or inverted list). Sorted lists of document ids, associated with terms
    Postings,
    /// Positions of terms in each document.
    Positions,
    /// Column-oriented random-access storage of fields.
    FastFields,
    /// Stores the sum of the length (in terms) of each field for each document.
    /// Field norms are stored as a special u64 fast field.
    FieldNorms,
    /// Dictionary associating `Term`s to `TermInfo`s which is
    /// simply an address into the `postings` file and the `positions` file.
    Terms,
    /// Row-oriented, compressed storage of the documents.
    /// Accessing a document from the store is relatively slow, as it
    /// requires to decompress the entire block it belongs to.
    Store,
    /// Bitset describing which document of the segment is alive.
    /// (It was representing deleted docs but changed to represent alive docs from v0.17)
    Delete,
}

impl SegmentComponent {
    /// Iterates through all of the components, in their declaration order.
    pub fn iterator() -> slice::Iter<'static, SegmentComponent> {
        const ALL_COMPONENTS: &[SegmentComponent] = &[
            SegmentComponent::Postings,
            SegmentComponent::Positions,
            SegmentComponent::FastFields,
            SegmentComponent::FieldNorms,
            SegmentComponent::Terms,
            SegmentComponent::Store,
            SegmentComponent::Delete,
        ];
        ALL_COMPONENTS.iter()
    }
}


================================================
FILE: src/index/segment_id.rs
================================================
use std::cmp::Ordering;
use std::error::Error;
use std::fmt;
use std::str::FromStr;
#[cfg(test)]
use std::sync::atomic;

#[cfg(test)]
use once_cell::sync::Lazy;
use serde::{Deserialize, Serialize};
use uuid::Uuid;

/// Uuid identifying a segment.
///
/// Tantivy's segments are identified
/// by a UUID which is used to prefix the filenames
/// of all of the files associated with the segment.
///
/// In unit tests, for reproducibility, the `SegmentId`s are
/// simply generated in an autoincrement fashion.
#[derive(Clone, Copy, PartialEq, Eq, Hash, Serialize, Deserialize)]
pub struct SegmentId(Uuid);

// Counter backing the auto-incremented segment ids generated in test builds.
#[cfg(test)]
static AUTO_INC_COUNTER: Lazy<atomic::AtomicUsize> = Lazy::new(atomic::AtomicUsize::default);

// All-zero last field of the uuids built in test builds.
#[cfg(test)]
const ZERO_ARRAY: [u8; 8] = [0u8; 8];

// During tests, segment ids are generated in an autoincrement manner
// so that they are consistent from one run to the next.
//
// The order of the test execution is not guaranteed, but the order
// of segments within a single test is guaranteed.
#[cfg(test)]
fn create_uuid() -> Uuid {
    let next_id = AUTO_INC_COUNTER.fetch_add(1, atomic::Ordering::SeqCst);
    Uuid::from_fields(next_id as u32, 0, 0, &ZERO_ARRAY)
}

// Outside of tests, segment ids are version 4 uuids.
#[cfg(not(test))]
fn create_uuid() -> Uuid {
    Uuid::new_v4()
}

impl SegmentId {
    #[doc(hidden)]
    pub fn generate_random() -> SegmentId {
        SegmentId(create_uuid())
    }

    /// Returns a shorter identifier of the segment.
    ///
    /// We are using UUID4, so only 6 bits are fixed,
    /// and the rest is random.
    ///
    /// Picking the first 8 chars is ok to identify
    /// segments in a display message (e.g. a5c4dfcb).
    pub fn short_uuid_string(&self) -> String {
        self.0.as_simple().to_string()[..8].to_string()
    }

    /// Returns a segment uuid string.
    ///
    /// It consists in 32 lowercase hexadecimal chars
    /// (e.g. a5c4dfcbdfe645089129e308e26d5523)
    pub fn uuid_string(&self) -> String {
        self.0.as_simple().to_string()
    }

    /// Build a `SegmentId` string from the full uuid string.
    ///
    /// E.g. "a5c4dfcbdfe645089129e308e26d5523"
    pub fn from_uuid_string(uuid_string: &str) -> Result<SegmentId, SegmentIdParseError> {
        FromStr::from_str(uuid_string)
    }
}

/// Error type used when parsing a `SegmentId` from a string fails.
///
/// It wraps the underlying [`uuid::Error`].
pub struct SegmentIdParseError(uuid::Error);

// No method is overridden: the default `Error` implementation is used.
impl Error for SegmentIdParseError {}

impl fmt::Debug for SegmentIdParseError {
    /// Delegates to the `Debug` formatting of the wrapped uuid error.
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        fmt::Debug::fmt(&self.0, f)
    }
}

impl fmt::Display for SegmentIdParseError {
    /// Delegates to the `Display` formatting of the wrapped uuid error.
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        fmt::Display::fmt(&self.0, f)
    }
}

impl FromStr for SegmentId {
    type Err = SegmentIdParseError;

    fn from_str(uuid_string: &str) -> Result<Self, SegmentIdParseError> {
        let uuid = Uuid::parse_str(uuid_string).map_err(SegmentIdParseError)?;
        Ok(SegmentId(uuid))
    }
}

impl fmt::Debug for SegmentId {
    /// Formats the id as `Seg("<short uuid>")`.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        let short_uuid = self.short_uuid_string();
        write!(f, "Seg({:?})", short_uuid)
    }
}

impl fmt::Display for SegmentId {
    /// Formats the id as `Seg("<short uuid>")`, exactly like its `Debug` representation.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        let short_uuid = self.short_uuid_string();
        write!(f, "Seg({:?})", short_uuid)
    }
}

impl PartialOrd for SegmentId {
    /// Always returns `Some`: the ordering is the total order defined by `Ord::cmp`.
    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
        Some(self.cmp(other))
    }
}

impl Ord for SegmentId {
    /// Orders segment ids by comparing the bytes of their uuids.
    fn cmp(&self, other: &Self) -> Ordering {
        let (lhs_bytes, rhs_bytes) = (self.0.as_bytes(), other.0.as_bytes());
        lhs_bytes.cmp(rhs_bytes)
    }
}

#[cfg(test)]
mod tests {
    use super::SegmentId;

    // Round-trips a full uuid string through `SegmentId` and checks both string
    // representations, as well as the rejection of a malformed input.
    #[test]
    fn test_to_uuid_string() {
        let full_uuid = "a5c4dfcbdfe645089129e308e26d5523";
        let segment_id = SegmentId::from_uuid_string(full_uuid).unwrap();
        assert_eq!(segment_id.uuid_string(), full_uuid);
        // The short form is made of the first 8 chars of the full form.
        assert_eq!(segment_id.short_uuid_string(), "a5c4dfcb");
        // one extra char
        assert!(SegmentId::from_uuid_string("a5c4dfcbdfe645089129e308e26d5523b").is_err());
    }
}


================================================
FILE: src/index/segment_reader.rs
================================================
use std::collections::HashMap;
use std::sync::{Arc, RwLock};
use std::{fmt, io};

use common::{ByteCount, HasLen};
use fnv::FnvHashMap;
use itertools::Itertools;

use crate::directory::{CompositeFile, FileSlice};
use crate::error::DataCorruption;
use crate::fastfield::{intersect_alive_bitsets, AliveBitSet, FacetReader, FastFieldReaders};
use crate::fieldnorm::{FieldNormReader, FieldNormReaders};
use crate::index::{InvertedIndexReader, Segment, SegmentComponent, SegmentId};
use crate::json_utils::json_path_sep_to_dot;
use crate::schema::{Field, IndexRecordOption, Schema, Type};
use crate::space_usage::SegmentSpaceUsage;
use crate::store::StoreReader;
use crate::termdict::TermDictionary;
use crate::{DocId, Opstamp};

/// Entry point to access all of the datastructures of the `Segment`
///
/// - term dictionary
/// - postings
/// - store
/// - fast field readers
/// - field norm reader
///
/// The segment reader has a very low memory footprint,
/// as close to all of the memory data is mmapped.
#[derive(Clone)]
pub struct SegmentReader {
    // Per-field cache of the inverted index readers opened through `inverted_index`.
    inv_idx_reader_cache: Arc<RwLock<HashMap<Field, Arc<InvertedIndexReader>>>>,

    // Id of the segment this reader was opened from.
    segment_id: SegmentId,
    // Delete opstamp taken from the segment meta when the reader was opened.
    delete_opstamp: Option<Opstamp>,

    // Highest document id ever attributed in this segment + 1.
    max_doc: DocId,
    // Number of alive documents.
    num_docs: DocId,

    // Composite files, each of them being opened per field.
    termdict_composite: CompositeFile,
    postings_composite: CompositeFile,
    positions_composite: CompositeFile,
    fast_fields_readers: FastFieldReaders,
    fieldnorm_readers: FieldNormReaders,

    // File slice of the document store component.
    store_file: FileSlice,
    // Alive bitset computed when the reader was opened; `None` if there is none.
    alive_bitset_opt: Option<AliveBitSet>,
    // Schema of the index the segment belongs to.
    schema: Schema,
}

impl SegmentReader {
    /// Returns the highest document id ever attributed in
    /// this segment + 1.
    ///
    /// Unlike [`Self::num_docs`], deleted documents are part of this count.
    pub fn max_doc(&self) -> DocId {
        self.max_doc
    }

    /// Returns the number of alive documents.
    /// Deleted documents are not counted.
    ///
    /// When the reader has no alive bitset, this is equal to [`Self::max_doc`].
    pub fn num_docs(&self) -> DocId {
        self.num_docs
    }

    /// Returns a reference to the schema of the index this segment belongs to.
    pub fn schema(&self) -> &Schema {
        &self.schema
    }

    /// Returns the number of documents that have been
    /// deleted in the segment.
    ///
    /// It is computed as `max_doc - num_docs`.
    pub fn num_deleted_docs(&self) -> DocId {
        self.max_doc - self.num_docs
    }

    /// Returns true if some of the documents of the segment have been deleted,
    /// i.e. if [`Self::num_deleted_docs`] is greater than zero.
    pub fn has_deletes(&self) -> bool {
        self.num_deleted_docs() > 0
    }

    /// Accessor to the segment's fast field readers.
    ///
    /// This method takes no field: it returns a reference to the [`FastFieldReaders`]
    /// of the segment, on which the column of a specific field can then be requested
    /// (see for instance the `str` lookup done in [`Self::facet_reader`]).
    pub fn fast_fields(&self) -> &FastFieldReaders {
        &self.fast_fields_readers
    }

    /// Accessor to the `FacetReader` associated with the field named `field_name`.
    ///
    /// # Errors
    /// Fails if the schema lookup of `field_name` fails, if the field is not a facet
    /// field, or if the fast field lookup itself returns an error.
    ///
    /// # Panics
    /// Panics if the field is a facet field but no matching fast field column is found.
    pub fn facet_reader(&self, field_name: &str) -> crate::Result<FacetReader> {
        let field = self.schema.get_field(field_name)?;
        let value_type = self.schema.get_field_entry(field).field_type().value_type();
        if value_type != Type::Facet {
            let err_msg = format!("`{field_name}` is not a facet field.`");
            return Err(crate::TantivyError::SchemaError(err_msg));
        }
        match self.fast_fields().str(field_name)? {
            Some(facet_column) => Ok(FacetReader::new(facet_column)),
            None => panic!("Facet Field `{field_name}` is missing. This should not happen"),
        }
    }

    /// Accessor to the field norm reader of the given `field`.
    ///
    /// Field norms are the length (in tokens) of the fields.
    /// It is used in the computation of the [TfIdf](https://fulmicoton.gitbooks.io/tantivy-doc/content/tfidf.html).
    ///
    /// They are simply stored as a fast field, serialized in
    /// the `.fieldnorm` file of the segment.
    ///
    /// # Errors
    /// Returns a schema error if no field norm is found for `field`.
    pub fn get_fieldnorms_reader(&self, field: Field) -> crate::Result<FieldNormReader> {
        match self.fieldnorm_readers.get_field(field)? {
            Some(fieldnorm_reader) => Ok(fieldnorm_reader),
            None => {
                let field_name = self.schema.get_field_name(field);
                let err_msg = format!(
                    "Field norm not found for field {field_name:?}. Was the field set to record norm \
                     during indexing?"
                );
                Err(crate::TantivyError::SchemaError(err_msg))
            }
        }
    }

    /// Returns a reference to the field norm readers of the segment.
    #[doc(hidden)]
    pub fn fieldnorms_readers(&self) -> &FieldNormReaders {
        &self.fieldnorm_readers
    }

    /// Accessor to the segment's [`StoreReader`](crate::store::StoreReader).
    ///
    /// `cache_num_blocks` sets the number of decompressed blocks to be cached in an LRU.
    /// The size of blocks is configurable, which should be taken into account when
    /// choosing `cache_num_blocks`.
    ///
    /// Each call opens a new `StoreReader` over a clone of the store file slice.
    pub fn get_store_reader(&self, cache_num_blocks: usize) -> io::Result<StoreReader> {
        StoreReader::open(self.store_file.clone(), cache_num_blocks)
    }

    /// Open a new segment for reading.
    ///
    /// Equivalent to [`Self::open_with_custom_alive_set`] without any custom alive bitset.
    pub fn open(segment: &Segment) -> crate::Result<SegmentReader> {
        Self::open_with_custom_alive_set(segment, None)
    }

    /// Open a new segment for reading, optionally restricted by a custom alive bitset.
    ///
    /// The component files of the segment are opened, and `custom_bitset` is combined with
    /// the alive bitset stored in the segment (if the segment meta reports deletes) through
    /// `intersect_alive_bitset`. The number of alive documents is then taken from the
    /// resulting bitset, or is `max_doc` when there is no bitset at all.
    ///
    /// # Errors
    /// Fails if one of the required components cannot be opened or read. The positions
    /// component is the exception: when it cannot be opened, an empty composite file is used.
    pub fn open_with_custom_alive_set(
        segment: &Segment,
        custom_bitset: Option<AliveBitSet>,
    ) -> crate::Result<SegmentReader> {
        let termdict_file = segment.open_read(SegmentComponent::Terms)?;
        let termdict_composite = CompositeFile::open(&termdict_file)?;

        let store_file = segment.open_read(SegmentComponent::Store)?;

        crate::fail_point!("SegmentReader::open#middle");

        let postings_file = segment.open_read(SegmentComponent::Postings)?;
        let postings_composite = CompositeFile::open(&postings_file)?;

        // NOTE(review): any error while opening the positions file (not only a missing
        // file) falls back to an empty composite file.
        let positions_composite = {
            if let Ok(positions_file) = segment.open_read(SegmentComponent::Positions) {
                CompositeFile::open(&positions_file)?
            } else {
                CompositeFile::empty()
            }
        };

        let schema = segment.schema();

        let fast_fields_data = segment.open_read(SegmentComponent::FastFields)?;
        let fast_fields_readers = FastFieldReaders::open(fast_fields_data, schema.clone())?;
        let fieldnorm_data = segment.open_read(SegmentComponent::FieldNorms)?;
        let fieldnorm_readers = FieldNormReaders::open(fieldnorm_data)?;

        // The delete component is only read when the segment meta reports deletes.
        let original_bitset = if segment.meta().has_deletes() {
            let alive_doc_file_slice = segment.open_read(SegmentComponent::Delete)?;
            let alive_doc_data = alive_doc_file_slice.read_bytes()?;
            Some(AliveBitSet::open(alive_doc_data))
        } else {
            None
        };

        let alive_bitset_opt = intersect_alive_bitset(original_bitset, custom_bitset);

        let max_doc = segment.meta().max_doc();
        // Without any alive bitset, all of the documents are considered alive.
        let num_docs = alive_bitset_opt
            .as_ref()
            .map(|alive_bitset| alive_bitset.num_alive_docs() as u32)
            .unwrap_or(max_doc);

        Ok(SegmentReader {
            inv_idx_reader_cache: Default::default(),
            num_docs,
            max_doc,
            termdict_composite,
            postings_composite,
            fast_fields_readers,
            fieldnorm_readers,
            segment_id: segment.id(),
            delete_opstamp: segment.meta().delete_opstamp(),
            store_file,
            alive_bitset_opt,
            positions_composite,
            schema,
        })
    }

    /// Returns the inverted index reader associated with `field`.
    ///
    /// The reader is in charge of iterating through the term dictionary of that field,
    /// and of opening the posting list associated with any term. Non-empty readers are
    /// cached per field, so that later calls hand out a clone of the same `Arc`.
    ///
    /// An empty `InvertedIndexReader` is returned when:
    /// - the field is not marked as indexed (a warning is logged), or
    /// - the field is marked as indexed but the segment holds no postings for it
    ///   (no warning is logged).
    ///
    /// # Errors
    /// Returns a data corruption error if postings exist for the field but its term
    /// dictionary or its positions cannot be opened in their composite file.
    pub fn inverted_index(&self, field: Field) -> crate::Result<Arc<InvertedIndexReader>> {
        {
            let cache = self
                .inv_idx_reader_cache
                .read()
                .expect("Lock poisoned. This should never happen");
            if let Some(cached_reader) = cache.get(&field) {
                return Ok(Arc::clone(cached_reader));
            }
            // The read guard is released at the end of this scope, before the write lock
            // is requested further down.
        }

        let field_entry = self.schema.get_field_entry(field);
        let record_option_opt = field_entry.field_type().get_index_record_option();
        if record_option_opt.is_none() {
            warn!("Field {:?} does not seem indexed.", field_entry.name());
        }

        let (Some(record_option), Some(postings_file)) =
            (record_option_opt, self.postings_composite.open_read(field))
        else {
            // no documents in the segment contained this field.
            // As a result, no data is associated with the inverted index.
            //
            // Returns an empty inverted index.
            let record_option = record_option_opt.unwrap_or(IndexRecordOption::Basic);
            return Ok(Arc::new(InvertedIndexReader::empty(record_option)));
        };

        let termdict_file: FileSlice =
            self.termdict_composite.open_read(field).ok_or_else(|| {
                let error_msg = format!(
                    "Failed to open field {:?}'s term dictionary in the composite file. Has the \
                     schema been modified?",
                    field_entry.name()
                );
                DataCorruption::comment_only(error_msg)
            })?;

        let positions_file = self.positions_composite.open_read(field).ok_or_else(|| {
            let error_msg = format!(
                "Failed to open field {:?}'s positions in the composite file. Has the schema been \
                 modified?",
                field_entry.name()
            );
            DataCorruption::comment_only(error_msg)
        })?;

        let termdict = TermDictionary::open(termdict_file)?;
        let reader = InvertedIndexReader::new(termdict, postings_file, positions_file, record_option)?;
        let shared_reader = Arc::new(reader);

        // by releasing the lock in between, we may end up opening the inverted index
        // twice, but this is fine.
        let mut cache = self
            .inv_idx_reader_cache
            .write()
            .expect("Field reader cache lock poisoned. This should never happen.");
        cache.insert(field, Arc::clone(&shared_reader));
        drop(cache);

        Ok(shared_reader)
    }

    /// Returns the list of fields that have been indexed in the segment.
    /// The field list includes the field defined in the schema as well as the fields
    /// that have been indexed as a part of a JSON field.
    /// The returned field name is the full field name, including the name of the JSON field.
    ///
    /// The returned field names can be used in queries.
    ///
    /// Notice: If your data contains JSON fields this is **very expensive**, as it requires
    /// browsing through the inverted index term dictionary and the columnar field dictionary.
    ///
    /// Disclaimer: Some fields may not be listed here. For instance, if the schema contains a json
    /// field that is not indexed nor a fast field but is stored, it is possible for the field
    /// to not be listed.
    pub fn fields_metadata(&self) -> crate::Result<Vec<FieldMetadata>> {
        let mut indexed_fields: Vec<FieldMetadata> = Vec::new();
        let mut map_to_canonical = FnvHashMap::default();
        for (field, field_entry) in self.schema().fields() {
            let field_name = field_entry.name().to_string();
            let is_indexed = field_entry.is_indexed();
            if is_indexed {
                let is_json = field_entry.field_type().value_type() == Type::Json;
                if is_json {
                    let term_dictionary_json_field_num_bytes: u64 = self
                        .termdict_composite
                        .open_read(field)
                        .map(|file_slice| file_slice.len() as u64)
                        .unwrap_or(0u64);
                    let inv_index = self.inverted_index(field)?;
                    let encoded_fields_in_index = inv_index.list_encoded_json_fields()?;
                    let mut build_path = |field_name: &str, mut json_path: String| {
                        // In this case we need to map the potential fast field to the field name
                        // accepted by the query parser.
                        let create_canonical =
                            !field_entry.is_expand_dots_enabled() && json_path.contains('.');
                        if create_canonical {
                            // Without expand dots enabled dots need to be escaped.
                            let escaped_json_path = json_path.replace('.', "\\.");
                            let full_path = format!("{field_name}.{escaped_json_path}");
                            let full_path_unescaped = format!("{}.{}", field_name, &json_path);
                            map_to_canonical.insert(full_path_unescaped, full_path.to_string());
                            full_path
                        } else {
                            // With expand dots enabled, we can use '.' instead of '\u{1}'.
                            json_path_sep_to_dot(&mut json_path);
                            format!("{field_name}.{json_path}")
                        }
                    };
                    let total_num_terms = encoded_fields_in_index
                        .iter()
                        .map(|field_space| field_space.num_terms)
                        .sum();
                    indexed_fields.extend(encoded_fields_in_index.into_iter().map(|field_space| {
                        let field_name = build_path(&field_name, field_space.field_name);
                        // It is complex to attribute the exact amount of bytes required by specific
                        // field in the json field. Instead, as a proxy, we
                        // attribute the total amount of bytes for the entire json field,
                        // proportionally to the number of terms in each
                        // fields.
                        let term_dictionary_size = (term_dictionary_json_field_num_bytes
                            * field_space.num_terms)
                            .checked_div(total_num_terms)
                            .unwrap_or(0);
                        FieldMetadata {
                            postings_size: Some(field_space.postings_size),
                            positions_size: Some(field_space.positions_size),
                            term_dictionary_size: Some(ByteCount::from(term_dictionary_size)),
                            fast_size: None,
                            // The stored flag will be set at the end of this function!
                            stored: field_entry.is_stored(),
                            field_name,
                            typ: field_space.field_type,
                        }
                    }));
                } else {
                    let postings_size: ByteCount = self
                        .postings_composite
                        .open_read(field)
                        .map(|posting_fileslice| posting_fileslice.len())
                        .unwrap_or(0)
                        .into();
                    let positions_size: ByteCount = self
                        .positions_composite
                        .open_read(field)
                        .map(|positions_fileslice| positions_fileslice.len())
                        .unwrap_or(0)
                        .into();
                    let term_dictionary_size: ByteCount = self
                        .termdict_composite
                        .open_read(field)
                        .map(|term_dictionary_fileslice| term_dictionary_fileslice.len())
                        .unwrap_or(0)
                        .into();
                    indexed_fields.push(FieldMetadata {
                        field_name: field_name.to_string(),
                        typ: field_entry.field_type().value_type(),
                        // The stored flag will be set at the end of this function!
                        stored: field_entry.is_stored(),
                        fast_size: None,
                        term_dictionary_size: Some(term_dictionary_size),
                        postings_size: Some(postings_size),
                        positions_size: Some(positions_size),
                    });
                }
            }
        }
        let fast_fields: Vec<FieldMetadata> = self
            .fast_fields()
            .columnar()
            .iter_columns()?
            .map(|(mut field_name, handle)| {
                json_path_sep_to_dot(&mut field_name);
                // map to canonical path, to avoid similar but different entries.
                // Eventually we should just accept '.' separated for all cases.
                let field_name = map_to_canonical
                    .get(&field_name)
                    .unwrap_or(&field_name)
                    .to_string();
                let stored = is_field_stored(&field_name, &self.schema);
                FieldMetadata {
                    field_name,
                    typ: Type::from(handle.column_type()),
                    stored,
                    fast_size: Some(handle.num_bytes()),
                    term_dictionary_size: None,
                    postings_size: None,
                    positions_size: None,
                }
            })
            .collect();
        let merged_field_metadatas: Vec<FieldMetadata> =
            merge_field_meta_data(vec![indexed_fields, fast_fields]);
        Ok(merged_field_metadatas)
    }

    /// Returns the id of the segment this reader was opened on.
    ///
    /// The value is a copy of the reader's `segment_id` field.
    pub fn segment_id(&self) -> SegmentId {
        self.segment_id
    }

    /// Returns the delete opstamp recorded on this reader, if any.
    ///
    /// `None` is returned when the reader holds no delete opstamp.
    pub fn delete_opstamp(&self) -> Option<Opstamp> {
        self.delete_opstamp
    }

    /// Returns the bitset representing the alive `DocId`s.
    ///
    /// `None` is returned when the reader holds no alive bitset; `is_deleted`
    /// and `doc_ids_alive` then treat every doc id as alive.
    pub fn alive_bitset(&self) -> Option<&AliveBitSet> {
        self.alive_bitset_opt.as_ref()
    }

    /// Tells whether `doc` is marked as deleted in this segment.
    ///
    /// When the reader holds no alive bitset, `false` is returned for every `doc`.
    pub fn is_deleted(&self, doc: DocId) -> bool {
        match self.alive_bitset() {
            Some(alive_bitset) => alive_bitset.is_deleted(doc),
            None => false,
        }
    }

    /// Returns a boxed iterator over the doc ids that are still alive.
    ///
    /// With an alive bitset, the iteration is delegated to it. Without one,
    /// every doc id in `0..max_doc` is yielded.
    pub fn doc_ids_alive(&self) -> Box<dyn Iterator<Item = DocId> + Send + '_> {
        match self.alive_bitset_opt.as_ref() {
            Some(alive_bitset) => Box::new(alive_bitset.iter_alive()),
            None => Box::new(0u32..self.max_doc),
        }
    }

    /// Summarizes the total space usage of this segment.
    ///
    /// The individual usages (term dictionary, postings, positions, fast fields,
    /// fieldnorms, doc store and alive bitset) are gathered one by one and handed
    /// to `SegmentSpaceUsage::new`.
    ///
    /// # Errors
    ///
    /// Propagates the error raised while computing the fast field usage or while
    /// opening the store reader.
    pub fn space_usage(&self) -> io::Result<SegmentSpaceUsage> {
        // The components are computed in the same order as the constructor
        // arguments, so the first failing step is the one being reported.
        let num_docs = self.num_docs();
        let termdict_usage = self.termdict_composite.space_usage(self.schema());
        let postings_usage = self.postings_composite.space_usage(self.schema());
        let positions_usage = self.positions_composite.space_usage(self.schema());
        let fast_fields_usage = self.fast_fields_readers.space_usage()?;
        let fieldnorms_usage = self.fieldnorm_readers.space_usage(self.schema());
        // NOTE(review): the `0` argument is presumably a cache size; confirm against
        // `get_store_reader`.
        let store_usage = self.get_store_reader(0)?.space_usage();
        // No alive bitset: fall back to the default usage value.
        let alive_bitset_usage = match self.alive_bitset_opt.as_ref() {
            Some(alive_bitset) => AliveBitSet::space_usage(alive_bitset),
            None => Default::default(),
        };
        Ok(SegmentSpaceUsage::new(
            num_docs,
            termdict_usage,
            postings_usage,
            positions_usage,
            fast_fields_usage,
            fieldnorms_usage,
            store_usage,
            alive_bitset_usage,
        ))
    }
}

#[derive(Clone, Debug, PartialEq, Eq, PartialOrd, Ord)]
/// Metadata about a single field: its name, type, stored flag and the size it
/// occupies in the different storages.
///
/// The derived ordering compares `field_name` first, then `typ`, which is what
/// `merge_field_meta_data` relies on when sorting and grouping entries.
pub struct FieldMetadata {
    /// The field name
    // Notice: Don't reorder the declaration of 1.field_name 2.typ, as it is used for ordering by
    // field_name then typ.
    pub field_name: String,
    /// The field type
    // Notice: Don't reorder the declaration of 1.field_name 2.typ, as it is used for ordering by
    // field_name then typ.
    pub typ: Type,
    /// Is the field stored in the doc store
    pub stored: bool,
    /// Size occupied in the columnar storage (None if not fast)
    pub fast_size: Option<ByteCount>,
    /// Size occupied by the term dictionary (None if not indexed)
    pub term_dictionary_size: Option<ByteCount>,
    /// Size occupied in the index postings storage (None if not indexed)
    pub postings_size: Option<ByteCount>,
    /// Size occupied in the index positions storage (None if not indexed)
    pub positions_size: Option<ByteCount>,
}

/// Combines two optional byte counts.
///
/// When both sides are present their sum is returned; otherwise whichever
/// side is present is returned (or `None` if neither is).
fn merge_options(left: Option<ByteCount>, right: Option<ByteCount>) -> Option<ByteCount> {
    match left.zip(right) {
        Some((l, r)) => Some(l + r),
        // At most one side is set here, so `or` simply picks it.
        None => left.or(right),
    }
}

impl FieldMetadata {
    /// Returns true if and only if the field is indexed.
    pub fn is_indexed(&self) -> bool {
        self.postings_size.is_some()
    }

    /// Returns true if and only if the field is a fast field (i.e.: recorded in  columnar format).
    pub fn is_fast(&self) -> bool {
        self.fast_size.is_some()
    }

    /// Merges two field metadata.
    pub fn merge(&mut self, rhs: Self) {
        assert_eq!(self.field_name, rhs.field_name);
        assert_eq!(self.typ, rhs.typ);
        self.stored |= rhs.stored;
        self.fast_size = merge_options(self.fast_size, rhs.fast_size);
        self.term_dictionary_size =
            merge_options(self.term_dictionary_size, rhs.term_dictionary_size);
        self.postings_size = merge_options(self.postings_size, rhs.postings_size);
        self.positions_size = merge_options(self.positions_size, rhs.positions_size);
    }
}

// Looks `field_name` up in the schema and reports whether the matching field
// entry is stored. Names the schema cannot resolve are reported as not stored.
//
// Maybe too slow for the high cardinality case
fn is_field_stored(field_name: &str, schema: &Schema) -> bool {
    match schema.find_field(field_name) {
        Some((field, _path)) => schema.get_field_entry(field).is_stored(),
        None => false,
    }
}

/// Helper to merge the field metadata from multiple segments.
///
/// Each inner list is sorted, the lists are k-way merged, and consecutive entries
/// sharing the same `(field_name, typ)` are folded into a single entry with
/// [`FieldMetadata::merge`]. The returned list is therefore ordered by
/// `field_name`, then `typ`, and holds at most one entry per such pair.
pub fn merge_field_meta_data(mut field_metadatas: Vec<Vec<FieldMetadata>>) -> Vec<FieldMetadata> {
    // READ BEFORE REMOVING THIS!
    //
    // Because we replace field sep by `.`, fields are not always sorted.
    // Also, to enforce such an implicit contract, we would have to add
    // assert here.
    //
    // Sorting is linear time on pre-sorted data, so we are simply better off sorting data here.
    for field_metadatas in &mut field_metadatas {
        field_metadatas.sort_unstable();
    }
    let mut merged_field_metadata: Vec<FieldMetadata> = Vec::new();
    for el in field_metadatas.into_iter().kmerge() {
        // The merged stream is ordered by `field_name` then `typ`, so entries that
        // belong together are adjacent: comparing against the last emitted entry is
        // enough, and no owned grouping key has to be allocated per element.
        match merged_field_metadata.last_mut() {
            Some(last) if last.field_name == el.field_name && last.typ == el.typ => {
                last.merge(el);
            }
            _ => merged_field_metadata.push(el),
        }
    }
    merged_field_metadata
}

/// Intersects two optional alive bitsets.
///
/// A missing side places no restriction: the other side is returned untouched
/// (or `None` if both are missing). When both are present they are combined with
/// `intersect_alive_bitsets`.
///
/// # Panics
///
/// Panics if both bitsets are present and their `max_value` differ.
fn intersect_alive_bitset(
    left_opt: Option<AliveBitSet>,
    right_opt: Option<AliveBitSet>,
) -> Option<AliveBitSet> {
    match left_opt {
        None => right_opt,
        Some(left) => match right_opt {
            None => Some(left),
            Some(right) => {
                assert_eq!(left.bitset().max_value(), right.bitset().max_value());
                Some(intersect_alive_bitsets(left, right))
            }
        },
    }
}

/// Debug output only shows the segment id, formatted as `SegmentReader(<segment id>)`.
impl fmt::Debug for SegmentReader {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.write_fmt(format_args!("SegmentReader({:?})", self.segment_id))
    }
}

#[cfg(test)]
mod test {
    use super::*;
    use crate::index::Index;
    use crate::schema::{Term, STORED, TEXT};
    use crate::IndexWriter;

    /// Checks that `merge_field_meta_data` yields `expected` regardless of the
    /// order in which the per-segment lists are supplied.
    #[track_caller]
    fn assert_merge(fields_metadatas: &[Vec<FieldMetadata>], expected: &[FieldMetadata]) {
        use itertools::Itertools;
        let num_els = fields_metadatas.len();
        for permutation in fields_metadatas.iter().cloned().permutations(num_els) {
            let res = merge_field_meta_data(permutation);
            assert_eq!(&res, &expected);
        }
    }

    #[test]
    fn test_merge_field_meta_data_same_field() {
        let field_metadata1 = FieldMetadata {
            field_name: "a".to_string(),
            typ: crate::schema::Type::Str,
            stored: false,
            term_dictionary_size: Some(ByteCount::from(100u64)),
            postings_size: Some(ByteCount::from(1_000u64)),
            positions_size: Some(ByteCount::from(2_000u64)),
            fast_size: Some(ByteCount::from(1_000u64)),
        };
        let field_metadata2 = FieldMetadata {
            field_name: "a".to_string(),
            typ: crate::schema::Type::Str,
            stored: false,
            term_dictionary_size: Some(ByteCount::from(80u64)),
            postings_size: Some(ByteCount::from(1_500u64)),
            positions_size: Some(ByteCount::from(2_500u64)),
            fast_size: Some(ByteCount::from(3_000u64)),
        };
        let expected = FieldMetadata {
            field_name: "a".to_string(),
            typ: crate::schema::Type::Str,
            stored: false,
            term_dictionary_size: Some(ByteCount::from(180u64)),
            postings_size: Some(ByteCount::from(2_500u64)),
            positions_size: Some(ByteCount::from(4_500u64)),
            fast_size: Some(ByteCount::from(4_000u64)),
        };
        assert_merge(
            &[vec![field_metadata1], vec![field_metadata2]],
            &[expected],
        );
    }

    #[test]
    fn test_merge_field_meta_data_different() {
        let field_metadata1 = FieldMetadata {
            field_name: "a".to_string(),
            typ: crate::schema::Type::Str,
            stored: false,
            fast_size: Some(1_000u64.into()),
            term_dictionary_size: Some(100u64.into()),
            postings_size: Some(2_000u64.into()),
            positions_size: Some(4_000u64.into()),
        };
        let field_metadata2 = FieldMetadata {
            field_name: "b".to_string(),
            typ: crate::schema::Type::Str,
            stored: false,
            fast_size: Some(1_002u64.into()),
            term_dictionary_size: None,
            postings_size: None,
            positions_size: None,
        };
        let field_metadata3 = FieldMetadata {
            field_name: "a".to_string(),
            typ: crate::schema::Type::Str,
            term_dictionary_size: Some(101u64.into()),
            postings_size: Some(2_001u64.into()),
            positions_size: Some(4_001u64.into()),
            stored: false,
            fast_size: None,
        };
        let expected = vec![
            FieldMetadata {
                field_name: "a".to_string(),
                typ: crate::schema::Type::Str,
                stored: false,
                term_dictionary_size: Some(201u64.into()),
                postings_size: Some(4_001u64.into()),
                positions_size: Some(8_001u64.into()),
                fast_size: Some(1_000u64.into()),
            },
            FieldMetadata {
                field_name: "b".to_string(),
                typ: crate::schema::Type::Str,
                stored: false,
                term_dictionary_size: None,
                postings_size: None,
                positions_size: None,
                fast_size: Some(1_002u64.into()),
            },
        ];
        assert_merge(
            &[
                vec![field_metadata1, field_metadata2],
                vec![field_metadata3],
            ],
            &expected,
        );
    }

    #[test]
    fn test_merge_field_meta_data_merge() {
        let get_meta_data = |name: &str, typ: Type| FieldMetadata {
            field_name: name.to_string(),
            typ,
            term_dictionary_size: None,
            postings_size: None,
            positions_size: None,
            stored: false,
            fast_size: Some(1u64.into()),
        };
        let metas = vec![get_meta_data("d", Type::Str), get_meta_data("e", Type::U64)];
        // Same name with a different type must stay a separate entry.
        assert_merge(
            &[vec![get_meta_data("e", Type::Str)], metas],
            &[
                get_meta_data("d", Type::Str),
                get_meta_data("e", Type::Str),
                get_meta_data("e", Type::U64),
            ],
        );
    }

    #[test]
    fn test_merge_field_meta_data_bitxor() {
        let field_metadata1 = FieldMetadata {
            field_name: "a".to_string(),
            typ: crate::schema::Type::Str,
            term_dictionary_size: None,
            postings_size: None,
            positions_size: None,
            stored: false,
            fast_size: Some(10u64.into()),
        };
        let field_metadata2 = FieldMetadata {
            field_name: "a".to_string(),
            typ: crate::schema::Type::Str,
            term_dictionary_size: Some(10u64.into()),
            postings_size: Some(11u64.into()),
            positions_size: Some(12u64.into()),
            stored: false,
            fast_size: None,
        };
        let field_metadata_expected = FieldMetadata {
            field_name: "a".to_string(),
            typ: crate::schema::Type::Str,
            term_dictionary_size: Some(10u64.into()),
            postings_size: Some(11u64.into()),
            positions_size: Some(12u64.into()),
            stored: false,
            fast_size: Some(10u64.into()),
        };
        // Merging must give the same result in both directions.
        let mut res1 = field_metadata1.clone();
        res1.merge(field_metadata2.clone());
        let mut res2 = field_metadata2;
        res2.merge(field_metadata1);
        assert_eq!(res1, field_metadata_expected);
        assert_eq!(res2, field_metadata_expected);
    }

    #[test]
    fn test_num_alive() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("name", TEXT | STORED);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema.clone());
        let name = schema.get_field("name").unwrap();

        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            index_writer.add_document(doc!(name => "tantivy"))?;
            index_writer.add_document(doc!(name => "horse"))?;
            index_writer.add_document(doc!(name => "jockey"))?;
            index_writer.add_document(doc!(name => "cap"))?;
            // Four docs have been added; two of them are deleted before committing.
            index_writer.delete_term(Term::from_field_text(name, "horse"));
            index_writer.delete_term(Term::from_field_text(name, "cap"));

            // After the commit the segment holds two deleted docs.
            index_writer.commit()?;
        }
        let searcher = index.reader()?.searcher();
        assert_eq!(2, searcher.segment_reader(0).num_docs());
        assert_eq!(4, searcher.segment_reader(0).max_doc());
        Ok(())
    }

    #[test]
    fn test_alive_docs_iterator() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("name", TEXT | STORED);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema.clone());
        let name = schema.get_field("name").unwrap();

        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            index_writer.add_document(doc!(name => "tantivy"))?;
            index_writer.add_document(doc!(name => "horse"))?;
            index_writer.add_document(doc!(name => "jockey"))?;
            index_writer.add_document(doc!(name => "cap"))?;
            // The four docs are committed before any delete is issued.
            index_writer.commit()?;
        }

        {
            let mut index_writer2: IndexWriter = index.writer(50_000_000)?;
            index_writer2.delete_term(Term::from_field_text(name, "horse"));
            index_writer2.delete_term(Term::from_field_text(name, "cap"));

            // After this commit, docs 1 ("horse") and 3 ("cap") are deleted.
            index_writer2.commit()?;
        }
        let searcher = index.reader()?.searcher();
        let docs: Vec<DocId> = searcher.segment_reader(0).doc_ids_alive().collect();
        assert_eq!(vec![0u32, 2u32], docs);
        Ok(())
    }
}


================================================
FILE: src/indexer/delete_queue.rs
================================================
use std::ops::DerefMut;
use std::sync::{Arc, RwLock, Weak};

use super::operation::DeleteOperation;
use crate::Opstamp;

/// The `DeleteQueue` is conceptually similar to a multiple
/// consumer single producer broadcast channel.
///
/// All consumers will receive all messages.
///
/// Consumers of the delete queue hold a `DeleteCursor`,
/// which points to a specific place of the `DeleteQueue`.
///
/// New consumers can be created in two ways
/// - calling `delete_queue.cursor()` returns a cursor that will include all future delete
///   operations (and some or none of the past operations... The client is in charge of checking
///   the opstamps.).
/// - cloning an existing cursor returns a new cursor that is at the exact same position, and can
///   now advance independently from the original cursor.
///
/// This struct is the state shared behind the `DeleteQueue` lock.
#[derive(Default)]
struct InnerDeleteQueue {
    // Delete operations pushed since the last flush; `flush` moves them into a new block.
    writer: Vec<DeleteOperation>,
    // Weak handle on the most recently created block, so that the queue itself
    // does not keep blocks alive.
    last_block: Weak<Block>,
}

/// The delete queue is a linked list storing delete operations.
///
/// Several consumers can hold a reference to it. Delete operations
/// get dropped/gc'ed when no more consumers are holding a reference
/// to them.
///
/// Cloning a `DeleteQueue` clones the `Arc`, so all clones share the same
/// underlying state.
#[derive(Clone, Default)]
pub struct DeleteQueue {
    // Shared, lock-protected state (pending operations and last block).
    inner: Arc<RwLock<InnerDeleteQueue>>,
}

impl DeleteQueue {
    /// Returns the most recently created block, creating an empty one if the
    /// previous last block is no longer alive.
    ///
    /// # Panics
    ///
    /// Panics if the inner lock is poisoned.
    fn get_last_block(&self) -> Arc<Block> {
        {
            // try get the last block with simply acquiring the read lock.
            let rlock = self
                .inner
                .read()
                .expect("Failed to acquire read lock on delete queue");
            if let Some(block) = rlock.last_block.upgrade() {
                return block;
            }
        }
        // It failed. Let's double check after acquiring the write, as someone could have called
        // `get_last_block` right after we released the rlock.
        let mut wlock = self
            .inner
            .write()
            .expect("Failed to acquire write lock on delete queue");
        if let Some(block) = wlock.last_block.upgrade() {
            return block;
        }
        let block = Arc::new(Block {
            operations: Arc::new([]),
            next: NextBlock::from(self.clone()),
        });
        wlock.last_block = Arc::downgrade(&block);
        block
    }

    /// Creates a new cursor that makes it possible to
    /// consume future delete operations.
    ///
    /// The cursor is positioned at the end of the last block: operations that
    /// were already flushed into a block are not accessible through it, while
    /// operations that were pushed but not flushed yet still are. The client is
    /// in charge of checking the opstamps.
    pub fn cursor(&self) -> DeleteCursor {
        let last_block = self.get_last_block();
        let operations_len = last_block.operations.len();
        DeleteCursor {
            block: last_block,
            pos: operations_len,
        }
    }

    /// Appends a new delete operation to the pending (unflushed) operations.
    ///
    /// # Panics
    ///
    /// Panics if the inner lock is poisoned.
    pub fn push(&self, delete_operation: DeleteOperation) {
        self.inner
            .write()
            .expect("Failed to acquire write lock on delete queue writer")
            .writer
            .push(delete_operation);
    }

    // DeleteQueue is a linked list of blocks of
    // delete operations.
    //
    // Writing happens by simply appending to a vec.
    // `.flush()` takes this pending delete operations vec,
    // creates a new read-only block from it,
    // and records it as the last block of the queue.
    //
    // `.flush()` happens when, for instance,
    // a consumer reaches the last read-only operations.
    // It then asks the delete queue if there happen to
    // be some unflushed operations.
    //
    // Returns `None` when there is nothing to flush.
    fn flush(&self) -> Option<Arc<Block>> {
        let mut self_wlock = self
            .inner
            .write()
            .expect("Failed to acquire write lock on delete queue writer");

        if self_wlock.writer.is_empty() {
            return None;
        }

        // Leaves an empty vec behind for subsequent pushes.
        let delete_operations = std::mem::take(&mut self_wlock.writer);

        let new_block = Arc::new(Block {
            operations: Arc::from(delete_operations.into_boxed_slice()),
            next: NextBlock::from(self.clone()),
        });

        self_wlock.last_block = Arc::downgrade(&new_block);
        Some(new_block)
    }
}

// State of the link from a block to its successor.
enum InnerNextBlock {
    // No successor exists yet: the queue is kept so that pending operations
    // can be flushed into a new block on demand.
    Writer(DeleteQueue),
    // The successor block has been created and is fixed.
    Closed(Arc<Block>),
}

// Lock-protected link from a block to the next one in the list.
struct NextBlock(RwLock<InnerNextBlock>);

/// Builds a link that has no successor block yet and points back to the queue.
impl From<DeleteQueue> for NextBlock {
    fn from(delete_queue: DeleteQueue) -> NextBlock {
        let open_link = InnerNextBlock::Writer(delete_queue);
        NextBlock(RwLock::new(open_link))
    }
}

impl NextBlock {
    /// Returns the successor block, if any.
    ///
    /// If the link is already closed, the recorded block is returned. Otherwise
    /// the queue is asked to flush its pending operations: when that yields a
    /// new block, the link is closed on it and the block is returned; when there
    /// is nothing to flush, `None` is returned and the link stays open.
    ///
    /// # Panics
    ///
    /// Panics if one of the locks involved is poisoned.
    fn next_block(&self) -> Option<Arc<Block>> {
        {
            // Fast path: a closed link only requires the read lock.
            let next_read_lock = self
                .0
                .read()
                .expect("Failed to acquire read lock in delete queue");
            if let InnerNextBlock::Closed(ref block) = *next_read_lock {
                return Some(Arc::clone(block));
            }
        }
        let mut next_write_lock = self
            .0
            .write()
            .expect("Failed to acquire write lock in delete queue");
        let next_block = match *next_write_lock {
            // Someone else closed the link between our two lock acquisitions.
            InnerNextBlock::Closed(ref block) => {
                return Some(Arc::clone(block));
            }
            // Nothing pending in the queue means there is no next block yet.
            InnerNextBlock::Writer(ref writer) => writer.flush()?,
        };
        *next_write_lock.deref_mut() = InnerNextBlock::Closed(Arc::clone(&next_block));
        Some(next_block)
    }
}

// One node of the delete queue linked list.
struct Block {
    // The delete operations held by this block.
    operations: Arc<[DeleteOperation]>,
    // Link to the following block (possibly not created yet).
    next: NextBlock,
}

/// As we process delete operations, keeps track of our position.
///
/// Cloning a cursor yields an independent cursor at the same position.
#[derive(Clone)]
pub struct DeleteCursor {
    // Block the cursor currently points into.
    block: Arc<Block>,
    // Index of the current operation within `block.operations`; equal to the
    // number of operations once the block has been entirely consumed.
    pos: usize,
}

impl DeleteCursor {
    /// Skips operations until one of the following holds:
    /// - all of the delete operations currently in the queue have been consumed, and the next
    ///   `get` will return `None`;
    /// - the next `get` will return the first operation with an `opstamp >= target_opstamp`.
    pub fn skip_to(&mut self, target_opstamp: Opstamp) {
        // TODO Could be optimized, as we work with blocks.
        while self.is_behind_opstamp(target_opstamp) {
            self.advance();
        }
    }

    /// Returns true if there is a current operation and its opstamp is strictly
    /// lower than `target_opstamp`.
    fn is_behind_opstamp(&mut self, target_opstamp: Opstamp) -> bool {
        match self.get() {
            Some(operation) => operation.opstamp < target_opstamp,
            None => false,
        }
    }

    /// If the current block has been entirely
    /// consumed, try to load the next one.
    ///
    /// Returns `true` if, after this attempt,
    /// the cursor is on a block that has not
    /// been entirely consumed.
    /// Returns `false` if we have reached the end of the queue.
    fn load_block_if_required(&mut self) -> bool {
        if self.pos < self.block.operations.len() {
            // Still some operations left in the current block.
            return true;
        }
        // We have consumed our operations entirely.
        // Let's ask the queue whether it has more for us.
        match self.block.next.next_block() {
            Some(following_block) => {
                self.block = following_block;
                self.pos = 0;
                true
            }
            None => false,
        }
    }

    /// Advances to the next delete operation.
    ///
    /// Returns true if and only if there was a current operation to move past.
    pub fn advance(&mut self) -> bool {
        let has_current = self.load_block_if_required();
        if has_current {
            self.pos += 1;
        }
        has_current
    }

    /// Gets the current delete operation.
    ///
    /// Calling `.get` does not advance the cursor, although it may move it onto
    /// the next block when the current one has been entirely consumed.
    pub fn get(&mut self) -> Option<&DeleteOperation> {
        if !self.load_block_if_required() {
            return None;
        }
        Some(&self.block.operations[self.pos])
    }
}

#[cfg(test)]
mod tests {

    use super::{DeleteOperation, DeleteQueue};
    use crate::index::SegmentReader;
    use crate::query::{Explanation, Scorer, Weight};
    use crate::{DocId, Score};

    // `Weight` stub: only needed to build `DeleteOperation`s, never evaluated.
    struct DummyWeight;
    impl Weight for DummyWeight {
        fn scorer(&self, _reader: &SegmentReader, _boost: Score) -> crate::Result<Box<dyn Scorer>> {
            Err(crate::TantivyError::InternalError("dummy impl".to_owned()))
        }

        fn explain(&self, _reader: &SegmentReader, _doc: DocId) -> crate::Result<Explanation> {
            Err(crate::TantivyError::InternalError("dummy impl".to_owned()))
        }
    }

    // Builds a delete operation carrying the given opstamp.
    fn make_op(opstamp: u64) -> DeleteOperation {
        DeleteOperation {
            opstamp,
            target: Box::new(DummyWeight),
        }
    }

    #[test]
    fn test_deletequeue() {
        let delete_queue = DeleteQueue::default();

        delete_queue.push(make_op(1));
        delete_queue.push(make_op(2));

        let snapshot = delete_queue.cursor();
        {
            // A clone of the snapshot advances independently from it.
            let mut cursor = snapshot.clone();
            assert_eq!(cursor.get().map(|op| op.opstamp), Some(1));
            cursor.advance();
            assert_eq!(cursor.get().map(|op| op.opstamp), Some(2));
            cursor.advance();
            assert!(cursor.get().is_none());
            cursor.advance();

            // A cursor created now does not see the operations flushed above.
            let mut late_cursor = delete_queue.cursor();
            assert!(late_cursor.get().is_none());
            delete_queue.push(make_op(3));
            assert_eq!(late_cursor.get().map(|op| op.opstamp), Some(3));
            // `get` is repeatable: it does not consume the operation.
            assert_eq!(cursor.get().map(|op| op.opstamp), Some(3));
            assert_eq!(cursor.get().map(|op| op.opstamp), Some(3));
            cursor.advance();
            assert!(cursor.get().is_none());
            cursor.advance();
        }
        {
            // The original snapshot still replays every operation from the start.
            let mut cursor = snapshot;
            assert_eq!(cursor.get().map(|op| op.opstamp), Some(1));
            cursor.advance();
            assert_eq!(cursor.get().map(|op| op.opstamp), Some(2));
            cursor.advance();
            assert_eq!(cursor.get().map(|op| op.opstamp), Some(3));
            cursor.advance();
            assert!(cursor.get().is_none());
        }
    }
}


================================================
FILE: src/indexer/doc_id_mapping.rs
================================================
//! This module is used when sorting the index by a property, e.g.
//! to get mappings from old doc_id to new doc_id and vice versa, after sorting

use common::ReadOnlyBitSet;

use crate::DocAddress;

/// Kind of doc id mapping carried by a `SegmentDocIdMapping`.
#[derive(Copy, Clone, Eq, PartialEq)]
pub enum MappingType {
    // NOTE(review): presumably the merged segments are simply concatenated and
    // none of them has deletes -- confirm against the code building the mapping.
    Stacked,
    // NOTE(review): presumably as `Stacked`, but at least one segment has
    // deleted documents -- confirm against the code building the mapping.
    StackedWithDeletes,
}

/// Struct to provide mapping from new doc_id to old doc_id and segment.
#[derive(Clone)]
pub(crate) struct SegmentDocIdMapping {
    // Indexed by new doc id; each entry is the address (segment and doc id) the
    // document had before.
    pub(crate) new_doc_id_to_old_doc_addr: Vec<DocAddress>,
    // NOTE(review): presumably one entry per merged segment, `None` when the
    // segment has no deletes -- confirm against the caller.
    pub(crate) alive_bitsets: Vec<Option<ReadOnlyBitSet>>,
    // Kind of mapping, exposed through `mapping_type()`.
    mapping_type: MappingType,
}

impl SegmentDocIdMapping {
    pub(crate) fn new(
        new_doc_id_to_old_doc_addr: Vec<DocAddress>,
        mapping_type: MappingType,
        alive_bitsets: Vec<Option<ReadOnlyBitSet>>,
    ) -> Self {
        Self {
            new_doc_id_to_old_doc_addr,
            mapping_type,
            alive_bitsets,
        }
    }

    pub fn mapping_type(&self) -> MappingType {
        self.mapping_type
    }

    /// Returns an iterator over the old document addresses, ordered by the new document ids.
    ///
    /// In the returned `DocAddress`, the `segment_ord` is the ordinal of targeted segment
    /// in the list of merged segments.
    pub(crate) fn iter_old_doc_addrs(&self) -> impl Iterator<Item = DocAddress> + '_ {
        self.new_doc_id_to_old_doc_addr.iter().copied()
    }
}


================================================
FILE: src/indexer/doc_opstamp_mapping.rs
================================================
use crate::{DocId, Opstamp};

// The doc to opstamp mapping is used to identify which
// documents should be deleted.
//
// Since the docset matching the query of a delete operation
// is not computed right when the delete operation is received,
// we need to find a way to evaluate, for each document,
// whether the document was added before or after
// the delete operation. This is decided by comparing
// the opstamp of the document with the opstamp of the delete operation.
//
// The doc to opstamp mapping stores precisely an array
// indexed by doc id and storing the opstamp of the document.
//
// This mapping is NOT necessarily increasing, because
// we might be sorting documents according to a fast field.
#[derive(Clone)]
pub enum DocToOpstampMapping<'a> {
    // Slice indexed by doc id, holding the opstamp of each document.
    WithMap(&'a [Opstamp]),
    // No mapping available: `is_deleted` then returns true for every document.
    None,
}

impl DocToOpstampMapping<'_> {
    /// Tells whether the document `doc_id`, which matches a delete operation stamped
    /// `delete_opstamp`, has to be considered deleted.
    ///
    /// Without a map (`None` variant) the answer is always `true`. With a map, the answer
    /// is `true` only when the opstamp of the document is strictly lower than
    /// `delete_opstamp`.
    ///
    /// # Panics
    ///
    /// Panics if a map is present and `doc_id` is out of its bounds.
    pub fn is_deleted(&self, doc_id: DocId, delete_opstamp: Opstamp) -> bool {
        match *self {
            Self::None => true,
            // Only documents added before the delete operation are affected by it.
            Self::WithMap(opstamps) => opstamps[doc_id as usize] < delete_opstamp,
        }
    }
}

#[cfg(test)]
mod tests {

    use super::DocToOpstampMapping;

    /// Without a map, every document is reported as deleted, whatever the delete opstamp.
    #[test]
    fn test_doc_to_opstamp_mapping_none() {
        let mapping = DocToOpstampMapping::None;
        for &delete_opstamp in &[0u64, 2u64] {
            assert!(mapping.is_deleted(1u32, delete_opstamp));
        }
    }

    /// With a map, only documents stamped strictly before the delete opstamp are deleted.
    #[test]
    fn test_doc_to_opstamp_mapping_with_map() {
        let doc_opstamps = [5u64, 1u64, 0u64, 4u64, 3u64];
        let mapping = DocToOpstampMapping::WithMap(&doc_opstamps);
        let expected_deleted = [false, true, true, false, false];
        for (doc_id, &expected) in expected_deleted.iter().enumerate() {
            assert_eq!(mapping.is_deleted(doc_id as u32, 2u64), expected);
        }
    }
}


================================================
FILE: src/indexer/flat_map_with_buffer.rs
================================================
/// Iterator adapter returned by [`FlatMapWithBufferIter::flat_map_with_buffer`].
///
/// For each element of the underlying iterator, `fill_buffer` is called with that element
/// and an empty buffer. The elements pushed into the buffer are then yielded in the order
/// in which they were pushed, before the next underlying element is requested.
pub struct FlatMapWithBuffer<T, F, Iter> {
    /// Pending elements, stored in reverse order so that they can be popped from the back.
    buffer: Vec<T>,
    /// Callback filling the buffer from one element of the underlying iterator.
    fill_buffer: F,
    /// Iterator providing the inputs of `fill_buffer`.
    underlying_it: Iter,
}

impl<T, F, Iter, I> Iterator for FlatMapWithBuffer<T, F, Iter>
where
    Iter: Iterator<Item = I>,
    // `FnMut` rather than `Fn`: stateful closures are accepted, and every `Fn` closure
    // still qualifies.
    F: FnMut(I, &mut Vec<T>),
{
    type Item = T;

    fn next(&mut self) -> Option<Self::Item> {
        // An underlying element may produce nothing at all: keep pulling until the buffer
        // holds something, or until the underlying iterator is exhausted.
        while self.buffer.is_empty() {
            let next_el = self.underlying_it.next()?;
            (self.fill_buffer)(next_el, &mut self.buffer);
            // We will pop elements, so we reverse the buffer first.
            self.buffer.reverse();
        }
        self.buffer.pop()
    }
}

// NOTE(review): presumably the method is unused in some build configurations, hence the
// lint exemption -- confirm before removing it.
#[allow(dead_code)]
pub trait FlatMapWithBufferIter: Iterator {
    /// Function similar to `flat_map`, but allows reusing a shared `Vec`.
    ///
    /// `fill_buffer` receives each element of `self` together with an empty buffer, and
    /// pushes into that buffer the elements to yield. It may push nothing, in which case
    /// the iteration simply moves on to the next element of `self`.
    fn flat_map_with_buffer<F, T>(self, fill_buffer: F) -> FlatMapWithBuffer<T, F, Self>
    where
        F: FnMut(Self::Item, &mut Vec<T>),
        Self: Sized,
    {
        FlatMapWithBuffer {
            buffer: Vec::with_capacity(10),
            fill_buffer,
            underlying_it: self,
        }
    }
}

impl<T: ?Sized> FlatMapWithBufferIter for T where T: Iterator {}

#[cfg(test)]
mod tests {
    use crate::indexer::flat_map_with_buffer::FlatMapWithBufferIter;

    /// An empty underlying iterator yields nothing.
    #[test]
    fn test_flat_map_with_buffer_empty() {
        let fill_nothing = |_val: usize, _buffer: &mut Vec<usize>| {};
        let mut empty_iter = std::iter::empty::<usize>().flat_map_with_buffer(fill_nothing);
        assert!(empty_iter.next().is_none());
    }

    /// Elements are yielded in the order in which they were pushed into the buffer.
    #[test]
    fn test_flat_map_with_buffer_simple() {
        let fill_range = |val: usize, buffer: &mut Vec<usize>| buffer.extend(0..val);
        let vals: Vec<usize> = (1..5).flat_map_with_buffer(fill_range).collect();
        assert_eq!(vals, vec![0, 0, 1, 0, 1, 2, 0, 1, 2, 3]);
    }

    /// An element producing no output must not terminate the iteration.
    #[test]
    fn test_flat_map_filling_no_elements_does_not_stop_iterator() {
        let fill_range = |val: usize, buffer: &mut Vec<usize>| buffer.extend(0..val);
        let inputs: Vec<usize> = vec![2, 0, 0, 3];
        let vals: Vec<usize> = inputs.into_iter().flat_map_with_buffer(fill_range).collect();
        assert_eq!(vals, vec![0, 1, 0, 1, 2]);
    }
}


================================================
FILE: src/indexer/index_writer.rs
================================================
use std::ops::Range;
use std::sync::Arc;
use std::thread;
use std::thread::JoinHandle;

use common::BitSet;
use smallvec::smallvec;

use super::operation::{AddOperation, UserOperation};
use super::segment_updater::SegmentUpdater;
use super::{AddBatch, AddBatchReceiver, AddBatchSender, PreparedCommit};
use crate::directory::{DirectoryLock, GarbageCollectionResult, TerminatingWrite};
use crate::error::TantivyError;
use crate::fastfield::write_alive_bitset;
use crate::index::{Index, Segment, SegmentComponent, SegmentId, SegmentMeta, SegmentReader};
use crate::indexer::delete_queue::{DeleteCursor, DeleteQueue};
use crate::indexer::doc_opstamp_mapping::DocToOpstampMapping;
use crate::indexer::index_writer_status::IndexWriterStatus;
use crate::indexer::operation::DeleteOperation;
use crate::indexer::stamper::Stamper;
use crate::indexer::{MergePolicy, SegmentEntry, SegmentWriter};
use crate::query::{EnableScoring, Query, TermQuery};
use crate::schema::document::Document;
use crate::schema::{IndexRecordOption, TantivyDocument, Term};
use crate::{FutureResult, Opstamp};

// Size of the margin for the `memory_arena`. A segment is closed when the remaining memory
// in the `memory_arena` goes below MARGIN_IN_BYTES.
pub const MARGIN_IN_BYTES: usize = 1_000_000;

// We impose the memory per thread to be at least 15 MB, as the baseline consumption is 12MB.
pub const MEMORY_BUDGET_NUM_BYTES_MIN: usize = ((MARGIN_IN_BYTES as u32) * 15u32) as usize;
// Exclusive upper bound of the memory budget per thread: `IndexWriter::new` rejects any
// budget greater than or equal to this value.
pub const MEMORY_BUDGET_NUM_BYTES_MAX: usize = u32::MAX as usize - MARGIN_IN_BYTES;

// We impose the number of index writer threads to be at most this.
pub const MAX_NUM_THREAD: usize = 8;

// Capacity of the bounded channel feeding the indexing workers: adding documents blocks
// once the channel is full.
//
// Despite its name, the channel items are `AddBatch` values, so this bound counts
// batches waiting in the queue rather than individual documents.
const PIPELINE_MAX_SIZE_IN_DOCS: usize = 10_000;

/// Builds the `TantivyError::ErrorInThread` reported when an indexing or merging thread
/// failed, prefixing the generic explanation with `context`.
fn error_in_index_worker_thread(context: &str) -> TantivyError {
    let message = format!(
        "{context}. A worker thread encountered an error (io::Error most likely) or panicked."
    );
    TantivyError::ErrorInThread(message)
}

#[derive(Clone, bon::Builder)]
/// A builder for creating a new [IndexWriter] for an index.
///
/// Every option has a default value, declared through the `builder(default = ...)`
/// attribute of the corresponding field.
pub struct IndexWriterOptions {
    #[builder(default = MEMORY_BUDGET_NUM_BYTES_MIN)]
    /// The memory budget per indexer thread.
    ///
    /// When an indexer thread has buffered this much data in memory
    /// it will flush the segment to disk (although this is not searchable until commit is called.)
    ///
    /// Defaults to `MEMORY_BUDGET_NUM_BYTES_MIN`. The index writer constructor rejects values
    /// below `MEMORY_BUDGET_NUM_BYTES_MIN`, as well as values greater than or equal to
    /// `MEMORY_BUDGET_NUM_BYTES_MAX`.
    memory_budget_per_thread: usize,
    #[builder(default = 1)]
    /// The number of indexer worker threads to use.
    ///
    /// Defaults to 1. The index writer constructor rejects 0.
    num_worker_threads: usize,
    #[builder(default = 4)]
    /// Defines the number of merger threads to use.
    ///
    /// Defaults to 4.
    num_merge_threads: usize,
}

/// `IndexWriter` is the user entry-point to add documents to an index.
///
/// It manages a small number of indexing threads, as well as a shared
/// indexing queue.
/// Each indexing thread builds its own independent [`Segment`], via
/// a `SegmentWriter` object.
pub struct IndexWriter<D: Document = TantivyDocument> {
    // the lock is just used to bind the
    // lifetime of the lock with that of the IndexWriter.
    //
    // It is an `Option` so that `rollback` can take it out and hand it over to the
    // `IndexWriter` replacing this one.
    _directory_lock: Option<DirectoryLock>,

    // The index this writer operates on.
    index: Index,

    // Options the writer was created with (memory budget, number of threads).
    options: IndexWriterOptions,

    // Join handles of the indexing worker threads spawned by `add_indexing_worker`.
    workers_join_handle: Vec<JoinHandle<crate::Result<()>>>,

    // Status built from the receiving side of the document channel. It hands out the
    // receiver and the "bomb" given to the workers, and tells whether the writer is alive.
    index_writer_status: IndexWriterStatus<D>,
    // Sending side of the channel through which batches of add operations reach the workers.
    operation_sender: AddBatchSender<D>,

    segment_updater: SegmentUpdater,

    // Number used to name the next worker thread; incremented after each spawn.
    worker_id: usize,

    // Queue receiving the delete operations created by `delete_query` and `run`.
    delete_queue: DeleteQueue,

    // Source of the opstamps attributed to add, delete and commit operations.
    stamper: Stamper,
    // Opstamp returned by `commit_opstamp()`; initialized from the metas of the index
    // when the writer is created.
    committed_opstamp: Opstamp,
}

/// Applies to `alive_bitset` the delete operations pending in `delete_cursor`, up to and
/// including `target_opstamp`.
///
/// For each of these operations, the documents of `segment_reader` matching the delete
/// query are removed from `alive_bitset` whenever `doc_opstamps` reports them as deleted
/// for the opstamp of the operation. The cursor is advanced past every operation applied;
/// it stops on the first operation stamped after `target_opstamp`.
///
/// Returns `true` if a removal was issued for at least one document (the document may
/// already have been absent from the bitset), `false` otherwise.
///
/// # Errors
///
/// Returns the error raised while running a delete query against the segment, if any.
fn compute_deleted_bitset(
    alive_bitset: &mut BitSet,
    segment_reader: &SegmentReader,
    delete_cursor: &mut DeleteCursor,
    doc_opstamps: &DocToOpstampMapping,
    target_opstamp: Opstamp,
) -> crate::Result<bool> {
    let mut removal_issued = false;
    while let Some(delete_op) = delete_cursor.get() {
        let delete_opstamp = delete_op.opstamp;
        if delete_opstamp > target_opstamp {
            break;
        }

        delete_op
            .target
            .for_each_no_score(segment_reader, &mut |matching_docs| {
                // A delete operation should only affect
                // documents that were inserted before it.
                let affected_docs = matching_docs
                    .iter()
                    .copied()
                    .filter(|&doc| doc_opstamps.is_deleted(doc, delete_opstamp));
                for doc in affected_docs {
                    alive_bitset.remove(doc);
                    removal_issued = true;
                }
            })?;
        delete_cursor.advance();
    }
    Ok(removal_issued)
}

/// Advances the deletes of the given segment up to the target opstamp.
///
/// Note that there is no guarantee that the resulting `segment_entry` delete_opstamp
/// is `==` target_opstamp.
/// For instance, if there was no delete operation between the state of the `segment_entry`
/// and the `target_opstamp`, `segment_entry` is not updated.
///
/// When new deletes are found, a new delete file is written for the segment and the meta
/// of `segment_entry` is replaced by a meta carrying the new delete information.
///
/// # Errors
///
/// Returns an error if the segment cannot be opened, if a delete query fails, or if
/// writing the delete file fails.
pub fn advance_deletes(
    mut segment: Segment,
    segment_entry: &mut SegmentEntry,
    target_opstamp: Opstamp,
) -> crate::Result<()> {
    let already_up_to_date = segment_entry.meta().delete_opstamp() == Some(target_opstamp);
    if already_up_to_date {
        return Ok(());
    }

    let lacks_alive_bitset = segment_entry.alive_bitset().is_none();
    if lacks_alive_bitset && segment_entry.delete_cursor().get().is_none() {
        // There has been no `DeleteOperation` between the segment status and `target_opstamp`.
        return Ok(());
    }

    let segment_reader = SegmentReader::open(&segment)?;
    let max_doc = segment_reader.max_doc();
    let num_deleted_docs_before = segment.meta().num_deleted_docs();

    // Start from the bitset held by the entry if there is one, from a full bitset otherwise.
    let mut alive_bitset: BitSet = segment_entry.alive_bitset().map_or_else(
        || BitSet::with_max_value_and_full(max_doc),
        |previous_alive_bitset| (*previous_alive_bitset).clone(),
    );

    compute_deleted_bitset(
        &mut alive_bitset,
        &segment_reader,
        segment_entry.delete_cursor(),
        &DocToOpstampMapping::None,
        target_opstamp,
    )?;

    // Documents already deleted according to the segment reader stay deleted.
    if let Some(reader_alive_bitset) = segment_reader.alive_bitset() {
        alive_bitset.intersect_update(reader_alive_bitset.bitset());
    }

    let num_deleted_docs = max_doc - alive_bitset.len() as u32;
    let has_new_deletes = num_deleted_docs > num_deleted_docs_before;
    if has_new_deletes {
        // There are new deletes. We need to write a new delete file.
        segment = segment.with_delete_meta(num_deleted_docs, target_opstamp);
        let mut delete_file = segment.open_write(SegmentComponent::Delete)?;
        write_alive_bitset(&alive_bitset, &mut delete_file)?;
        delete_file.terminate()?;
    }

    segment_entry.set_meta(segment.meta().clone());
    Ok(())
}

/// Indexes batches of documents into `segment` and hands the resulting segment over to
/// the segment updater.
///
/// Batches are pulled from `grouped_document_iterator` until it is exhausted, or until the
/// memory usage of the segment writer gets within `MARGIN_IN_BYTES` of `memory_budget`.
/// The deletes pending in `delete_cursor` are then applied to the new segment, before the
/// segment is scheduled for addition.
///
/// Nothing is finalized nor scheduled if the segment updater is no longer alive.
///
/// # Panics
///
/// Panics if no document was indexed: the caller must make sure that at least one
/// non-empty batch is available.
fn index_documents<D: Document>(
    memory_budget: usize,
    segment: Segment,
    grouped_document_iterator: &mut dyn Iterator<Item = AddBatch<D>>,
    segment_updater: &SegmentUpdater,
    mut delete_cursor: DeleteCursor,
) -> crate::Result<()> {
    let mut segment_writer = SegmentWriter::for_segment(memory_budget, segment.clone())?;
    for batch in grouped_document_iterator {
        for add_operation in batch {
            segment_writer.add_document(add_operation)?;
        }
        let budget_exhausted = segment_writer.mem_usage() >= memory_budget - MARGIN_IN_BYTES;
        if budget_exhausted {
            info!(
                "Buffer limit reached, flushing segment with maxdoc={}.",
                segment_writer.max_doc()
            );
            break;
        }
    }

    if !segment_updater.is_alive() {
        return Ok(());
    }

    // The worker thread peeks a non-empty batch before calling this function,
    // so at least one document has been indexed.
    let max_doc = segment_writer.max_doc();
    assert!(max_doc > 0);

    let doc_opstamps: Vec<Opstamp> = segment_writer.finalize()?;
    let segment = segment.with_max_doc(max_doc);
    let alive_bitset_opt = apply_deletes(&segment, &mut delete_cursor, &doc_opstamps)?;

    // update segment_updater inventory to remove tempstore
    let segment_entry = SegmentEntry::new(segment.meta().clone(), delete_cursor, alive_bitset_opt);
    segment_updater.schedule_add_segment(segment_entry).wait()
}

/// Applies the delete operations pending in `delete_cursor` to a freshly written segment.
///
/// `doc_opstamps` holds the opstamp of each document of the segment, indexed by doc id.
/// It is required to be non-empty. Delete operations are applied up to the highest of
/// these opstamps.
///
/// Returns `Ok(None)` when the cursor holds no delete operation, or when no document was
/// removed. Otherwise returns the bitset of the documents that are still alive.
///
/// # Panics
///
/// Panics if there are pending delete operations and `doc_opstamps` is empty.
fn apply_deletes(
    segment: &Segment,
    delete_cursor: &mut DeleteCursor,
    doc_opstamps: &[Opstamp],
) -> crate::Result<Option<BitSet>> {
    // Without any delete operation in the queue, there is no need
    // to even open the segment.
    if delete_cursor.get().is_none() {
        return Ok(None);
    }

    let max_doc_opstamp: Opstamp = doc_opstamps
        .iter()
        .copied()
        .max()
        .expect("Empty DocOpstamp is forbidden");

    let segment_reader = SegmentReader::open(segment)?;
    let mut alive_bitset = BitSet::with_max_value_and_full(segment.meta().max_doc());
    let may_have_deletes = compute_deleted_bitset(
        &mut alive_bitset,
        &segment_reader,
        delete_cursor,
        &DocToOpstampMapping::WithMap(doc_opstamps),
        max_doc_opstamp,
    )?;
    Ok(may_have_deletes.then_some(alive_bitset))
}

impl<D: Document> IndexWriter<D> {
    /// Creates a new index writer, bound to the given directory lock.
    ///
    /// The lockfile should be deleted on drop, but it is possible
    /// that due to a panic or other error, a stale lockfile will be
    /// left in the index directory. If you are sure that no other
    /// `IndexWriter` on the system is accessing the index directory,
    /// it is safe to manually delete the lockfile.
    ///
    /// `options` carries the memory budget per thread, the number of indexing workers
    /// and the number of merge threads. The indexing workers are started before
    /// this function returns.
    ///
    /// # Errors
    /// Returns `TantivyError::InvalidArgument` if the memory budget per thread is too
    /// small or too big, or if the number of worker threads is 0.
    /// Errors raised while loading the index metas, creating the segment updater or
    /// spawning the workers are forwarded.
    pub(crate) fn new(
        index: &Index,
        options: IndexWriterOptions,
        directory_lock: DirectoryLock,
    ) -> crate::Result<Self> {
        let memory_budget = options.memory_budget_per_thread;
        if memory_budget < MEMORY_BUDGET_NUM_BYTES_MIN {
            return Err(TantivyError::InvalidArgument(format!(
                "The memory arena in bytes per thread needs to be at least \
                 {MEMORY_BUDGET_NUM_BYTES_MIN}."
            )));
        }
        if memory_budget >= MEMORY_BUDGET_NUM_BYTES_MAX {
            return Err(TantivyError::InvalidArgument(format!(
                "The memory arena in bytes per thread cannot exceed {MEMORY_BUDGET_NUM_BYTES_MAX}"
            )));
        }
        if options.num_worker_threads == 0 {
            return Err(TantivyError::InvalidArgument(
                "At least one worker thread is required, got 0".to_string(),
            ));
        }

        let (operation_sender, operation_receiver) =
            crossbeam_channel::bounded(PIPELINE_MAX_SIZE_IN_DOCS);

        let delete_queue = DeleteQueue::default();

        // Opstamps resume from the opstamp recorded in the index metas.
        let committed_opstamp = index.load_metas()?.opstamp;
        let stamper = Stamper::new(committed_opstamp);

        let segment_updater = SegmentUpdater::create(
            index.clone(),
            stamper.clone(),
            &delete_queue.cursor(),
            options.num_merge_threads,
        )?;

        let mut index_writer = Self {
            _directory_lock: Some(directory_lock),
            index: index.clone(),
            options,
            workers_join_handle: Vec::new(),
            index_writer_status: IndexWriterStatus::from(operation_receiver),
            operation_sender,
            segment_updater,
            worker_id: 0,
            delete_queue,
            stamper,
            committed_opstamp,
        };
        index_writer.start_workers()?;
        Ok(index_writer)
    }

    /// Replaces the operation sender with the sender of a throwaway channel, which drops
    /// the sender held so far.
    fn drop_sender(&mut self) {
        let (throwaway_sender, _throwaway_receiver) = crossbeam_channel::bounded(1);
        let former_sender = std::mem::replace(&mut self.operation_sender, throwaway_sender);
        drop(former_sender);
    }

    /// Accessor to the index.
    ///
    /// Returns a reference to the [`Index`] this writer operates on.
    pub fn index(&self) -> &Index {
        &self.index
    }

    /// Waits for the indexing workers, then for the merging threads, to finish their
    /// work. The `IndexWriter` is consumed and dropped in the process.
    ///
    /// # Errors
    ///
    /// Returns `TantivyError::ErrorInThread` if an indexing worker panicked or failed,
    /// or if the merging threads could not be joined.
    pub fn wait_merging_threads(mut self) -> crate::Result<()> {
        // this will stop the indexing thread,
        // dropping the last reference to the segment_updater.
        self.drop_sender();

        for worker_handle in std::mem::take(&mut self.workers_join_handle) {
            let worker_result = worker_handle
                .join()
                .map_err(|_| error_in_index_worker_thread("Worker thread panicked."))?;
            worker_result.map_err(|_| error_in_index_worker_thread("Worker thread failed."))?;
        }

        let result = self
            .segment_updater
            .wait_merging_thread()
            .map_err(|_| error_in_index_worker_thread("Failed to join merging thread."));
        if let Err(e) = &result {
            error!("Some merging thread failed {e:?}");
        }
        result
    }

    /// Registers an existing segment, described by `segment_meta`, with the segment
    /// updater and waits for the registration to complete.
    ///
    /// The segment entry gets a fresh cursor on the delete queue and no alive bitset.
    #[doc(hidden)]
    pub fn add_segment(&self, segment_meta: SegmentMeta) -> crate::Result<()> {
        let segment_entry = SegmentEntry::new(segment_meta, self.delete_queue.cursor(), None);
        let add_segment_future = self.segment_updater.schedule_add_segment(segment_entry);
        add_segment_future.wait()
    }

    /// Creates a new segment.
    ///
    /// This method is useful only for users trying to do complex
    /// operations, like converting an index format to another.
    ///
    /// It is safe to start writing files associated with the new `Segment`.
    /// These will not be garbage collected as long as an instance of
    /// `SegmentMeta` associated with the new `Segment` is "alive".
    pub fn new_segment(&self) -> Segment {
        self.index.new_segment()
    }

    /// Returns the receiving side of the document channel.
    ///
    /// # Errors
    ///
    /// Returns `TantivyError::ErrorInThread` when the status of the index writer has no
    /// receiver to offer, which means that the writer was killed.
    fn operation_receiver(&self) -> crate::Result<AddBatchReceiver<D>> {
        match self.index_writer_status.operation_receiver() {
            Some(receiver) => Ok(receiver),
            None => Err(crate::TantivyError::ErrorInThread(
                "The index writer was killed. It can happen if an indexing worker encountered \
                 an Io error for instance."
                    .to_string(),
            )),
        }
    }

    /// Spawns a new worker thread for indexing.
    ///
    /// The thread consumes batches of documents from the pipeline. Each turn of its loop
    /// writes one new segment, and the thread terminates once no batch is left.
    ///
    /// # Errors
    ///
    /// Returns an error if the index writer was killed, or if the thread cannot be spawned.
    fn add_indexing_worker(&mut self) -> crate::Result<()> {
        let batch_receiver = self.operation_receiver()?;
        let index_writer_bomb = self.index_writer_status.create_bomb();
        let segment_updater = self.segment_updater.clone();
        let mut delete_cursor = self.delete_queue.cursor();
        let mem_budget = self.options.memory_budget_per_thread;
        let index = self.index.clone();

        let thread_name = format!("thrd-tantivy-index{}", self.worker_id);
        let indexing_loop = move || -> crate::Result<()> {
            loop {
                let mut batches = batch_receiver
                    .clone()
                    .into_iter()
                    .filter(|batch| !batch.is_empty())
                    .peekable();

                // The peeking here is to avoid creating a new segment's files
                // if no documents are available.
                //
                // This is a valid guarantee as the peeked batch now belongs to
                // our local iterator.
                match batches.peek() {
                    Some(first_batch) => {
                        assert!(!first_batch.is_empty());
                        delete_cursor.skip_to(first_batch[0].opstamp);
                    }
                    None => {
                        // No more documents.
                        // It happens when there is a commit, or if the `IndexWriter`
                        // was dropped.
                        index_writer_bomb.defuse();
                        return Ok(());
                    }
                }

                index_documents(
                    mem_budget,
                    index.new_segment(),
                    &mut batches,
                    &segment_updater,
                    delete_cursor.clone(),
                )?;
            }
        };
        let join_handle: JoinHandle<crate::Result<()>> = thread::Builder::new()
            .name(thread_name)
            .spawn(indexing_loop)?;

        self.worker_id += 1;
        self.workers_join_handle.push(join_handle);
        Ok(())
    }

    /// Accessor to the merge policy.
    ///
    /// The merge policy is held by the segment updater; a shared handle to it is returned.
    pub fn get_merge_policy(&self) -> Arc<dyn MergePolicy> {
        self.segment_updater.get_merge_policy()
    }

    /// Setter for the merge policy.
    ///
    /// The new policy is handed over to the segment updater.
    pub fn set_merge_policy(&self, merge_policy: Box<dyn MergePolicy>) {
        self.segment_updater.set_merge_policy(merge_policy);
    }

    /// Spawns as many indexing workers as requested by the options, stopping at the
    /// first worker that fails to start.
    fn start_workers(&mut self) -> crate::Result<()> {
        let num_workers = self.options.num_worker_threads;
        (0..num_workers).try_for_each(|_| self.add_indexing_worker())
    }

    /// Detects and removes the files that are not used by the index anymore.
    ///
    /// The garbage collection is scheduled on the segment updater; its outcome is
    /// available through the returned `FutureResult`.
    pub fn garbage_collect_files(&self) -> FutureResult<GarbageCollectionResult> {
        self.segment_updater.schedule_garbage_collect()
    }

    /// Deletes all documents from the index.
    ///
    /// The deletion requires a call to `commit()`.
    /// This enables users to rebuild the index,
    /// by clearing it and resubmitting the necessary documents.
    ///
    /// Returns the opstamp of the last commit, to which the stamper is reverted.
    ///
    /// ```rust
    /// use tantivy::collector::TopDocs;
    /// use tantivy::query::QueryParser;
    /// use tantivy::schema::*;
    /// use tantivy::{doc, Index};
    ///
    /// fn main() -> tantivy::Result<()> {
    ///     let mut schema_builder = Schema::builder();
    ///     let title = schema_builder.add_text_field("title", TEXT | STORED);
    ///     let schema = schema_builder.build();
    ///
    ///     let index = Index::create_in_ram(schema.clone());
    ///
    ///     let mut index_writer = index.writer_with_num_threads(1, 50_000_000)?;
    ///     index_writer.add_document(doc!(title => "The modern Prometheus"))?;
    ///     index_writer.commit()?;
    ///
    ///     let clear_res = index_writer.delete_all_documents().unwrap();
    ///     // have to commit, otherwise deleted terms remain available
    ///     index_writer.commit()?;
    ///
    ///     let searcher = index.reader()?.searcher();
    ///     let query_parser = QueryParser::for_index(&index, vec![title]);
    ///     let query_promo = query_parser.parse_query("Prometheus")?;
    ///     let top_docs_promo = searcher.search(&query_promo, &TopDocs::with_limit(1).order_by_score())?;
    ///
    ///     assert!(top_docs_promo.is_empty());
    ///     Ok(())
    /// }
    /// ```
    pub fn delete_all_documents(&self) -> crate::Result<Opstamp> {
        // Remove every segment known to the segment updater.
        self.segment_updater.remove_all_segments();
        // Revert the stamper to the opstamp of the last commit, and return that opstamp.
        self.stamper.revert(self.committed_opstamp);
        Ok(self.committed_opstamp)
    }

    /// Merges a given list of segments.
    ///
    /// If all segments are empty no new segment will be created.
    ///
    /// `segment_ids` is required to be non-empty.
    ///
    /// The merge is started on the segment updater; its outcome is available through
    /// the returned `FutureResult`.
    pub fn merge(&mut self, segment_ids: &[SegmentId]) -> FutureResult<Option<SegmentMeta>> {
        let merge_operation = self.segment_updater.make_merge_operation(segment_ids);
        self.segment_updater.clone().start_merge(merge_operation)
    }

    /// Drops the current sending side of the document channel, and replaces
    /// the channel with a new one.
    ///
    /// The current workers will keep on indexing
    /// the pending documents and stop
    /// when no documents are remaining.
    ///
    /// The status of the index writer is rebuilt from the receiving side of the new channel.
    fn recreate_document_channel(&mut self) {
        let (new_sender, new_receiver) = crossbeam_channel::bounded(PIPELINE_MAX_SIZE_IN_DOCS);
        // The assignment drops the former sender.
        self.operation_sender = new_sender;
        self.index_writer_status = IndexWriterStatus::from(new_receiver);
    }

    /// Rollback to the last commit
    ///
    /// This cancels all of the updates that
    /// happened after the last commit.
    /// After calling rollback, the index is in the same
    /// state as it was after the last commit.
    ///
    /// The opstamp at the last commit is returned.
    ///
    /// Internally, the segment updater is killed and `self` is replaced by a brand new
    /// `IndexWriter`, created with the same options and inheriting the directory lock.
    ///
    /// # Errors
    ///
    /// Returns the error raised while creating the new `IndexWriter`, if any.
    ///
    /// # Panics
    ///
    /// Panics if the writer no longer holds its directory lock.
    pub fn rollback(&mut self) -> crate::Result<Opstamp> {
        info!("Rolling back to opstamp {}", self.committed_opstamp);
        // marks the segment updater as killed. From now on, all
        // segment updates will be ignored.
        self.segment_updater.kill();
        // Grab the receiver of the current channel before `self` gets replaced, so that
        // the pending documents can be drained below.
        let document_receiver_res = self.operation_receiver();

        // take the directory lock to create a new index_writer.
        let directory_lock = self
            ._directory_lock
            .take()
            .expect("The IndexWriter does not have any lock. This is a bug, please report.");

        let new_index_writer = IndexWriter::new(&self.index, self.options.clone(), directory_lock)?;

        // the current `self` is dropped right away because of this call.
        //
        // This will drop the document queue, and the thread
        // should terminate.
        *self = new_index_writer;

        // Drains the document receiver pipeline :
        // Workers don't need to index the pending documents.
        //
        // This will reach an end as the only document_sender
        // was dropped with the index_writer.
        if let Ok(document_receiver) = document_receiver_res {
            for _ in document_receiver {}
        }

        Ok(self.committed_opstamp)
    }

    /// Prepares a commit.
    ///
    /// Calling `prepare_commit()` will cut the indexing
    /// queue. All pending documents will be sent to the
    /// indexing workers. They will then terminate, regardless
    /// of the size of their current segment and flush their
    /// work on disk.
    ///
    /// Once a commit is "prepared", you can either
    /// call
    /// * `.commit()`: to accept this commit
    /// * `.abort()`: to cancel this commit.
    ///
    /// In the current implementation, [`PreparedCommit`] borrows
    /// the [`IndexWriter`] mutably so we are guaranteed that no new
    /// document can be added until it is committed or
    /// dropped.
    ///
    /// It is also possible to add a payload to the `commit`
    /// using this API.
    /// See [`PreparedCommit::set_payload()`].
    ///
    /// # Errors
    ///
    /// Returns `TantivyError::ErrorInThread` if an indexing worker panicked. The error
    /// returned by a failed worker, or raised while spawning a replacement worker,
    /// is forwarded.
    pub fn prepare_commit(&mut self) -> crate::Result<PreparedCommit<'_, D>> {
        // Here, because we join all of the worker threads,
        // all of the segment updates for this commit have been
        // sent.
        //
        // No document belonging to the next commit has been
        // pushed either, because add_document can only happen
        // on this thread.
        //
        // This will move uncommitted segments to the state of
        // committed segments.
        info!("Preparing commit");

        // this will drop the current document channel
        // and recreate a new one.
        self.recreate_document_channel();

        let former_workers_join_handle = std::mem::take(&mut self.workers_join_handle);

        // Each former worker is joined, then replaced by a new worker consuming
        // the new channel.
        for worker_handle in former_workers_join_handle {
            let indexing_worker_result = worker_handle
                .join()
                .map_err(|e| TantivyError::ErrorInThread(format!("{e:?}")))?;
            indexing_worker_result?;
            self.add_indexing_worker()?;
        }

        // The commit itself gets an opstamp, taken once all the workers have been joined.
        let commit_opstamp = self.stamper.stamp();
        let prepared_commit = PreparedCommit::new(self, commit_opstamp);
        info!("Prepared commit {commit_opstamp}");
        Ok(prepared_commit)
    }

    /// Commits all of the pending changes
    ///
    /// A call to commit blocks.
    /// After it returns, all of the documents that
    /// were added since the last commit are published
    /// and persisted.
    ///
    /// In case of a crash or a hardware failure (as
    /// long as the hard disk is spared), it will be possible
    /// to resume indexing from this point.
    ///
    /// Commit returns the `opstamp` of the last document
    /// that made it in the commit.
    ///
    /// This is a shorthand for `prepare_commit()` immediately followed by `commit()` on
    /// the prepared commit.
    pub fn commit(&mut self) -> crate::Result<Opstamp> {
        self.prepare_commit()?.commit()
    }

    /// Accessor to the segment updater of this writer.
    pub(crate) fn segment_updater(&self) -> &SegmentUpdater {
        &self.segment_updater
    }

    /// Deletes all documents containing a given term.
    ///
    /// A delete operation only affects documents that
    /// were added in previous commits, and documents
    /// that were added previously in the same commit.
    ///
    /// Like adds, the deletion itself will be visible
    /// only after calling `commit()`.
    ///
    /// Returns the opstamp of the delete operation. If the delete query cannot be built,
    /// nothing is deleted and a fresh opstamp is returned instead.
    pub fn delete_term(&self, term: Term) -> Opstamp {
        let term_query = TermQuery::new(term, IndexRecordOption::Basic);
        match self.delete_query(Box::new(term_query)) {
            Ok(opstamp) => opstamp,
            // For backward compatibility, if Term is invalid for the index, do nothing but
            // return an Opstamp
            Err(_) => self.stamper.stamp(),
        }
    }

    /// Deletes all documents matching a given query.
    /// Returns an `Err` if the query can't be executed.
    ///
    /// A delete operation only affects documents that
    /// were added in previous commits, and documents
    /// that were added previously in the same commit.
    ///
    /// Like adds, the deletion itself will be visible
    /// only after calling `commit()`.
    ///
    /// On success, the opstamp attributed to the delete operation is returned. No opstamp
    /// is consumed when the weight of the query cannot be built.
    #[doc(hidden)]
    pub fn delete_query(&self, query: Box<dyn Query>) -> crate::Result<Opstamp> {
        let schema = self.index.schema();
        let target = query.weight(EnableScoring::disabled_from_schema(&schema))?;
        let opstamp = self.stamper.stamp();
        self.delete_queue.push(DeleteOperation { opstamp, target });
        Ok(opstamp)
    }

    /// Returns the opstamp of the last successful commit.
    ///
    /// This is, for instance, the opstamp the index will
    /// roll back to if there is a failure like a power surge.
    ///
    /// This is also the opstamp of the commit that is currently
    /// available for searchers.
    pub fn commit_opstamp(&self) -> Opstamp {
        self.committed_opstamp
    }

    /// Adds a document.
    ///
    /// If the indexing pipeline is full, this call may block.
    ///
    /// The opstamp is an increasing `u64` that can
    /// be used by the client to align commits with its own
    /// document queue.
    pub fn add_document(&self, document: D) -> crate::Result<Opstamp> {
        let opstamp = self.stamper.stamp();
        self.send_add_documents_batch(smallvec![AddOperation { opstamp, document }])?;
        Ok(opstamp)
    }

    /// Reserves `count + 1` stamps from the stamper and splits them between the
    /// operations of a batch and the batch itself.
    ///
    /// Returns a tuple made of the last reserved opstamp, which is meant for the batch
    /// itself, and of the range of the `count` opstamps preceding it, one per operation.
    fn get_batch_opstamps(&self, count: Opstamp) -> (Opstamp, Range<Opstamp>) {
        let reserved = self.stamper.stamps(count + 1u64);
        let batch_opstamp = reserved.end - 1;
        (batch_opstamp, reserved.start..batch_opstamp)
    }

    /// Runs a group of document operations, ensuring that the operations are
    /// assigned contiguous u64 opstamps and that add operations of the same
    /// group are flushed into the same segment.
    ///
    /// If the indexing pipeline is full, this call may block.
    ///
    /// Each operation of the given `user_operations` will receive an in-order,
    /// contiguous u64 opstamp. The entire batch itself is also given an
    /// opstamp that is 1 greater than the last given operation. This
    /// `batch_opstamp` is the return value of `run`. An empty group of
    /// `user_operations`, an empty `Vec<UserOperation>`, still receives
    /// a valid opstamp even though no changes were _actually_ made to the index.
    ///
    /// Like adds and deletes (see `IndexWriter.add_document` and
    /// `IndexWriter.delete_term`), the changes made by calling `run` will be
    /// visible to readers only after calling `commit()`.
    ///
    /// # Errors
    ///
    /// Returns an error as soon as the weight of a delete query cannot be built; the
    /// delete operations preceding it in the group have already been queued by then.
    /// Also returns an error if the add operations cannot be sent to the indexing workers.
    pub fn run<I>(&self, user_operations: I) -> crate::Result<Opstamp>
    where
        I: IntoIterator<Item = UserOperation<D>>,
        I::IntoIter: ExactSizeIterator,
    {
        let operations = user_operations.into_iter();
        let num_operations = operations.len() as u64;
        if num_operations == 0 {
            return Ok(self.stamper.stamp());
        }
        let (batch_opstamp, opstamps) = self.get_batch_opstamps(num_operations);

        let mut adds = AddBatch::default();
        for (operation, opstamp) in operations.zip(opstamps) {
            match operation {
                // Adds are gathered, and sent to the workers as one single batch.
                UserOperation::Add(document) => adds.push(AddOperation { opstamp, document }),
                // Deletes are queued right away.
                UserOperation::Delete(term) => {
                    let schema = self.index.schema();
                    let target = TermQuery::new(term, IndexRecordOption::Basic)
                        .weight(EnableScoring::disabled_from_schema(&schema))?;
                    self.delete_queue.push(DeleteOperation { opstamp, target });
                }
            }
        }
        self.send_add_documents_batch(adds)?;
        Ok(batch_opstamp)
    }

    /// Submits a batch of add operations through `operation_sender`.
    ///
    /// # Errors
    ///
    /// Returns an "An index writer was killed." error when the writer status
    /// is no longer alive or when sending the batch fails.
    fn send_add_documents_batch(&self, add_ops: AddBatch<D>) -> crate::Result<()> {
        if !self.index_writer_status.is_alive() {
            return Err(error_in_index_worker_thread("An index writer was killed."));
        }
        self.operation_sender
            .send(add_ops)
            .map_err(|_| error_in_index_worker_thread("An index writer was killed."))
    }
}

impl<D: Document> Drop for IndexWriter<D> {
    /// Shuts the writer down: kills the segment updater, drops the sender
    /// and then joins every worker thread.
    fn drop(&mut self) {
        self.segment_updater.kill();
        // NOTE(review): presumably dropping the sender is what lets the
        // workers terminate so that the joins below return — confirm.
        self.drop_sender();
        self.workers_join_handle.drain(..).for_each(|worker| {
            // The outcome of the worker thread is deliberately ignored.
            let _ = worker.join();
        });
    }
}

#[cfg(test)]
mod tests {
    use std::collections::{HashMap, HashSet};
    use std::net::Ipv6Addr;

    use columnar::{Column, MonotonicallyMappableToU128};
    use itertools::Itertools;
    use proptest::prop_oneof;

    use super::super::operation::UserOperation;
    use crate::collector::{Count, TopDocs};
    use crate::directory::error::LockError;
    use crate::error::*;
    use crate::indexer::index_writer::MEMORY_BUDGET_NUM_BYTES_MIN;
    use crate::indexer::{IndexWriterOptions, NoMergePolicy};
    use crate::query::{QueryParser, TermQuery};
    use crate::schema::{
        self, Facet, FacetOptions, IndexRecordOption, IpAddrOptions, JsonObjectOptions,
        NumericOptions, Schema, TextFieldIndexing, TextOptions, Value, FAST, INDEXED, STORED,
        STRING, TEXT,
    };
    use crate::store::DOCSTORE_CACHE_CAPACITY;
    use crate::{
        DateTime, DocAddress, Index, IndexSettings, IndexWriter, ReloadPolicy, TantivyDocument,
        Term,
    };

    /// Lorem-ipsum filler paragraph, prefixed with `Doc `.
    ///
    /// NOTE(review): presumably used as a sizeable text payload by tests
    /// further down in this module — confirm against its call sites.
    const LOREM: &str = "Doc Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do \
                         eiusmod tempor incididunt ut labore et dolore magna aliqua. Ut enim ad \
                         minim veniam, quis nostrud exercitation ullamco laboris nisi ut aliquip \
                         ex ea commodo consequat. Duis aute irure dolor in reprehenderit in \
                         voluptate velit esse cillum dolore eu fugiat nulla pariatur. Excepteur \
                         sint occaecat cupidatat non proident, sunt in culpa qui officia deserunt \
                         mollit anim id est laborum.";

    /// A batch of two operations consumes three opstamps: 0 and 1 for the
    /// operations, and 2 for the batch itself.
    #[test]
    fn test_operations_group() {
        let mut builder = schema::Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());
        let writer = index.writer_for_tests().unwrap();

        let batch_opstamp = writer
            .run(vec![
                UserOperation::Add(doc!(text_field=>"a")),
                UserOperation::Add(doc!(text_field=>"b")),
            ])
            .unwrap();

        assert_eq!(batch_opstamp, 2u64);
    }

    /// Committing a delete that matches no live document must leave the
    /// segment's delete opstamp untouched.
    #[test]
    fn test_no_need_to_rewrite_delete_file_if_no_new_deletes() {
        let mut builder = schema::Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());

        let mut writer: IndexWriter = index.writer_for_tests().unwrap();
        writer.add_document(doc!(text_field => "hello1")).unwrap();
        writer.add_document(doc!(text_field => "hello2")).unwrap();
        assert!(writer.commit().is_ok());

        let reader = index.reader().unwrap();
        // Checks that there is exactly one segment and returns its doc count.
        let single_segment_num_docs = || {
            let searcher = reader.searcher();
            assert_eq!(searcher.segment_readers().len(), 1);
            searcher.segment_reader(0u32).num_docs()
        };
        let segment_delete_opstamp =
            || index.load_metas().unwrap().segments[0].delete_opstamp();

        assert_eq!(single_segment_num_docs(), 2);

        // First delete: removes the only document containing `hello1`.
        writer.delete_term(Term::from_field_text(text_field, "hello1"));
        assert!(writer.commit().is_ok());
        assert!(reader.reload().is_ok());
        assert_eq!(single_segment_num_docs(), 1);

        let opstamp_before = segment_delete_opstamp();

        // Second delete: every document containing `hello1` is already gone,
        // so the delete meta should not be updated.
        writer.delete_term(Term::from_field_text(text_field, "hello1"));
        assert!(writer.commit().is_ok());
        assert!(reader.reload().is_ok());
        assert_eq!(single_segment_num_docs(), 1);

        let opstamp_after = segment_delete_opstamp();
        assert_eq!(opstamp_after, opstamp_before);
    }

    /// Operations inside a batch are applied in order.
    ///
    /// The batch is: delete "a", add "a", add "b", delete "b". After the
    /// commit exactly one document matches "a" and none matches "b".
    #[test]
    fn test_ordered_batched_operations() {
        let mut builder = schema::Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());
        let reader = index
            .reader_builder()
            .reload_policy(ReloadPolicy::Manual)
            .try_into()
            .unwrap();
        let mut writer: IndexWriter = index.writer_for_tests().unwrap();
        let term_of = |text: &str| Term::from_field_text(text_field, text);

        let batch = vec![
            UserOperation::Delete(term_of("a")),
            UserOperation::Add(doc!(text_field=>"a")),
            UserOperation::Add(doc!(text_field=>"b")),
            UserOperation::Delete(term_of("b")),
        ];
        writer.run(batch).unwrap();
        writer.commit().expect("failed to commit");
        reader.reload().expect("failed to load searchers");

        let query_a = TermQuery::new(term_of("a"), IndexRecordOption::Basic);
        let query_b = TermQuery::new(term_of("b"), IndexRecordOption::Basic);
        let searcher = reader.searcher();

        let hits_a = searcher
            .search(&query_a, &TopDocs::with_limit(1).order_by_score())
            .expect("search for a failed");
        let hits_b = searcher
            .search(&query_b, &TopDocs::with_limit(1).order_by_score())
            .expect("search for b failed");

        assert_eq!(hits_a.len(), 1);
        assert_eq!(hits_b.len(), 0);
    }

    /// Every empty batch still consumes one opstamp: the first one gets 0,
    /// the second one gets 1.
    #[test]
    fn test_empty_operations_group() {
        let index = Index::create_in_ram(schema::Schema::builder().build());
        let writer: IndexWriter = index.writer_for_tests().unwrap();
        for expected_opstamp in 0u64..2u64 {
            let batch_opstamp = writer.run(vec![]).unwrap();
            assert_eq!(batch_opstamp, expected_opstamp);
        }
    }

    /// While one writer is alive, creating a second one on the same index
    /// must fail with `LockFailure(LockBusy, _)`.
    #[test]
    fn test_lockfile_stops_duplicates() {
        let index = Index::create_in_ram(schema::Schema::builder().build());
        let _lock_holder: IndexWriter = index.writer_for_tests().unwrap();
        let second_attempt = index.writer_for_tests::<TantivyDocument>();
        assert!(
            matches!(
                second_attempt,
                Err(TantivyError::LockFailure(LockError::LockBusy, _))
            ),
            "Expected a `LockFailure` error"
        );
    }

    /// The error returned when a second writer is requested must mention
    /// that there is already an `IndexWriter`.
    #[test]
    fn test_lockfile_already_exists_error_msg() {
        let index = Index::create_in_ram(schema::Schema::builder().build());
        let _lock_holder: IndexWriter = index.writer_for_tests().unwrap();
        let err_msg = if let Err(err) = index.writer_for_tests::<TantivyDocument>() {
            err.to_string()
        } else {
            panic!("Expected LockfileAlreadyExists error")
        };
        assert!(err_msg.contains("already an `IndexWriter`"));
    }

    /// A fresh writer reports a `LogMergePolicy` with the expected settings;
    /// after `set_merge_policy` it reports the newly installed policy.
    #[test]
    fn test_set_merge_policy() {
        let index = Index::create_in_ram(schema::Schema::builder().build());
        let writer: IndexWriter = index.writer_for_tests().unwrap();
        // Debug rendering of whichever merge policy is currently installed.
        let merge_policy_debug = || format!("{:?}", writer.get_merge_policy());

        assert_eq!(
            merge_policy_debug(),
            "LogMergePolicy { min_num_segments: 8, max_docs_before_merge: 10000000, \
             min_layer_size: 10000, level_log_size: 0.75, del_docs_ratio_before_merge: 1.0 }"
        );

        writer.set_merge_policy(Box::<NoMergePolicy>::default());
        assert_eq!(merge_policy_debug(), "NoMergePolicy");
    }

    /// Dropping a writer releases its lock, so a new writer can be created
    /// right afterwards.
    #[test]
    fn test_lockfile_released_on_drop() {
        let index = Index::create_in_ram(schema::Schema::builder().build());
        let first_writer: IndexWriter = index.writer_for_tests().unwrap();
        // The lock should be released as soon as the first writer is dropped.
        drop(first_writer);
        let _second_writer: IndexWriter = index.writer_for_tests().unwrap();
    }

    /// A rolled back document never becomes searchable, while documents
    /// added after the rollback and then committed do.
    #[test]
    fn test_commit_and_rollback() -> crate::Result<()> {
        let mut builder = schema::Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());
        let reader = index
            .reader_builder()
            .reload_policy(ReloadPolicy::Manual)
            .try_into()?;
        let doc_freq_of = |text: &str| {
            let term = Term::from_field_text(text_field, text);
            reader.searcher().doc_freq(&term).unwrap()
        };

        let mut writer = index.writer_for_tests()?;

        // "a" is added and immediately rolled back.
        writer.add_document(doc!(text_field=>"a"))?;
        writer.rollback()?;
        assert_eq!(writer.commit_opstamp(), 0u64);
        assert_eq!(doc_freq_of("a"), 0);

        // "b" and "c" are added and committed.
        writer.add_document(doc!(text_field=>"b"))?;
        writer.add_document(doc!(text_field=>"c"))?;
        writer.commit()?;
        reader.reload()?;
        assert_eq!(doc_freq_of("a"), 0);
        assert_eq!(doc_freq_of("b"), 1);
        assert_eq!(doc_freq_of("c"), 1);

        // Reloading and searching must still work once the writer is gone.
        drop(writer);
        reader.reload()?;
        reader.searcher();
        Ok(())
    }

    /// Merging a single segment whose only document was deleted leaves no
    /// searchable segment behind.
    #[test]
    fn test_merge_on_empty_segments_single_segment() -> crate::Result<()> {
        let mut builder = schema::Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());
        let reader = index
            .reader_builder()
            .reload_policy(ReloadPolicy::Manual)
            .try_into()?;
        let doc_freq_of = |text: &str| {
            let term = Term::from_field_text(text_field, text);
            reader.searcher().doc_freq(&term).unwrap()
        };

        // One document, one commit: this should create 1 segment.
        let mut writer: IndexWriter = index.writer_for_tests().unwrap();
        writer.add_document(doc!(text_field=>"a"))?;
        writer.commit()?;

        let segment_ids = index.searchable_segment_ids().unwrap();
        assert_eq!(segment_ids.len(), 1);
        reader.reload().unwrap();
        assert_eq!(doc_freq_of("a"), 1);

        // Delete the only document.
        writer.delete_term(Term::from_field_text(text_field, "a"));
        writer.commit()?;
        reader.reload().unwrap();
        assert_eq!(doc_freq_of("a"), 0);

        // Merge the now empty segment.
        writer.merge(&segment_ids);
        writer.wait_merging_threads().unwrap();

        let remaining_segment_ids = index.searchable_segment_ids().unwrap();
        assert_eq!(remaining_segment_ids.len(), 0);

        Ok(())
    }

    /// Merging four segments whose documents were all deleted leaves no
    /// searchable segment behind.
    #[test]
    fn test_merge_on_empty_segments() -> crate::Result<()> {
        let mut builder = schema::Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());
        let reader = index
            .reader_builder()
            .reload_policy(ReloadPolicy::Manual)
            .try_into()?;
        let doc_freq_of = |text: &str| {
            let term = Term::from_field_text(text_field, text);
            reader.searcher().doc_freq(&term).unwrap()
        };

        // Four add + commit rounds: this should create 4 segments.
        let mut writer: IndexWriter = index.writer_for_tests().unwrap();
        for _round in 0..4 {
            writer.add_document(doc!(text_field=>"a"))?;
            writer.commit()?;
        }

        let segment_ids = index.searchable_segment_ids().unwrap();
        assert_eq!(segment_ids.len(), 4);
        reader.reload().unwrap();
        assert_eq!(doc_freq_of("a"), 4);

        // Delete every document.
        writer.delete_term(Term::from_field_text(text_field, "a"));
        writer.commit()?;
        reader.reload().unwrap();
        assert_eq!(doc_freq_of("a"), 0);

        // Merge the now empty segments.
        writer.merge(&segment_ids);
        writer.wait_merging_threads().unwrap();

        let remaining_segment_ids = index.searchable_segment_ids().unwrap();
        assert_eq!(remaining_segment_ids.len(), 0);

        Ok(())
    }

    /// Two commits of 100 tiny documents each: once merging has finished,
    /// all 200 documents are searchable and fewer than 8 segments remain.
    #[test]
    fn test_with_merges() -> crate::Result<()> {
        let mut builder = schema::Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());
        let reader = index
            .reader_builder()
            .reload_policy(ReloadPolicy::Manual)
            .try_into()?;
        let doc_freq_of = |text: &str| {
            let term = Term::from_field_text(text_field, text);
            reader.searcher().doc_freq(&term).unwrap()
        };

        let mut writer = index.writer(MEMORY_BUDGET_NUM_BYTES_MIN).unwrap();
        // Each round adds 100 tiny docs and commits; the second commit is
        // the one expected to trigger a merge.
        for _round in 0..2 {
            for _doc in 0..100 {
                writer.add_document(doc!(text_field=>"a"))?;
            }
            writer.commit()?;
        }
        writer.wait_merging_threads()?;

        reader.reload()?;
        assert_eq!(doc_freq_of("a"), 200);
        assert!(index.searchable_segments()?.len() < 8);
        Ok(())
    }

    /// A payload set on a prepared commit is stored in the metas; a later
    /// plain commit stores no payload.
    #[test]
    fn test_prepare_with_commit_message() -> crate::Result<()> {
        let mut builder = schema::Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());
        let mut writer = index.writer_for_tests()?;

        // First commit: prepared, with a payload.
        for _doc in 0..100 {
            writer.add_document(doc!(text_field => "a"))?;
        }
        {
            let mut prepared = writer.prepare_commit()?;
            prepared.set_payload("first commit");
            prepared.commit()?;
        }
        let metas_after_first = index.load_metas()?;
        assert_eq!(metas_after_first.payload.unwrap(), "first commit");

        // Second commit: plain, without a payload.
        for _doc in 0..100 {
            writer.add_document(doc!(text_field => "a"))?;
        }
        writer.commit()?;
        let metas_after_second = index.load_metas()?;
        assert!(metas_after_second.payload.is_none());

        Ok(())
    }

    /// Aborting a prepared commit discards both its payload and the
    /// documents added before it; documents added afterwards and committed
    /// normally are searchable.
    #[test]
    fn test_prepare_but_rollback() -> crate::Result<()> {
        let mut builder = schema::Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());

        {
            let mut writer = index.writer_with_num_threads(4, MEMORY_BUDGET_NUM_BYTES_MIN * 4)?;

            // 100 tiny "a" docs whose prepared commit is aborted.
            for _doc in 0..100 {
                writer.add_document(doc!(text_field => "a"))?;
            }
            {
                let mut prepared = writer.prepare_commit()?;
                prepared.set_payload("first commit");
                prepared.abort()?;
            }
            let metas_after_abort = index.load_metas()?;
            assert!(metas_after_abort.payload.is_none());

            // 100 tiny "b" docs that are committed for real.
            for _doc in 0..100 {
                writer.add_document(doc!(text_field => "b"))?;
            }
            writer.commit()?;
        }

        // Every lookup goes through a brand new reader.
        let doc_freq_of = |text: &str| {
            let term = Term::from_field_text(text_field, text);
            index
                .reader_builder()
                .reload_policy(ReloadPolicy::Manual)
                .try_into()?
                .searcher()
                .doc_freq(&term)
        };
        assert_eq!(doc_freq_of("a")?, 0);
        assert_eq!(doc_freq_of("b")?, 100);
        Ok(())
    }

    /// A committed document is no longer searchable after
    /// `delete_all_documents` followed by a commit.
    #[test]
    fn test_add_then_delete_all_documents() {
        let mut builder = schema::Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());
        let reader = index
            .reader_builder()
            .reload_policy(ReloadPolicy::Manual)
            .try_into()
            .unwrap();
        // Reloads the reader before every lookup.
        let doc_freq_of = |text: &str| {
            reader.reload().unwrap();
            let term = Term::from_field_text(text_field, text);
            reader.searcher().doc_freq(&term).unwrap()
        };
        let mut writer = index
            .writer_with_num_threads(4, MEMORY_BUDGET_NUM_BYTES_MIN * 4)
            .unwrap();

        let add_opstamp = writer.add_document(doc!(text_field => "a")).unwrap();
        let commit_opstamp = writer.commit().unwrap();
        assert!(commit_opstamp > add_opstamp);

        writer.delete_all_documents().unwrap();
        writer.commit().unwrap();

        // The term of the document added above must not match anything.
        assert_eq!(doc_freq_of("a"), 0);
    }

    /// Checks the opstamps returned around `delete_all_documents`, and that a
    /// rollback returns to the commit that cleared the index.
    #[test]
    fn test_delete_all_documents_rollback_correct_stamp() {
        let mut builder = schema::Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());
        let mut writer = index
            .writer_with_num_threads(4, MEMORY_BUDGET_NUM_BYTES_MIN * 4)
            .unwrap();

        let add_opstamp = writer.add_document(doc!(text_field => "a")).unwrap();

        // Commit the document: it is now available.
        let first_commit = writer.commit();
        assert!(first_commit.is_ok());
        assert!(first_commit.unwrap() > add_opstamp);

        // Clear the index.
        let clear_opstamp = writer.delete_all_documents().unwrap();
        assert_eq!(clear_opstamp, add_opstamp);

        // Commit the clear: the document is not available anymore.
        let second_commit = writer.commit();
        assert!(second_commit.is_ok());
        let second_commit_opstamp = second_commit.unwrap();

        // Add new documents again, without committing them.
        for _ in 0..100 {
            writer.add_document(doc!(text_field => "b")).unwrap();
        }

        // Roll back to the last commit, when the index was empty.
        let rollback = writer.rollback();
        assert!(rollback.is_ok());
        assert_eq!(rollback.unwrap(), second_commit_opstamp);

        // Empty index: no document contains "b".
        let searcher = index.reader().unwrap().searcher();
        let b_doc_freq = searcher
            .doc_freq(&Term::from_field_text(text_field, "b"))
            .unwrap();
        assert_eq!(b_doc_freq, 0);
    }

    /// Documents added after a committed `delete_all_documents` are
    /// searchable once they are committed.
    #[test]
    fn test_delete_all_documents_then_add() {
        let mut builder = schema::Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());
        let mut writer = index
            .writer_with_num_threads(4, MEMORY_BUDGET_NUM_BYTES_MIN * 4)
            .unwrap();

        // Clear the (still empty) index and commit.
        let clear = writer.delete_all_documents();
        assert!(clear.is_ok());
        assert!(writer.commit().is_ok());

        // Add one simple doc and commit it.
        writer.add_document(doc!(text_field => "a")).unwrap();
        assert!(writer.commit().is_ok());

        // The document with that term is expected to be in the index.
        let searcher = index.reader().unwrap().searcher();
        let a_doc_freq = searcher
            .doc_freq(&Term::from_field_text(text_field, "a"))
            .unwrap();
        assert_eq!(a_doc_freq, 1);
    }

    /// An uncommitted `delete_all_documents` is undone by a rollback: the
    /// previously committed document is still searchable.
    #[test]
    fn test_delete_all_documents_and_rollback() {
        let mut builder = schema::Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());
        let mut writer = index
            .writer_with_num_threads(4, MEMORY_BUDGET_NUM_BYTES_MIN * 4)
            .unwrap();

        // Add one simple doc and commit it.
        assert!(writer.add_document(doc!(text_field => "a")).is_ok());
        let commit = writer.commit();
        assert!(commit.is_ok());
        let commit_opstamp = commit.unwrap();

        // Clear, but do not commit. The returned opstamp should be one from
        // before the last commit.
        let clear_opstamp = writer.delete_all_documents().unwrap();
        assert!(clear_opstamp < commit_opstamp);

        let _rollback_opstamp = writer.rollback().unwrap();

        // The original document is expected to be back in the index.
        let searcher = index.reader().unwrap().searcher();
        let a_doc_freq = searcher
            .doc_freq(&Term::from_field_text(text_field, "a"))
            .unwrap();
        assert_eq!(a_doc_freq, 1);
    }

    /// Clearing and committing an index that never held a document
    /// succeeds.
    #[test]
    fn test_delete_all_documents_empty_index() {
        let index = Index::create_in_ram(schema::Schema::builder().build());
        let mut writer: IndexWriter = index
            .writer_with_num_threads(4, MEMORY_BUDGET_NUM_BYTES_MIN * 4)
            .unwrap();
        let clear_result = writer.delete_all_documents();
        let commit_result = writer.commit();
        assert!(clear_result.is_ok());
        assert!(commit_result.is_ok());
    }

    /// Clearing and committing an empty index twice in a row succeeds both
    /// times.
    #[test]
    fn test_delete_all_documents_index_twice() {
        let index = Index::create_in_ram(schema::Schema::builder().build());
        let mut writer: IndexWriter = index
            .writer_with_num_threads(4, MEMORY_BUDGET_NUM_BYTES_MIN * 4)
            .unwrap();
        for _round in 0..2 {
            let clear_result = writer.delete_all_documents();
            let commit_result = writer.commit();
            assert!(clear_result.is_ok());
            assert!(commit_result.is_ok());
        }
    }

    /// After deleting a document and merging its segment, the term of the
    /// deleted document is gone from the string fast field dictionary and
    /// the remaining term ordinals are remapped.
    #[test]
    fn test_delete_and_merge_removes_terms_fast_field_dict() {
        let mut builder = schema::Schema::builder();
        let text_field = builder.add_text_field("text", STRING | FAST);
        let index = Index::builder()
            .schema(builder.build())
            .create_in_ram()
            .unwrap();

        let mut writer: IndexWriter = index.writer_for_tests().unwrap();
        writer.add_document(doc!(text_field => "one")).unwrap();
        writer.add_document(doc!(text_field => "two")).unwrap();
        writer.add_document(doc!(text_field => "three")).unwrap();
        writer.commit().unwrap();

        let index_reader = index.reader().unwrap();
        let searcher = index_reader.searcher();
        let segment_reader = searcher.segment_reader(0);
        let text_fast_field = segment_reader.fast_fields().str("text").unwrap().unwrap();

        // Before the delete: three terms, looked up by ordinal.
        let mut buffer = String::new();
        for &(ord, expected_term) in &[(0, "one"), (1, "three"), (2, "two")] {
            assert!(text_fast_field.ord_to_str(ord, &mut buffer).unwrap());
            assert_eq!(buffer, expected_term);
        }
        assert!(!text_fast_field.ord_to_str(3, &mut buffer).unwrap());
        assert_eq!(segment_reader.max_doc(), 3);

        // Delete "three", then merge the segment on its own.
        writer.delete_term(Term::from_field_text(text_field, "three"));
        writer.commit().unwrap();
        writer
            .merge(&[segment_reader.segment_id()])
            .wait()
            .unwrap();
        index_reader.reload().unwrap();

        let searcher = index_reader.searcher();
        let segment_reader = searcher.segment_reader(0);
        assert_eq!(segment_reader.max_doc(), 2);
        let text_fast_field = segment_reader.fast_fields().str("text").unwrap().unwrap();

        // After the merge: only "one" and "two" are left.
        let mut buffer = String::new();
        for &(ord, expected_term) in &[(0, "one"), (1, "two")] {
            assert!(text_fast_field.ord_to_str(ord, &mut buffer).unwrap());
            assert_eq!(buffer, expected_term);
        }
        assert!(!text_fast_field.ord_to_str(2, &mut buffer).unwrap());
        assert!(text_fast_field.term_ords(0).eq([0].into_iter()));
        assert!(text_fast_field.term_ords(1).eq([1].into_iter()));
    }

    /// One step of a randomly generated indexing scenario.
    ///
    /// `expected_ids` and `get_id_list` replay a slice of these operations
    /// to compute which ids are expected to remain.
    #[derive(Debug, Clone)]
    enum IndexingOp {
        /// Adds `num_docs` documents for `id` (`expected_ids` counts this
        /// as `num_docs` occurrences of `id`).
        AddMultipleDoc {
            id: u64,
            num_docs: u64,
            value: IndexValue,
        },
        /// Adds a single document for `id`.
        AddDoc {
            id: u64,
            value: IndexValue,
        },
        /// Deletes every document of `id`.
        DeleteDoc {
            id: u64,
        },
        /// Deletes every document of `id`. `expected_ids` and `get_id_list`
        /// treat it exactly like `DeleteDoc`.
        // NOTE(review): presumably issued as a query-based delete rather than
        // a term delete — confirm where the operations are applied.
        DeleteDocQuery {
            id: u64,
        },
        /// Ignored by `expected_ids` and `get_id_list`.
        Commit,
        /// Ignored by `expected_ids` and `get_id_list`.
        Merge,
    }
    impl IndexingOp {
        /// Shorthand for an `AddDoc` whose value is the id converted to
        /// `f64`.
        fn add(id: u64) -> Self {
            let value = IndexValue::F64(id as f64);
            Self::AddDoc { id, value }
        }
    }

    use serde::Serialize;
    /// Value attached to a generated document: a string, a float, an
    /// unsigned integer or a signed integer.
    ///
    /// `#[serde(untagged)]` makes the value serialize as its bare payload,
    /// without any variant tag.
    #[derive(Debug, Clone, Serialize)]
    #[serde(untagged)]
    enum IndexValue {
        /// Text payload.
        Str(String),
        /// Floating point payload.
        F64(f64),
        /// Unsigned integer payload.
        U64(u64),
        /// Signed integer payload.
        I64(i64),
    }
    impl Default for IndexValue {
        fn default() -> Self {
            IndexValue::F64(0.0)
        }
    }

    fn value_strategy() -> impl Strategy<Value = IndexValue> {
        prop_oneof![
            any::<f64>().prop_map(IndexValue::F64),
            any::<u64>().prop_map(IndexValue::U64),
            any::<i64>().prop_map(IndexValue::I64),
            any::<String>().prop_map(IndexValue::Str),
        ]
    }

    fn balanced_operation_strategy() -> impl Strategy<Value = IndexingOp> {
        prop_oneof![
            (0u64..20u64).prop_map(|id| IndexingOp::DeleteDoc { id }),
            (0u64..20u64).prop_map(|id| IndexingOp::DeleteDocQuery { id }),
            (0u64..20u64, value_strategy())
                .prop_map(move |(id, value)| IndexingOp::AddDoc { id, value }),
            ((0u64..20u64), (1u64..100), value_strategy()).prop_map(
                move |(id, num_docs, value)| {
                    IndexingOp::AddMultipleDoc {
                        id,
                        num_docs,
                        value,
                    }
                }
            ),
            (0u64..1u64).prop_map(|_| IndexingOp::Commit),
            (0u64..1u64).prop_map(|_| IndexingOp::Merge),
        ]
    }

    fn adding_operation_strategy() -> impl Strategy<Value = IndexingOp> {
        prop_oneof![
            5 => (0u64..100u64).prop_map(|id| IndexingOp::DeleteDoc { id }),
            5 => (0u64..100u64).prop_map(|id| IndexingOp::DeleteDocQuery { id }),
            50 => (0u64..100u64, value_strategy())
                .prop_map(move |(id, value)| IndexingOp::AddDoc { id, value }),
            50 => (0u64..100u64, (1u64..100), value_strategy()).prop_map(
                move |(id, num_docs, value)| {
                    IndexingOp::AddMultipleDoc {
                        id,
                        num_docs,
                        value,
                    }
                }
            ),
            2 => (0u64..1u64).prop_map(|_| IndexingOp::Commit),
            1 => (0u64..1u64).prop_map(|_| IndexingOp::Merge),
        ]
    }

    /// Replays `ops` and returns the expected final state as
    /// `(live, deleted)`.
    ///
    /// `live` maps every id that still has documents to its document count;
    /// `deleted` holds the ids whose most recent add/delete operation was a
    /// delete. Commits and merges do not affect the result.
    fn expected_ids(ops: &[IndexingOp]) -> (HashMap<u64, u64>, HashSet<u64>) {
        let mut live_counts: HashMap<u64, u64> = HashMap::new();
        let mut removed_ids: HashSet<u64> = HashSet::new();
        for op in ops {
            // `Some(n)` means "n documents added", `None` means "deleted".
            let (id, added_docs) = match op {
                IndexingOp::AddDoc { id, .. } => (*id, Some(1)),
                IndexingOp::AddMultipleDoc { id, num_docs, .. } => (*id, Some(*num_docs)),
                IndexingOp::DeleteDoc { id } | IndexingOp::DeleteDocQuery { id } => (*id, None),
                IndexingOp::Commit | IndexingOp::Merge => continue,
            };
            match added_docs {
                Some(num_docs) => {
                    *live_counts.entry(id).or_insert(0) += num_docs;
                    removed_ids.remove(&id);
                }
                None => {
                    live_counts.remove(&id);
                    removed_ids.insert(id);
                }
            }
        }
        (live_counts, removed_ids)
    }

    /// Returns one entry per document that should still be alive after replaying `ops`,
    /// in insertion order.
    ///
    /// Unlike `expected_ids`, ids are repeated: an id appears once for every document
    /// that was added with it and not deleted afterwards. Operations other than adds
    /// and deletes are ignored.
    fn get_id_list(ops: &[IndexingOp]) -> Vec<u64> {
        let mut id_list = Vec::new();
        for op in ops {
            match op {
                IndexingOp::AddDoc { id, .. } => id_list.push(*id),
                IndexingOp::AddMultipleDoc { id, num_docs, .. } => {
                    // `AddMultipleDoc` adds `num_docs` documents, so the id has to be
                    // recorded that many times; recording it once would undercount
                    // any per-document expectation derived from this list.
                    id_list.extend((0..*num_docs).map(|_| *id));
                }
                IndexingOp::DeleteDoc { id } | IndexingOp::DeleteDocQuery { id } => {
                    // A delete removes every document carrying the id.
                    id_list.retain(|el| el != id);
                }
                _ => {}
            }
        }
        id_list
    }

    /// Replays `ops` against a fresh in-RAM index and cross-checks the index contents
    /// against the in-memory model computed by `expected_ids` and `get_id_list`.
    ///
    /// The checks cover document counts, the `id` fast field, the multi-valued `ips`,
    /// `multi_numbers` and `multi_bools` fast fields, the doc store, term / phrase /
    /// range queries and facets.
    ///
    /// * `ops` - operations to replay, in order, against the index writer.
    /// * `force_end_merge` - when `true`, all searchable segments are merged after the
    ///   final commit (provided there are at least two of them).
    ///
    /// Returns the index on success. Failed expectations panic via `assert!` / `unwrap`;
    /// errors from the writer and reader calls using `?` are returned as `Err`.
    fn test_operation_strategy(ops: &[IndexingOp], force_end_merge: bool) -> crate::Result<Index> {
        // Schema with one field of each kind exercised by the checks below.
        let mut schema_builder = schema::Schema::builder();
        let json_field = schema_builder.add_json_field("json", FAST | TEXT | STORED);
        let ip_field = schema_builder.add_ip_addr_field("ip", FAST | INDEXED | STORED);
        let ips_field = schema_builder
            .add_ip_addr_field("ips", IpAddrOptions::default().set_fast().set_indexed());
        let i64_field = schema_builder.add_i64_field("i64", INDEXED);
        let id_field = schema_builder.add_u64_field("id", FAST | INDEXED | STORED);
        let id_opt_field = schema_builder.add_u64_field("id_opt", FAST | INDEXED | STORED);
        let f64_field = schema_builder.add_f64_field("f64", INDEXED);
        let date_field = schema_builder.add_date_field("date", INDEXED);
        let bytes_field = schema_builder.add_bytes_field("bytes", FAST | INDEXED | STORED);
        let bool_field = schema_builder.add_bool_field("bool", FAST | INDEXED | STORED);
        let text_field = schema_builder.add_text_field(
            "text_field",
            TextOptions::default()
                .set_indexing_options(
                    TextFieldIndexing::default()
                        .set_index_option(schema::IndexRecordOption::WithFreqsAndPositions),
                )
                .set_stored(),
        );

        let large_text_field = schema_builder.add_text_field("large_text_field", TEXT | STORED);
        let multi_text_fields = schema_builder.add_text_field("multi_text_fields", TEXT | STORED);

        let multi_numbers = schema_builder.add_u64_field(
            "multi_numbers",
            NumericOptions::default().set_fast().set_stored(),
        );
        let multi_bools = schema_builder.add_bool_field(
            "multi_bools",
            NumericOptions::default().set_fast().set_stored(),
        );
        let facet_field = schema_builder.add_facet_field("facet", FacetOptions::default());
        let schema = schema_builder.build();
        let settings = {
            IndexSettings {
                ..Default::default()
            }
        };
        let index = Index::builder()
            .schema(schema)
            .settings(settings)
            .create_in_ram()?;
        let mut index_writer = index.writer_for_tests()?;
        // Presumably disables automatic merging so that segments are only merged by
        // the explicit `Merge` op and the optional final merge below.
        index_writer.set_merge_policy(Box::new(NoMergePolicy));

        // Reader created before any document is written; it is reloaded after all
        // operations and is expected to expose the same documents as a fresh reader.
        let old_reader = index.reader()?;

        // Ids divisible by 3 get a document with only the id field; all others get every field.
        let id_is_full_doc = |id| id % 3 != 0;

        let multi_text_field_text1 = "test1 test2 test3 test1 test2 test3";
        // rotate left
        let multi_text_field_text2 = "test2 test3 test1 test2 test3 test1";
        // rotate right
        let multi_text_field_text3 = "test3 test1 test2 test3 test1 test2";

        // The ip address of a document is derived from its id.
        let ip_from_id = |id| Ipv6Addr::from_u128(id as u128);

        // Builds the document for `id` once and adds `num` copies of it to the writer.
        let add_docs = |index_writer: &mut IndexWriter,
                        id: u64,
                        value: IndexValue,
                        num: u64|
         -> crate::Result<()> {
            let facet = Facet::from(&("/cola/".to_string() + &id.to_string()));
            let ip = ip_from_id(id);
            let doc = if !id_is_full_doc(id) {
                // Id-only document: no ip field, nor any other field besides the id.
                doc!(
                    id_field=>id,
                )
            } else {
                let json = json!({"date1": format!("2022-{id}-01T00:00:01Z"), "date2": format!("{id}-05-01T00:00:01Z"), "id": id, "ip": ip.to_string(), "val": value});
                // `ips`, `multi_numbers`, `multi_bools` and `multi_text_fields` are set
                // several times so that they hold multiple values per document.
                doc!(id_field=>id,
                        json_field=>json,
                        bytes_field => id.to_le_bytes().as_slice(),
                        id_opt_field => id,
                        ip_field => ip,
                        ips_field => ip,
                        ips_field => ip,
                        multi_numbers=> id,
                        multi_numbers => id,
                        bool_field => (id % 2u64) != 0,
                        i64_field => id as i64,
                        f64_field => id as f64,
                        date_field => DateTime::from_timestamp_secs(id as i64),
                        multi_bools => (id % 2u64) != 0,
                        multi_bools => (id % 2u64) == 0,
                        text_field => id.to_string(),
                        facet_field => facet,
                        large_text_field => LOREM,
                        multi_text_fields => multi_text_field_text1,
                        multi_text_fields => multi_text_field_text2,
                        multi_text_fields => multi_text_field_text3,
                )
            };
            for _ in 0..num {
                index_writer.add_document(doc.clone())?;
            }
            Ok(())
        };
        // Replay the operations in order.
        for op in ops {
            match op.clone() {
                IndexingOp::AddMultipleDoc {
                    id,
                    num_docs,
                    value,
                } => {
                    add_docs(&mut index_writer, id, value, num_docs)?;
                }
                IndexingOp::AddDoc { id, value } => {
                    add_docs(&mut index_writer, id, value, 1)?;
                }
                IndexingOp::DeleteDoc { id } => {
                    index_writer.delete_term(Term::from_field_u64(id_field, id));
                }
                IndexingOp::DeleteDocQuery { id } => {
                    let term = Term::from_field_u64(id_field, id);
                    let query = TermQuery::new(term, Default::default());
                    index_writer.delete_query(Box::new(query))?;
                }
                IndexingOp::Commit => {
                    index_writer.commit()?;
                }
                IndexingOp::Merge => {
                    let mut segment_ids = index
                        .searchable_segment_ids()
                        .expect("Searchable segments failed.");
                    segment_ids.sort();
                    // Only merge when there are at least two segments.
                    if segment_ids.len() >= 2 {
                        index_writer.merge(&segment_ids).wait().unwrap();
                        assert!(index_writer.segment_updater().wait_merging_thread().is_ok());
                    }
                }
            }
        }
        // Final commit for whatever the operations left uncommitted.
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();
        let num_segments_before_merge = searcher.segment_readers().len();
        if force_end_merge {
            index_writer.wait_merging_threads()?;
            // A second writer performs the final merge of all searchable segments.
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            let segment_ids = index
                .searchable_segment_ids()
                .expect("Searchable segments failed.");
            if segment_ids.len() >= 2 {
                index_writer.merge(&segment_ids).wait().unwrap();
                assert!(index_writer.wait_merging_threads().is_ok());
            }
        }
        // NOTE(review): `searcher` is the one acquired before the optional merge above and
        // is never re-acquired. If a searcher is a point-in-time snapshot, this value always
        // equals `num_segments_before_merge` and every `searcher` check below runs against
        // the pre-merge segments - confirm whether a fresh searcher was intended here.
        let num_segments_after_merge = searcher.segment_readers().len();

        old_reader.reload()?;
        let old_searcher = old_reader.searcher();

        // Ids of alive documents as seen through the reloaded pre-existing reader.
        let ids_old_searcher: HashSet<u64> = old_searcher
            .segment_readers()
            .iter()
            .flat_map(|segment_reader| {
                let ff_reader = segment_reader.fast_fields().u64("id").unwrap();
                segment_reader
                    .doc_ids_alive()
                    .flat_map(move |doc| ff_reader.values_for_doc(doc).collect_vec().into_iter())
            })
            .collect();

        // Ids of alive documents as seen through `searcher`.
        let ids: HashSet<u64> = searcher
            .segment_readers()
            .iter()
            .flat_map(|segment_reader| {
                let ff_reader = segment_reader.fast_fields().u64("id").unwrap();
                segment_reader
                    .doc_ids_alive()
                    .flat_map(move |doc| ff_reader.values_for_doc(doc).collect_vec().into_iter())
            })
            .collect();

        // The model: id -> number of documents still present, and the set of deleted ids.
        let (expected_ids_and_num_occurrences, deleted_ids) = expected_ids(ops);

        let id_list = get_id_list(ops);

        // multivalue fast field content
        let mut all_ips = Vec::new();
        let mut num_ips = 0;
        for segment_reader in searcher.segment_readers().iter() {
            let ip_reader: Column<Ipv6Addr> = segment_reader
                .fast_fields()
                .column_opt("ips")
                .unwrap()
                .unwrap();
            for doc in segment_reader.doc_ids_alive() {
                all_ips.extend(ip_reader.values_for_doc(doc));
            }
            num_ips += ip_reader.values.num_vals();
        }

        // Total number of documents the model expects to be alive.
        let num_docs_expected = expected_ids_and_num_occurrences
            .values()
            .map(|id_occurrences| *id_occurrences as usize)
            .sum::<usize>();

        // Same, restricted to documents that carry all fields.
        let num_docs_with_values = expected_ids_and_num_occurrences
            .iter()
            .filter(|(id, _id_occurrences)| id_is_full_doc(**id))
            .map(|(_, id_occurrences)| *id_occurrences as usize)
            .sum::<usize>();

        assert_eq!(searcher.num_docs() as usize, num_docs_expected);
        assert_eq!(old_searcher.num_docs() as usize, num_docs_expected);
        assert_eq!(
            ids_old_searcher,
            expected_ids_and_num_occurrences
                .keys()
                .cloned()
                .collect::<HashSet<_>>()
        );
        assert_eq!(
            ids,
            expected_ids_and_num_occurrences
                .keys()
                .cloned()
                .collect::<HashSet<_>>()
        );

        // Checks that only apply when the final merge collapsed several segments into one.
        // NOTE(review): both segment counts are read from the same `searcher` (see the note
        // where `num_segments_after_merge` is computed), so this condition may never hold.
        if force_end_merge && num_segments_before_merge > 1 && num_segments_after_merge == 1 {
            // Every full document contributes its ip twice to the `ips` field.
            let mut expected_multi_ips: Vec<_> = id_list
                .iter()
                .filter(|id| id_is_full_doc(**id))
                .flat_map(|id| vec![ip_from_id(*id), ip_from_id(*id)])
                .collect();
            assert_eq!(num_ips, expected_multi_ips.len() as u32);

            expected_multi_ips.sort();
            all_ips.sort();
            assert_eq!(expected_multi_ips, all_ips);

            // Test fastfield num_docs
            let num_docs: usize = searcher
                .segment_readers()
                .iter()
                .map(|segment_reader| {
                    let ff_reader = segment_reader
                        .fast_fields()
                        .column_opt::<Ipv6Addr>("ips")
                        .unwrap()
                        .unwrap();
                    ff_reader.num_docs() as usize
                })
                .sum();
            assert_eq!(num_docs, num_docs_expected);
        }

        // Load all ips addr
        let mut ips: HashSet<Ipv6Addr> = Default::default();
        for reader in searcher.segment_readers() {
            if let Some(ff_reader) = reader.fast_fields().column_opt::<Ipv6Addr>("ips").unwrap() {
                for doc in reader.doc_ids_alive() {
                    ips.extend(ff_reader.values_for_doc(doc));
                }
            }
        }

        // Only full documents have an ip, so id-only documents are left out.
        let expected_ips = expected_ids_and_num_occurrences
            .keys()
            .flat_map(|id| {
                if !id_is_full_doc(*id) {
                    None
                } else {
                    Some(Ipv6Addr::from_u128(*id as u128))
                }
            })
            .collect::<HashSet<_>>();
        assert_eq!(ips, expected_ips);

        // NOTE(review): the remainder of this section repeats the check just above on the
        // same "ips" column; the only difference is `filter_map` instead of `flat_map`.
        let expected_ips = expected_ids_and_num_occurrences
            .keys()
            .filter_map(|id| {
                if !id_is_full_doc(*id) {
                    None
                } else {
                    Some(Ipv6Addr::from_u128(*id as u128))
                }
            })
            .collect::<HashSet<_>>();

        let mut ips: HashSet<Ipv6Addr> = Default::default();
        for reader in searcher.segment_readers() {
            if let Some(ff_reader) = reader.fast_fields().column_opt::<Ipv6Addr>("ips").unwrap() {
                for doc in reader.doc_ids_alive() {
                    ips.extend(ff_reader.values_for_doc(doc));
                }
            }
        }
        assert_eq!(ips, expected_ips);

        // multivalue fast field tests
        for segment_reader in searcher.segment_readers().iter() {
            let id_reader = segment_reader.fast_fields().u64("id").unwrap();
            let ff_reader = segment_reader
                .fast_fields()
                .column_opt("multi_numbers")
                .unwrap()
                .unwrap();
            let bool_ff_reader = segment_reader
                .fast_fields()
                .column_opt::<bool>("multi_bools")
                .unwrap()
                .unwrap();
            for doc in segment_reader.doc_ids_alive() {
                let id = id_reader.first(doc).unwrap();

                // Full documents store the id twice in `multi_numbers`; id-only ones store nothing.
                let vals: Vec<u64> = ff_reader.values_for_doc(doc).collect();
                if id_is_full_doc(id) {
                    assert_eq!(vals.len(), 2);
                    assert_eq!(vals[0], vals[1]);
                    assert!(expected_ids_and_num_occurrences.contains_key(&vals[0]));
                    assert_eq!(id_reader.first(doc), Some(vals[0]));
                } else {
                    assert_eq!(vals.len(), 0);
                }

                // Full documents store a bool and its negation in `multi_bools`.
                let bool_vals: Vec<bool> = bool_ff_reader.values_for_doc(doc).collect();
                if id_is_full_doc(id) {
                    assert_eq!(bool_vals.len(), 2);
                    assert_ne!(bool_vals[0], bool_vals[1]);
                } else {
                    assert_eq!(bool_vals.len(), 0);
                }
            }
        }

        // doc store tests
        for segment_reader in searcher.segment_readers().iter() {
            let store_reader = segment_reader
                .get_store_reader(DOCSTORE_CACHE_CAPACITY)
                .unwrap();
            // test store iterator
            for doc in store_reader.iter::<TantivyDocument>(segment_reader.alive_bitset()) {
                let id = doc
                    .unwrap()
                    .get_first(id_field)
                    .unwrap()
                    .as_value()
                    .as_u64()
                    .unwrap();
                assert!(expected_ids_and_num_occurrences.contains_key(&id));
            }
            // test store random access
            for doc_id in segment_reader.doc_ids_alive() {
                let id = store_reader
                    .get::<TantivyDocument>(doc_id)
                    .unwrap()
                    .get_first(id_field)
                    .unwrap()
                    .as_u64()
                    .unwrap();
                assert!(expected_ids_and_num_occurrences.contains_key(&id));
                if id_is_full_doc(id) {
                    // The stored `multi_numbers` value must equal the stored id.
                    let id2 = store_reader
                        .get::<TantivyDocument>(doc_id)
                        .unwrap()
                        .get_first(multi_numbers)
                        .unwrap()
                        .as_u64()
                        .unwrap();
                    assert_eq!(id, id2);
                    let bool = store_reader
                        .get::<TantivyDocument>(doc_id)
                        .unwrap()
                        .get_first(bool_field)
                        .unwrap()
                        .as_bool()
                        .unwrap();
                    // Stored `multi_bools` holds exactly the `bool` value followed by its negation.
                    let doc = store_reader.get::<TantivyDocument>(doc_id).unwrap();
                    let mut bool2 = doc.get_all(multi_bools);
                    assert_eq!(bool, bool2.next().unwrap().as_bool().unwrap());
                    assert_ne!(bool, bool2.next().unwrap().as_bool().unwrap());
                    assert!(bool2.next().is_none())
                }
            }
        }
        // test search
        // Parses `term` against `field` and returns the addresses of up to 1000 hits.
        let do_search = |term: &str, field| {
            let query = QueryParser::for_index(&index, vec![field])
                .parse_query(term)
                .unwrap();
            let top_docs: Vec<(f32, DocAddress)> = searcher
                .search(&query, &TopDocs::with_limit(1000).order_by_score())
                .unwrap();

            top_docs.iter().map(|el| el.1).collect::<Vec<_>>()
        };
        // Parses `term` against `field` and returns the number of hits.
        let count_search = |term: &str, field| {
            let query = QueryParser::for_index(&index, vec![field])
                .parse_query(term)
                .unwrap();
            searcher.search(&query, &Count).unwrap()
        };

        // Counts the hits of a plain term query, bypassing the query parser.
        let count_search2 = |term: Term| {
            let query = TermQuery::new(term, IndexRecordOption::Basic);
            searcher.search(&query, &Count).unwrap()
        };

        // Every id that should exist is found the expected number of times.
        for (id, count) in &expected_ids_and_num_occurrences {
            let (existing_id, count) = (*id, *count);
            let get_num_hits = |field| count_search(&existing_id.to_string(), field) as u64;
            assert_eq!(get_num_hits(id_field), count);
            // Id-only documents have none of the fields queried below.
            if !id_is_full_doc(existing_id) {
                continue;
            }
            assert_eq!(get_num_hits(text_field), count);
            assert_eq!(get_num_hits(i64_field), count);
            assert_eq!(get_num_hits(f64_field), count);

            // Test multi text
            // Skipped for large indexes: `do_search` returns at most 1000 hits.
            if num_docs_with_values < 1000 {
                assert_eq!(
                    do_search("\"test1 test2\"", multi_text_fields).len(),
                    num_docs_with_values
                );
                assert_eq!(
                    do_search("\"test2 test3\"", multi_text_fields).len(),
                    num_docs_with_values
                );
            }

            // Test bytes
            let term = Term::from_field_bytes(bytes_field, existing_id.to_le_bytes().as_slice());
            assert_eq!(count_search2(term) as u64, count);

            // Test date
            let term = Term::from_field_date(
                date_field,
                DateTime::from_timestamp_secs(existing_id as i64),
            );
            assert_eq!(count_search2(term) as u64, count);
        }
        // Deleted ids must not be found through any field.
        for deleted_id in deleted_ids {
            let assert_field = |field| {
                assert_eq!(count_search(&deleted_id.to_string(), field) as u64, 0);
            };
            assert_field(text_field);
            assert_field(f64_field);
            assert_field(i64_field);
            assert_field(id_field);

            // Test bytes
            let term = Term::from_field_bytes(bytes_field, deleted_id.to_le_bytes().as_slice());
            assert_eq!(count_search2(term), 0);

            // Test date
            let term =
                Term::from_field_date(date_field, DateTime::from_timestamp_secs(deleted_id as i64));
            assert_eq!(count_search2(term), 0);
        }
        // search ip address
        //
        for (existing_id, count) in &expected_ids_and_num_occurrences {
            let (existing_id, count) = (*existing_id, *count);
            if !id_is_full_doc(existing_id) {
                continue;
            }
            let do_search_ip_field = |term: &str| count_search(term, ip_field) as u64;
            let ip_addr = Ipv6Addr::from_u128(existing_id as u128);
            // Test incoming ip as ipv6
            assert_eq!(do_search_ip_field(&format!("\"{ip_addr}\"")), count);

            let term = Term::from_field_ip_addr(ip_field, ip_addr);
            assert_eq!(count_search2(term) as u64, count);

            // Test incoming ip as ipv4
            if let Some(ip_addr) = ip_addr.to_ipv4_mapped() {
                assert_eq!(do_search_ip_field(&format!("\"{ip_addr}\"")), count);
            }
        }

        // Range query
        //
        // The expected ids, sorted, are split into a lower and an upper half; each half
        // is queried with an inclusive range spanning its smallest and largest id.
        let mut sample: Vec<_> = expected_ids_and_num_occurrences.iter().collect();
        sample.sort_by_key(|(k, _num_occurrences)| *k);
        // sample.truncate(sample.len() / 2);
        if !sample.is_empty() {
            let (left_sample, right_sample) = sample.split_at(sample.len() / 2);

            // Number of full documents in a sample; only those carry the queried fields.
            let calc_expected_count = |sample: &[(&u64, &u64)]| {
                sample
                    .iter()
                    .filter(|(id, _)| id_is_full_doc(**id))
                    .map(|(_id, num_occurrences)| **num_occurrences)
                    .sum::<u64>()
            };
            // Formats an inclusive range query `field:[from TO to]`.
            fn gen_query_inclusive<T1: ToString, T2: ToString>(
                field: &str,
                from: T1,
                to: T2,
            ) -> String {
                format!("{}:[{} TO {}]", field, &from.to_string(), &to.to_string())
            }

            // Query first half
            let expected_count = calc_expected_count(left_sample);
            if !left_sample.is_empty() && expected_count < 1000 {
                let start_range = *left_sample[0].0;
                let end_range = *left_sample.last().unwrap().0;
                let query = gen_query_inclusive("id_opt", start_range, end_range);
                assert_eq!(count_search(&query, id_opt_field) as u64, expected_count);

                // Range query on ip field
                let ip1 = ip_from_id(start_range);
                let ip2 = ip_from_id(end_range);
                let do_search_ip_field = |term: &str| count_search(term, ip_field) as u64;
                let query = gen_query_inclusive("ip", ip1, ip2);
                assert_eq!(do_search_ip_field(&query), expected_count);
                // Open lower bound: the lower half holds the smallest ids.
                let query = gen_query_inclusive("ip", "*", ip2);
                assert_eq!(do_search_ip_field(&query), expected_count);
                // Range query on multi value field
                let query = gen_query_inclusive("ips", ip1, ip2);
                assert_eq!(do_search_ip_field(&query), expected_count);
                let query = gen_query_inclusive("ips", "*", ip2);
                assert_eq!(do_search_ip_field(&query), expected_count);
            }
            // Query second half
            let expected_count = calc_expected_count(right_sample);
            if !right_sample.is_empty() && expected_count < 1000 {
                let start_range = *right_sample[0].0;
                let end_range = *right_sample.last().unwrap().0;
                // Range query on id opt field
                let query =
                    gen_query_inclusive("id_opt", start_range.to_string(), end_range.to_string());
                assert_eq!(count_search(&query, id_opt_field) as u64, expected_count);

                // Range query on ip field
                let ip1 = ip_from_id(start_range);
                let ip2 = ip_from_id(end_range);
                let do_search_ip_field = |term: &str| count_search(term, ip_field) as u64;
                let query = gen_query_inclusive("ip", ip1, ip2);
                assert_eq!(do_search_ip_field(&query), expected_count);
                // Open upper bound: the upper half holds the largest ids.
                let query = gen_query_inclusive("ip", ip1, "*");
                assert_eq!(do_search_ip_field(&query), expected_count);
                // Range query on multi value field
                let query = gen_query_inclusive("ips", ip1, ip2);
                assert_eq!(do_search_ip_field(&query), expected_count);
                let query = gen_query_inclusive("ips", ip1, "*");
                assert_eq!(do_search_ip_field(&query), expected_count);
            }
        }

        // ip range query on fast field
        //
        // Single-point ranges `[ip TO ip]` for up to ten of the expected ids.
        for (existing_id, count) in expected_ids_and_num_occurrences.iter().take(10) {
            let (existing_id, count) = (*existing_id, *count);
            if !id_is_full_doc(existing_id) {
                continue;
            }
            let gen_query_inclusive = |field: &str, from: Ipv6Addr, to: Ipv6Addr| {
                format!("{}:[{} TO {}]", field, &from.to_string(), &to.to_string())
            };
            let ip = ip_from_id(existing_id);

            let do_search_ip_field = |term: &str| count_search(term, ip_field) as u64;
            // Range query on single value field
            let query = gen_query_inclusive("ip", ip, ip);
            assert_eq!(do_search_ip_field(&query), count);

            // Range query on multi value field
            let query = gen_query_inclusive("ips", ip, ip);
            assert_eq!(do_search_ip_field(&query), count);
        }

        // test facets
        for segment_reader in searcher.segment_readers().iter() {
            let facet_reader = segment_reader.facet_reader("facet").unwrap();
            let ff_reader = segment_reader
                .fast_fields()
                .u64("id")
                .unwrap()
                .first_or_default_col(9999);
            for doc_id in segment_reader.doc_ids_alive() {
                let id = ff_reader.get_val(doc_id);
                if !id_is_full_doc(id) {
                    continue;
                }
                // Each full document has exactly one facet, `/cola/<id>`.
                let facet_ords: Vec<u64> = facet_reader.facet_ords(doc_id).collect();
                assert_eq!(facet_ords.len(), 1);
                let mut facet = Facet::default();
                facet_reader
                    .facet_from_ord(facet_ords[0], &mut facet)
                    .unwrap();
                let facet_expected = Facet::from(&("/cola/".to_string() + &id.to_string()));

                assert_eq!(facet, facet_expected);
            }
        }

        Ok(index)
    }

    /// Runs the full operation check on one `IndexingOp::add` per id in `0..1000`,
    /// with the final forced merge enabled.
    #[test]
    fn test_fast_field_range() {
        let ops: Vec<_> = (0..1000).map(IndexingOp::add).collect();
        // `unwrap` rather than `assert!(..is_ok())` so that a failure reports the error.
        test_operation_strategy(&ops, true).unwrap();
    }

    /// Fixed scenario: two commits (the second with a duplicated id) followed by an
    /// explicit merge, without the final forced merge.
    #[test]
    fn test_ip_range_query_multivalue_bug() {
        let ops = [
            IndexingOp::add(2),
            IndexingOp::Commit,
            IndexingOp::add(1),
            IndexingOp::add(1),
            IndexingOp::Commit,
            IndexingOp::Merge,
        ];
        // `unwrap` rather than `assert!(..is_ok())` so that a failure reports the error.
        test_operation_strategy(&ops, false).unwrap();
    }

    /// Fixed scenario: a delete-by-query of an id committed earlier, spread over two
    /// commits, with the final forced merge enabled.
    #[test]
    fn test_ff_num_ips_regression() {
        let ops = [
            IndexingOp::add(13),
            IndexingOp::add(1),
            IndexingOp::Commit,
            IndexingOp::DeleteDocQuery { id: 13 },
            IndexingOp::add(1),
            IndexingOp::Commit,
        ];
        // `unwrap` rather than `assert!(..is_ok())` so that a failure reports the error.
        test_operation_strategy(&ops, true).unwrap();
    }

    /// Minimal scenario: two adds and nothing else.
    ///
    /// NOTE(review): the name mentions a forced end merge, yet `force_end_merge` is
    /// passed as `false` - confirm which of the two is intended.
    #[test]
    fn test_minimal_sort_force_end_merge() {
        let ops = [IndexingOp::add(23), IndexingOp::add(13)];
        // `unwrap` rather than `assert!(..is_ok())` so that a failure reports the error.
        test_operation_strategy(&ops, false).unwrap();
    }

    /// Minimal scenario: two adds followed by a term delete of the second id,
    /// without the final forced merge.
    #[test]
    fn test_minimal_no_force_end_merge() {
        let ops = [
            IndexingOp::add(23),
            IndexingOp::add(13),
            IndexingOp::DeleteDoc { id: 13 },
        ];
        // `unwrap` rather than `assert!(..is_ok())` so that a failure reports the error.
        test_operation_strategy(&ops, false).unwrap();
    }

    use proptest::prelude::*;

    // Property tests: random operation sequences from both strategies, each run with and
    // without the final forced merge. Results are unwrapped rather than checked with
    // `assert!(..is_ok())` so that a failing case reports the underlying error.
    proptest! {

        #![proptest_config(ProptestConfig::with_cases(20))]
        #[test]
        fn test_delete_proptest_adding(ops in proptest::collection::vec(adding_operation_strategy(), 1..100)) {
            test_operation_strategy(&ops[..], false).unwrap();
        }

        #[test]
        fn test_delete_proptest_with_merge_adding(ops in proptest::collection::vec(adding_operation_strategy(), 1..100)) {
            test_operation_strategy(&ops[..], true).unwrap();
        }

        #[test]
        fn test_delete_proptest(ops in proptest::collection::vec(balanced_operation_strategy(), 1..10)) {
            test_operation_strategy(&ops[..], false).unwrap();
        }

        #[test]
        fn test_delete_proptest_with_merge(ops in proptest::collection::vec(balanced_operation_strategy(), 1..100)) {
            test_operation_strategy(&ops[..], true).unwrap();
        }
    }

    /// Fixed scenario: adds, a term delete, commits and an explicit merge, followed by
    /// one more add and commit; run with the final forced merge enabled.
    #[test]
    fn test_delete_bug_reproduction_ip_addr() {
        let scenario = [
            IndexingOp::add(1),
            IndexingOp::add(2),
            IndexingOp::Commit,
            IndexingOp::add(3),
            IndexingOp::DeleteDoc { id: 1 },
            IndexingOp::Commit,
            IndexingOp::Merge,
            IndexingOp::add(4),
            IndexingOp::Commit,
        ];
        test_operation_strategy(&scenario, true).unwrap();
    }

    /// Fixed scenario: two single-document commits followed by an explicit merge,
    /// run with the final forced merge enabled.
    #[test]
    fn test_merge_regression_1() {
        let scenario = [
            IndexingOp::add(15),
            IndexingOp::Commit,
            IndexingOp::add(9),
            IndexingOp::Commit,
            IndexingOp::Merge,
        ];
        test_operation_strategy(&scenario, true).unwrap();
    }

    /// Fixed scenario: three adds (one of them with id 0) and a commit, run with the
    /// final forced merge enabled.
    #[test]
    fn test_range_query_bug_1() {
        let scenario = [
            IndexingOp::add(9),
            IndexingOp::add(0),
            IndexingOp::add(13),
            IndexingOp::Commit,
        ];
        test_operation_strategy(&scenario, true).unwrap();
    }

    /// Fixed scenario: four adds with no explicit commit or merge, run without the
    /// final forced merge.
    #[test]
    fn test_range_query_bug_2() {
        let scenario = [
            IndexingOp::add(3),
            IndexingOp::add(6),
            IndexingOp::add(9),
            IndexingOp::add(10),
        ];
        test_operation_strategy(&scenario, false).unwrap();
    }

    /// Adding and committing a document that leaves out a field declared in the schema
    /// must succeed.
    #[test]
    fn test_index_doc_missing_field() -> crate::Result<()> {
        let mut builder = schema::Schema::builder();
        let id_field = builder.add_text_field("id", STRING);
        // Declared in the schema but never set on the document.
        builder.add_text_field("optfield", STRING);
        let schema = builder.build();
        let index = Index::create_in_ram(schema);

        let mut writer = index.writer_for_tests()?;
        writer.add_document(doc!(id_field => "myid"))?;
        writer.commit()?;
        Ok(())
    }

    /// Fixed scenario: deletes of ids that were never added, around a single add,
    /// followed by commits and an explicit merge; no final forced merge.
    #[test]
    fn test_bug_1617_3() {
        let ops = [
            IndexingOp::DeleteDoc { id: 0 },
            IndexingOp::add(6),
            IndexingOp::DeleteDocQuery { id: 11 },
            IndexingOp::Commit,
            IndexingOp::Merge,
            IndexingOp::Commit,
            IndexingOp::Commit,
        ];
        // `unwrap` rather than `assert!(..is_ok())` so that a failure reports the error.
        test_operation_strategy(&ops, false).unwrap();
    }

    /// Fixed scenario: a document is added and deleted within the same commit, then a
    /// second document is committed and the segments are merged; run with the final
    /// forced merge enabled.
    #[test]
    fn test_bug_1617_2() {
        let scenario = [
            IndexingOp::AddDoc {
                id: 13,
                value: Default::default(),
            },
            IndexingOp::DeleteDoc { id: 13 },
            IndexingOp::Commit,
            IndexingOp::add(30),
            IndexingOp::Commit,
            IndexingOp::Merge,
        ];
        test_operation_strategy(&scenario, true).unwrap();
    }

    /// Adds two documents, deletes one of them by term within the same commit, merges
    /// the searchable segments and checks that a term query for the surviving id still
    /// returns exactly one hit.
    #[test]
    fn test_bug_1617() -> crate::Result<()> {
        let mut schema_builder = schema::Schema::builder();
        let id_field = schema_builder.add_u64_field("id", INDEXED);
        let index = Index::builder()
            .schema(schema_builder.build())
            .create_in_ram()?;

        let mut writer = index.writer_for_tests()?;
        writer.set_merge_policy(Box::new(NoMergePolicy));

        let kept_id = 16u64;
        let removed_id = 13u64;
        writer.add_document(doc!(id_field => kept_id))?;
        writer.add_document(doc!(id_field => removed_id))?;
        writer.delete_term(Term::from_field_u64(id_field, removed_id));
        writer.commit()?;

        // Merge all searchable segments with a second writer.
        {
            assert!(writer.wait_merging_threads().is_ok());
            let mut merge_writer: IndexWriter = index.writer_for_tests()?;
            let segment_ids = index
                .searchable_segment_ids()
                .expect("Searchable segments failed.");
            merge_writer.merge(&segment_ids).wait().unwrap();
            assert!(merge_writer.wait_merging_threads().is_ok());
        }

        let searcher = index.reader()?.searcher();
        let kept_query = TermQuery::new(
            Term::from_field_u64(id_field, kept_id),
            IndexRecordOption::Basic,
        );
        let hits: Vec<(f32, DocAddress)> = searcher
            .search(&kept_query, &TopDocs::with_limit(10).order_by_score())
            .unwrap();

        assert_eq!(hits.len(), 1); // Was failing

        Ok(())
    }

    /// Regression test for bug 1618: both `i64` values must remain searchable
    /// by term after the segments have been merged.
    #[test]
    fn test_bug_1618() -> crate::Result<()> {
        let mut schema_builder = schema::Schema::builder();
        let id_field = schema_builder.add_i64_field("id", INDEXED);
        let index = Index::builder()
            .schema(schema_builder.build())
            .create_in_ram()?;

        let mut index_writer = index.writer_for_tests()?;
        index_writer.set_merge_policy(Box::new(NoMergePolicy));

        index_writer.add_document(doc!(id_field => 10i64))?;
        index_writer.add_document(doc!(id_field => 30i64))?;
        index_writer.commit()?;

        // Merge: shut the first writer down, then merge every searchable
        // segment through a fresh writer.
        assert!(index_writer.wait_merging_threads().is_ok());
        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            let segment_ids = index
                .searchable_segment_ids()
                .expect("Searchable segments failed.");
            index_writer.merge(&segment_ids).wait().unwrap();
            assert!(index_writer.wait_merging_threads().is_ok());
        }

        let searcher = index.reader()?.searcher();
        // Runs a term query for `value` and returns the (at most 10) hits.
        let hits_for = |value: i64| -> Vec<(f32, DocAddress)> {
            let query = TermQuery::new(
                Term::from_field_i64(id_field, value),
                IndexRecordOption::Basic,
            );
            searcher
                .search(&query, &TopDocs::with_limit(10).order_by_score())
                .unwrap()
        };

        // Both lookups were annotated as failing in the original test.
        assert_eq!(hits_for(10i64).len(), 1);
        assert_eq!(hits_for(30i64).len(), 1);

        Ok(())
    }

    /// Regression test for bug 2442: JSON keys starting with a NUL character
    /// or a space must be accepted by a `FAST | TEXT` JSON field.
    #[test]
    fn test_bug_2442_reserved_character_fast_field() -> crate::Result<()> {
        let mut schema_builder = schema::Schema::builder();
        let json_field = schema_builder.add_json_field("json", FAST | TEXT);
        let index = Index::builder()
            .schema(schema_builder.build())
            .create_in_ram()?;

        let mut index_writer = index.writer_for_tests()?;
        index_writer.set_merge_policy(Box::new(NoMergePolicy));

        let json_values = [json!({"\u{0000}B":"1"}), json!({" A":"1"})];
        for json_value in json_values {
            index_writer
                .add_document(doc!(json_field => json_value))
                .unwrap();
        }
        index_writer.commit()?;

        Ok(())
    }

    /// Regression test for bug 2442: JSON keys made only of NUL characters
    /// must be accepted by a fast JSON field with dot expansion enabled.
    #[test]
    fn test_bug_2442_reserved_character_columnar() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let json_options = JsonObjectOptions::from(FAST).set_expand_dots_enabled();
        let json_field = builder.add_json_field("json", json_options);
        let index = Index::create_in_ram(builder.build());

        let mut writer = index.writer_for_tests().unwrap();
        let single_nul_key = doc!(json_field => json!({"\u{0000}": "A"}));
        writer.add_document(single_nul_key).unwrap();
        let double_nul_key = doc!(json_field => json!({format!("\u{0000}\u{0000}"): "A"}));
        writer.add_document(double_nul_key).unwrap();
        writer.commit().unwrap();
        Ok(())
    }

    /// `writer_with_options` must reject invalid options with
    /// `TantivyError::InvalidArgument`: zero worker threads, a per-thread
    /// memory budget that is too small, and one that is too large.
    #[test]
    fn test_writer_options_validation() {
        let mut schema_builder = Schema::builder();
        let _field = schema_builder.add_bool_field("example", STORED);
        let index = Index::create_in_ram(schema_builder.build());

        // No worker thread at all.
        let zero_threads = IndexWriterOptions::builder().num_worker_threads(0).build();
        let result = index.writer_with_options::<TantivyDocument>(zero_threads);
        assert!(result.is_err(), "Writer should reject 0 thread count");
        assert!(matches!(result, Err(TantivyError::InvalidArgument(_))));

        // 10 KiB per thread.
        let budget_too_low = IndexWriterOptions::builder()
            .memory_budget_per_thread(10 << 10)
            .build();
        let result = index.writer_with_options::<TantivyDocument>(budget_too_low);
        assert!(
            result.is_err(),
            "Writer should reject options with too low memory size"
        );
        assert!(matches!(result, Err(TantivyError::InvalidArgument(_))));

        // 5 GiB per thread.
        let budget_too_high = IndexWriterOptions::builder()
            .memory_budget_per_thread(5 << 30)
            .build();
        let result = index.writer_with_options::<TantivyDocument>(budget_too_high);
        assert!(
            result.is_err(),
            "Writer should reject options with too high memory size"
        );
        assert!(matches!(result, Err(TantivyError::InvalidArgument(_))));
    }
}


================================================
FILE: src/indexer/index_writer_status.rs
================================================
use std::sync::atomic::{AtomicBool, Ordering};
use std::sync::{Arc, RwLock};

use super::AddBatchReceiver;
use crate::schema::document::Document;
use crate::TantivyDocument;

/// Handle on the shared liveness state of an index writer.
///
/// The state lives behind an `Arc`, so cloning the handle yields another
/// view on the same state. Note that `#[derive(Clone)]` only implements
/// `Clone` when `D: Clone`.
#[derive(Clone)]
pub(crate) struct IndexWriterStatus<D: Document = TantivyDocument> {
    /// State shared with the bombs created through `create_bomb`.
    inner: Arc<Inner<D>>,
}

impl<D: Document> IndexWriterStatus<D> {
    /// Tells whether the index writer is still alive, i.e. has not been killed.
    pub fn is_alive(&self) -> bool {
        self.inner.is_alive()
    }

    /// Hands out a clone of the operation receiver.
    ///
    /// Returns `None` once the index writer has been killed.
    pub fn operation_receiver(&self) -> Option<AddBatchReceiver<D>> {
        let receiver_guard = self
            .inner
            .receive_channel
            .read()
            .expect("This lock should never be poisoned");
        (*receiver_guard).clone()
    }

    /// Creates an index writer bomb bound to this status.
    ///
    /// Dropping the bomb without defusing it kills the index writer status.
    pub(crate) fn create_bomb(&self) -> IndexWriterBomb<D> {
        let shared_state = Arc::clone(&self.inner);
        IndexWriterBomb {
            inner: Some(shared_state),
        }
    }
}

/// State shared between an `IndexWriterStatus` and its bombs.
struct Inner<D: Document> {
    /// `true` until `kill` is called.
    is_alive: AtomicBool,
    /// Receiving end of the operation channel; emptied (`None`) by `kill`.
    receive_channel: RwLock<Option<AddBatchReceiver<D>>>,
}

impl<D: Document> Inner<D> {
    /// Reads the liveness flag.
    fn is_alive(&self) -> bool {
        self.is_alive.load(Ordering::Relaxed)
    }

    /// Marks the writer as dead and discards the stored operation receiver.
    fn kill(&self) {
        self.is_alive.store(false, Ordering::Relaxed);
        let mut receiver_slot = self
            .receive_channel
            .write()
            .expect("This lock should never be poisoned");
        // Overwriting the slot drops the receiver (if any) while the lock is held.
        *receiver_slot = None;
    }
}

impl<D: Document> From<AddBatchReceiver<D>> for IndexWriterStatus<D> {
    /// Builds the status of a live index writer that owns `receiver`.
    fn from(receiver: AddBatchReceiver<D>) -> Self {
        let initial_state = Inner {
            is_alive: AtomicBool::new(true),
            receive_channel: RwLock::new(Some(receiver)),
        };
        Self {
            inner: Arc::new(initial_state),
        }
    }
}

/// Guard that kills the index writer status when it is dropped.
///
/// To prevent this, clients can call `.defuse()`.
pub(crate) struct IndexWriterBomb<D: Document> {
    /// Shared state to kill on drop; `None` once the bomb has been defused
    /// or has already gone off.
    inner: Option<Arc<Inner<D>>>,
}

impl<D: Document> IndexWriterBomb<D> {
    /// Defuses the bomb.
    ///
    /// Consuming the bomb through this method is the only way to get rid of
    /// it without killing the index writer.
    pub fn defuse(mut self) {
        // With the shared state released, `Drop` finds nothing left to kill.
        drop(self.inner.take());
    }
}

impl<D: Document> Drop for IndexWriterBomb<D> {
    /// Kills the index writer status unless the bomb was defused beforehand.
    fn drop(&mut self) {
        let armed_state = self.inner.take();
        if let Some(shared_state) = armed_state {
            shared_state.kill();
        }
    }
}

#[cfg(test)]
mod tests {
    use std::mem;

    use crossbeam_channel as channel;

    use super::IndexWriterStatus;

    /// Dropping an armed bomb removes the operation receiver.
    #[test]
    fn test_bomb_goes_boom() {
        let (_sender, receiver) = channel::bounded(10);
        let index_writer_status: IndexWriterStatus = IndexWriterStatus::from(receiver);
        assert!(index_writer_status.operation_receiver().is_some());

        // Merely creating the bomb has no effect on the receiver...
        let bomb = index_writer_status.create_bomb();
        assert!(index_writer_status.operation_receiver().is_some());

        // ... but dropping it does: boom!
        mem::drop(bomb);
        assert!(index_writer_status.operation_receiver().is_none());
    }

    /// A defused bomb leaves the operation receiver in place.
    #[test]
    fn test_bomb_defused() {
        let (_sender, receiver) = channel::bounded(10);
        let index_writer_status: IndexWriterStatus = IndexWriterStatus::from(receiver);
        assert!(index_writer_status.operation_receiver().is_some());

        index_writer_status.create_bomb().defuse();
        assert!(index_writer_status.operation_receiver().is_some());
    }
}


================================================
FILE: src/indexer/indexing_term.rs
================================================
use std::net::Ipv6Addr;

use columnar::MonotonicallyMappableToU128;

use crate::fastfield::FastValue;
use crate::schema::Field;

/// IndexingTerm is used to represent a term during indexing.
/// It's a serialized representation over field and value.
///
/// It wraps a byte buffer `B` (a `Vec<u8>` by default). The first 4 bytes
/// are the big endian encoded field id; the value bytes follow.
///
/// We serialize the field, because we index everything in a single
/// global term dictionary during indexing.
#[derive(Clone)]
pub(crate) struct IndexingTerm<B = Vec<u8>>(B)
where B: AsRef<[u8]>;

/// The number of bytes used as metadata by `IndexingTerm`:
/// the 4-byte field id stored in front of the value bytes.
const TERM_METADATA_LENGTH: usize = 4;

impl IndexingTerm {
    /// Creates an empty term whose buffer has room for the field id plus
    /// `capacity` value bytes.
    ///
    /// The field id bytes are zero-initialized; use [`Self::set_field`] to set them.
    pub fn with_capacity(capacity: usize) -> IndexingTerm {
        let mut data = Vec::with_capacity(TERM_METADATA_LENGTH + capacity);
        data.resize(TERM_METADATA_LENGTH, 0u8);
        IndexingTerm(data)
    }

    /// Sets the field of an empty term.
    ///
    /// The field id is written as 4 big endian bytes at the start of the buffer.
    ///
    /// # Panics
    ///
    /// Panics when the term is not empty, i.e. when some value bytes are set.
    /// Use [`Self::clear_with_field`] in that case.
    pub(crate) fn set_field(&mut self, field: Field) {
        assert!(self.is_empty());
        self.0[..TERM_METADATA_LENGTH].copy_from_slice(&field.field_id().to_be_bytes());
    }

    /// Is empty if there are no value bytes.
    pub fn is_empty(&self) -> bool {
        self.0.len() == TERM_METADATA_LENGTH
    }

    /// Removes the value bytes and sets the field.
    pub(crate) fn clear_with_field(&mut self, field: Field) {
        self.truncate_value_bytes(0);
        self.set_field(field);
    }

    /// Sets a u64 value in the term, replacing any existing value bytes.
    ///
    /// U64 are serialized using (8-byte) BigEndian
    /// representation.
    /// The use of BigEndian has the benefit of preserving
    /// the natural order of the values.
    pub fn set_u64(&mut self, val: u64) {
        self.set_fast_value(val);
    }

    /// Sets a `i64` value in the term, replacing any existing value bytes.
    pub fn set_i64(&mut self, val: i64) {
        self.set_fast_value(val);
    }

    /// Sets a `f64` value in the term, replacing any existing value bytes.
    pub fn set_f64(&mut self, val: f64) {
        self.set_fast_value(val);
    }

    /// Sets a `bool` value in the term, replacing any existing value bytes.
    pub fn set_bool(&mut self, val: bool) {
        self.set_fast_value(val);
    }

    /// Replaces the value bytes with the 8-byte big endian encoding of
    /// `val.to_u64()`.
    fn set_fast_value<T: FastValue>(&mut self, val: T) {
        self.set_bytes(&val.to_u64().to_be_bytes());
    }

    /// Append a type marker + fast value to a term.
    /// This is used in JSON type to append a fast value after the path.
    ///
    /// It will not clear existing bytes.
    pub fn append_type_and_fast_value<T: FastValue>(&mut self, val: T) {
        self.0.push(T::to_type().to_code());
        self.0.extend_from_slice(&val.to_u64().to_be_bytes());
    }

    /// Sets a `Ipv6Addr` value in the term, replacing any existing value bytes.
    ///
    /// The address is stored as the 16-byte big endian encoding of `val.to_u128()`.
    pub fn set_ip_addr(&mut self, val: Ipv6Addr) {
        self.set_bytes(&val.to_u128().to_be_bytes());
    }

    /// Replaces the value bytes of the term with `bytes`.
    ///
    /// The field is left untouched.
    pub fn set_bytes(&mut self, bytes: &[u8]) {
        self.truncate_value_bytes(0);
        self.0.extend_from_slice(bytes);
    }

    /// Truncates the value bytes of the term to at most `len` bytes.
    /// The field stays the same.
    pub fn truncate_value_bytes(&mut self, len: usize) {
        self.0.truncate(len + TERM_METADATA_LENGTH);
    }

    /// The number of value bytes (the field id is not counted).
    pub fn len_bytes(&self) -> usize {
        self.0.len() - TERM_METADATA_LENGTH
    }

    /// Appends value bytes to the Term.
    ///
    /// This function returns the segment that has just been added.
    #[inline]
    pub fn append_bytes(&mut self, bytes: &[u8]) -> &mut [u8] {
        let len_before = self.0.len();
        self.0.extend_from_slice(bytes);
        &mut self.0[len_before..]
    }
}

impl<B> IndexingTerm<B>
where B: AsRef<[u8]>
{
    /// Wraps serialized term bytes.
    ///
    /// The input buffer is expected to be the concatenation of the big endian encoded field id
    /// followed by the serialized value bytes (type tag + payload).
    #[inline]
    pub fn wrap(serialized_term: B) -> IndexingTerm<B> {
        debug_assert!(serialized_term.as_ref().len() >= TERM_METADATA_LENGTH);
        IndexingTerm(serialized_term)
    }

    /// Returns the field this term belongs to.
    #[inline]
    pub fn field(&self) -> Field {
        let field_id_bytes: [u8; 4] = self.0.as_ref()[..4].try_into().unwrap();
        Field::from_field_id(u32::from_be_bytes(field_id_bytes))
    }

    /// Returns the serialized representation of Term.
    /// This includes field_id, value type and value.
    ///
    /// Do NOT rely on this byte representation in the index.
    /// This value is likely to change in the future.
    #[inline]
    pub fn serialized_term(&self) -> &[u8] {
        self.0.as_ref()
    }
}

#[cfg(test)]
mod tests {

    use super::IndexingTerm;
    use crate::schema::*;

    /// Builds an empty term that is already bound to `field`.
    fn empty_term_for(field: Field) -> IndexingTerm {
        let mut term = IndexingTerm::with_capacity(0);
        term.set_field(field);
        term
    }

    #[test]
    pub fn test_term_str() {
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("text", STRING);
        // Second field of the schema: its id is expected to serialize as `00 00 00 01`.
        let title_field = schema_builder.add_text_field("title", STRING);
        let mut title_term = empty_term_for(title_field);
        title_term.set_bytes(b"test");
        assert_eq!(title_term.field(), title_field);
        assert_eq!(
            title_term.serialized_term(),
            b"\x00\x00\x00\x01test".to_vec()
        );
    }

    /// Size (in bytes) of the serialized buffer of a fast value term as built
    /// by the `set_*` methods exercised below: <field> + <value>
    ///
    /// - <field> is a big endian encoded u32 field id (4 bytes)
    /// - <value> is the 8-byte big endian encoding of the value mapped to a u64
    const FAST_VALUE_TERM_LEN: usize = 4 + 8;

    #[test]
    pub fn test_term_u64() {
        let mut schema_builder = Schema::builder();
        let count_field = schema_builder.add_u64_field("count", INDEXED);
        let mut count_term = empty_term_for(count_field);
        count_term.set_u64(983u64);
        assert_eq!(count_term.field(), count_field);
        assert_eq!(count_term.serialized_term().len(), FAST_VALUE_TERM_LEN);
    }

    #[test]
    pub fn test_term_bool() {
        let mut schema_builder = Schema::builder();
        let bool_field = schema_builder.add_bool_field("bool", INDEXED);
        let mut bool_term = empty_term_for(bool_field);
        bool_term.set_bool(true);
        assert_eq!(bool_term.field(), bool_field);
        assert_eq!(bool_term.serialized_term().len(), FAST_VALUE_TERM_LEN);
    }

    #[test]
    pub fn indexing_term_wrap_extracts_field() {
        let field = Field::from_field_id(7u32);
        let mut owned_term = empty_term_for(field);
        owned_term.append_bytes(b"abc");

        // Wrapping the borrowed bytes must expose the same field and bytes.
        let borrowed_term = IndexingTerm::wrap(owned_term.serialized_term());
        assert_eq!(borrowed_term.field(), field);
        assert_eq!(
            borrowed_term.serialized_term(),
            owned_term.serialized_term()
        );
    }
}


================================================
FILE: src/indexer/log_merge_policy.rs
================================================
use std::cmp;

use itertools::Itertools;

use super::merge_policy::{MergeCandidate, MergePolicy};
use crate::index::SegmentMeta;

// Values used by `LogMergePolicy::default()`.

// Default for `level_log_size` (see `set_level_log_size`).
const DEFAULT_LEVEL_LOG_SIZE: f64 = 0.75;
// Default for `min_layer_size` (see `set_min_layer_size`).
const DEFAULT_MIN_LAYER_SIZE: u32 = 10_000;
// Default for `min_num_segments` (see `set_min_num_segments`).
const DEFAULT_MIN_NUM_SEGMENTS_IN_MERGE: usize = 8;
// Default for `max_docs_before_merge` (see `set_max_docs_before_merge`).
const DEFAULT_MAX_DOCS_BEFORE_MERGE: usize = 10_000_000;
// The default value of 1 means that deletes are not taken in account when
// identifying merge candidates. This is not a very sensible default: it was
// set like that for backward compatibility and might change in the near future.
const DEFAULT_DEL_DOCS_RATIO_BEFORE_MERGE: f32 = 1.0f32;

/// `LogMergePolicy` tries to merge segments that have a similar number of
/// documents.
///
/// Segments are grouped in levels of exponentially growing sizes; a level is
/// proposed for merging when it holds at least `min_num_segments` segments, or
/// when one of its segments exceeds the tolerated ratio of deleted documents.
#[derive(Debug, Clone)]
pub struct LogMergePolicy {
    // Minimum number of segments in a level for it to be merged.
    min_num_segments: usize,
    // Segments with more documents than this are not considered for merging.
    max_docs_before_merge: usize,
    // Segments smaller than this are treated as if they had this size.
    min_layer_size: u32,
    // Width of a level, expressed in log2 of the number of documents.
    level_log_size: f64,
    // Ratio of deleted documents above which a segment triggers a merge of its level.
    del_docs_ratio_before_merge: f32,
}

impl LogMergePolicy {
    /// Raises `size` to `min_layer_size` when it is smaller than that.
    fn clip_min_size(&self, size: u32) -> u32 {
        cmp::max(size, self.min_layer_size)
    }

    /// Set the minimum number of segments that may be merged together.
    pub fn set_min_num_segments(&mut self, min_num_segments: usize) {
        self.min_num_segments = min_num_segments;
    }

    /// Set the maximum number of docs a segment may hold to still be considered
    /// for merging. Merging many smaller segments can nevertheless produce a
    /// segment holding more than max_docs documents.
    pub fn set_max_docs_before_merge(&mut self, max_docs_merge_size: usize) {
        self.max_docs_before_merge = max_docs_merge_size;
    }

    /// Set the minimum segment size: all segments below it belong
    /// to the same level.
    pub fn set_min_layer_size(&mut self, min_layer_size: u32) {
        self.min_layer_size = min_layer_size;
    }

    /// Set the ratio between two consecutive levels.
    ///
    /// Segments are grouped in levels according to their sizes, and the levels
    /// are intervals of exponentially growing sizes. `level_log_size` is the
    /// width of a level on the log2 scale of the number of documents: a
    /// segment opens a new level when its log2 size is more than
    /// `level_log_size` below the log2 size that opened the current level.
    pub fn set_level_log_size(&mut self, level_log_size: f64) {
        self.level_log_size = level_log_size;
    }

    /// Set the ratio of deleted documents in a segment to tolerate.
    ///
    /// As soon as one segment of a log level exceeds it, a merge
    /// is triggered for that level.
    ///
    /// When the level holds a single segment, this effectively expunges
    /// the deleted documents from it.
    ///
    /// # Panics
    ///
    /// Panics if del_docs_ratio_before_merge is not within (0..1].
    pub fn set_del_docs_ratio_before_merge(&mut self, del_docs_ratio_before_merge: f32) {
        assert!(del_docs_ratio_before_merge <= 1.0f32);
        assert!(del_docs_ratio_before_merge > 0f32);
        self.del_docs_ratio_before_merge = del_docs_ratio_before_merge;
    }

    /// Tells whether at least one segment of `level` has a ratio of deleted
    /// documents strictly above the configured threshold.
    fn has_segment_above_deletes_threshold(&self, level: &[&SegmentMeta]) -> bool {
        for segment in level {
            if deletes_ratio(segment) > self.del_docs_ratio_before_merge {
                return true;
            }
        }
        false
    }
}

/// Returns the fraction of `max_doc` that is deleted in `segment`,
/// or 0 when `max_doc` is 0.
fn deletes_ratio(segment: &SegmentMeta) -> f32 {
    match segment.max_doc() {
        0 => 0f32,
        max_doc => segment.num_deleted_docs() as f32 / max_doc as f32,
    }
}

impl MergePolicy for LogMergePolicy {
    /// Groups the eligible segments in levels of similar size and proposes one
    /// merge candidate per level that is worth merging.
    ///
    /// - Segments holding more than `max_docs_before_merge` documents are ignored.
    /// - The remaining segments are visited by decreasing `max_doc`; a segment
    ///   opens a new level when its log2 size (clipped from below by
    ///   `min_layer_size`) is more than `level_log_size` below the log2 size
    ///   that opened the current level.
    /// - A level yields a candidate when it holds at least `min_num_segments`
    ///   segments, or when one of its segments is above the deletes threshold.
    fn compute_merge_candidates(&self, segments: &[SegmentMeta]) -> Vec<MergeCandidate> {
        let size_sorted_segments: Vec<&SegmentMeta> = segments
            .iter()
            .filter(|seg| (seg.num_docs() as usize) <= self.max_docs_before_merge)
            .sorted_by_key(|seg| std::cmp::Reverse(seg.max_doc()))
            .collect();

        if size_sorted_segments.is_empty() {
            return Vec::new();
        }

        let mut levels: Vec<Vec<&SegmentMeta>> = Vec::new();
        let mut current_max_log_size = f64::MAX;
        // Log size identifying the level the previous segment was put in.
        let mut previous_level_key = current_max_log_size;
        for segment in size_sorted_segments {
            let segment_log_size = f64::from(self.clip_min_size(segment.num_docs())).log2();
            if segment_log_size < (current_max_log_size - self.level_log_size) {
                // This segment is too small for the current level: it opens a new one.
                current_max_log_size = segment_log_size;
            }
            // Consecutive segments sharing the same key belong to the same level.
            let opens_new_level = levels.is_empty() || previous_level_key != current_max_log_size;
            if opens_new_level {
                levels.push(Vec::new());
            }
            if let Some(level) = levels.last_mut() {
                level.push(segment);
            }
            previous_level_key = current_max_log_size;
        }

        levels
            .into_iter()
            .filter(|level| {
                level.len() >= self.min_num_segments
                    || self.has_segment_above_deletes_threshold(level)
            })
            .map(|level| MergeCandidate(level.into_iter().map(|seg| seg.id()).collect()))
            .collect()
    }
}

impl Default for LogMergePolicy {
    /// Builds a policy configured with the `DEFAULT_*` constants of this module.
    fn default() -> Self {
        Self {
            level_log_size: DEFAULT_LEVEL_LOG_SIZE,
            min_layer_size: DEFAULT_MIN_LAYER_SIZE,
            min_num_segments: DEFAULT_MIN_NUM_SEGMENTS_IN_MERGE,
            max_docs_before_merge: DEFAULT_MAX_DOCS_BEFORE_MERGE,
            del_docs_ratio_before_merge: DEFAULT_DEL_DOCS_RATIO_BEFORE_MERGE,
        }
    }
}

#[cfg(test)]
mod tests {
    use once_cell::sync::Lazy;

    use super::*;
    use crate::index::{SegmentId, SegmentMetaInventory};
    use crate::schema;
    use crate::schema::INDEXED;
    use crate::Index;

    /// Inventory shared by all the segment metas created in these tests.
    static INVENTORY: Lazy<SegmentMetaInventory> = Lazy::new(SegmentMetaInventory::default);

    #[test]
    fn create_index_test_max_merge_issue_1035() -> crate::Result<()> {
        let mut schema_builder = schema::Schema::builder();
        let int_field = schema_builder.add_u64_field("intval", INDEXED);
        let schema = schema_builder.build();

        let index = Index::create_in_ram(schema);

        {
            let mut log_merge_policy = LogMergePolicy::default();
            log_merge_policy.set_min_num_segments(1);
            log_merge_policy.set_max_docs_before_merge(1);
            log_merge_policy.set_min_layer_size(0);

            let mut index_writer = index.writer_for_tests()?;
            index_writer.set_merge_policy(Box::new(log_merge_policy));

            // after every commit the merge checker is started, it will merge only segments with 1
            // element in it because of the max_docs_before_merge.
            for value in 1..=8u64 {
                index_writer.add_document(doc!(int_field=>value))?;
                index_writer.commit()?;
            }
        }

        let _segment_ids = index
            .searchable_segment_ids()
            .expect("Searchable segments failed.");

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let segment_readers = searcher.segment_readers();
        for segment in segment_readers {
            // don't know how to wait for the merge, then it could be a simple eq
            assert!(
                segment.num_docs() <= 2,
                "segment can't have more than two documents"
            );
        }
        Ok(())
    }

    /// Policy used by most tests: levels are merged from 3 segments on, segments
    /// above 100_000 docs are ignored, and sizes are clipped from below at 2 docs.
    fn test_merge_policy() -> LogMergePolicy {
        let mut log_merge_policy = LogMergePolicy::default();
        log_merge_policy.set_min_num_segments(3);
        log_merge_policy.set_max_docs_before_merge(100_000);
        log_merge_policy.set_min_layer_size(2);
        log_merge_policy
    }

    #[test]
    fn test_log_merge_policy_empty() {
        let y = Vec::new();
        let result_list = test_merge_policy().compute_merge_candidates(&y);
        assert!(result_list.is_empty());
    }

    /// Creates a segment meta with a random id and `num_docs` documents.
    fn create_random_segment_meta(num_docs: u32) -> SegmentMeta {
        INVENTORY.new_segment_meta(SegmentId::generate_random(), num_docs)
    }

    #[test]
    fn test_log_merge_policy_pair() {
        let test_input = vec![
            create_random_segment_meta(10),
            create_random_segment_meta(10),
            create_random_segment_meta(10),
        ];
        let result_list = test_merge_policy().compute_merge_candidates(&test_input);
        assert_eq!(result_list.len(), 1);
    }

    #[test]
    fn test_log_merge_policy_levels() {
        // multiple levels all get merged correctly
        // 2 MergeCandidates expected:
        // * one with the 6 * 10-docs segments
        // * one with the 3 * 1000-docs segments
        // no MergeCandidate expected for the 2 * 10_000-docs segments as min_num_segments=3
        let test_input = vec![
            create_random_segment_meta(10),
            create_random_segment_meta(10),
            create_random_segment_meta(10),
            create_random_segment_meta(1_000),
            create_random_segment_meta(1_000),
            create_random_segment_meta(1_000),
            create_random_segment_meta(10_000),
            create_random_segment_meta(10_000),
            create_random_segment_meta(10),
            create_random_segment_meta(10),
            create_random_segment_meta(10),
        ];
        let result_list = test_merge_policy().compute_merge_candidates(&test_input);
        assert_eq!(result_list.len(), 2);
    }

    #[test]
    fn test_log_merge_policy_within_levels() {
        // multiple levels all get merged correctly
        let test_input = vec![
            create_random_segment_meta(10),   // log2(10) = ~3.32 (> 3.58 - 0.75)
            create_random_segment_meta(11),   // log2(11) = ~3.46
            create_random_segment_meta(12),   // log2(12) = ~3.58
            create_random_segment_meta(800),  // log2(800) = ~9.64 (> 9.97 - 0.75)
            create_random_segment_meta(1000), // log2(1000) = ~9.97
            create_random_segment_meta(1000), // log2(1000) = ~9.97
        ];
        let result_list = test_merge_policy().compute_merge_candidates(&test_input);
        assert_eq!(result_list.len(), 2);
    }

    #[test]
    fn test_log_merge_policy_small_segments() {
        // segments under min_layer_size are merged together
        let test_input = vec![
            create_random_segment_meta(1),
            create_random_segment_meta(1),
            create_random_segment_meta(1),
            create_random_segment_meta(2),
            create_random_segment_meta(2),
            create_random_segment_meta(2),
        ];
        let result_list = test_merge_policy().compute_merge_candidates(&test_input);
        assert_eq!(result_list.len(), 1);
    }

    #[test]
    fn test_log_merge_policy_all_segments_too_large_to_merge() {
        let eight_large_segments: Vec<SegmentMeta> =
            std::iter::repeat_with(|| create_random_segment_meta(100_001))
                .take(8)
                .collect();
        assert!(test_merge_policy()
            .compute_merge_candidates(&eight_large_segments)
            .is_empty());
    }

    #[test]
    fn test_large_merge_segments() {
        let test_input = vec![
            create_random_segment_meta(1_000_000),
            create_random_segment_meta(100_001),
            create_random_segment_meta(100_000),
            create_random_segment_meta(1_000_001),
            create_random_segment_meta(100_000),
            create_random_segment_meta(100_000),
            create_random_segment_meta(1_500_000),
        ];
        let result_list = test_merge_policy().compute_merge_candidates(&test_input);
        // Do not include large segments
        assert_eq!(result_list.len(), 1);
        assert_eq!(result_list[0].0.len(), 3);

        // Making sure merge policy points to the correct index of the original input
        assert_eq!(result_list[0].0[0], test_input[2].id());
        assert_eq!(result_list[0].0[1], test_input[4].id());
        assert_eq!(result_list[0].0[2], test_input[5].id());
    }

    #[test]
    fn test_merge_single_segment_with_deletes_below_threshold() {
        let mut test_merge_policy = test_merge_policy();
        test_merge_policy.set_del_docs_ratio_before_merge(0.25f32);
        // 10_000 / 40_000 is exactly the threshold, which is not enough to trigger a merge.
        let test_input = vec![create_random_segment_meta(40_000).with_delete_meta(10_000, 1)];
        let merge_candidates = test_merge_policy.compute_merge_candidates(&test_input);
        assert!(merge_candidates.is_empty());
    }

    #[test]
    fn test_merge_single_segment_with_deletes_above_threshold() {
        let mut test_merge_policy = test_merge_policy();
        test_merge_policy.set_del_docs_ratio_before_merge(0.25f32);
        let test_input = vec![create_random_segment_meta(40_000).with_delete_meta(10_001, 1)];
        let merge_candidates = test_merge_policy.compute_merge_candidates(&test_input);
        assert_eq!(merge_candidates.len(), 1);
    }

    #[test]
    fn test_merge_segments_with_deletes_above_threshold_all_in_level() {
        let mut test_merge_policy = test_merge_policy();
        test_merge_policy.set_del_docs_ratio_before_merge(0.25f32);
        let test_input = vec![
            create_random_segment_meta(40_000).with_delete_meta(10_001, 1),
            create_random_segment_meta(40_000),
        ];
        let merge_candidates = test_merge_policy.compute_merge_candidates(&test_input);
        assert_eq!(merge_candidates.len(), 1);
        assert_eq!(merge_candidates[0].0.len(), 2);
    }

    #[test]
    fn test_merge_segments_with_deletes_above_threshold_different_level_not_involved() {
        let mut test_merge_policy = test_merge_policy();
        test_merge_policy.set_del_docs_ratio_before_merge(0.25f32);
        let test_input = vec![
            create_random_segment_meta(100),
            create_random_segment_meta(40_000).with_delete_meta(10_001, 1),
        ];
        let merge_candidates = test_merge_policy.compute_merge_candidates(&test_input);
        assert_eq!(merge_candidates.len(), 1);
        assert_eq!(merge_candidates[0].0.len(), 1);
        assert_eq!(merge_candidates[0].0[0], test_input[1].id());
    }

    #[test]
    fn test_max_docs_before_merge_large_value() {
        // Regression test: (max_docs_before_merge as u32) truncates values > u32::MAX.
        // Casting num_docs() to usize instead avoids the truncation.
        let mut policy = LogMergePolicy::default();
        policy.set_min_num_segments(2);
        policy.set_max_docs_before_merge(5_000_000_000usize);
        let test_input = vec![
            create_random_segment_meta(100_000),
            create_random_segment_meta(100_000),
        ];
        let result = policy.compute_merge_candidates(&test_input);
        // Both segments should be eligible (100_000 < 5_000_000_000)
        assert_eq!(result.len(), 1);
        assert_eq!(result[0].0.len(), 2);
    }
}


================================================
FILE: src/indexer/merge_index_test.rs
================================================
#[cfg(test)]
mod tests {
    use crate::collector::TopDocs;
    use crate::fastfield::AliveBitSet;
    use crate::index::Index;
    use crate::postings::Postings;
    use crate::query::QueryParser;
    use crate::schema::{
        self, BytesOptions, Facet, FacetOptions, IndexRecordOption, NumericOptions,
        TextFieldIndexing, TextOptions,
    };
    use crate::{DocAddress, DocSet, IndexSettings, IndexWriter, Term};

    /// Builds an in-RAM index, fills it over three commits, deletes every document
    /// containing the term `deleteme` in `text_field`, and finally merges all
    /// searchable segments.
    ///
    /// `index_settings`, when provided, is forwarded to the index builder.
    ///
    /// Returns the index after the merge has completed.
    fn create_test_index(index_settings: Option<IndexSettings>) -> crate::Result<Index> {
        let mut schema_builder = schema::Schema::builder();
        let int_options = NumericOptions::default()
            .set_fast()
            .set_stored()
            .set_indexed();
        let int_field = schema_builder.add_u64_field("intval", int_options);

        let bytes_options = BytesOptions::default().set_fast().set_indexed();
        let bytes_field = schema_builder.add_bytes_field("bytes", bytes_options);
        let facet_field = schema_builder.add_facet_field("facet", FacetOptions::default());

        let multi_numbers =
            schema_builder.add_u64_field("multi_numbers", NumericOptions::default().set_fast());
        // The text field records frequencies and positions, which `test_merge_index`
        // inspects after the merge.
        let text_field_options = TextOptions::default()
            .set_indexing_options(
                TextFieldIndexing::default()
                    .set_index_option(schema::IndexRecordOption::WithFreqsAndPositions),
            )
            .set_stored();
        let text_field = schema_builder.add_text_field("text_field", text_field_options);
        let schema = schema_builder.build();

        let mut index_builder = Index::builder().schema(schema);
        if let Some(settings) = index_settings {
            index_builder = index_builder.settings(settings);
        }
        let index = index_builder.create_in_ram()?;

        {
            let mut index_writer = index.writer_for_tests()?;

            // First commit: four documents.
            index_writer.add_document(doc!(int_field=>1_u64))?;
            index_writer.add_document(
                doc!(int_field=>3_u64, multi_numbers => 3_u64, multi_numbers => 4_u64, bytes_field => vec![1, 2, 3], text_field => "some text", facet_field=> Facet::from("/book/crime")),
            )?;
            index_writer.add_document(
                doc!(int_field=>1_u64, text_field=> "deleteme",  text_field => "ok text more text"),
            )?;
            index_writer.add_document(
                doc!(int_field=>2_u64, multi_numbers => 2_u64, multi_numbers => 3_u64, text_field => "ok text more text"),
            )?;

            index_writer.commit()?;
            // Second commit: two documents.
            index_writer.add_document(doc!(int_field=>20_u64, multi_numbers => 20_u64))?;

            let in_val = 1u64;
            index_writer.add_document(doc!(int_field=>in_val, text_field=> "deleteme" , text_field => "ok text more text", facet_field=> Facet::from("/book/crime")))?;
            index_writer.commit()?;
            // Third commit: three documents, plus the delete of every `deleteme` document.
            let int_vals = [10u64, 5];
            index_writer.add_document( // position of this doc after delete in desc sorting = [2], in disjunct case [1]
                doc!(int_field=>int_vals[0], multi_numbers => 10_u64, multi_numbers => 11_u64, text_field=> "blubber", facet_field=> Facet::from("/book/fantasy")),
            )?;
            index_writer.add_document(doc!(int_field=>int_vals[1], text_field=> "deleteme"))?;
            index_writer.add_document(
                doc!(int_field=>1_000u64, multi_numbers => 1001_u64, multi_numbers => 1002_u64, bytes_field => vec![5, 5],text_field => "the biggest num")
            )?;

            index_writer.delete_term(Term::from_field_text(text_field, "deleteme"));
            index_writer.commit()?;
        }

        // Merging the segments
        {
            let segment_ids = index.searchable_segment_ids()?;
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            // Wait for the merge itself, then for the merging threads to finish.
            index_writer.merge(&segment_ids).wait()?;
            index_writer.wait_merging_threads()?;
        }
        Ok(index)
    }

    /// Checks the content of the single segment produced by `create_test_index`:
    /// search results by doc id, then the postings of the term `text`.
    #[test]
    fn test_merge_index() {
        let index = create_test_index(Some(IndexSettings {
            ..Default::default()
        }))
        .unwrap();

        // After the merge, exactly one segment is expected.
        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        assert_eq!(searcher.segment_readers().len(), 1);
        let segment_reader = searcher.segment_readers().last().unwrap();

        // NOTE(review): this opens a second reader/searcher; `segment_reader` above still
        // borrows from the first (now shadowed) searcher.
        let searcher = index.reader().unwrap().searcher();
        {
            let my_text_field = index.schema().get_field("text_field").unwrap();

            // Runs `term` against `text_field` and returns the doc ids of the top 3 hits.
            let do_search = |term: &str| {
                let query = QueryParser::for_index(&index, vec![my_text_field])
                    .parse_query(term)
                    .unwrap();
                let top_docs: Vec<(f32, DocAddress)> = searcher
                    .search(&query, &TopDocs::with_limit(3).order_by_score())
                    .unwrap();

                top_docs.iter().map(|el| el.1.doc_id).collect::<Vec<_>>()
            };

            // Expected doc ids in the merged segment.
            assert_eq!(do_search("some"), vec![1]);
            assert_eq!(do_search("blubber"), vec![3]);
            assert_eq!(do_search("biggest"), vec![4]);
        }

        // postings file
        {
            let my_text_field = index.schema().get_field("text_field").unwrap();
            let term_a = Term::from_field_text(my_text_field, "text");
            let inverted_index = segment_reader.inverted_index(my_text_field).unwrap();
            let mut postings = inverted_index
                .read_postings(&term_a, IndexRecordOption::WithFreqsAndPositions)
                .unwrap()
                .unwrap();
            assert_eq!(postings.doc_freq(), 2);
            // Only used when the merged segment reader exposes no alive bitset.
            let fallback_bitset = AliveBitSet::for_test_from_deleted_docs(&[0], 100);
            assert_eq!(
                postings.doc_freq_given_deletes(
                    segment_reader.alive_bitset().unwrap_or(&fallback_bitset)
                ),
                2
            );

            // First posting: a single occurrence, at position 1.
            assert_eq!(postings.term_freq(), 1);
            let mut output = vec![];
            postings.positions(&mut output);
            assert_eq!(output, vec![1]);
            postings.advance();

            // Second posting: two occurrences, at positions 1 and 3.
            assert_eq!(postings.term_freq(), 2);
            postings.positions(&mut output);
            assert_eq!(output, vec![1, 3]);
        }
    }
}


================================================
FILE: src/indexer/merge_operation.rs
================================================
use std::collections::HashSet;
use std::ops::Deref;

use crate::index::SegmentId;
use crate::{Inventory, Opstamp, TrackedObject};

/// Inventory of the tracked merge operations.
///
/// Newtype around `Inventory<InnerMergeOperation>`.
#[derive(Default)]
pub(crate) struct MergeOperationInventory(Inventory<InnerMergeOperation>);

/// Gives direct access to the methods of the wrapped inventory
/// (this file relies on it for `list` and `track`).
impl Deref for MergeOperationInventory {
    type Target = Inventory<InnerMergeOperation>;

    /// Returns a reference to the wrapped inventory.
    fn deref(&self) -> &Self::Target {
        &self.0
    }
}

impl MergeOperationInventory {
    /// Returns the ids of all segments referenced by the merge operations
    /// currently listed in the inventory.
    pub fn segment_in_merge(&self) -> HashSet<SegmentId> {
        let mut busy_segment_ids = HashSet::default();
        for tracked_merge_op in self.list() {
            busy_segment_ids.extend(tracked_merge_op.segment_ids.iter().copied());
        }
        busy_segment_ids
    }
}

/// A `MergeOperation` has two roles.
///
/// First, it carries all of the information required to describe a merge:
/// - `target_opstamp` is the opstamp up to which we want to consume the delete queue and reflect
///   their deletes.
/// - `segment_ids` is the list of segments to be merged.
///
/// Second, it keeps track of the fact that these segments are being merged,
/// so that we avoid starting a merge operation that may conflict with this one.
///
/// This works by tracking merge operations. When computing merge candidates,
/// we simply list the tracked merge operations and remove their segments from
/// the possible merge candidates.
pub struct MergeOperation {
    inner: TrackedObject<InnerMergeOperation>,
}

/// Payload of a `MergeOperation`, stored in the `MergeOperationInventory`.
pub(crate) struct InnerMergeOperation {
    // Opstamp up to which the delete queue should be consumed.
    target_opstamp: Opstamp,
    // Segments to be merged.
    segment_ids: Vec<SegmentId>,
}

impl MergeOperation {
    /// Creates a merge operation and registers it in `inventory`.
    pub(crate) fn new(
        inventory: &MergeOperationInventory,
        target_opstamp: Opstamp,
        segment_ids: Vec<SegmentId>,
    ) -> MergeOperation {
        let inner = inventory.track(InnerMergeOperation {
            target_opstamp,
            segment_ids,
        });
        MergeOperation { inner }
    }

    /// Opstamp up to which the delete queue should be consumed, so that the
    /// corresponding deletes are reflected in the merge.
    pub fn target_opstamp(&self) -> Opstamp {
        self.inner.target_opstamp
    }

    /// Segments that this operation merges.
    pub fn segment_ids(&self) -> &[SegmentId] {
        self.inner.segment_ids.as_slice()
    }
}


================================================
FILE: src/indexer/merge_policy.rs
================================================
use std::fmt::Debug;
use std::marker;

use crate::index::{SegmentId, SegmentMeta};

/// Set of segments suggested for a merge.
///
/// The wrapped vector holds the ids of the segments to merge together.
#[derive(Debug, Clone)]
pub struct MergeCandidate(pub Vec<SegmentId>);

/// The `MergePolicy` defines which segments should be merged.
///
/// Every time the list of segments changes, the segment updater
/// asks the merge policy if some segments should be merged.
///
/// Implementations must be `Send + Sync + Debug`.
pub trait MergePolicy: marker::Send + marker::Sync + Debug {
    /// Given the list of segment metas, returns the list of merge candidates.
    ///
    /// Returning an empty vector means that no merge is suggested.
    ///
    /// This call happens on the segment updater thread, and will block
    /// other segment updates, so all implementations should return quickly.
    fn compute_merge_candidates(&self, segments: &[SegmentMeta]) -> Vec<MergeCandidate>;
}

/// Merge policy that never suggests any merge.
///
/// `NoMergePolicy::default()` yields the only possible value of this unit struct.
#[derive(Debug, Clone, Default)]
pub struct NoMergePolicy;

impl MergePolicy for NoMergePolicy {
    /// Always returns an empty list: the segments are ignored.
    fn compute_merge_candidates(&self, _segments: &[SegmentMeta]) -> Vec<MergeCandidate> {
        vec![]
    }
}

#[cfg(test)]
pub(crate) mod tests {

    use super::*;

    /// `MergePolicy` meant for tests.
    ///
    /// As soon as there are at least two segments, it suggests
    /// merging all of them into one.
    #[derive(Debug, Clone)]
    pub struct MergeWheneverPossible;

    impl MergePolicy for MergeWheneverPossible {
        fn compute_merge_candidates(&self, segment_metas: &[SegmentMeta]) -> Vec<MergeCandidate> {
            // Zero or one segment: there is nothing to merge.
            if segment_metas.len() <= 1 {
                return Vec::new();
            }
            let all_segment_ids: Vec<SegmentId> =
                segment_metas.iter().map(|meta| meta.id()).collect();
            vec![MergeCandidate(all_segment_ids)]
        }
    }
}


================================================
FILE: src/indexer/merger.rs
================================================
use std::sync::Arc;

use columnar::{
    ColumnType, ColumnarReader, MergeRowOrder, RowAddr, ShuffleMergeOrder, StackMergeOrder,
};
use common::ReadOnlyBitSet;
use itertools::Itertools;
use measure_time::debug_time;

use crate::directory::WritePtr;
use crate::docset::{DocSet, TERMINATED};
use crate::error::DataCorruption;
use crate::fastfield::AliveBitSet;
use crate::fieldnorm::{FieldNormReader, FieldNormReaders, FieldNormsSerializer, FieldNormsWriter};
use crate::index::{Segment, SegmentComponent, SegmentReader};
use crate::indexer::doc_id_mapping::{MappingType, SegmentDocIdMapping};
use crate::indexer::SegmentSerializer;
use crate::postings::{InvertedIndexSerializer, Postings, SegmentPostings};
use crate::schema::{value_type_to_column_type, Field, FieldType, Schema};
use crate::store::StoreWriter;
use crate::termdict::{TermMerger, TermOrdinal};
use crate::{DocAddress, DocId, InvertedIndexReader};

/// Segment's max doc must be `< MAX_DOC_LIMIT`.
///
/// We do not allow segments with `MAX_DOC_LIMIT` (2^31) documents or more.
pub const MAX_DOC_LIMIT: u32 = 1 << 31;

/// Estimates the number of tokens of `field` held by the alive documents of `reader`.
///
/// Three strategies are tried in order:
/// 1. without deletes, the value stored in the inverted index is returned as is;
/// 2. with deletes and fieldnorms, the fieldnorms of the alive documents are summed;
/// 3. otherwise, the stored value is scaled by the ratio of alive documents.
fn estimate_total_num_tokens_in_single_segment(
    reader: &SegmentReader,
    field: Field,
) -> crate::Result<u64> {
    // No deletes: the value saved in the posting list can be used directly.
    // It is not necessarily exact, as the segment may itself result from a merge of
    // segments that contained deletes.
    if !reader.has_deletes() {
        let inverted_index = reader.inverted_index(field)?;
        return Ok(inverted_index.total_num_tokens());
    }

    // With deletes, approximate using the fieldnorms when they are available.
    if let Some(fieldnorm_reader) = reader.fieldnorms_readers().get_field(field)? {
        // Histogram of the fieldnorm ids of the alive documents.
        let mut num_docs_per_fieldnorm_id = [0usize; 256];
        for alive_doc in reader.doc_ids_alive() {
            let fieldnorm_id = fieldnorm_reader.fieldnorm_id(alive_doc);
            num_docs_per_fieldnorm_id[fieldnorm_id as usize] += 1;
        }
        let mut estimated_num_tokens = 0u64;
        for (fieldnorm_id, &num_docs) in num_docs_per_fieldnorm_id.iter().enumerate() {
            let fieldnorm = u64::from(FieldNormReader::id_to_fieldnorm(fieldnorm_id as u8));
            estimated_num_tokens += num_docs as u64 * fieldnorm;
        }
        return Ok(estimated_num_tokens);
    }

    // No fieldnorms available: pro-rate the overall number of tokens by the ratio of
    // alive documents.
    let segment_num_tokens = reader.inverted_index(field)?.total_num_tokens();
    let max_doc = reader.max_doc();
    if max_doc == 0 {
        // Supposedly never happens; this guards the division below.
        return Ok(0u64);
    }
    let alive_ratio = reader.num_docs() as f64 / max_doc as f64;
    Ok((segment_num_tokens as f64 * alive_ratio) as u64)
}

/// Sums the per-segment token estimates of `field` over all `readers`.
///
/// Stops at, and returns, the first error encountered.
fn estimate_total_num_tokens(readers: &[SegmentReader], field: Field) -> crate::Result<u64> {
    readers.iter().try_fold(0u64, |num_tokens_so_far, reader| {
        estimate_total_num_tokens_in_single_segment(reader, field)
            .map(|segment_num_tokens| num_tokens_so_far + segment_num_tokens)
    })
}

/// Merges several segments into a single one.
pub struct IndexMerger {
    // Schema of the index the segments belong to.
    schema: Schema,
    // Readers of the segments to merge.
    pub(crate) readers: Vec<SegmentReader>,
    // Sum of `num_docs()` over `readers`; returned by `write` as the number of
    // documents of the resulting segment.
    max_doc: u32,
}

/// Converts absolute positions into deltas, reusing one scratch buffer across calls.
struct DeltaComputer {
    buffer: Vec<u32>,
}

impl DeltaComputer {
    /// Creates a computer whose scratch buffer initially holds 512 entries.
    fn new() -> DeltaComputer {
        let buffer = vec![0u32; 512];
        DeltaComputer { buffer }
    }

    /// Returns, for each position, its difference with the previous one
    /// (the first position is compared against 0).
    ///
    /// The returned slice has the same length as `positions` and borrows the
    /// internal buffer, which grows as needed.
    fn compute_delta(&mut self, positions: &[u32]) -> &[u32] {
        let num_positions = positions.len();
        if self.buffer.len() < num_positions {
            self.buffer.resize(num_positions, 0u32);
        }
        let mut previous = 0u32;
        for (delta, &position) in self.buffer.iter_mut().zip(positions) {
            *delta = position - previous;
            previous = position;
        }
        &self.buffer[..num_positions]
    }
}

/// Translates a `SegmentDocIdMapping` into the `MergeRowOrder` expected by the
/// columnar merge.
///
/// - `Stacked` mappings become a `StackMergeOrder` built from `columnars`.
/// - `StackedWithDeletes` mappings become a `ShuffleMergeOrder` carrying the
///   explicit new-row to old-row table and the alive bitsets.
fn convert_to_merge_order(
    columnars: &[&ColumnarReader],
    doc_id_mapping: SegmentDocIdMapping,
) -> MergeRowOrder {
    match doc_id_mapping.mapping_type() {
        MappingType::Stacked => {
            let stack_order = StackMergeOrder::stack(columnars);
            MergeRowOrder::Stack(stack_order)
        }
        MappingType::StackedWithDeletes => {
            let old_doc_addrs = doc_id_mapping.new_doc_id_to_old_doc_addr;
            let alive_bitsets = doc_id_mapping.alive_bitsets;
            // The original author notes that this conversion is expected to compile
            // down to a no-op (no allocation, no copy).
            let new_row_id_to_old_row_id: Vec<RowAddr> = old_doc_addrs
                .into_iter()
                .map(|old_doc_addr| RowAddr {
                    segment_ord: old_doc_addr.segment_ord,
                    row_id: old_doc_addr.doc_id,
                })
                .collect();
            let shuffle_order = ShuffleMergeOrder {
                new_row_id_to_old_row_id,
                alive_bitsets,
            };
            MergeRowOrder::Shuffled(shuffle_order)
        }
    }
}

/// Lists the `(column name, column type)` pairs of the fast fields of `schema`.
///
/// Fast fields whose value type has no matching column type are left out.
fn extract_fast_field_required_columns(schema: &Schema) -> Vec<(String, ColumnType)> {
    let mut required_columns = Vec::new();
    for (_, field_entry) in schema.fields() {
        if !field_entry.is_fast() {
            continue;
        }
        let value_type = field_entry.field_type().value_type();
        if let Some(column_type) = value_type_to_column_type(value_type) {
            required_columns.push((field_entry.name().to_string(), column_type));
        }
    }
    required_columns
}

impl IndexMerger {
    pub fn open(schema: Schema, segments: &[Segment]) -> crate::Result<IndexMerger> {
        let alive_bitset = segments.iter().map(|_| None).collect_vec();
        Self::open_with_custom_alive_set(schema, segments, alive_bitset)
    }

    /// Creates a merger with a custom alive set for each segment.
    ///
    /// `alive_bitset_opt` is paired positionally with `segments`: make sure the
    /// index of each entry corresponds to the index of its segment. Entries
    /// without a counterpart on the other side are silently ignored.
    ///
    /// - If `None` is provided for a segment, its regular alive set is used.
    /// - If an alive bitset is provided, it is combined with the regular alive set
    ///   by `SegmentReader::open_with_custom_alive_set`. NOTE(review): the previous
    ///   comment described this combination as a "union"; confirm against
    ///   `SegmentReader`.
    ///
    /// This can be used to merge while also applying an additional filter.
    /// One use case is demux, which takes a list of segments and partitions
    /// them, e.g. by the value of a field.
    ///
    /// Segments whose metadata reports zero documents are skipped.
    ///
    /// # Errors
    ///
    /// Returns `TantivyError::InvalidArgument` if the merged segment would hold
    /// `MAX_DOC_LIMIT` documents or more, and propagates any error raised while
    /// opening a segment reader.
    pub fn open_with_custom_alive_set(
        schema: Schema,
        segments: &[Segment],
        alive_bitset_opt: Vec<Option<AliveBitSet>>,
    ) -> crate::Result<IndexMerger> {
        let mut readers = Vec::new();
        for (segment, new_alive_bitset_opt) in segments.iter().zip(alive_bitset_opt) {
            if segment.meta().num_docs() > 0 {
                let reader =
                    SegmentReader::open_with_custom_alive_set(segment, new_alive_bitset_opt)?;
                readers.push(reader);
            }
        }

        // The sum is computed in `u64`: with `u32`, merging a few large segments could
        // overflow (panic in debug builds, wrap around in release builds) before the
        // limit check below had a chance to reject the merge.
        let total_num_docs: u64 = readers
            .iter()
            .map(|reader| u64::from(reader.num_docs()))
            .sum();
        if total_num_docs >= u64::from(MAX_DOC_LIMIT) {
            let err_msg = format!(
                "The segment resulting from this merge would have {total_num_docs} docs,which \
                 exceeds the limit {MAX_DOC_LIMIT}."
            );
            return Err(crate::TantivyError::InvalidArgument(err_msg));
        }
        // Lossless: `total_num_docs < MAX_DOC_LIMIT = 2^31` was checked just above.
        let max_doc = total_num_docs as u32;
        Ok(IndexMerger {
            schema,
            readers,
            max_doc,
        })
    }

    /// Writes the fieldnorms of the merged segment.
    ///
    /// For every field with fieldnorms, the fieldnorm id of each document is
    /// looked up in its original segment, following the order of `doc_id_mapping`,
    /// and the resulting array is handed to `fieldnorms_serializer`.
    fn write_fieldnorms(
        &self,
        mut fieldnorms_serializer: FieldNormsSerializer,
        doc_id_mapping: &SegmentDocIdMapping,
    ) -> crate::Result<()> {
        // Reused across fields to avoid reallocating.
        let mut merged_fieldnorm_ids = Vec::with_capacity(self.max_doc as usize);
        for field in FieldNormsWriter::fields_with_fieldnorm(&self.schema) {
            merged_fieldnorm_ids.clear();
            // One fieldnorm reader per segment, indexed by segment ordinal.
            let mut per_segment_readers: Vec<FieldNormReader> =
                Vec::with_capacity(self.readers.len());
            for segment_reader in &self.readers {
                per_segment_readers.push(segment_reader.get_fieldnorms_reader(field)?);
            }
            for old_doc_addr in doc_id_mapping.iter_old_doc_addrs() {
                let segment_fieldnorms = &per_segment_readers[old_doc_addr.segment_ord as usize];
                merged_fieldnorm_ids.push(segment_fieldnorms.fieldnorm_id(old_doc_addr.doc_id));
            }
            fieldnorms_serializer.serialize_field(field, &merged_fieldnorm_ids[..])?;
        }
        fieldnorms_serializer.close()?;
        Ok(())
    }

    /// Merges the columnar (fast field) data of all segments into `fast_field_wrt`.
    ///
    /// `doc_id_mapping` is consumed: it determines the row order of the merged columnar.
    fn write_fast_fields(
        &self,
        fast_field_wrt: &mut WritePtr,
        doc_id_mapping: SegmentDocIdMapping,
    ) -> crate::Result<()> {
        debug_time!("write-fast-fields");
        let required_columns = extract_fast_field_required_columns(&self.schema);
        let mut segment_columnars: Vec<&ColumnarReader> = Vec::with_capacity(self.readers.len());
        for segment_reader in &self.readers {
            segment_columnars.push(segment_reader.fast_fields().columnar());
        }
        let row_order = convert_to_merge_order(segment_columnars.as_slice(), doc_id_mapping);
        columnar::merge_columnar(
            segment_columnars.as_slice(),
            &required_columns,
            row_order,
            fast_field_wrt,
        )?;
        Ok(())
    }

    /// Builds the doc id mapping obtained by stacking the segments one after the other.
    ///
    /// The new doc ids enumerate the alive documents of the first reader, then those
    /// of the second reader, and so on. The mapping is flagged `StackedWithDeletes`
    /// as soon as one reader has deletes, and `Stacked` otherwise. The alive bitset
    /// of each reader (if any) is cloned into the mapping.
    pub(crate) fn get_doc_id_from_concatenated_data(&self) -> crate::Result<SegmentDocIdMapping> {
        let mut num_alive_docs: usize = 0;
        for reader in &self.readers {
            num_alive_docs += reader.num_docs() as usize;
        }

        let mut new_doc_id_to_old_doc_addr: Vec<DocAddress> = Vec::with_capacity(num_alive_docs);
        for (segment_ord, reader) in self.readers.iter().enumerate() {
            let segment_ord = segment_ord as u32;
            for doc_id in reader.doc_ids_alive() {
                new_doc_id_to_old_doc_addr.push(DocAddress {
                    segment_ord,
                    doc_id,
                });
            }
        }

        let any_segment_has_deletes = self.readers.iter().any(|reader| reader.has_deletes());
        let mapping_type = match any_segment_has_deletes {
            true => MappingType::StackedWithDeletes,
            false => MappingType::Stacked,
        };

        let alive_bitsets: Vec<Option<ReadOnlyBitSet>> = self
            .readers
            .iter()
            .map(|reader| {
                reader
                    .alive_bitset()
                    .map(|alive_bitset| alive_bitset.bitset().clone())
            })
            .collect();

        Ok(SegmentDocIdMapping::new(
            new_doc_id_to_old_doc_addr,
            mapping_type,
            alive_bitsets,
        ))
    }

    /// Merges and writes the postings of `indexed_field`.
    ///
    /// The terms of all segments are merged through a `TermMerger`. For each term,
    /// the posting lists of the segments in which at least one alive document
    /// contains the term are rewritten with remapped doc ids. Terms without any
    /// alive document left are dropped.
    ///
    /// - `_field_type` is unused.
    /// - `fieldnorm_reader` is forwarded to the field serializer.
    /// - `doc_id_mapping` provides, in new doc id order, the old address of each
    ///   document.
    ///
    /// # Errors
    ///
    /// Returns a `DataCorruption` error if, for a given term, some segments have
    /// term frequencies while others do not. Errors from the readers and the
    /// serializer are propagated.
    ///
    /// # Panics
    ///
    /// Panics if the schema does not define an index record option for
    /// `indexed_field`.
    fn write_postings_for_field(
        &self,
        indexed_field: Field,
        _field_type: &FieldType,
        serializer: &mut InvertedIndexSerializer,
        fieldnorm_reader: Option<FieldNormReader>,
        doc_id_mapping: &SegmentDocIdMapping,
    ) -> crate::Result<()> {
        debug_time!("write-postings-for-field");
        // Scratch buffers reused for every document.
        let mut positions_buffer: Vec<u32> = Vec::with_capacity(1_000);
        let mut delta_computer = DeltaComputer::new();

        // NOTE(review): `max_term_ords` is filled below but never read in this function.
        let mut max_term_ords: Vec<TermOrdinal> = Vec::new();

        // One inverted index reader per segment, indexed by segment ordinal.
        let field_readers: Vec<Arc<InvertedIndexReader>> = self
            .readers
            .iter()
            .map(|reader| reader.inverted_index(indexed_field))
            .collect::<crate::Result<Vec<_>>>()?;

        let mut field_term_streams = Vec::new();
        for field_reader in &field_readers {
            let terms = field_reader.terms();
            field_term_streams.push(terms.stream()?);
            max_term_ords.push(terms.num_terms() as u64);
        }

        let mut merged_terms = TermMerger::new(field_term_streams);

        // map from segment doc ids to the resulting merged segment doc id.
        // Documents that are absent from `doc_id_mapping` keep `None`.

        let mut merged_doc_id_map: Vec<Vec<Option<DocId>>> = self
            .readers
            .iter()
            .map(|reader| {
                let mut segment_local_map = vec![];
                segment_local_map.resize(reader.max_doc() as usize, None);
                segment_local_map
            })
            .collect();
        for (new_doc_id, old_doc_addr) in doc_id_mapping.iter_old_doc_addrs().enumerate() {
            let segment_map = &mut merged_doc_id_map[old_doc_addr.segment_ord as usize];
            segment_map[old_doc_addr.doc_id as usize] = Some(new_doc_id as DocId);
        }

        // Note that the total number of tokens is not exact.
        // It is only used as a parameter in the BM25 formula.
        let total_num_tokens: u64 = estimate_total_num_tokens(&self.readers, indexed_field)?;

        // Create the total list of doc ids
        // by stacking the doc ids from the different segment.
        //
        // In the new segments, the doc id from the different
        // segment are stacked so that :
        // - Segment 0's doc ids become doc id [0, seg.max_doc]
        // - Segment 1's doc ids become  [seg0.max_doc, seg0.max_doc + seg.max_doc]
        // - Segment 2's doc ids become  [seg0.max_doc + seg1.max_doc, seg0.max_doc + seg1.max_doc +
        //   seg2.max_doc]
        //
        // This stacking applies only when the index is not sorted, in that case the
        // doc_ids are kmerged by their sort property
        let mut field_serializer =
            serializer.new_field(indexed_field, total_num_tokens, fieldnorm_reader)?;

        let field_entry = self.schema.get_field_entry(indexed_field);

        // ... set segment postings option the new field.
        let segment_postings_option = field_entry.field_type().get_index_record_option().expect(
            "Encountered a field that is not supposed to be
                         indexed. Have you modified the schema?",
        );

        // Reused for every term: (segment ordinal, postings) of the segments that
        // still contain the term after deletes.
        let mut segment_postings_containing_the_term: Vec<(usize, SegmentPostings)> = vec![];

        while merged_terms.advance() {
            segment_postings_containing_the_term.clear();
            let term_bytes: &[u8] = merged_terms.key();

            let mut total_doc_freq = 0;

            // Let's compute the list of non-empty posting lists
            for (segment_ord, term_info) in merged_terms.current_segment_ords_and_term_infos() {
                let segment_reader = &self.readers[segment_ord];
                let inverted_index: &InvertedIndexReader = &field_readers[segment_ord];
                let segment_postings = inverted_index
                    .read_postings_from_terminfo(&term_info, segment_postings_option)?;
                let alive_bitset_opt = segment_reader.alive_bitset();
                // The doc freq only counts alive documents.
                let doc_freq = if let Some(alive_bitset) = alive_bitset_opt {
                    segment_postings.doc_freq_given_deletes(alive_bitset)
                } else {
                    segment_postings.doc_freq()
                };
                if doc_freq > 0u32 {
                    total_doc_freq += doc_freq;
                    segment_postings_containing_the_term.push((segment_ord, segment_postings));
                }
            }

            // At this point, `segment_postings_containing_the_term` contains the posting
            // lists of all of the segments containing the given term (and that are non-empty).
            //
            // NOTE(review): the previous comment stated that "advance has already been
            // called" on these postings; no such call is visible in this function.
            if total_doc_freq == 0u32 {
                // All docs that used to contain the term have been deleted. The `term` will be
                // entirely removed.
                continue;
            }

            // This should never happen as we early exited for total_doc_freq == 0.
            assert!(!segment_postings_containing_the_term.is_empty());

            let has_term_freq = {
                let has_term_freq = !segment_postings_containing_the_term[0]
                    .1
                    .block_cursor
                    .freqs()
                    .is_empty();
                for (_, postings) in &segment_postings_containing_the_term[1..] {
                    // This may look like a strange way to test whether we have term freq or not.
                    // With JSON object, the schema is not sufficient to know whether a term
                    // has its term frequency encoded or not:
                    // strings may have term frequencies, while number terms never have one.
                    //
                    // Ideally, we should have burnt one bit of two in the `TermInfo`.
                    // However, we preferred not changing the codec too much and detect this
                    // instead by
                    // - looking at the size of the skip data for bitpacked blocks
                    // - observing the absence of remaining data after reading the docs for vint
                    // blocks.
                    //
                    // Overall the reliable way to know if we have actual frequencies loaded or not
                    // is to check whether the actual decoded array is empty or not.
                    //
                    // The comparison below is true exactly when this segment disagrees with
                    // the first one.
                    if has_term_freq == postings.block_cursor.freqs().is_empty() {
                        return Err(DataCorruption::comment_only(
                            "Term freqs are inconsistent across segments",
                        )
                        .into());
                    }
                }
                has_term_freq
            };

            field_serializer.new_term(term_bytes, total_doc_freq, has_term_freq)?;

            // We can now serialize this postings, by pushing each document to the
            // postings serializer.
            for (segment_ord, mut segment_postings) in
                segment_postings_containing_the_term.drain(..)
            {
                let old_to_new_doc_id = &merged_doc_id_map[segment_ord];

                let mut doc = segment_postings.doc();
                while doc != TERMINATED {
                    // deleted doc are skipped as they do not have a `remapped_doc_id`.
                    if let Some(remapped_doc_id) = old_to_new_doc_id[doc as usize] {
                        // we make sure to only write the term if
                        // there is at least one document.
                        let term_freq = if has_term_freq {
                            segment_postings.positions(&mut positions_buffer);
                            segment_postings.term_freq()
                        } else {
                            // The positions_buffer may contain positions from the previous term
                            // Existence of positions depend on the value type in JSON fields.
                            // https://github.com/quickwit-oss/tantivy/issues/2283
                            positions_buffer.clear();
                            0u32
                        };

                        // Positions are written as deltas.
                        let delta_positions = delta_computer.compute_delta(&positions_buffer);
                        field_serializer.write_doc(remapped_doc_id, term_freq, delta_positions);
                    }

                    doc = segment_postings.advance();
                }
            }
            // closing the term.
            field_serializer.close_term()?;
        }
        field_serializer.close()?;
        Ok(())
    }

    /// Writes the postings of every indexed field of the schema.
    ///
    /// The fieldnorm reader of each field is looked up in `fieldnorm_readers`
    /// and handed to `write_postings_for_field`.
    fn write_postings(
        &self,
        serializer: &mut InvertedIndexSerializer,
        fieldnorm_readers: FieldNormReaders,
        doc_id_mapping: &SegmentDocIdMapping,
    ) -> crate::Result<()> {
        for (field, field_entry) in self.schema.fields() {
            // Looked up for every field, indexed or not, so that a failing lookup is
            // always reported.
            let fieldnorm_reader = fieldnorm_readers.get_field(field)?;
            if !field_entry.is_indexed() {
                continue;
            }
            let field_type = field_entry.field_type();
            self.write_postings_for_field(
                field,
                field_type,
                serializer,
                fieldnorm_reader,
                doc_id_mapping,
            )?;
        }
        Ok(())
    }

    /// Writes the doc store of the merged segment.
    ///
    /// Each segment's store is either copied document by document, or stacked
    /// as a whole when that is both possible and worthwhile.
    fn write_storable_fields(&self, store_writer: &mut StoreWriter) -> crate::Result<()> {
        debug_time!("write-storable-fields");
        debug!("write-storable-field");

        for segment_reader in &self.readers {
            let store_reader = segment_reader.get_store_reader(1)?;

            // Documents are copied one by one if any of the following holds:
            // - the segment has deletes;
            // - the store holds too little data;
            // - the store's decompressor does not match the writer's compressor.
            //
            // About the second condition: if there is not enough data in the store, we
            // avoid stacking in order to avoid creating many small blocks in the doc
            // store. Once we have 5 full blocks, we start stacking. In the worst case
            // 2/7 of the blocks would be very small.
            // [segment 1 - {1 doc}][segment 2 - {fullblock * 5}{1doc}]
            // => 5 * full blocks, 2 * 1 document blocks
            //
            // In a more realistic scenario the segments are of the same size, so 1/6 of
            // the doc stores would be on average half full, given total randomness (which
            // is not the case here, but not sure how it behaves exactly).
            //
            // https://github.com/quickwit-oss/tantivy/issues/1053
            //
            // `take(7)` avoids walking over all of the checkpoints.
            let copy_doc_by_doc = segment_reader.has_deletes()
                || store_reader.block_checkpoints().take(7).count() < 6
                || store_reader.decompressor() != store_writer.compressor().into();

            if copy_doc_by_doc {
                for raw_doc_res in store_reader.iter_raw(segment_reader.alive_bitset()) {
                    let raw_doc = raw_doc_res?;
                    store_writer.store_bytes(&raw_doc)?;
                }
            } else {
                store_writer.stack(store_reader)?;
            }
        }
        Ok(())
    }

    /// Produces the merged segment by feeding every component to the
    /// `SegmentSerializer`.
    ///
    /// Components are written in this order: fieldnorms, postings, doc store and
    /// fast fields. The postings step re-opens the `FieldNorms` component of the
    /// segment being serialized, which is why fieldnorms go first. The serializer is
    /// closed before returning.
    ///
    /// # Returns
    /// The number of documents in the resulting segment.
    pub fn write(&self, mut serializer: SegmentSerializer) -> crate::Result<u32> {
        let mapping = self.get_doc_id_from_concatenated_data()?;

        debug!("write-fieldnorms");
        if let Some(fieldnorms_serializer) = serializer.extract_fieldnorms_serializer() {
            self.write_fieldnorms(fieldnorms_serializer, &mapping)?;
        }

        debug!("write-postings");
        let fieldnorm_readers = FieldNormReaders::open(
            serializer
                .segment()
                .open_read(SegmentComponent::FieldNorms)?,
        )?;
        let postings_serializer = serializer.get_postings_serializer();
        self.write_postings(postings_serializer, fieldnorm_readers, &mapping)?;

        debug!("write-storagefields");
        let store_writer = serializer.get_store_writer();
        self.write_storable_fields(store_writer)?;

        debug!("write-fastfields");
        let fast_field_write = serializer.get_fast_field_write();
        self.write_fast_fields(fast_field_write, mapping)?;

        debug!("close-serializer");
        serializer.close()?;

        Ok(self.max_doc)
    }
}

#[cfg(test)]
mod tests {

    use columnar::Column;
    use proptest::prop_oneof;
    use proptest::strategy::Strategy;
    use schema::FAST;

    use crate::collector::tests::{
        BytesFastFieldTestCollector, FastFieldTestCollector, TEST_COLLECTOR_WITH_SCORE,
    };
    use crate::collector::{Count, FacetCollector};
    use crate::index::{Index, SegmentId};
    use crate::indexer::NoMergePolicy;
    use crate::query::{AllQuery, BooleanQuery, EnableScoring, Scorer, TermQuery};
    use crate::schema::{
        Facet, FacetOptions, IndexRecordOption, NumericOptions, TantivyDocument, Term,
        TextFieldIndexing, Value, INDEXED, TEXT,
    };
    use crate::time::OffsetDateTime;
    use crate::{
        assert_nearly_equals, schema, DateTime, DocAddress, DocId, DocSet, IndexSettings,
        IndexWriter, Searcher,
    };

    /// Merges the segments produced by two commits (no deletes involved) and checks
    /// that term search, date search, stored documents and fast fields (`score`,
    /// `score_bytes`) all reflect the five documents, addressed in insertion order
    /// within segment ordinal 0.
    #[test]
    fn test_index_merger_no_deletes() -> crate::Result<()> {
        let mut schema_builder = schema::Schema::builder();
        // Text field is indexed with term frequencies and stored, so it can be both
        // searched and read back from the doc store.
        let text_fieldtype = schema::TextOptions::default()
            .set_indexing_options(
                TextFieldIndexing::default().set_index_option(IndexRecordOption::WithFreqs),
            )
            .set_stored();
        let text_field = schema_builder.add_text_field("text", text_fieldtype);
        let date_field = schema_builder.add_date_field("date", INDEXED);
        let score_fieldtype = schema::NumericOptions::default().set_fast();
        let score_field = schema_builder.add_u64_field("score", score_fieldtype);
        let bytes_score_field = schema_builder.add_bytes_field("score_bytes", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        let reader = index.reader()?;
        let curr_time = OffsetDateTime::now_utc();
        {
            let mut index_writer = index.writer_for_tests()?;
            // First commit: three documents, only the first one carries a date.
            index_writer.add_document(doc!(
                text_field => "af b",
                score_field => 3u64,
                date_field => DateTime::from_utc(curr_time),
                bytes_score_field => 3u32.to_be_bytes().as_ref()
            ))?;
            index_writer.add_document(doc!(
                text_field => "a b c",
                score_field => 5u64,
                bytes_score_field => 5u32.to_be_bytes().as_ref()
            ))?;
            index_writer.add_document(doc!(
                text_field => "a b c d",
                score_field => 7u64,
                bytes_score_field => 7u32.to_be_bytes().as_ref()
            ))?;
            index_writer.commit()?;
            // Second commit: two documents, only the first one carries a date.
            index_writer.add_document(doc!(
                text_field => "af b",
                date_field => DateTime::from_utc(curr_time),
                score_field => 11u64,
                bytes_score_field => 11u32.to_be_bytes().as_ref()
            ))?;
            index_writer.add_document(doc!(
                text_field => "a b c g",
                score_field => 13u64,
                bytes_score_field => 13u32.to_be_bytes().as_ref()
            ))?;
            index_writer.commit()?;
        }
        {
            // Merge every searchable segment with a fresh writer and wait for completion.
            let segment_ids = index
                .searchable_segment_ids()
                .expect("Searchable segments failed.");
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            index_writer.merge(&segment_ids).wait()?;
            index_writer.wait_merging_threads()?;
        }
        {
            reader.reload()?;
            let searcher = reader.searcher();
            // Returns the addresses of the documents matching any of `terms`.
            let get_doc_ids = |terms: Vec<Term>| {
                let query = BooleanQuery::new_multiterms_query(terms);
                searcher
                    .search(&query, &TEST_COLLECTOR_WITH_SCORE)
                    .map(|top_docs| top_docs.docs().to_vec())
            };
            {
                // Postings: every expected address lives in segment ordinal 0, with doc ids
                // following the insertion order across both commits.
                assert_eq!(
                    get_doc_ids(vec![Term::from_field_text(text_field, "a")])?,
                    vec![
                        DocAddress::new(0, 1),
                        DocAddress::new(0, 2),
                        DocAddress::new(0, 4)
                    ]
                );
                assert_eq!(
                    get_doc_ids(vec![Term::from_field_text(text_field, "af")])?,
                    vec![DocAddress::new(0, 0), DocAddress::new(0, 3)]
                );
                assert_eq!(
                    get_doc_ids(vec![Term::from_field_text(text_field, "g")])?,
                    vec![DocAddress::new(0, 4)]
                );
                assert_eq!(
                    get_doc_ids(vec![Term::from_field_text(text_field, "b")])?,
                    vec![
                        DocAddress::new(0, 0),
                        DocAddress::new(0, 1),
                        DocAddress::new(0, 2),
                        DocAddress::new(0, 3),
                        DocAddress::new(0, 4)
                    ]
                );
                // Only the two "af b" documents were given a date.
                assert_eq!(
                    get_doc_ids(vec![Term::from_field_date_for_search(
                        date_field,
                        DateTime::from_utc(curr_time)
                    )])?,
                    vec![DocAddress::new(0, 0), DocAddress::new(0, 3)]
                );
            }
            // Doc store: each merged document must return the text it was indexed with.
            {
                let doc = searcher.doc::<TantivyDocument>(DocAddress::new(0, 0))?;
                assert_eq!(
                    doc.get_first(text_field).unwrap().as_value().as_str(),
                    Some("af b")
                );
            }
            {
                let doc = searcher.doc::<TantivyDocument>(DocAddress::new(0, 1))?;
                assert_eq!(
                    doc.get_first(text_field).unwrap().as_value().as_str(),
                    Some("a b c")
                );
            }
            {
                let doc = searcher.doc::<TantivyDocument>(DocAddress::new(0, 2))?;
                assert_eq!(
                    doc.get_first(text_field).unwrap().as_value().as_str(),
                    Some("a b c d")
                );
            }
            {
                let doc = searcher.doc::<TantivyDocument>(DocAddress::new(0, 3))?;
                assert_eq!(doc.get_first(text_field).unwrap().as_str(), Some("af b"));
            }
            {
                let doc = searcher.doc::<TantivyDocument>(DocAddress::new(0, 4))?;
                assert_eq!(doc.get_first(text_field).unwrap().as_str(), Some("a b c g"));
            }

            {
                // Fast fields: collect the `score` / `score_bytes` values of the documents
                // matching the given terms.
                let get_fast_vals = |terms: Vec<Term>| {
                    let query = BooleanQuery::new_multiterms_query(terms);
                    searcher.search(&query, &FastFieldTestCollector::for_field("score"))
                };
                let get_fast_vals_bytes = |terms: Vec<Term>| {
                    let query = BooleanQuery::new_multiterms_query(terms);
                    searcher.search(
                        &query,
                        &BytesFastFieldTestCollector::for_field("score_bytes"),
                    )
                };
                // Term "a" matches the documents scored 5, 7 and 13.
                assert_eq!(
                    get_fast_vals(vec![Term::from_field_text(text_field, "a")])?,
                    vec![5, 7, 13]
                );
                // Same documents, seen through the big-endian u32 bytes field.
                assert_eq!(
                    get_fast_vals_bytes(vec![Term::from_field_text(text_field, "a")])?,
                    vec![0, 0, 0, 5, 0, 0, 0, 7, 0, 0, 0, 13]
                );
            }
        }
        Ok(())
    }

    /// Exercises merging in the presence of deletes.
    ///
    /// The test goes through six phases on the same index and writer: a first commit
    /// with one delete, a second commit with more deletes, a merge of both segments, a
    /// delete-only commit, a single-segment merge that purges deletes, and finally the
    /// deletion of every remaining document. After each phase it checks document
    /// counts, per-term `score` values and the `score` fast field min/max.
    #[test]
    fn test_index_merger_with_deletes() -> crate::Result<()> {
        let mut schema_builder = schema::Schema::builder();
        let text_fieldtype = schema::TextOptions::default()
            .set_indexing_options(
                TextFieldIndexing::default().set_index_option(IndexRecordOption::WithFreqs),
            )
            .set_stored();
        let text_field = schema_builder.add_text_field("text", text_fieldtype);
        let score_fieldtype = schema::NumericOptions::default().set_fast();
        let score_field = schema_builder.add_u64_field("score", score_fieldtype);
        let bytes_score_field = schema_builder.add_bytes_field("score_bytes", FAST);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer = index.writer_for_tests()?;
        let reader = index.reader().unwrap();
        // Returns the `score` fast field values of the documents matching `term`.
        // NOTE: the `score_bytes` fast field is written by this test but never read back;
        // only `score` is collected here.
        let search_term = |searcher: &Searcher, term: Term| {
            let collector = FastFieldTestCollector::for_field("score");
            let term_query = TermQuery::new(term, IndexRecordOption::Basic);
            searcher.search(&term_query, &collector)
        };

        let empty_vec = Vec::<u64>::new();
        {
            // a first commit
            index_writer.add_document(doc!(
                text_field => "a b d",
                score_field => 1u64,
                bytes_score_field => vec![0u8, 0, 0, 1],
            ))?;
            index_writer.add_document(doc!(
                text_field => "b c",
                score_field => 2u64,
                bytes_score_field => vec![0u8, 0, 0, 2],
            ))?;
            // The delete is issued before "c d" is added: the assertions below expect
            // "b c" (score 2) to be gone while "c d" (score 3) is still searchable.
            index_writer.delete_term(Term::from_field_text(text_field, "c"));
            index_writer.add_document(doc!(
                text_field => "c d",
                score_field => 3u64,
                bytes_score_field => vec![0u8, 0, 0, 3],
            ))?;
            index_writer.commit()?;
            reader.reload()?;
            let searcher = reader.searcher();
            // 3 documents were written, 2 are alive.
            assert_eq!(searcher.num_docs(), 2);
            assert_eq!(searcher.segment_readers()[0].num_docs(), 2);
            assert_eq!(searcher.segment_readers()[0].max_doc(), 3);
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "a"))?,
                vec![1]
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "b"))?,
                vec![1]
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "c"))?,
                vec![3]
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "d"))?,
                vec![1, 3]
            );
        }
        {
            // a second commit
            index_writer.add_document(doc!(
                text_field => "a d e",
                score_field => 4_000u64,
                bytes_score_field => vec![0u8, 0, 0, 4],
            ))?;
            index_writer.add_document(doc!(
                text_field => "e f",
                score_field => 5_000u64,
                bytes_score_field => vec![0u8, 0, 0, 5],
            ))?;
            // These deletes are issued before "f g" is added: the assertions below expect
            // "a b d", "a d e" and "e f" to be gone while "f g" stays searchable.
            index_writer.delete_term(Term::from_field_text(text_field, "a"));
            index_writer.delete_term(Term::from_field_text(text_field, "f"));
            index_writer.add_document(doc!(
                text_field => "f g",
                score_field => 6_000u64,
                bytes_score_field => vec![0u8, 0, 23, 112],
            ))?;
            index_writer.add_document(doc!(
                text_field => "g h",
                score_field => 7_000u64,
                bytes_score_field => vec![0u8, 0, 27, 88],
            ))?;
            index_writer.commit()?;
            reader.reload()?;
            let searcher = reader.searcher();

            // Two segments: ordinal 0 holds the 4 documents of this commit (2 alive),
            // ordinal 1 holds the 3 documents of the first commit (1 alive).
            assert_eq!(searcher.segment_readers().len(), 2);
            assert_eq!(searcher.num_docs(), 3);
            assert_eq!(searcher.segment_readers()[0].num_docs(), 2);
            assert_eq!(searcher.segment_readers()[0].max_doc(), 4);
            assert_eq!(searcher.segment_readers()[1].num_docs(), 1);
            assert_eq!(searcher.segment_readers()[1].max_doc(), 3);
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "a"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "b"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "c"))?,
                vec![3]
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "d"))?,
                vec![3]
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "e"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "f"))?,
                vec![6_000]
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "g"))?,
                vec![6_000, 7_000]
            );

            // Before any merge, the expected min/max still span the values of deleted
            // documents (e.g. 4000 and 1 belong to documents that are no longer searchable).
            let score_field_reader = searcher
                .segment_reader(0)
                .fast_fields()
                .u64("score")
                .unwrap();
            assert_eq!(score_field_reader.min_value(), 4000);
            assert_eq!(score_field_reader.max_value(), 7000);

            let score_field_reader = searcher
                .segment_reader(1)
                .fast_fields()
                .u64("score")
                .unwrap();
            assert_eq!(score_field_reader.min_value(), 1);
            assert_eq!(score_field_reader.max_value(), 3);
        }
        {
            // merging the segments
            let segment_ids = index.searchable_segment_ids()?;
            index_writer.merge(&segment_ids).wait()?;
            reader.reload()?;
            let searcher = reader.searcher();
            // A single segment remains and it no longer contains deleted documents
            // (`num_docs == max_doc`).
            assert_eq!(searcher.segment_readers().len(), 1);
            assert_eq!(searcher.num_docs(), 3);
            assert_eq!(searcher.segment_readers()[0].num_docs(), 3);
            assert_eq!(searcher.segment_readers()[0].max_doc(), 3);
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "a"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "b"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "c"))?,
                vec![3]
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "d"))?,
                vec![3]
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "e"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "f"))?,
                vec![6_000]
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "g"))?,
                vec![6_000, 7_000]
            );
            // After the merge, min/max only cover the surviving documents.
            let score_field_reader = searcher
                .segment_reader(0)
                .fast_fields()
                .u64("score")
                .unwrap();
            assert_eq!(score_field_reader.min_value(), 3);
            assert_eq!(score_field_reader.max_value(), 7000);
        }
        {
            // test a commit with only deletes
            index_writer.delete_term(Term::from_field_text(text_field, "c"));
            index_writer.commit()?;

            reader.reload()?;
            let searcher = reader.searcher();
            // Same segment as before, with one more deleted document ("c d").
            assert_eq!(searcher.segment_readers().len(), 1);
            assert_eq!(searcher.num_docs(), 2);
            assert_eq!(searcher.segment_readers()[0].num_docs(), 2);
            assert_eq!(searcher.segment_readers()[0].max_doc(), 3);
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "a"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "b"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "c"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "d"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "e"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "f"))?,
                vec![6_000]
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "g"))?,
                vec![6_000, 7_000]
            );
            // The value 3 belongs to the freshly deleted document, yet it is still the
            // expected minimum until the segment is merged again.
            let score_field_reader = searcher
                .segment_reader(0)
                .fast_fields()
                .u64("score")
                .unwrap();
            assert_eq!(score_field_reader.min_value(), 3);
            assert_eq!(score_field_reader.max_value(), 7000);
        }
        {
            // Test merging a single segment in order to remove deletes.
            let segment_ids = index.searchable_segment_ids()?;
            index_writer.merge(&segment_ids).wait()?;
            reader.reload()?;

            let searcher = reader.searcher();
            assert_eq!(searcher.segment_readers().len(), 1);
            assert_eq!(searcher.num_docs(), 2);
            assert_eq!(searcher.segment_readers()[0].num_docs(), 2);
            assert_eq!(searcher.segment_readers()[0].max_doc(), 2);
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "a"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "b"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "c"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "d"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "e"))?,
                empty_vec
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "f"))?,
                vec![6_000]
            );
            assert_eq!(
                search_term(&searcher, Term::from_field_text(text_field, "g"))?,
                vec![6_000, 7_000]
            );
            // The deleted document's value (3) is gone from the min/max after the merge.
            let score_field_reader = searcher
                .segment_reader(0)
                .fast_fields()
                .u64("score")
                .unwrap();
            assert_eq!(score_field_reader.min_value(), 6000);
            assert_eq!(score_field_reader.max_value(), 7000);
        }

        {
            // Test removing all docs
            index_writer.delete_term(Term::from_field_text(text_field, "g"));
            index_writer.commit()?;
            let segment_ids = index.searchable_segment_ids()?;
            reader.reload()?;

            let searcher = reader.searcher();
            // With every document deleted, no searchable segment is expected to remain.
            assert!(segment_ids.is_empty());
            assert!(searcher.segment_readers().is_empty());
            assert_eq!(searcher.num_docs(), 0);
        }
        Ok(())
    }

    /// Runs `test_merge_facets` without custom index settings, forcing the int values
    /// of the different segments to overlap.
    #[test]
    fn test_merge_facets_sort_none() {
        let index_settings: Option<IndexSettings> = None;
        let force_segment_value_overlap = true;
        test_merge_facets(index_settings, force_segment_value_overlap);
    }

    /// Indexes faceted documents over several commits, then checks the facet counts
    /// under `/top` before the merge, after merging all segments, and after deleting
    /// the documents carrying the `/top/a/firstdoc` facet.
    ///
    /// `index_settings`, when provided, is applied to the index builder.
    ///
    /// `force_segment_value_overlap` forces the int value for sorting to have overlapping
    /// min and max ranges between segments so that the merge algorithm can't apply certain
    /// optimizations.
    fn test_merge_facets(index_settings: Option<IndexSettings>, force_segment_value_overlap: bool) {
        let mut schema_builder = schema::Schema::builder();
        let facet_field = schema_builder.add_facet_field("facet", FacetOptions::default());
        let int_options = NumericOptions::default().set_fast().set_indexed();
        let int_field = schema_builder.add_u64_field("intval", int_options);
        let mut index_builder = Index::builder().schema(schema_builder.build());
        if let Some(settings) = index_settings {
            index_builder = index_builder.settings(settings);
        }
        let index = index_builder.create_in_ram().unwrap();
        let reader = index.reader().unwrap();
        // Running counter used as the `intval` of each document; incremented by `index_doc`.
        let mut int_val = 0;
        {
            let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
            // Adds one document carrying all `doc_facets` and the current `*int_val`, then
            // increments `*int_val`.
            let index_doc =
                |index_writer: &mut IndexWriter, doc_facets: &[&str], int_val: &mut u64| {
                    let mut doc = TantivyDocument::default();
                    for facet in doc_facets {
                        doc.add_facet(facet_field, Facet::from(facet));
                    }
                    doc.add_u64(int_field, *int_val);
                    *int_val += 1;
                    index_writer.add_document(doc).unwrap();
                };

            index_doc(
                &mut index_writer,
                &["/top/a/firstdoc", "/top/b"],
                &mut int_val,
            );
            index_doc(
                &mut index_writer,
                &["/top/a/firstdoc", "/top/b", "/top/c"],
                &mut int_val,
            );
            index_doc(&mut index_writer, &["/top/a", "/top/b"], &mut int_val);
            index_doc(&mut index_writer, &["/top/a"], &mut int_val);

            index_doc(&mut index_writer, &["/top/b", "/top/d"], &mut int_val);
            if force_segment_value_overlap {
                // Literal values are passed through temporaries here, so the shared
                // `int_val` counter is not advanced by these three documents.
                index_doc(&mut index_writer, &["/top/d"], &mut 0);
                index_doc(&mut index_writer, &["/top/e"], &mut 10);
                index_writer.commit().expect("committed");
                index_doc(&mut index_writer, &["/top/a"], &mut 5); // 5 is between 0 - 10 so the
                                                                   // segments don't have disjoint
                                                                   // ranges
            } else {
                index_doc(&mut index_writer, &["/top/d"], &mut int_val);
                index_doc(&mut index_writer, &["/top/e"], &mut int_val);
                index_writer.commit().expect("committed");
                index_doc(&mut index_writer, &["/top/a"], &mut int_val);
            }
            index_doc(&mut index_writer, &["/top/b"], &mut int_val);
            index_doc(&mut index_writer, &["/top/c"], &mut int_val);
            index_writer.commit().expect("committed");

            index_doc(&mut index_writer, &["/top/e", "/top/f"], &mut int_val);
            index_writer.commit().expect("committed");
        }

        reader.reload().unwrap();
        // Asserts the total document count and the per-facet counts directly under `/top`.
        let test_searcher = |expected_num_docs: usize, expected: &[(&str, u64)]| {
            let searcher = reader.searcher();
            let mut facet_collector = FacetCollector::for_field("facet");
            facet_collector.add_facet(Facet::from("/top"));
            let (count, facet_counts) = searcher
                .search(&AllQuery, &(Count, facet_collector))
                .unwrap();
            assert_eq!(count, expected_num_docs);
            let facets: Vec<(String, u64)> = facet_counts
                .get("/top")
                .map(|(facet, count)| (facet.to_string(), count))
                .collect();
            assert_eq!(
                facets,
                expected
                    .iter()
                    .map(|&(facet_str, count)| (String::from(facet_str), count))
                    .collect::<Vec<_>>()
            );
        };
        // Before the merge: 11 documents spread over the committed segments.
        test_searcher(
            11,
            &[
                ("/top/a", 5),
                ("/top/b", 5),
                ("/top/c", 2),
                ("/top/d", 2),
                ("/top/e", 2),
                ("/top/f", 1),
            ],
        );
        // Merging the segments: the counts must be unchanged.
        {
            let segment_ids = index
                .searchable_segment_ids()
                .expect("Searchable segments failed.");
            let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
            index_writer
                .merge(&segment_ids)
                .wait()
                .expect("Merging failed");
            index_writer.wait_merging_threads().unwrap();
            reader.reload().unwrap();
            test_searcher(
                11,
                &[
                    ("/top/a", 5),
                    ("/top/b", 5),
                    ("/top/c", 2),
                    ("/top/d", 2),
                    ("/top/e", 2),
                    ("/top/f", 1),
                ],
            );
        }

        // Deleting one term: the two documents tagged `/top/a/firstdoc` disappear, which
        // lowers the counts of every facet they carried.
        {
            let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
            let facet = Facet::from_path(vec!["top", "a", "firstdoc"]);
            let facet_term = Term::from_facet(facet_field, &facet);
            index_writer.delete_term(facet_term);
            index_writer.commit().unwrap();
            reader.reload().unwrap();
            test_searcher(
                9,
                &[
                    ("/top/a", 3),
                    ("/top/b", 3),
                    ("/top/c", 1),
                    ("/top/d", 2),
                    ("/top/e", 2),
                    ("/top/f", 1),
                ],
            );
        }
    }

    /// Regression test: a `delete_term` that has not been committed yet must not be
    /// visible after merging the segments.
    #[test]
    fn test_bug_merge() -> crate::Result<()> {
        let mut builder = schema::Schema::builder();
        let int_field = builder.add_u64_field("intvals", INDEXED);
        let index = Index::create_in_ram(builder.build());
        let mut writer: IndexWriter = index.writer_for_tests().unwrap();

        // Two commits, each holding a single document with the same value.
        for _ in 0..2 {
            writer.add_document(doc!(int_field => 1u64))?;
            writer.commit().expect("commit failed");
        }

        let reader = index.reader()?;
        // Kept alive until the end of the test, like any searcher acquired before a merge.
        let searcher_before_merge = reader.searcher();
        assert_eq!(searcher_before_merge.num_docs(), 2);

        // Queue a delete matching both documents, but do not commit it.
        let delete_target = Term::from_field_u64(int_field, 1);
        writer.delete_term(delete_target);

        let all_segments = index
            .searchable_segment_ids()
            .expect("Searchable segments failed.");
        writer.merge(&all_segments).wait()?;
        reader.reload()?;

        // commit has not been called yet. The document should still be
        // there.
        let num_docs_after_merge = reader.searcher().num_docs();
        assert_eq!(num_docs_after_merge, 2);
        Ok(())
    }

    /// Merges two single-document segments while a delete matching both documents is
    /// pending: the documents must stay visible until the delete is committed, and the
    /// index must be empty afterwards.
    #[test]
    fn test_merge_multivalued_int_fields_all_deleted() -> crate::Result<()> {
        let mut builder = schema::Schema::builder();
        let int_field = builder.add_u64_field(
            "intvals",
            NumericOptions::default().set_fast().set_indexed(),
        );
        let index = Index::create_in_ram(builder.build());
        let reader = index.reader()?;
        {
            let mut writer = index.writer_for_tests()?;

            let mut template_doc = TantivyDocument::default();
            template_doc.add_u64(int_field, 1);

            // One identical document per commit.
            writer.add_document(template_doc.clone())?;
            writer.commit()?;
            writer.add_document(template_doc)?;
            writer.commit()?;

            // Pending delete matching both documents, followed by a merge of everything.
            writer.delete_term(Term::from_field_u64(int_field, 1));
            let all_segments = index.searchable_segment_ids()?;
            writer.merge(&all_segments).wait()?;

            // assert delete has not been committed
            reader.reload()?;
            let searcher_before_commit = reader.searcher();
            assert_eq!(searcher_before_commit.num_docs(), 2);

            writer.commit()?;

            writer.wait_merging_threads()?;
        }

        // Once the delete is committed, nothing is left to search.
        reader.reload()?;
        let searcher_after_commit = reader.searcher();
        assert_eq!(searcher_after_commit.num_docs(), 0);
        Ok(())
    }

    /// One step of the indexing scenario replayed by `test_merge_int_fields`.
    #[derive(Debug, Clone, Copy, Eq, PartialEq)]
    enum IndexingOp {
        /// Index a document without any value for the int field.
        ZeroVal,
        /// Index a document holding `val` once.
        OneVal { val: u64 },
        /// Index a document holding `val` twice.
        TwoVal { val: u64 },
        /// Commit the index writer.
        Commit,
    }

    /// Proptest strategy producing one [`IndexingOp`] out of four unweighted arms, one
    /// per variant.
    ///
    /// Every arm draws from `0u64..1u64`, so the `val` carried by `OneVal` and `TwoVal`
    /// is always `0`.
    fn balanced_operation_strategy() -> impl Strategy<Value = IndexingOp> {
        // All arms share the same single-value source range.
        let source = || 0u64..1u64;
        prop_oneof![
            source().prop_map(|_| IndexingOp::ZeroVal),
            source().prop_map(|drawn| IndexingOp::OneVal { val: drawn }),
            source().prop_map(|drawn| IndexingOp::TwoVal { val: drawn }),
            source().prop_map(|_| IndexingOp::Commit),
        ]
    }

    use proptest::prelude::*;
    proptest! {
        // Property test: for any sequence of 1 to 19 indexing operations, indexing then
        // merging must succeed (see `test_merge_int_fields` for the checks performed).
        #[test]
        fn test_merge_columnar_int_proptest(ops in proptest::collection::vec(balanced_operation_strategy(), 1..20)) {
            // Report the error and the operations on failure instead of collapsing the
            // result into a bare boolean, which would hide the cause.
            let merge_result = test_merge_int_fields(&ops[..]);
            assert!(
                merge_result.is_ok(),
                "merging int fields failed for {:?}: {:?}",
                ops,
                merge_result
            );
        }
    }
    /// Replays `ops` against a fresh in-RAM index, merges every resulting segment and
    /// checks that the merged `intvals` column returns, for each document, exactly the
    /// values it was indexed with.
    ///
    /// Documents are expected to be numbered by insertion rank in the merged segment.
    /// Returns `Ok(())` right away when `ops` consists of commits only.
    fn test_merge_int_fields(ops: &[IndexingOp]) -> crate::Result<()> {
        let has_indexing_op = ops.iter().any(|op| *op != IndexingOp::Commit);
        if !has_indexing_op {
            return Ok(());
        }

        // One entry per indexed document: (expected doc id, expected values).
        let expected_doc_and_vals: Vec<(u32, Vec<u64>)> = ops
            .iter()
            .filter_map(|op| match op {
                IndexingOp::ZeroVal => Some(Vec::new()),
                IndexingOp::OneVal { val } => Some(vec![*val]),
                IndexingOp::TwoVal { val } => Some(vec![*val, *val]),
                IndexingOp::Commit => None,
            })
            .enumerate()
            .map(|(doc_rank, doc_vals)| (doc_rank as u32, doc_vals))
            .collect();

        let mut schema_builder = schema::Schema::builder();
        let int_field = schema_builder.add_u64_field(
            "intvals",
            NumericOptions::default().set_fast().set_indexed(),
        );
        let index = Index::create_in_ram(schema_builder.build());

        // Indexing phase. Automatic merges are disabled so that segments are only merged
        // by the explicit merge below.
        {
            let mut writer: IndexWriter = index.writer_for_tests()?;
            writer.set_merge_policy(Box::new(NoMergePolicy));
            let add_doc_with_vals = |writer: &mut IndexWriter, int_vals: &[u64]| {
                let mut doc = TantivyDocument::default();
                for val in int_vals.iter().copied() {
                    doc.add_u64(int_field, val);
                }
                writer.add_document(doc).unwrap();
            };

            for op in ops {
                match *op {
                    IndexingOp::ZeroVal => add_doc_with_vals(&mut writer, &[]),
                    IndexingOp::OneVal { val } => add_doc_with_vals(&mut writer, &[val]),
                    IndexingOp::TwoVal { val } => add_doc_with_vals(&mut writer, &[val, val]),
                    IndexingOp::Commit => {
                        writer.commit().expect("commit failed");
                    }
                }
            }
            // Final commit so that trailing documents are searchable too.
            writer.commit().expect("commit failed");
        }

        // Merge phase: all searchable segments, in sorted segment id order.
        {
            let mut all_segments = index.searchable_segment_ids()?;
            all_segments.sort();
            let mut merge_writer: IndexWriter = index.writer_for_tests()?;
            merge_writer.merge(&all_segments).wait()?;
            merge_writer.wait_merging_threads()?;
        }

        let reader = index.reader()?;
        reader.reload()?;

        // Verification phase: read the column of the merged segment document by document.
        {
            let searcher = reader.searcher();
            let merged_segment = searcher.segment_reader(0u32);
            let col: Column<u64> = merged_segment
                .fast_fields()
                .column_opt::<u64>("intvals")
                .unwrap()
                .unwrap();

            // Buffer reused across documents.
            let mut actual_vals: Vec<u64> = Vec::new();
            for (doc_id, expected_vals) in expected_doc_and_vals.iter() {
                let doc_id: DocId = *doc_id;
                actual_vals.clear();
                actual_vals.extend(col.values_for_doc(doc_id));
                assert_eq!(&actual_vals[..], &expected_vals[..]);
            }
        }

        Ok(())
    }

    /// Indexes multivalued `u64` documents over three commits, checks the fast
    /// field column of each resulting segment, then merges the segments and
    /// checks the column of the single merged segment.
    #[test]
    fn test_merge_multivalued_int_fields_simple() -> crate::Result<()> {
        let mut schema_builder = schema::Schema::builder();
        let int_field = schema_builder.add_u64_field(
            "intvals",
            NumericOptions::default().set_fast().set_indexed(),
        );
        let index = Index::create_in_ram(schema_builder.build());

        // Documents grouped by the commit that flushes them; each inner slice
        // holds the values of one document.
        let first_commit: &[&[u64]] = &[&[1, 2], &[1, 2, 3], &[4, 5], &[1, 2], &[1, 5], &[3], &[17]];
        let second_commit: &[&[u64]] = &[&[20]];
        let third_commit: &[&[u64]] = &[&[28, 27], &[1_000]];

        // Checks that document `i` of `col` holds exactly `expected_docs[i]`.
        let assert_column_eq = |col: &Column<u64>, expected_docs: &[&[u64]]| {
            for (doc, expected) in (0u32..).zip(expected_docs) {
                let vals: Vec<u64> = col.values_for_doc(doc).collect();
                assert_eq!(&vals[..], *expected);
            }
        };

        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            for batch in [first_commit, second_commit, third_commit] {
                for int_vals in batch {
                    let mut doc = TantivyDocument::default();
                    for &val in int_vals.iter() {
                        doc.add_u64(int_field, val);
                    }
                    index_writer.add_document(doc).unwrap();
                }
                assert!(index_writer.commit().is_ok());
            }
        }
        let reader = index.reader()?;
        let searcher = reader.searcher();

        // Expected content per segment ordinal before the merge: ordinal 1 is
        // expected to hold the third commit and ordinal 2 the second one.
        for (segment_ord, expected_docs) in
            (0u32..).zip([first_commit, third_commit, second_commit])
        {
            let segment = searcher.segment_reader(segment_ord);
            let col = segment
                .fast_fields()
                .column_opt::<u64>("intvals")
                .unwrap()
                .unwrap();
            assert_column_eq(&col, expected_docs);
        }

        // Merging the segments
        {
            let segment_ids = index.searchable_segment_ids()?;
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            index_writer.merge(&segment_ids).wait()?;
            index_writer.wait_merging_threads()?;
        }
        reader.reload()?;

        // After the merge, the single segment is expected to hold the documents
        // of the former segments concatenated in ordinal order.
        let merged_docs: Vec<&[u64]> = first_commit
            .iter()
            .chain(third_commit)
            .chain(second_commit)
            .copied()
            .collect();
        {
            let searcher = reader.searcher();
            let segment = searcher.segment_reader(0u32);
            let col = segment
                .fast_fields()
                .column_opt::<u64>("intvals")
                .unwrap()
                .unwrap();
            assert_column_eq(&col, &merged_docs[..]);
        }
        Ok(())
    }

    /// Indexes 100 documents with a single-valued and a two-valued `f64` fast
    /// field, committing regularly under a log merge policy, and checks that the
    /// index ends up with exactly one searchable segment.
    #[test]
    fn merges_f64_fast_fields_correctly() -> crate::Result<()> {
        let mut schema_builder = schema::SchemaBuilder::new();
        let single_field = schema_builder.add_f64_field("f64", schema::FAST);
        let multi_field =
            schema_builder.add_f64_field("f64s", NumericOptions::default().set_fast());
        let index = Index::create_in_ram(schema_builder.build());

        // Make sure we'll attempt to merge every created segment
        let mut merge_policy = crate::indexer::LogMergePolicy::default();
        merge_policy.set_min_num_segments(2);
        let mut writer = index.writer_for_tests()?;
        writer.set_merge_policy(Box::new(merge_policy));

        for doc_ord in 0..100 {
            let mut doc = TantivyDocument::new();
            doc.add_f64(single_field, 42.0);
            for multi_val in [0.24, 0.27] {
                doc.add_f64(multi_field, multi_val);
            }
            writer.add_document(doc)?;
            // Commit after the first document and then every fifth one.
            if doc_ord % 5 == 0 {
                writer.commit()?;
            }
        }

        writer.commit()?;
        writer.wait_merging_threads()?;

        // If a merging thread fails, we should end up with more
        // than one segment here
        let num_segments = index.searchable_segments()?.len();
        assert_eq!(1, num_segments);
        Ok(())
    }

    /// Checks the term scorer's `block_max_score` and `score` for the term
    /// "happy": on a first segment, on two segments after a second commit, and
    /// on the single segment produced by merging them.
    #[test]
    fn test_merged_index_has_blockwand() -> crate::Result<()> {
        let mut schema_builder = schema::SchemaBuilder::new();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        let mut writer = index.writer_for_tests()?;
        let term_query = TermQuery::new(
            Term::from_field_text(text_field, "happy"),
            IndexRecordOption::WithFreqs,
        );

        // First commit: 62 identical documents in one segment.
        for _ in 0..62 {
            writer.add_document(doc!(text_field=>"hello happy tax payer"))?;
        }
        writer.commit()?;
        let reader = index.reader()?;
        let initial_searcher = reader.searcher();
        let mut initial_scorer = term_query
            .specialized_weight(EnableScoring::enabled_from_searcher(&initial_searcher))?
            .term_scorer_for_test(initial_searcher.segment_reader(0u32), 1.0)?
            .unwrap();
        assert_eq!(initial_scorer.doc(), 0);
        assert_nearly_equals!(initial_scorer.block_max_score(), 0.0079681855);
        assert_nearly_equals!(initial_scorer.score(), 0.0079681855);

        // Second commit: 81 more identical documents in a second segment.
        for _ in 0..81 {
            writer.add_document(doc!(text_field=>"hello happy tax payer"))?;
        }
        writer.commit()?;
        reader.reload()?;
        let two_segment_searcher = reader.searcher();

        assert_eq!(two_segment_searcher.segment_readers().len(), 2);
        for segment_reader in two_segment_searcher.segment_readers() {
            let mut term_scorer = term_query
                .specialized_weight(EnableScoring::enabled_from_searcher(
                    &two_segment_searcher,
                ))?
                .term_scorer_for_test(segment_reader, 1.0)?
                .unwrap();
            // The score differs from the single-segment one; that difference is
            // intrinsic to the bm25 formula and not a concern.
            for doc in segment_reader.doc_ids_alive() {
                assert_eq!(term_scorer.doc(), doc);
                assert_nearly_equals!(term_scorer.block_max_score(), 0.003478312);
                assert_nearly_equals!(term_scorer.score(), 0.003478312);
                term_scorer.advance();
            }
        }

        // Merge both segments into one.
        let segment_ids: Vec<SegmentId> = two_segment_searcher
            .segment_readers()
            .iter()
            .map(|segment_reader| segment_reader.segment_id())
            .collect();
        writer.merge(&segment_ids).wait()?;

        reader.reload()?;
        let merged_searcher = reader.searcher();
        assert_eq!(merged_searcher.segment_readers().len(), 1);

        let merged_segment = merged_searcher.segment_reader(0u32);
        let mut merged_scorer = term_query
            .specialized_weight(EnableScoring::enabled_from_searcher(&merged_searcher))?
            .term_scorer_for_test(merged_segment, 1.0)?
            .unwrap();
        // Same remark as above: the difference with the very first score is
        // intrinsic to the bm25 formula.
        for doc in merged_segment.doc_ids_alive() {
            assert_eq!(merged_scorer.doc(), doc);
            assert_nearly_equals!(merged_scorer.block_max_score(), 0.003478312);
            assert_nearly_equals!(merged_scorer.score(), 0.003478312);
            merged_scorer.advance();
        }

        Ok(())
    }

    /// Pins `MAX_DOC_LIMIT` to the point where a cast to `i32` changes sign:
    /// the limit itself casts to a negative value, the limit minus one does not.
    #[test]
    fn test_max_doc() {
        // this is the first time I write a unit test for a constant.
        let last_below_limit = (super::MAX_DOC_LIMIT - 1) as i32;
        let limit = super::MAX_DOC_LIMIT as i32;
        assert!(last_below_limit >= 0);
        assert!(limit < 0);
    }
}


================================================
FILE: src/indexer/mod.rs
================================================
//! Indexing and merging data.
//!
//! Contains code to create and merge segments.
//! `IndexWriter` is the main entry point for that. It is created from
//! [`Index::writer`](crate::Index::writer).

/// Delete queue implementation for broadcasting delete operations to consumers.
pub(crate) mod delete_queue;
pub(crate) mod path_to_unordered_id;

pub(crate) mod doc_id_mapping;
mod doc_opstamp_mapping;
mod flat_map_with_buffer;
pub(crate) mod index_writer;
pub(crate) mod index_writer_status;
pub(crate) mod indexing_term;
mod log_merge_policy;
mod merge_index_test;
mod merge_operation;
pub(crate) mod merge_policy;
pub(crate) mod merger;
pub(crate) mod operation;
pub(crate) mod prepared_commit;
mod segment_entry;
mod segment_manager;
mod segment_register;
pub(crate) mod segment_serializer;
pub(crate) mod segment_updater;
pub(crate) mod segment_writer;
pub(crate) mod single_segment_index_writer;
mod stamper;

use crossbeam_channel as channel;
use smallvec::SmallVec;

pub use self::index_writer::{advance_deletes, IndexWriter, IndexWriterOptions};
pub use self::log_merge_policy::LogMergePolicy;
pub use self::merge_operation::MergeOperation;
pub use self::merge_policy::{MergeCandidate, MergePolicy, NoMergePolicy};
pub use self::operation::{AddOperation, DeleteOperation, UserOperation};
pub use self::prepared_commit::PreparedCommit;
pub use self::segment_entry::SegmentEntry;
pub(crate) use self::segment_serializer::SegmentSerializer;
pub use self::segment_updater::{merge_filtered_segments, merge_indices};
pub use self::segment_writer::SegmentWriter;
pub use self::single_segment_index_writer::SingleSegmentIndexWriter;

/// Alias for the default merge policy, which is the `LogMergePolicy`.
pub type DefaultMergePolicy = LogMergePolicy;

// Batch of documents.
// Most of the time, users will send operations one by one, but it can be useful to
// send them as a small block to ensure that
// - all docs in the batch end up in the same segment, with contiguous doc ids.
// - all operations in the batch are committed at the same time, making the batch
//   atomic.
type AddBatch<D> = SmallVec<[AddOperation<D>; 4]>;
// Sending half of the crossbeam channel that carries batches of add operations.
type AddBatchSender<D> = channel::Sender<AddBatch<D>>;
// Receiving half of the crossbeam channel that carries batches of add operations.
type AddBatchReceiver<D> = channel::Receiver<AddBatch<D>>;

#[cfg(feature = "mmap")]
#[cfg(test)]
mod tests_mmap {

    use common::ByteCount;

    use crate::aggregation::agg_req::Aggregations;
    use crate::aggregation::agg_result::AggregationResults;
    use crate::aggregation::AggregationCollector;
    use crate::collector::{Count, TopDocs};
    use crate::index::FieldMetadata;
    use crate::query::{AllQuery, QueryParser};
    use crate::schema::{JsonObjectOptions, Schema, Type, FAST, INDEXED, STORED, TEXT};
    use crate::{Index, IndexWriter, Term};

    /// Regression test: committing a segment that contains one deleted document
    /// plus at least 32 other documents must succeed.
    #[test]
    fn test_advance_delete_bug() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_from_tempdir(schema_builder.build())?;
        let mut writer: IndexWriter = index.writer_for_tests()?;

        // there must be one deleted document in the segment
        let deleted_term = Term::from_field_text(text, "b");
        writer.add_document(doc!(text=>"b"))?;
        writer.delete_term(deleted_term);

        // we need enough data to trigger the bug (at least 32 documents)
        for _ in 0..32 {
            writer.add_document(doc!(text=>"c"))?;
        }
        writer.commit()?;
        Ok(())
    }

    /// With expand-dots left disabled, a JSON key containing dots only matches
    /// when the dots are escaped in the query.
    #[test]
    fn test_json_field_expand_dots_disabled_dot_escaped_required() {
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        let document_json =
            serde_json::json!({"k8s.container.name": "prometheus", "val": "hello"});
        index_writer
            .add_document(doc!(json_field=>document_json))
            .unwrap();
        index_writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        assert_eq!(searcher.num_docs(), 1);

        let query_parser = QueryParser::for_index(&index, Vec::new());
        // (query, expected number of matching documents)
        let expectations = [
            (r"json.k8s\.container\.name:prometheus", 1),
            (r#"json.k8s.container.name:prometheus"#, 0),
        ];
        for (query_str, expected_num_docs) in expectations {
            let query = query_parser.parse_query(query_str).unwrap();
            let num_docs = searcher.search(&query, &Count).unwrap();
            assert_eq!(num_docs, expected_num_docs);
        }
    }

    #[test]
    fn test_json_field_number() {
        // Added specifically to reach cases where a json field with frequencies
        // enabled stores integers, with enough documents containing a single
        // integer for the posting list to be bitpacked.
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer = index.writer_for_tests().unwrap();

        // 256 pairs of documents: one with numeric values, one with strings.
        for _ in 0..256 {
            let numeric_json = serde_json::json!({"somekey": 1u64, "otherkey": -2i64});
            let text_json = serde_json::json!({"somekey": "1str", "otherkey": "2str"});
            for json in [numeric_json, text_json] {
                index_writer.add_document(doc!(json_field=>json)).unwrap();
            }
        }
        index_writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        assert_eq!(searcher.num_docs(), 512);

        // Only the numeric documents are expected to match `somekey:1`.
        let query_parser = QueryParser::for_index(&index, Vec::new());
        let query = query_parser.parse_query(r"json.somekey:1").unwrap();
        let num_docs = searcher.search(&query, &Count).unwrap();
        assert_eq!(num_docs, 256);
    }
    /// A JSON key containing a null byte must not produce a term: only the
    /// entry under the valid key is expected in the term dictionary.
    #[test]
    fn test_json_field_null_byte_is_ignored() {
        let mut schema_builder = Schema::builder();
        let field = schema_builder.add_json_field(
            "json",
            JsonObjectOptions::from(TEXT | FAST).set_expand_dots_enabled(),
        );
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer = index.writer_for_tests().unwrap();
        let json_doc = json!({"key": "test1", "invalidkey\u{0000}": "test2"});
        index_writer.add_document(doc!(field=>json_doc)).unwrap();
        index_writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let first_segment = searcher.segment_reader(0);
        let inverted_index = first_segment.inverted_index(field).unwrap();
        let term_dict = inverted_index.terms();
        assert_eq!(term_dict.num_terms(), 1);

        // The single term is the one built from the valid key.
        let mut term_bytes = Vec::new();
        term_dict.ord_to_term(0, &mut term_bytes).unwrap();
        assert_eq!(term_bytes, b"key\0stest1");
    }

    #[test]
    fn test_json_field_1byte() {
        // Field name containing the `\u{0001}` byte, which has special meaning in
        // tantivy. That byte can be addressed either as the byte itself or as '.'.
        let field_name_in = "\u{0001}";
        for field_name_out in ["\u{0001}", "."] {
            test_json_field_name(field_name_in, field_name_out);
        }
    }

    #[test]
    fn test_json_field_dot() {
        // Field name containing a '.', addressed with the same '.'.
        let dot = ".";
        test_json_field_name(dot, dot);
    }
    /// Shared body of the field-name tests.
    ///
    /// Indexes seven documents whose JSON keys embed `field_name_in` at various
    /// positions (into a `TEXT | FAST` json field with expand-dots enabled), then
    /// checks, using `field_name_out` to address the keys, that:
    /// - each document is matched by exactly one term query,
    /// - a terms aggregation on each path returns the expected key,
    /// - the inverted index lists the expected encoded json fields,
    /// - the columnar reader lists the expected columns.
    fn test_json_field_name(field_name_in: &str, field_name_out: &str) {
        let mut schema_builder = Schema::builder();

        let options = JsonObjectOptions::from(TEXT | FAST).set_expand_dots_enabled();
        let field = schema_builder.add_json_field("json", options);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer = index.writer_for_tests().unwrap();
        // Documents "test1" to "test7": the special name alone, as suffix, in the
        // middle, repeated, combined with a literal '.', nested, and as prefix.
        index_writer
            .add_document(doc!(field=>json!({format!("{field_name_in}"): "test1", format!("num{field_name_in}"): 10})))
            .unwrap();
        index_writer
            .add_document(doc!(field=>json!({format!("a{field_name_in}"): "test2"})))
            .unwrap();
        index_writer
            .add_document(doc!(field=>json!({format!("a{field_name_in}a"): "test3"})))
            .unwrap();
        index_writer
            .add_document(
                doc!(field=>json!({format!("a{field_name_in}a{field_name_in}"): "test4"})),
            )
            .unwrap();
        index_writer
            .add_document(
                doc!(field=>json!({format!("a{field_name_in}.ab{field_name_in}"): "test5"})),
            )
            .unwrap();
        index_writer
            .add_document(
                doc!(field=>json!({format!("a{field_name_in}"): json!({format!("a{field_name_in}"): "test6"}) })),
            )
            .unwrap();
        index_writer
            .add_document(doc!(field=>json!({format!("{field_name_in}a" ): "test7"})))
            .unwrap();

        index_writer.commit().unwrap();
        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let parse_query = QueryParser::for_index(&index, Vec::new());
        // Each query must match exactly one document.
        let test_query = |query_str: &str| {
            let query = parse_query.parse_query(query_str).unwrap();
            let num_docs = searcher.search(&query, &Count).unwrap();
            assert_eq!(num_docs, 1, "{query_str}");
        };
        test_query(format!("json.{field_name_out}:test1").as_str());
        test_query(format!("json.a{field_name_out}:test2").as_str());
        test_query(format!("json.a{field_name_out}a:test3").as_str());
        test_query(format!("json.a{field_name_out}a{field_name_out}:test4").as_str());
        test_query(format!("json.a{field_name_out}.ab{field_name_out}:test5").as_str());
        test_query(format!("json.a{field_name_out}.a{field_name_out}:test6").as_str());
        test_query(format!("json.{field_name_out}a:test7").as_str());

        // A terms aggregation on `field_name` must return `expected` as the key of
        // its first bucket, with a doc count of 1.
        let test_agg = |field_name: &str, expected: &str| {
            let agg_req_str = json!(
            {
              "termagg": {
                "terms": {
                  "field": field_name,
                }
              }
            });

            let agg_req: Aggregations = serde_json::from_value(agg_req_str).unwrap();
            let collector = AggregationCollector::from_aggs(agg_req, Default::default());
            let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();
            let res = serde_json::to_value(agg_res).unwrap();
            assert_eq!(res["termagg"]["buckets"][0]["doc_count"], 1);
            assert_eq!(res["termagg"]["buckets"][0]["key"], expected);
        };

        test_agg(format!("json.{field_name_out}").as_str(), "test1");
        test_agg(format!("json.a{field_name_out}").as_str(), "test2");
        test_agg(format!("json.a{field_name_out}a").as_str(), "test3");
        test_agg(
            format!("json.a{field_name_out}a{field_name_out}").as_str(),
            "test4",
        );
        test_agg(
            format!("json.a{field_name_out}.ab{field_name_out}").as_str(),
            "test5",
        );
        test_agg(
            format!("json.a{field_name_out}.a{field_name_out}").as_str(),
            "test6",
        );
        test_agg(format!("json.{field_name_out}a").as_str(), "test7");

        // `.` is stored as `\u{0001}` internally in tantivy
        let field_name_out_internal = if field_name_out == "." {
            "\u{0001}"
        } else {
            field_name_out
        };

        // Check the json fields listed by the inverted index of the first segment.
        // Both sides are sorted before comparing, so listing order is irrelevant.
        let mut fields: Vec<(String, Type)> = reader.searcher().segment_readers()[0]
            .inverted_index(field)
            .unwrap()
            .list_encoded_json_fields()
            .unwrap()
            .into_iter()
            .map(|field_space| (field_space.field_name, field_space.field_type))
            .collect();
        assert_eq!(fields.len(), 8);
        fields.sort();
        let mut expected_fields = vec![
            (format!("a{field_name_out_internal}"), Type::Str),
            (format!("a{field_name_out_internal}a"), Type::Str),
            (
                format!("a{field_name_out_internal}a{field_name_out_internal}"),
                Type::Str,
            ),
            (
                format!("a{field_name_out_internal}\u{1}ab{field_name_out_internal}"),
                Type::Str,
            ),
            (
                format!("a{field_name_out_internal}\u{1}a{field_name_out_internal}"),
                Type::Str,
            ),
            (format!("{field_name_out_internal}a"), Type::Str),
            (field_name_out_internal.to_string(), Type::Str),
            (format!("num{field_name_out_internal}"), Type::I64),
        ];
        expected_fields.sort();
        assert_eq!(fields, expected_fields);
        // Check columnar reader
        let mut columns = reader.searcher().segment_readers()[0]
            .fast_fields()
            .columnar()
            .list_columns()
            .unwrap()
            .into_iter()
            .map(|(name, _)| name)
            .collect::<Vec<_>>();
        // Column names are the json field name and the path, joined by `\u{1}`.
        let mut expected_columns = vec![
            format!("json\u{1}{field_name_out_internal}"),
            format!("json\u{1}{field_name_out_internal}a"),
            format!("json\u{1}a{field_name_out_internal}"),
            format!("json\u{1}a{field_name_out_internal}a"),
            format!("json\u{1}a{field_name_out_internal}a{field_name_out_internal}"),
            format!("json\u{1}a{field_name_out_internal}\u{1}ab{field_name_out_internal}"),
            format!("json\u{1}a{field_name_out_internal}\u{1}a{field_name_out_internal}"),
            format!("json\u{1}num{field_name_out_internal}"),
        ];
        columns.sort();
        expected_columns.sort();
        assert_eq!(columns, expected_columns);
    }

    /// With expand-dots enabled, a JSON key containing dots matches whether or
    /// not the dots are escaped in the query.
    #[test]
    fn test_json_field_expand_dots_enabled_dot_escape_not_required() {
        let mut schema_builder = Schema::builder();
        let json_options: JsonObjectOptions =
            JsonObjectOptions::from(TEXT).set_expand_dots_enabled();
        let json_field = schema_builder.add_json_field("json", json_options);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        let document_json =
            serde_json::json!({"k8s.container.name": "prometheus", "val": "hello"});
        index_writer
            .add_document(doc!(json_field=>document_json))
            .unwrap();
        index_writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        assert_eq!(searcher.num_docs(), 1);

        let query_parser = QueryParser::for_index(&index, Vec::new());
        // Unescaped first, escaped second: both must match the single document.
        let query_strs = [
            r#"json.k8s.container.name:prometheus"#,
            r"json.k8s\.container\.name:prometheus",
        ];
        for query_str in query_strs {
            let query = query_parser.parse_query(query_str).unwrap();
            let num_docs = searcher.search(&query, &Count).unwrap();
            assert_eq!(num_docs, 1);
        }
    }

    /// Checks the (name, type) pairs listed by the inverted index of a json
    /// field, including a path that holds both an integer and a string.
    #[test]
    fn test_json_field_list_fields() {
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", JsonObjectOptions::from(TEXT));
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer = index.writer_for_tests().unwrap();
        let json_docs = [
            serde_json::json!({"k8s.container.name": "prometheus", "val": "hello", "sub": {"a": 1, "b": 2}}),
            serde_json::json!({"k8s.container.name": "prometheus", "val": "hello", "suber": {"a": 1, "b": 2}}),
            serde_json::json!({"k8s.container.name": "prometheus", "val": "hello", "suber": {"a": "mixed", "b": 2}}),
        ];
        for json in json_docs {
            index_writer.add_document(doc!(json_field=>json)).unwrap();
        }
        index_writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        assert_eq!(searcher.num_docs(), 3);

        let segment_reader = &searcher.segment_readers()[0];
        let inverted_index = segment_reader.inverted_index(json_field).unwrap();
        let listed_fields: Vec<(String, Type)> = inverted_index
            .list_encoded_json_fields()
            .unwrap()
            .into_iter()
            .map(|field_space| (field_space.field_name, field_space.field_type))
            .collect();
        // `suber\u{1}a` appears twice because it holds an integer in one
        // document and a string in another.
        let expected_fields = [
            ("k8s.container.name", Type::Str),
            ("sub\u{1}a", Type::I64),
            ("sub\u{1}b", Type::I64),
            ("suber\u{1}a", Type::I64),
            ("suber\u{1}a", Type::Str),
            ("suber\u{1}b", Type::I64),
            ("val", Type::Str),
        ]
        .map(|(field_name, field_type)| (field_name.to_string(), field_type));
        assert_eq!(listed_fields, expected_fields);
    }

    /// Fields metadata with expand-dots enabled, all documents in one segment.
    #[test]
    fn test_json_fields_metadata_expanded_dots_one_segment() {
        let (expanded_dots, one_segment) = (true, true);
        test_json_fields_metadata(expanded_dots, one_segment);
    }

    /// Fields metadata with expand-dots enabled, documents spread over several
    /// segments.
    #[test]
    fn test_json_fields_metadata_expanded_dots_multi_segment() {
        let (expanded_dots, one_segment) = (true, false);
        test_json_fields_metadata(expanded_dots, one_segment);
    }

    /// Fields metadata with expand-dots disabled, all documents in one segment.
    #[test]
    fn test_json_fields_metadata_no_expanded_dots_one_segment() {
        let (expanded_dots, one_segment) = (false, true);
        test_json_fields_metadata(expanded_dots, one_segment);
    }

    /// Fields metadata with expand-dots disabled, documents spread over several
    /// segments.
    #[test]
    fn test_json_fields_metadata_no_expanded_dots_multi_segment() {
        let (expanded_dots, one_segment) = (false, false);
        test_json_fields_metadata(expanded_dots, one_segment);
    }

    /// Asserts that two optional sizes agree on presence and on whether they
    /// are greater than zero; the actual byte counts are not compared.
    #[track_caller]
    fn assert_size_eq(lhs: Option<ByteCount>, rhs: Option<ByteCount>) {
        let lhs_is_positive = lhs.map(|size| size > 0);
        let rhs_is_positive = rhs.map(|size| size > 0);
        assert_eq!(lhs_is_positive, rhs_is_positive);
    }

    /// Asserts that `expected` and `actual` have the same field name, type and
    /// stored flag, and that their postings, positions and fast field sizes
    /// agree in the sense of `assert_size_eq`.
    ///
    /// `term_dictionary_size` is not compared.
    #[track_caller]
    fn assert_field_metadata_eq_but_ignore_field_size(
        expected: &FieldMetadata,
        actual: &FieldMetadata,
    ) {
        assert_eq!(expected.field_name, actual.field_name);
        assert_eq!(expected.typ, actual.typ);
        assert_eq!(expected.stored, actual.stored);
        let size_pairs = [
            (expected.postings_size, actual.postings_size),
            (expected.positions_size, actual.positions_size),
            (expected.fast_size, actual.fast_size),
        ];
        for (expected_size, actual_size) in size_pairs {
            assert_size_eq(expected_size, actual_size);
        }
    }

    fn test_json_fields_metadata(expanded_dots: bool, one_segment: bool) {
        use pretty_assertions::assert_eq;
        let mut schema_builder = Schema::builder();
        let json_options: JsonObjectOptions =
            JsonObjectOptions::from(TEXT).set_fast(None).set_stored();
        let json_options = if expanded_dots {
            json_options.set_expand_dots_enabled()
        } else {
            json_options
        };
        schema_builder.add_json_field("json.confusing", json_options.clone());
        let json_field = schema_builder.add_json_field("json.shadow", json_options.clone());
        let json_field2 = schema_builder.add_json_field("json", json_options.clone());
        schema_builder.add_json_field("empty_json", json_options);
        let number_field = schema_builder.add_u64_field("numbers", FAST);
        schema_builder.add_u64_field("empty", FAST | INDEXED | STORED);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer = index.writer_for_tests().unwrap();
        let json =
            serde_json::json!({"k8s.container.name": "a", "val": "a", "sub": {"a": 1, "b": 1}});
        index_writer.add_document(doc!(json_field=>json)).unwrap();
        let json =
            serde_json::json!({"k8s.container.name": "a", "val": "a", "suber": {"a": 1, "b": 1}});
        if !one_segment {
            index_writer.commit().unwrap();
        }
        index_writer.add_document(doc!(json_field=>json)).unwrap();
        let json = serde_json::json!({"k8s.container.name": "a", "k8s.container.name": "a", "val": "a", "suber": {"a": "a", "b": 1}});
        index_writer
            .add_document(doc!(number_field => 50u64, json_field=>json, json_field2=>json!({"shadow": {"val": "a"}})))
            .unwrap();
        index_writer.commit().unwrap();
        let reader = index.reader().unwrap();

        let searcher = reader.searcher();
        assert_eq!(searcher.num_docs(), 3);

        let fields_metadata = index.fields_metadata().unwrap();

        let expected_fields = &[
            FieldMetadata {
                field_name: "empty".to_string(),
                stored: true,
                typ: Type::U64,
                term_dictionary_size: Some(0u64.into()),
                fast_size: Some(1u64.into()),
                postings_size: Some(0u64.into()),
                positions_size: Some(0u64.into()),
            },
            FieldMetadata {
                field_name: if expanded_dots {
                    "json.shadow.k8s.container.name".to_string()
                } else {
                    "json.shadow.k8s\\.container\\.name".to_string()
                },
                stored: true,
                typ: Type::Str,
                term_dictionary_size: Some(1u64.into()),
                fast_size: Some(1u64.into()),
                postings_size: Some(1u64.into()),
                positions_size: Some(1u64.into()),
            },
            FieldMetadata {
                field_name: "json.shadow.sub.a".to_string(),
                typ: Type::I64,
                stored: true,
                fast_size: Some(1u64.into()),
                term_dictionary_size: Some(1u64.into()),
                postings_size: Some(1u64.into()),
                positions_size: Some(1u64.into()),
            },
            FieldMetadata {
                field_name: "json.shadow.sub.b".to_string(),
                typ: Type::I64,
                stored: true,
                fast_size: Some(1u64.into()),
                term_dictionary_size: Some(1u64.into()),
                postings_size: Some(1u64.into()),
                positions_size: Some(1u64.into()),
            },
            FieldMetadata {
                field_name: "json.shadow.suber.a".to_string(),
                stored: true,
                typ: Type::I64,
                fast_size: Some(1u64.into()),
                term_dictionary_size: Some(1u64.into()),
                postings_size: Some(1u64.into()),
                positions_size: Some(1u64.into()),
            },
            FieldMetadata {
                field_name: "json.shadow.suber.a".to_string(),
                typ: Type::Str,
                stored: true,
                fast_size: Some(1u64.into()),
                term_dictionary_size: Some(1u64.into()),
                postings_size: Some(1u64.into()),
                positions_size: Some(1u64.into()),
            },
            FieldMetadata {
                field_name: "json.shadow.suber.b".to_string(),
                typ: Type::I64,
                stored: true,
                fast_size: Some(1u64.into()),
                term_dictionary_size: Some(1u64.into()),
                postings_size: Some(1u64.into()),
                positions_size: Some(1u64.into()),
            },
            FieldMetadata {
                field_name: "json.shadow.val".to_string(),
                typ: Type::Str,
                stored: true,
                fast_size: Some(1u64.into()),
                term_dictionary_size: Some(1u64.into()),
                postings_size: Some(1u64.into()),
                positions_size: Some(1u64.into()),
            },
            FieldMetadata {
                field_name: "numbers".to_string(),
                stored: false,
                typ: Type::U64,
                fast_size: Some(1u64.into()),
                term_dictionary_size: None,
                postings_size: None,
                positions_size: None,
            },
        ];
        assert_eq!(fields_metadata.len(), expected_fields.len());
        for (expected, value) in expected_fields.iter().zip(fields_metadata.iter()) {
            assert_field_metadata_eq_but_ignore_field_size(expected, value);
        }
        let query_parser = QueryParser::for_index(&index, vec![]);
        // Test if returned field name can be queried
        for indexed_field in fields_metadata.iter().filter(|meta| meta.is_indexed()) {
            let val = if indexed_field.typ == Type::Str {
                "a"
            } else {
                "1"
            };
            let query_str = &format!("{}:{}", indexed_field.field_name, val);
            let query = query_parser.parse_query(query_str).unwrap();
            let count_docs = searcher
                .search(&*query, &TopDocs::with_limit(2).order_by_score())
                .unwrap();
            if indexed_field.field_name.contains("empty") || indexed_field.typ == Type::Json {
                assert_eq!(count_docs.len(), 0);
            } else {
                assert!(!count_docs.is_empty(), "{}", indexed_field.field_name);
            }
        }
        // Test if returned field name can be used for aggregation
        for fast_field in fields_metadata
            .iter()
            .filter(|field_metadata| field_metadata.is_fast())
        {
            let agg_req_str = json!(
            {
              "termagg": {
                "terms": {
                  "field": fast_field.field_name,
                }
              }
            });

            let agg_req: Aggregations = serde_json::from_value(agg_req_str).unwrap();
            let collector = AggregationCollector::from_aggs(agg_req, Default::default());
            let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();
            let res = serde_json::to_value(agg_res).unwrap();
            if !fast_field.field_name.contains("empty") && fast_field.typ != Type::Json {
                assert!(
                    !res["termagg"]["buckets"].as_array().unwrap().is_empty(),
                    "{}",
                    fast_field.field_name
                );
            }
        }
    }

    #[test]
    fn test_json_field_shadowing_field_name_bug() {
        /// This test is only there to display a bug on addressing a field if it gets shadowed.
        /// The issue only occurs if the field name that shadows contains a dot.
        ///
        /// It happens independently of the `expand_dots` option, since that option does not
        /// affect the field name itself.
        use pretty_assertions::assert_eq;
        let mut schema_builder = Schema::builder();
        let json_options: JsonObjectOptions =
            JsonObjectOptions::from(TEXT).set_fast(None).set_stored();
        // let json_options = json_options.set_expand_dots_enabled();
        // Two JSON fields: "json.shadow" and "json". The path "shadow" inside the "json" field
        // therefore spells out the same dotted name as the "json.shadow" field itself.
        let json_field_shadow = schema_builder.add_json_field("json.shadow", json_options.clone());
        let json_field = schema_builder.add_json_field("json", json_options.clone());
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer = index.writer_for_tests().unwrap();
        // A single document: "json.shadow" holds {"val": "b"}, "json" holds {"shadow": {"val": "a"}}.
        index_writer
            .add_document(
                doc!(json_field_shadow=>json!({"val": "b"}), json_field=>json!({"shadow": {"val": "a"}})),
            )
            .unwrap();
        index_writer.commit().unwrap();
        let reader = index.reader().unwrap();

        let searcher = reader.searcher();

        // Pairs of (field name used for addressing, value expected to be found under it).
        let fields_and_vals = [
            ("json.shadow\u{1}val".to_string(), "a"), // Succeeds
            //("json.shadow.val".to_string(), "a"),   // Fails
            ("json.shadow.val".to_string(), "b"),
        ];

        let query_parser = QueryParser::for_index(&index, vec![]);
        // Test if field name can be queried
        for (indexed_field, val) in fields_and_vals.iter() {
            let query_str = &format!("{indexed_field}:{val}");
            let query = query_parser.parse_query(query_str).unwrap();
            let count_docs = searcher
                .search(&*query, &TopDocs::with_limit(2).order_by_score())
                .unwrap();
            assert!(!count_docs.is_empty(), "{indexed_field}:{val}");
        }
        // Test if field name can be used for aggregation
        for (field_name, val) in fields_and_vals.iter() {
            let agg_req_str = json!(
            {
              "termagg": {
                "terms": {
                  "field": field_name,
                }
              }
            });

            let agg_req: Aggregations = serde_json::from_value(agg_req_str).unwrap();
            let collector = AggregationCollector::from_aggs(agg_req, Default::default());
            let agg_res: AggregationResults = searcher.search(&AllQuery, &collector).unwrap();
            let res = serde_json::to_value(agg_res).unwrap();
            // The first bucket key of the terms aggregation must be the expected value.
            assert_eq!(
                res["termagg"]["buckets"].as_array().unwrap()[0]["key"]
                    .as_str()
                    .unwrap(),
                *val,
                "{}",
                field_name
            );
        }
    }
}


================================================
FILE: src/indexer/operation.rs
================================================
use crate::query::Weight;
use crate::schema::document::Document;
use crate::schema::{TantivyDocument, Term};
use crate::Opstamp;

/// Timestamped Delete operation.
///
/// Pairs the set of documents to delete (expressed as a [`Weight`]) with the
/// opstamp attached to the delete.
pub struct DeleteOperation {
    /// Operation stamp.
    /// It is used to check whether the delete operation
    /// applies to an added document operation.
    pub opstamp: Opstamp,
    /// Weight is used to define the set of documents to be deleted.
    pub target: Box<dyn Weight>,
}

/// Timestamped Add operation.
///
/// Generic over the document type `D`, which defaults to [`TantivyDocument`].
#[derive(Eq, PartialEq, Debug)]
pub struct AddOperation<D: Document = TantivyDocument> {
    /// Operation stamp.
    pub opstamp: Opstamp,
    /// Document to be added.
    pub document: D,
}

/// UserOperation is an enum type that encapsulates other operation types.
///
/// Generic over the document type `D`, which defaults to [`TantivyDocument`].
#[derive(Eq, PartialEq, Debug)]
pub enum UserOperation<D: Document = TantivyDocument> {
    /// Add operation, carrying the document to add.
    Add(D),
    /// Delete operation, carrying a [`Term`].
    /// NOTE(review): presumably the term identifies the documents to delete — confirm.
    Delete(Term),
}


================================================
FILE: src/indexer/path_to_unordered_id.rs
================================================
use fnv::FnvHashMap;

/// Identifier of a path, represented by an unsigned 32-bit integer.
///
/// Ids of this type are produced by `PathToUnorderedId::unordered_id_to_ordered_id`,
/// where they reflect the lexical order of the registered paths.
#[derive(Copy, Default, Clone, Debug, PartialEq, PartialOrd, Eq, Ord, Hash)]
pub struct OrderedPathId(u32);

impl OrderedPathId {
    /// Creates an `OrderedPathId` wrapping the given raw `u32` id.
    pub const fn from_ordered_id(field_id: u32) -> OrderedPathId {
        OrderedPathId(field_id)
    }

    /// Returns the raw `u32` wrapped by this id.
    ///
    /// NOTE(review): the previous doc stated the value uniquely identifies a path within a
    /// schema — the exact scope of uniqueness is not visible here; confirm.
    pub const fn path_id(self) -> u32 {
        self.0
    }
}
/// Wraps a raw `u32` into an `OrderedPathId` without any validation.
impl From<u32> for OrderedPathId {
    fn from(id: u32) -> Self {
        Self(id)
    }
}

/// Maps paths to ids handed out in order of first insertion ("unordered" ids).
///
/// The ids can later be translated into ids following the lexical order of the paths.
#[derive(Default)]
pub(crate) struct PathToUnorderedId {
    // Path -> unordered id. A new id equals the number of paths registered before it.
    map: FnvHashMap<String, u32>,
}

impl PathToUnorderedId {
    /// Returns the unordered id associated with `path`, registering the path first
    /// if it has not been seen yet.
    #[inline]
    pub(crate) fn get_or_allocate_unordered_id(&mut self, path: &str) -> u32 {
        match self.map.get(path).copied() {
            Some(known_id) => known_id,
            None => self.insert_new_path(path),
        }
    }

    /// Registers `path` under the next free id (the current number of paths) and returns it.
    ///
    /// Kept out of line and marked cold: only the first occurrence of a path lands here.
    #[cold]
    fn insert_new_path(&mut self, path: &str) -> u32 {
        let allocated_id = self.map.len() as u32;
        self.map.insert(path.to_string(), allocated_id);
        allocated_id
    }

    /// Returns ids which reflect the lexical order of the paths.
    ///
    /// The returned vec can be indexed with the unordered id to get the ordered id.
    pub(crate) fn unordered_id_to_ordered_id(&self) -> Vec<OrderedPathId> {
        let mut entries: Vec<(&str, u32)> = self
            .map
            .iter()
            .map(|(path, &unordered_id)| (path.as_str(), unordered_id))
            .collect();
        // Paths are unique map keys, so an unstable sort yields a deterministic order.
        entries.sort_unstable_by_key(|&(path, _)| path);
        let mut ordered_ids = vec![OrderedPathId::default(); entries.len()];
        for (rank, &(_, unordered_id)) in entries.iter().enumerate() {
            ordered_ids[unordered_id as usize] = OrderedPathId::from_ordered_id(rank as u32);
        }
        ordered_ids
    }

    /// Returns the paths so they can be queried by the ordered id (which is the index).
    pub(crate) fn ordered_id_to_path(&self) -> Vec<&str> {
        let mut sorted_paths: Vec<&str> = self.map.keys().map(|path| path.as_str()).collect();
        sorted_paths.sort_unstable();
        sorted_paths
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Checks id allocation, the unordered -> ordered translation and the reverse path lookup.
    #[test]
    fn path_to_unordered_test() {
        let terms = vec!["b", "a", "b", "c"];
        let mut path_to_id = PathToUnorderedId::default();

        // Ids are handed out in first-seen order; a repeated path gets its earlier id back.
        let mut ids: Vec<u32> = Vec::with_capacity(terms.len());
        for term in &terms {
            ids.push(path_to_id.get_or_allocate_unordered_id(term));
        }
        assert_eq!(ids, vec![0, 1, 0, 2]);

        // Translate to ids following the lexical order of the paths.
        let unordered_to_ordered = path_to_id.unordered_id_to_ordered_id();
        let ordered_ids: Vec<OrderedPathId> = ids
            .iter()
            .map(|&unordered_id| unordered_to_ordered[unordered_id as usize])
            .collect();
        assert_eq!(ordered_ids, vec![1.into(), 0.into(), 1.into(), 2.into()]);

        // Fetch terms
        let ordered_paths = path_to_id.ordered_id_to_path();
        let terms_fetched: Vec<&str> = ordered_ids
            .iter()
            .map(|ordered_id| ordered_paths[ordered_id.path_id() as usize])
            .collect();
        assert_eq!(terms_fetched, terms);
    }
}


================================================
FILE: src/indexer/prepared_commit.rs
================================================
use super::IndexWriter;
use crate::schema::document::Document;
use crate::{FutureResult, Opstamp, TantivyDocument};

/// A prepared commit.
///
/// Holds a mutable borrow of the `IndexWriter` together with the opstamp of the
/// commit and an optional payload, until it is either committed or aborted.
pub struct PreparedCommit<'a, D: Document = TantivyDocument> {
    // Writer the commit (or rollback) is applied through.
    index_writer: &'a mut IndexWriter<D>,
    // Optional payload handed to the segment updater when committing.
    payload: Option<String>,
    // Opstamp associated with this commit.
    opstamp: Opstamp,
}

impl<'a, D: Document> PreparedCommit<'a, D> {
    pub(crate) fn new(index_writer: &'a mut IndexWriter<D>, opstamp: Opstamp) -> Self {
        Self {
            index_writer,
            payload: None,
            opstamp,
        }
    }

    /// Returns the opstamp associated with the prepared commit.
    pub fn opstamp(&self) -> Opstamp {
        self.opstamp
    }

    /// Adds an arbitrary payload to the commit.
    pub fn set_payload(&mut self, payload: &str) {
        self.payload = Some(payload.to_string())
    }

    /// Rollbacks any change.
    pub fn abort(self) -> crate::Result<Opstamp> {
        self.index_writer.rollback()
    }

    /// Proceeds to commit.
    /// See `.commit_future()`.
    pub fn commit(self) -> crate::Result<Opstamp> {
        self.commit_future().wait()
    }

    /// Proceeds to commit.
    ///
    /// Unfortunately, contrary to what `PrepareCommit` may suggests,
    /// this operation is not at all really light.
    /// At this point deletes have not been flushed yet.
    pub fn commit_future(self) -> FutureResult<Opstamp> {
        info!("committing {}", self.opstamp);
        self.index_writer
            .segment_updater()
            .schedule_commit(self.opstamp, self.payload)
    }
}


================================================
FILE: src/indexer/segment_entry.rs
================================================
use std::fmt;

use common::BitSet;

use crate::index::{SegmentId, SegmentMeta};
use crate::indexer::delete_queue::DeleteCursor;

/// A segment entry describes the state of
/// a given segment, at a given instant.
///
/// In addition to segment `meta`,
/// it contains a few transient states
/// - `alive_bitset` is a bitset describing documents that were alive during the commit itself.
/// - `delete_cursor` is the position in the delete queue. Deletes happening before the cursor are
///   reflected either in the .del file or in the `alive_bitset`.
#[derive(Clone)]
pub struct SegmentEntry {
    // Metadata of the segment this entry describes.
    meta: SegmentMeta,
    // `None` when no alive bitset is attached to the entry.
    alive_bitset: Option<BitSet>,
    // Position of this segment in the delete queue.
    delete_cursor: DeleteCursor,
}

impl SegmentEntry {
    /// Creates a new `SegmentEntry` from its meta, delete cursor and optional alive bitset.
    pub fn new(
        segment_meta: SegmentMeta,
        delete_cursor: DeleteCursor,
        alive_bitset: Option<BitSet>,
    ) -> SegmentEntry {
        SegmentEntry {
            meta: segment_meta,
            alive_bitset,
            delete_cursor,
        }
    }

    /// Returns a reference to the segment entry's alive bitset, if it has one.
    ///
    /// NOTE(review): going by the field name and the struct-level documentation, the bitset
    /// describes documents that are alive rather than deleted ones — confirm.
    pub fn alive_bitset(&self) -> Option<&BitSet> {
        self.alive_bitset.as_ref()
    }

    /// Sets the `SegmentMeta` for this segment, replacing the previous one.
    pub fn set_meta(&mut self, segment_meta: SegmentMeta) {
        self.meta = segment_meta;
    }

    /// Returns a mutable reference to the segment entry's delete cursor.
    pub fn delete_cursor(&mut self) -> &mut DeleteCursor {
        &mut self.delete_cursor
    }

    /// Returns the segment id, as reported by the segment meta.
    pub fn segment_id(&self) -> SegmentId {
        self.meta.id()
    }

    /// Accessor to the `SegmentMeta`
    pub fn meta(&self) -> &SegmentMeta {
        &self.meta
    }
}

/// Debug output only shows the segment meta; the alive bitset and the delete cursor are omitted.
impl fmt::Debug for SegmentEntry {
    fn fmt(&self, formatter: &mut fmt::Formatter<'_>) -> fmt::Result {
        write!(formatter, "SegmentEntry({:?})", self.meta)
    }
}


================================================
FILE: src/indexer/segment_manager.rs
================================================
use std::collections::hash_set::HashSet;
use std::fmt::{self, Debug, Formatter};
use std::sync::{RwLock, RwLockReadGuard, RwLockWriteGuard};

use super::segment_register::SegmentRegister;
use crate::error::TantivyError;
use crate::index::{SegmentId, SegmentMeta};
use crate::indexer::delete_queue::DeleteCursor;
use crate::indexer::SegmentEntry;

/// The pair of registers managed by the `SegmentManager`:
/// one for uncommitted segments and one for committed segments.
#[derive(Default)]
struct SegmentRegisters {
    uncommitted: SegmentRegister,
    committed: SegmentRegister,
}

/// Which register a group of segments was found in.
#[derive(PartialEq, Eq)]
pub(crate) enum SegmentsStatus {
    /// All the segments belong to the committed register.
    Committed,
    /// All the segments belong to the uncommitted register.
    Uncommitted,
}

impl SegmentRegisters {
    /// Tells whether the given segments are all uncommitted or all committed.
    ///
    /// The uncommitted register is consulted first. When neither register holds every
    /// segment (a segment is missing, or the segments are spread over both registers, which
    /// should not happen if tantivy is used correctly), a warning is logged and `None` is
    /// returned.
    fn segments_status(&self, segment_ids: &[SegmentId]) -> Option<SegmentsStatus> {
        if self.uncommitted.contains_all(segment_ids) {
            return Some(SegmentsStatus::Uncommitted);
        }
        if self.committed.contains_all(segment_ids) {
            return Some(SegmentsStatus::Committed);
        }
        let committed_ids = self.committed.segment_ids();
        let uncommitted_ids = self.uncommitted.segment_ids();
        warn!(
            "segment_ids: {:?}, committed_ids: {:?}, uncommitted_ids {:?}",
            segment_ids, committed_ids, uncommitted_ids
        );
        None
    }
}

/// The segment manager stores the list of segments
/// as well as their state.
///
/// It guarantees the atomicity of the
/// changes (merges especially)
#[derive(Default)]
pub struct SegmentManager {
    // Committed and uncommitted registers, guarded together by a single lock.
    registers: RwLock<SegmentRegisters>,
}

/// Debug output lists both registers; formatting acquires the read lock.
impl Debug for SegmentManager {
    fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
        let lock = self.read();
        write!(
            f,
            "{{ uncommitted: {:?}, committed: {:?} }}",
            lock.uncommitted, lock.committed
        )
    }
}

impl SegmentManager {
    /// Creates a `SegmentManager` whose committed register is built from `segment_metas`
    /// (each paired with a clone of `delete_cursor`) and whose uncommitted register is empty.
    pub fn from_segments(
        segment_metas: Vec<SegmentMeta>,
        delete_cursor: &DeleteCursor,
    ) -> SegmentManager {
        SegmentManager {
            registers: RwLock::new(SegmentRegisters {
                uncommitted: SegmentRegister::default(),
                committed: SegmentRegister::new(segment_metas, delete_cursor),
            }),
        }
    }

    /// Returns the metas of the segments that are not listed in `in_merge_segment_ids`,
    /// as a `(committed, uncommitted)` pair.
    pub fn get_mergeable_segments(
        &self,
        in_merge_segment_ids: &HashSet<SegmentId>,
    ) -> (Vec<SegmentMeta>, Vec<SegmentMeta>) {
        let registers_lock = self.read();
        (
            registers_lock
                .committed
                .get_mergeable_segments(in_merge_segment_ids),
            registers_lock
                .uncommitted
                .get_mergeable_segments(in_merge_segment_ids),
        )
    }

    /// Returns all of the segment entries (committed or uncommitted)
    pub fn segment_entries(&self) -> Vec<SegmentEntry> {
        let registers_lock = self.read();
        let mut segment_entries = registers_lock.uncommitted.segment_entries();
        segment_entries.extend(registers_lock.committed.segment_entries());
        segment_entries
    }

    // Lock poisoning should never happen :
    // The lock is acquired and released within this class,
    // and the operations cannot panic.
    fn read(&self) -> RwLockReadGuard<'_, SegmentRegisters> {
        self.registers
            .read()
            .expect("Failed to acquire read lock on SegmentManager.")
    }

    // See the comment on `read` regarding lock poisoning.
    fn write(&self) -> RwLockWriteGuard<'_, SegmentRegisters> {
        self.registers
            .write()
            .expect("Failed to acquire write lock on SegmentManager.")
    }

    /// Removes every committed segment whose meta reports zero documents.
    fn remove_empty_segments(&self) {
        let mut registers_lock = self.write();
        // `segment_entries()` returns an owned snapshot, so removing entries from the
        // register while iterating over the snapshot is fine.
        registers_lock
            .committed
            .segment_entries()
            .iter()
            .filter(|segment| segment.meta().num_docs() == 0)
            .for_each(|segment| {
                registers_lock
                    .committed
                    .remove_segment(&segment.segment_id())
            });
    }

    /// Empties both the committed and the uncommitted registers.
    pub(crate) fn remove_all_segments(&self) {
        let mut registers_lock = self.write();
        registers_lock.committed.clear();
        registers_lock.uncommitted.clear();
    }

    /// Replaces the content of both registers: the uncommitted register ends up empty and
    /// the committed register contains exactly `segment_entries`.
    pub fn commit(&self, segment_entries: Vec<SegmentEntry>) {
        let mut registers_lock = self.write();
        registers_lock.committed.clear();
        registers_lock.uncommitted.clear();
        for segment_entry in segment_entries {
            registers_lock.committed.add_segment_entry(segment_entry);
        }
    }

    /// Returns the entries of the segments targeted by a merge.
    ///
    /// The uncommitted register is consulted first, then the committed one. This method
    /// only reads the registers; it does not modify them.
    ///
    /// Returns an error if some segments are missing, or if
    /// the `segment_ids` are not either all committed or all
    /// uncommitted.
    pub fn start_merge(&self, segment_ids: &[SegmentId]) -> crate::Result<Vec<SegmentEntry>> {
        let registers_lock = self.read();
        // Collecting into an `Option` yields `None` as soon as one id is missing from the
        // register, so membership test and retrieval happen in a single lookup per id.
        let entries_from = |register: &SegmentRegister| -> Option<Vec<SegmentEntry>> {
            segment_ids
                .iter()
                .map(|segment_id| register.get(segment_id))
                .collect()
        };
        let segment_entries = entries_from(&registers_lock.uncommitted)
            .or_else(|| entries_from(&registers_lock.committed));
        segment_entries.ok_or_else(|| {
            TantivyError::InvalidArgument(
                "Merge operation sent for segments that are not all uncommitted or committed."
                    .to_string(),
            )
        })
    }

    /// Adds a segment entry to the uncommitted register.
    pub fn add_segment(&self, segment_entry: SegmentEntry) {
        let mut registers_lock = self.write();
        registers_lock.uncommitted.add_segment_entry(segment_entry);
    }

    /// Replaces a list of segments by their equivalent merged segment, if any.
    ///
    /// Returns the status (committed or uncommitted) of the segments that were merged; the
    /// merged segment entry is added to that same register.
    ///
    /// Returns an `InvalidArgument` error if the merged segments are not all found in one
    /// register. This is not necessarily a bug, and can happen after a rollback for instance.
    pub(crate) fn end_merge(
        &self,
        before_merge_segment_ids: &[SegmentId],
        after_merge_segment_entry: Option<SegmentEntry>,
    ) -> crate::Result<SegmentsStatus> {
        let mut registers_lock = self.write();
        let segments_status = registers_lock
            .segments_status(before_merge_segment_ids)
            .ok_or_else(|| {
                warn!("couldn't find segment in SegmentManager");
                crate::TantivyError::InvalidArgument(
                    "The segments that were merged could not be found in the SegmentManager. This \
                     is not necessarily a bug, and can happen after a rollback for instance."
                        .to_string(),
                )
            })?;

        let target_register: &mut SegmentRegister = match segments_status {
            SegmentsStatus::Uncommitted => &mut registers_lock.uncommitted,
            SegmentsStatus::Committed => &mut registers_lock.committed,
        };
        for segment_id in before_merge_segment_ids {
            target_register.remove_segment(segment_id);
        }
        if let Some(entry) = after_merge_segment_entry {
            target_register.add_segment_entry(entry);
        }
        Ok(segments_status)
    }

    /// Returns the metas of the committed segments, after dropping the committed
    /// segments that contain no documents.
    pub fn committed_segment_metas(&self) -> Vec<SegmentMeta> {
        self.remove_empty_segments();
        let registers_lock = self.read();
        registers_lock.committed.segment_metas()
    }
}


================================================
FILE: src/indexer/segment_register.rs
================================================
use std::collections::{HashMap, HashSet};
use std::fmt::{self, Debug, Display, Formatter};

use crate::index::{SegmentId, SegmentMeta};
use crate::indexer::delete_queue::DeleteCursor;
use crate::indexer::segment_entry::SegmentEntry;

/// The segment register keeps track
/// of the list of segments, their size as well
/// as the state they are in.
///
/// It is consumed by indexes to get the list of
/// segments that are currently searchable,
/// and by the index merger to identify
/// merge candidates.
#[derive(Default)]
pub struct SegmentRegister {
    // Entries keyed by the id of the segment they describe.
    segment_states: HashMap<SegmentId, SegmentEntry>,
}

impl Debug for SegmentRegister {
    fn fmt(&self, f: &mut Formatter<'_>) -> Result<(), fmt::Error> {
        write!(f, "SegmentRegister(")?;
        for k in self.segment_states.keys() {
            write!(f, "{}, ", k.short_uuid_string())?;
        }
        write!(f, ")")?;
        Ok(())
    }
}
/// Prints `SegmentRegister(` followed by the short uuid of every registered segment
/// (each followed by `", "`) and a closing `)`.
impl Display for SegmentRegister {
    fn fmt(&self, f: &mut Formatter<'_>) -> Result<(), fmt::Error> {
        f.write_str("SegmentRegister(")?;
        self.segment_states
            .keys()
            .try_for_each(|segment_id| write!(f, "{}, ", segment_id.short_uuid_string()))?;
        f.write_str(")")
    }
}

impl SegmentRegister {
    pub fn clear(&mut self) {
        self.segment_states.clear();
    }

    pub fn get_mergeable_segments(
        &self,
        in_merge_segment_ids: &HashSet<SegmentId>,
    ) -> Vec<SegmentMeta> {
        self.segment_states
            .values()
            .filter(|segment_entry| !in_merge_segment_ids.contains(&segment_entry.segment_id()))
            .map(|segment_entry| segment_entry.meta().clone())
            .collect()
    }

    pub fn segment_ids(&self) -> Vec<SegmentId> {
        self.segment_states.keys().cloned().collect()
    }

    pub fn segment_entries(&self) -> Vec<SegmentEntry> {
        self.segment_states.values().cloned().collect()
    }

    pub fn segment_metas(&self) -> Vec<SegmentMeta> {
        self.segment_states
            .values()
            .map(|segment_entry| segment_entry.meta().clone())
            .collect()
    }

    pub fn contains_all(&self, segment_ids: &[SegmentId]) -> bool {
        segment_ids
            .iter()
            .all(|segment_id| self.segment_states.contains_key(segment_id))
    }

    pub fn add_segment_entry(&mut self, segment_entry: SegmentEntry) {
        let segment_id = segment_entry.segment_id();
        self.segment_states.insert(segment_id, segment_entry);
    }

    pub fn remove_segment(&mut self, segment_id: &SegmentId) {
        self.segment_states.remove(segment_id);
    }

    pub fn get(&self, segment_id: &SegmentId) -> Option<SegmentEntry> {
        self.segment_states.get(segment_id).cloned()
    }

    pub fn new(segment_metas: Vec<SegmentMeta>, delete_cursor: &DeleteCursor) -> SegmentRegister {
        let mut segment_states = HashMap::new();
        for segment_meta in segment_metas {
            let segment_id = segment_meta.id();
            let segment_entry = SegmentEntry::new(segment_meta, delete_cursor.clone(), None);
            segment_states.insert(segment_id, segment_entry);
        }
        SegmentRegister { segment_states }
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::index::SegmentMetaInventory;
    use crate::indexer::delete_queue::*;

    // Collects the ids of the segments currently held by the register.
    fn segment_ids(segment_register: &SegmentRegister) -> Vec<SegmentId> {
        segment_register
            .segment_metas()
            .into_iter()
            .map(|segment_meta| segment_meta.id())
            .collect()
    }

    // Adds two segments, removes both and adds a third one standing for their merge,
    // checking the register content along the way.
    #[test]
    fn test_segment_register() {
        let inventory = SegmentMetaInventory::default();
        let delete_queue = DeleteQueue::default();

        let mut segment_register = SegmentRegister::default();
        let segment_id_a = SegmentId::generate_random();
        let segment_id_b = SegmentId::generate_random();
        let segment_id_merged = SegmentId::generate_random();

        {
            let segment_meta = inventory.new_segment_meta(segment_id_a, 0u32);
            let segment_entry = SegmentEntry::new(segment_meta, delete_queue.cursor(), None);
            segment_register.add_segment_entry(segment_entry);
        }
        assert_eq!(segment_ids(&segment_register), vec![segment_id_a]);
        {
            let segment_meta = inventory.new_segment_meta(segment_id_b, 0u32);
            let segment_entry = SegmentEntry::new(segment_meta, delete_queue.cursor(), None);
            segment_register.add_segment_entry(segment_entry);
        }
        // Simulate the end of a merge: both inputs go away, the merged segment comes in.
        segment_register.remove_segment(&segment_id_a);
        segment_register.remove_segment(&segment_id_b);
        {
            let segment_meta_merged = inventory.new_segment_meta(segment_id_merged, 0u32);
            let segment_entry = SegmentEntry::new(segment_meta_merged, delete_queue.cursor(), None);
            segment_register.add_segment_entry(segment_entry);
        }
        assert_eq!(segment_ids(&segment_register), vec![segment_id_merged]);
    }
}


================================================
FILE: src/indexer/segment_serializer.rs
================================================
use common::TerminatingWrite;

use crate::directory::WritePtr;
use crate::fieldnorm::FieldNormsSerializer;
use crate::index::{Segment, SegmentComponent};
use crate::postings::InvertedIndexSerializer;
use crate::store::StoreWriter;

/// Segment serializer is in charge of laying out on disk
/// the data accumulated and sorted by the `SegmentWriter`.
pub struct SegmentSerializer {
    // Segment being written.
    segment: Segment,
    pub(crate) store_writer: StoreWriter,
    // Writer opened on the segment's `FastFields` component.
    fast_field_write: WritePtr,
    // `None` once the serializer has been extracted.
    fieldnorms_serializer: Option<FieldNormsSerializer>,
    postings_serializer: InvertedIndexSerializer,
}

impl SegmentSerializer {
    /// Creates a new `SegmentSerializer`.
    ///
    /// Opens the store, fast field and field norm components of `segment` for writing and
    /// opens the inverted index serializer. The doc store writer is configured from the
    /// index settings.
    ///
    /// # Errors
    ///
    /// Returns an error if any of the components cannot be opened or initialized.
    pub fn for_segment(mut segment: Segment) -> crate::Result<SegmentSerializer> {
        let settings = segment.index().settings().clone();
        let store_writer = {
            let store_write = segment.open_write(SegmentComponent::Store)?;
            StoreWriter::new(
                store_write,
                settings.docstore_compression,
                settings.docstore_blocksize,
                settings.docstore_compress_dedicated_thread,
            )?
        };

        let fast_field_write = segment.open_write(SegmentComponent::FastFields)?;

        let fieldnorms_write = segment.open_write(SegmentComponent::FieldNorms)?;
        let fieldnorms_serializer = FieldNormsSerializer::from_write(fieldnorms_write)?;

        let postings_serializer = InvertedIndexSerializer::open(&mut segment)?;
        Ok(SegmentSerializer {
            segment,
            store_writer,
            fast_field_write,
            fieldnorms_serializer: Some(fieldnorms_serializer),
            postings_serializer,
        })
    }

    /// Returns the memory usage reported by the store writer.
    ///
    /// The other components are not accounted for here.
    pub fn mem_usage(&self) -> usize {
        self.store_writer.mem_usage()
    }

    /// Accessor to the `Segment` being serialized.
    pub fn segment(&self) -> &Segment {
        &self.segment
    }

    /// Accessor to the `InvertedIndexSerializer` used for postings.
    pub fn get_postings_serializer(&mut self) -> &mut InvertedIndexSerializer {
        &mut self.postings_serializer
    }

    /// Accessor to the writer of the fast field component.
    pub fn get_fast_field_write(&mut self) -> &mut WritePtr {
        &mut self.fast_field_write
    }

    /// Extract the field norm serializer.
    ///
    /// Note the fieldnorms serializer can only be extracted once:
    /// subsequent calls return `None`.
    pub fn extract_fieldnorms_serializer(&mut self) -> Option<FieldNormsSerializer> {
        self.fieldnorms_serializer.take()
    }

    /// Accessor to the `StoreWriter`.
    pub fn get_store_writer(&mut self) -> &mut StoreWriter {
        &mut self.store_writer
    }

    /// Finalize the segment serialization.
    ///
    /// Closes the field norm serializer (unless it was extracted earlier), terminates the
    /// fast field writer, then closes the postings serializer and the store writer.
    /// The first failure is returned and the remaining components are not closed.
    pub fn close(mut self) -> crate::Result<()> {
        if let Some(fieldnorms_serializer) = self.extract_fieldnorms_serializer() {
            fieldnorms_serializer.close()?;
        }
        self.fast_field_write.terminate()?;
        self.postings_serializer.close()?;
        self.store_writer.close()?;
        Ok(())
    }
}


================================================
FILE: src/indexer/segment_updater.rs
================================================
use std::any::Any;
use std::borrow::BorrowMut;
use std::collections::HashSet;
use std::io::Write;
use std::ops::Deref;
use std::path::PathBuf;
use std::sync::atomic::{AtomicBool, Ordering};
use std::sync::{Arc, RwLock};

use rayon::{ThreadPool, ThreadPoolBuilder};

use super::segment_manager::SegmentManager;
use crate::core::META_FILEPATH;
use crate::directory::{Directory, DirectoryClone, GarbageCollectionResult};
use crate::fastfield::AliveBitSet;
use crate::index::{Index, IndexMeta, IndexSettings, Segment, SegmentId, SegmentMeta};
use crate::indexer::delete_queue::DeleteCursor;
use crate::indexer::index_writer::advance_deletes;
use crate::indexer::merge_operation::MergeOperationInventory;
use crate::indexer::merger::IndexMerger;
use crate::indexer::segment_manager::SegmentsStatus;
use crate::indexer::stamper::Stamper;
use crate::indexer::{
    DefaultMergePolicy, MergeCandidate, MergeOperation, MergePolicy, SegmentEntry,
    SegmentSerializer,
};
use crate::{FutureResult, Opstamp, TantivyError};

const PANIC_CAUGHT: &str = "Panic caught in merge thread";

/// Saves the index meta file.
///
/// This operation is atomic. Either:
/// - it fails, in which case an error is returned and `meta.json` remains untouched,
/// - it succeeds, and `meta.json` is written and flushed.
///
/// This method is not part of tantivy's public API.
pub(crate) fn save_metas(metas: &IndexMeta, directory: &dyn Directory) -> crate::Result<()> {
    info!("save metas");
    // Pretty-printed JSON, terminated by a trailing new line.
    let mut serialized_metas: Vec<u8> = serde_json::to_vec_pretty(metas)?;
    serialized_metas.write_all(b"\n")?;
    crate::fail_point!("save_metas", |msg| Err(crate::TantivyError::from(
        std::io::Error::new(
            std::io::ErrorKind::Other,
            msg.unwrap_or_else(|| "Undefined".to_string())
        )
    )));
    // The directory is synced before the meta file is atomically replaced.
    directory.sync_directory()?;
    directory.atomic_write(&META_FILEPATH, serialized_metas.as_slice())?;
    debug!("Saved metas {:?}", serde_json::to_string_pretty(&metas));
    Ok(())
}

// The segment update runner is in charge of processing all
// of the `SegmentUpdate`s.
//
// All this processing happens on a single thread
// consuming a common queue.
//
// We voluntarily pass a merge_operation ref to guarantee that
// the merge_operation is alive during the process.
//
// `SegmentUpdater` itself is only a handle: it wraps an
// `Arc<InnerSegmentUpdater>`, so all of its clones share the same state.
#[derive(Clone)]
pub(crate) struct SegmentUpdater(Arc<InnerSegmentUpdater>);

impl Deref for SegmentUpdater {
    type Target = InnerSegmentUpdater;

    #[inline]
    fn deref(&self) -> &Self::Target {
        &self.0
    }
}

/// Runs the garbage collection of the index directory.
///
/// The files considered useful to the index are supplied to the directory
/// through `SegmentUpdater::list_files`.
fn garbage_collect_files(
    segment_updater: SegmentUpdater,
) -> crate::Result<GarbageCollectionResult> {
    info!("Running garbage collection");
    // `directory_mut` requires a mutable `Index`, hence the local clone.
    let mut index_clone = segment_updater.index.clone();
    let list_useful_files = move || segment_updater.list_files();
    index_clone
        .directory_mut()
        .garbage_collect(list_useful_files)
}

/// Merges the segments described by `segment_entries` into one new segment.
///
/// Deletes are applied to every input segment up to `target_opstamp` before
/// the merge itself. Returns `Ok(None)` if the input segment metas report
/// zero documents in total.
///
/// This function runs in the calling thread and is computationally expensive.
fn merge(
    index: &Index,
    mut segment_entries: Vec<SegmentEntry>,
    target_opstamp: Opstamp,
) -> crate::Result<Option<SegmentEntry>> {
    let total_num_docs: u64 = segment_entries
        .iter()
        .map(|entry| entry.meta().num_docs() as u64)
        .sum();
    if total_num_docs == 0 {
        return Ok(None);
    }

    // The segment that will receive the merged data.
    let merged_segment = index.new_segment();

    // Bring every input segment up to date with the deletes, up to the target opstamp.
    for entry in segment_entries.iter_mut() {
        let segment = index.segment(entry.meta().clone());
        advance_deletes(segment, entry, target_opstamp)?;
    }

    // The merged entry reuses the delete cursor of the first input segment.
    let delete_cursor = segment_entries[0].delete_cursor().clone();

    let mut segments: Vec<Segment> = Vec::with_capacity(segment_entries.len());
    for entry in &segment_entries {
        segments.push(index.segment(entry.meta().clone()));
    }

    // An IndexMerger is like a "view" of our merged segments...
    let merger: IndexMerger = IndexMerger::open(index.schema(), segments.as_slice())?;

    // ... which we serialize into the new segment to perform the actual merge.
    let segment_serializer = SegmentSerializer::for_segment(merged_segment.clone())?;
    let num_docs = merger.write(segment_serializer)?;

    let segment_meta = index.new_segment_meta(merged_segment.id(), num_docs);
    let merged_entry = SegmentEntry::new(segment_meta, delete_cursor, None);
    Ok(Some(merged_entry))
}

/// Advanced: Merges a list of segments from different indices in a new index.
///
/// Returns `TantivyError` if the indices list is empty or their
/// schemas don't match.
///
/// `output_directory`: is assumed to be empty.
///
/// # Warning
/// This function does NOT check or take the `IndexWriter` is running. It is not
/// meant to work if you have an `IndexWriter` running for the origin indices, or
/// the destination `Index`.
#[doc(hidden)]
pub fn merge_indices<T: Into<Box<dyn Directory>>>(
    indices: &[Index],
    output_directory: T,
) -> crate::Result<Index> {
    if indices.is_empty() {
        // If there are no indices to merge, there is no need to do anything.
        return Err(crate::TantivyError::InvalidArgument(
            "No indices given to merge".to_string(),
        ));
    }

    let target_settings = indices[0].settings().clone();

    // let's check that all of the indices have the same index settings
    if indices
        .iter()
        .skip(1)
        .any(|index| index.settings() != &target_settings)
    {
        return Err(crate::TantivyError::InvalidArgument(
            "Attempt to merge indices with different index_settings".to_string(),
        ));
    }

    let mut segments: Vec<Segment> = Vec::new();
    for index in indices {
        segments.extend(index.searchable_segments()?);
    }

    let non_filter = segments.iter().map(|_| None).collect::<Vec<_>>();
    merge_filtered_segments(&segments, target_settings, non_filter, output_directory)
}

/// Advanced: Merges a list of segments from different indices in a new index.
/// Additionally, you can provide an alive bitset for each segment to ignore doc_ids.
///
/// Returns a `TantivyError` if the segments list is empty or if the segments'
/// schemas don't match.
///
/// `filter_doc_ids`: optional alive bitset for each segment, forwarded to
/// `IndexMerger::open_with_custom_alive_set`.
/// NOTE(review): presumably expected to hold exactly one entry per segment;
/// a length mismatch is not checked here — confirm how the merger handles it.
///
/// `output_directory`: is assumed to be empty.
///
/// The created index holds a single segment, its opstamp is `0`, and its
/// payload lists the ids of the merged segments.
///
/// # Warning
/// This function does NOT check whether an `IndexWriter` is running. It is not
/// meant to work if you have an `IndexWriter` running for the origin indices, or
/// the destination `Index`.
#[doc(hidden)]
pub fn merge_filtered_segments<T: Into<Box<dyn Directory>>>(
    segments: &[Segment],
    target_settings: IndexSettings,
    filter_doc_ids: Vec<Option<AliveBitSet>>,
    output_directory: T,
) -> crate::Result<Index> {
    if segments.is_empty() {
        // If there are no segments to merge, there is no need to do anything.
        return Err(crate::TantivyError::InvalidArgument(
            "No segments given to merge".to_string(),
        ));
    }

    let target_schema = segments[0].schema();

    // let's check that all of the segments have the same schema
    if segments
        .iter()
        .skip(1)
        .any(|segment| segment.schema() != target_schema)
    {
        return Err(crate::TantivyError::InvalidArgument(
            "Attempt to merge different schema indices".to_string(),
        ));
    }

    let mut merged_index = Index::create(
        output_directory,
        target_schema.clone(),
        target_settings.clone(),
    )?;
    let merged_segment = merged_index.new_segment();
    let merged_segment_id = merged_segment.id();
    let merger: IndexMerger =
        IndexMerger::open_with_custom_alive_set(merged_index.schema(), segments, filter_doc_ids)?;
    let segment_serializer = SegmentSerializer::for_segment(merged_segment)?;
    let num_docs = merger.write(segment_serializer)?;

    let segment_meta = merged_index.new_segment_meta(merged_segment_id, num_docs);

    // Space separated list of the ids of the merged segments.
    // `join` builds the string in one pass, whereas folding with `format!`
    // re-allocates the whole accumulator for every segment.
    let merged_segment_ids = segments
        .iter()
        .map(|segment| segment.meta().id().uuid_string())
        .collect::<Vec<_>>()
        .join(" ");
    let stats = format!("Segments Merge: [{merged_segment_ids}]");

    let index_meta = IndexMeta {
        index_settings: target_settings, // index_settings of all segments should be the same
        segments: vec![segment_meta],
        schema: target_schema,
        opstamp: 0u64,
        payload: Some(stats),
    };

    // save the meta.json
    save_metas(&index_meta, merged_index.directory_mut())?;

    Ok(merged_index)
}

/// State shared by all the clones of a `SegmentUpdater`.
pub(crate) struct InnerSegmentUpdater {
    // we keep a copy of the current active IndexMeta to
    // avoid loading the file every time we need it in the
    // `SegmentUpdater`.
    //
    // This should be up to date as all update happen through
    // the unique active `SegmentUpdater`.
    active_index_meta: RwLock<Arc<IndexMeta>>,
    // Thread pool running the tasks submitted through `schedule_task`.
    // It is built with a single thread in `SegmentUpdater::create`.
    pool: ThreadPool,
    // Thread pool on which `start_merge` spawns the merges themselves.
    merge_thread_pool: ThreadPool,

    index: Index,
    segment_manager: SegmentManager,
    // Current merge policy, see `get_merge_policy` / `set_merge_policy`.
    merge_policy: RwLock<Arc<dyn MergePolicy>>,
    // Set by `kill`, read by `is_alive`.
    killed: AtomicBool,
    stamper: Stamper,
    // Inventory in which the `MergeOperation`s created by this updater are registered.
    merge_operations: MergeOperationInventory,
}

impl SegmentUpdater {
    /// Creates the `SegmentUpdater` of `index`.
    ///
    /// The segment manager is initialized from the searchable segments of the
    /// index, and the active index meta from the metas currently saved.
    /// Two thread pools are built: a single-threaded one for the segment updater
    /// tasks, and one configured with `num_merge_threads` threads for the merges.
    /// The merge policy defaults to `DefaultMergePolicy`.
    ///
    /// # Errors
    /// Returns an error if the segment metas or the index meta cannot be loaded,
    /// or a `SystemError` if one of the thread pools cannot be built.
    pub fn create(
        index: Index,
        stamper: Stamper,
        delete_cursor: &DeleteCursor,
        num_merge_threads: usize,
    ) -> crate::Result<SegmentUpdater> {
        let segments = index.searchable_segment_metas()?;
        let segment_manager = SegmentManager::from_segments(segments, delete_cursor);
        let pool = ThreadPoolBuilder::new()
            .thread_name(|_| "segment_updater".to_string())
            .num_threads(1)
            .build()
            .map_err(|_| {
                crate::TantivyError::SystemError(
                    "Failed to spawn segment updater thread".to_string(),
                )
            })?;
        let merge_thread_pool = ThreadPoolBuilder::new()
            .thread_name(|i| format!("merge_thread_{i}"))
            .num_threads(num_merge_threads)
            .panic_handler(move |panic| {
                // We don't print the panic content itself,
                // it is already printed during the unwinding.
                //
                // Panics caught in `start_merge` are re-raised with the `PANIC_CAUGHT`
                // payload. Every other payload is an uncaught panic, whatever its
                // type: a formatted `panic!` carries a `String`, not a `&str`, and
                // must be reported too.
                let was_caught = matches!(
                    panic.downcast_ref::<&str>(),
                    Some(message) if *message == PANIC_CAUGHT
                );
                if !was_caught {
                    error!("uncaught merge panic")
                }
            })
            .build()
            .map_err(|_| {
                crate::TantivyError::SystemError(
                    "Failed to spawn segment merging thread".to_string(),
                )
            })?;
        let index_meta = index.load_metas()?;
        Ok(SegmentUpdater(Arc::new(InnerSegmentUpdater {
            active_index_meta: RwLock::new(Arc::new(index_meta)),
            pool,
            merge_thread_pool,
            index,
            segment_manager,
            merge_policy: RwLock::new(Arc::new(DefaultMergePolicy::default())),
            killed: AtomicBool::new(false),
            stamper,
            merge_operations: Default::default(),
        })))
    }

    /// Returns a shared handle to the current merge policy.
    ///
    /// # Panics
    /// Panics if the merge policy lock is poisoned.
    pub fn get_merge_policy(&self) -> Arc<dyn MergePolicy> {
        let policy_guard = self.merge_policy.read().unwrap();
        Arc::clone(&*policy_guard)
    }

    /// Replaces the current merge policy with `merge_policy`.
    ///
    /// # Panics
    /// Panics if the merge policy lock is poisoned.
    pub fn set_merge_policy(&self, merge_policy: Box<dyn MergePolicy>) {
        // The conversion happens before the write lock is taken.
        let shared_policy: Arc<dyn MergePolicy> = Arc::from(merge_policy);
        let mut policy_slot = self.merge_policy.write().unwrap();
        *policy_slot = shared_policy;
    }

    /// Spawns `task` on the segment updater thread pool and returns a
    /// `FutureResult` that receives its outcome.
    ///
    /// If the segment updater has been killed, the task is not run and the
    /// returned `FutureResult` carries a `SystemError`.
    fn schedule_task<T: 'static + Send, F: FnOnce() -> crate::Result<T> + 'static + Send>(
        &self,
        task: F,
    ) -> FutureResult<T> {
        if self.is_alive() {
            let (scheduled_result, result_sender) = FutureResult::create(
                "A segment_updater future did not succeed. This should never happen.",
            );
            self.pool.spawn(move || {
                // A failure to send the result is deliberately ignored.
                let _ = result_sender.send(task());
            });
            scheduled_result
        } else {
            crate::TantivyError::SystemError("Segment updater killed".to_string()).into()
        }
    }

    pub fn schedule_add_segment(&self, segment_entry: SegmentEntry) -> FutureResult<()> {
        let segment_updater = self.clone();
        self.schedule_task(move || {
            segment_updater.segment_manager.add_segment(segment_entry);
            segment_updater.consider_merge_options();
            Ok(())
        })
    }

    /// Asks the `SegmentManager` to remove all of its segments.
    pub(crate) fn remove_all_segments(&self) {
        let segment_manager = &self.segment_manager;
        segment_manager.remove_all_segments();
    }

    /// Marks the segment updater as killed.
    ///
    /// From then on, `is_alive` returns `false`.
    pub fn kill(&mut self) {
        let killed_flag = &self.killed;
        killed_flag.store(true, Ordering::Release);
    }

    /// Returns `true` as long as `kill` has not been called.
    pub fn is_alive(&self) -> bool {
        let was_killed = self.killed.load(Ordering::Acquire);
        !was_killed
    }

    /// Applies the deletes up to `target_opstamp` to all segments.
    ///
    /// The method works on copies of the segment entries obtained from the
    /// segment manager, and returns them updated with the delete information.
    fn purge_deletes(&self, target_opstamp: Opstamp) -> crate::Result<Vec<SegmentEntry>> {
        let mut updated_entries = self.segment_manager.segment_entries();
        for entry in updated_entries.iter_mut() {
            let segment = self.index.segment(entry.meta().clone());
            advance_deletes(segment, entry, target_opstamp)?;
        }
        Ok(updated_entries)
    }

    /// Saves a `meta.json` listing the committed segments, with the given
    /// `opstamp` and `commit_message` as payload, then refreshes the cached
    /// active index meta.
    ///
    /// Does nothing (and returns `Ok(())`) if the segment updater was killed.
    pub fn save_metas(
        &self,
        opstamp: Opstamp,
        commit_message: Option<String>,
    ) -> crate::Result<()> {
        if !self.is_alive() {
            return Ok(());
        }
        let index = &self.index;
        let directory = index.directory();
        let mut committed_segment_metas = self.segment_manager.committed_segment_metas();

        // Segments are sorted by decreasing `max_doc`.
        // This is an heuristic to make multithreading more efficient.
        //
        // This is not done at the searcher level because of a use case
        // involving a large static index dispatched over 5 SSD drives:
        // a `UnionDirectory` makes it possible to read from these 5 different
        // drives and creates a meta.json on the fly. In order to optimize the
        // throughput, it creates a lasagna of segments from the different drives
        // (Segment 1 from disk 1, Segment 1 from disk 2, etc.).
        committed_segment_metas.sort_by_key(|meta| std::cmp::Reverse(meta.max_doc()));

        let index_meta = IndexMeta {
            index_settings: index.settings().clone(),
            segments: committed_segment_metas,
            schema: index.schema(),
            opstamp,
            payload: commit_message,
        };
        // TODO add context to the error.
        save_metas(&index_meta, directory.box_clone().borrow_mut())?;
        self.store_meta(&index_meta);
        Ok(())
    }

    /// Schedules a garbage collection of the index files on the segment
    /// updater thread pool.
    pub fn schedule_garbage_collect(&self) -> FutureResult<GarbageCollectionResult> {
        let updater = self.clone();
        let garbage_collect_task = move || garbage_collect_files(updater);
        self.schedule_task(garbage_collect_task)
    }

    /// Lists the files that are useful to the index: the files of all the
    /// segment metas known to the index, plus the meta file itself.
    ///
    /// This does not include lock files, or files that are obsolete
    /// but have not yet been deleted by the garbage collector.
    fn list_files(&self) -> HashSet<PathBuf> {
        let mut useful_files: HashSet<PathBuf> = HashSet::new();
        for segment_meta in self.index.list_all_segment_metas() {
            useful_files.extend(segment_meta.list_files());
        }
        useful_files.insert(META_FILEPATH.to_path_buf());
        useful_files
    }

    pub(crate) fn schedule_commit(
        &self,
        opstamp: Opstamp,
        payload: Option<String>,
    ) -> FutureResult<Opstamp> {
        let segment_updater: SegmentUpdater = self.clone();
        self.schedule_task(move || {
            let segment_entries = segment_updater.purge_deletes(opstamp)?;
            segment_updater.segment_manager.commit(segment_entries);
            segment_updater.save_metas(opstamp, payload)?;
            let _ = garbage_collect_files(segment_updater.clone());
            segment_updater.consider_merge_options();
            Ok(opstamp)
        })
    }

    /// Replaces the cached active index meta with a copy of `index_meta`.
    ///
    /// # Panics
    /// Panics if the active index meta lock is poisoned.
    fn store_meta(&self, index_meta: &IndexMeta) {
        // The copy is made before the write lock is taken.
        let fresh_meta = Arc::new(index_meta.clone());
        let mut active_meta = self.active_index_meta.write().unwrap();
        *active_meta = fresh_meta;
    }

    /// Returns a shared handle to the cached active index meta.
    ///
    /// # Panics
    /// Panics if the active index meta lock is poisoned.
    fn load_meta(&self) -> Arc<IndexMeta> {
        let active_meta = self.active_index_meta.read().unwrap();
        Arc::clone(&*active_meta)
    }

    /// Creates a `MergeOperation` for `segment_ids`, registered in the merge
    /// operation inventory, targeting the opstamp of the cached active index meta.
    pub(crate) fn make_merge_operation(&self, segment_ids: &[SegmentId]) -> MergeOperation {
        let target_opstamp = self.load_meta().opstamp;
        let owned_segment_ids = segment_ids.to_vec();
        MergeOperation::new(&self.merge_operations, target_opstamp, owned_segment_ids)
    }

    // Starts a merge operation.
    //
    // The segments are first marked as being merged in the `SegmentManager`, from the calling
    // thread. The merge itself is then spawned on the merge thread pool: this function does not
    // wait for the merge to terminate.
    //
    // The returned `FutureResult` resolves to the actual outcome of the merge operation:
    // `Some(SegmentMeta)` describing the merged segment, or `None` if the merge did not produce
    // any segment.
    //
    // If for some reason the merge operation could not be started, the returned `FutureResult`
    // carries the error.
    //
    // At this point an error is not necessarily the sign of a malfunction.
    // (e.g. A rollback could have happened, between the instant when the merge operation was
    // suggested and the moment when it ended up being executed.)
    //
    // `segment_ids` is required to be non-empty: the function panics otherwise.
    pub fn start_merge(
        &self,
        merge_operation: MergeOperation,
    ) -> FutureResult<Option<SegmentMeta>> {
        assert!(
            !merge_operation.segment_ids().is_empty(),
            "Segment_ids cannot be empty."
        );

        let segment_updater = self.clone();
        let segment_entries: Vec<SegmentEntry> = match self
            .segment_manager
            .start_merge(merge_operation.segment_ids())
        {
            Ok(segment_entries) => segment_entries,
            Err(err) => {
                warn!(
                    "Starting the merge failed for the following reason. This is not fatal. {err}"
                );
                return err.into();
            }
        };

        info!("Starting merge  - {:?}", merge_operation.segment_ids());

        let (scheduled_result, merging_future_send) =
            FutureResult::create("Merge operation failed.");

        self.merge_thread_pool.spawn(move || {
            // The fact that `merge_operation` is moved here is important.
            // Its lifetime is used to track how many merging threads are currently running,
            // as well as which segments are currently in merge and therefore should not be
            // candidates for another merge.
            let merge_panic_res = std::panic::catch_unwind(std::panic::AssertUnwindSafe(|| {
                merge(
                    &segment_updater.index,
                    segment_entries,
                    merge_operation.target_opstamp(),
                )
            }));
            let merge_res = match merge_panic_res {
                Ok(merge_res) => merge_res,
                Err(panic_err) => {
                    // Panic payloads are usually a `&str` or a `String`.
                    let panic_str = if let Some(msg) = panic_err.downcast_ref::<&str>() {
                        *msg
                    } else if let Some(msg) = panic_err.downcast_ref::<String>() {
                        msg.as_str()
                    } else {
                        "UNKNOWN"
                    };
                    // Report the panic to whoever is waiting on the merge future.
                    let _send_result = merging_future_send.send(Err(TantivyError::SystemError(
                        format!("Merge thread panicked: {panic_str}"),
                    )));
                    // Resume unwinding because we forced unwind safety with
                    // `std::panic::AssertUnwindSafe`. Use a specific message so
                    // the panic_handler can double check that we properly caught the panic.
                    let boxed_panic_message: Box<dyn Any + Send> = Box::new(PANIC_CAUGHT);
                    std::panic::resume_unwind(boxed_panic_message);
                }
            };
            match merge_res {
                Ok(after_merge_segment_entry) => {
                    // `end_merge` blocks until the segment updater has processed the outcome.
                    let res = segment_updater.end_merge(merge_operation, after_merge_segment_entry);
                    let _send_result = merging_future_send.send(res);
                }
                Err(merge_error) => {
                    warn!(
                        "Merge of {:?} was cancelled: {:?}",
                        merge_operation.segment_ids().to_vec(),
                        merge_error
                    );
                    // In tests, a failed merge is turned into a panic.
                    if cfg!(test) {
                        panic!("{merge_error:?}");
                    }
                    let _send_result = merging_future_send.send(Err(merge_error));
                }
            }
        });

        scheduled_result
    }

    /// Returns the segments that are candidates for a merge, as a
    /// `(committed, uncommitted)` pair.
    ///
    /// The ids of the segments currently involved in a merge operation are
    /// handed over to the `SegmentManager`.
    pub(crate) fn get_mergeable_segments(&self) -> (Vec<SegmentMeta>, Vec<SegmentMeta>) {
        let segment_ids_in_merge: HashSet<SegmentId> = self.merge_operations.segment_in_merge();
        let segment_manager = &self.segment_manager;
        segment_manager.get_mergeable_segments(&segment_ids_in_merge)
    }

    fn consider_merge_options(&self) {
        let (mut committed_segments, mut uncommitted_segments) = self.get_mergeable_segments();
        if committed_segments.len() == 1 && committed_segments[0].num_deleted_docs() == 0 {
            committed_segments.clear();
        }
        if uncommitted_segments.len() == 1 && uncommitted_segments[0].num_deleted_docs() == 0 {
            uncommitted_segments.clear();
        }

        // Committed segments cannot be merged with uncommitted_segments.
        // We therefore consider merges using these two sets of segments independently.
        let merge_policy = self.get_merge_policy();

        let current_opstamp = self.stamper.stamp();
        let mut merge_candidates: Vec<MergeOperation> = merge_policy
            .compute_merge_candidates(&uncommitted_segments)
            .into_iter()
            .map(|merge_candidate| {
                MergeOperation::new(&self.merge_operations, current_opstamp, merge_candidate.0)
            })
            .collect();

        let commit_opstamp = self.load_meta().opstamp;
        let committed_merge_candidates = merge_policy
            .compute_merge_candidates(&committed_segments)
            .into_iter()
            .map(|merge_candidate: MergeCandidate| {
                MergeOperation::new(&self.merge_operations, commit_opstamp, merge_candidate.0)
            });
        merge_candidates.extend(committed_merge_candidates);

        for merge_operation in merge_candidates {
            // If a merge cannot be started this is not a fatal error.
            // We do log a warning in `start_merge`.
            drop(self.start_merge(merge_operation));
        }
    }

    /// Queues an `end_merge` task in the segment updater and blocks until it is
    /// successfully processed.
    ///
    /// The task brings the merged segment (if any) up to date with the deletes
    /// committed while the merge was running, registers the outcome of the merge
    /// in the segment manager, saves the metas again if the merged segments were
    /// committed, considers new merge options and runs a garbage collection.
    ///
    /// Returns the meta of the merged segment as it was when this function was
    /// called, or `None` if `after_merge_segment_entry` is `None`.
    fn end_merge(
        &self,
        merge_operation: MergeOperation,
        mut after_merge_segment_entry: Option<SegmentEntry>,
    ) -> crate::Result<Option<SegmentMeta>> {
        let segment_updater = self.clone();
        // Captured before the entry is moved into the task.
        let after_merge_segment_meta = after_merge_segment_entry
            .as_ref()
            .map(|after_merge_segment_entry| after_merge_segment_entry.meta().clone());
        self.schedule_task(move || {
            info!(
                "End merge {:?}",
                after_merge_segment_entry.as_ref().map(|entry| entry.meta())
            );
            {
                if let Some(after_merge_segment_entry) = after_merge_segment_entry.as_mut() {
                    // Deletes and commits could have happened as we were merging.
                    // We need to make sure we are up to date with deletes before accepting the
                    // segment.
                    let mut delete_cursor = after_merge_segment_entry.delete_cursor().clone();
                    if let Some(delete_operation) = delete_cursor.get() {
                        let committed_opstamp = segment_updater.load_meta().opstamp;
                        if delete_operation.opstamp < committed_opstamp {
                            // We are not up to date! Let's create a new tombstone file for our
                            // freshly created split.
                            let index = &segment_updater.index;
                            let segment = index.segment(after_merge_segment_entry.meta().clone());
                            if let Err(advance_deletes_err) = advance_deletes(
                                segment,
                                after_merge_segment_entry,
                                committed_opstamp,
                            ) {
                                error!(
                                    "Merge of {:?} was cancelled (advancing deletes failed): {:?}",
                                    merge_operation.segment_ids(),
                                    advance_deletes_err
                                );
                                // `merge_operations` are tracked. As it is dropped,
                                // the segment_ids will be available again for merge.
                                return Err(advance_deletes_err);
                            }
                        }
                    }
                }
                let previous_metas = segment_updater.load_meta();
                let segments_status = segment_updater
                    .segment_manager
                    .end_merge(merge_operation.segment_ids(), after_merge_segment_entry)?;

                // The opstamp and payload of the last saved metas are reused as is.
                if segments_status == SegmentsStatus::Committed {
                    segment_updater
                        .save_metas(previous_metas.opstamp, previous_metas.payload.clone())?;
                }

                segment_updater.consider_merge_options();
            } // we drop all possible handle to a now useless `SegmentMeta`.

            // Garbage collection is best effort: its outcome is ignored.
            let _ = garbage_collect_files(segment_updater);
            Ok(())
        })
        .wait()?;
        Ok(after_merge_segment_meta)
    }

    /// Waits for the current merging threads.
    ///
    /// Upon termination of the current merging threads,
    /// merge opportunities may appear.
    ///
    /// We keep waiting until the merge policy judges that
    /// no opportunity is available.
    ///
    /// Note that it is not required to call this
    /// method in your application.
    /// Terminating your application without letting
    /// merges terminate is perfectly safe.
    ///
    /// Obsolete files will eventually be cleaned up
    /// by the directory garbage collector.
    pub fn wait_merging_thread(&self) -> crate::Result<()> {
        let running_merges = &self.merge_operations;
        running_merges.wait_until_empty();
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use super::merge_indices;
    use crate::collector::TopDocs;
    use crate::directory::RamDirectory;
    use crate::fastfield::AliveBitSet;
    use crate::index::{SegmentId, SegmentMetaInventory};
    use crate::indexer::merge_policy::tests::MergeWheneverPossible;
    use crate::indexer::merger::IndexMerger;
    use crate::indexer::segment_updater::merge_filtered_segments;
    use crate::query::QueryParser;
    use crate::schema::*;
    use crate::{Directory, DocAddress, Index, Segment};

    #[test]
    fn test_segment_sort_large_max_doc() {
        // Regression test: a sort key of `-(max_doc as i32)` overflows for
        // max_doc >= 2^31. Using `std::cmp::Reverse` avoids this.
        let inventory = SegmentMetaInventory::default();
        let largest_max_doc = (1u32 << 31) - 1;
        let mut metas = [100, largest_max_doc, 50_000]
            .map(|max_doc| inventory.new_segment_meta(SegmentId::generate_random(), max_doc));
        metas.sort_by_key(|meta| std::cmp::Reverse(meta.max_doc()));
        let sorted_max_docs: Vec<u32> = metas.iter().map(|meta| meta.max_doc()).collect();
        assert_eq!(sorted_max_docs, vec![largest_max_doc, 50_000, 100]);
    }

    #[test]
    fn test_delete_during_merge() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());

        // writing the segments
        let mut index_writer = index.writer_for_tests()?;
        index_writer.set_merge_policy(Box::new(MergeWheneverPossible));

        // Two commits of 200 docs each...
        for (first_text, second_text) in [("a", "b"), ("c", "d")] {
            for _ in 0..100 {
                index_writer.add_document(doc!(text_field=>first_text))?;
                index_writer.add_document(doc!(text_field=>second_text))?;
            }
            index_writer.commit()?;
        }

        // ... followed by a commit of 2 docs.
        index_writer.add_document(doc!(text_field=>"e"))?;
        index_writer.add_document(doc!(text_field=>"f"))?;
        index_writer.commit()?;

        // Deleting "a" removes 100 of the 402 docs.
        index_writer.delete_term(Term::from_field_text(text_field, "a"));
        index_writer.commit()?;

        let reader = index.reader()?;
        assert_eq!(reader.searcher().num_docs(), 302);

        index_writer.wait_merging_threads()?;

        reader.reload()?;
        let searcher = reader.searcher();
        assert_eq!(searcher.segment_readers().len(), 1);
        assert_eq!(searcher.num_docs(), 302);
        Ok(())
    }

    #[test]
    fn delete_all_docs_min() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());

        // writing the segment
        let mut index_writer = index.writer_for_tests()?;

        for _ in 0..10 {
            index_writer.add_document(doc!(text_field=>"a"))?;
            index_writer.add_document(doc!(text_field=>"b"))?;
        }
        index_writer.commit()?;

        // docs exist, should have at least 1 segment
        let segment_ids_before_deletes = index.searchable_segment_ids()?;
        assert!(!segment_ids_before_deletes.is_empty());

        // Delete every document, one term and one commit at a time.
        for term_text in ["a", "b"] {
            index_writer.delete_term(Term::from_field_text(text_field, term_text));
            index_writer.commit()?;
        }

        index_writer.wait_merging_threads()?;

        let reader = index.reader()?;
        assert_eq!(reader.searcher().num_docs(), 0);

        let segment_ids_after_deletes = index.searchable_segment_ids()?;
        assert!(segment_ids_after_deletes.is_empty());

        reader.reload()?;
        assert_eq!(reader.searcher().num_docs(), 0);
        // empty segments should be erased
        assert!(index.searchable_segment_metas()?.is_empty());
        assert!(reader.searcher().segment_readers().is_empty());

        Ok(())
    }

    #[test]
    fn delete_all_docs() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());

        // writing the segments
        let mut index_writer = index.writer_for_tests()?;

        // Two commits of 200 docs each...
        for (first_text, second_text) in [("a", "b"), ("c", "d")] {
            for _ in 0..100 {
                index_writer.add_document(doc!(text_field=>first_text))?;
                index_writer.add_document(doc!(text_field=>second_text))?;
            }
            index_writer.commit()?;
        }

        // ... followed by a commit of 2 docs.
        index_writer.add_document(doc!(text_field=>"e"))?;
        index_writer.add_document(doc!(text_field=>"f"))?;
        index_writer.commit()?;

        // docs exist, should have at least 1 segment
        let segment_ids_before_deletes = index.searchable_segment_ids()?;
        assert!(!segment_ids_before_deletes.is_empty());

        // Delete every document, one term and one commit at a time.
        for term_text in ["a", "b", "c", "d", "e", "f"] {
            index_writer.delete_term(Term::from_field_text(text_field, term_text));
            index_writer.commit()?;
        }

        index_writer.wait_merging_threads()?;

        let reader = index.reader()?;
        assert_eq!(reader.searcher().num_docs(), 0);

        let segment_ids_after_deletes = index.searchable_segment_ids()?;
        assert!(segment_ids_after_deletes.is_empty());

        reader.reload()?;
        assert_eq!(reader.searcher().num_docs(), 0);
        // empty segments should be erased
        assert!(index.searchable_segment_metas()?.is_empty());
        assert!(reader.searcher().segment_readers().is_empty());

        Ok(())
    }

    #[test]
    fn test_remove_all_segments() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());

        // Commit 200 documents so that there is something to remove.
        let mut index_writer = index.writer_for_tests()?;
        for _ in 0..100 {
            index_writer.add_document(doc!(text_field=>"a"))?;
            index_writer.add_document(doc!(text_field=>"b"))?;
        }
        index_writer.commit()?;

        // After removing all segments, the segment manager must report no entries.
        let segment_updater = index_writer.segment_updater();
        segment_updater.remove_all_segments();
        assert!(segment_updater.segment_manager.segment_entries().is_empty());
        Ok(())
    }

    #[test]
    fn test_merge_segments() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let schema = schema_builder.build();

        // Three independent indices sharing the same schema. Each one receives two
        // commits: 200 documents ("fizz"/"buzz"), then 2000 documents ("foo"/"bar").
        let indices = (0..3)
            .map(|_| -> crate::Result<Index> {
                let index = Index::create_in_ram(schema.clone());
                let mut index_writer = index.writer_for_tests()?;

                for _ in 0..100 {
                    index_writer.add_document(doc!(text_field=>"fizz"))?;
                    index_writer.add_document(doc!(text_field=>"buzz"))?;
                }
                index_writer.commit()?;

                for _ in 0..1000 {
                    index_writer.add_document(doc!(text_field=>"foo"))?;
                    index_writer.add_document(doc!(text_field=>"bar"))?;
                }
                index_writer.commit()?;

                Ok(index)
            })
            .collect::<crate::Result<Vec<Index>>>()?;
        assert_eq!(indices.len(), 3);

        let output_directory: Box<dyn Directory> = Box::<RamDirectory>::default();
        let merged_index = merge_indices(&indices, output_directory)?;
        assert_eq!(merged_index.schema(), schema);

        // Everything must end up in a single segment.
        let merged_segments = merged_index.searchable_segments()?;
        assert_eq!(merged_segments.len(), 1);

        // 3 indices * (200 + 2000) documents, none of them deleted.
        let merged_meta = merged_segments[0].meta();
        assert_eq!(merged_meta.num_deleted_docs(), 0);
        assert_eq!(merged_meta.num_docs(), 6600);
        Ok(())
    }

    #[test]
    fn test_merge_empty_indices_array() {
        // Merging an empty list of indices must be reported as an error.
        assert!(merge_indices(&[], RamDirectory::default()).is_err());
    }

    #[test]
    fn test_merge_mismatched_schema() -> crate::Result<()> {
        // Index whose only field is named "text".
        let mut text_schema_builder = Schema::builder();
        let text_field = text_schema_builder.add_text_field("text", TEXT);
        let text_index = Index::create_in_ram(text_schema_builder.build());
        {
            let mut writer = text_index.writer_for_tests()?;
            writer.add_document(doc!(text_field=>"some text"))?;
            writer.commit()?;
        }

        // Index whose only field is named "body".
        let mut body_schema_builder = Schema::builder();
        let body_field = body_schema_builder.add_text_field("body", TEXT);
        let body_index = Index::create_in_ram(body_schema_builder.build());
        {
            let mut writer = body_index.writer_for_tests()?;
            writer.add_document(doc!(body_field=>"some body"))?;
            writer.commit()?;
        }

        // The two schemas differ, so the merge has to fail.
        assert!(merge_indices(&[text_index, body_index], RamDirectory::default()).is_err());

        Ok(())
    }

    #[test]
    fn test_merge_filtered_segments() -> crate::Result<()> {
        // First index: two documents, no delete operation.
        let first_index = {
            let mut builder = Schema::builder();
            let field = builder.add_text_field("text", TEXT);
            let index = Index::create_in_ram(builder.build());
            let mut writer = index.writer_for_tests()?;
            writer.add_document(doc!(field=>"some text 1"))?;
            writer.add_document(doc!(field=>"some text 2"))?;
            writer.commit()?;
            index
        };

        // Second index: two documents, with a delete on the term "4" issued before
        // the commit.
        let second_index = {
            let mut builder = Schema::builder();
            let field = builder.add_text_field("text", TEXT);
            let index = Index::create_in_ram(builder.build());
            let mut writer = index.writer_for_tests()?;
            writer.add_document(doc!(field=>"some text 3"))?;
            writer.add_document(doc!(field=>"some text 4"))?;
            writer.delete_term(Term::from_field_text(field, "4"));

            writer.commit()?;
            index
        };

        // Segments of the first index come first, followed by those of the second.
        let segments: Vec<Segment> = first_index
            .searchable_segments()?
            .into_iter()
            .chain(second_index.searchable_segments()?)
            .collect();

        let target_settings = first_index.settings().clone();

        // One custom alive bitset per segment, in segment order.
        let filter_segments = vec![
            Some(AliveBitSet::for_test_from_deleted_docs(&[1], 2)),
            Some(AliveBitSet::for_test_from_deleted_docs(&[0], 2)),
        ];

        let merged_index = merge_filtered_segments(
            &segments,
            target_settings,
            filter_segments,
            RamDirectory::default(),
        )?;

        let merged_segments = merged_index.searchable_segments()?;
        assert_eq!(merged_segments.len(), 1);

        // Exactly one document is expected to survive, with no delete left pending.
        let merged_meta = merged_segments[0].meta();
        assert_eq!(merged_meta.num_deleted_docs(), 0);
        assert_eq!(merged_meta.num_docs(), 1);

        Ok(())
    }

    #[test]
    fn test_merge_single_filtered_segments() -> crate::Result<()> {
        // Four documents in a single commit, with a delete on the term "4" issued
        // before the commit.
        let source_index = {
            let mut builder = Schema::builder();
            let field = builder.add_text_field("text", TEXT);
            let index = Index::create_in_ram(builder.build());
            let mut writer = index.writer_for_tests()?;
            writer.add_document(doc!(field=>"test text"))?;
            writer.add_document(doc!(field=>"some text 2"))?;

            writer.add_document(doc!(field=>"some text 3"))?;
            writer.add_document(doc!(field=>"some text 4"))?;

            writer.delete_term(Term::from_field_text(field, "4"));

            writer.commit()?;
            index
        };

        let segments: Vec<Segment> = source_index.searchable_segments()?;
        let target_settings = source_index.settings().clone();

        // Custom alive bitset marking doc 0 ("test text") as deleted.
        let filter_segments = vec![Some(AliveBitSet::for_test_from_deleted_docs(&[0], 4))];

        let index = merge_filtered_segments(
            &segments,
            target_settings,
            filter_segments,
            RamDirectory::default(),
        )?;

        let merged_segments = index.searchable_segments()?;
        assert_eq!(merged_segments.len(), 1);

        let merged_meta = merged_segments[0].meta();
        assert_eq!(merged_meta.num_deleted_docs(), 0);
        assert_eq!(merged_meta.num_docs(), 2);

        let searcher = index.reader()?.searcher();
        {
            let text_field = index.schema().get_field("text").unwrap();

            // Runs `term` as a query and returns the doc ids of the top 3 hits.
            let do_search = |term: &str| {
                let parser = QueryParser::for_index(&index, vec![text_field]);
                let query = parser.parse_query(term).unwrap();
                let top_docs: Vec<(f32, DocAddress)> = searcher
                    .search(&query, &TopDocs::with_limit(3).order_by_score())
                    .unwrap();

                top_docs
                    .iter()
                    .map(|(_score, address)| address.doc_id)
                    .collect::<Vec<_>>()
            };

            // "test" only occurred in the filtered-out document.
            assert_eq!(do_search("test"), Vec::<u32>::new());
            assert_eq!(do_search("text"), vec![0, 1]);
        }

        Ok(())
    }

    #[test]
    fn test_apply_doc_id_filter_in_merger() -> crate::Result<()> {
        // Four documents in a single commit, with a delete on the term "4" issued
        // before the commit.
        let source_index = {
            let mut builder = Schema::builder();
            let field = builder.add_text_field("text", TEXT);
            let index = Index::create_in_ram(builder.build());
            let mut writer = index.writer_for_tests()?;
            writer.add_document(doc!(field=>"some text 1"))?;
            writer.add_document(doc!(field=>"some text 2"))?;

            writer.add_document(doc!(field=>"some text 3"))?;
            writer.add_document(doc!(field=>"some text 4"))?;

            writer.delete_term(Term::from_field_text(field, "4"));

            writer.commit()?;
            index
        };

        let segments: Vec<Segment> = source_index.searchable_segments()?;
        let target_settings = source_index.settings().clone();

        // Case 1: a custom alive bitset that additionally removes doc 1.
        {
            let merged_index = Index::create(
                RamDirectory::default(),
                segments[0].schema(),
                target_settings.clone(),
            )?;
            let merger: IndexMerger = IndexMerger::open_with_custom_alive_set(
                merged_index.schema(),
                &segments[..],
                vec![Some(AliveBitSet::for_test_from_deleted_docs(&[1], 4))],
            )?;

            assert_eq!(
                merger.readers[0].doc_ids_alive().collect::<Vec<_>>(),
                vec![0, 2]
            );
        }

        // Case 2: no custom alive bitset for the segment.
        {
            let merged_index = Index::create(
                RamDirectory::default(),
                segments[0].schema(),
                target_settings,
            )?;
            let merger: IndexMerger = IndexMerger::open_with_custom_alive_set(
                merged_index.schema(),
                &segments[..],
                vec![None],
            )?;

            assert_eq!(
                merger.readers[0].doc_ids_alive().collect::<Vec<_>>(),
                vec![0, 1, 2]
            );
        }

        Ok(())
    }
}


================================================
FILE: src/indexer/segment_writer.rs
================================================
use columnar::MonotonicallyMappableToU64;
use common::JsonPathWriter;
use itertools::Itertools;
use tokenizer_api::BoxTokenStream;

use super::operation::AddOperation;
use crate::fastfield::FastFieldsWriter;
use crate::fieldnorm::{FieldNormReaders, FieldNormsWriter};
use crate::index::{Segment, SegmentComponent};
use crate::indexer::indexing_term::IndexingTerm;
use crate::indexer::segment_serializer::SegmentSerializer;
use crate::json_utils::{index_json_value, IndexingPositionsPerPath};
use crate::postings::{
    compute_table_memory_size, serialize_postings, IndexingContext, IndexingPosition,
    PerFieldPostingsWriter, PostingsWriter,
};
use crate::schema::document::{Document, Value};
use crate::schema::{FieldEntry, FieldType, Schema, DATE_TIME_PRECISION_INDEXED};
use crate::tokenizer::{FacetTokenizer, PreTokenizedStream, TextAnalyzer, Tokenizer};
use crate::{DocId, Opstamp, TantivyError};

/// Picks the initial capacity of the indexing hash table.
///
/// The capacity is the largest power of two in `2^10..=2^19` whose table memory
/// footprint (as reported by `compute_table_memory_size`) is strictly below one
/// third of `per_thread_memory_budget`.
///
/// # Errors
///
/// Returns `TantivyError::InvalidArgument` when even a `2^10` table does not fit,
/// i.e. when the per-thread budget is too small.
///
/// The powers are deliberately tried one by one: it is a naive way to compute a
/// log2, but it is easy to proofread.
fn compute_initial_table_size(per_thread_memory_budget: usize) -> crate::Result<usize> {
    let table_memory_upper_bound = per_thread_memory_budget / 3;
    let mut largest_fitting_capacity: Option<usize> = None;
    // We cap it at 2^19 = 512K capacity.
    // TODO: There are cases where this limit causes a
    // reallocation in the hashmap. Check if this affects performance.
    for power in 10..20 {
        let capacity: usize = 1 << power;
        if compute_table_memory_size(capacity) >= table_memory_upper_bound {
            // Larger capacities are not tried once one fails to fit.
            break;
        }
        largest_fitting_capacity = Some(capacity);
    }
    largest_fitting_capacity.ok_or_else(|| {
        crate::TantivyError::InvalidArgument(format!(
            "per thread memory budget (={per_thread_memory_budget}) is too small. Raise the \
             memory budget or lower the number of threads."
        ))
    })
}

/// A `SegmentWriter` is in charge of creating a segment index from a
/// set of documents.
///
/// It creates the postings lists in anonymous memory.
/// The segment is laid on disk when the segment writer gets finalized
/// (see `SegmentWriter::finalize`).
pub struct SegmentWriter {
    /// Number of documents added so far. It is also the doc id assigned to the
    /// next document being indexed.
    pub(crate) max_doc: DocId,
    /// Indexing context handed to the postings writers and to postings serialization.
    pub(crate) ctx: IndexingContext,
    /// Postings writers, looked up per field while indexing.
    pub(crate) per_field_postings_writers: PerFieldPostingsWriter,
    /// Serializer for the segment being written (store, fieldnorms, postings,
    /// fast fields).
    pub(crate) segment_serializer: SegmentSerializer,
    /// Fast field writers; every added document is passed to them.
    pub(crate) fast_field_writers: FastFieldsWriter,
    /// Records the per-document, per-field values later serialized as fieldnorms.
    pub(crate) fieldnorms_writer: FieldNormsWriter,
    /// JSON path buffer reused while indexing JSON object fields.
    pub(crate) json_path_writer: JsonPathWriter,
    /// Indexing positions per JSON path; cleared before each JSON field is indexed.
    pub(crate) json_positions_per_path: IndexingPositionsPerPath,
    /// Opstamp of every added document, in insertion order.
    pub(crate) doc_opstamps: Vec<Opstamp>,
    /// One text analyzer per schema field, indexed by field id.
    per_field_text_analyzers: Vec<TextAnalyzer>,
    /// Scratch term reused for every field of every document.
    term_buffer: IndexingTerm,
    /// Schema of the segment being written.
    schema: Schema,
}

impl SegmentWriter {
    /// Creates a new `SegmentWriter`
    ///
    /// The arguments are defined as follows
    ///
    /// - memory_budget: most of the segment writer data (terms, and postings lists recorders) is
    ///   stored in a memory arena. This makes it possible for the user to define the flushing
    ///   behavior as a memory limit.
    /// - segment: The segment being written
    /// - schema
    pub fn for_segment(memory_budget_in_bytes: usize, segment: Segment) -> crate::Result<Self> {
        let schema = segment.schema();
        let tokenizer_manager = segment.index().tokenizers().clone();
        let tokenizer_manager_fast_field = segment.index().fast_field_tokenizer().clone();
        let table_size = compute_initial_table_size(memory_budget_in_bytes)?;
        let segment_serializer = SegmentSerializer::for_segment(segment)?;
        let per_field_postings_writers = PerFieldPostingsWriter::for_schema(&schema);
        let per_field_text_analyzers = schema
            .fields()
            .map(|(_, field_entry): (_, &FieldEntry)| {
                let text_options = match field_entry.field_type() {
                    FieldType::Str(ref text_options) => text_options.get_indexing_options(),
                    FieldType::JsonObject(ref json_object_options) => {
                        json_object_options.get_text_indexing_options()
                    }
                    _ => None,
                };
                let tokenizer_name = text_options
                    .map(|text_index_option| text_index_option.tokenizer())
                    .unwrap_or("default");

                tokenizer_manager.get(tokenizer_name).ok_or_else(|| {
                    TantivyError::SchemaError(format!(
                        "Error getting tokenizer for field: {}",
                        field_entry.name()
                    ))
                })
            })
            .collect::<Result<Vec<_>, _>>()?;
        Ok(Self {
            max_doc: 0,
            ctx: IndexingContext::new(table_size),
            per_field_postings_writers,
            fieldnorms_writer: FieldNormsWriter::for_schema(&schema),
            json_path_writer: JsonPathWriter::default(),
            json_positions_per_path: IndexingPositionsPerPath::default(),
            segment_serializer,
            fast_field_writers: FastFieldsWriter::from_schema_and_tokenizer_manager(
                &schema,
                tokenizer_manager_fast_field,
            )?,
            doc_opstamps: Vec::with_capacity(1_000),
            per_field_text_analyzers,
            term_buffer: IndexingTerm::with_capacity(16),
            schema,
        })
    }

    /// Lay on disk the current content of the `SegmentWriter`
    ///
    /// Finalize consumes the `SegmentWriter`, so that it cannot
    /// be used afterwards.
    pub fn finalize(mut self) -> crate::Result<Vec<u64>> {
        self.fieldnorms_writer.fill_up_to_max_doc(self.max_doc);
        remap_and_write(
            self.schema,
            &self.per_field_postings_writers,
            self.ctx,
            self.fast_field_writers,
            &self.fieldnorms_writer,
            self.segment_serializer,
        )?;
        Ok(self.doc_opstamps)
    }

    /// Returns an estimation of the current memory usage of the segment writer.
    /// If the mem usage exceeds the `memory_budget`, the segment will be serialized.
    ///
    /// The estimate is the sum of what the indexing context, the fieldnorms writer,
    /// the fast field writers and the segment serializer report.
    pub fn mem_usage(&self) -> usize {
        let indexing_context_bytes = self.ctx.mem_usage();
        let fieldnorms_bytes = self.fieldnorms_writer.mem_usage();
        let fast_fields_bytes = self.fast_field_writers.mem_usage();
        let serializer_bytes = self.segment_serializer.mem_usage();
        indexing_context_bytes + fieldnorms_bytes + fast_fields_bytes + serializer_bytes
    }

    /// Feeds the indexed fields of `doc` to the postings writers, using the current
    /// `max_doc` as the document id.
    ///
    /// The values of the document are grouped by field. Fields that are not indexed
    /// are skipped. For every field type except facets and JSON objects, a fieldnorm
    /// is also recorded when the field has fieldnorms enabled.
    ///
    /// # Errors
    ///
    /// Returns a `TantivyError::SchemaError` when a value does not have the type
    /// expected by its field. The exception is `Str` fields: a value that is neither
    /// a string nor a pre-tokenized string is silently skipped.
    fn index_document<D: Document>(&mut self, doc: &D) -> crate::Result<()> {
        let doc_id = self.max_doc;

        // Sort the (field, value) pairs by field so that all the values of a given
        // field end up in one consecutive group.
        // TODO: Can this be optimised a bit?
        let vals_grouped_by_field = doc
            .iter_fields_and_values()
            .sorted_by_key(|(field, _)| *field)
            .chunk_by(|(field, _)| *field);

        for (field, field_values) in &vals_grouped_by_field {
            // Only the values are needed from here on; the field is the group key.
            let values = field_values.map(|el| el.1);

            let field_entry = self.schema.get_field_entry(field);
            // Builds the error returned when a value has the wrong type for this field.
            let make_schema_error = || {
                TantivyError::SchemaError(format!(
                    "Expected a {:?} for field {:?}",
                    field_entry.field_type().value_type(),
                    field_entry.name()
                ))
            };
            if !field_entry.is_indexed() {
                continue;
            }

            // Borrow the individual members of `self` separately so that they can be
            // used side by side below.
            let (term_buffer, ctx) = (&mut self.term_buffer, &mut self.ctx);
            let postings_writer: &mut dyn PostingsWriter =
                self.per_field_postings_writers.get_for_field_mut(field);
            term_buffer.clear_with_field(field);

            match field_entry.field_type() {
                FieldType::Facet(_) => {
                    let mut facet_tokenizer = FacetTokenizer::default(); // this can be global
                    for value in values {
                        let value = value.as_value();

                        let facet_str = value.as_facet().ok_or_else(make_schema_error)?;
                        // Shadows the tokenizer with the token stream it produces.
                        let mut facet_tokenizer = facet_tokenizer.token_stream(facet_str);
                        // A fresh position is used for every facet value.
                        let mut indexing_position = IndexingPosition::default();
                        postings_writer.index_text(
                            doc_id,
                            &mut facet_tokenizer,
                            term_buffer,
                            ctx,
                            &mut indexing_position,
                        );
                    }
                }
                FieldType::Str(_) => {
                    // The position is shared by all the values of the field in this
                    // document; its token count is what gets recorded as fieldnorm.
                    let mut indexing_position = IndexingPosition::default();
                    for value in values {
                        let value = value.as_value();

                        // Plain strings go through the field's text analyzer, while
                        // pre-tokenized strings are replayed as is.
                        let mut token_stream = if let Some(text) = value.as_str() {
                            let text_analyzer =
                                &mut self.per_field_text_analyzers[field.field_id() as usize];
                            text_analyzer.token_stream(text)
                        } else if let Some(tok_str) = value.into_pre_tokenized_text() {
                            BoxTokenStream::new(PreTokenizedStream::from(*tok_str.clone()))
                        } else {
                            // Neither a string nor a pre-tokenized string: skip the value.
                            continue;
                        };

                        assert!(term_buffer.is_empty());
                        postings_writer.index_text(
                            doc_id,
                            &mut *token_stream,
                            term_buffer,
                            ctx,
                            &mut indexing_position,
                        );
                    }
                    if field_entry.has_fieldnorms() {
                        self.fieldnorms_writer
                            .record(doc_id, field, indexing_position.num_tokens);
                    }
                }
                // The scalar field types below all follow the same pattern: each value
                // is written into the term buffer and subscribed for `doc_id`, and the
                // number of values is recorded as fieldnorm when fieldnorms are enabled.
                FieldType::U64(_) => {
                    let mut num_vals = 0;
                    for value in values {
                        let value = value.as_value();

                        num_vals += 1;
                        let u64_val = value.as_u64().ok_or_else(make_schema_error)?;
                        term_buffer.set_u64(u64_val);
                        postings_writer.subscribe(doc_id, 0u32, term_buffer, ctx);
                    }
                    if field_entry.has_fieldnorms() {
                        self.fieldnorms_writer.record(doc_id, field, num_vals);
                    }
                }
                FieldType::Date(_) => {
                    let mut num_vals = 0;
                    for value in values {
                        let value = value.as_value();

                        num_vals += 1;
                        let date_val = value.as_datetime().ok_or_else(make_schema_error)?;
                        // Dates are truncated to `DATE_TIME_PRECISION_INDEXED` before
                        // being indexed as a u64.
                        term_buffer
                            .set_u64(date_val.truncate(DATE_TIME_PRECISION_INDEXED).to_u64());
                        postings_writer.subscribe(doc_id, 0u32, term_buffer, ctx);
                    }
                    if field_entry.has_fieldnorms() {
                        self.fieldnorms_writer.record(doc_id, field, num_vals);
                    }
                }
                FieldType::I64(_) => {
                    let mut num_vals = 0;
                    for value in values {
                        let value = value.as_value();

                        num_vals += 1;
                        let i64_val = value.as_i64().ok_or_else(make_schema_error)?;
                        term_buffer.set_i64(i64_val);
                        postings_writer.subscribe(doc_id, 0u32, term_buffer, ctx);
                    }
                    if field_entry.has_fieldnorms() {
                        self.fieldnorms_writer.record(doc_id, field, num_vals);
                    }
                }
                FieldType::F64(_) => {
                    let mut num_vals = 0;
                    for value in values {
                        let value = value.as_value();
                        num_vals += 1;
                        let f64_val = value.as_f64().ok_or_else(make_schema_error)?;
                        term_buffer.set_f64(f64_val);
                        postings_writer.subscribe(doc_id, 0u32, term_buffer, ctx);
                    }
                    if field_entry.has_fieldnorms() {
                        self.fieldnorms_writer.record(doc_id, field, num_vals);
                    }
                }
                FieldType::Bool(_) => {
                    let mut num_vals = 0;
                    for value in values {
                        let value = value.as_value();
                        num_vals += 1;
                        let bool_val = value.as_bool().ok_or_else(make_schema_error)?;
                        term_buffer.set_bool(bool_val);
                        postings_writer.subscribe(doc_id, 0u32, term_buffer, ctx);
                    }
                    if field_entry.has_fieldnorms() {
                        self.fieldnorms_writer.record(doc_id, field, num_vals);
                    }
                }
                FieldType::Bytes(_) => {
                    let mut num_vals = 0;
                    for value in values {
                        let value = value.as_value();
                        num_vals += 1;
                        let bytes = value.as_bytes().ok_or_else(make_schema_error)?;
                        term_buffer.set_bytes(bytes);
                        postings_writer.subscribe(doc_id, 0u32, term_buffer, ctx);
                    }
                    if field_entry.has_fieldnorms() {
                        self.fieldnorms_writer.record(doc_id, field, num_vals);
                    }
                }
                FieldType::JsonObject(json_options) => {
                    let text_analyzer =
                        &mut self.per_field_text_analyzers[field.field_id() as usize];

                    // Positions are reset once per field, whereas the JSON path is
                    // reset before each value.
                    self.json_positions_per_path.clear();
                    self.json_path_writer
                        .set_expand_dots(json_options.is_expand_dots_enabled());
                    for json_value in values {
                        self.json_path_writer.clear();

                        index_json_value(
                            doc_id,
                            json_value,
                            text_analyzer,
                            term_buffer,
                            &mut self.json_path_writer,
                            postings_writer,
                            ctx,
                            &mut self.json_positions_per_path,
                        );
                    }
                }
                FieldType::IpAddr(_) => {
                    let mut num_vals = 0;
                    for value in values {
                        let value = value.as_value();

                        num_vals += 1;
                        let ip_addr = value.as_ip_addr().ok_or_else(make_schema_error)?;
                        term_buffer.set_ip_addr(ip_addr);
                        postings_writer.subscribe(doc_id, 0u32, term_buffer, ctx);
                    }
                    if field_entry.has_fieldnorms() {
                        self.fieldnorms_writer.record(doc_id, field, num_vals);
                    }
                }
            }
        }
        Ok(())
    }

    /// Indexes a new document.
    ///
    /// The document's opstamp is recorded, then the document is passed to the fast
    /// field writers, indexed, and written to the doc store. `max_doc` is only
    /// incremented once all of these steps have succeeded.
    ///
    /// As a user, you should rather use `IndexWriter`'s add_document.
    pub fn add_document<D: Document>(
        &mut self,
        add_operation: AddOperation<D>,
    ) -> crate::Result<()> {
        let opstamp = add_operation.opstamp;
        let document = &add_operation.document;
        self.doc_opstamps.push(opstamp);
        self.fast_field_writers.add_document(document)?;
        self.index_document(document)?;
        self.segment_serializer
            .get_store_writer()
            .store(document, &self.schema)?;
        self.max_doc += 1;
        Ok(())
    }

    /// Max doc is
    /// - the number of documents added to this segment writer so far
    /// - the maximum document id assigned so far + 1
    ///
    /// The segment writer increments this counter once per successfully added
    /// document and does not track deletes itself, so `max_doc()` and `num_docs()`
    /// return the same value.
    pub fn max_doc(&self) -> u32 {
        self.max_doc
    }

    /// Number of documents held by this segment writer.
    ///
    /// The segment writer does not track deletes itself: this simply returns the
    /// `max_doc` counter, so `max_doc == num_docs` here.
    #[allow(dead_code)]
    pub fn num_docs(&self) -> u32 {
        self.max_doc
    }
}

/// Writes a view of a segment by pushing information to the `SegmentSerializer`.
///
/// This is a free function rather than a method as a trick to work around the
/// borrow checker.
///
/// The steps run in this order:
/// 1. the fieldnorms are serialized, if the serializer still holds a fieldnorms serializer;
/// 2. the fieldnorms are read back from the segment and handed, together with the
///    indexing context, to the postings serialization;
/// 3. the fast fields are serialized;
/// 4. the serializer is closed.
fn remap_and_write(
    schema: Schema,
    per_field_postings_writers: &PerFieldPostingsWriter,
    ctx: IndexingContext,
    fast_field_writers: FastFieldsWriter,
    fieldnorms_writer: &FieldNormsWriter,
    mut serializer: SegmentSerializer,
) -> crate::Result<()> {
    debug!("remap-and-write");
    if let Some(fieldnorms_serializer) = serializer.extract_fieldnorms_serializer() {
        fieldnorms_writer.serialize(fieldnorms_serializer)?;
    }

    // The postings serialization takes fieldnorm readers, so the fieldnorms that were
    // just written are opened again from the segment.
    let fieldnorm_readers = FieldNormReaders::open(
        serializer
            .segment()
            .open_read(SegmentComponent::FieldNorms)?,
    )?;
    let postings_serializer = serializer.get_postings_serializer();
    serialize_postings(
        ctx,
        schema,
        per_field_postings_writers,
        fieldnorm_readers,
        postings_serializer,
    )?;

    debug!("fastfield-serialize");
    fast_field_writers.serialize(serializer.get_fast_field_write())?;

    debug!("serializer-close");
    serializer.close()?;

    Ok(())
}

#[cfg(test)]
mod tests {
    use std::collections::BTreeMap;
    use std::path::Path;

    use columnar::ColumnType;

    use crate::collector::{Count, TopDocs};
    use crate::directory::RamDirectory;
    use crate::fastfield::FastValue;
    use crate::postings::{Postings, TermInfo};
    use crate::query::{PhraseQuery, QueryParser};
    use crate::schema::{
        Document, IndexRecordOption, OwnedValue, Schema, TextFieldIndexing, TextOptions, Value,
        DATE_TIME_PRECISION_INDEXED, FAST, STORED, STRING, TEXT,
    };
    use crate::store::{Compressor, StoreReader, StoreWriter};
    use crate::time::format_description::well_known::Rfc3339;
    use crate::time::OffsetDateTime;
    use crate::tokenizer::{PreTokenizedString, Token};
    use crate::{
        DateTime, Directory, DocAddress, DocSet, Index, IndexWriter, SegmentReader,
        TantivyDocument, Term, TERMINATED,
    };

    #[test]
    #[cfg(not(feature = "compare_hash_only"))]
    fn test_hashmap_size() {
        use super::compute_initial_table_size;

        // (per-thread memory budget, expected initial table size)
        let expectations: [(usize, usize); 5] = [
            (100_000, 1 << 12),
            (1_000_000, 1 << 15),
            (15_000_000, 1 << 19),
            // Larger budgets stay capped at 2^19.
            (1_000_000_000, 1 << 19),
            (4_000_000_000, 1 << 19),
        ];
        for (memory_budget, expected_table_size) in expectations {
            assert_eq!(
                compute_initial_table_size(memory_budget).unwrap(),
                expected_table_size
            );
        }
    }

    #[test]
    fn test_prepare_for_store() {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("title", TEXT | STORED);
        let schema = schema_builder.build();

        // A document holding a pre-tokenized value followed by a plain text value,
        // both for the same field.
        let single_token = Token {
            offset_from: 0,
            offset_to: 1,
            position: 0,
            text: String::from("A"),
            position_length: 1,
        };
        let mut doc = TantivyDocument::default();
        doc.add_pre_tokenized_text(
            text_field,
            PreTokenizedString {
                text: String::from("A"),
                tokens: vec![single_token],
            },
        );
        doc.add_text(text_field, "title");

        // Write the document to a store in a RAM directory...
        let store_path = Path::new("store");
        let directory = RamDirectory::create();
        let mut store_writer = StoreWriter::new(
            directory.open_write(store_path).unwrap(),
            Compressor::None,
            0,
            false,
        )
        .unwrap();
        store_writer.store(&doc, &schema).unwrap();
        store_writer.close().unwrap();

        // ... and read it back.
        let store_reader = StoreReader::open(directory.open_read(store_path).unwrap(), 0).unwrap();
        let stored_doc = store_reader.get::<TantivyDocument>(0).unwrap();

        // Both values come back as text, in insertion order.
        assert_eq!(stored_doc.field_values().count(), 2);
        assert_eq!(
            stored_doc
                .get_all(text_field)
                .next()
                .unwrap()
                .as_value()
                .as_str(),
            Some("A")
        );
        assert_eq!(
            stored_doc
                .get_all(text_field)
                .nth(1)
                .unwrap()
                .as_value()
                .as_str(),
            Some("title")
        );
    }
    #[test]
    fn test_simple_json_indexing() {
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", STORED | STRING);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema.clone());

        // Three documents: "my_field" is "b" twice and "a" once.
        let mut writer = index.writer_for_tests().unwrap();
        for my_field_value in ["b", "a", "b"] {
            writer
                .add_document(doc!(json_field=>json!({"my_field": my_field_value})))
                .unwrap();
        }
        writer.commit().unwrap();

        let query_parser = QueryParser::for_index(&index, vec![json_field]);

        // Number of hits (at most 4) for a query, using a fresh reader each time.
        let count_hits = |query_str: &str| -> usize {
            let text_query = query_parser.parse_query(query_str).unwrap();
            let score_docs: Vec<(_, DocAddress)> = index
                .reader()
                .unwrap()
                .searcher()
                .search(&text_query, &TopDocs::with_limit(4).order_by_score())
                .unwrap();
            score_docs.len()
        };

        assert_eq!(count_hits("my_field:a"), 1);
        assert_eq!(count_hits("my_field:b"), 2);
    }

    #[test]
    fn test_flat_json_indexing() {
        // The JSON field receives a mix of bare values and one object at its first level.
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", STORED | STRING);
        let schema = schema_builder.build();
        // The schema is not used again, so it is moved into the index rather than cloned.
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests().unwrap();
        // Text, i64, u64
        writer.add_document(doc!(json_field=>"b")).unwrap();
        writer
            .add_document(doc!(json_field=>OwnedValue::I64(10i64)))
            .unwrap();
        writer
            .add_document(doc!(json_field=>OwnedValue::U64(55u64)))
            .unwrap();
        // ... and a regular object.
        writer
            .add_document(doc!(json_field=>json!({"my_field": "a"})))
            .unwrap();
        writer.commit().unwrap();

        // The parser does not depend on the query, so it is built once for all searches.
        let query_parser = QueryParser::for_index(&index, vec![json_field]);
        // Every query below is expected to match exactly one of the four documents.
        let search_and_expect = |query: &str| {
            let text_query = query_parser.parse_query(query).unwrap();
            let score_docs: Vec<(_, DocAddress)> = index
                .reader()
                .unwrap()
                .searcher()
                .search(&text_query, &TopDocs::with_limit(4).order_by_score())
                .unwrap();
            assert_eq!(score_docs.len(), 1, "query: {query}");
        };

        search_and_expect("my_field:a");
        search_and_expect("b");
        search_and_expect("10");
        search_and_expect("55");
    }

    #[test]
    fn test_json_indexing() {
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", STORED | TEXT);
        let schema = schema_builder.build();
        let json_val: serde_json::Value = serde_json::from_str(
            r#"{
            "toto": "titi",
            "float": -0.2,
            "bool": true,
            "unsigned": 1,
            "signed": -2,
            "complexobject": {
                "field.with.dot": 1
            },
            "date": "1985-04-12T23:20:50.52Z",
            "my_arr": [2, 3, {"my_key": "two tokens"}, 4]
        }"#,
        )
        .unwrap();

        // Index the JSON value as the single document of the index.
        let index = Index::create_in_ram(schema.clone());
        let mut writer = index.writer_for_tests().unwrap();
        writer
            .add_document(doc!(json_field=>json_val.clone()))
            .unwrap();
        writer.commit().unwrap();
        let reader = index.reader().unwrap();
        let searcher = reader.searcher();

        // The stored document must serialize back to the JSON value we started from.
        let first_doc_address = DocAddress {
            segment_ord: 0u32,
            doc_id: 0u32,
        };
        let stored_doc = searcher
            .doc::<TantivyDocument>(first_doc_address)
            .unwrap();
        let stored_json: serde_json::Value =
            serde_json::from_str(&stored_doc.to_json(&schema)).unwrap();
        let roundtripped_json_val = stored_json.get("json").unwrap()[0].clone();
        assert_eq!(json_val, roundtripped_json_val);

        // Walk the term dictionary of the JSON field and compare every key with the
        // term we expect at that position of the stream.
        let segment_reader = searcher.segment_reader(0u32);
        let inverted_index = segment_reader.inverted_index(json_field).unwrap();
        let term_dict = inverted_index.terms();
        let mut term_stream = term_dict.stream().unwrap();

        // Appends a typed fast value to a JSON path term.
        fn with_fast_val<T: FastValue>(mut term: Term, val: T) -> Term {
            term.append_type_and_fast_value(val);
            term
        }
        // Appends a string value to a JSON path term.
        fn with_str(mut term: Term, val: &str) -> Term {
            term.append_type_and_str(val);
            term
        }
        let path_term =
            |path: &str| -> Term { Term::from_field_json_path(json_field, path, false) };
        // Advances the stream by one entry and checks its key against `expected`.
        let mut expect_next_term = |expected: Term| {
            assert!(term_stream.advance());
            assert_eq!(term_stream.key(), expected.serialized_value_bytes());
        };

        // Bool
        expect_next_term(with_fast_val(path_term("bool"), true));

        // Nested object whose key contains dots: the dots are escaped in the path.
        expect_next_term(with_fast_val(
            path_term("complexobject.field\\.with\\.dot"),
            1i64,
        ));

        // Date
        let expected_date = DateTime::from_utc(
            OffsetDateTime::parse("1985-04-12T23:20:50.52Z", &Rfc3339).unwrap(),
        )
        .truncate(DATE_TIME_PRECISION_INDEXED);
        expect_next_term(with_fast_val(path_term("date"), expected_date));

        // Float
        expect_next_term(with_fast_val(path_term("float"), -0.2f64));

        // Numbers in the array
        expect_next_term(with_fast_val(path_term("my_arr"), 2i64));
        expect_next_term(with_fast_val(path_term("my_arr"), 3i64));
        expect_next_term(with_fast_val(path_term("my_arr"), 4i64));

        // Object in the array: its text value shows up as two separate tokens.
        expect_next_term(with_str(path_term("my_arr.my_key"), "tokens"));
        expect_next_term(with_str(path_term("my_arr.my_key"), "two"));

        // Signed
        expect_next_term(with_fast_val(path_term("signed"), -2i64));

        // Text
        expect_next_term(with_str(path_term("toto"), "titi"));

        // Unsigned: expected as an i64-typed term.
        expect_next_term(with_fast_val(path_term("unsigned"), 1i64));

        // Nothing else is left in the dictionary.
        assert!(!term_stream.advance());
    }

    #[test]
    fn test_json_tokenized_with_position() {
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", STORED | TEXT);
        let schema = schema_builder.build();

        // "token" appears twice in the text, at positions 1 and 2.
        let json_object: BTreeMap<String, crate::schema::OwnedValue> =
            serde_json::from_str(r#"{"mykey": "repeated token token"}"#).unwrap();
        let mut doc = TantivyDocument::default();
        doc.add_object(json_field, json_object);

        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests().unwrap();
        writer.add_document(doc).unwrap();
        writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let segment_reader = searcher.segment_reader(0u32);
        let inv_index = segment_reader.inverted_index(json_field).unwrap();

        let mut token_term = Term::from_field_json_path(json_field, "mykey", false);
        token_term.append_type_and_str("token");

        // Check the term dictionary entry first ...
        let expected_term_info = TermInfo {
            doc_freq: 1,
            postings_range: 2..4,
            positions_range: 2..5,
        };
        let term_info = inv_index.get_term_info(&token_term).unwrap().unwrap();
        assert_eq!(term_info, expected_term_info);

        // ... then the posting list itself: one document, two occurrences with positions.
        let mut postings = inv_index
            .read_postings(&token_term, IndexRecordOption::WithFreqsAndPositions)
            .unwrap()
            .unwrap();
        assert_eq!(postings.doc(), 0);
        assert_eq!(postings.term_freq(), 2);
        let mut token_positions = Vec::new();
        postings.positions(&mut token_positions);
        assert_eq!(&token_positions[..], &[1, 2]);
        assert_eq!(postings.advance(), TERMINATED);
    }

    #[test]
    fn test_json_raw_no_position() {
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", STRING);
        let schema = schema_builder.build();

        let json_val: serde_json::Value =
            serde_json::from_str(r#"{"mykey": "two tokens"}"#).unwrap();
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests().unwrap();
        writer.add_document(doc!(json_field=>json_val)).unwrap();
        writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let segment_reader = searcher.segment_reader(0u32);
        let inv_index = segment_reader.inverted_index(json_field).unwrap();

        // With `STRING` the whole text is looked up as one single term.
        let mut raw_term = Term::from_field_json_path(json_field, "mykey", false);
        raw_term.append_type_and_str("two tokens");

        // The expected entry has an empty positions range.
        let expected_term_info = TermInfo {
            doc_freq: 1,
            postings_range: 0..1,
            positions_range: 0..0,
        };
        let term_info = inv_index.get_term_info(&raw_term).unwrap().unwrap();
        assert_eq!(term_info, expected_term_info);

        let mut postings = inv_index
            .read_postings(&raw_term, IndexRecordOption::WithFreqs)
            .unwrap()
            .unwrap();
        assert_eq!(postings.doc(), 0);
        assert_eq!(postings.term_freq(), 1);
        // Requesting positions is only exercised here; the content of the buffer is not
        // asserted on.
        let mut unchecked_positions = Vec::new();
        postings.positions(&mut unchecked_positions);
        assert_eq!(postings.advance(), TERMINATED);
    }

    #[test]
    fn test_position_overlapping_path() {
        // This test checks that we do not end up detecting phrase query due
        // to several string literal in the same json object being overlapping.
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", TEXT);
        let schema = schema_builder.build();
        let json_val: serde_json::Value = serde_json::from_str(
            r#"{"mykey": [{"field": "hello happy tax payer"}, {"field": "nothello"}]}"#,
        )
        .unwrap();
        let doc = doc!(json_field=>json_val);
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests().unwrap();
        writer.add_document(doc).unwrap();
        writer.commit().unwrap();
        let reader = index.reader().unwrap();
        let searcher = reader.searcher();

        let term = Term::from_field_json_path(json_field, "mykey.field", false);

        let mut hello_term = term.clone();
        hello_term.append_type_and_str("hello");

        let mut nothello_term = term.clone();
        nothello_term.append_type_and_str("nothello");

        let mut happy_term = term.clone();
        happy_term.append_type_and_str("happy");

        let phrase_query = PhraseQuery::new(vec![hello_term, happy_term.clone()]);
        assert_eq!(searcher.search(&phrase_query, &Count).unwrap(), 1);
        let phrase_query = PhraseQuery::new(vec![nothello_term, happy_term]);
        assert_eq!(searcher.search(&phrase_query, &Count).unwrap(), 0);
    }

    #[test]
    fn test_json_fast() {
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", FAST);
        let schema = schema_builder.build();
        let json_val: serde_json::Value = serde_json::from_str(
            r#"{
            "toto": "titi",
            "float": -0.2,
            "bool": true,
            "unsigned": 1,
            "signed": -2,
            "complexobject": {
                "field.with.dot": 1
            },
            "date": "1985-04-12T23:20:50.52Z",
            "my_arr": [2, 3, {"my_key": "two tokens"}, 4]
        }"#,
        )
        .unwrap();
        // Neither the JSON value nor the schema is used again below, so both are moved
        // instead of cloned.
        let doc = doc!(json_field=>json_val);
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests().unwrap();
        writer.add_document(doc).unwrap();
        writer.commit().unwrap();
        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let segment_reader = searcher.segment_reader(0u32);

        // Asserts that `field` resolves to exactly one dynamic column of type `typ`.
        fn assert_type(reader: &SegmentReader, field: &str, typ: ColumnType) {
            let cols = reader.fast_fields().dynamic_column_handles(field).unwrap();
            assert_eq!(cols.len(), 1, "{field}");
            assert_eq!(cols[0].column_type(), typ, "{field}");
        }
        // Expected column type for every JSON path of the document.
        let expected_column_types = [
            ("json.toto", ColumnType::Str),
            ("json.float", ColumnType::F64),
            ("json.bool", ColumnType::Bool),
            ("json.unsigned", ColumnType::I64),
            ("json.signed", ColumnType::I64),
            ("json.complexobject.field\\.with\\.dot", ColumnType::I64),
            ("json.date", ColumnType::DateTime),
            ("json.my_arr", ColumnType::I64),
            ("json.my_arr.my_key", ColumnType::Str),
        ];
        for (field, typ) in expected_column_types {
            assert_type(segment_reader, field, typ);
        }

        // Asserts that `field` does not resolve to any dynamic column.
        fn assert_empty(reader: &SegmentReader, field: &str) {
            let cols = reader.fast_fields().dynamic_column_handles(field).unwrap();
            assert_eq!(cols.len(), 0, "{field}");
        }
        for field in ["unknown", "json", "json.toto.titi"] {
            assert_empty(segment_reader, field);
        }

        // All nine columns sit below the `json` root ...
        let sub_columns = segment_reader
            .fast_fields()
            .dynamic_subpath_column_handles("json")
            .unwrap();
        assert_eq!(sub_columns.len(), 9);

        // ... and exactly one of them below `json.complexobject`.
        let subsub_columns = segment_reader
            .fast_fields()
            .dynamic_subpath_column_handles("json.complexobject")
            .unwrap();
        assert_eq!(subsub_columns.len(), 1);
    }

    #[test]
    fn test_json_term_with_numeric_merge_panic_regression_bug_2283() {
        // https://github.com/quickwit-oss/tantivy/issues/2283
        let mut schema_builder = Schema::builder();
        let json = schema_builder.add_json_field("json", TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests().unwrap();

        // Each document is committed on its own. The second one adds a numeric value next
        // to the text value.
        let doc = json!({"field": "a"});
        writer.add_document(doc!(json=>doc)).unwrap();
        writer.commit().unwrap();
        let doc = json!({"field": "a", "id": 1});
        // `doc` is not used afterwards, so it is moved rather than cloned.
        writer.add_document(doc!(json=>doc)).unwrap();
        writer.commit().unwrap();

        // Force Merge
        writer.wait_merging_threads().unwrap();
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        let segment_ids = index
            .searchable_segment_ids()
            .expect("Searchable segments failed.");
        index_writer.merge(&segment_ids).wait().unwrap();
        // `unwrap` (rather than `assert!(.. .is_ok())`) so that a failure reports the error.
        index_writer.wait_merging_threads().unwrap();
    }

    #[test]
    fn test_bug_regression_1629_position_when_array_with_a_field_value_that_does_not_contain_any_token(
    ) {
        // Regression test for a position underflow that happened while computing the
        // position delta in a horrible corner case: a multi-valued text field in which
        // one of the values does not produce any token.
        //
        // See the commit with this unit test if you want the details.
        let mut schema_builder = Schema::builder();
        let text = schema_builder.add_text_field("text", TEXT);
        let schema = schema_builder.build();
        let doc_json = r#"{"text": [ "bbb", "aaa", "", "aaa"]}"#;
        let doc = TantivyDocument::parse_json(&schema, doc_json).unwrap();

        let index = Index::create_in_ram(schema);
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        index_writer.add_document(doc).unwrap();
        // On debug this did panic on the underflow
        index_writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let seg_reader = searcher.segment_reader(0);
        let inv_index = seg_reader.inverted_index(text).unwrap();
        let aaa_term = Term::from_field_text(text, "aaa");
        let mut postings = inv_index
            .read_postings(&aaa_term, IndexRecordOption::WithFreqsAndPositions)
            .unwrap()
            .unwrap();
        assert_eq!(postings.doc(), 0u32);

        let mut aaa_positions = Vec::new();
        postings.positions(&mut aaa_positions);
        // On release this was [2, 1]. (< note the decreasing values)
        assert_eq!(aaa_positions, &[2, 5]);
    }

    #[test]
    fn test_multiple_field_value_and_long_tokens() {
        let mut schema_builder = Schema::builder();
        let text = schema_builder.add_text_field("text", TEXT);
        let schema = schema_builder.build();

        // This is a bit of a contrived example: a single token that spans two positions.
        let rollercoaster = || PreTokenizedString {
            text: "roller-coaster".to_string(),
            tokens: vec![Token {
                offset_from: 0,
                offset_to: 14,
                position: 0,
                text: "rollercoaster".to_string(),
                position_length: 2,
            }],
        };
        // The same pre-tokenized value is added twice to the same field.
        let mut doc = TantivyDocument::default();
        doc.add_pre_tokenized_text(text, rollercoaster());
        doc.add_pre_tokenized_text(text, rollercoaster());

        let index = Index::create_in_ram(schema);
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        index_writer.add_document(doc).unwrap();
        index_writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let seg_reader = searcher.segment_reader(0);
        let inv_index = seg_reader.inverted_index(text).unwrap();
        let rollercoaster_term = Term::from_field_text(text, "rollercoaster");
        let mut postings = inv_index
            .read_postings(&rollercoaster_term, IndexRecordOption::WithFreqsAndPositions)
            .unwrap()
            .unwrap();
        assert_eq!(postings.doc(), 0u32);

        let mut token_positions = Vec::new();
        postings.positions(&mut token_positions);
        // As opposed to 0, 2 if we had a position length of 1.
        assert_eq!(token_positions, &[0, 3]);
    }

    #[test]
    fn test_last_token_not_ending_last() {
        let mut schema_builder = Schema::builder();
        let text = schema_builder.add_text_field("text", TEXT);
        let schema = schema_builder.build();

        // This is a bit of a contrived example: it is hard to think of a use case where
        // this corner case happens in real life.
        let long_token = Token {
            // Not the last token, yet ends after the last token.
            offset_from: 0,
            offset_to: 14,
            position: 0,
            text: "long_token".to_string(),
            position_length: 3,
        };
        let short_token = Token {
            offset_from: 0,
            offset_to: 14,
            position: 1,
            text: "short".to_string(),
            position_length: 1,
        };
        let pre_tokenized = PreTokenizedString {
            text: "contrived-example".to_string(),
            tokens: vec![long_token, short_token],
        };

        // A second, regular text value follows the pre-tokenized one in the same field.
        let mut doc = TantivyDocument::default();
        doc.add_pre_tokenized_text(text, pre_tokenized);
        doc.add_text(text, "hello");

        let index = Index::create_in_ram(schema);
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        index_writer.add_document(doc).unwrap();
        index_writer.commit().unwrap();

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let seg_reader = searcher.segment_reader(0);
        let inv_index = seg_reader.inverted_index(text).unwrap();
        let hello_term = Term::from_field_text(text, "hello");
        let mut postings = inv_index
            .read_postings(&hello_term, IndexRecordOption::WithFreqsAndPositions)
            .unwrap()
            .unwrap();
        assert_eq!(postings.doc(), 0u32);

        let mut hello_positions = Vec::new();
        postings.positions(&mut hello_positions);
        // As opposed to 3 if we had a position length of 1.
        assert_eq!(hello_positions, &[4]);
    }

    #[test]
    fn test_show_error_when_tokenizer_not_registered() {
        // The field refers to a tokenizer called "custom_en", which this test never
        // registers on the index.
        let indexing_options = TextFieldIndexing::default()
            .set_tokenizer("custom_en")
            .set_index_option(IndexRecordOption::WithFreqsAndPositions);
        let title_options = TextOptions::default()
            .set_indexing_options(indexing_options)
            .set_stored();
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("title", title_options);
        let index = Index::create_in_ram(schema_builder.build());

        let schema = index.schema();
        let title = schema.get_field("title").unwrap();
        let mut index_writer = index.writer(50_000_000).unwrap();
        let mut document = TantivyDocument::default();
        document.add_text(title, "The Old Man and the Sea");

        // Adding the document succeeds; the error is only reported by the commit.
        index_writer.add_document(document).unwrap();
        let commit_error = index_writer.commit().unwrap_err();
        assert_eq!(
            commit_error.to_string(),
            "Schema error: 'Error getting tokenizer for field: title'"
        );
    }
}


================================================
FILE: src/indexer/single_segment_index_writer.rs
================================================
use std::marker::PhantomData;

use crate::indexer::operation::AddOperation;
use crate::indexer::segment_updater::save_metas;
use crate::indexer::SegmentWriter;
use crate::schema::document::Document;
use crate::{Directory, Index, IndexMeta, Opstamp, Segment, TantivyDocument};

/// Index writer that puts every document it receives into one single segment.
///
/// Documents are handed directly to the wrapped `SegmentWriter`. Nothing is written to
/// the index metadata until [`SingleSegmentIndexWriter::finalize`] is called.
#[doc(hidden)]
pub struct SingleSegmentIndexWriter<D: Document = TantivyDocument> {
    /// Writer accumulating the documents of the segment.
    segment_writer: SegmentWriter,
    /// The segment being built.
    segment: Segment,
    /// Opstamp that will be given to the next added document.
    opstamp: Opstamp,
    _phantom: PhantomData<D>,
}

impl<D: Document> SingleSegmentIndexWriter<D> {
    /// Creates a writer for a brand new segment of `index`.
    ///
    /// `mem_budget` is passed on unchanged to the underlying segment writer.
    ///
    /// # Errors
    ///
    /// Returns the error of `SegmentWriter::for_segment` if the segment writer cannot
    /// be created.
    pub fn new(index: Index, mem_budget: usize) -> crate::Result<Self> {
        let segment = index.new_segment();
        let segment_writer = SegmentWriter::for_segment(mem_budget, segment.clone())?;
        let writer = Self {
            segment_writer,
            segment,
            opstamp: 0,
            _phantom: PhantomData,
        };
        Ok(writer)
    }

    /// Returns the memory usage reported by the underlying segment writer.
    pub fn mem_usage(&self) -> usize {
        self.segment_writer.mem_usage()
    }

    /// Adds `document` to the segment, stamping it with the next opstamp.
    ///
    /// The opstamp counter is advanced whether or not the segment writer accepts the
    /// document.
    pub fn add_document(&mut self, document: D) -> crate::Result<()> {
        let add_operation = AddOperation {
            opstamp: self.opstamp,
            document,
        };
        self.opstamp += 1;
        self.segment_writer.add_document(add_operation)
    }

    /// Finalizes the segment, saves index metadata listing it as the only segment, syncs
    /// the directory and returns the index.
    ///
    /// # Errors
    ///
    /// Fails if finalizing the segment, saving the metadata or syncing the directory
    /// fails.
    pub fn finalize(self) -> crate::Result<Index> {
        let Self {
            segment_writer,
            segment,
            ..
        } = self;
        // `max_doc` has to be read before `finalize` is called on the segment writer.
        let max_doc = segment_writer.max_doc();
        segment_writer.finalize()?;
        let segment = segment.with_max_doc(max_doc);
        let index = segment.index();
        let index_meta = IndexMeta {
            index_settings: index.settings().clone(),
            segments: vec![segment.meta().clone()],
            schema: index.schema(),
            // NOTE(review): the saved opstamp is always 0, regardless of how many
            // documents were added. Confirm this is intended.
            opstamp: 0,
            payload: None,
        };
        save_metas(&index_meta, index.directory())?;
        index.directory().sync_directory()?;
        Ok(index.clone())
    }
}


================================================
FILE: src/indexer/stamper.rs
================================================
use std::ops::Range;
use std::sync::atomic::{AtomicU64, Ordering};
use std::sync::Arc;

use crate::Opstamp;

/// A `Stamper` hands out `Opstamp`s: auto-incremented ids used to label operations.
///
/// The counter lives behind an `Arc`, so cloning a `Stamper` does not "fork" the
/// sequence: the clone and the original keep drawing from the same counter.
#[derive(Clone, Default)]
pub struct Stamper(Arc<AtomicU64>);

impl Stamper {
    /// Creates a stamper whose first issued stamp is `first_opstamp`.
    pub fn new(first_opstamp: Opstamp) -> Stamper {
        let counter = AtomicU64::new(first_opstamp);
        Stamper(Arc::new(counter))
    }

    /// Returns the next stamp and advances the counter by one.
    pub fn stamp(&self) -> Opstamp {
        self.0.fetch_add(1, Ordering::SeqCst)
    }

    /// Reserves `n` consecutive stamps in one atomic step and returns them as a range.
    ///
    /// The returned range is empty when `n` is 0.
    pub fn stamps(&self, n: u64) -> Range<Opstamp> {
        let first = self.0.fetch_add(n, Ordering::SeqCst);
        first..first + n
    }

    /// Resets the counter to `to_opstamp`, which becomes the next issued stamp, and
    /// returns that value.
    pub fn revert(&self, to_opstamp: Opstamp) -> Opstamp {
        self.0.store(to_opstamp, Ordering::SeqCst);
        to_opstamp
    }
}

#[cfg(test)]
mod test {

    use super::Stamper;

    /// Stamps come out in increasing order, and a clone draws from the same counter as
    /// the stamper it was cloned from.
    #[test]
    fn test_stamper() {
        let original = Stamper::new(7u64);
        for expected in 7u64..=8u64 {
            assert_eq!(original.stamp(), expected);
        }

        let shared = original.clone();
        assert_eq!(original.stamp(), 9u64);

        assert_eq!(original.stamp(), 10u64);
        assert_eq!(shared.stamp(), 11u64);
        // A batch of three stamps is handed out as one contiguous range.
        assert_eq!(original.stamps(3u64), 12..15);
        assert_eq!(original.stamp(), 15u64);
    }

    /// Reverting through one handle is visible through every clone.
    #[test]
    fn test_stamper_revert() {
        let original = Stamper::new(7u64);
        for expected in 7u64..=8u64 {
            assert_eq!(original.stamp(), expected);
        }

        let shared = original.clone();
        assert_eq!(shared.stamp(), 9u64);

        original.revert(6);
        assert_eq!(original.stamp(), 6);
        assert_eq!(shared.stamp(), 7);
    }
}


================================================
FILE: src/lib.rs
================================================
#![doc(html_logo_url = "http://fulmicoton.com/tantivy-logo/tantivy-logo.png")]
#![cfg_attr(all(feature = "unstable", test), feature(test))]
#![doc(test(attr(allow(unused_variables), deny(warnings))))]
#![warn(missing_docs)]
#![allow(
    clippy::len_without_is_empty,
    clippy::derive_partial_eq_without_eq,
    clippy::module_inception,
    clippy::needless_range_loop,
    clippy::bool_assert_comparison
)]

//! # `tantivy`
//!
//! Tantivy is a search engine library.
//! Think `Lucene`, but in Rust.
//!
//! ```rust
//! # use std::path::Path;
//! # use std::fs;
//! # use tempfile::TempDir;
//! # use tantivy::collector::TopDocs;
//! # use tantivy::query::QueryParser;
//! # use tantivy::schema::*;
//! # use tantivy::{doc, DocAddress, Index, IndexWriter, Score};
//! #
//! # fn main() {
//! #     // Let's create a temporary directory for the
//! #     // sake of this example
//! #     if let Ok(dir) = TempDir::new() {
//! #         let index_path = dir.path().join("index");
//! #         // In case the directory already exists, we remove it
//! #         let _ = fs::remove_dir_all(&index_path);
//! #         fs::create_dir_all(&index_path).unwrap();
//! #         run_example(&index_path).unwrap();
//! #     }
//! # }
//! #
//! # fn run_example(index_path: &Path) -> tantivy::Result<()> {
//! // First we need to define a schema ...
//!
//! // `TEXT` means the field should be tokenized and indexed,
//! // along with its term frequency and term positions.
//! //
//! // `STORED` means that the field will also be saved
//! // in a compressed, row-oriented key-value store.
//! // This store is useful to reconstruct the
//! // documents that were selected during the search phase.
//! let mut schema_builder = Schema::builder();
//! let title = schema_builder.add_text_field("title", TEXT | STORED);
//! let body = schema_builder.add_text_field("body", TEXT);
//! let schema = schema_builder.build();
//!
//! // Indexing documents
//!
//! let index = Index::create_in_dir(index_path, schema.clone())?;
//!
//! // Here we use a buffer of 100MB that will be split
//! // between indexing threads.
//! let mut index_writer: IndexWriter = index.writer(100_000_000)?;
//!
//! // Let's index a document!
//! index_writer.add_document(doc!(
//!     title => "The Old Man and the Sea",
//!     body => "He was an old man who fished alone in a skiff in \
//!             the Gulf Stream and he had gone eighty-four days \
//!             now without taking a fish."
//! ))?;
//!
//! // We need to call .commit() explicitly to force the
//! // index_writer to finish processing the documents in the queue,
//! // flush the current index to the disk, and advertise
//! // the existence of new documents.
//! index_writer.commit()?;
//!
//! // # Searching
//!
//! let reader = index.reader()?;
//!
//! let searcher = reader.searcher();
//!
//! let query_parser = QueryParser::for_index(&index, vec![title, body]);
//!
//! // QueryParser may fail if the query is not in the right
//! // format. For user facing applications, this can be a problem.
//! // A ticket has been opened regarding this problem.
//! let query = query_parser.parse_query("sea whale")?;
//!
//! // Perform search.
//! // `top_docs` contains the 10 most relevant doc ids, sorted by decreasing scores...
//! let top_docs: Vec<(Score, DocAddress)> =
//!     searcher.search(&query, &TopDocs::with_limit(10).order_by_score())?;
//!
//! for (_score, doc_address) in top_docs {
//!     // Retrieve the actual content of documents given its `doc_address`.
//!     let retrieved_doc = searcher.doc::<TantivyDocument>(doc_address)?;
//!     println!("{}", retrieved_doc.to_json(&schema));
//! }
//!
//! # Ok(())
//! # }
//! ```
//!
//!
//!
//! A good place for you to get started is to check out
//! the example code (
//! [literate programming](https://tantivy-search.github.io/examples/basic_search.html) /
//! [source code](https://github.com/quickwit-oss/tantivy/blob/main/examples/basic_search.rs))
//!
//! # Tantivy Architecture Overview
//!
//! Tantivy is inspired by Lucene, and its architecture is very similar.
//!
//! ## Core Concepts
//!
//! - **[Index]**: A collection of segments. The top level entry point for tantivy users to search
//!   and index data.
//!
//! - **[Segment]**: At the heart of Tantivy's indexing structure is the [Segment]. It contains
//!   documents and indices and is the atomic unit of indexing and search.
//!
//! - **[Schema](schema)**: A schema is a set of fields in an index. Each field has a specific data
//!   type and set of attributes.
//!
//! - **[IndexWriter]**: Responsible for creating and merging segments. It executes the indexing
//!   pipeline including tokenization, creating indices, and storing the index in the
//!   [Directory](directory).
//!
//! - **Searching**: [Searcher] searches the segments with anything that implements
//!   [Query](query::Query) and merges the results. See the list of [supported
//!   queries](query::Query#implementers). Custom queries are supported by implementing the
//!   [Query](query::Query) trait.
//!
//! - **[Directory](directory)**: Abstraction over the storage where the index data is stored.
//!
//! - **[Tokenizer](tokenizer)**: Breaks down text into individual tokens. Users can implement or
//!   use provided tokenizers.
//!
//! ## Architecture Flow
//!
//! 1. **Document Addition**: Users create documents according to the defined schema. The document's
//!    fields are tokenized, processed, and added to the current segment. See
//!    [Document](schema::document) for the structure and usage.
//!
//! 2. **Segment Creation**: Once the memory limit threshold is reached or a commit is called, the
//!    segment is written to the Directory. Documents are searchable after `commit`.
//!
//! 3. **Merging**: To optimize space and search speed, segments might be merged. This operation is
//!    performed in the background. Customize the merge behaviour via
//!    [IndexWriter::set_merge_policy].
#[cfg_attr(test, macro_use)]
extern crate serde_json;
#[macro_use]
extern crate log;

#[macro_use]
extern crate thiserror;

#[cfg(all(test, feature = "unstable"))]
extern crate test;

#[cfg(feature = "mmap")]
#[cfg(test)]
mod functional_test;

#[macro_use]
mod macros;
mod future_result;

// Re-exports
pub use columnar;
pub use common::{ByteCount, DateTime};
pub use query_grammar;
pub use time;

pub use crate::error::TantivyError;
pub use crate::future_result::FutureResult;

/// Tantivy result.
///
/// Within tantivy, please avoid importing `Result` using `use crate::Result`
/// and instead, refer to this as `crate::Result<T>`.
pub type Result<T> = std::result::Result<T, TantivyError>;

mod core;
pub mod indexer;

pub mod error;
pub mod tokenizer;

pub mod aggregation;
pub mod collector;
pub mod directory;
pub mod fastfield;
pub mod fieldnorm;
pub mod index;
pub mod positions;
pub mod postings;

/// Module containing the different query implementations.
pub mod query;
pub mod schema;
pub mod space_usage;
pub mod store;
pub mod termdict;

mod docset;
mod reader;

#[cfg(test)]
#[cfg(feature = "mmap")]
mod compat_tests;

pub use self::reader::{IndexReader, IndexReaderBuilder, ReloadPolicy, Warmer};
pub mod snippet;

use std::fmt;

pub use census::{Inventory, TrackedObject};
pub use common::{f64_to_u64, i64_to_u64, u64_to_f64, u64_to_i64, HasLen};
use once_cell::sync::Lazy;
use serde::{Deserialize, Serialize};

pub use self::docset::{DocSet, COLLECT_BLOCK_BUFFER_LEN, TERMINATED};
pub use crate::core::{json_utils, Executor, Searcher, SearcherGeneration};
pub use crate::directory::Directory;
pub use crate::index::{
    Index, IndexBuilder, IndexMeta, IndexSettings, InvertedIndexReader, Order, Segment,
    SegmentMeta, SegmentReader,
};
pub use crate::indexer::{IndexWriter, SingleSegmentIndexWriter};
pub use crate::schema::{Document, TantivyDocument, Term};

/// Current index format version.
///
/// This is the value stored as the index format version of the [`Version`]
/// returned by [`version()`].
pub const INDEX_FORMAT_VERSION: u32 = 7;
/// Oldest index format version this tantivy version can read.
pub const INDEX_FORMAT_OLDEST_SUPPORTED_VERSION: u32 = 4;

/// Structure version for the index.
///
/// Pairs a tantivy crate version (major, minor, patch) with an index format version.
/// Its `Debug` output is the same as its `Display` output.
#[derive(Clone, PartialEq, Eq, Serialize, Deserialize)]
pub struct Version {
    // Crate version components. For the version of the running crate these are
    // parsed from the `CARGO_PKG_VERSION_*` variables at compile time.
    major: u32,
    minor: u32,
    patch: u32,
    // For the version of the running crate this is `INDEX_FORMAT_VERSION`.
    index_format_version: u32,
}

// The `Debug` rendering of a `Version` is the same text as its `Display` rendering.
impl fmt::Debug for Version {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        <Self as fmt::Display>::fmt(self, f)
    }
}

/// Version of the running crate, built lazily on first access.
///
/// The numeric components are parsed from the `CARGO_PKG_VERSION_*` variables
/// captured at compile time through `env!`.
static VERSION: Lazy<Version> = Lazy::new(|| {
    let major = env!("CARGO_PKG_VERSION_MAJOR").parse().unwrap();
    let minor = env!("CARGO_PKG_VERSION_MINOR").parse().unwrap();
    let patch = env!("CARGO_PKG_VERSION_PATCH").parse().unwrap();
    Version {
        major,
        minor,
        patch,
        index_format_version: INDEX_FORMAT_VERSION,
    }
});

impl fmt::Display for Version {
    /// Renders as `tantivy v<major>.<minor>.<patch>, index_format v<index_format_version>`.
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.write_fmt(format_args!(
            "tantivy v{}.{}.{}, index_format v{}",
            self.major, self.minor, self.patch, self.index_format_version
        ))
    }
}

/// `Display` rendering of `VERSION`, computed once on first access.
static VERSION_STRING: Lazy<String> = Lazy::new(|| VERSION.to_string());

/// Exposes the current version of tantivy as found in Cargo.toml during compilation,
/// together with the index format version.
///
/// The returned [`Version`] displays as e.g. "tantivy v0.11.0, index_format v1".
pub fn version() -> &'static Version {
    &VERSION
}

/// Exposes the complete version of tantivy as found in Cargo.toml during compilation as a string.
/// eg. "tantivy v0.11.0, index_format v1".
pub fn version_string() -> &'static str {
    VERSION_STRING.as_str()
}

/// Defines tantivy's merging strategy.
///
/// This module only re-exports the merge policy types defined in `crate::indexer`.
pub mod merge_policy {
    pub use crate::indexer::{
        DefaultMergePolicy, LogMergePolicy, MergeCandidate, MergePolicy, NoMergePolicy,
    };
}

/// A `u32` identifying a document within a segment.
/// Documents have their `DocId` assigned incrementally,
/// as they are added in the segment.
///
/// At most, a segment can contain 2^31 documents.
pub type DocId = u32;

/// A `u64` assigned incrementally to every operation.
///
/// All operations modifying the index receive a monotonic Opstamp.
/// The resulting state of the index is consistent with the opstamp ordering.
///
/// For instance, a commit with opstamp `32_423` will reflect all Add and Delete operations
/// with an opstamp `<= 32_423`. A delete operation with opstamp n will not affect a document added
/// with opstamp `n+1`.
pub type Opstamp = u64;

/// A Score that represents the relevance of the document to the query
///
/// This is modelled internally as a `f32`. The larger the number, the more relevant
/// the document to the search query.
pub type Score = f32;

/// A `SegmentOrdinal` identifies a segment, within a `Searcher` or `Merger`.
pub type SegmentOrdinal = u32;

impl DocAddress {
    /// Creates a new DocAddress from the segment/docId pair.
    pub fn new(segment_ord: SegmentOrdinal, doc_id: DocId) -> DocAddress {
        DocAddress {
            segment_ord,
            doc_id,
        }
    }
}

/// `DocAddress` contains all the necessary information
/// to identify a document given a `Searcher` object.
///
/// It consists of an id identifying its segment, and
/// a segment-local `DocId`.
///
/// The id used for the segment is actually an ordinal
/// in the list of `Segment`s held by a `Searcher`.
///
/// The derived ordering compares `segment_ord` first, then `doc_id`.
#[derive(Debug, Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
pub struct DocAddress {
    /// The segment ordinal id that identifies the segment
    /// hosting the document in the `Searcher` it is called from.
    pub segment_ord: SegmentOrdinal,
    /// The segment-local `DocId`.
    pub doc_id: DocId,
}

#[macro_export]
/// Enable fail_point if feature is enabled.
///
/// Every arm expands to a block guarded by `#[cfg(feature = "failpoints")]`.
///
/// - `fail_point!(name)`: evaluates the fail point `name`; the callback handed to
///   `fail::eval` panics because returning a value is not supported in this form.
/// - `fail_point!(name, e)`: evaluates the fail point with callback `e` and, if it
///   yields a value, returns that value from the enclosing function.
/// - `fail_point!(name, cond, e)`: same as the previous form, but only when `cond` is true.
macro_rules! fail_point {
    ($name:expr) => {{
        #[cfg(feature = "failpoints")]
        {
            // The callback only exists to reject fail point actions that try to return a value.
            fail::eval($name, |_| {
                panic!("Return is not supported for the fail point \"{}\"", $name);
            });
        }
    }};
    ($name:expr, $e:expr) => {{
        #[cfg(feature = "failpoints")]
        {
            // `return` exits the function in which the macro was invoked.
            if let Some(res) = fail::eval($name, $e) {
                return res;
            }
        }
    }};
    ($name:expr, $cond:expr, $e:expr) => {{
        #[cfg(feature = "failpoints")]
        {
            // Delegates to the `fail` crate's own macro once the condition holds.
            if $cond {
                fail::fail_point!($name, $e);
            }
        }
    }};
}

/// Common test utilities.
#[cfg(test)]
pub mod tests {
    use std::collections::BTreeMap;

    use common::{BinarySerializable, FixedSize};
    use query_grammar::{UserInputAst, UserInputLeaf, UserInputLiteral};
    use rand::distr::{Bernoulli, Uniform};
    use rand::rngs::StdRng;
    use rand::{Rng, SeedableRng};
    use time::OffsetDateTime;

    use crate::collector::tests::TEST_COLLECTOR_WITH_SCORE;
    use crate::docset::{DocSet, TERMINATED};
    use crate::index::SegmentReader;
    use crate::merge_policy::NoMergePolicy;
    use crate::postings::Postings;
    use crate::query::{BooleanQuery, QueryParser};
    use crate::schema::*;
    use crate::{DateTime, DocAddress, Index, IndexWriter, ReloadPolicy};

    /// Serializes `O::default()` and asserts that the number of bytes written
    /// equals `O::SIZE_IN_BYTES`.
    pub fn fixed_size_test<O: BinarySerializable + FixedSize + Default>() {
        let mut serialized: Vec<u8> = Vec::new();
        let value = O::default();
        value.serialize(&mut serialized).unwrap();
        assert_eq!(serialized.len(), O::SIZE_IN_BYTES);
    }

    /// Asserts that two floating point values are close to each other.
    ///
    /// Panics if the absolute difference between `$left` and `$right` is strictly
    /// greater than `$epsilon`. When no epsilon is given, `0.0005` is used.
    #[macro_export]
    macro_rules! assert_nearly_equals {
        ($left:expr, $right:expr) => {{
            assert_nearly_equals!($left, $right, 0.0005);
        }};
        ($left:expr, $right:expr, $epsilon:expr) => {{
            // Borrow each operand once so that every expression is evaluated a single time.
            let lhs = &$left;
            let rhs = &$right;
            let tolerance = &$epsilon;
            let distance = (lhs - rhs).abs();
            if distance > *tolerance {
                panic!(
                    r#"assertion failed: `abs(left-right)>epsilon`
    left: `{:?}`,
    right: `{:?}`,
    epsilon: `{:?}`"#,
                    &*lhs, &*rhs, &*tolerance
                )
            }
        }};
    }

    /// Generates `n_elems` pseudo-random `u32` values drawn from
    /// `Uniform::new(0, max_value)`.
    ///
    /// The generator is always seeded with the same value, so repeated calls with
    /// the same arguments return the same sequence. Values may repeat and are not sorted.
    pub fn generate_nonunique_unsorted(max_value: u32, n_elems: usize) -> Vec<u32> {
        let distribution = Uniform::new(0u32, max_value).unwrap();
        let rng = StdRng::from_seed([1u8; 32]);
        rng.sample_iter(&distribution).take(n_elems).collect()
    }

    /// Returns the values of `0..n` that are kept by a Bernoulli draw of probability `ratio`.
    ///
    /// One draw is made per value, in increasing order, from a generator seeded with
    /// `[seed_val; 32]`; the result is therefore sorted and reproducible.
    pub fn sample_with_seed(n: u32, ratio: f64, seed_val: u8) -> Vec<u32> {
        let coin = Bernoulli::new(ratio).unwrap();
        let draws = StdRng::from_seed([seed_val; 32]).sample_iter(&coin);
        (0..n)
            .zip(draws)
            .filter_map(|(val, keep): (u32, bool)| keep.then_some(val))
            .collect()
    }

    /// Same as `sample_with_seed`, using the fixed seed value `4`.
    pub fn sample(n: u32, ratio: f64) -> Vec<u32> {
        const DEFAULT_SEED: u8 = 4;
        sample_with_seed(n, ratio, DEFAULT_SEED)
    }

    /// The rendered version must contain the crate version followed by the index format version.
    #[test]
    fn test_version_string() {
        use regex::Regex;
        let version_pattern = Regex::new(
            "tantivy v[0-9]{1,3}\\.[0-9]{1,3}\\.[0-9]{1,3}\\.{0,10}, index_format v[0-9]{1,5}",
        )
        .unwrap();
        let rendered = super::version().to_string();
        assert!(version_pattern.is_match(&rendered));
    }

    /// Indexes three small documents into a temp-dir backed index and commits them.
    #[test]
    #[cfg(feature = "mmap")]
    fn test_indexing() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_from_tempdir(schema_builder.build())?;
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        // Each text becomes its own document.
        for text in ["af b", "a b c", "a b c d"] {
            index_writer.add_document(doc!(text_field=>text))?;
        }
        index_writer.commit()?;
        Ok(())
    }

    /// Document frequencies are summed over everything committed so far.
    #[test]
    fn test_docfreq1() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        // Three commits; each inner slice lists the documents added before one commit.
        let commits: [&[&str]; 3] = [&["a b c"], &["a", "a a"], &["c"]];
        for texts in commits {
            for &text in texts {
                index_writer.add_document(doc!(text_field=>text))?;
            }
            index_writer.commit()?;
        }
        let reader = index.reader()?;
        let searcher = reader.searcher();
        for (token, expected_doc_freq) in [("a", 3u64), ("b", 1), ("c", 2), ("d", 0)] {
            let term = Term::from_field_text(text_field, token);
            assert_eq!(searcher.doc_freq(&term)?, expected_doc_freq);
        }
        Ok(())
    }

    /// A fieldnorm reader can be obtained even for a field no document has a value for.
    #[test]
    fn test_fieldnorm_no_docs_with_field() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let title_field = schema_builder.add_text_field("title", TEXT);
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        index_writer.add_document(doc!(text_field=>"a b c"))?;
        index_writer.commit()?;
        let index_reader = index.reader()?;
        let searcher = index_reader.searcher();
        let segment_reader = searcher.segment_reader(0);

        // The only document has three tokens in `text`.
        let text_fieldnorms = segment_reader.get_fieldnorms_reader(text_field)?;
        assert_eq!(text_fieldnorms.fieldnorm(0), 3);

        // `title` was never populated.
        let title_fieldnorms = segment_reader.get_fieldnorms_reader(title_field)?;
        assert_eq!(title_fieldnorms.fieldnorm_id(0), 0);
        Ok(())
    }

    /// The fieldnorm of a document is its number of tokens, and 0 for an empty document.
    #[test]
    fn test_fieldnorm() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        index_writer.add_document(doc!(text_field=>"a b c"))?;
        index_writer.add_document(doc!())?;
        index_writer.add_document(doc!(text_field=>"a b"))?;
        index_writer.commit()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();
        let segment_reader: &SegmentReader = searcher.segment_reader(0);
        let fieldnorms_reader = segment_reader.get_fieldnorms_reader(text_field)?;
        // (doc id, expected fieldnorm)
        for (doc_id, expected_fieldnorm) in [(0u32, 3u32), (1, 0), (2, 2)] {
            assert_eq!(fieldnorms_reader.fieldnorm(doc_id), expected_fieldnorm);
        }
        Ok(())
    }

    /// Advances `docset` until it is positioned on a document that `reader` does not
    /// report as deleted.
    ///
    /// Returns `true` if such a document was reached, `false` if the docset terminated first.
    fn advance_undeleted(docset: &mut dyn DocSet, reader: &SegmentReader) -> bool {
        loop {
            let candidate = docset.advance();
            if candidate == TERMINATED {
                return false;
            }
            if !reader.is_deleted(candidate) {
                return true;
            }
        }
    }

    /// Checks which documents are still reported as alive after three rounds of
    /// writes: a commit mixing adds and deletes, a rollback, and a rollback followed
    /// by a committed delete.
    #[test]
    fn test_delete_postings1() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let term_abcd = Term::from_field_text(text_field, "abcd");
        let term_a = Term::from_field_text(text_field, "a");
        let term_b = Term::from_field_text(text_field, "b");
        let term_c = Term::from_field_text(text_field, "c");
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        // Manual reload: the reader only sees new data after an explicit `reload()`.
        let reader = index
            .reader_builder()
            .reload_policy(ReloadPolicy::Manual)
            .try_into()
            .unwrap();
        {
            // Round 1: adds interleaved with deletes, then commit.
            // The numbered comments are the doc ids asserted on below.
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            // 0
            index_writer.add_document(doc!(text_field=>"a b"))?;
            // 1
            index_writer.add_document(doc!(text_field=>" a c"))?;
            // 2
            index_writer.add_document(doc!(text_field=>" b c"))?;
            // 3
            index_writer.add_document(doc!(text_field=>" b d"))?;

            // Issued after docs 0-3 and before docs 4-5.
            index_writer.delete_term(Term::from_field_text(text_field, "c"));
            index_writer.delete_term(Term::from_field_text(text_field, "a"));
            // 4
            index_writer.add_document(doc!(text_field=>" b c"))?;
            // 5
            index_writer.add_document(doc!(text_field=>" a"))?;
            index_writer.commit()?;
        }
        {
            // Expected: docs 0, 1 and 2 are deleted; docs 4 and 5, added after the
            // deletes, are alive even though they contain "c" / "a".
            reader.reload()?;
            let searcher = reader.searcher();
            let segment_reader = searcher.segment_reader(0);
            let inverted_index = segment_reader.inverted_index(text_field)?;
            assert!(inverted_index
                .read_postings(&term_abcd, IndexRecordOption::WithFreqsAndPositions)?
                .is_none());
            {
                let mut postings = inverted_index
                    .read_postings(&term_a, IndexRecordOption::WithFreqsAndPositions)?
                    .unwrap();
                assert!(advance_undeleted(&mut postings, segment_reader));
                assert_eq!(postings.doc(), 5);
                assert!(!advance_undeleted(&mut postings, segment_reader));
            }
            {
                let mut postings = inverted_index
                    .read_postings(&term_b, IndexRecordOption::WithFreqsAndPositions)?
                    .unwrap();
                assert!(advance_undeleted(&mut postings, segment_reader));
                assert_eq!(postings.doc(), 3);
                assert!(advance_undeleted(&mut postings, segment_reader));
                assert_eq!(postings.doc(), 4);
                assert!(!advance_undeleted(&mut postings, segment_reader));
            }
        }
        {
            // Round 2: an add and a delete that are both rolled back.
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            index_writer.add_document(doc!(text_field=>"a b"))?;
            index_writer.delete_term(Term::from_field_text(text_field, "c"));
            index_writer.rollback()?;
        }
        {
            // Expected: exactly the same state as after round 1.
            reader.reload()?;
            let searcher = reader.searcher();
            let seg_reader = searcher.segment_reader(0);
            let inverted_index = seg_reader.inverted_index(term_abcd.field())?;

            assert!(inverted_index
                .read_postings(&term_abcd, IndexRecordOption::WithFreqsAndPositions)?
                .is_none());
            {
                let mut postings = inverted_index
                    .read_postings(&term_a, IndexRecordOption::WithFreqsAndPositions)?
                    .unwrap();
                assert!(advance_undeleted(&mut postings, seg_reader));
                assert_eq!(postings.doc(), 5);
                assert!(!advance_undeleted(&mut postings, seg_reader));
            }
            {
                let mut postings = inverted_index
                    .read_postings(&term_b, IndexRecordOption::WithFreqsAndPositions)?
                    .unwrap();
                assert!(advance_undeleted(&mut postings, seg_reader));
                assert_eq!(postings.doc(), 3);
                assert!(advance_undeleted(&mut postings, seg_reader));
                assert_eq!(postings.doc(), 4);
                assert!(!advance_undeleted(&mut postings, seg_reader));
            }
        }
        {
            // Round 3: the add and the delete of "c" are rolled back; only the
            // delete of "a" issued after the rollback is committed.
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            index_writer.add_document(doc!(text_field=>"a b"))?;
            index_writer.delete_term(Term::from_field_text(text_field, "c"));
            index_writer.rollback()?;
            index_writer.delete_term(Term::from_field_text(text_field, "a"));
            index_writer.commit()?;
        }
        {
            // Expected: doc 5 is now deleted as well; doc 4 is still reachable through "c".
            reader.reload()?;
            let searcher = reader.searcher();
            let segment_reader = searcher.segment_reader(0);
            let inverted_index = segment_reader.inverted_index(term_abcd.field())?;
            assert!(inverted_index
                .read_postings(&term_abcd, IndexRecordOption::WithFreqsAndPositions)?
                .is_none());
            {
                let mut postings = inverted_index
                    .read_postings(&term_a, IndexRecordOption::WithFreqsAndPositions)?
                    .unwrap();
                assert!(!advance_undeleted(&mut postings, segment_reader));
            }
            {
                let mut postings = inverted_index
                    .read_postings(&term_b, IndexRecordOption::WithFreqsAndPositions)?
                    .unwrap();
                assert!(advance_undeleted(&mut postings, segment_reader));
                assert_eq!(postings.doc(), 3);
                assert!(advance_undeleted(&mut postings, segment_reader));
                assert_eq!(postings.doc(), 4);
                assert!(!advance_undeleted(&mut postings, segment_reader));
            }
            {
                let mut postings = inverted_index
                    .read_postings(&term_c, IndexRecordOption::WithFreqsAndPositions)?
                    .unwrap();
                assert!(advance_undeleted(&mut postings, segment_reader));
                assert_eq!(postings.doc(), 4);
                assert!(!advance_undeleted(&mut postings, segment_reader));
            }
        }
        Ok(())
    }

    /// An indexed `u64` value can be found through the postings of its term.
    #[test]
    fn test_indexed_u64() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let field = schema_builder.add_u64_field("value", INDEXED);
        let index = Index::create_in_ram(schema_builder.build());

        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        index_writer.add_document(doc!(field=>1u64))?;
        index_writer.commit()?;

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let term = Term::from_field_u64(field, 1u64);
        let inverted_index = searcher.segment_reader(0).inverted_index(term.field())?;
        let mut postings = inverted_index
            .read_postings(&term, IndexRecordOption::Basic)?
            .unwrap();
        // The single document is doc 0 and nothing follows it.
        assert_eq!(postings.doc(), 0);
        assert_eq!(postings.advance(), TERMINATED);
        Ok(())
    }

    /// An indexed negative `i64` value can be found through the postings of its term.
    #[test]
    fn test_indexed_i64() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let value_field = schema_builder.add_i64_field("value", INDEXED);
        let index = Index::create_in_ram(schema_builder.build());

        let negative_val = -1i64;
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        index_writer.add_document(doc!(value_field => negative_val))?;
        index_writer.commit()?;

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let term = Term::from_field_i64(value_field, negative_val);
        let inverted_index = searcher.segment_reader(0).inverted_index(term.field())?;
        let mut postings = inverted_index
            .read_postings(&term, IndexRecordOption::Basic)?
            .unwrap();
        // The single document is doc 0 and nothing follows it.
        assert_eq!(postings.doc(), 0);
        assert_eq!(postings.advance(), TERMINATED);
        Ok(())
    }

    /// An indexed `f64` value can be found through the postings of its term.
    #[test]
    fn test_indexed_f64() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let value_field = schema_builder.add_f64_field("value", INDEXED);
        let index = Index::create_in_ram(schema_builder.build());

        let val = std::f64::consts::PI;
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        index_writer.add_document(doc!(value_field => val))?;
        index_writer.commit()?;

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let term = Term::from_field_f64(value_field, val);
        let inverted_index = searcher.segment_reader(0).inverted_index(term.field())?;
        let mut postings = inverted_index
            .read_postings(&term, IndexRecordOption::Basic)?
            .unwrap();
        // The single document is doc 0 and nothing follows it.
        assert_eq!(postings.doc(), 0);
        assert_eq!(postings.advance(), TERMINATED);
        Ok(())
    }

    /// An indexed field that no document populates has an inverted index with zero terms.
    #[test]
    fn test_indexedfield_not_in_documents() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let absent_field = schema_builder.add_text_field("absent_text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        index_writer.add_document(doc!(text_field=>"a"))?;
        assert!(index_writer.commit().is_ok());
        let reader = index.reader()?;
        let searcher = reader.searcher();
        let absent_inverted_index = searcher.segment_reader(0).inverted_index(absent_field)?;
        let num_terms = absent_inverted_index.terms().num_terms();
        assert_eq!(num_terms, 0);
        Ok(())
    }

    /// Deleting two of eight single-term documents leaves six documents.
    #[test]
    fn test_delete_postings2() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        let reader = index
            .reader_builder()
            .reload_policy(ReloadPolicy::Manual)
            .try_into()?;

        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        for text in ["63", "70", "34", "1", "38", "33", "40", "17"] {
            index_writer.add_document(doc!(text_field=>text))?;
        }
        for deleted_text in ["38", "34"] {
            index_writer.delete_term(Term::from_field_text(text_field, deleted_text));
        }
        index_writer.commit()?;
        reader.reload()?;
        let num_docs = reader.searcher().num_docs();
        assert_eq!(num_docs, 6);
        Ok(())
    }

    /// The term frequency reported by the postings is the number of occurrences in the document.
    #[test]
    fn test_termfreq() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());

        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        index_writer.add_document(doc!(text_field=>"af af af bc bc"))?;
        index_writer.commit()?;
        // The writer is released before the index is read.
        drop(index_writer);

        let index_reader = index.reader()?;
        let searcher = index_reader.searcher();
        let segment_reader = searcher.segment_reader(0);
        let inverted_index = segment_reader.inverted_index(text_field)?;

        let term_abcd = Term::from_field_text(text_field, "abcd");
        let missing_postings =
            inverted_index.read_postings(&term_abcd, IndexRecordOption::WithFreqsAndPositions)?;
        assert!(missing_postings.is_none());

        let term_af = Term::from_field_text(text_field, "af");
        let mut postings = inverted_index
            .read_postings(&term_af, IndexRecordOption::WithFreqsAndPositions)?
            .unwrap();
        // "af" occurs three times in the only document.
        assert_eq!(postings.doc(), 0);
        assert_eq!(postings.term_freq(), 3);
        assert_eq!(postings.advance(), TERMINATED);
        Ok(())
    }

    /// Multi-term queries return every document containing at least one of the terms.
    #[test]
    fn test_searcher_1() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        let reader = index.reader()?;
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        for text in ["af af af b", "a b c", "a b c d"] {
            index_writer.add_document(doc!(text_field=>text))?;
        }
        index_writer.commit()?;

        reader.reload()?;
        let searcher = reader.searcher();
        // Runs a multi-term query over `tokens` and returns the matching addresses.
        let search_tokens = |tokens: &[&str]| -> crate::Result<Vec<DocAddress>> {
            let terms: Vec<Term> = tokens
                .iter()
                .map(|&token| Term::from_field_text(text_field, token))
                .collect();
            let query = BooleanQuery::new_multiterms_query(terms);
            let top_docs = searcher.search(&query, &TEST_COLLECTOR_WITH_SCORE)?;
            Ok(top_docs.docs().to_vec())
        };
        // All expected documents live in the segment with ordinal 0.
        let in_first_segment = |doc_ids: &[u32]| -> Vec<DocAddress> {
            doc_ids
                .iter()
                .map(|&doc_id| DocAddress::new(0, doc_id))
                .collect()
        };
        assert_eq!(search_tokens(&["a"])?, in_first_segment(&[1, 2]));
        assert_eq!(search_tokens(&["af"])?, in_first_segment(&[0]));
        assert_eq!(search_tokens(&["b"])?, in_first_segment(&[0, 1, 2]));
        assert_eq!(search_tokens(&["c"])?, in_first_segment(&[1, 2]));
        assert_eq!(search_tokens(&["d"])?, in_first_segment(&[2]));
        assert_eq!(search_tokens(&["b", "a"])?, in_first_segment(&[0, 1, 2]));
        Ok(())
    }

    /// A manually reloaded reader sees zero documents before the commit and three after it.
    #[test]
    fn test_searcher_2() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        let reader = index
            .reader_builder()
            .reload_policy(ReloadPolicy::Manual)
            .try_into()?;
        let docs_before_commit = reader.searcher().num_docs();
        assert_eq!(docs_before_commit, 0u64);

        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        for text in ["af b", "a b c", "a b c d"] {
            index_writer.add_document(doc!(text_field=>text))?;
        }
        index_writer.commit()?;
        reader.reload()?;
        let docs_after_commit = reader.searcher().num_docs();
        assert_eq!(docs_after_commit, 3u64);
        Ok(())
    }

    #[test]
    fn test_searcher_on_json_field_with_type_inference() {
        // When indexing and searching a json value, we infer its type.
        // This test aims to check that type inference is consistent between indexing and search.
        // Inference order is date, i64, u64, f64, bool.
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", STORED | TEXT);
        let schema = schema_builder.build();
        let json_val: serde_json::Value = serde_json::from_str(
            r#"{
            "signed": 2,
            "float": 2.0,
            "unsigned": 10000000000000,
            "date": "1985-04-12T23:20:50.52Z",
            "bool": true
        }"#,
        )
        .unwrap();
        let doc = doc!(json_field=>json_val);
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests().unwrap();
        writer.add_document(doc).unwrap();
        writer.commit().unwrap();
        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let get_doc_ids = |user_input_literal: UserInputLiteral| {
            let query_parser = crate::query::QueryParser::for_index(&index, Vec::new());
            let query = query_parser
                .build_query_from_user_input_ast(UserInputAst::from(UserInputLeaf::Literal(
                    user_input_literal,
                )))
                .unwrap();
            searcher
                .search(&query, &TEST_COLLECTOR_WITH_SCORE)
                .map(|topdocs| topdocs.docs().to_vec())
                .unwrap()
        };
        {
            let user_input_literal = UserInputLiteral {
                field_name: Some("json.signed".to_string()),
                phrase: "2".to_string(),
                delimiter: crate::query_grammar::Delimiter::None,
                slop: 0,
                prefix: false,
            };
            assert_eq!(get_doc_ids(user_input_literal), vec![DocAddress::new(0, 0)]);
        }
        {
            let user_input_literal = UserInputLiteral {
                field_name: Some("json.float".to_string()),
                phrase: "2.0".to_string(),
                delimiter: crate::query_grammar::Delimiter::None,
                slop: 0,
                prefix: false,
            };
            assert_eq!(get_doc_ids(user_input_literal), vec![DocAddress::new(0, 0)]);
        }
        {
            let user_input_literal = UserInputLiteral {
                field_name: Some("json.date".to_string()),
                phrase: "1985-04-12T23:20:50.52Z".to_string(),
                delimiter: crate::query_grammar::Delimiter::None,
                slop: 0,
                prefix: false,
            };
            assert_eq!(get_doc_ids(user_input_literal), vec![DocAddress::new(0, 0)]);
        }
        {
            let user_input_literal = UserInputLiteral {
                field_name: Some("json.unsigned".to_string()),
                phrase: "10000000000000".to_string(),
                delimiter: crate::query_grammar::Delimiter::None,
                slop: 0,
                prefix: false,
            };
            assert_eq!(get_doc_ids(user_input_literal), vec![DocAddress::new(0, 0)]);
        }
        {
            let user_input_literal = UserInputLiteral {
                field_name: Some("json.bool".to_string()),
                phrase: "true".to_string(),
                delimiter: crate::query_grammar::Delimiter::None,
                slop: 0,
                prefix: false,
            };
            assert_eq!(get_doc_ids(user_input_literal), vec![DocAddress::new(0, 0)]);
        }
    }

    #[test]
    fn test_doc_macro() {
        // A field may appear several times in `doc!`: every value is kept, in order.
        let mut schema_builder = Schema::builder();
        let repeated_field = schema_builder.add_text_field("text", TEXT);
        let single_field = schema_builder.add_text_field("text2", TEXT);
        let document = doc!(
            repeated_field => "tantivy",
            repeated_field => "some other value",
            single_field => "short"
        );
        assert_eq!(document.len(), 3);

        let repeated_values: Vec<OwnedValue> = document
            .get_all(repeated_field)
            .map(OwnedValue::from)
            .collect();
        assert_eq!(repeated_values.len(), 2);
        assert_eq!(repeated_values[0].as_ref().as_str(), Some("tantivy"));
        assert_eq!(
            repeated_values[1].as_ref().as_str(),
            Some("some other value")
        );

        let single_values: Vec<OwnedValue> = document
            .get_all(single_field)
            .map(OwnedValue::from)
            .collect();
        assert_eq!(single_values.len(), 1);
        assert_eq!(single_values[0].as_ref().as_str(), Some("short"));
    }

    #[test]
    fn test_wrong_fast_field_type() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let unsigned_field = schema_builder.add_u64_field("unsigned", FAST);
        let signed_field = schema_builder.add_i64_field("signed", FAST);
        let float_field = schema_builder.add_f64_field("float", FAST);
        schema_builder.add_text_field("text", TEXT);
        schema_builder.add_u64_field("stored_int", STORED);
        let schema = schema_builder.build();

        let index = Index::create_in_ram(schema);
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        index_writer.add_document(
            doc!(unsigned_field => 4u64, signed_field=>4i64, float_field=>4f64),
        )?;
        index_writer.commit()?;

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let segment_reader: &SegmentReader = searcher.segment_reader(0);
        let fast_fields = segment_reader.fast_fields();

        // Requesting a u64 column is refused for a text field, a field that is only
        // stored, and fast fields of another numerical type.
        assert!(fast_fields.u64("text").is_err());
        assert!(fast_fields.u64("stored_int").is_err());
        assert!(fast_fields.u64("signed").is_err());
        assert!(fast_fields.u64("float").is_err());

        // Requesting each column with its declared type succeeds and yields the value.
        let unsigned_column_res = fast_fields.u64("unsigned");
        assert!(unsigned_column_res.is_ok());
        assert_eq!(unsigned_column_res.unwrap().first(0), Some(4u64));

        let signed_column_res = fast_fields.i64("signed");
        assert!(signed_column_res.is_ok());
        assert_eq!(signed_column_res.unwrap().first(0), Some(4i64));

        let float_column_res = fast_fields.f64("float");
        assert!(float_column_res.is_ok());
        assert_eq!(float_column_res.unwrap().first(0), Some(4f64));
        Ok(())
    }

    // motivated by #729
    #[test]
    fn test_update_via_delete_insert() -> crate::Result<()> {
        use crate::collector::Count;
        use crate::index::SegmentId;
        use crate::indexer::NoMergePolicy;
        use crate::query::AllQuery;

        const DOC_COUNT: u64 = 2u64;

        let mut schema_builder = SchemaBuilder::default();
        let id = schema_builder.add_u64_field("id", INDEXED);
        let schema = schema_builder.build();

        let index = Index::create_in_ram(schema);
        let index_reader = index.reader()?;

        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        index_writer.set_merge_policy(Box::new(NoMergePolicy));

        // Reloads the reader, then counts all of the documents visible to a fresh searcher.
        let reload_and_count = || -> crate::Result<usize> {
            index_reader.reload()?;
            index_reader.searcher().search(&AllQuery, &Count)
        };

        for doc_id in 0u64..DOC_COUNT {
            index_writer.add_document(doc!(id => doc_id))?;
        }
        index_writer.commit()?;
        assert_eq!(reload_and_count()?, DOC_COUNT as usize);

        // update every document by deleting it and re-adding it
        for doc_id in 0u64..DOC_COUNT {
            index_writer.delete_term(Term::from_field_u64(id, doc_id));
            index_writer.commit()?;
            index_reader.reload()?;
            index_writer.add_document(doc!(id =>  doc_id))?;
            index_writer.commit()?;
            // The number of document should be stable.
            assert_eq!(reload_and_count()?, DOC_COUNT as usize);
        }

        // Merging all of the segments must not change the document count either.
        index_reader.reload()?;
        let pre_merge_searcher = index_reader.searcher();
        let segment_ids: Vec<SegmentId> = pre_merge_searcher
            .segment_readers()
            .iter()
            .map(|segment_reader| segment_reader.segment_id())
            .collect();
        index_writer.merge(&segment_ids).wait()?;
        assert_eq!(reload_and_count()?, DOC_COUNT as usize);
        Ok(())
    }

    #[test]
    fn test_validate_checksum() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let body = schema_builder.add_text_field("body", TEXT | STORED);
        let index = Index::create_in_ram(schema_builder.build());
        let mut writer: IndexWriter = index.writer_for_tests()?;
        writer.set_merge_policy(Box::new(NoMergePolicy));

        // Index 5000 "foo" documents interleaved with 5000 "boo" documents.
        for _ in 0..5000 {
            for text in ["foo", "boo"] {
                writer.add_document(doc!(body => text))?;
            }
        }
        writer.commit()?;
        let failures_after_commit = index.validate_checksum()?;
        assert!(failures_after_commit.is_empty());

        // Delete every "foo" document, then merge all of the searchable segments.
        writer.delete_term(Term::from_field_text(body, "foo"));
        writer.commit()?;
        let segment_ids = index.searchable_segment_ids()?;
        writer.merge(&segment_ids).wait()?;
        let failures_after_merge = index.validate_checksum()?;
        assert!(failures_after_merge.is_empty());
        Ok(())
    }

    #[test]
    fn test_datetime() {
        let now = OffsetDateTime::now_utc();

        // Round trip through `DateTime::from_utc`.
        let dt = DateTime::from_utc(now).into_utc();
        assert_eq!(dt.to_ordinal_date(), now.to_ordinal_date());
        assert_eq!(dt.to_hms_micro(), now.to_hms_micro());
        // We store nanosecond level precision.
        assert_eq!(dt.nanosecond(), now.nanosecond());

        // Round trip through a timestamp expressed in seconds.
        let dt = DateTime::from_timestamp_secs(now.unix_timestamp()).into_utc();
        assert_eq!(dt.to_ordinal_date(), now.to_ordinal_date());
        assert_eq!(dt.to_hms(), now.to_hms());
        // Constructed from a second precision: the sub-second part must be gone.
        // (Comparing against `now.to_hms_micro()` with `assert_ne!` would spuriously fail
        // whenever `now` happens to have no sub-second microseconds.)
        assert_eq!(dt.nanosecond(), 0);

        // Round trip through a timestamp expressed in microseconds.
        let dt =
            DateTime::from_timestamp_micros((now.unix_timestamp_nanos() / 1_000) as i64).into_utc();
        assert_eq!(dt.to_ordinal_date(), now.to_ordinal_date());
        assert_eq!(dt.to_hms_micro(), now.to_hms_micro());

        // Round trip starting from a fixed timestamp expressed in nanoseconds.
        let dt_from_ts_nanos =
            OffsetDateTime::from_unix_timestamp_nanos(1492432621123456789).unwrap();
        let offset_dt = DateTime::from_utc(dt_from_ts_nanos).into_utc();
        assert_eq!(
            dt_from_ts_nanos.to_ordinal_date(),
            offset_dt.to_ordinal_date()
        );
        assert_eq!(dt_from_ts_nanos.to_hms_micro(), offset_dt.to_hms_micro());
    }

    #[test]
    fn test_json_number_ambiguity() {
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("number", crate::schema::TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut index_writer = index.writer_for_tests().unwrap();

        // Index the number one three times: as an i64, as a u64 and as an f64.
        let one_in_each_type = [
            OwnedValue::I64(1i64),
            OwnedValue::U64(1u64),
            OwnedValue::F64(1.0f64),
        ];
        for number in one_in_each_type {
            let mut obj = BTreeMap::default();
            obj.insert("key".to_string(), number);
            let mut doc = TantivyDocument::new();
            doc.add_object(json_field, obj);
            index_writer.add_document(doc).unwrap();
        }
        index_writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        assert_eq!(searcher.num_docs(), 3);

        // Both spellings of the number are expected to match all three documents.
        let parser = QueryParser::for_index(&index, vec![]);
        let count_matches = |user_query: &str| {
            let query = parser.parse_query(user_query).unwrap();
            searcher.search(&query, &crate::collector::Count).unwrap()
        };
        assert_eq!(count_matches("number.key:1"), 3);
        assert_eq!(count_matches("number.key:1.0"), 3);
    }
}


================================================
FILE: src/macros.rs
================================================
/// `doc!` is a shortcut that helps building `Document`
/// objects.
///
/// Assuming that `field1` and `field2` are `Field` instances.
/// You can create a document with a value of `value1` for `field1`
/// `value2` for `field2`, as follows :
///
/// ```c
/// doc!(
///     field1 => value1,
///     field2 => value2,
/// )
/// ```
///
/// The value can be, for instance, a `u64`, an `i64`, a `&str` or a `String`.
/// The same field may be listed several times, and a trailing comma is accepted.
///
/// # Warning
///
/// The document hence created, is not yet validated against a schema.
/// Nothing prevents its user from creating an invalid document missing a
/// field, or associating a `String` to a `u64` field for instance.
///
/// # Example
///
/// ```rust
/// use tantivy::schema::{Schema, TEXT, FAST};
/// use tantivy::doc;
///
/// //...
///
/// # fn main() {
/// let mut schema_builder = Schema::builder();
/// let title = schema_builder.add_text_field("title", TEXT);
/// let author = schema_builder.add_text_field("text", TEXT);
/// let likes = schema_builder.add_u64_field("num_u64", FAST);
/// let schema = schema_builder.build();
/// let doc = doc!(
///     title => "Life Aquatic",
///     author => "Wes Anderson",
///     likes => 4u64
/// );
/// # }
/// ```
#[macro_export]
macro_rules! doc(
    () => {
        {
            ($crate::TantivyDocument::default())
        }
    }; // avoids a warning due to the useless `mut`.
    ($($field:expr => $value:expr),*) => {
        {
            let mut document = $crate::TantivyDocument::default();
            $(
                document.add_field_value($field, &$value);
            )*
            document
        }
    };
    // if there is a trailing comma retry with the trailing comma stripped.
    // The recursive call goes through `$crate` so that it also resolves when the caller
    // invoked the macro by path without importing it.
    ($($field:expr => $value:expr),+ ,) => {
        $crate::doc!( $( $field => $value ), *)
    };
);

#[cfg(test)]
mod test {
    use crate::schema::{Schema, FAST, TEXT};

    /// `doc!` accepts a comma separated list of `field => value` pairs.
    #[test]
    fn test_doc_basic() {
        let mut builder = Schema::builder();
        let title_field = builder.add_text_field("title", TEXT);
        let author_field = builder.add_text_field("text", TEXT);
        let likes_field = builder.add_u64_field("num_u64", FAST);
        let _schema = builder.build();
        let _doc = doc!(
            title_field => "Life Aquatic",
            author_field => "Wes Anderson",
            likes_field => 4u64
        );
    }

    /// Same as `test_doc_basic`, but the last pair is followed by a comma.
    #[test]
    fn test_doc_trailing_comma() {
        let mut builder = Schema::builder();
        let title_field = builder.add_text_field("title", TEXT);
        let author_field = builder.add_text_field("text", TEXT);
        let likes_field = builder.add_u64_field("num_u64", FAST);
        let _schema = builder.build();
        let _doc = doc!(
            title_field => "Life Aquatic",
            author_field => "Wes Anderson",
            likes_field => 4u64,
        );
    }
}


================================================
FILE: src/positions/mod.rs
================================================
//! Tantivy can (if instructed to do so in the schema) store the term positions in a given field.
//!
//! This position is expressed as token ordinal. For instance,
//! In "The beauty and the beast", the term "the" appears in position 0 and position 3.
//! This information is useful to run phrase queries.
//!
//! The [position](crate::index::SegmentComponent::Positions) file contains all of the
//! bitpacked positions delta, for all terms of a given field, one term after the other.
//!
//! Each term is encoded independently.
//! Like for posting lists, tantivy relies on simd bitpacking to encode the positions delta in
//! blocks of 128 deltas. Because we rarely have a multiple of 128, the final block encodes
//! the remaining values with variable int encoding.
//!
//! In order to make reading possible, the term delta positions first encode the number of
//! bitpacked blocks, then the bitwidth for each block, then the actual bitpacked blocks and finally
//! the final variable int encoded block.
//!
//! Contrary to posting lists, the reader does not know the number of positions that are encoded,
//! and instead stops decoding the last block when its byte slice has been entirely read.
//!
//! More formally:
//! * *Positions* := *NumBitPackedBlocks* *BitPackedPositionsDeltaBitWidth*
//!   *BitPackedPositionBlock*^(P/128) *VIntPosDeltas*?
//! * *NumBitPackedBlocks* := *P* / 128 encoded as a variable byte integer.
//! * *BitPackedPositionBlock* := bit width encoded block of 128 positions delta
//! * *BitPackedPositionsDeltaBitWidth* := (*BitWidth*: u8)^*NumBitPackedBlocks*
//! * *VIntPosDeltas* := *VIntPosDelta*^(*P* % 128).
//!
//! Encoding the bit widths separately makes it easy and fast to skip over n positions.
mod reader;
mod serializer;

use bitpacking::{BitPacker, BitPacker4x};

pub use self::reader::PositionReader;
pub use self::serializer::PositionSerializer;

// Number of position deltas held by one bitpacked block.
// It is the block length of the `BitPacker4x` bitpacker.
const COMPRESSION_BLOCK_SIZE: usize = BitPacker4x::BLOCK_LEN;

#[cfg(test)]
pub(crate) mod tests {

    use proptest::prelude::*;
    use proptest::sample::select;

    use super::PositionSerializer;
    use crate::directory::OwnedBytes;
    use crate::positions::reader::PositionReader;

    /// Serializes `vals` as the position deltas of a single term and returns the
    /// resulting bytes.
    fn create_positions_data(vals: &[u32]) -> crate::Result<OwnedBytes> {
        let mut serialized: Vec<u8> = Vec::new();
        {
            let mut serializer = PositionSerializer::new(&mut serialized);
            serializer.write_positions_delta(vals);
            serializer.close_term()?;
            serializer.close()?;
        }
        Ok(OwnedBytes::new(serialized))
    }

    /// Strategy generating a list of position deltas.
    ///
    /// The length of the list is picked amongst values sitting around the multiples of
    /// the 128-delta block size, and every delta is picked amongst a few powers of two.
    fn gen_delta_positions() -> BoxedStrategy<Vec<u32>> {
        const LENGTHS: &[usize] = &[0, 1, 70, 127, 128, 129, 200, 255, 256, 257, 270];
        const DELTAS: &[u32] = &[1u32, 2u32, 4u32, 8u32, 16u32];
        select(LENGTHS)
            .prop_flat_map(|num_delta_positions| {
                proptest::collection::vec(select(DELTAS), num_delta_positions)
            })
            .boxed()
    }

    proptest! {
        #[test]
        fn test_position_delta(delta_positions in gen_delta_positions()) {
            // Every delta is read back individually, through a buffer of length one.
            let serialized = create_positions_data(&delta_positions).unwrap();
            let mut position_reader = PositionReader::open(serialized).unwrap();
            let mut single_delta = [0u32; 1];
            for (offset, expected_delta) in delta_positions.iter().copied().enumerate() {
                position_reader.read(offset as u64, &mut single_delta[..]);
                assert_eq!(expected_delta, single_delta[0]);
            }
        }
    }

    #[test]
    fn test_position_read() -> crate::Result<()> {
        let position_deltas: Vec<u32> = (0..1000).collect();
        let positions_data = create_positions_data(&position_deltas[..])?;
        assert_eq!(positions_data.len(), 1224);
        let mut position_reader = PositionReader::open(positions_data)?;
        // Read prefixes of various lengths, sitting on both sides of the block boundaries.
        for &n in &[1, 10, 127, 128, 130, 312] {
            let mut v = vec![0u32; n];
            position_reader.read(0, &mut v[..]);
            // Check the buffer that was just decoded. Asserting on `position_deltas`
            // itself would only compare the input with its own definition.
            assert_eq!(&v[..], &position_deltas[..n]);
        }
        Ok(())
    }

    #[test]
    fn test_empty_position() -> crate::Result<()> {
        // A term closed without any position written must still yield readable data.
        let mut serialized: Vec<u8> = Vec::new();
        {
            let mut serializer = PositionSerializer::new(&mut serialized);
            serializer.close_term()?;
            serializer.close()?;
        }
        let open_result = PositionReader::open(OwnedBytes::new(serialized));
        assert!(open_result.is_ok());
        Ok(())
    }

    #[test]
    fn test_multiple_write_positions() -> crate::Result<()> {
        // The deltas of one term are handed over through several calls.
        let mut serialized: Vec<u8> = Vec::new();
        {
            let mut serializer = PositionSerializer::new(&mut serialized);
            serializer.write_positions_delta(&[1u32, 12u32]);
            serializer.write_positions_delta(&[4u32, 17u32]);
            serializer.write_positions_delta(&[443u32]);
            serializer.close_term()?;
            serializer.close()?;
        }
        let mut position_reader = PositionReader::open(OwnedBytes::new(serialized))?;
        let mut decoded_deltas = [0u32; 5];
        position_reader.read(0, &mut decoded_deltas[..]);
        // They are read back as one contiguous sequence.
        assert_eq!(
            &decoded_deltas[..],
            &[1u32, 12u32, 4u32, 17u32, 443u32]
        );
        Ok(())
    }

    #[test]
    fn test_position_read_with_offset() -> crate::Result<()> {
        const OFFSETS: [u64; 6] = [1u64, 10u64, 127u64, 128u64, 130u64, 312u64];
        const LENGTHS: [usize; 4] = [1, 10, 130, 500];

        // The i-th delta is equal to i, which makes the expected values easy to derive.
        let position_deltas: Vec<u32> = (0..1000).collect();
        let positions_data = create_positions_data(&position_deltas[..])?;
        assert_eq!(positions_data.len(), 1224);
        let mut position_reader = PositionReader::open(positions_data)?;
        for offset in OFFSETS {
            for len in LENGTHS {
                let mut decoded = vec![0u32; len];
                position_reader.read(offset, &mut decoded[..]);
                for (i, &value) in decoded.iter().enumerate() {
                    assert_eq!(value, i as u32 + offset as u32);
                }
            }
        }
        Ok(())
    }

    #[test]
    fn test_position_read_after_skip() -> crate::Result<()> {
        let position_deltas: Vec<u32> = (0..1_000).collect();
        let positions_data = create_positions_data(&position_deltas[..])?;
        assert_eq!(positions_data.len(), 1224);

        let mut position_reader = PositionReader::open(positions_data)?;
        let mut buf = [0u32; 7];
        // Walk over the first 700 deltas, 7 at a time.
        for step in 0..100u64 {
            let offset = step * 7;
            // Each window is deliberately read twice before being checked.
            position_reader.read(offset, &mut buf);
            position_reader.read(offset, &mut buf);
            for (i, &el) in buf.iter().enumerate() {
                // The delta stored at a given offset is equal to that offset.
                assert_eq!(offset as u32 + i as u32, el);
            }
        }
        Ok(())
    }

    #[test]
    fn test_position_reread_anchor_different_than_block() -> crate::Result<()> {
        let positions_delta: Vec<u32> = (0..2_000_000).collect();
        let positions_data = create_positions_data(&positions_delta[..])?;
        assert_eq!(positions_data.len(), 5003499);
        let mut position_reader = PositionReader::open(positions_data)?;
        let mut buf = [0u32; 256];
        // The same two-block window is read twice in a row. After the first pass, the
        // loaded block is the one following the anchor block.
        for _ in 0..2 {
            position_reader.read(128, &mut buf);
            for (i, &value) in buf.iter().enumerate() {
                assert_eq!(value, (128 + i) as u32);
            }
        }
        Ok(())
    }

    #[test]
    fn test_position_requesting_passed_block() -> crate::Result<()> {
        let positions_delta: Vec<u32> = (0..512).collect();
        let positions_data = create_positions_data(&positions_delta[..])?;
        assert_eq!(positions_data.len(), 533);
        let mut position_reader = PositionReader::open(positions_data)?;
        let mut single_delta = [0u32; 1];
        // Read in the second block first, then go back to the first block.
        for offset in [230u64, 9u64] {
            position_reader.read(offset, &mut single_delta);
            assert_eq!(single_delta[0], offset as u32);
        }
        Ok(())
    }

    #[test]
    fn test_position() -> crate::Result<()> {
        const CONST_VAL: u32 = 9u32;
        // Two million times the same delta.
        let positions_delta: Vec<u32> = vec![CONST_VAL; 2_000_000];
        let positions_data = create_positions_data(&positions_delta[..])?;
        assert_eq!(positions_data.len(), 1_015_627);
        let mut position_reader = PositionReader::open(positions_data)?;
        let mut first_delta = [0u32; 1];
        position_reader.read(0, &mut first_delta);
        assert_eq!(first_delta[0], CONST_VAL);
        Ok(())
    }

    #[test]
    fn test_position_advance() -> crate::Result<()> {
        let positions_delta: Vec<u32> = (0..2_000_000).collect();
        let positions_data = create_positions_data(&positions_delta[..])?;
        assert_eq!(positions_data.len(), 5_003_499);
        let far_offsets: [u64; 5] = [
            10,
            128 * 1024,
            128 * 1024 - 1,
            128 * 1024 + 7,
            128 * 10 * 1024 + 10,
        ];
        for offset in far_offsets {
            // A fresh reader is opened for every offset, so each read starts from the
            // beginning of the data.
            let mut position_reader = PositionReader::open(positions_data.clone())?;
            let mut single_delta = [0u32; 1];
            position_reader.read(offset, &mut single_delta);
            assert_eq!(single_delta[0], offset as u32);
        }
        Ok(())
    }
}


================================================
FILE: src/positions/reader.rs
================================================
use std::io;

use common::{BinarySerializable, VInt};

use crate::directory::OwnedBytes;
use crate::positions::COMPRESSION_BLOCK_SIZE;
use crate::postings::compression::{BlockDecoder, VIntDecoder};

/// When accessing the positions of a term, we get a positions_idx from the `Terminfo`.
/// This means we need to skip to the `nth` position efficiently.
///
/// Blocks are compressed using bitpacking, so `bit_widths` contains the number of bits
/// (values can go from 0 to 32 bits) required to decompress every block.
///
/// A given block obviously takes `(128 x  num_bit_for_the_block / num_bits_in_a_byte)`,
/// so skipping a block without decompressing it is just a matter of advancing that many
/// bytes.
#[derive(Clone)]
pub struct PositionReader {
    // One byte per bitpacked block that has not been skipped yet: the bit width of the block.
    bit_widths: OwnedBytes,
    // Encoded position deltas, starting at the anchor block.
    positions: OwnedBytes,

    // Holds the decoded values of the block currently loaded.
    block_decoder: BlockDecoder,

    // offset, expressed in positions, for the first position of the block currently loaded
    // block_offset is a multiple of COMPRESSION_BLOCK_SIZE.
    // It is set to `i64::MAX` as long as no block has been loaded.
    block_offset: u64,
    // offset, expressed in positions, for the position of the first block encoded
    // in the `self.positions` bytes, and if bitpacked, compressed using the bitwidth in
    // `self.bit_widths`.
    //
    // As we advance, anchor increases simultaneously with bit_widths and positions get consumed.
    anchor_offset: u64,

    // These are just copies used for .reset().
    original_bit_widths: OwnedBytes,
    original_positions: OwnedBytes,
}

impl PositionReader {
    /// Open and reads the term positions encoded into the positions_data owned bytes.
    ///
    /// The data starts with the number of bitpacked blocks, encoded as a `VInt`, followed by
    /// one bit width byte per bitpacked block, and finally by the encoded positions.
    ///
    /// # Errors
    ///
    /// Returns an error if the number of blocks cannot be deserialized, and an
    /// `InvalidData` error if the data is too short to hold one bit width per announced
    /// block.
    pub fn open(mut positions_data: OwnedBytes) -> io::Result<PositionReader> {
        let num_positions_bitpacked_blocks = VInt::deserialize(&mut positions_data)?.0 as usize;
        // Splitting beyond the end of the data would panic: report truncated or corrupted
        // data as an error instead.
        if num_positions_bitpacked_blocks > positions_data.len() {
            return Err(io::Error::new(
                io::ErrorKind::InvalidData,
                "positions data is too short to hold the bit width of every bitpacked block",
            ));
        }
        let (bit_widths, positions) = positions_data.split(num_positions_bitpacked_blocks);
        Ok(PositionReader {
            bit_widths: bit_widths.clone(),
            positions: positions.clone(),
            block_decoder: BlockDecoder::default(),
            // No block is loaded yet.
            block_offset: i64::MAX as u64,
            anchor_offset: 0u64,
            original_bit_widths: bit_widths,
            original_positions: positions,
        })
    }

    /// Moves the anchor back to the first block and marks that no block is loaded.
    ///
    /// The bit widths and the positions are restored from the copies taken in `open`.
    fn reset(&mut self) {
        self.anchor_offset = 0u64;
        self.block_offset = i64::MAX as u64;
        self.bit_widths = self.original_bit_widths.clone();
        self.positions = self.original_positions.clone();
    }

    /// Skips `num_blocks` bitpacked blocks without decompressing them, and moves the
    /// anchor accordingly.
    ///
    /// Panics if there are not that many remaining blocks.
    fn advance_num_blocks(&mut self, num_blocks: usize) {
        // The number of bytes of a block is entirely determined by its bit width.
        let skipped_bit_widths = &self.bit_widths.as_ref()[..num_blocks];
        let total_bit_width: usize = skipped_bit_widths
            .iter()
            .map(|&bit_width| bit_width as usize)
            .sum();
        let num_bytes_to_skip = total_bit_width * COMPRESSION_BLOCK_SIZE / 8;
        self.bit_widths.advance(num_blocks);
        self.positions.advance(num_bytes_to_skip);
        self.anchor_offset += (num_blocks * COMPRESSION_BLOCK_SIZE) as u64;
    }

    /// Decompresses a block into the block decoder and records it as the loaded block.
    ///
    /// block_rel_id is counted relatively to the anchor.
    /// block_rel_id = 0 means the anchor block.
    /// block_rel_id = i means the ith block after the anchor block.
    fn load_block(&mut self, block_rel_id: usize) {
        let bit_widths = self.bit_widths.as_slice();
        // Byte offset of the requested block, obtained by jumping over the bitpacked
        // blocks located between the anchor and that block.
        let preceding_bit_width: usize = bit_widths[0..block_rel_id]
            .iter()
            .map(|&bit_width| bit_width as usize)
            .sum();
        let byte_offset = preceding_bit_width * COMPRESSION_BLOCK_SIZE / 8;
        let compressed_data = &self.positions.as_slice()[byte_offset..];
        match bit_widths.get(block_rel_id) {
            Some(&bit_width) => {
                // that block is bitpacked.
                self.block_decoder
                    .uncompress_block_unsorted(compressed_data, bit_width, false);
            }
            None => {
                // that block is vint encoded.
                self.block_decoder
                    .uncompress_vint_unsorted_until_end(compressed_data);
            }
        }
        self.block_offset = self.anchor_offset + (block_rel_id * COMPRESSION_BLOCK_SIZE) as u64;
    }

    /// Fills a buffer with the positions `[offset..offset+output.len())` integers.
    ///
    /// This function is optimized to be called with increasing values of `offset`.
    /// An `offset` located before the current anchor is also accepted: the reader is then
    /// reset and skips forward again from the first block.
    pub fn read(&mut self, mut offset: u64, mut output: &mut [u32]) {
        if offset < self.anchor_offset {
            self.reset();
        }
        // When no block is loaded, `block_offset` is `i64::MAX`: the delta is then negative
        // and lies outside of the range checked below.
        let delta_to_block_offset = offset as i64 - self.block_offset as i64;
        if !(0..COMPRESSION_BLOCK_SIZE as i64).contains(&delta_to_block_offset) {
            // The first position is not within the first block.
            // (Note that it could be before or after)
            // We need to possibly skip a few blocks, and decompress the first relevant  block.
            let delta_to_anchor_offset = offset - self.anchor_offset;
            let num_blocks_to_skip =
                (delta_to_anchor_offset / (COMPRESSION_BLOCK_SIZE as u64)) as usize;
            self.advance_num_blocks(num_blocks_to_skip);
            self.load_block(0);
        } else {
            // The request offset is within the loaded block.
            // We still need to advance anchor_offset to our current block.
            let num_blocks_to_skip =
                ((self.block_offset - self.anchor_offset) / COMPRESSION_BLOCK_SIZE as u64) as usize;
            self.advance_num_blocks(num_blocks_to_skip);
        }

        // At this point, the block containing offset is loaded, and anchor has
        // been updated to point to it as well.
        for i in 1.. {
            // we copy the part from block i - 1 that is relevant.
            let offset_in_block = (offset as usize) % COMPRESSION_BLOCK_SIZE;
            let remaining_in_block = COMPRESSION_BLOCK_SIZE - offset_in_block;
            if remaining_in_block >= output.len() {
                // The rest of the request fits in the loaded block: we are done.
                output.copy_from_slice(
                    &self.block_decoder.output_array()[offset_in_block..][..output.len()],
                );
                break;
            }
            output[..remaining_in_block]
                .copy_from_slice(&self.block_decoder.output_array()[offset_in_block..]);
            output = &mut output[remaining_in_block..];
            // we load block #i if necessary.
            // `offset` now points to the first position of that block.
            offset += remaining_in_block as u64;
            self.load_block(i);
        }
    }
}


================================================
FILE: src/positions/serializer.rs
================================================
use std::io::{self, Write};

use common::{BinarySerializable, CountingWriter, VInt};

use crate::positions::COMPRESSION_BLOCK_SIZE;
use crate::postings::compression::{BlockEncoder, VIntEncoder};

/// The PositionSerializer is in charge of serializing all of the positions
/// of all of the terms of a given field.
///
/// It is valid to call `write_positions_delta` more than once per term.
pub struct PositionSerializer<W: io::Write> {
    block_encoder: BlockEncoder,
    // Output, wrapped in order to keep track of the number of bytes written so far.
    positions_wrt: CountingWriter<W>,
    positions_buffer: Vec<u8>,
    // Position deltas waiting to be encoded. It holds at most COMPRESSION_BLOCK_SIZE values.
    block: Vec<u32>,
    // NOTE(review): presumably the bit width of every bitpacked block of the current
    // term. The code filling it is not visible from here, to be confirmed.
    bit_widths: Vec<u8>,
}

impl<W: io::Write> PositionSerializer<W> {
    /// Creates a new PositionSerializer writing into the given positions_wrt.
    pub fn new(positions_wrt: W) -> PositionSerializer<W> {
        PositionSerializer {
            block_encoder: BlockEncoder::new(),
            positions_wrt: CountingWriter::wrap(positions_wrt),
            positions_buffer: Vec::with_capacity(128_000),
            // The pending block is flushed as soon as it reaches COMPRESSION_BLOCK_SIZE
            // elements, so it never needs more room than that.
            block: Vec::with_capacity(COMPRESSION_BLOCK_SIZE),
            bit_widths: Vec::new(),
        }
    }

    /// Returns the number of bytes written in the positions write object
    /// at this point.
    /// When called before writing the positions of a term, this value is used as
    /// start offset.
    /// When called after writing the positions of a term, this value is used as
    /// end offset.
    pub fn written_bytes(&self) -> u64 {
        self.positions_wrt.written_bytes()
    }

    /// Number of deltas that can still be appended to the pending block
    /// before it is full.
    fn remaining_block_len(&self) -> usize {
        COMPRESSION_BLOCK_SIZE - self.block.len()
    }

    /// Writes all of the given positions delta.
    ///
    /// The deltas are accumulated in the pending block; every time the block
    /// becomes full it is encoded into the term buffer.
    pub fn write_positions_delta(&mut self, mut positions_delta: &[u32]) {
        while !positions_delta.is_empty() {
            let num_to_write = self.remaining_block_len().min(positions_delta.len());
            let (to_write, rest) = positions_delta.split_at(num_to_write);
            self.block.extend_from_slice(to_write);
            positions_delta = rest;
            if self.remaining_block_len() == 0 {
                self.flush_block();
            }
        }
    }

    /// Encodes the pending block into `positions_buffer` and empties it.
    ///
    /// A full block is bitpacked and its bit width is recorded in `bit_widths`.
    /// An incomplete block is vint-encoded instead and records no bit width.
    /// Does nothing if no delta is pending.
    fn flush_block(&mut self) {
        if self.block.is_empty() {
            return;
        }
        if self.block.len() == COMPRESSION_BLOCK_SIZE {
            let (bit_width, block_encoded): (u8, &[u8]) = self
                .block_encoder
                .compress_block_unsorted(&self.block[..], false);
            self.bit_widths.push(bit_width);
            self.positions_buffer.extend_from_slice(block_encoded);
        } else {
            debug_assert!(self.block.len() < COMPRESSION_BLOCK_SIZE);
            let block_vint_encoded = self.block_encoder.compress_vint_unsorted(&self.block[..]);
            self.positions_buffer.extend_from_slice(block_vint_encoded);
        }
        self.block.clear();
    }

    /// Close the positions for the current term.
    ///
    /// Writes, in this order: the number of bitpacked blocks (as a VInt), the
    /// bit width of each of these blocks, and finally the encoded blocks.
    /// The per-term buffers are then cleared for the next term.
    ///
    /// # Errors
    ///
    /// Returns any error reported by the underlying writer.
    pub fn close_term(&mut self) -> io::Result<()> {
        self.flush_block();
        VInt(self.bit_widths.len() as u64).serialize(&mut self.positions_wrt)?;
        self.positions_wrt.write_all(&self.bit_widths[..])?;
        self.positions_wrt.write_all(&self.positions_buffer)?;
        self.bit_widths.clear();
        self.positions_buffer.clear();
        Ok(())
    }

    /// Consumes the serializer and flushes the underlying writer.
    ///
    /// This does not call `close_term`: positions that were written since the
    /// last `close_term` call are not emitted by this method.
    pub fn close(mut self) -> io::Result<()> {
        self.positions_wrt.flush()
    }
}


================================================
FILE: src/postings/block_search.rs
================================================
use crate::postings::compression::COMPRESSION_BLOCK_SIZE;

/// Search the first index containing an element greater or equal to
/// the target.
///
/// The results should be equivalent to
/// ```compile_fail
/// block[..]
//       .iter()
//       .take_while(|&&val| val < target)
//       .count()
/// ```
/// 
/// the `start` argument is just used to hint that the response is
/// greater than beyond `start`. The implementation may or may not use
/// it for optimization.
///
/// # Assumption
///
/// - The block is sorted. Some elements may appear several times. This is the case at the
///   end of the last block for instance.
/// - The target is assumed smaller or equal to the last element of the block.
pub fn branchless_binary_search(arr: &[u32; COMPRESSION_BLOCK_SIZE], target: u32) -> usize {
    let mut start = 0;
    let mut len = arr.len();
    for _ in 0..7 {
        len /= 2;
        let pivot = unsafe { *arr.get_unchecked(start + len - 1) };
        if pivot < target {
            start += len;
        }
    }
    start
}

#[cfg(test)]
mod tests {
    use std::collections::HashSet;

    use proptest::prelude::*;

    use super::branchless_binary_search;
    use crate::docset::TERMINATED;
    use crate::postings::compression::COMPRESSION_BLOCK_SIZE;

    /// Reference implementation: index of the first element that is not smaller
    /// than `target`, or `block.len()` if there is none.
    fn search_in_block_trivial_but_slow(block: &[u32], target: u32) -> usize {
        block
            .iter()
            .position(|&val| val >= target)
            .unwrap_or(block.len())
    }

    /// Checks `branchless_binary_search` against the reference implementation
    /// for a single target.
    fn util_test_search_in_block(block: &[u32], target: u32) {
        let expected_idx = search_in_block_trivial_but_slow(block, target);
        assert!(expected_idx < COMPRESSION_BLOCK_SIZE);
        assert!(block[expected_idx] >= target);
        if expected_idx > 0 {
            assert!(block[expected_idx - 1] < target);
        }
        assert_eq!(block.len(), COMPRESSION_BLOCK_SIZE);
        let mut padded_block = [TERMINATED; COMPRESSION_BLOCK_SIZE];
        padded_block[..block.len()].copy_from_slice(block);
        assert_eq!(
            branchless_binary_search(&padded_block, target),
            expected_idx
        );
    }

    /// Runs the check for 0, for every value of the block, and for every
    /// value of the block minus one.
    fn util_test_search_in_block_all(block: &[u32]) {
        let mut targets = HashSet::new();
        targets.insert(0);
        for &val in block {
            if let Some(just_below) = val.checked_sub(1) {
                targets.insert(just_below);
            }
            targets.insert(val);
        }
        for target in targets {
            util_test_search_in_block(block, target);
        }
    }

    #[test]
    fn test_search_in_branchless_binary_search() {
        let even_numbers: Vec<u32> = (0..COMPRESSION_BLOCK_SIZE as u32).map(|i| i * 2).collect();
        util_test_search_in_block_all(&even_numbers[..]);
    }

    /// Generates non-decreasing blocks by accumulating random deltas in `0..5`.
    fn monotonous_block() -> impl Strategy<Value = Vec<u32>> {
        prop::collection::vec(0u32..5u32, COMPRESSION_BLOCK_SIZE).prop_map(|mut deltas| {
            let mut running_sum = 0;
            for delta in deltas.iter_mut() {
                running_sum += *delta;
                *delta = running_sum;
            }
            deltas
        })
    }

    proptest! {
        #[test]
        fn test_proptest_branchless_binary_search(block in monotonous_block()) {
            util_test_search_in_block_all(&block[..]);
        }
    }
}


================================================
FILE: src/postings/block_segment_postings.rs
================================================
use std::io;

use common::VInt;

use crate::directory::{FileSlice, OwnedBytes};
use crate::fieldnorm::FieldNormReader;
use crate::postings::compression::{BlockDecoder, VIntDecoder, COMPRESSION_BLOCK_SIZE};
use crate::postings::{BlockInfo, FreqReadingOption, SkipReader};
use crate::query::Bm25Weight;
use crate::schema::IndexRecordOption;
use crate::{DocId, Score, TERMINATED};

/// Returns the largest score yielded by `it`, or `None` if `it` yields nothing.
fn max_score<I: Iterator<Item = Score>>(it: I) -> Option<Score> {
    it.reduce(Score::max)
}

/// `BlockSegmentPostings` is a cursor iterating over blocks
/// of documents.
///
/// # Warning
///
/// While it is useful for some very specific high-performance
/// use cases, you should prefer using `SegmentPostings` for most usage.
#[derive(Clone)]
pub struct BlockSegmentPostings {
    /// Decoder holding the doc ids of the current block.
    pub(crate) doc_decoder: BlockDecoder,
    /// Whether the block the skip reader points to has been decoded.
    /// Cleared when moving to another block, set by `load_block`.
    block_loaded: bool,
    /// Decoder holding the term frequencies of the current block.
    /// It is only fed when `freq_reading_option` is `ReadFreq`.
    freq_decoder: BlockDecoder,
    /// Whether term frequencies are absent, skipped or read; decided in `open`.
    freq_reading_option: FreqReadingOption,
    /// Cached result of `block_max_score` for the current block.
    block_max_score_cache: Option<Score>,
    /// Number of documents in the posting list, as given to `open` / `reset`.
    doc_freq: u32,
    /// Postings bytes, with the skip data (if any) already split off.
    data: OwnedBytes,
    /// Cursor over the blocks; provides the offset and encoding of the current block.
    skip_reader: SkipReader,
}

/// Decodes a bitpacked block of doc ids from the start of `data` into
/// `doc_decoder`, followed by the matching block of term frequencies when a
/// frequency decoder is supplied.
///
/// `strict_delta` is forwarded to both decoders: as the strict-delta flag of
/// the doc ids, and as the minus-one-encoding flag of the term frequencies.
fn decode_bitpacked_block(
    doc_decoder: &mut BlockDecoder,
    freq_decoder_opt: Option<&mut BlockDecoder>,
    data: &[u8],
    doc_offset: DocId,
    doc_num_bits: u8,
    tf_num_bits: u8,
    strict_delta: bool,
) {
    let docs_byte_len =
        doc_decoder.uncompress_block_sorted(data, doc_offset, doc_num_bits, strict_delta);
    if let Some(tf_decoder) = freq_decoder_opt {
        // The term frequencies are stored right after the doc ids.
        let tf_data = &data[docs_byte_len..];
        tf_decoder.uncompress_block_unsorted(tf_data, tf_num_bits, strict_delta);
    }
}

/// Decodes a vint-encoded block of `num_vint_docs` doc ids from the start of
/// `data` into `doc_decoder`, followed by the term frequencies when a
/// frequency decoder is supplied and bytes remain after the doc ids.
fn decode_vint_block(
    doc_decoder: &mut BlockDecoder,
    freq_decoder_opt: Option<&mut BlockDecoder>,
    data: &[u8],
    doc_offset: DocId,
    num_vint_docs: usize,
) {
    let docs_byte_len =
        doc_decoder.uncompress_vint_sorted(data, doc_offset, num_vint_docs, TERMINATED);
    let tf_decoder = match freq_decoder_opt {
        Some(tf_decoder) => tf_decoder,
        None => return,
    };
    // if it's a json term with freq, containing less than 256 docs, we can reach here thinking
    // we have a freq, despite not really having one.
    if data.len() <= docs_byte_len {
        return;
    }
    tf_decoder.uncompress_vint_unsorted(&data[docs_byte_len..], num_vint_docs, TERMINATED);
}

/// Splits the bytes of a posting list into its skip data and its postings.
///
/// Posting lists with fewer than `COMPRESSION_BLOCK_SIZE` documents carry no
/// skip data: `None` is returned along with the untouched bytes. Otherwise
/// the bytes start with the length of the skip data, encoded as a VInt.
fn split_into_skips_and_postings(
    doc_freq: u32,
    mut bytes: OwnedBytes,
) -> io::Result<(Option<OwnedBytes>, OwnedBytes)> {
    let has_skip_data = doc_freq >= COMPRESSION_BLOCK_SIZE as u32;
    if !has_skip_data {
        return Ok((None, bytes));
    }
    let skip_len = VInt::deserialize_u64(&mut bytes)? as usize;
    let (skip_data, postings_data) = bytes.split(skip_len);
    Ok((Some(skip_data), postings_data))
}

impl BlockSegmentPostings {
    /// Opens a `BlockSegmentPostings` and loads its first block.
    ///
    /// - `doc_freq` is the number of documents in the posting list.
    /// - `record_option` represents the amount of data available according to the schema.
    /// - `requested_option` is the amount of data requested by the user.
    ///
    /// If for instance, we do not request for term frequencies, this function will not decompress
    /// term frequency blocks.
    pub(crate) fn open(
        doc_freq: u32,
        data: FileSlice,
        mut record_option: IndexRecordOption,
        requested_option: IndexRecordOption,
    ) -> io::Result<BlockSegmentPostings> {
        let bytes = data.read_bytes()?;
        let (skip_data_opt, postings_data) = split_into_skips_and_postings(doc_freq, bytes)?;
        let skip_data = match skip_data_opt {
            Some(skip_data) => {
                let block_count = doc_freq as usize / COMPRESSION_BLOCK_SIZE;
                // 8 is the minimum size of a block with frequency (can be more if pos are stored
                // too)
                let min_skip_len_with_freqs = 8 * block_count;
                if skip_data.len() < min_skip_len_with_freqs {
                    // the field might be encoded with frequency, but this term in particular isn't.
                    // This can happen for JSON field with term frequencies:
                    // - text terms are encoded with term freqs.
                    // - numerical terms are encoded without term freqs.
                    record_option = IndexRecordOption::Basic;
                }
                skip_data
            }
            None => OwnedBytes::empty(),
        };
        let skip_reader = SkipReader::new(skip_data, doc_freq, record_option);

        let freq_reading_option = if matches!(record_option, IndexRecordOption::Basic) {
            FreqReadingOption::NoFreq
        } else if matches!(requested_option, IndexRecordOption::Basic) {
            FreqReadingOption::SkipFreq
        } else {
            FreqReadingOption::ReadFreq
        };

        let mut postings = BlockSegmentPostings {
            doc_decoder: BlockDecoder::with_val(TERMINATED),
            block_loaded: false,
            freq_decoder: BlockDecoder::with_val(1),
            freq_reading_option,
            block_max_score_cache: None,
            doc_freq,
            data: postings_data,
            skip_reader,
        };
        postings.load_block();
        Ok(postings)
    }

    /// Returns the block_max_score for the current block.
    /// It does not require the block to be loaded. For instance, it is ok to call this method
    /// after having called `.shallow_advance(..)`.
    ///
    /// The value comes, in order of preference, from the cache, from the skip
    /// reader, or from the scores of the loaded block. When none of these is
    /// available, `bm25_weight.max_score()` is returned and nothing is cached.
    ///
    /// See `TermScorer::block_max_score(..)` for more information.
    pub fn block_max_score(
        &mut self,
        fieldnorm_reader: &FieldNormReader,
        bm25_weight: &Bm25Weight,
    ) -> Score {
        if let Some(cached_score) = self.block_max_score_cache {
            return cached_score;
        }
        let block_max_score =
            if let Some(skip_reader_max_score) = self.skip_reader.block_max_score(bm25_weight) {
                // if we are on a full block, the skip reader should have the block max
                // information for us
                skip_reader_max_score
            } else if self.block_is_loaded() {
                // this is the last block of the segment posting list.
                // As it is actually loaded, we can compute block max manually.
                let docs = self.doc_decoder.output_array();
                let freqs = self.freq_decoder.output_array();
                let bm25_scores = docs.iter().zip(freqs).map(|(&doc, &term_freq)| {
                    bm25_weight.score(fieldnorm_reader.fieldnorm_id(doc), term_freq)
                });
                max_score(bm25_scores).unwrap_or(0.0)
            } else {
                // We do not have access to any good block max value. We return
                // bm25_weight.max_score() as it is a valid upperbound.
                //
                // We do not cache it however, so that it gets computed once the block is loaded.
                return bm25_weight.max_score();
            };
        self.block_max_score_cache = Some(block_max_score);
        block_max_score
    }

    /// Returns how term frequencies are handled for this posting list.
    /// The value is decided when the postings are opened.
    pub(crate) fn freq_reading_option(&self) -> FreqReadingOption {
        self.freq_reading_option
    }

    /// Resets the block segment postings on another position
    /// in the postings file, and loads the first block found there.
    ///
    /// This is useful for enumerating through a list of terms,
    /// and consuming the associated posting lists while avoiding
    /// reallocating a `BlockSegmentPostings`.
    ///
    /// # Warning
    ///
    /// This does not reset the positions list.
    pub(crate) fn reset(&mut self, doc_freq: u32, postings_data: OwnedBytes) -> io::Result<()> {
        let (skip_data_opt, postings_data) =
            split_into_skips_and_postings(doc_freq, postings_data)?;
        // Short posting lists have no skip data: the skip reader then gets empty bytes.
        let skip_data = skip_data_opt.unwrap_or_else(OwnedBytes::empty);
        self.skip_reader.reset(skip_data, doc_freq);
        self.data = postings_data;
        self.doc_freq = doc_freq;
        self.block_max_score_cache = None;
        self.block_loaded = false;
        self.load_block();
        Ok(())
    }

    /// Returns the overall number of documents in the block postings.
    ///
    /// This `doc_freq` is simply the sum of the lengths of all of the blocks.
    /// It does not take into account whether documents are deleted or not.
    pub fn doc_freq(&self) -> u32 {
        self.doc_freq
    }

    /// Returns the array of docs in the current block.
    ///
    /// `open` and `reset` load the first block, so it is available without
    /// calling `.advance()` first.
    ///
    /// In debug builds, this asserts that the current block is loaded.
    #[inline]
    pub fn docs(&self) -> &[DocId] {
        debug_assert!(self.block_is_loaded());
        self.doc_decoder.output_array()
    }

    /// Return the document at index `idx` of the block.
    ///
    /// Unlike `docs`, `freqs` and `freq`, this accessor does not assert that
    /// the block is loaded.
    #[inline]
    pub fn doc(&self, idx: usize) -> u32 {
        self.doc_decoder.output(idx)
    }

    /// Return the array of `term freq` in the block.
    ///
    /// In debug builds, this asserts that the current block is loaded.
    /// The frequency decoder is only fed by `load_block` when term
    /// frequencies are read (`FreqReadingOption::ReadFreq`).
    #[inline]
    pub fn freqs(&self) -> &[u32] {
        debug_assert!(self.block_is_loaded());
        self.freq_decoder.output_array()
    }

    /// Return the frequency at index `idx` of the block.
    ///
    /// In debug builds, this asserts that the current block is loaded.
    #[inline]
    pub fn freq(&self, idx: usize) -> u32 {
        debug_assert!(self.block_is_loaded());
        self.freq_decoder.output(idx)
    }

    /// Returns the length of the current block.
    ///
    /// Bitpacked blocks have a length of `COMPRESSION_BLOCK_SIZE`.
    /// The last block of a posting list may be shorter.
    ///
    /// In debug builds, this asserts that the current block is loaded.
    #[inline]
    pub fn block_len(&self) -> usize {
        debug_assert!(self.block_is_loaded());
        self.doc_decoder.output_len
    }

    /// Positions the cursor on the block that may contain `target_doc`, loads
    /// it, and returns the index within that block of the first element that
    /// is greater than or equal to `target_doc`.
    ///
    /// If all docs are smaller than target, the block loaded may be empty,
    /// or be the last, incomplete, VInt block. The returned index then points
    /// to the first `TERMINATED` padding value.
    pub fn seek(&mut self, target_doc: DocId) -> usize {
        // Move to the block that might contain our document, and decode it.
        self.seek_block(target_doc);
        self.load_block();

        let idx_in_block = self.doc_decoder.seek_within_block(target_doc);

        // The last block is not full and padded with TERMINATED,
        // so we are guaranteed to have at least one value (real or padding)
        // that is >= target_doc.
        debug_assert!(idx_in_block < COMPRESSION_BLOCK_SIZE);

        idx_in_block
    }

    /// Returns the position offset reported by the skip reader for its
    /// current block.
    pub(crate) fn position_offset(&self) -> u64 {
        self.skip_reader.position_offset()
    }

    /// Dangerous API! This seeks the skip list to the block that may contain
    /// `target_doc`, but does not `.load_block()` afterwards.
    ///
    /// `.load_block()` needs to be called manually afterwards.
    /// If all docs are smaller than target, the block reached may be empty,
    /// or be the last, incomplete, VInt block.
    pub(crate) fn seek_block(&mut self, target_doc: DocId) {
        let needs_invalidation = self.skip_reader.seek(target_doc);
        if !needs_invalidation {
            return;
        }
        // What was decoded and cached belongs to the previous block.
        self.block_loaded = false;
        self.block_max_score_cache = None;
    }

    /// Returns true if the block the skip reader currently points to has been
    /// decoded, i.e. `load_block` ran since the cursor last moved.
    pub(crate) fn block_is_loaded(&self) -> bool {
        self.block_loaded
    }

    /// Decodes the block the skip reader currently points to, unless it is
    /// already loaded.
    ///
    /// Doc ids are always decoded. Term frequencies are only decoded when
    /// `freq_reading_option` is `ReadFreq`.
    pub(crate) fn load_block(&mut self) {
        if self.block_loaded {
            return;
        }
        let offset = self.skip_reader.byte_offset();
        let doc_offset = self.skip_reader.last_doc_in_previous_block;
        let freq_decoder_opt = if let FreqReadingOption::ReadFreq = self.freq_reading_option {
            Some(&mut self.freq_decoder)
        } else {
            None
        };
        match self.skip_reader.block_info() {
            BlockInfo::BitPacked {
                doc_num_bits,
                strict_delta_encoded,
                tf_num_bits,
                ..
            } => decode_bitpacked_block(
                &mut self.doc_decoder,
                freq_decoder_opt,
                &self.data.as_slice()[offset..],
                doc_offset,
                doc_num_bits,
                tf_num_bits,
                strict_delta_encoded,
            ),
            BlockInfo::VInt { num_docs } => {
                // An empty block has no bytes to read: the postings data is not sliced at all.
                let block_data: &[u8] = if num_docs == 0 {
                    &[]
                } else {
                    &self.data.as_slice()[offset..]
                };
                decode_vint_block(
                    &mut self.doc_decoder,
                    freq_decoder_opt,
                    block_data,
                    doc_offset,
                    num_docs as usize,
                );
            }
        }
        self.block_loaded = true;
    }

    /// Advance to the next block, and load it.
    pub fn advance(&mut self) {
        self.skip_reader.advance();
        // The decoded data and the cached score belong to the previous block.
        self.block_loaded = false;
        self.block_max_score_cache = None;
        self.load_block();
    }

    /// Returns an empty segment postings object: no document, no data, and
    /// no term frequency.
    pub fn empty() -> BlockSegmentPostings {
        let skip_reader = SkipReader::new(OwnedBytes::empty(), 0, IndexRecordOption::Basic);
        BlockSegmentPostings {
            doc_freq: 0,
            data: OwnedBytes::empty(),
            skip_reader,
            doc_decoder: BlockDecoder::with_val(TERMINATED),
            freq_decoder: BlockDecoder::with_val(1),
            freq_reading_option: FreqReadingOption::NoFreq,
            // Flagged as loaded so that the accessors can be used right away.
            block_loaded: true,
            block_max_score_cache: None,
        }
    }

    /// Gives read access to the underlying skip reader.
    pub(crate) fn skip_reader(&self) -> &SkipReader {
        &self.skip_reader
    }
}

#[cfg(test)]
mod tests {
    use common::HasLen;

    use super::BlockSegmentPostings;
    use crate::docset::{DocSet, TERMINATED};
    use crate::index::Index;
    use crate::postings::compression::COMPRESSION_BLOCK_SIZE;
    use crate::postings::postings::Postings;
    use crate::postings::SegmentPostings;
    use crate::schema::{IndexRecordOption, Schema, Term, INDEXED};
    use crate::DocId;

    // An empty `SegmentPostings` is terminated from the start, stays
    // terminated when advanced, and reports no document.
    #[test]
    fn test_empty_segment_postings() {
        let mut postings = SegmentPostings::empty();
        assert_eq!(postings.doc(), TERMINATED);
        assert_eq!(postings.advance(), TERMINATED);
        assert_eq!(postings.advance(), TERMINATED);
        assert_eq!(postings.doc_freq(), 0);
        assert_eq!(postings.len(), 0);
    }

    // `doc()` and `advance()` both return TERMINATED on empty postings.
    #[test]
    fn test_empty_postings_doc_returns_terminated() {
        let mut postings = SegmentPostings::empty();
        assert_eq!(postings.doc(), TERMINATED);
        assert_eq!(postings.advance(), TERMINATED);
    }

    // NOTE(review): despite the name of this test, the expected term
    // frequency of empty postings is 1, not 0.
    #[test]
    fn test_empty_postings_doc_term_freq_returns_0() {
        let postings = SegmentPostings::empty();
        assert_eq!(postings.term_freq(), 1);
    }

    // Empty block postings expose no doc, before as well as after `advance()`.
    #[test]
    fn test_empty_block_segment_postings() {
        let mut postings = BlockSegmentPostings::empty();
        assert!(postings.docs().is_empty());
        assert_eq!(postings.doc_freq(), 0);
        postings.advance();
        assert!(postings.docs().is_empty());
        assert_eq!(postings.doc_freq(), 0);
    }

    // Walks all of the blocks of a posting list holding the docs 0..100_000
    // and checks that the docs come out in sequence.
    #[test]
    fn test_block_segment_postings() -> crate::Result<()> {
        let all_docs: Vec<u32> = (0..100_000).collect();
        let mut block_segments = build_block_postings(&all_docs)?;
        // checking that the `doc_freq` is correct
        assert_eq!(block_segments.doc_freq(), 100_000);
        let mut expected_doc: u32 = 0u32;
        while !block_segments.docs().is_empty() {
            for &doc in block_segments.docs() {
                assert_eq!(expected_doc, doc);
                expected_doc += 1;
            }
            block_segments.advance();
        }
        Ok(())
    }

    // Seeks around the boundary between the first (full) block and the
    // second block of a posting list in which doc 128 is missing.
    #[test]
    fn test_skip_right_at_new_block() -> crate::Result<()> {
        let mut doc_ids = (0..128).collect::<Vec<u32>>();
        // 128 is missing
        doc_ids.push(129);
        doc_ids.push(130);
        // Seeking the missing doc or the first doc of the second block must
        // both land on 129, after which the rest of the list is iterated.
        for &seek_target in &[128u32, 129u32] {
            let block_segments = build_block_postings(&doc_ids)?;
            let mut docset = SegmentPostings::from_block_postings(block_segments, None);
            assert_eq!(docset.seek(seek_target), 129);
            assert_eq!(docset.doc(), 129);
            assert_eq!(docset.advance(), 130);
            assert_eq!(docset.doc(), 130);
            assert_eq!(docset.advance(), TERMINATED);
        }
        // Seeking beyond the last doc terminates the docset.
        {
            let block_segments = build_block_postings(&doc_ids)?;
            let mut docset = SegmentPostings::from_block_postings(block_segments, None);
            assert_eq!(docset.doc(), 0);
            assert_eq!(docset.seek(131), TERMINATED);
            assert_eq!(docset.doc(), TERMINATED);
        }
        Ok(())
    }

    /// Builds an in-RAM index in which the term `0` of a u64 field matches
    /// exactly the doc ids listed in `docs`, and returns the block postings
    /// of that term.
    ///
    /// `docs` is expected to be sorted: the doc ids in between are filled
    /// with documents holding the value `1`.
    fn build_block_postings(docs: &[DocId]) -> crate::Result<BlockSegmentPostings> {
        let mut schema_builder = Schema::builder();
        let int_field = schema_builder.add_u64_field("id", INDEXED);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut index_writer = index.writer_for_tests()?;
        let mut last_doc = 0u32;
        for &doc in docs {
            // Filler documents for the doc ids that must not match.
            for _ in last_doc..doc {
                index_writer.add_document(doc!(int_field=>1u64))?;
            }
            index_writer.add_document(doc!(int_field=>0u64))?;
            last_doc = doc + 1;
        }
        index_writer.commit()?;
        let searcher = index.reader()?.searcher();
        let segment_reader = searcher.segment_reader(0);
        // Errors are propagated like everywhere else in this helper.
        let inverted_index = segment_reader.inverted_index(int_field)?;
        let term = Term::from_field_u64(int_field, 0u64);
        let term_info = inverted_index.get_term_info(&term)?.unwrap();
        let block_postings = inverted_index
            .read_block_postings_from_terminfo(&term_info, IndexRecordOption::Basic)?;
        Ok(block_postings)
    }

    // Checks that `seek` lands on a block whose doc range surrounds the
    // target, and that seeking past every doc leaves TERMINATED padding at
    // the end of the block.
    #[test]
    fn test_block_segment_postings_seek() -> crate::Result<()> {
        let mut docs = vec![0];
        for i in 0..1300 {
            docs.push((i * i / 100) + i);
        }
        let mut block_postings = build_block_postings(&docs[..])?;
        for i in &[0, 424, 10000] {
            block_postings.seek(*i);
            let docs = block_postings.docs();
            // The target lies between the first and the last doc of the block.
            assert!(docs[0] <= *i);
            assert!(docs.last().cloned().unwrap_or(0u32) >= *i);
        }
        // 100_000 is beyond all of the docs of the posting list.
        block_postings.seek(100_000);
        assert_eq!(block_postings.doc(COMPRESSION_BLOCK_SIZE - 1), TERMINATED);
        Ok(())
    }

    // Opens the postings of one term, then reuses the same object for the
    // postings of another term through a reset.
    #[test]
    fn test_reset_block_segment_postings() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let int_field = schema_builder.add_u64_field("id", INDEXED);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer = index.writer_for_tests()?;
        // create two postings list, one containing even number,
        // the other containing odd numbers.
        for i in 0..6 {
            index_writer.add_document(doc!(int_field=> (i % 2) as u64))?;
        }
        index_writer.commit()?;
        let searcher = index.reader()?.searcher();
        let segment_reader = searcher.segment_reader(0);
        let inverted_index = segment_reader.inverted_index(int_field)?;

        let even_term = Term::from_field_u64(int_field, 0u64);
        let even_term_info = inverted_index.get_term_info(&even_term)?.unwrap();
        let mut block_segments = inverted_index
            .read_block_postings_from_terminfo(&even_term_info, IndexRecordOption::Basic)?;
        assert_eq!(block_segments.docs(), &[0, 2, 4]);

        let odd_term = Term::from_field_u64(int_field, 1u64);
        let odd_term_info = inverted_index.get_term_info(&odd_term)?.unwrap();
        inverted_index.reset_block_postings_from_terminfo(&odd_term_info, &mut block_segments)?;
        assert_eq!(block_segments.docs(), &[1, 3, 5]);
        Ok(())
    }
}


================================================
FILE: src/postings/compression/mod.rs
================================================
use bitpacking::{BitPacker, BitPacker4x};

/// Number of integers in a compressed block, as dictated by `BitPacker4x`.
pub const COMPRESSION_BLOCK_SIZE: usize = BitPacker4x::BLOCK_LEN;
// in vint encoding, each byte stores 7 bits of data, so we need at most 32 / 7 = 4.57 bytes to
// store a u32 in the worst case, rounding up to 5 bytes total
const MAX_VINT_SIZE: usize = 5;
// Size of the `BlockEncoder` output buffer: a whole block with every value
// taking the largest vint size.
const COMPRESSED_BLOCK_MAX_SIZE: usize = COMPRESSION_BLOCK_SIZE * MAX_VINT_SIZE;

mod vint;

/// Returns the size in bytes of a bitpacked block of `COMPRESSION_BLOCK_SIZE`
/// values, each stored on `num_bits` bits.
#[inline]
pub fn compressed_block_size(num_bits: u8) -> usize {
    let total_bits = usize::from(num_bits) * COMPRESSION_BLOCK_SIZE;
    total_bits / 8
}

/// Encoder compressing blocks of `u32` into its own reusable output buffer.
pub struct BlockEncoder {
    /// Bitpacking implementation used for the blocks.
    bitpacker: BitPacker4x,
    /// Buffer receiving the compressed bytes. The slices returned by the
    /// `compress_block_*` methods borrow from it.
    pub output: [u8; COMPRESSED_BLOCK_MAX_SIZE],
}

impl Default for BlockEncoder {
    /// Equivalent to `BlockEncoder::new()`.
    fn default() -> Self {
        BlockEncoder::new()
    }
}

impl BlockEncoder {
    /// Creates an encoder with a zeroed output buffer.
    pub fn new() -> BlockEncoder {
        let bitpacker = BitPacker4x::new();
        let output = [0u8; COMPRESSED_BLOCK_MAX_SIZE];
        BlockEncoder { bitpacker, output }
    }

    /// Compresses a single block of strictly sorted numbers.
    ///
    /// `offset` is the value the first delta is computed from. Returns the
    /// number of bits used per value, along with the compressed bytes.
    pub fn compress_block_sorted(&mut self, block: &[u32], offset: u32) -> (u8, &[u8]) {
        // if offset is zero, convert it to None. This is correct as long as we do the same when
        // decompressing. It's required in case the block starts with an actual zero.
        let initial = match offset {
            0u32 => None,
            nonzero => Some(nonzero),
        };

        let bit_width = self.bitpacker.num_bits_strictly_sorted(initial, block);
        let num_bytes =
            self.bitpacker
                .compress_strictly_sorted(initial, block, &mut self.output[..], bit_width);
        (bit_width, &self.output[..num_bytes])
    }

    /// Compress a single block of unsorted numbers.
    ///
    /// If `minus_one_encoded` is set, each value must be >= 1, and will be encoded in a slightly
    /// more compact format. This is useful for some values where 0 isn't a correct value, such
    /// as term frequency, but isn't correct for some usages like position lists, where 0 can
    /// appear.
    ///
    /// Returns the number of bits used per value, along with the compressed bytes.
    pub fn compress_block_unsorted(
        &mut self,
        block: &[u32],
        minus_one_encoded: bool,
    ) -> (u8, &[u8]) {
        debug_assert!(!minus_one_encoded || !block.contains(&0));

        // Scratch space for the shifted values; only used with `minus_one_encoded`.
        let mut shifted = [0u32; COMPRESSION_BLOCK_SIZE];
        let values: &[u32] = if minus_one_encoded {
            for (dst, &src) in shifted.iter_mut().zip(block) {
                *dst = src - 1;
            }
            &shifted
        } else {
            block
        };

        let bit_width = self.bitpacker.num_bits(values);
        let num_bytes = self
            .bitpacker
            .compress(values, &mut self.output[..], bit_width);
        (bit_width, &self.output[..num_bytes])
    }
}

/// Decoder decompressing blocks of `u32` into its own reusable output buffer.
#[derive(Clone)]
pub struct BlockDecoder {
    /// Bitpacking implementation used for the blocks.
    bitpacker: BitPacker4x,
    /// Buffer receiving the decoded values.
    output: [u32; COMPRESSION_BLOCK_SIZE],
    /// Number of decoded values held by `output`. It is 0 on a fresh decoder
    /// and `COMPRESSION_BLOCK_SIZE` after decoding a bitpacked block.
    pub output_len: usize,
}

impl Default for BlockDecoder {
    /// Creates a decoder whose output buffer is filled with zeros.
    fn default() -> Self {
        BlockDecoder::with_val(0u32)
    }
}

impl BlockDecoder {
    /// Creates a decoder whose whole buffer is pre-filled with `val` and whose
    /// `output_len` is zero.
    pub fn with_val(val: u32) -> BlockDecoder {
        let output = [val; COMPRESSION_BLOCK_SIZE];
        BlockDecoder {
            bitpacker: BitPacker4x::new(),
            output,
            output_len: 0,
        }
    }

    /// Decompress block of sorted integers.
    ///
    /// `strict_delta` depends on what encoding was used. Older version of tantivy never use
    /// strict deltas, newer versions always use them.
    ///
    /// Sets `output_len` to `COMPRESSION_BLOCK_SIZE` and returns the value reported by the
    /// bitpacker (the tests of this module treat it as the number of consumed bytes).
    pub fn uncompress_block_sorted(
        &mut self,
        compressed_data: &[u8],
        offset: u32,
        num_bits: u8,
        strict_delta: bool,
    ) -> usize {
        self.output_len = COMPRESSION_BLOCK_SIZE;
        if !strict_delta {
            return self.bitpacker.decompress_sorted(
                offset,
                compressed_data,
                &mut self.output,
                num_bits,
            );
        }
        // With strict deltas, a zero offset stands for "no initial value".
        let initial = (offset != 0u32).then_some(offset);
        self.bitpacker.decompress_strictly_sorted(
            initial,
            compressed_data,
            &mut self.output,
            num_bits,
        )
    }

    /// Decompress block of unsorted integers.
    ///
    /// `minus_one_encoded` depends on what encoding was used. Older version of tantivy never
    /// use that encoding. Newer version use it for some structures, but not all. See the
    /// corresponding call to `BlockEncoder::compress_block_unsorted`.
    ///
    /// Sets `output_len` to `COMPRESSION_BLOCK_SIZE` and returns the value reported by the
    /// bitpacker (the tests of this module treat it as the number of consumed bytes).
    pub fn uncompress_block_unsorted(
        &mut self,
        compressed_data: &[u8],
        num_bits: u8,
        minus_one_encoded: bool,
    ) -> usize {
        self.output_len = COMPRESSION_BLOCK_SIZE;
        let consumed = self
            .bitpacker
            .decompress(compressed_data, &mut self.output, num_bits);
        if minus_one_encoded {
            // Undo the `value - 1` shift applied at encoding time.
            self.output.iter_mut().for_each(|val| *val += 1);
        }
        consumed
    }

    /// Returns the first `output_len` entries of the buffer.
    #[inline]
    pub fn output_array(&self) -> &[u32] {
        let len = self.output_len;
        &self.output[..len]
    }

    /// Return in-block index of first value >= `target`.
    /// Uses the padded buffer to enable branchless search.
    #[inline]
    pub(crate) fn seek_within_block(&self, target: u32) -> usize {
        crate::postings::branchless_binary_search(&self.output, target)
    }

    /// Returns the buffer entry at `idx`, regardless of `output_len`.
    ///
    /// Panics if `idx` is outside of the buffer.
    #[inline]
    pub fn output(&self, idx: usize) -> u32 {
        self.output[idx]
    }
}

/// Compression of `u32` arrays using variable byte encoding.
pub trait VIntEncoder {
    /// Compresses an array of `u32` integers,
    /// using [delta-encoding](https://en.wikipedia.org/wiki/Delta_encoding)
    /// and variable byte encoding.
    ///
    /// The method takes an array of ints to compress, and returns
    /// a `&[u8]` representing the compressed data.
    ///
    /// The method also takes an offset to give the value of the
    /// hypothetical previous element in the delta-encoding.
    fn compress_vint_sorted(&mut self, input: &[u32], offset: u32) -> &[u8];

    /// Compresses an array of `u32` integers,
    /// using variable byte encoding.
    ///
    /// The method takes an array of ints to compress, and returns
    /// a `&[u8]` representing the compressed data.
    fn compress_vint_unsorted(&mut self, input: &[u32]) -> &[u8];
}

/// Decompression of `u32` arrays that were compressed using variable byte encoding.
pub trait VIntDecoder {
    /// Uncompress an array of `u32` integers,
    /// that were compressed using [delta-encoding](https://en.wikipedia.org/wiki/Delta_encoding)
    /// and variable byte encoding.
    ///
    /// The method takes the number of ints to decompress, and returns
    /// the amount of bytes that were read to decompress them.
    ///
    /// The method also takes an offset to give the value of the
    /// hypothetical previous element in the delta-encoding.
    ///
    /// For instance, if the encoded deltas are `1, 3, 9`, and the
    /// `offset` is 5, then the output will be:
    /// `5 + 1 = 6, 6 + 3 = 9, 9 + 9 = 18`
    ///
    /// The value given in `padding` will be used to fill the remaining `128 - num_els` values.
    fn uncompress_vint_sorted(
        &mut self,
        compressed_data: &[u8],
        offset: u32,
        num_els: usize,
        padding: u32,
    ) -> usize;

    /// Uncompress an array of `u32s`, compressed using variable
    /// byte encoding.
    ///
    /// The method takes the number of ints to decompress, and returns
    /// the amount of bytes that were read to decompress them.
    ///
    /// The value given in `padding` will be used to fill the remaining `128 - num_els` values.
    fn uncompress_vint_unsorted(
        &mut self,
        compressed_data: &[u8],
        num_els: usize,
        padding: u32,
    ) -> usize;

    /// Uncompress `u32`s compressed using variable byte encoding, reading
    /// `compressed_data` up to its end instead of decoding a caller-supplied count.
    ///
    /// Nothing is returned; the `BlockDecoder` implementation stores the number of
    /// decoded integers in its `output_len` field.
    fn uncompress_vint_unsorted_until_end(&mut self, compressed_data: &[u8]);
}

impl VIntEncoder for BlockEncoder {
    /// Delta + variable byte encodes `input` into the encoder's internal buffer.
    fn compress_vint_sorted(&mut self, input: &[u32], offset: u32) -> &[u8] {
        let buffer = &mut self.output[..];
        vint::compress_sorted(input, buffer, offset)
    }

    /// Variable byte encodes `input` into the encoder's internal buffer.
    fn compress_vint_unsorted(&mut self, input: &[u32]) -> &[u8] {
        let buffer = &mut self.output[..];
        vint::compress_unsorted(input, buffer)
    }
}

impl VIntDecoder for BlockDecoder {
    /// Decodes `num_els` delta + variable byte encoded integers into the buffer.
    fn uncompress_vint_sorted(
        &mut self,
        compressed_data: &[u8],
        offset: u32,
        num_els: usize,
        padding: u32,
    ) -> usize {
        self.output_len = num_els;
        // Fill the whole buffer first so that every entry past `num_els` ends up
        // holding `padding`.
        self.output.fill(padding);
        let decoded = &mut self.output[..num_els];
        vint::uncompress_sorted(compressed_data, decoded, offset)
    }

    /// Decodes `num_els` variable byte encoded integers into the buffer.
    fn uncompress_vint_unsorted(
        &mut self,
        compressed_data: &[u8],
        num_els: usize,
        padding: u32,
    ) -> usize {
        self.output_len = num_els;
        // Fill the whole buffer first so that every entry past `num_els` ends up
        // holding `padding`.
        self.output.fill(padding);
        let decoded = &mut self.output[..num_els];
        vint::uncompress_unsorted(compressed_data, decoded)
    }

    /// Decodes variable byte encoded integers until the input is exhausted or the buffer
    /// is full, and records the number of decoded integers in `output_len`.
    fn uncompress_vint_unsorted_until_end(&mut self, compressed_data: &[u8]) {
        self.output_len = vint::uncompress_unsorted_until_end(compressed_data, &mut self.output);
    }
}

#[cfg(test)]
pub(crate) mod tests {
    use super::*;
    use crate::TERMINATED;

    /// Round-trips a full sorted block starting at zero, without offset.
    #[test]
    fn test_encode_sorted_block() {
        let vals: Vec<u32> = (0u32..128u32).map(|i| i * 7).collect();
        let mut encoder = BlockEncoder::new();
        let (num_bits, compressed_data) = encoder.compress_block_sorted(&vals, 0);
        let mut decoder = BlockDecoder::default();
        let consumed_num_bytes =
            decoder.uncompress_block_sorted(compressed_data, 0, num_bits, true);
        assert_eq!(consumed_num_bytes, compressed_data.len());
        for (i, &expected) in vals.iter().enumerate() {
            assert_eq!(expected, decoder.output(i));
        }
    }

    /// Round-trips a full sorted block using a non-zero offset.
    #[test]
    fn test_encode_sorted_block_with_offset() {
        let vals: Vec<u32> = (0u32..128u32).map(|i| 11 + i * 7).collect();
        let mut encoder = BlockEncoder::default();
        let (num_bits, compressed_data) = encoder.compress_block_sorted(&vals, 10);
        let mut decoder = BlockDecoder::default();
        let consumed_num_bytes =
            decoder.uncompress_block_sorted(compressed_data, 10, num_bits, true);
        assert_eq!(consumed_num_bytes, compressed_data.len());
        for (i, &expected) in vals.iter().enumerate() {
            assert_eq!(expected, decoder.output(i));
        }
    }

    /// A trailing junk byte after a sorted block must not be consumed.
    #[test]
    fn test_encode_sorted_block_with_junk() {
        let vals: Vec<u32> = (0u32..128u32).map(|i| 11u32 + i * 7u32).collect();
        let mut encoder = BlockEncoder::default();
        let (num_bits, compressed_data) = encoder.compress_block_sorted(&vals, 10);
        let mut compressed: Vec<u8> = compressed_data.to_vec();
        compressed.push(173u8);
        let mut decoder = BlockDecoder::default();
        let consumed_num_bytes = decoder.uncompress_block_sorted(&compressed, 10, num_bits, true);
        assert_eq!(consumed_num_bytes, compressed.len() - 1);
        assert_eq!(compressed[consumed_num_bytes], 173u8);
        for (i, &expected) in vals.iter().enumerate() {
            assert_eq!(expected, decoder.output(i));
        }
    }

    /// A trailing junk byte after an unsorted block must not be consumed, with and without
    /// the minus-one encoding.
    #[test]
    fn test_encode_unsorted_block_with_junk() {
        for minus_one_encode in [false, true] {
            let vals: Vec<u32> = (0u32..128u32).map(|i| 11u32 + i * 7u32 % 12).collect();
            let mut encoder = BlockEncoder::default();
            let (num_bits, compressed_data) =
                encoder.compress_block_unsorted(&vals, minus_one_encode);
            let mut compressed: Vec<u8> = compressed_data.to_vec();
            compressed.push(173u8);
            let mut decoder = BlockDecoder::default();
            let consumed_num_bytes =
                decoder.uncompress_block_unsorted(&compressed, num_bits, minus_one_encode);
            assert_eq!(consumed_num_bytes + 1, compressed.len());
            assert_eq!(compressed[consumed_num_bytes], 173u8);
            for (i, &expected) in vals.iter().enumerate() {
                assert_eq!(expected, decoder.output(i));
            }
        }
    }

    /// `with_val` pre-fills the buffer with the requested value.
    #[test]
    fn test_block_decoder_initialization() {
        let block = BlockDecoder::with_val(TERMINATED);
        assert_eq!(block.output(0), TERMINATED);
    }

    /// Round-trips a partial block through the sorted vint encoding and checks the padding.
    #[test]
    fn test_encode_vint() {
        const PADDING_VALUE: u32 = 234_234_345u32;
        let expected_length = 154;
        let mut encoder = BlockEncoder::new();
        let input: Vec<u32> = (0u32..123u32).map(|i| 4 + i * 7 / 2).collect();
        for &offset in &[0u32, 1u32, 2u32] {
            let encoded_data = encoder.compress_vint_sorted(&input, offset);
            assert!(encoded_data.len() <= expected_length);
            let mut decoder = BlockDecoder::default();
            let consumed_num_bytes =
                decoder.uncompress_vint_sorted(encoded_data, offset, input.len(), PADDING_VALUE);
            assert_eq!(consumed_num_bytes, encoded_data.len());
            assert_eq!(input, decoder.output_array());
            for i in input.len()..COMPRESSION_BLOCK_SIZE {
                assert_eq!(decoder.output(i), PADDING_VALUE);
            }
        }
    }

    /// The encoder buffer must be large enough for a block of maximal values.
    #[test]
    fn test_compress_vint_unsorted_does_not_overflow() {
        let mut encoder = BlockEncoder::new();
        let input = vec![u32::MAX; COMPRESSION_BLOCK_SIZE];
        encoder.compress_vint_unsorted(&input);
    }
}

#[cfg(all(test, feature = "unstable"))]
mod bench {

    use rand::rngs::StdRng;
    use rand::{Rng, SeedableRng};
    use test::Bencher;

    use super::*;
    use crate::TERMINATED;

    /// Generates `n` increasing integers: every integer starting from 0 is kept with
    /// probability `ratio`, using an RNG seeded from `seed_val`.
    fn generate_array_with_seed(n: usize, ratio: f64, seed_val: u8) -> Vec<u32> {
        let mut seed = [0u8; 32];
        seed[31] = seed_val;
        let mut rng = StdRng::from_seed(seed);
        let candidates = 0u32..;
        candidates
            .filter(|_| rng.random_bool(ratio))
            .take(n)
            .collect()
    }

    /// Same as `generate_array_with_seed`, with a fixed seed.
    pub fn generate_array(n: usize, ratio: f64) -> Vec<u32> {
        generate_array_with_seed(n, ratio, 4)
    }

    #[bench]
    fn bench_compress(b: &mut Bencher) {
        let data = generate_array(COMPRESSION_BLOCK_SIZE, 0.1);
        let mut encoder = BlockEncoder::new();
        b.iter(|| {
            encoder.compress_block_sorted(&data, 0u32);
        });
    }

    #[bench]
    fn bench_uncompress(b: &mut Bencher) {
        let data = generate_array(COMPRESSION_BLOCK_SIZE, 0.1);
        let mut encoder = BlockEncoder::new();
        let (num_bits, compressed) = encoder.compress_block_sorted(&data, 0u32);
        let mut decoder = BlockDecoder::default();
        b.iter(|| {
            decoder.uncompress_block_sorted(compressed, 0u32, num_bits, true);
        });
    }

    //#[test]
    // fn test_all_docs_compression_numbits() {
    // for expected_num_bits in 0u8.. {
    // let mut data = [0u32; 128];
    // if expected_num_bits > 0 {
    // data[0] = (1u64 << (expected_num_bits as usize) - 1) as u32;
    //}
    // let mut encoder = BlockEncoder::new();
    // let (num_bits, compressed) = encoder.compress_block_unsorted(&data);
    // assert_eq!(compressed.len(), compressed_block_size(num_bits));
    //}

    /// Number of integers encoded by the vint benchmarks.
    const NUM_INTS_BENCH_VINT: usize = 10;

    #[bench]
    fn bench_compress_vint(b: &mut Bencher) {
        let data = generate_array(NUM_INTS_BENCH_VINT, 0.001);
        let mut encoder = BlockEncoder::new();
        b.iter(|| {
            encoder.compress_vint_sorted(&data, 0u32);
        });
    }

    #[bench]
    fn bench_uncompress_vint(b: &mut Bencher) {
        let data = generate_array(NUM_INTS_BENCH_VINT, 0.001);
        let mut encoder = BlockEncoder::new();
        let compressed = encoder.compress_vint_sorted(&data, 0u32);
        let mut decoder = BlockDecoder::default();
        b.iter(|| {
            decoder.uncompress_vint_sorted(compressed, 0u32, NUM_INTS_BENCH_VINT, TERMINATED);
        });
    }
}


================================================
FILE: src/postings/compression/vint.rs
================================================
/// Delta-encodes `input` against `offset` and writes each delta into `output` as a
/// variable-length integer.
///
/// Each delta is emitted 7 bits at a time, least significant group first; the last byte of
/// a delta has its high bit set. Returns the written prefix of `output`.
///
/// Panics if `output` is too small to hold the encoded data.
#[inline]
pub fn compress_sorted<'a>(input: &[u32], output: &'a mut [u8], mut offset: u32) -> &'a [u8] {
    let mut cursor = 0usize;
    for &val in input {
        let mut delta: u32 = val - offset;
        offset = val;
        // Continuation bytes: low 7 bits, high bit clear.
        while delta >= 128u32 {
            output[cursor] = (delta & 127u32) as u8;
            cursor += 1;
            delta >>= 7;
        }
        // Terminal byte: remaining bits with the high bit set.
        output[cursor] = (delta as u8) | 128u8;
        cursor += 1;
    }
    &output[..cursor]
}

/// Writes every value of `input` into `output` as a variable-length integer.
///
/// Each value is emitted 7 bits at a time, least significant group first; the last byte of
/// a value has its high bit set. Returns the written prefix of `output`.
///
/// Panics if `output` is too small to hold the encoded data.
#[inline]
pub(crate) fn compress_unsorted<'a>(input: &[u32], output: &'a mut [u8]) -> &'a [u8] {
    let mut cursor = 0usize;
    for &val in input {
        let mut remaining: u32 = val;
        // Continuation bytes: low 7 bits, high bit clear.
        while remaining >= 128u32 {
            output[cursor] = (remaining & 127u32) as u8;
            cursor += 1;
            remaining >>= 7;
        }
        // Terminal byte: remaining bits with the high bit set.
        output[cursor] = (remaining as u8) | 128u8;
        cursor += 1;
    }
    &output[..cursor]
}

/// Decodes `output.len()` delta-encoded variable-length integers from `compressed_data`.
///
/// The running sum starts at `offset`; each decoded delta is added to it and the sum is
/// stored in the next slot of `output`. Returns the number of bytes read.
///
/// Panics if `compressed_data` ends before `output` is filled.
#[inline]
pub fn uncompress_sorted(compressed_data: &[u8], output: &mut [u32], offset: u32) -> usize {
    let mut cursor = 0usize;
    let mut running = offset;
    for slot in output.iter_mut() {
        let mut shift = 0u32;
        let mut byte = compressed_data[cursor];
        cursor += 1;
        // Bytes without the high bit carry 7 payload bits and announce a following byte.
        while byte & 128u8 == 0u8 {
            running += u32::from(byte) << shift;
            shift += 7;
            byte = compressed_data[cursor];
            cursor += 1;
        }
        // The byte with the high bit set carries the last 7 payload bits.
        running += u32::from(byte & 127u8) << shift;
        *slot = running;
    }
    cursor
}

/// Decodes `output_arr.len()` variable-length integers from `compressed_data` into
/// `output_arr`. Returns the number of bytes read.
///
/// Panics if `compressed_data` ends before `output_arr` is filled.
#[inline]
pub(crate) fn uncompress_unsorted(compressed_data: &[u8], output_arr: &mut [u32]) -> usize {
    let mut cursor = 0usize;
    for slot in output_arr.iter_mut() {
        let mut value = 0u32;
        let mut shift = 0u32;
        let mut byte = compressed_data[cursor];
        cursor += 1;
        // Bytes without the high bit carry 7 payload bits and announce a following byte.
        while byte & 128u8 == 0u8 {
            value += u32::from(byte) << shift;
            shift += 7;
            byte = compressed_data[cursor];
            cursor += 1;
        }
        // The byte with the high bit set carries the last 7 payload bits.
        value += u32::from(byte & 127u8) << shift;
        *slot = value;
    }
    cursor
}

/// Decodes variable-length integers from `compressed_data` into `output_arr` until either
/// the input is exhausted or `output_arr` is full.
///
/// Returns the number of integers written.
///
/// Panics if `compressed_data` ends in the middle of an integer.
#[inline]
pub(crate) fn uncompress_unsorted_until_end(
    compressed_data: &[u8],
    output_arr: &mut [u32],
) -> usize {
    let mut cursor = 0usize;
    let mut num_decoded = 0usize;
    while num_decoded < output_arr.len() && cursor < compressed_data.len() {
        let mut value = 0u32;
        let mut shift = 0u32;
        let mut byte = compressed_data[cursor];
        cursor += 1;
        // Bytes without the high bit carry 7 payload bits and announce a following byte.
        while byte & 128u8 == 0u8 {
            value += u32::from(byte) << shift;
            shift += 7;
            byte = compressed_data[cursor];
            cursor += 1;
        }
        // The byte with the high bit set carries the last 7 payload bits.
        value += u32::from(byte & 127u8) << shift;
        output_arr[num_decoded] = value;
        num_decoded += 1;
    }
    num_decoded
}


================================================
FILE: src/postings/indexing_context.rs
================================================
use stacker::{ArenaHashMap, MemoryArena};

use crate::indexer::path_to_unordered_id::PathToUnorderedId;

/// IndexingContext contains all of the transient memory arenas
/// required for building the inverted index.
pub(crate) struct IndexingContext {
    /// The term index is an adhoc hashmap,
    /// itself backed by a dedicated memory arena.
    pub term_index: ArenaHashMap,
    /// Arena is a memory arena that stores posting lists / term frequencies / positions.
    pub arena: MemoryArena,
    /// Path-to-id mapping (`PathToUnorderedId`), created empty by `new`.
    pub path_to_unordered_id: PathToUnorderedId,
}

impl IndexingContext {
    /// Create a new IndexingContext given the size of the term hash map.
    ///
    /// The arena and the path mapping start from their default state.
    pub(crate) fn new(table_size: usize) -> IndexingContext {
        IndexingContext {
            term_index: ArenaHashMap::with_capacity(table_size),
            arena: MemoryArena::default(),
            path_to_unordered_id: PathToUnorderedId::default(),
        }
    }

    /// Returns the memory usage for the inverted index memory arenas, in bytes.
    ///
    /// This is the sum of the term index and the arena; `path_to_unordered_id` is not
    /// counted.
    pub(crate) fn mem_usage(&self) -> usize {
        let term_index_bytes = self.term_index.mem_usage();
        let arena_bytes = self.arena.mem_usage();
        term_index_bytes + arena_bytes
    }
}


================================================
FILE: src/postings/json_postings_writer.rs
================================================
use std::io;

use common::json_path_writer::JSON_END_OF_PATH;
use stacker::Addr;

use crate::indexer::indexing_term::IndexingTerm;
use crate::indexer::path_to_unordered_id::OrderedPathId;
use crate::postings::postings_writer::SpecializedPostingsWriter;
use crate::postings::recorder::{BufferLender, DocIdRecorder, Recorder};
use crate::postings::{FieldSerializer, IndexingContext, IndexingPosition, PostingsWriter};
use crate::schema::{Field, Type};
use crate::tokenizer::TokenStream;
use crate::DocId;

/// The `JsonPostingsWriter` is odd in that it relies on a hidden contract:
///
/// `subscribe` is called directly to index non-text tokens, while
/// `index_text` is used to index text.
#[derive(Default)]
pub(crate) struct JsonPostingsWriter<Rec: Recorder> {
    /// Receives text tokens, recorded with the caller-chosen recorder `Rec`.
    str_posting_writer: SpecializedPostingsWriter<Rec>,
    /// Receives non-text terms, recorded with `DocIdRecorder`.
    non_str_posting_writer: SpecializedPostingsWriter<DocIdRecorder>,
}

impl<Rec: Recorder> From<JsonPostingsWriter<Rec>> for Box<dyn PostingsWriter> {
    /// Boxes the writer as a `PostingsWriter` trait object.
    fn from(writer: JsonPostingsWriter<Rec>) -> Self {
        Box::new(writer)
    }
}

impl<Rec: Recorder> PostingsWriter for JsonPostingsWriter<Rec> {
    /// Records a non-text term; always forwarded to the non-string postings writer.
    #[inline]
    fn subscribe(
        &mut self,
        doc: crate::DocId,
        pos: u32,
        term: &IndexingTerm,
        ctx: &mut IndexingContext,
    ) {
        let writer = &mut self.non_str_posting_writer;
        writer.subscribe(doc, pos, term, ctx);
    }

    /// Indexes a text token stream; always forwarded to the string postings writer.
    fn index_text(
        &mut self,
        doc_id: DocId,
        token_stream: &mut dyn TokenStream,
        term_buffer: &mut IndexingTerm,
        ctx: &mut IndexingContext,
        indexing_position: &mut IndexingPosition,
    ) {
        let writer = &mut self.str_posting_writer;
        writer.index_text(doc_id, token_stream, term_buffer, ctx, indexing_position);
    }

    /// The actual serialization format is handled by the `PostingsSerializer`.
    ///
    /// For every entry of `ordered_term_addrs`, the full term bytes are rebuilt as the JSON
    /// path followed by the entry's bytes. The first byte of the entry's bytes is a type
    /// code: `Type::Str` terms are serialized with the `Rec` recorder, all other terms with
    /// `DocIdRecorder`.
    ///
    /// Panics if the type code of a term is invalid.
    fn serialize(
        &self,
        ordered_term_addrs: &[(Field, OrderedPathId, &[u8], Addr)],
        ordered_id_to_path: &[&str],
        ctx: &IndexingContext,
        serializer: &mut FieldSerializer,
    ) -> io::Result<()> {
        let mut term_buffer = JsonTermSerializer(Vec::with_capacity(48));
        let mut buffer_lender = BufferLender::default();
        // `u32::MAX` acts as the "no path written yet" marker.
        let mut last_path_id = u32::MAX;
        // Length of the path prefix in `term_buffer`; set in the first iteration.
        let mut path_prefix_len = 0;
        for (_field, ordered_path_id, term_bytes, term_addr) in ordered_term_addrs {
            let current_path_id = ordered_path_id.path_id();
            if current_path_id != last_path_id {
                // The path changed: rebuild the prefix shared by the following terms.
                term_buffer.clear();
                term_buffer.append_json_path(ordered_id_to_path[current_path_id as usize]);
                path_prefix_len = term_buffer.len();
                last_path_id = current_path_id;
            }
            // Drop the previous term's value and append the current one after the path.
            term_buffer.truncate(path_prefix_len);
            term_buffer.append_bytes(term_bytes);

            let value_type =
                Type::from_code(term_bytes[0]).expect("Invalid type code in JSON term");
            let is_str = value_type == Type::Str;
            if !is_str {
                SpecializedPostingsWriter::<DocIdRecorder>::serialize_one_term(
                    term_buffer.as_bytes(),
                    *term_addr,
                    &mut buffer_lender,
                    ctx,
                    serializer,
                )?;
            } else {
                SpecializedPostingsWriter::<Rec>::serialize_one_term(
                    term_buffer.as_bytes(),
                    *term_addr,
                    &mut buffer_lender,
                    ctx,
                    serializer,
                )?;
            }
        }
        Ok(())
    }

    /// Sum of the token counts of the string and non-string writers.
    fn total_num_tokens(&self) -> u64 {
        let str_tokens = self.str_posting_writer.total_num_tokens();
        let non_str_tokens = self.non_str_posting_writer.total_num_tokens();
        str_tokens + non_str_tokens
    }
}

/// Helper to build the JSON term bytes that land in the term dictionary.
/// Format: `[json path utf8][JSON_END_OF_PATH][type tag][payload]`
struct JsonTermSerializer(Vec<u8>);
impl JsonTermSerializer {
    /// Appends a JSON path to the Term.
    /// The path is terminated by a special end-of-path 0 byte.
    #[inline]
    pub fn append_json_path(&mut self, path: &str) {
        let raw = path.as_bytes();
        if !raw.contains(&JSON_END_OF_PATH) {
            // Common case: nothing to escape, copy the path as is.
            self.0.extend_from_slice(raw);
        } else {
            // Replace any occurrence of the end-of-path byte with Ascii '0' byte.
            let escaped = raw.iter().map(|&byte| match byte {
                JSON_END_OF_PATH => b'0',
                other => other,
            });
            self.0.extend(escaped);
        }
        self.0.push(JSON_END_OF_PATH);
    }

    /// Appends value bytes to the Term.
    ///
    /// This function returns the segment that has just been added.
    #[inline]
    pub fn append_bytes(&mut self, bytes: &[u8]) -> &mut [u8] {
        let start = self.0.len();
        self.0.extend_from_slice(bytes);
        &mut self.0[start..]
    }

    /// Empties the buffer.
    fn clear(&mut self) {
        self.0.clear();
    }

    /// Shortens the buffer to `len` bytes; no effect if it is already shorter.
    fn truncate(&mut self, len: usize) {
        self.0.truncate(len);
    }

    /// Number of bytes currently in the buffer.
    fn len(&self) -> usize {
        self.0.len()
    }

    /// The bytes accumulated so far.
    fn as_bytes(&self) -> &[u8] {
        self.0.as_slice()
    }
}


================================================
FILE: src/postings/loaded_postings.rs
================================================
use crate::docset::{DocSet, TERMINATED};
use crate::postings::{Postings, SegmentPostings};
use crate::DocId;

/// `LoadedPostings` is a `DocSet` and `Postings` implementation.
/// It is used to represent the postings of a term in memory.
/// It is suitable if there are few documents for a term.
///
/// It exists mainly to reduce memory usage.
/// `SegmentPostings` uses 1840 bytes per instance due to its caches.
/// If you need to keep many terms around with few docs, it's cheaper to load all the
/// postings in memory.
///
/// This is relevant for `RegexPhraseQuery`, which may have a lot of
/// terms.
/// E.g. 100_000 terms would need 184MB due to SegmentPostings.
pub struct LoadedPostings {
    /// Doc ids, in the order they were yielded by the source postings.
    doc_ids: Box<[DocId]>,
    /// `position_offsets[i]..position_offsets[i + 1]` is the range of `positions` that
    /// belongs to `doc_ids[i]`. When built by `load`, it holds one more entry than `doc_ids`.
    position_offsets: Box<[u32]>,
    /// Positions of all documents, concatenated.
    positions: Box<[u32]>,
    /// Index of the current document in `doc_ids`.
    cursor: usize,
}

impl LoadedPostings {
    /// Creates a new `LoadedPostings` from a `SegmentPostings`.
    ///
    /// It will also preload positions, if positions are available in the SegmentPostings.
    pub fn load(segment_postings: &mut SegmentPostings) -> LoadedPostings {
        let num_docs = segment_postings.doc_freq() as usize;
        let mut doc_ids = Vec::with_capacity(num_docs);
        let mut positions = Vec::with_capacity(num_docs);
        // One offset per document plus the trailing end offset pushed after the loop:
        // reserving `num_docs + 1` avoids a reallocation on that last push.
        let mut position_offsets = Vec::with_capacity(num_docs + 1);
        while segment_postings.doc() != TERMINATED {
            position_offsets.push(positions.len() as u32);
            doc_ids.push(segment_postings.doc());
            segment_postings.append_positions_with_offset(0, &mut positions);
            segment_postings.advance();
        }
        // Closes the position range of the last document.
        position_offsets.push(positions.len() as u32);
        LoadedPostings {
            doc_ids: doc_ids.into_boxed_slice(),
            positions: positions.into_boxed_slice(),
            position_offsets: position_offsets.into_boxed_slice(),
            cursor: 0,
        }
    }
}

#[cfg(test)]
impl From<(Vec<DocId>, Vec<Vec<u32>>)> for LoadedPostings {
    /// Test helper: builds postings from doc ids and one position list per document.
    fn from(doc_ids_and_positions: (Vec<DocId>, Vec<Vec<u32>>)) -> LoadedPostings {
        let (doc_ids, per_doc_positions) = doc_ids_and_positions;
        let mut position_offsets = Vec::new();
        let mut flat_positions = Vec::new();
        for doc_positions in &per_doc_positions {
            // Start of this document's range in the flattened position list.
            position_offsets.push(flat_positions.len() as u32);
            flat_positions.extend_from_slice(doc_positions);
        }
        // Closes the position range of the last document.
        position_offsets.push(flat_positions.len() as u32);
        LoadedPostings {
            doc_ids: doc_ids.into_boxed_slice(),
            positions: flat_positions.into_boxed_slice(),
            position_offsets: position_offsets.into_boxed_slice(),
            cursor: 0,
        }
    }
}

impl DocSet for LoadedPostings {
    /// Moves to the next document and returns it, or `TERMINATED` once past the last one.
    fn advance(&mut self) -> DocId {
        // The cursor never goes past `doc_ids.len()`, which is the terminated state.
        let num_docs = self.doc_ids.len();
        self.cursor = (self.cursor + 1).min(num_docs);
        self.doc()
    }

    /// Returns the current document, or `TERMINATED` if the cursor is past the last one.
    fn doc(&self) -> DocId {
        self.doc_ids
            .get(self.cursor)
            .copied()
            .unwrap_or(TERMINATED)
    }

    /// Total number of loaded documents, regardless of the cursor position.
    fn size_hint(&self) -> u32 {
        let num_docs = self.doc_ids.len();
        num_docs as u32
    }
}
impl Postings for LoadedPostings {
    /// Number of positions stored for the current document.
    ///
    /// Panics if there is no offset entry after the current cursor.
    fn term_freq(&self) -> u32 {
        let range_start = self.position_offsets[self.cursor] as usize;
        let range_end = self.position_offsets[self.cursor + 1] as usize;
        let num_positions = range_end - range_start;
        num_positions as u32
    }

    /// Appends the positions of the current document to `output`, each shifted by `offset`.
    fn append_positions_with_offset(&mut self, offset: u32, output: &mut Vec<u32>) {
        let range_start = self.position_offsets[self.cursor] as usize;
        let range_end = self.position_offsets[self.cursor + 1] as usize;
        let doc_positions = &self.positions[range_start..range_end];
        output.extend(doc_positions.iter().map(|&pos| pos + offset));
    }
}

#[cfg(test)]
pub(crate) mod tests {

    use super::*;

    /// Exercises `doc`, `advance` and `seek` on postings without positions.
    #[test]
    pub fn test_vec_postings() {
        let doc_ids: Vec<DocId> = (0u32..1024u32).map(|e| e * 3).collect();
        let mut postings = LoadedPostings::from((doc_ids, vec![]));
        assert_eq!(postings.doc(), 0u32);
        assert_eq!(postings.advance(), 3u32);
        assert_eq!(postings.doc(), 3u32);
        assert_eq!(postings.seek(14u32), 15u32);
        assert_eq!(postings.doc(), 15u32);
        assert_eq!(postings.seek(300u32), 300u32);
        assert_eq!(postings.doc(), 300u32);
        assert_eq!(postings.seek(6000u32), TERMINATED);
    }

    /// Same as `test_vec_postings`, additionally checking the positions of the first docs.
    #[test]
    pub fn test_vec_postings2() {
        let doc_ids: Vec<DocId> = (0u32..1024u32).map(|e| e * 3).collect();
        let mut positions: Vec<Vec<u32>> = vec![Vec::new(); 1024];
        positions[0] = vec![1u32, 2u32, 3u32];
        positions[1] = vec![30u32];
        positions[2] = vec![10u32];
        positions[4] = vec![50u32];
        let mut postings = LoadedPostings::from((doc_ids, positions));

        // Collects the positions of the current document into a fresh vector.
        let load = |postings: &mut LoadedPostings| {
            let mut loaded_positions = Vec::new();
            postings.positions(loaded_positions.as_mut());
            loaded_positions
        };

        assert_eq!(postings.doc(), 0u32);
        assert_eq!(load(&mut postings), vec![1u32, 2u32, 3u32]);

        assert_eq!(postings.advance(), 3u32);
        assert_eq!(postings.doc(), 3u32);
        assert_eq!(load(&mut postings), vec![30u32]);

        assert_eq!(postings.seek(14u32), 15u32);
        assert_eq!(postings.doc(), 15u32);
        assert_eq!(postings.seek(300u32), 300u32);
        assert_eq!(postings.doc(), 300u32);
        assert_eq!(postings.seek(6000u32), TERMINATED);
    }
}


================================================
FILE: src/postings/mod.rs
================================================
//! Postings module (also called inverted index)

mod block_search;

pub(crate) use self::block_search::branchless_binary_search;

mod block_segment_postings;
pub(crate) mod compression;
mod indexing_context;
mod json_postings_writer;
mod loaded_postings;
mod per_field_postings_writer;
mod postings;
mod postings_writer;
mod recorder;
mod segment_postings;
/// Serializer module for the inverted index
pub mod serializer;
mod skip;
mod term_info;

pub(crate) use loaded_postings::LoadedPostings;
pub(crate) use stacker::compute_table_memory_size;

pub use self::block_segment_postings::BlockSegmentPostings;
pub(crate) use self::indexing_context::IndexingContext;
pub(crate) use self::per_field_postings_writer::PerFieldPostingsWriter;
pub use self::postings::Postings;
pub(crate) use self::postings_writer::{serialize_postings, IndexingPosition, PostingsWriter};
pub use self::segment_postings::SegmentPostings;
pub use self::serializer::{FieldSerializer, InvertedIndexSerializer};
pub(crate) use self::skip::{BlockInfo, SkipReader};
pub use self::term_info::TermInfo;

/// Selects how term frequencies are treated by a postings reader.
///
/// NOTE(review): the per-variant descriptions below are inferred from the variant
/// names only; confirm against the code that consumes this enum.
#[expect(clippy::enum_variant_names)]
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
pub(crate) enum FreqReadingOption {
    /// Presumably: there are no term frequencies to read.
    NoFreq,
    /// Presumably: term frequencies exist but are skipped over.
    SkipFreq,
    /// Presumably: term frequencies exist and are decoded.
    ReadFreq,
}

#[cfg(test)]
pub(crate) mod tests {
    use std::mem;

    use super::{InvertedIndexSerializer, Postings};
    use crate::docset::{DocSet, TERMINATED};
    use crate::fieldnorm::FieldNormReader;
    use crate::index::{Index, SegmentComponent, SegmentReader};
    use crate::indexer::operation::AddOperation;
    use crate::indexer::SegmentWriter;
    use crate::query::Scorer;
    use crate::schema::{
        Field, IndexRecordOption, Schema, Term, TextFieldIndexing, TextOptions, INDEXED, TEXT,
    };
    use crate::tokenizer::{SimpleTokenizer, MAX_TOKEN_LEN};
    use crate::{DocId, HasLen, IndexWriter, Score};

    /// Serializes a single term with 120 docs of 4 positions each and checks the
    /// size of the resulting positions component.
    #[test]
    pub fn test_position_write() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        let mut segment = index.new_segment();

        let mut posting_serializer = InvertedIndexSerializer::open(&mut segment)?;
        let mut field_serializer = posting_serializer.new_field(text_field, 120 * 4, None)?;
        field_serializer.new_term("abc".as_bytes(), 12u32, true)?;
        // Every doc carries the same four position deltas.
        let delta_positions = vec![1, 2, 3, 2];
        for doc_id in 0u32..120u32 {
            field_serializer.write_doc(doc_id, 4, &delta_positions);
        }
        field_serializer.close_term()?;
        // The field serializer must be gone before the serializer itself is closed.
        mem::drop(field_serializer);
        posting_serializer.close()?;

        let positions_file = segment.open_read(SegmentComponent::Positions)?;
        assert_eq!(positions_file.len(), 207);
        Ok(())
    }

    /// Positions must be readable for the current doc whether it was reached
    /// through `advance` or through one or several `seek` calls.
    #[test]
    pub fn test_skip_positions() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let title = schema_builder.add_text_field("title", TEXT);
        let index = Index::create_in_ram(schema_builder.build());

        let mut index_writer = index.writer_for_tests()?;
        index_writer.add_document(doc!(title => "abc abc abc"))?;
        index_writer.add_document(doc!(title => "abc be be be be abc"))?;
        for _ in 0..1_000 {
            index_writer.add_document(doc!(title => "abc abc abc"))?;
        }
        index_writer.add_document(doc!(title => "abc be be be be abc"))?;
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();
        let inverted_index = searcher.segment_reader(0u32).inverted_index(title)?;
        let term = Term::from_field_text(title, "abc");
        // Each scenario below starts from a freshly opened posting list.
        let open_postings =
            || inverted_index.read_postings(&term, IndexRecordOption::WithFreqsAndPositions);
        let mut positions = Vec::new();

        // Reading the positions twice on the same doc, then advancing.
        let mut postings = open_postings()?.unwrap();
        assert_eq!(postings.doc(), 0);
        postings.positions(&mut positions);
        assert_eq!(positions, [0, 1, 2]);
        postings.positions(&mut positions);
        assert_eq!(positions, [0, 1, 2]);
        assert_eq!(postings.advance(), 1);
        assert_eq!(postings.doc(), 1);
        postings.positions(&mut positions);
        assert_eq!(positions, [0, 5]);

        // Advancing without having read the positions of the first doc.
        let mut postings = open_postings()?.unwrap();
        assert_eq!(postings.doc(), 0);
        assert_eq!(postings.advance(), 1);
        postings.positions(&mut positions);
        assert_eq!(positions, [0, 5]);

        // Seeking to the neighbouring doc.
        let mut postings = open_postings()?.unwrap();
        assert_eq!(postings.seek(1), 1);
        assert_eq!(postings.doc(), 1);
        postings.positions(&mut positions);
        assert_eq!(positions, [0, 5]);

        // Seeking directly to the last doc.
        let mut postings = open_postings()?.unwrap();
        assert_eq!(postings.seek(1002), 1002);
        assert_eq!(postings.doc(), 1002);
        postings.positions(&mut positions);
        assert_eq!(positions, [0, 5]);

        // Seeking to the last doc in two hops.
        let mut postings = open_postings()?.unwrap();
        assert_eq!(postings.seek(100), 100);
        assert_eq!(postings.seek(1002), 1002);
        assert_eq!(postings.doc(), 1002);
        postings.positions(&mut positions);
        assert_eq!(positions, [0, 5]);

        Ok(())
    }

    /// A token made of exactly `MAX_TOKEN_LEN` one-byte characters must end up
    /// in the term dictionary unchanged.
    #[test]
    pub fn test_index_max_length_token() -> crate::Result<()> {
        let indexing = TextFieldIndexing::default()
            .set_index_option(IndexRecordOption::WithFreqsAndPositions)
            .set_tokenizer("simple_no_truncation");
        let text_options = TextOptions::default().set_indexing_options(indexing);
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", text_options);
        let index = Index::create_in_ram(schema_builder.build());
        index
            .tokenizers()
            .register("simple_no_truncation", SimpleTokenizer::default());
        let reader = index.reader()?;
        let mut index_writer = index.writer_for_tests()?;

        let ok_token_text: String = "A".repeat(MAX_TOKEN_LEN);
        index_writer.add_document(doc!(text_field=>ok_token_text.clone()))?;
        index_writer.commit()?;
        reader.reload()?;

        let searcher = reader.searcher();
        let inverted_index = searcher.segment_reader(0u32).inverted_index(text_field)?;
        let term_dict = inverted_index.terms();
        assert_eq!(term_dict.num_terms(), 1);
        let mut term_bytes = Vec::new();
        assert!(term_dict.ord_to_term(0, &mut term_bytes)?);
        assert_eq!(term_bytes.as_slice(), ok_token_text.as_bytes());

        Ok(())
    }

    /// A token one byte longer than `MAX_TOKEN_LEN` must be dropped, while the
    /// other tokens of the same text are still indexed.
    #[test]
    pub fn test_drop_token_that_are_too_long() -> crate::Result<()> {
        let indexing = TextFieldIndexing::default()
            .set_index_option(IndexRecordOption::WithFreqsAndPositions)
            .set_tokenizer("simple_no_truncation");
        let text_options = TextOptions::default().set_indexing_options(indexing);
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", text_options);
        let index = Index::create_in_ram(schema_builder.build());
        index
            .tokenizers()
            .register("simple_no_truncation", SimpleTokenizer::default());
        let reader = index.reader()?;
        let mut index_writer = index.writer_for_tests()?;

        // One oversized token followed by a regular one.
        let oversized_token = "A".repeat(MAX_TOKEN_LEN + 1);
        let exceeding_token_text: String = format!("{oversized_token} hello");
        index_writer.add_document(doc!(text_field=>exceeding_token_text))?;
        index_writer.commit()?;
        reader.reload()?;

        let searcher = reader.searcher();
        let inverted_index = searcher.segment_reader(0u32).inverted_index(text_field)?;
        let term_dict = inverted_index.terms();
        // Only "hello" survived.
        assert_eq!(term_dict.num_terms(), 1);
        let mut term_bytes = Vec::new();
        assert!(term_dict.ord_to_term(0, &mut term_bytes)?);
        assert_eq!(term_bytes.as_slice(), b"hello");

        Ok(())
    }

    /// Writes one multi-valued document followed by 999 single-valued ones
    /// directly through a `SegmentWriter`, then checks fieldnorms, term
    /// frequencies and positions on the resulting segment.
    #[test]
    pub fn test_position_and_fieldnorm1() -> crate::Result<()> {
        let mut positions = Vec::new();
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let segment = index.new_segment();

        {
            let mut segment_writer =
                SegmentWriter::for_segment(15_000_000, segment.clone()).unwrap();
            {
                // checking that position works if the field has two values
                let op = AddOperation {
                    opstamp: 0u64,
                    document: doc!(
                       text_field => "a b a c a d a a.",
                       text_field => "d d d d a"
                    ),
                };
                segment_writer.add_document(op)?;
            }
            {
                let op = AddOperation {
                    opstamp: 1u64,
                    document: doc!(text_field => "b a"),
                };
                segment_writer.add_document(op)?;
            }
            // Doc `i` is made of `i` occurrences of "e" followed by a single "a".
            for i in 2..1000 {
                let mut text: String = "e ".repeat(i);
                text.push_str(" a");
                let op = AddOperation {
                    opstamp: 2u64,
                    document: doc!(text_field => text),
                };
                segment_writer.add_document(op)?;
            }
            segment_writer.finalize()?;
        }
        {
            let segment_reader = SegmentReader::open(&segment)?;
            {
                let fieldnorm_reader = segment_reader.get_fieldnorms_reader(text_field)?;
                // Doc 0 has two values of 8 and 5 tokens.
                assert_eq!(fieldnorm_reader.fieldnorm(0), 8 + 5);
                assert_eq!(fieldnorm_reader.fieldnorm(1), 2);
                for i in 2..1000 {
                    assert_eq!(
                        fieldnorm_reader.fieldnorm_id(i),
                        FieldNormReader::fieldnorm_to_id(i + 1)
                    );
                }
            }
            {
                // A term that was never indexed has no postings.
                let term_a = Term::from_field_text(text_field, "abcdef");
                assert!(segment_reader
                    .inverted_index(term_a.field())?
                    .read_postings(&term_a, IndexRecordOption::WithFreqsAndPositions)?
                    .is_none());
            }
            {
                let term_a = Term::from_field_text(text_field, "a");
                let mut postings_a = segment_reader
                    .inverted_index(term_a.field())?
                    .read_postings(&term_a, IndexRecordOption::WithFreqsAndPositions)?
                    .unwrap();
                assert_eq!(postings_a.len(), 1000);
                assert_eq!(postings_a.doc(), 0);
                assert_eq!(postings_a.term_freq(), 6);
                postings_a.positions(&mut positions);
                // The occurrence in the second value lands at position 13.
                assert_eq!(&positions[..], [0, 2, 4, 6, 7, 13]);
                assert_eq!(postings_a.advance(), 1u32);
                assert_eq!(postings_a.doc(), 1u32);
                assert_eq!(postings_a.term_freq(), 1);
                for i in 2u32..1000u32 {
                    assert_eq!(postings_a.advance(), i);
                    assert_eq!(postings_a.term_freq(), 1);
                    postings_a.positions(&mut positions);
                    assert_eq!(&positions[..], [i]);
                    assert_eq!(postings_a.doc(), i);
                }
                assert_eq!(postings_a.advance(), TERMINATED);
            }
            {
                let term_e = Term::from_field_text(text_field, "e");
                let mut postings_e = segment_reader
                    .inverted_index(term_e.field())?
                    .read_postings(&term_e, IndexRecordOption::WithFreqsAndPositions)?
                    .unwrap();
                assert_eq!(postings_e.len(), 1000 - 2);
                for i in 2u32..1000u32 {
                    assert_eq!(postings_e.term_freq(), i);
                    postings_e.positions(&mut positions);
                    assert_eq!(positions.len(), i as usize);
                    // "e" occupies positions 0, 1, ..., i - 1.
                    for (ord, &position) in positions.iter().enumerate() {
                        assert_eq!(position, ord as u32);
                    }
                    assert_eq!(postings_e.doc(), i);
                    postings_e.advance();
                }
                assert_eq!(postings_e.doc(), TERMINATED);
            }
        }
        Ok(())
    }

    /// The term "a" only occurs in the second document; its postings must start
    /// on doc 1 and report both positions.
    #[test]
    pub fn test_position_and_fieldnorm2() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut index_writer = index.writer_for_tests()?;
            index_writer.add_document(doc!(text_field => "g b b d c g c"))?;
            index_writer.add_document(doc!(text_field => "g a b b a d c g c"))?;
            index_writer.commit()?;
        }

        let searcher = index.reader()?.searcher();
        let inverted_index = searcher.segment_reader(0).inverted_index(text_field)?;
        let term_a = Term::from_field_text(text_field, "a");
        let mut postings = inverted_index
            .read_postings(&term_a, IndexRecordOption::WithFreqsAndPositions)?
            .unwrap();
        assert_eq!(postings.doc(), 1u32);

        let mut positions: Vec<u32> = Vec::new();
        postings.positions(&mut positions);
        assert_eq!(positions, [1u32, 4]);
        Ok(())
    }

    /// Exercises `seek` on the posting lists of a u64 field: seeking forward,
    /// seeking to the current doc, seeking past the end, seeking to docs that
    /// are absent from the list, and seeking after documents were deleted.
    #[test]
    fn test_skip_next() -> crate::Result<()> {
        let term_0 = Term::from_field_u64(Field::from_field_id(0), 0);
        let term_1 = Term::from_field_u64(Field::from_field_id(0), 1);
        let term_2 = Term::from_field_u64(Field::from_field_id(0), 2);

        let num_docs = 300u32;

        // Every doc holds the value 2, plus 0 (even doc ids) or 1 (odd doc ids).
        let index = {
            let mut schema_builder = Schema::builder();
            let value_field = schema_builder.add_u64_field("value", INDEXED);
            let schema = schema_builder.build();
            let index = Index::create_in_ram(schema);
            {
                let mut index_writer = index.writer_for_tests()?;
                for i in 0u64..u64::from(num_docs) {
                    let doc = doc!(value_field => 2u64, value_field => i % 2u64);
                    index_writer.add_document(doc)?;
                }
                // Propagate the error instead of reducing it to a boolean.
                index_writer.commit()?;
            }
            index
        };
        let searcher = index.reader()?.searcher();
        let segment_reader = searcher.segment_reader(0);

        // check that the basic usage works
        for i in 0..num_docs - 1 {
            for j in i + 1..num_docs {
                let mut segment_postings = segment_reader
                    .inverted_index(term_2.field())?
                    .read_postings(&term_2, IndexRecordOption::Basic)?
                    .unwrap();
                assert_eq!(segment_postings.seek(i), i);
                assert_eq!(segment_postings.doc(), i);

                assert_eq!(segment_postings.seek(j), j);
                assert_eq!(segment_postings.doc(), j);
            }
        }

        {
            let mut segment_postings = segment_reader
                .inverted_index(term_2.field())?
                .read_postings(&term_2, IndexRecordOption::Basic)?
                .unwrap();

            // check that `seek` advances the iterator
            assert_eq!(segment_postings.doc(), 0);

            assert_eq!(segment_postings.seek(1), 1);
            assert_eq!(segment_postings.doc(), 1);

            // seeking to the current doc is a no-op
            assert_eq!(segment_postings.seek(1), 1);
            assert_eq!(segment_postings.doc(), 1);

            // check that going beyond the end is handled
            assert_eq!(segment_postings.seek(num_docs), TERMINATED);
        }

        // check that filtering works
        {
            let mut segment_postings = segment_reader
                .inverted_index(term_0.field())?
                .read_postings(&term_0, IndexRecordOption::Basic)?
                .unwrap();

            // Seeking to docs that are in the list.
            for i in 0..num_docs / 2 {
                assert_eq!(segment_postings.seek(i * 2), i * 2);
                assert_eq!(segment_postings.doc(), i * 2);
            }

            let mut segment_postings = segment_reader
                .inverted_index(term_0.field())?
                .read_postings(&term_0, IndexRecordOption::Basic)?
                .unwrap();

            // Seeking to docs that are not in the list lands on the next even doc.
            for i in 0..num_docs / 2 - 1 {
                assert!(segment_postings.seek(i * 2 + 1) > i * 2);
                assert_eq!(segment_postings.doc(), (i + 1) * 2);
            }
        }

        // delete some of the documents
        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            index_writer.delete_term(term_0);
            index_writer.commit()?;
        }
        let searcher = index.reader()?.searcher();
        assert_eq!(searcher.segment_readers().len(), 1);
        let segment_reader = searcher.segment_reader(0);

        // make sure seeking still works: the posting list still yields every doc,
        // deleted ones are only reported through `is_deleted`
        for i in 0..num_docs {
            let mut segment_postings = segment_reader
                .inverted_index(term_2.field())?
                .read_postings(&term_2, IndexRecordOption::Basic)?
                .unwrap();

            assert_eq!(segment_postings.seek(i), i);
            assert_eq!(segment_postings.doc(), i);
            if i % 2 == 0 {
                assert!(segment_reader.is_deleted(i));
            }
        }

        // now try with a longer sequence
        {
            let mut segment_postings = segment_reader
                .inverted_index(term_2.field())?
                .read_postings(&term_2, IndexRecordOption::Basic)?
                .unwrap();

            // Seek targets follow a Fibonacci-like progression: 3, 5, 8, 13, ...
            let mut last = 2;
            let mut cur = 3;
            loop {
                let seek = segment_postings.seek(cur);
                if seek == TERMINATED {
                    break;
                }
                assert_eq!(seek, segment_postings.doc());
                if seek == cur {
                    assert_eq!(segment_postings.doc(), cur);
                } else {
                    assert_eq!(segment_postings.doc(), cur + 1);
                }
                let next = cur + last;
                last = cur;
                cur = next;
            }
            // 377 is the first target of the progression beyond the last doc (299).
            assert_eq!(cur, 377);
        }

        // delete everything else
        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            index_writer.delete_term(term_1);
            index_writer.commit()?;
        }
        let searcher = index.reader()?.searcher();

        // finally, check that it's empty
        {
            let searchable_segment_ids = index.searchable_segment_ids()?;
            assert!(searchable_segment_ids.is_empty());
            assert_eq!(searcher.num_docs(), 0);
        }
        Ok(())
    }

    /// Wrapper around a docset that only forwards `advance`, `doc` and
    /// `size_hint`.
    ///
    /// Since `seek` is not forwarded, calling it on the wrapper runs the
    /// `DocSet` default implementation. This makes it possible to check that a
    /// specialized `seek` is consistent with the default one.
    pub(crate) struct UnoptimizedDocSet<TDocSet: DocSet>(TDocSet);

    impl<TDocSet: DocSet> UnoptimizedDocSet<TDocSet> {
        /// Wraps `docset`, hiding any specialized method it may provide.
        pub fn wrap(docset: TDocSet) -> Self {
            Self(docset)
        }
    }

    impl<TDocSet: DocSet> DocSet for UnoptimizedDocSet<TDocSet> {
        fn advance(&mut self) -> DocId {
            let Self(inner) = self;
            inner.advance()
        }

        fn doc(&self) -> DocId {
            let Self(inner) = self;
            inner.doc()
        }

        fn size_hint(&self) -> u32 {
            let Self(inner) = self;
            inner.size_hint()
        }
    }

    impl<TScorer: Scorer> Scorer for UnoptimizedDocSet<TScorer> {
        /// Delegates scoring to the wrapped scorer.
        #[inline]
        fn score(&mut self) -> Score {
            let Self(inner) = self;
            inner.score()
        }
    }

    /// Checks that the `seek` implementation of the docsets produced by
    /// `postings_factory` agrees with the default `DocSet::seek`.
    ///
    /// For each target, two fresh docsets are created: one is used as is, the
    /// other is wrapped in `UnoptimizedDocSet`. Both are sought to the target,
    /// must land on the same doc, and must then yield the same docs until
    /// termination.
    ///
    /// Targets smaller than the first doc of the docset are ignored. Every
    /// remaining target is checked, whatever the order of `targets`.
    pub fn test_skip_against_unoptimized<F: Fn() -> Box<dyn DocSet>>(
        postings_factory: F,
        targets: Vec<u32>,
    ) {
        for target in targets {
            let mut postings_opt = postings_factory();
            if target < postings_opt.doc() {
                continue;
            }
            let mut postings_unopt = UnoptimizedDocSet::wrap(postings_factory());
            let skip_result_opt = postings_opt.seek(target);
            let skip_result_unopt = postings_unopt.seek(target);
            assert_eq!(
                skip_result_unopt, skip_result_opt,
                "Failed while skipping to {target}"
            );
            assert!(skip_result_opt >= target);
            assert_eq!(skip_result_opt, postings_opt.doc());
            if skip_result_opt == TERMINATED {
                // Nothing left to compare for this target. Move on to the next
                // one rather than returning: `targets` is not required to be
                // sorted, so later targets may still fall inside the docset.
                continue;
            }
            while postings_opt.doc() != TERMINATED {
                assert_eq!(postings_opt.doc(), postings_unopt.doc());
                assert_eq!(postings_opt.advance(), postings_unopt.advance());
            }
        }
    }
}

#[cfg(all(test, feature = "unstable"))]
mod bench {
    use once_cell::sync::Lazy;
    use rand::rngs::StdRng;
    use rand::{Rng, SeedableRng};
    use test::{self, Bencher};

    use crate::docset::TERMINATED;
    use crate::query::Intersection;
    use crate::schema::{Field, IndexRecordOption, Schema, TantivyDocument, Term, STRING};
    use crate::{tests, DocSet, Index, IndexWriter};

    /// Term "a" on the field with id 0.
    pub static TERM_A: Lazy<Term> =
        Lazy::new(|| Term::from_field_text(Field::from_field_id(0), "a"));
    /// Term "b" on the field with id 0.
    pub static TERM_B: Lazy<Term> =
        Lazy::new(|| Term::from_field_text(Field::from_field_id(0), "b"));
    /// Term "c" on the field with id 0.
    pub static TERM_C: Lazy<Term> =
        Lazy::new(|| Term::from_field_text(Field::from_field_id(0), "c"));
    /// Term "d" on the field with id 0.
    pub static TERM_D: Lazy<Term> =
        Lazy::new(|| Term::from_field_text(Field::from_field_id(0), "d"));

    /// In-RAM index of one million documents shared by the benchmarks.
    ///
    /// Each document contains "d", and contains "a", "b" and "c" with
    /// probability 1/15, 1/10 and 1/5 respectively. The RNG seed is fixed.
    pub static INDEX: Lazy<Index> = Lazy::new(|| {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", STRING);
        let index = Index::create_in_ram(schema_builder.build());

        let mut rng: StdRng = StdRng::from_seed([1u8; 32]);
        let posting_list_size = 1_000_000;
        // (probability, term) pairs, drawn in this order for every document.
        let optional_terms = [
            (1f64 / 15f64, "a"),
            (1f64 / 10f64, "b"),
            (1f64 / 5f64, "c"),
        ];
        {
            let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
            for _ in 0..posting_list_size {
                let mut doc = TantivyDocument::default();
                for (probability, text) in optional_terms {
                    if rng.random_bool(probability) {
                        doc.add_text(text_field, text);
                    }
                }
                doc.add_text(text_field, "d");
                index_writer.add_document(doc).unwrap();
            }
            let commit_result = index_writer.commit();
            assert!(commit_result.is_ok());
        }
        index
    });

    /// Measures opening the posting list of `TERM_A` and advancing through it
    /// until termination.
    #[bench]
    fn bench_segment_postings(b: &mut Bencher) {
        let reader = INDEX.reader().unwrap();
        let searcher = reader.searcher();
        let segment_reader = searcher.segment_reader(0);

        b.iter(|| {
            let inverted_index = segment_reader.inverted_index(TERM_A.field()).unwrap();
            let mut segment_postings = inverted_index
                .read_postings(&TERM_A, IndexRecordOption::Basic)
                .unwrap()
                .unwrap();
            loop {
                if segment_postings.advance() == TERMINATED {
                    break;
                }
            }
        });
    }

    /// Measures intersecting the posting lists of `TERM_A`, `TERM_B`, `TERM_C`
    /// and `TERM_D`, including the cost of opening them.
    #[bench]
    fn bench_segment_intersection(b: &mut Bencher) {
        let reader = INDEX.reader().unwrap();
        let searcher = reader.searcher();
        let segment_reader = searcher.segment_reader(0);
        b.iter(|| {
            // Opens the doc-id-only posting list of `term`.
            let read_basic = |term: &Term| {
                segment_reader
                    .inverted_index(term.field())
                    .unwrap()
                    .read_postings(term, IndexRecordOption::Basic)
                    .unwrap()
                    .unwrap()
            };
            let segment_postings_a = read_basic(&TERM_A);
            let segment_postings_b = read_basic(&TERM_B);
            let segment_postings_c = read_basic(&TERM_C);
            let segment_postings_d = read_basic(&TERM_D);
            let all_postings = vec![
                segment_postings_a,
                segment_postings_b,
                segment_postings_c,
                segment_postings_d,
            ];
            let mut intersection =
                Intersection::new(all_postings, reader.searcher().num_docs() as u32);
            loop {
                if intersection.advance() == TERMINATED {
                    break;
                }
            }
        });
    }

    /// Measures a sequence of `seek` calls on the posting list of `TERM_A`.
    ///
    /// The seek targets are taken from `tests::sample(num_docs, p)` and
    /// filtered up front, so that the measured loop only seeks forward and
    /// stops at the first target that terminates the list.
    fn bench_skip_next(p: f64, b: &mut Bencher) {
        let reader = INDEX.reader().unwrap();
        let searcher = reader.searcher();
        let segment_reader = searcher.segment_reader(0);
        let sampled_docs = tests::sample(segment_reader.num_docs(), p);

        // Opens a fresh posting list for `TERM_A`.
        let open_postings = || {
            segment_reader
                .inverted_index(TERM_A.field())
                .unwrap()
                .read_postings(&TERM_A, IndexRecordOption::Basic)
                .unwrap()
                .unwrap()
        };

        // Dry run: keep only the targets that are not behind the cursor.
        let mut cursor = open_postings();
        let mut existing_docs = Vec::new();
        for &doc in &sampled_docs {
            if doc < cursor.doc() {
                continue;
            }
            existing_docs.push(doc);
            if cursor.seek(doc) == TERMINATED {
                break;
            }
        }

        b.iter(|| {
            let mut segment_postings = open_postings();
            for &doc in &existing_docs {
                if segment_postings.seek(doc) == TERMINATED {
                    break;
                }
            }
        });
    }

    /// Runs `bench_skip_next` with `p = 0.001`.
    // NOTE(review): `p` is presumably the sampling probability of each doc — confirm in
    // `tests::sample`.
    #[bench]
    fn bench_skip_next_p01(b: &mut Bencher) {
        bench_skip_next(0.001, b);
    }

    /// Runs `bench_skip_next` with `p = 0.01`.
    #[bench]
    fn bench_skip_next_p1(b: &mut Bencher) {
        bench_skip_next(0.01, b);
    }

    /// Runs `bench_skip_next` with `p = 0.1`.
    #[bench]
    fn bench_skip_next_p10(b: &mut Bencher) {
        bench_skip_next(0.1, b);
    }

    /// Runs `bench_skip_next` with `p = 0.9`.
    #[bench]
    fn bench_skip_next_p90(b: &mut Bencher) {
        bench_skip_next(0.9, b);
    }

    /// Measures iterating over the posting list of `TERM_A` while folding every
    /// doc id into a sum, so that the doc ids are actually read.
    #[bench]
    fn bench_iterate_segment_postings(b: &mut Bencher) {
        let reader = INDEX.reader().unwrap();
        let searcher = reader.searcher();
        let segment_reader = searcher.segment_reader(0);
        b.iter(|| {
            // Opaque mask, so the loop body cannot be constant-folded.
            let n: u32 = test::black_box(17);
            let inverted_index = segment_reader.inverted_index(TERM_A.field()).unwrap();
            let mut segment_postings = inverted_index
                .read_postings(&TERM_A, IndexRecordOption::Basic)
                .unwrap()
                .unwrap();
            let mut s = 0u32;
            loop {
                let doc = segment_postings.doc();
                if doc == TERMINATED {
                    break;
                }
                s += (doc & n) % 1024;
                segment_postings.advance();
            }
            s
        });
    }
}


================================================
FILE: src/postings/per_field_postings_writer.rs
================================================
use crate::postings::json_postings_writer::JsonPostingsWriter;
use crate::postings::postings_writer::SpecializedPostingsWriter;
use crate::postings::recorder::{DocIdRecorder, TermFrequencyRecorder, TfAndPositionRecorder};
use crate::postings::PostingsWriter;
use crate::schema::{Field, FieldEntry, FieldType, IndexRecordOption, Schema};

/// Holds one boxed [`PostingsWriter`] per field of a schema, indexed by field id.
pub(crate) struct PerFieldPostingsWriter {
    per_field_postings_writers: Vec<Box<dyn PostingsWriter>>,
}

impl PerFieldPostingsWriter {
    /// Creates a postings writer for every field of `schema`, in the order in
    /// which `schema.fields()` yields them.
    pub fn for_schema(schema: &Schema) -> Self {
        let mut per_field_postings_writers = Vec::new();
        for (_, field_entry) in schema.fields() {
            per_field_postings_writers.push(posting_writer_from_field_entry(field_entry));
        }
        Self {
            per_field_postings_writers,
        }
    }

    /// Returns the postings writer of `field`.
    ///
    /// Panics if the field id is out of range.
    pub(crate) fn get_for_field(&self, field: Field) -> &dyn PostingsWriter {
        let field_ord = field.field_id() as usize;
        &*self.per_field_postings_writers[field_ord]
    }

    /// Returns the postings writer of `field`, mutably.
    ///
    /// Panics if the field id is out of range.
    pub(crate) fn get_for_field_mut(&mut self, field: Field) -> &mut dyn PostingsWriter {
        let field_ord = field.field_id() as usize;
        &mut *self.per_field_postings_writers[field_ord]
    }
}

/// Builds the postings writer matching the type and indexing options of a field.
///
/// - Text fields get a `SpecializedPostingsWriter` whose recorder follows the
///   configured `IndexRecordOption`; without indexing options, doc ids only.
/// - JSON fields follow the same rule with a `JsonPostingsWriter`, based on
///   their text indexing options.
/// - All other field types only record doc ids.
fn posting_writer_from_field_entry(field_entry: &FieldEntry) -> Box<dyn PostingsWriter> {
    match field_entry.field_type() {
        FieldType::Str(text_options) => match text_options.get_indexing_options() {
            Some(indexing_options) => match indexing_options.index_option() {
                IndexRecordOption::WithFreqsAndPositions => {
                    SpecializedPostingsWriter::<TfAndPositionRecorder>::default().into()
                }
                IndexRecordOption::WithFreqs => {
                    SpecializedPostingsWriter::<TermFrequencyRecorder>::default().into()
                }
                IndexRecordOption::Basic => {
                    SpecializedPostingsWriter::<DocIdRecorder>::default().into()
                }
            },
            None => SpecializedPostingsWriter::<DocIdRecorder>::default().into(),
        },
        FieldType::JsonObject(json_object_options) => {
            match json_object_options.get_text_indexing_options() {
                Some(text_indexing_option) => match text_indexing_option.index_option() {
                    IndexRecordOption::WithFreqsAndPositions => {
                        JsonPostingsWriter::<TfAndPositionRecorder>::default().into()
                    }
                    IndexRecordOption::WithFreqs => {
                        JsonPostingsWriter::<TermFrequencyRecorder>::default().into()
                    }
                    IndexRecordOption::Basic => {
                        JsonPostingsWriter::<DocIdRecorder>::default().into()
                    }
                },
                None => JsonPostingsWriter::<DocIdRecorder>::default().into(),
            }
        }
        FieldType::U64(_)
        | FieldType::I64(_)
        | FieldType::F64(_)
        | FieldType::Bool(_)
        | FieldType::Date(_)
        | FieldType::Bytes(_)
        | FieldType::IpAddr(_)
        | FieldType::Facet(_) => Box::<SpecializedPostingsWriter<DocIdRecorder>>::default(),
    }
}


================================================
FILE: src/postings/postings.rs
================================================
use crate::docset::DocSet;

/// Postings, also known as an inverted list.
///
/// For a given term, postings enumerate the ids of the documents containing
/// that term. For each of these documents, they may additionally expose the
/// term frequency and the positions of the term.
///
/// `SegmentPostings` is the main implementation. Other implementations
/// mocking `SegmentPostings` exist, for merging segments or for testing.
pub trait Postings: DocSet + 'static {
    /// Returns how many times the term occurs in the current document.
    fn term_freq(&self) -> u32;

    /// Writes the positions of the term in the current document into `output`,
    /// each of them shifted by `offset`.
    ///
    /// The caller does not need to clear `output` beforehand: its previous
    /// content is discarded, and it ends up holding `term_freq` positions.
    fn positions_with_offset(&mut self, offset: u32, output: &mut Vec<u32>) {
        output.clear();
        self.append_positions_with_offset(offset, output);
    }

    /// Appends the positions of the term in the current document to `output`,
    /// each of them shifted by `offset`.
    ///
    /// The existing content of `output` is preserved.
    fn append_positions_with_offset(&mut self, offset: u32, output: &mut Vec<u32>);

    /// Writes the positions of the term in the current document into `output`.
    ///
    /// The previous content of `output` is discarded, and it ends up holding
    /// `term_freq` positions.
    fn positions(&mut self, output: &mut Vec<u32>) {
        self.positions_with_offset(0, output);
    }
}

/// Forwards every call to the boxed trait object, so that a
/// `Box<dyn Postings>` can be used wherever a `Postings` is expected.
impl Postings for Box<dyn Postings> {
    fn term_freq(&self) -> u32 {
        <dyn Postings as Postings>::term_freq(&**self)
    }

    fn append_positions_with_offset(&mut self, offset: u32, output: &mut Vec<u32>) {
        <dyn Postings as Postings>::append_positions_with_offset(&mut **self, offset, output);
    }
}


================================================
FILE: src/postings/postings_writer.rs
================================================
use std::io;
use std::marker::PhantomData;
use std::ops::Range;

use stacker::Addr;

use crate::fieldnorm::FieldNormReaders;
use crate::indexer::indexing_term::IndexingTerm;
use crate::indexer::path_to_unordered_id::OrderedPathId;
use crate::postings::recorder::{BufferLender, Recorder};
use crate::postings::{
    FieldSerializer, IndexingContext, InvertedIndexSerializer, PerFieldPostingsWriter,
};
use crate::schema::{Field, Schema, Type};
use crate::tokenizer::{Token, TokenStream, MAX_TOKEN_LEN};
use crate::DocId;

/// Gap added to `IndexingPosition::end_position` at the end of every
/// `index_text` call, so that the next text indexed with the same
/// `IndexingPosition` starts at least one position further.
const POSITION_GAP: u32 = 1;

/// Splits `term_offsets` into runs of consecutive entries sharing the same field.
///
/// Returns one `(field, range)` pair per run, in input order, where `range`
/// is the half-open range of indices of `term_offsets` covered by the run.
/// The input is expected to be sorted by field already; a field that shows up
/// in two non-adjacent runs yields two separate entries.
/// An empty input yields an empty partition.
fn make_field_partition(
    term_offsets: &[(Field, OrderedPathId, &[u8], Addr)],
) -> Vec<(Field, Range<usize>)> {
    let mut partition: Vec<(Field, Range<usize>)> = Vec::new();
    for (offset, &(field, _, _, _)) in term_offsets.iter().enumerate() {
        match partition.last_mut() {
            // Same field as the current run: extend the run by one entry.
            Some((last_field, range)) if *last_field == field => range.end = offset + 1,
            // First entry, or the field changed: open a new run.
            _ => partition.push((field, offset..offset + 1)),
        }
    }
    partition
}

/// Serialize the inverted index.
///
/// All the terms recorded in `ctx` are sorted by (field, path, term bytes)
/// and then pushed, one field at a time, towards the postings serializer.
pub(crate) fn serialize_postings(
    ctx: IndexingContext,
    schema: Schema,
    per_field_postings_writers: &PerFieldPostingsWriter,
    fieldnorm_readers: FieldNormReaders,
    serializer: &mut InvertedIndexSerializer,
) -> crate::Result<()> {
    // Unordered path ids cannot be sorted on: map them to ordered ids first.
    let unordered_id_to_ordered_id: Vec<OrderedPathId> =
        ctx.path_to_unordered_id.unordered_id_to_ordered_id();

    let mut term_offsets: Vec<(Field, OrderedPathId, &[u8], Addr)> =
        Vec::with_capacity(ctx.term_index.len());
    for (key, addr) in ctx.term_index.iter() {
        let field = IndexingTerm::wrap(key).field();
        let is_json = schema.get_field_entry(field).field_type().value_type() == Type::Json;
        let entry: (Field, OrderedPathId, &[u8], Addr) = if is_json {
            // For JSON fields, bytes 4..8 of the key hold the big-endian unordered path id.
            let path_id_bytes = 4..4 + 4;
            let unordered_id =
                u32::from_be_bytes(key[path_id_bytes.clone()].try_into().unwrap());
            let path_id = unordered_id_to_ordered_id[unordered_id as usize];
            (field, path_id, &key[path_id_bytes.end..], addr)
        } else {
            (field, 0.into(), &key[4..], addr)
        };
        term_offsets.push(entry);
    }

    // Sort by field, path, and term
    term_offsets.sort_unstable_by_key(|&(field, path_id, bytes, _)| (field, path_id, bytes));

    let ordered_id_to_path = ctx.path_to_unordered_id.ordered_id_to_path();
    for (field, term_range) in make_field_partition(&term_offsets) {
        let postings_writer = per_field_postings_writers.get_for_field(field);
        let fieldnorm_reader = fieldnorm_readers.get_field(field)?;
        let total_num_tokens = postings_writer.total_num_tokens();
        let mut field_serializer =
            serializer.new_field(field, total_num_tokens, fieldnorm_reader)?;
        postings_writer.serialize(
            &term_offsets[term_range],
            &ordered_id_to_path,
            &ctx,
            &mut field_serializer,
        )?;
        field_serializer.close()?;
    }

    Ok(())
}

/// Running token accounting shared across successive `index_text` calls.
#[derive(Default, Debug)]
pub(crate) struct IndexingPosition {
    /// Number of tokens indexed so far (tokens dropped for exceeding
    /// `MAX_TOKEN_LEN` are not counted).
    pub num_tokens: u32,
    /// Base position added to the token positions of the next `index_text`
    /// call. After each call it is set to the furthest token end seen,
    /// plus `POSITION_GAP`.
    pub end_position: u32,
}

/// The `PostingsWriter` is in charge of receiving documents
/// and building a `Segment` in anonymous memory.
///
/// `PostingsWriter` writes in a `MemoryArena`.
pub(crate) trait PostingsWriter: Send + Sync {
    /// Record that a document contains a term at a given position.
    ///
    /// * doc  - the document id
    /// * pos  - the term position (expressed in tokens)
    /// * term - the term
    /// * ctx - Contains a term hashmap and a memory arena to store all necessary posting list
    ///   information.
    fn subscribe(&mut self, doc: DocId, pos: u32, term: &IndexingTerm, ctx: &mut IndexingContext);

    /// Serializes the postings on disk.
    /// The actual serialization format is handled by the `PostingsSerializer`.
    fn serialize(
        &self,
        term_addrs: &[(Field, OrderedPathId, &[u8], Addr)],
        ordered_id_to_path: &[&str],
        ctx: &IndexingContext,
        serializer: &mut FieldSerializer,
    ) -> io::Result<()>;

    /// Tokenizes a text and subscribes every one of its tokens.
    ///
    /// `term_buffer` is used as scratch space: each token is appended after
    /// the bytes it already contains, and the buffer is truncated back to its
    /// initial length before returning. `indexing_position` is updated with
    /// the number of tokens indexed and the new end position.
    fn index_text(
        &mut self,
        doc_id: DocId,
        token_stream: &mut dyn TokenStream,
        term_buffer: &mut IndexingTerm,
        ctx: &mut IndexingContext,
        indexing_position: &mut IndexingPosition,
    ) {
        let prefix_len = term_buffer.len_bytes();
        // Token positions are relative to the text: shift them by where the
        // previously indexed text ended.
        let base_position = indexing_position.end_position;
        let mut furthest_position = base_position;
        let mut token_count = 0;
        token_stream.process(&mut |token: &Token| {
            let token_len = token.text.len();
            // Tokens longer than MAX_TOKEN_LEN are dropped instead of being indexed.
            if token_len > MAX_TOKEN_LEN {
                warn!(
                    "A token exceeding MAX_TOKEN_LEN ({}>{}) was dropped. Search for \
                     MAX_TOKEN_LEN in the documentation for more information.",
                    token_len,
                    MAX_TOKEN_LEN
                );
                return;
            }
            term_buffer.truncate_value_bytes(prefix_len);
            term_buffer.append_bytes(token.text.as_bytes());
            let start_position = base_position + token.position as u32;
            let token_end = start_position + token.position_length as u32;
            furthest_position = furthest_position.max(token_end);
            self.subscribe(doc_id, start_position, term_buffer, ctx);
            token_count += 1;
        });

        indexing_position.end_position = furthest_position + POSITION_GAP;
        indexing_position.num_tokens += token_count;
        term_buffer.truncate_value_bytes(prefix_len);
    }

    /// Total number of tokens this writer has recorded.
    fn total_num_tokens(&self) -> u64;
}

/// The `SpecializedPostingsWriter` is just here to remove dynamic
/// dispatch to the recorder information.
///
/// The recorder type `Rec` is only a compile-time parameter: recorder values
/// themselves are read from and written to the term index of the
/// `IndexingContext`, not stored in this struct.
#[derive(Default)]
pub(crate) struct SpecializedPostingsWriter<Rec: Recorder> {
    /// Incremented once per `subscribe` call.
    total_num_tokens: u64,
    /// Ties the writer to its recorder type without storing a recorder.
    _recorder_type: PhantomData<Rec>,
}

/// Type-erases a `SpecializedPostingsWriter` by boxing it as a `dyn PostingsWriter`.
impl<Rec: Recorder> From<SpecializedPostingsWriter<Rec>> for Box<dyn PostingsWriter> {
    fn from(writer: SpecializedPostingsWriter<Rec>) -> Self {
        Box::new(writer)
    }
}

impl<Rec: Recorder> SpecializedPostingsWriter<Rec> {
    /// Serializes the posting list of a single term.
    ///
    /// The recorder stored at `addr` in the term index is read back, a new
    /// term is opened on `serializer`, the recorder pushes its documents,
    /// and the term is closed. A recorder that does not track the document
    /// frequency reports `0` to the serializer.
    #[inline]
    pub(crate) fn serialize_one_term(
        term: &[u8],
        addr: Addr,
        buffer_lender: &mut BufferLender,
        ctx: &IndexingContext,
        serializer: &mut FieldSerializer,
    ) -> io::Result<()> {
        let recorder: Rec = ctx.term_index.read(addr);
        let doc_freq = recorder.term_doc_freq().unwrap_or_default();
        let with_term_freq = recorder.has_term_freq();
        serializer.new_term(term, doc_freq, with_term_freq)?;
        recorder.serialize(&ctx.arena, serializer, buffer_lender);
        serializer.close_term()?;
        Ok(())
    }
}

impl<Rec: Recorder> PostingsWriter for SpecializedPostingsWriter<Rec> {
    /// Records one occurrence of `term` in `doc` at `position`.
    ///
    /// The recorder associated with the term is fetched from (or created in)
    /// the term index. When the occurrence belongs to a different document
    /// than the recorder's current one, the current document is closed and a
    /// new one is opened before the position is recorded.
    #[inline]
    fn subscribe(
        &mut self,
        doc: DocId,
        position: u32,
        term: &IndexingTerm,
        ctx: &mut IndexingContext,
    ) {
        debug_assert!(term.serialized_term().len() >= 4);
        self.total_num_tokens += 1;
        let (term_index, arena) = (&mut ctx.term_index, &mut ctx.arena);
        term_index.mutate_or_create(term.serialized_term(), |opt_recorder: Option<Rec>| {
            let mut recorder = match opt_recorder {
                Some(mut known) => {
                    if known.current_doc() != doc {
                        known.close_doc(arena);
                        known.new_doc(doc, arena);
                    }
                    known
                }
                None => {
                    let mut fresh = Rec::default();
                    fresh.new_doc(doc, arena);
                    fresh
                }
            };
            recorder.record_position(position, arena);
            recorder
        });
    }

    /// Serializes every term of `term_addrs`, in order, using a single
    /// `BufferLender` shared across terms.
    fn serialize(
        &self,
        term_addrs: &[(Field, OrderedPathId, &[u8], Addr)],
        _ordered_id_to_path: &[&str],
        ctx: &IndexingContext,
        serializer: &mut FieldSerializer,
    ) -> io::Result<()> {
        let mut buffer_lender = BufferLender::default();
        for &(_, _, term, addr) in term_addrs {
            Self::serialize_one_term(term, addr, &mut buffer_lender, ctx, serializer)?;
        }
        Ok(())
    }

    /// Number of `subscribe` calls received so far.
    fn total_num_tokens(&self) -> u64 {
        self.total_num_tokens
    }
}


================================================
FILE: src/postings/recorder.rs
================================================
use common::read_u32_vint;
use stacker::{ExpUnrolledLinkedList, MemoryArena};

use crate::postings::FieldSerializer;
use crate::DocId;

/// Marker written by `TfAndPositionRecorder::close_doc` after the positions of
/// a document. Positions themselves are recorded as `position + 1`.
const POSITION_END: u32 = 0;

/// Pair of reusable scratch buffers.
///
/// Buffers are handed out emptied; their allocation is kept between uses.
#[derive(Default)]
pub(crate) struct BufferLender {
    buffer_u8: Vec<u8>,
    buffer_u32: Vec<u32>,
}

impl BufferLender {
    /// Lends the byte buffer, emptied. The `u32` buffer is left untouched.
    pub fn lend_u8(&mut self) -> &mut Vec<u8> {
        let bytes = &mut self.buffer_u8;
        bytes.clear();
        bytes
    }

    /// Lends both buffers, emptied.
    pub fn lend_all(&mut self) -> (&mut Vec<u8>, &mut Vec<u32>) {
        let BufferLender {
            buffer_u8,
            buffer_u32,
        } = self;
        buffer_u8.clear();
        buffer_u32.clear();
        (buffer_u8, buffer_u32)
    }
}

/// Iterator decoding consecutive `u32` vints from a byte slice.
pub struct VInt32Reader<'a> {
    data: &'a [u8],
}

impl<'a> VInt32Reader<'a> {
    /// Creates a reader over `data`.
    fn new(data: &'a [u8]) -> VInt32Reader<'a> {
        Self { data }
    }
}

impl Iterator for VInt32Reader<'_> {
    type Item = u32;

    /// Decodes the next value, or returns `None` once no byte is left.
    fn next(&mut self) -> Option<u32> {
        if self.data.is_empty() {
            return None;
        }
        Some(read_u32_vint(&mut self.data))
    }
}

/// `Recorder` is in charge of recording relevant information about
/// the presence of a term in a document.
///
/// Depending on the [`TextOptions`](crate::schema::TextOptions) associated
/// with the field, the recorder may record:
///   * the document frequency
///   * the document id
///   * the term frequency
///   * the term positions
pub(crate) trait Recorder: Copy + Default + Send + Sync + 'static {
    /// Returns the current document
    fn current_doc(&self) -> u32;
    /// Starts recording information about a new document
    /// This method shall only be called if the term is within the document.
    fn new_doc(&mut self, doc: DocId, arena: &mut MemoryArena);
    /// Record the position of a term. For each document,
    /// this method will be called `term_freq` times.
    fn record_position(&mut self, position: u32, arena: &mut MemoryArena);
    /// Close the document. It will help record the term frequency.
    fn close_doc(&mut self, arena: &mut MemoryArena);
    /// Pushes the postings information to the serializer.
    ///
    /// `buffer_lender` provides scratch buffers that are reused across terms.
    fn serialize(
        &self,
        arena: &MemoryArena,
        serializer: &mut FieldSerializer<'_>,
        buffer_lender: &mut BufferLender,
    );
    /// Returns the number of documents containing this term.
    ///
    /// Returns `None` if not available.
    fn term_doc_freq(&self) -> Option<u32>;

    /// Whether this recorder keeps track of term frequencies.
    ///
    /// Defaults to `true`; recorders that only store doc ids override it.
    #[inline]
    fn has_term_freq(&self) -> bool {
        true
    }
}

/// Only records the doc ids
///
/// Doc ids are stored as vint-encoded deltas from the previously recorded doc.
#[derive(Clone, Copy, Default)]
pub struct DocIdRecorder {
    stack: ExpUnrolledLinkedList,
    current_doc: DocId,
}

impl Recorder for DocIdRecorder {
    #[inline]
    fn current_doc(&self) -> DocId {
        self.current_doc
    }

    /// Appends the delta between `doc` and the previously recorded doc.
    #[inline]
    fn new_doc(&mut self, doc: DocId, arena: &mut MemoryArena) {
        let previous_doc = self.current_doc;
        self.current_doc = doc;
        self.stack.writer(arena).write_u32_vint(doc - previous_doc);
    }

    /// Positions are not recorded by this recorder.
    #[inline]
    fn record_position(&mut self, _position: u32, _arena: &mut MemoryArena) {}

    /// Nothing needs to be flushed when a document ends.
    #[inline]
    fn close_doc(&mut self, _arena: &mut MemoryArena) {}

    /// Decodes the recorded deltas and writes each doc id with a term
    /// frequency of `0` and no positions.
    fn serialize(
        &self,
        arena: &MemoryArena,
        serializer: &mut FieldSerializer<'_>,
        buffer_lender: &mut BufferLender,
    ) {
        let buffer = buffer_lender.lend_u8();
        // TODO avoid reading twice.
        self.stack.read_to_end(arena, buffer);
        let doc_ids = get_sum_reader(VInt32Reader::new(&buffer[..]));
        doc_ids.for_each(|doc_id| {
            serializer.write_doc(doc_id, 0u32, &[][..]);
        });
    }

    /// The document frequency is not tracked by this recorder.
    fn term_doc_freq(&self) -> Option<u32> {
        None
    }

    fn has_term_freq(&self) -> bool {
        false
    }
}

/// Turns an iterator of deltas into an iterator of running totals.
///
/// The n-th item yielded is the sum of the first n deltas.
fn get_sum_reader(iter: impl Iterator<Item = u32>) -> impl Iterator<Item = u32> {
    let mut running_total = 0;
    iter.map(move |delta| {
        running_total += delta;
        running_total
    })
}

/// Recorder encoding document ids, and term frequencies
///
/// The stack holds, for each document, the vint delta of its doc id followed
/// by its term frequency. The frequency of the document currently being
/// recorded is only kept in `current_tf` until `close_doc` is called.
#[derive(Clone, Copy, Default)]
pub struct TermFrequencyRecorder {
    stack: ExpUnrolledLinkedList,
    current_doc: DocId,
    current_tf: u32,
    term_doc_freq: u32,
}

impl Recorder for TermFrequencyRecorder {
    #[inline]
    fn current_doc(&self) -> DocId {
        self.current_doc
    }

    /// Counts one more document and appends its doc id delta.
    #[inline]
    fn new_doc(&mut self, doc: DocId, arena: &mut MemoryArena) {
        let previous_doc = self.current_doc;
        self.current_doc = doc;
        self.term_doc_freq += 1;
        self.stack.writer(arena).write_u32_vint(doc - previous_doc);
    }

    /// Only the number of occurrences is tracked, not the position itself.
    #[inline]
    fn record_position(&mut self, _position: u32, _arena: &mut MemoryArena) {
        self.current_tf += 1;
    }

    /// Appends the term frequency of the document and resets the counter.
    #[inline]
    fn close_doc(&mut self, arena: &mut MemoryArena) {
        debug_assert!(self.current_tf > 0);
        self.stack.writer(arena).write_u32_vint(self.current_tf);
        self.current_tf = 0;
    }

    /// Decodes the (doc delta, term frequency) pairs and writes them out.
    fn serialize(
        &self,
        arena: &MemoryArena,
        serializer: &mut FieldSerializer<'_>,
        buffer_lender: &mut BufferLender,
    ) {
        let buffer = buffer_lender.lend_u8();
        self.stack.read_to_end(arena, buffer);
        let mut vints = VInt32Reader::new(&buffer[..]);
        let mut doc_id = 0;
        while let Some(doc_delta) = vints.next() {
            doc_id += doc_delta;
            // The last document may not have been closed yet: its frequency
            // is then still held in `current_tf` rather than in the stack.
            let term_freq = vints.next().unwrap_or(self.current_tf);
            serializer.write_doc(doc_id, term_freq, &[][..]);
        }
    }

    fn term_doc_freq(&self) -> Option<u32> {
        Some(self.term_doc_freq)
    }
}

/// Recorder encoding term frequencies as well as positions.
///
/// The stack holds, for each document, the vint delta of its doc id,
/// followed by each position stored as `position + 1`, followed by
/// `POSITION_END` once the document has been closed.
#[derive(Clone, Copy, Default)]
pub struct TfAndPositionRecorder {
    stack: ExpUnrolledLinkedList,
    current_doc: DocId,
    term_doc_freq: u32,
}

impl Recorder for TfAndPositionRecorder {
    #[inline]
    fn current_doc(&self) -> DocId {
        self.current_doc
    }

    /// Counts one more document and appends its doc id delta.
    #[inline]
    fn new_doc(&mut self, doc: DocId, arena: &mut MemoryArena) {
        let previous_doc = self.current_doc;
        self.current_doc = doc;
        self.term_doc_freq += 1u32;
        self.stack.writer(arena).write_u32_vint(doc - previous_doc);
    }

    /// Appends `position + 1` (wrapping).
    #[inline]
    fn record_position(&mut self, position: u32, arena: &mut MemoryArena) {
        let position_plus_one = position.wrapping_add(1u32);
        self.stack.writer(arena).write_u32_vint(position_plus_one);
    }

    /// Terminates the positions of the current document.
    #[inline]
    fn close_doc(&mut self, arena: &mut MemoryArena) {
        self.stack.writer(arena).write_u32_vint(POSITION_END);
    }

    /// Decodes each document and writes it with its delta-encoded positions;
    /// the term frequency passed along is the number of positions decoded.
    fn serialize(
        &self,
        arena: &MemoryArena,
        serializer: &mut FieldSerializer<'_>,
        buffer_lender: &mut BufferLender,
    ) {
        let (buffer_u8, buffer_positions) = buffer_lender.lend_all();
        self.stack.read_to_end(arena, buffer_u8);
        let mut vints = VInt32Reader::new(&buffer_u8[..]);
        let mut doc_id = 0;
        while let Some(doc_delta) = vints.next() {
            doc_id += doc_delta;
            buffer_positions.clear();
            let mut prev_position_plus_one = 1u32;
            // Read positions until the end marker, or until the data runs out
            // (the last document may not have been closed).
            for position_plus_one in vints.by_ref() {
                if position_plus_one == POSITION_END {
                    break;
                }
                buffer_positions.push(position_plus_one - prev_position_plus_one);
                prev_position_plus_one = position_plus_one;
            }
            serializer.write_doc(doc_id, buffer_positions.len() as u32, buffer_positions);
        }
    }

    fn term_doc_freq(&self) -> Option<u32> {
        Some(self.term_doc_freq)
    }
}

#[cfg(test)]
mod tests {

    use common::write_u32_vint;

    use super::{BufferLender, VInt32Reader};

    /// A lent buffer must come back empty, even if a previous borrower wrote to it.
    #[test]
    fn test_buffer_lender() {
        let mut buffer_lender = BufferLender::default();
        for _ in 0..2 {
            let bytes = buffer_lender.lend_u8();
            assert!(bytes.is_empty());
            bytes.push(1u8);
        }
        for _ in 0..2 {
            let (_, ints) = buffer_lender.lend_all();
            assert!(ints.is_empty());
            ints.push(1u32);
        }
    }

    /// Values written as vints are read back unchanged by `VInt32Reader`.
    #[test]
    fn test_vint_u32() {
        let vals = [0, 1, 324_234_234, u32::MAX];
        let mut buffer = vec![];
        for &val in &vals {
            assert!(write_u32_vint(val, &mut buffer).is_ok());
        }
        assert_eq!(buffer.len(), 1 + 1 + 5 + 5);
        let decoded: Vec<u32> = VInt32Reader::new(&buffer[..]).collect();
        assert_eq!(&decoded[..], &vals[..]);
    }
}


================================================
FILE: src/postings/segment_postings.rs
================================================
use common::HasLen;

use crate::docset::DocSet;
use crate::fastfield::AliveBitSet;
use crate::positions::PositionReader;
use crate::postings::compression::COMPRESSION_BLOCK_SIZE;
use crate::postings::{BlockSegmentPostings, Postings};
use crate::{DocId, TERMINATED};

/// `SegmentPostings` represents the inverted list or postings associated with
/// a term in a `Segment`.
///
/// As we iterate through the `SegmentPostings`, the frequencies are optionally decoded.
/// Positions on the other hand, are optionally entirely decoded upfront.
#[derive(Clone)]
pub struct SegmentPostings {
    /// Cursor over the blocks of the posting list.
    pub(crate) block_cursor: BlockSegmentPostings,
    /// Index of the current document within the current block.
    cur: usize,
    /// Reader for the positions; when `None`, no positions are returned.
    position_reader: Option<PositionReader>,
}

impl SegmentPostings {
    /// Returns an empty segment postings object
    pub fn empty() -> Self {
        Self::from_block_postings(BlockSegmentPostings::empty(), None)
    }

    /// Compute the number of non-deleted documents.
    ///
    /// This method will clone and scan through the posting lists.
    /// (this is a rather expensive operation).
    pub fn doc_freq_given_deletes(&self, alive_bitset: &AliveBitSet) -> u32 {
        let mut cursor = self.clone();
        let mut alive_count = 0u32;
        let mut doc = cursor.doc();
        while doc != TERMINATED {
            if alive_bitset.is_alive(doc) {
                alive_count += 1u32;
            }
            doc = cursor.advance();
        }
        alive_count
    }

    /// Returns the overall number of documents in the block postings.
    /// It does not take in account whether documents are deleted or not.
    pub fn doc_freq(&self) -> u32 {
        self.block_cursor.doc_freq()
    }

    /// Creates a segment postings object with the given documents
    /// and no frequency encoded.
    ///
    /// This method is mostly useful for unit tests.
    ///
    /// It serializes the doc ids using tantivy's codec
    /// and returns a `SegmentPostings` object that embeds a
    /// buffer with the serialized data.
    #[cfg(test)]
    pub fn create_from_docs(docs: &[u32]) -> SegmentPostings {
        use crate::directory::FileSlice;
        use crate::postings::serializer::PostingsSerializer;
        use crate::schema::IndexRecordOption;
        let doc_freq = docs.len() as u32;
        let mut buffer = Vec::new();
        let mut postings_serializer =
            PostingsSerializer::new(0.0, IndexRecordOption::Basic, None);
        postings_serializer.new_term(doc_freq, false);
        for &doc in docs {
            postings_serializer.write_doc(doc, 1u32);
        }
        postings_serializer
            .close_term(doc_freq, &mut buffer)
            .expect("In memory Serialization should never fail.");
        let block_segment_postings = BlockSegmentPostings::open(
            doc_freq,
            FileSlice::from(buffer),
            IndexRecordOption::Basic,
            IndexRecordOption::Basic,
        )
        .unwrap();
        SegmentPostings::from_block_postings(block_segment_postings, None)
    }

    /// Helper functions to create `SegmentPostings` for tests.
    ///
    /// Serializes the given `(doc, term frequency)` pairs with term
    /// frequencies enabled. When `fieldnorms` is provided, it is used both to
    /// build the fieldnorm reader and to compute the average fieldnorm
    /// (`0.0` when absent or empty).
    #[cfg(test)]
    pub fn create_from_docs_and_tfs(
        doc_and_tfs: &[(u32, u32)],
        fieldnorms: Option<&[u32]>,
    ) -> SegmentPostings {
        use crate::directory::FileSlice;
        use crate::fieldnorm::FieldNormReader;
        use crate::postings::serializer::PostingsSerializer;
        use crate::schema::IndexRecordOption;
        use crate::Score;
        let doc_freq = doc_and_tfs.len() as u32;
        let mut buffer: Vec<u8> = Vec::new();
        let fieldnorm_reader = fieldnorms.map(FieldNormReader::for_test);
        let average_field_norm: Score = match fieldnorms {
            Some(norms) if !norms.is_empty() => {
                let total_num_tokens: u64 = norms.iter().map(|&norm| u64::from(norm)).sum();
                total_num_tokens as Score / norms.len() as Score
            }
            _ => 0.0,
        };
        let mut postings_serializer = PostingsSerializer::new(
            average_field_norm,
            IndexRecordOption::WithFreqs,
            fieldnorm_reader,
        );
        postings_serializer.new_term(doc_freq, true);
        for &(doc, tf) in doc_and_tfs {
            postings_serializer.write_doc(doc, tf);
        }
        postings_serializer
            .close_term(doc_freq, &mut buffer)
            .unwrap();
        let block_segment_postings = BlockSegmentPostings::open(
            doc_freq,
            FileSlice::from(buffer),
            IndexRecordOption::WithFreqs,
            IndexRecordOption::WithFreqs,
        )
        .unwrap();
        SegmentPostings::from_block_postings(block_segment_postings, None)
    }

    /// Builds a `SegmentPostings` on top of an already opened block cursor.
    ///
    /// * `segment_block_postings` - the block cursor over the posting list.
    /// * `position_reader` - reader used to decode positions, if any.
    ///
    /// The in-block cursor starts at index 0.
    pub(crate) fn from_block_postings(
        segment_block_postings: BlockSegmentPostings,
        position_reader: Option<PositionReader>,
    ) -> SegmentPostings {
        SegmentPostings {
            block_cursor: segment_block_postings,
            cur: 0,
            position_reader,
        }
    }
}

impl DocSet for SegmentPostings {
    // goes to the next element.
    // next needs to be called a first time to point to the correct element.
    //
    // Returns the doc the postings point to after the move.
    #[inline]
    fn advance(&mut self) -> DocId {
        debug_assert!(self.block_cursor.block_is_loaded());
        // When sitting on the last slot of the block, move the block cursor
        // forward and restart from slot 0; otherwise just step within the block.
        if self.cur == COMPRESSION_BLOCK_SIZE - 1 {
            self.cur = 0;
            self.block_cursor.advance();
        } else {
            self.cur += 1;
        }
        self.doc()
    }

    /// Moves to the first doc that is greater than or equal to `target` and returns it.
    ///
    /// `target` is expected to be at least the current doc (checked in debug builds).
    #[inline]
    fn seek(&mut self, target: DocId) -> DocId {
        debug_assert!(self.doc() <= target);
        // Already positioned on a suitable doc: nothing to do.
        if self.doc() >= target {
            return self.doc();
        }

        // As an optimization, if the block is already loaded, we can
        // cheaply check the next doc.
        // The in-block index is capped at the last slot of the block.
        self.cur = (self.cur + 1).min(COMPRESSION_BLOCK_SIZE - 1);
        if self.doc() >= target {
            return self.doc();
        }

        // Delegate block-local search to BlockSegmentPostings::seek, which returns
        // the in-block index of the first doc >= target.
        self.cur = self.block_cursor.seek(target);
        let doc = self.doc();
        debug_assert!(doc >= target);
        doc
    }

    /// Return the current document's `DocId`.
    #[inline]
    fn doc(&self) -> DocId {
        self.block_cursor.doc(self.cur)
    }

    /// Returns the document frequency of the posting list (see `HasLen::len`).
    fn size_hint(&self) -> u32 {
        self.len() as u32
    }
}

impl HasLen for SegmentPostings {
    /// Number of documents in the posting list, as reported by the block cursor.
    fn len(&self) -> usize {
        let doc_freq: u32 = self.block_cursor.doc_freq();
        doc_freq as usize
    }
}

impl Postings for SegmentPostings {
    /// Returns the frequency associated with the current document.
    /// If the schema is set up so that no frequency have been encoded,
    /// this method should always return 1.
    ///
    /// # Panics
    ///
    /// Will panic if called without having called advance before.
    fn term_freq(&self) -> u32 {
        debug_assert!(
            // The length of `freqs()` is deliberately not used here:
            // asking for the frequency of a doc is fine even when no
            // frequency was encoded for the field.
            //
            // In that case the block is read just as if frequencies had been
            // decoded; it is simply prefilled with the value 1.
            self.cur < COMPRESSION_BLOCK_SIZE,
            "Have you forgotten to call `.advance()` at least once before calling `.term_freq()`."
        );
        self.block_cursor.freq(self.cur)
    }

    /// Appends the positions of the term in the current document to `output`,
    /// shifted by `offset`. Nothing is appended when there is no position reader.
    fn append_positions_with_offset(&mut self, offset: u32, output: &mut Vec<u32>) {
        let term_freq = self.term_freq();
        let start = output.len();
        if let Some(position_reader) = self.position_reader.as_mut() {
            debug_assert!(
                !self.block_cursor.freqs().is_empty(),
                "No positions available"
            );
            // Positions of the current doc start after those of the docs
            // preceding it in the block.
            let preceding_freqs: u32 = self.block_cursor.freqs()[..self.cur]
                .iter()
                .copied()
                .sum::<u32>();
            let read_offset = self.block_cursor.position_offset() + (preceding_freqs as u64);
            // TODO: instead of zeroing the output, we could use MaybeUninit or similar.
            output.resize(start + term_freq as usize, 0u32);
            position_reader.read(read_offset, &mut output[start..]);
            // The values read are deltas: turn them into absolute positions.
            let mut running_position = offset;
            for slot in output[start..].iter_mut() {
                running_position += *slot;
                *slot = running_position;
            }
        }
    }
}

#[cfg(test)]
mod tests {

    use common::HasLen;

    use super::SegmentPostings;
    use crate::docset::{DocSet, TERMINATED};
    use crate::fastfield::AliveBitSet;
    use crate::postings::postings::Postings;

    /// Advancing empty postings keeps returning `TERMINATED`.
    #[test]
    fn test_empty_segment_postings() {
        let mut postings = SegmentPostings::empty();
        assert_eq!(postings.advance(), TERMINATED);
        assert_eq!(postings.advance(), TERMINATED);
        assert_eq!(postings.len(), 0);
    }

    /// Empty postings are terminated right away, even before any `advance`.
    #[test]
    fn test_empty_postings_doc_returns_terminated() {
        let mut postings = SegmentPostings::empty();
        assert_eq!(postings.doc(), TERMINATED);
        assert_eq!(postings.advance(), TERMINATED);
    }

    /// Empty postings report a term frequency of 1.
    /// (The test used to be named `..._returns_0` while asserting 1.)
    #[test]
    fn test_empty_postings_term_freq_returns_1() {
        let postings = SegmentPostings::empty();
        assert_eq!(postings.term_freq(), 1);
    }

    /// `doc_freq` ignores deletes, `doc_freq_given_deletes` only counts alive docs.
    #[test]
    fn test_doc_freq() {
        let docs = SegmentPostings::create_from_docs(&[0, 2, 10]);
        assert_eq!(docs.doc_freq(), 3);
        let alive_bitset = AliveBitSet::for_test_from_deleted_docs(&[2], 12);
        assert_eq!(docs.doc_freq_given_deletes(&alive_bitset), 2);
        let all_deleted =
            AliveBitSet::for_test_from_deleted_docs(&[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11], 12);
        assert_eq!(docs.doc_freq_given_deletes(&all_deleted), 0);
    }
}


================================================
FILE: src/postings/serializer.rs
================================================
use std::cmp::Ordering;
use std::io::{self, Write};

use common::{BinarySerializable, CountingWriter, VInt};

use super::TermInfo;
use crate::directory::{CompositeWrite, WritePtr};
use crate::fieldnorm::FieldNormReader;
use crate::index::Segment;
use crate::positions::PositionSerializer;
use crate::postings::compression::{BlockEncoder, VIntEncoder, COMPRESSION_BLOCK_SIZE};
use crate::postings::skip::SkipSerializer;
use crate::query::Bm25Weight;
use crate::schema::{Field, FieldEntry, IndexRecordOption, Schema};
use crate::termdict::TermDictionaryBuilder;
use crate::{DocId, Score};

/// `InvertedIndexSerializer` is in charge of serializing
/// postings on disk, in the
/// * `.idx` (inverted index)
/// * `.pos` (positions file)
/// * `.term` (term dictionary)
///
/// `PostingsWriter` are in charge of pushing the data to the
/// serializer.
///
/// The serializer expects to receive the following calls
/// in this order (`new_field` returns a `FieldSerializer`, on which
/// the per-term calls are made):
/// * `new_field(...)`
/// * `new_term(...)`
/// * `write_doc(...)`
/// * `write_doc(...)`
/// * `write_doc(...)`
/// * ...
/// * `close_term()`
/// * `new_term(...)`
/// * `write_doc(...)`
/// * ...
/// * `close_term()`
/// * `new_field(...)`
/// * ...
/// * `close()`
///
/// Terms have to be pushed in a lexicographically-sorted order.
/// Within a term, documents have to be pushed in increasing order.
///
/// A description of the serialization format is
/// [available here](https://fulmicoton.gitbooks.io/tantivy-doc/content/inverted-index.html).
pub struct InvertedIndexSerializer {
    /// Writer for the `Terms` segment component.
    terms_write: CompositeWrite<WritePtr>,
    /// Writer for the `Postings` segment component.
    postings_write: CompositeWrite<WritePtr>,
    /// Writer for the `Positions` segment component.
    positions_write: CompositeWrite<WritePtr>,
    /// Schema of the segment, used to look up the options of each field.
    schema: Schema,
}

impl InvertedIndexSerializer {
    /// Open a new `InvertedIndexSerializer` for the given segment
    pub fn open(segment: &mut Segment) -> crate::Result<InvertedIndexSerializer> {
        use crate::index::SegmentComponent::{Positions, Postings, Terms};
        let inv_index_serializer = InvertedIndexSerializer {
            terms_write: CompositeWrite::wrap(segment.open_write(Terms)?),
            postings_write: CompositeWrite::wrap(segment.open_write(Postings)?),
            positions_write: CompositeWrite::wrap(segment.open_write(Positions)?),
            schema: segment.schema(),
        };
        Ok(inv_index_serializer)
    }

    /// Must be called before starting pushing terms of
    /// a given field.
    ///
    /// Loads the indexing options for the given field.
    pub fn new_field(
        &mut self,
        field: Field,
        total_num_tokens: u64,
        fieldnorm_reader: Option<FieldNormReader>,
    ) -> io::Result<FieldSerializer<'_>> {
        let field_entry: &FieldEntry = self.schema.get_field_entry(field);
        let term_dictionary_write = self.terms_write.for_field(field);
        let postings_write = self.postings_write.for_field(field);
        let positions_write = self.positions_write.for_field(field);
        let index_record_option = field_entry
            .field_type()
            .index_record_option()
            .unwrap_or(IndexRecordOption::Basic);
        FieldSerializer::create(
            index_record_option,
            total_num_tokens,
            term_dictionary_write,
            postings_write,
            positions_write,
            fieldnorm_reader,
        )
    }

    /// Closes the serializer.
    pub fn close(self) -> io::Result<()> {
        self.terms_write.close()?;
        self.postings_write.close()?;
        self.positions_write.close()?;
        Ok(())
    }
}

/// The field serializer is in charge of
/// the serialization of a specific field.
pub struct FieldSerializer<'a, W: Write = WritePtr> {
    term_dictionary_builder: TermDictionaryBuilder<&'a mut CountingWriter<W>>,
    postings_serializer: PostingsSerializer,
    positions_serializer_opt: Option<PositionSerializer<&'a mut CountingWriter<W>>>,
    current_term_info: TermInfo,
    term_open: bool,
    postings_write: &'a mut CountingWriter<W>,
    postings_start_offset: u64,
}

impl<'a, W: Write> FieldSerializer<'a, W> {
    /// Creates a new `FieldSerializer` for the given field type.
    pub fn create(
        index_record_option: IndexRecordOption,
        total_num_tokens: u64,
        term_dictionary_write: &'a mut CountingWriter<W>,
        postings_write: &'a mut CountingWriter<W>,
        positions_write: &'a mut CountingWriter<W>,
        fieldnorm_reader: Option<FieldNormReader>,
    ) -> io::Result<FieldSerializer<'a, W>> {
        total_num_tokens.serialize(postings_write)?;
        let term_dictionary_builder = TermDictionaryBuilder::create(term_dictionary_write)?;
        let average_fieldnorm = fieldnorm_reader
            .as_ref()
            .map(|ff_reader| total_num_tokens as Score / ff_reader.num_docs() as Score)
            .unwrap_or(0.0);
        let postings_serializer =
            PostingsSerializer::new(average_fieldnorm, index_record_option, fieldnorm_reader);
        let positions_serializer_opt = if index_record_option.has_positions() {
            Some(PositionSerializer::new(positions_write))
        } else {
            None
        };

        let postings_start_offset = postings_write.written_bytes();
        Ok(FieldSerializer {
            term_dictionary_builder,
            postings_serializer,
            positions_serializer_opt,
            current_term_info: TermInfo::default(),
            term_open: false,
            postings_write,
            postings_start_offset,
        })
    }

    fn postings_offset(&self) -> usize {
        (self.postings_write.written_bytes() - self.postings_start_offset) as usize
    }

    fn current_term_info(&self) -> TermInfo {
        let positions_start =
            if let Some(positions_serializer) = self.positions_serializer_opt.as_ref() {
                positions_serializer.written_bytes()
            } else {
                0u64
            } as usize;
        let addr = self.postings_offset();
        TermInfo {
            doc_freq: 0,
            postings_range: addr..addr,
            positions_range: positions_start..positions_start,
        }
    }

    /// Starts the postings for a new term.
    /// * term - the term. It needs to come after the previous term according to the lexicographical
    ///   order.
    /// * term_doc_freq - return the number of document containing the term.
    pub fn new_term(
        &mut self,
        term: &[u8],
        term_doc_freq: u32,
        record_term_freq: bool,
    ) -> io::Result<()> {
        assert!(
            !self.term_open,
            "Called new_term, while the previous term was not closed."
        );
        self.term_open = true;
        self.postings_serializer.clear();
        self.current_term_info = self.current_term_info();
        self.term_dictionary_builder.insert_key(term)?;
        self.postings_serializer
            .new_term(term_doc_freq, record_term_freq);
        Ok(())
    }

    /// Starts the postings for a new term without recording term frequencies.
    pub fn new_term_without_freq(&mut self, term: &[u8]) -> io::Result<()> {
        self.new_term(term, 0, false)
    }

    /// Serialize the information that a document contains for the current term:
    /// its term frequency, and the position deltas.
    ///
    /// At this point, the positions are already `delta-encoded`.
    /// For instance, if the positions are `2, 3, 17`,
    /// `position_deltas` is `2, 1, 14`
    ///
    /// Term frequencies and positions may be ignored by the serializer depending
    /// on the configuration of the field in the `Schema`.
    pub fn write_doc(&mut self, doc_id: DocId, term_freq: u32, position_deltas: &[u32]) {
        self.current_term_info.doc_freq += 1;
        self.postings_serializer.write_doc(doc_id, term_freq);
        if let Some(ref mut positions_serializer) = self.positions_serializer_opt.as_mut() {
            assert_eq!(term_freq as usize, position_deltas.len());
            positions_serializer.write_positions_delta(position_deltas);
        }
    }

    /// Finish the serialization for this term postings.
    ///
    /// If the current block is incomplete, it needs to be encoded
    /// using `VInt` encoding.
    pub fn close_term(&mut self) -> io::Result<()> {
        crate::fail_point!("FieldSerializer::close_term", |msg: Option<String>| {
            Err(io::Error::new(io::ErrorKind::Other, format!("{msg:?}")))
        });

        if !self.term_open {
            return Ok(());
        };

        self.postings_serializer
            .close_term(self.current_term_info.doc_freq, self.postings_write)?;
        self.current_term_info.postings_range.end = self.postings_offset();
        if let Some(positions_serializer) = self.positions_serializer_opt.as_mut() {
            positions_serializer.close_term()?;
            self.current_term_info.positions_range.end =
                positions_serializer.written_bytes() as usize;
        }
        self.term_dictionary_builder
            .insert_value(&self.current_term_info)?;
        self.term_open = false;
        Ok(())
    }

    /// Closes the current field.
    pub fn close(mut self) -> io::Result<()> {
        self.close_term()?;
        if let Some(positions_serializer) = self.positions_serializer_opt {
            positions_serializer.close()?;
        }
        self.postings_write.flush()?;
        self.term_dictionary_builder.finish()?;
        Ok(())
    }
}

/// Fixed-capacity buffer holding the doc ids and term frequencies of the
/// block currently being filled. Only the first `len` entries are meaningful.
struct Block {
    doc_ids: [DocId; COMPRESSION_BLOCK_SIZE],
    term_freqs: [u32; COMPRESSION_BLOCK_SIZE],
    len: usize,
}

impl Block {
    /// Creates an empty block.
    fn new() -> Self {
        Self {
            doc_ids: [0; COMPRESSION_BLOCK_SIZE],
            term_freqs: [0; COMPRESSION_BLOCK_SIZE],
            len: 0,
        }
    }

    /// Doc ids appended since the last `clear`.
    fn doc_ids(&self) -> &[DocId] {
        let filled = 0..self.len;
        &self.doc_ids[filled]
    }

    /// Term frequencies appended since the last `clear`.
    fn term_freqs(&self) -> &[u32] {
        let filled = 0..self.len;
        &self.term_freqs[filled]
    }

    /// Empties the block. The backing arrays are left untouched.
    fn clear(&mut self) {
        self.len = 0;
    }

    /// Appends a `(doc, term_freq)` pair.
    ///
    /// Panics (index out of bounds) if the block is already full.
    fn append_doc(&mut self, doc: DocId, term_freq: u32) {
        let slot = self.len;
        self.doc_ids[slot] = doc;
        self.term_freqs[slot] = term_freq;
        self.len += 1;
    }

    /// True once the block holds `COMPRESSION_BLOCK_SIZE` documents.
    fn is_full(&self) -> bool {
        COMPRESSION_BLOCK_SIZE == self.len
    }

    /// True if no document has been appended since the last `clear`.
    fn is_empty(&self) -> bool {
        0 == self.len
    }

    /// Last doc id of a full block.
    ///
    /// Panics if the block is not full.
    fn last_doc(&self) -> DocId {
        assert_eq!(self.len, COMPRESSION_BLOCK_SIZE);
        self.doc_ids[self.len - 1]
    }
}

/// Serializer for postings lists.
///
/// Documents of the current term are buffered in a [`Block`]. Every time the
/// block is full it is bit-packed and appended to an in-memory postings buffer,
/// together with one entry in the skip data. When the term is closed, the
/// leftover documents are VInt-encoded, and the skip data followed by the
/// postings buffer are written to the output.
///
/// Expected call sequence, repeated for each term:
/// `new_term` → `write_doc`* → `close_term`.
pub struct PostingsSerializer {
    // Last doc id of the most recently bit-packed block of the current term
    // (0 at the start of a term). Doc ids are delta-encoded relative to it.
    last_doc_id_encoded: u32,

    block_encoder: BlockEncoder,
    block: Box<Block>,

    // Encoded postings of the current term, flushed in `close_term`.
    postings_write: Vec<u8>,
    // Skip entries of the current term, one per bit-packed block.
    skip_write: SkipSerializer,

    mode: IndexRecordOption,
    fieldnorm_reader: Option<FieldNormReader>,

    // Only set when block-wand information can be computed for the current term.
    bm25_weight: Option<Bm25Weight>,
    avg_fieldnorm: Score, /* Average number of term in the field for that segment.
                           * this value is used to compute the block wand information. */
    // Whether term frequencies are recorded for the current term.
    term_has_freq: bool,
}

impl PostingsSerializer {
    /// Creates a new `PostingsSerializer`.
    /// * avg_fieldnorm - average field norm for the field being serialized.
    /// * mode - indexing options for the field being serialized.
    /// * fieldnorm_reader - fieldnorms of the segment; required to compute the block-wand
    ///   information.
    pub fn new(
        avg_fieldnorm: Score,
        mode: IndexRecordOption,
        fieldnorm_reader: Option<FieldNormReader>,
    ) -> PostingsSerializer {
        PostingsSerializer {
            block_encoder: BlockEncoder::new(),
            block: Box::new(Block::new()),

            postings_write: Vec::new(),
            skip_write: SkipSerializer::new(),

            last_doc_id_encoded: 0u32,
            mode,

            fieldnorm_reader,
            bm25_weight: None,
            avg_fieldnorm,
            term_has_freq: false,
        }
    }

    /// Starts the serialization for a new term.
    /// * term_doc_freq - the number of documents containing the term.
    /// * record_term_freq - whether term frequencies should be recorded for this term. It is
    ///   only honored if the field's `mode` records frequencies.
    ///
    /// All per-term state is reset here, so that the public
    /// `new_term` / `write_doc` / `close_term` cycle is self-contained:
    /// without this reset, a serializer reused for a second term would
    /// delta-encode its first block against the last doc id of the previous term.
    pub fn new_term(&mut self, term_doc_freq: u32, record_term_freq: bool) {
        self.clear();

        self.term_has_freq = self.mode.has_freq() && record_term_freq;
        if !self.term_has_freq {
            return;
        }

        // Block-wand information requires fieldnorms and a non-empty segment.
        let num_docs_in_segment: u64 =
            if let Some(fieldnorm_reader) = self.fieldnorm_reader.as_ref() {
                fieldnorm_reader.num_docs() as u64
            } else {
                return;
            };

        if num_docs_in_segment == 0 {
            return;
        }

        self.bm25_weight = Some(Bm25Weight::for_one_term_without_explain(
            term_doc_freq as u64,
            num_docs_in_segment,
            self.avg_fieldnorm,
        ));
    }

    /// Bit-packs the (full) current block into the postings buffer and
    /// appends the matching entry to the skip data.
    fn write_block(&mut self) {
        {
            // encode the doc ids
            let (num_bits, block_encoded): (u8, &[u8]) = self
                .block_encoder
                .compress_block_sorted(self.block.doc_ids(), self.last_doc_id_encoded);
            self.last_doc_id_encoded = self.block.last_doc();
            self.skip_write
                .write_doc(self.last_doc_id_encoded, num_bits);
            // last el block 0, offset block 1,
            self.postings_write.extend(block_encoded);
        }
        if self.term_has_freq {
            // encode the term frequencies
            let (num_bits, block_encoded): (u8, &[u8]) = self
                .block_encoder
                .compress_block_unsorted(self.block.term_freqs(), true);
            self.postings_write.extend(block_encoded);
            self.skip_write.write_term_freq(num_bits);
            if self.mode.has_positions() {
                // We serialize the sum of term freqs within the skip information
                // in order to navigate through positions.
                let sum_freq = self.block.term_freqs().iter().copied().sum();
                self.skip_write.write_total_term_freq(sum_freq);
            }
            // `(fieldnorm_id, term_freq)` of the document with the highest
            // tf factor in the block; `(0, 0)` when it cannot be computed.
            let mut blockwand_params = (0u8, 0u32);
            if let Some(bm25_weight) = self.bm25_weight.as_ref() {
                if let Some(fieldnorm_reader) = self.fieldnorm_reader.as_ref() {
                    let docs = self.block.doc_ids().iter().copied();
                    let term_freqs = self.block.term_freqs().iter().copied();
                    let fieldnorms = docs.map(|doc| fieldnorm_reader.fieldnorm_id(doc));
                    blockwand_params = fieldnorms
                        .zip(term_freqs)
                        .max_by(
                            |(left_fieldnorm_id, left_term_freq),
                             (right_fieldnorm_id, right_term_freq)| {
                                let left_score =
                                    bm25_weight.tf_factor(*left_fieldnorm_id, *left_term_freq);
                                let right_score =
                                    bm25_weight.tf_factor(*right_fieldnorm_id, *right_term_freq);
                                left_score
                                    .partial_cmp(&right_score)
                                    .unwrap_or(Ordering::Equal)
                            },
                        )
                        // `write_block` is only called on a full, hence non-empty, block.
                        .unwrap();
                }
            }
            let (fieldnorm_id, term_freq) = blockwand_params;
            self.skip_write.write_blockwand_max(fieldnorm_id, term_freq);
        }
        self.block.clear();
    }

    /// Register that the given document contains the current term.
    /// * doc_id - the document id.
    /// * term_freq - the term frequency within the document.
    pub fn write_doc(&mut self, doc_id: DocId, term_freq: u32) {
        self.block.append_doc(doc_id, term_freq);
        if self.block.is_full() {
            self.write_block();
        }
    }

    /// Finish the serialization for this term and writes it to `output_write`.
    /// * doc_freq - the number of documents that were written for this term.
    ///
    /// The skip data (prefixed by its length as a `VInt`) is only emitted
    /// when the term has at least one full block.
    pub fn close_term(
        &mut self,
        doc_freq: u32,
        output_write: &mut impl std::io::Write,
    ) -> io::Result<()> {
        if !self.block.is_empty() {
            // we have doc ids waiting to be written
            // this happens when the number of doc ids is
            // not a perfect multiple of our block size.
            //
            // In that case, the remaining part is encoded
            // using variable int encoding.
            {
                let block_encoded = self
                    .block_encoder
                    .compress_vint_sorted(self.block.doc_ids(), self.last_doc_id_encoded);
                self.postings_write.write_all(block_encoded)?;
            }
            // ... Idem for term frequencies
            if self.term_has_freq {
                let block_encoded = self
                    .block_encoder
                    .compress_vint_unsorted(self.block.term_freqs());
                self.postings_write.write_all(block_encoded)?;
            }
            self.block.clear();
        }
        if doc_freq >= COMPRESSION_BLOCK_SIZE as u32 {
            let skip_data = self.skip_write.data();
            VInt(skip_data.len() as u64).serialize(output_write)?;
            output_write.write_all(skip_data)?;
        }
        output_write.write_all(&self.postings_write[..])?;
        self.skip_write.clear();
        self.postings_write.clear();
        self.bm25_weight = None;
        Ok(())
    }

    /// Resets all of the per-term state: the pending block, the delta-encoding
    /// base, the in-memory skip/postings buffers and the BM25 weight.
    ///
    /// The buffers are normally already empty at this point; they are cleared
    /// anyway so that a term aborted by an I/O error in `close_term` cannot
    /// leak into the next one.
    fn clear(&mut self) {
        self.block.clear();
        self.last_doc_id_encoded = 0;
        self.skip_write.clear();
        self.postings_write.clear();
        self.bm25_weight = None;
    }
}


================================================
FILE: src/postings/skip.rs
================================================
use crate::directory::OwnedBytes;
use crate::postings::compression::{compressed_block_size, COMPRESSION_BLOCK_SIZE};
use crate::query::Bm25Weight;
use crate::schema::IndexRecordOption;
use crate::{DocId, Score, TERMINATED};

// The doc bitwidth is stored in a single byte, laid out as follows
// (most significant bit first):
//
//   0b a b c defgh
//      |1|2|3|  4  |
//
// - 1 (bit 7): unused
// - 2 (bit 6): delta-1 flag. 0 if the block is not delta-1 encoded, 1 if it is.
// - 3 (bit 5): unused
// - 4 (bits 0..=4): a 5 bit number in 0..32, the actual bitwidth. Bitpacking could in theory
//   say this is 32 (requiring a 6th bit), but the biggest doc_id we can want to encode is
//   TERMINATED-1, which can be represented on 31b without delta encoding.
//
// Panics if `bitwidth` is 32 or more.
fn encode_bitwidth(bitwidth: u8, delta_1: bool) -> u8 {
    assert!(
        bitwidth < 32,
        "bitwidth needs to be less than 32, but got {}",
        bitwidth
    );
    let delta_1_flag = u8::from(delta_1) << 6;
    delta_1_flag | bitwidth
}

// Inverse of `encode_bitwidth`: returns `(bitwidth, delta_1)`.
// The unused bits (5 and 7) are ignored.
fn decode_bitwidth(raw_bitwidth: u8) -> (u8, bool) {
    const BITWIDTH_MASK: u8 = 0b0001_1111;
    const DELTA_1_MASK: u8 = 0b0100_0000;
    (
        raw_bitwidth & BITWIDTH_MASK,
        (raw_bitwidth & DELTA_1_MASK) != 0,
    )
}

// Encodes the block-wand max term frequency on one byte,
// saturating at `u8::MAX` for values that do not fit.
#[inline]
fn encode_block_wand_max_tf(max_tf: u32) -> u8 {
    u8::try_from(max_tf).unwrap_or(u8::MAX)
}

// Decodes a block-wand max term frequency code. The saturated code
// `u8::MAX` stands for "255 or more" and is decoded as `u32::MAX`.
#[inline]
fn decode_block_wand_max_tf(max_tf_code: u8) -> u32 {
    match max_tf_code {
        u8::MAX => u32::MAX,
        exact_tf => u32::from(exact_tf),
    }
}

// Reads a little-endian `u32` from the first 4 bytes of `data`.
// Panics if `data` holds fewer than 4 bytes.
#[inline]
fn read_u32(data: &[u8]) -> u32 {
    let mut le_bytes = [0u8; 4];
    le_bytes.copy_from_slice(&data[..4]);
    u32::from_le_bytes(le_bytes)
}

// Appends `val` to `buf` as 4 little-endian bytes.
#[inline]
fn write_u32(val: u32, buf: &mut Vec<u8>) {
    buf.extend(val.to_le_bytes());
}

/// Accumulates, in memory, the skip data of one posting list.
///
/// For each bit-packed block, the caller appends the pieces of a skip entry
/// through `write_doc`, then (depending on the indexing options)
/// `write_term_freq`, `write_total_term_freq` and `write_blockwand_max`.
pub struct SkipSerializer {
    buffer: Vec<u8>,
}

impl SkipSerializer {
    /// Creates a serializer with an empty buffer.
    pub fn new() -> SkipSerializer {
        SkipSerializer { buffer: Vec::new() }
    }

    /// Appends the last doc id of the block (4 little-endian bytes) followed
    /// by the doc bitwidth byte, flagged as delta-1 encoded.
    ///
    /// Panics if `doc_num_bits` is 32 or more.
    pub fn write_doc(&mut self, last_doc: DocId, doc_num_bits: u8) {
        write_u32(last_doc, &mut self.buffer);
        let bitwidth_code = encode_bitwidth(doc_num_bits, true);
        self.buffer.push(bitwidth_code);
    }

    /// Appends the bitwidth used for the term frequencies of the block.
    pub fn write_term_freq(&mut self, tf_num_bits: u8) {
        self.buffer.push(tf_num_bits);
    }

    /// Appends the sum of the term frequencies of the block (4 little-endian bytes).
    pub fn write_total_term_freq(&mut self, tf_sum: u32) {
        write_u32(tf_sum, &mut self.buffer);
    }

    /// Appends the block-wand information: the fieldnorm id, then the term
    /// frequency saturated to one byte.
    pub fn write_blockwand_max(&mut self, fieldnorm_id: u8, term_freq: u32) {
        self.buffer.push(fieldnorm_id);
        self.buffer.push(encode_block_wand_max_tf(term_freq));
    }

    /// The bytes accumulated so far.
    pub fn data(&self) -> &[u8] {
        self.buffer.as_slice()
    }

    /// Empties the buffer, so the serializer can be reused for another posting list.
    pub fn clear(&mut self) {
        self.buffer.clear();
    }
}

/// Cursor over the skip data of a posting list.
///
/// It exposes, for the current block, its last doc id and its `BlockInfo`,
/// and keeps track of the offsets accumulated while advancing from block to block.
#[derive(Clone)]
pub(crate) struct SkipReader {
    /// Last doc id of the current block, or `TERMINATED` when the current
    /// block is the trailing VInt block.
    last_doc_in_block: DocId,
    /// Last doc id of the block preceding the current one (0 for the first block).
    pub(crate) last_doc_in_previous_block: DocId,
    /// Remaining skip data; advanced every time a skip entry is read.
    owned_read: OwnedBytes,
    /// Indexing options; they determine the layout of a skip entry.
    skip_info: IndexRecordOption,
    /// Sum of the compressed sizes of the blocks skipped so far.
    /// Set to `usize::MAX` once the VInt block has been passed.
    byte_offset: usize,
    /// Number of docs remaining, including the documents in the current block.
    remaining_docs: u32,
    /// Information about the current block.
    block_info: BlockInfo,

    /// Sum of the `tf_sum` of the blocks skipped so far.
    position_offset: u64,
}

/// Describes how the current block of a posting list is encoded.
#[derive(Clone, Eq, PartialEq, Copy, Debug)]
pub(crate) enum BlockInfo {
    /// A full, bit-packed block, described by an entry of the skip data.
    BitPacked {
        /// Bitwidth of the doc ids.
        doc_num_bits: u8,
        /// Value of the delta-1 flag stored alongside the doc bitwidth.
        strict_delta_encoded: bool,
        /// Bitwidth of the term frequencies (0 if they are not recorded).
        tf_num_bits: u8,
        /// Sum of the term frequencies in the block (0 if it is not recorded).
        tf_sum: u32,
        /// Fieldnorm id used to compute the block max score.
        block_wand_fieldnorm_id: u8,
        /// Term frequency used to compute the block max score.
        block_wand_term_freq: u32,
    },
    /// The trailing, incomplete block, which is VInt encoded.
    VInt {
        /// Number of documents in the block.
        num_docs: u32,
    },
}

impl Default for BlockInfo {
    /// An empty VInt block.
    fn default() -> Self {
        Self::VInt { num_docs: 0 }
    }
}

impl SkipReader {
    pub fn new(data: OwnedBytes, doc_freq: u32, skip_info: IndexRecordOption) -> SkipReader {
        let mut skip_reader = SkipReader {
            last_doc_in_block: if doc_freq >= COMPRESSION_BLOCK_SIZE as u32 {
                0
            } else {
                TERMINATED
            },
            last_doc_in_previous_block: 0u32,
            owned_read: data,
            skip_info,
            block_info: BlockInfo::VInt { num_docs: doc_freq },
            byte_offset: 0,
            remaining_docs: doc_freq,
            position_offset: 0u64,
        };
        if doc_freq >= COMPRESSION_BLOCK_SIZE as u32 {
            skip_reader.read_block_info();
        }
        skip_reader
    }

    pub fn reset(&mut self, data: OwnedBytes, doc_freq: u32) {
        self.last_doc_in_block = if doc_freq >= COMPRESSION_BLOCK_SIZE as u32 {
            0
        } else {
            TERMINATED
        };
        self.last_doc_in_previous_block = 0u32;
        self.owned_read = data;
        self.block_info = BlockInfo::VInt { num_docs: doc_freq };
        self.byte_offset = 0;
        self.remaining_docs = doc_freq;
        self.position_offset = 0u64;
        if doc_freq >= COMPRESSION_BLOCK_SIZE as u32 {
            self.read_block_info();
        }
    }

    // Returns the block max score for this block if available.
    //
    // The block max score is available for all full bitpacked block,
    // but no available for the last VInt encoded incomplete block.
    pub fn block_max_score(&self, bm25_weight: &Bm25Weight) -> Option<Score> {
        match self.block_info {
            BlockInfo::BitPacked {
                block_wand_fieldnorm_id,
                block_wand_term_freq,
                ..
            } => Some(bm25_weight.score(block_wand_fieldnorm_id, block_wand_term_freq)),
            BlockInfo::VInt { .. } => None,
        }
    }

    pub(crate) fn last_doc_in_block(&self) -> DocId {
        self.last_doc_in_block
    }

    pub fn position_offset(&self) -> u64 {
        self.position_offset
    }

    #[inline]
    pub fn byte_offset(&self) -> usize {
        self.byte_offset
    }

    fn read_block_info(&mut self) {
        let bytes = self.owned_read.as_slice();
        let advance_len: usize;
        self.last_doc_in_block = read_u32(bytes);
        let (doc_num_bits, strict_delta_encoded) = decode_bitwidth(bytes[4]);
        match self.skip_info {
            IndexRecordOption::Basic => {
                advance_len = 5;
                self.block_info = BlockInfo::BitPacked {
                    doc_num_bits,
                    strict_delta_encoded,
                    tf_num_bits: 0,
                    tf_sum: 0,
                    block_wand_fieldnorm_id: 0,
                    block_wand_term_freq: 0,
                };
            }
            IndexRecordOption::WithFreqs => {
                let tf_num_bits = bytes[5];
                let block_wand_fieldnorm_id = bytes[6];
                let block_wand_term_freq = decode_block_wand_max_tf(bytes[7]);
                advance_len = 8;
                self.block_info = BlockInfo::BitPacked {
                    doc_num_bits,
                    strict_delta_encoded,
                    tf_num_bits,
                    tf_sum: 0,
                    block_wand_fieldnorm_id,
                    block_wand_term_freq,
                };
            }
            IndexRecordOption::WithFreqsAndPositions => {
                let tf_num_bits = bytes[5];
                let tf_sum = read_u32(&bytes[6..10]);
                let block_wand_fieldnorm_id = bytes[10];
                let block_wand_term_freq = decode_block_wand_max_tf(bytes[11]);
                advance_len = 12;
                self.block_info = BlockInfo::BitPacked {
                    doc_num_bits,
                    strict_delta_encoded,
                    tf_num_bits,
                    tf_sum,
                    block_wand_fieldnorm_id,
                    block_wand_term_freq,
                };
            }
        }
        self.owned_read.advance(advance_len);
    }

    pub fn block_info(&self) -> BlockInfo {
        self.block_info
    }

    /// Advance the skip reader to the block that may contain the target.
    ///
    /// If the target is larger than all documents, the skip_reader
    /// then advance to the last Variable In block.
    pub fn seek(&mut self, target: DocId) -> bool {
        if self.last_doc_in_block() >= target {
            return false;
        }
        loop {
            self.advance();
            if self.last_doc_in_block() >= target {
                return true;
            }
        }
    }

    pub fn advance(&mut self) {
        match self.block_info {
            BlockInfo::BitPacked {
                doc_num_bits,
                tf_num_bits,
                tf_sum,
                ..
            } => {
                self.remaining_docs -= COMPRESSION_BLOCK_SIZE as u32;
                self.byte_offset += compressed_block_size(doc_num_bits + tf_num_bits);
                self.position_offset += tf_sum as u64;
            }
            BlockInfo::VInt { num_docs } => {
                debug_assert_eq!(num_docs, self.remaining_docs);
                self.remaining_docs = 0;
                self.byte_offset = usize::MAX;
            }
        }
        self.last_doc_in_previous_block = self.last_doc_in_block;
        if self.remaining_docs >= COMPRESSION_BLOCK_SIZE as u32 {
            self.read_block_info();
        } else {
            self.last_doc_in_block = TERMINATED;
            self.block_info = BlockInfo::VInt {
                num_docs: self.remaining_docs,
            };
        }
    }
}

#[cfg(test)]
mod tests {

    use super::{
        decode_bitwidth, encode_bitwidth, BlockInfo, IndexRecordOption, SkipReader, SkipSerializer,
    };
    use crate::directory::OwnedBytes;
    use crate::postings::compression::COMPRESSION_BLOCK_SIZE;

    // Values below 255 are encoded as is; anything else saturates to 255.
    #[test]
    fn test_encode_block_wand_max_tf() {
        for tf in 0..255 {
            assert_eq!(super::encode_block_wand_max_tf(tf), tf as u8);
        }
        for &tf in &[255, 256, 1_000_000, u32::MAX] {
            assert_eq!(super::encode_block_wand_max_tf(tf), 255);
        }
    }

    // Codes below 255 are decoded as is; the saturated code 255 decodes to `u32::MAX`.
    #[test]
    fn test_decode_block_wand_max_tf() {
        for tf in 0..255 {
            assert_eq!(super::decode_block_wand_max_tf(tf), tf as u32);
        }
        assert_eq!(super::decode_block_wand_max_tf(255), u32::MAX);
    }

    // Two full blocks with term frequencies, followed by a VInt block of 3 docs.
    #[test]
    fn test_skip_with_freq() {
        let buf = {
            let mut skip_serializer = SkipSerializer::new();
            skip_serializer.write_doc(1u32, 2u8);
            skip_serializer.write_term_freq(3u8);
            skip_serializer.write_blockwand_max(13u8, 3u32);
            skip_serializer.write_doc(5u32, 5u8);
            skip_serializer.write_term_freq(2u8);
            skip_serializer.write_blockwand_max(8u8, 2u32);
            skip_serializer.data().to_owned()
        };
        let doc_freq = 3u32 + (COMPRESSION_BLOCK_SIZE * 2) as u32;
        let mut skip_reader =
            SkipReader::new(OwnedBytes::new(buf), doc_freq, IndexRecordOption::WithFreqs);
        assert_eq!(skip_reader.last_doc_in_block(), 1u32);
        assert_eq!(
            skip_reader.block_info,
            BlockInfo::BitPacked {
                doc_num_bits: 2u8,
                strict_delta_encoded: true,
                tf_num_bits: 3u8,
                tf_sum: 0,
                block_wand_fieldnorm_id: 13,
                block_wand_term_freq: 3
            }
        );
        skip_reader.advance();
        assert_eq!(skip_reader.last_doc_in_block(), 5u32);
        assert_eq!(
            skip_reader.block_info(),
            BlockInfo::BitPacked {
                doc_num_bits: 5u8,
                strict_delta_encoded: true,
                tf_num_bits: 2u8,
                tf_sum: 0,
                block_wand_fieldnorm_id: 8,
                block_wand_term_freq: 2
            }
        );
        skip_reader.advance();
        assert_eq!(skip_reader.block_info(), BlockInfo::VInt { num_docs: 3u32 });
        // Advancing past the VInt block leaves the reader on an empty VInt block.
        skip_reader.advance();
        assert_eq!(skip_reader.block_info(), BlockInfo::VInt { num_docs: 0u32 });
        skip_reader.advance();
        assert_eq!(skip_reader.block_info(), BlockInfo::VInt { num_docs: 0u32 });
    }

    // Same scenario as above, without term frequencies: skip entries only hold
    // the last doc and the doc bitwidth.
    #[test]
    fn test_skip_no_freq() {
        let buf = {
            let mut skip_serializer = SkipSerializer::new();
            skip_serializer.write_doc(1u32, 2u8);
            skip_serializer.write_doc(5u32, 5u8);
            skip_serializer.data().to_owned()
        };
        let doc_freq = 3u32 + (COMPRESSION_BLOCK_SIZE * 2) as u32;
        let mut skip_reader =
            SkipReader::new(OwnedBytes::new(buf), doc_freq, IndexRecordOption::Basic);
        assert_eq!(skip_reader.last_doc_in_block(), 1u32);
        assert_eq!(
            skip_reader.block_info(),
            BlockInfo::BitPacked {
                doc_num_bits: 2u8,
                strict_delta_encoded: true,
                tf_num_bits: 0,
                tf_sum: 0u32,
                block_wand_fieldnorm_id: 0,
                block_wand_term_freq: 0
            }
        );
        skip_reader.advance();
        assert_eq!(skip_reader.last_doc_in_block(), 5u32);
        assert_eq!(
            skip_reader.block_info(),
            BlockInfo::BitPacked {
                doc_num_bits: 5u8,
                strict_delta_encoded: true,
                tf_num_bits: 0,
                tf_sum: 0u32,
                block_wand_fieldnorm_id: 0,
                block_wand_term_freq: 0
            }
        );
        skip_reader.advance();
        assert_eq!(skip_reader.block_info(), BlockInfo::VInt { num_docs: 3u32 });
        skip_reader.advance();
        assert_eq!(skip_reader.block_info(), BlockInfo::VInt { num_docs: 0u32 });
        skip_reader.advance();
        assert_eq!(skip_reader.block_info(), BlockInfo::VInt { num_docs: 0u32 });
    }

    // When the doc freq is an exact multiple of the block size, the trailing
    // VInt block is empty.
    #[test]
    fn test_skip_multiple_of_block_size() {
        let buf = {
            let mut skip_serializer = SkipSerializer::new();
            skip_serializer.write_doc(1u32, 2u8);
            skip_serializer.data().to_owned()
        };
        let doc_freq = COMPRESSION_BLOCK_SIZE as u32;
        let mut skip_reader =
            SkipReader::new(OwnedBytes::new(buf), doc_freq, IndexRecordOption::Basic);
        assert_eq!(skip_reader.last_doc_in_block(), 1u32);
        assert_eq!(
            skip_reader.block_info(),
            BlockInfo::BitPacked {
                doc_num_bits: 2u8,
                strict_delta_encoded: true,
                tf_num_bits: 0,
                tf_sum: 0u32,
                block_wand_fieldnorm_id: 0,
                block_wand_term_freq: 0
            }
        );
        skip_reader.advance();
        assert_eq!(skip_reader.block_info(), BlockInfo::VInt { num_docs: 0u32 });
    }

    // Round-trips every valid bitwidth with both values of the delta-1 flag,
    // and pins the exact bit layout.
    #[test]
    fn test_encode_decode_bitwidth() {
        for bitwidth in 0..32 {
            for delta_1 in [false, true] {
                assert_eq!(
                    (bitwidth, delta_1),
                    decode_bitwidth(encode_bitwidth(bitwidth, delta_1))
                );
            }
        }
        assert_eq!(0b01000010, encode_bitwidth(0b10, true));
        assert_eq!(0b00000010, encode_bitwidth(0b10, false));
    }
}


================================================
FILE: src/postings/term_info.rs
================================================
use std::io;
use std::ops::Range;

use common::{BinarySerializable, FixedSize};

/// `TermInfo` holds the metadata associated with a term.
/// It is segment-local.
#[derive(Debug, Default, Eq, PartialEq, Clone)]
pub struct TermInfo {
    /// Number of documents in the segment containing the term
    pub doc_freq: u32,
    /// Byte range of the posting list within the postings (`.idx`) file.
    pub postings_range: Range<usize>,
    /// Byte range of the positions of this term in the positions (`.pos`) file.
    pub positions_range: Range<usize>,
}

impl TermInfo {
    /// Length of `range`, as a `u32`.
    ///
    /// Panics if the length does not fit in a `u32`.
    fn range_num_bytes(range: &Range<usize>) -> u32 {
        let num_bytes = range.len();
        assert!(num_bytes <= u32::MAX as usize);
        num_bytes as u32
    }

    /// Number of bytes of the posting list.
    pub(crate) fn posting_num_bytes(&self) -> u32 {
        Self::range_num_bytes(&self.postings_range)
    }

    /// Number of bytes of the positions.
    pub(crate) fn positions_num_bytes(&self) -> u32 {
        Self::range_num_bytes(&self.positions_range)
    }
}

impl FixedSize for TermInfo {
    /// Size required for the binary serialization of a `TermInfo` object.
    /// This is large, but in practice, `TermInfo` are encoded in blocks and
    /// only the first `TermInfo` of a block is serialized uncompressed.
    /// The subsequent `TermInfo` are delta encoded and bitpacked.
    ///
    /// The terms of the sum follow the serialization order.
    const SIZE_IN_BYTES: usize = u32::SIZE_IN_BYTES // doc_freq
        + u64::SIZE_IN_BYTES // postings start offset
        + u32::SIZE_IN_BYTES // postings number of bytes
        + u64::SIZE_IN_BYTES // positions start offset
        + u32::SIZE_IN_BYTES; // positions number of bytes
}

impl BinarySerializable for TermInfo {
    fn serialize<W: io::Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        self.doc_freq.serialize(writer)?;
        (self.postings_range.start as u64).serialize(writer)?;
        self.posting_num_bytes().serialize(writer)?;
        (self.positions_range.start as u64).serialize(writer)?;
        self.positions_num_bytes().serialize(writer)?;
        Ok(())
    }

    fn deserialize<R: io::Read>(reader: &mut R) -> io::Result<Self> {
        let doc_freq = u32::deserialize(reader)?;
        let postings_start_offset = u64::deserialize(reader)? as usize;
        let postings_num_bytes = u32::deserialize(reader)? as usize;
        let postings_end_offset = postings_start_offset + postings_num_bytes;
        let positions_start_offset = u64::deserialize(reader)? as usize;
        let positions_num_bytes = u32::deserialize(reader)? as usize;
        let positions_end_offset = positions_start_offset + positions_num_bytes;
        Ok(TermInfo {
            doc_freq,
            postings_range: postings_start_offset..postings_end_offset,
            positions_range: positions_start_offset..positions_end_offset,
        })
    }
}

#[cfg(test)]
mod tests {

    use common::BinarySerializable;

    use super::TermInfo;
    use crate::tests::fixed_size_test;

    #[test]
    fn test_fixed_size() {
        fixed_size_test::<TermInfo>();
    }

    /// A `TermInfo` with non-trivial ranges must come back unchanged after
    /// serialization, and deserialization must consume exactly what was written.
    #[test]
    fn test_serialize_deserialize_roundtrip() -> std::io::Result<()> {
        let term_info = TermInfo {
            doc_freq: 7,
            postings_range: 10..25,
            positions_range: 1_000..1_064,
        };
        let mut buffer: Vec<u8> = Vec::new();
        term_info.serialize(&mut buffer)?;
        let mut remaining: &[u8] = &buffer;
        let deserialized = TermInfo::deserialize(&mut remaining)?;
        assert_eq!(deserialized, term_info);
        assert!(remaining.is_empty());
        Ok(())
    }
}


================================================
FILE: src/query/all_query.rs
================================================
use crate::docset::{DocSet, COLLECT_BLOCK_BUFFER_LEN, TERMINATED};
use crate::index::SegmentReader;
use crate::query::boost_query::BoostScorer;
use crate::query::explanation::does_not_match;
use crate::query::{EnableScoring, Explanation, Query, Scorer, Weight};
use crate::{DocId, Score};

/// Query that matches all of the documents.
///
/// All of the documents get the score 1.0.
#[derive(Clone, Debug)]
pub struct AllQuery;

impl Query for AllQuery {
    /// Builds the weight for this query. The scoring configuration is not used.
    fn weight(&self, _enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let weight: Box<dyn Weight> = Box::new(AllWeight);
        Ok(weight)
    }
}

/// Weight associated with the `AllQuery` query.
pub struct AllWeight;

impl Weight for AllWeight {
    /// Returns a scorer over every doc id below `reader.max_doc()`.
    ///
    /// The scorer is wrapped in a `BoostScorer` unless `boost` is exactly `1.0`.
    fn scorer(&self, reader: &SegmentReader, boost: Score) -> crate::Result<Box<dyn Scorer>> {
        let all_scorer = AllScorer::new(reader.max_doc());
        let scorer: Box<dyn Scorer> = if boost == 1.0 {
            Box::new(all_scorer)
        } else {
            Box::new(BoostScorer::new(all_scorer, boost))
        };
        Ok(scorer)
    }

    /// Explains the constant score of `doc`, or reports a non-match when `doc`
    /// is not below `reader.max_doc()`.
    fn explain(&self, reader: &SegmentReader, doc: DocId) -> crate::Result<Explanation> {
        if doc < reader.max_doc() {
            Ok(Explanation::new("AllQuery", 1.0))
        } else {
            Err(does_not_match(doc))
        }
    }
}

/// Scorer associated with the `AllQuery` query.
pub struct AllScorer {
    doc: DocId,
    max_doc: DocId,
}

impl AllScorer {
    /// Creates a new AllScorer with `max_doc` docs.
    pub fn new(max_doc: DocId) -> AllScorer {
        AllScorer { doc: 0u32, max_doc }
    }
}

impl DocSet for AllScorer {
    /// Moves to the next doc id, or to `TERMINATED` when it would reach `max_doc`.
    #[inline(always)]
    fn advance(&mut self) -> DocId {
        let next_doc = self.doc + 1;
        self.doc = if next_doc < self.max_doc {
            next_doc
        } else {
            TERMINATED
        };
        self.doc
    }

    /// Jumps directly to `target`, or to `TERMINATED` if `target` is not below `max_doc`.
    fn seek(&mut self, target: DocId) -> DocId {
        debug_assert!(target >= self.doc);
        self.doc = if target < self.max_doc {
            target
        } else {
            TERMINATED
        };
        self.doc
    }

    /// Writes consecutive doc ids, starting at the current one, into `buffer` and
    /// returns how many were written.
    fn fill_buffer(&mut self, buffer: &mut [DocId; COLLECT_BLOCK_BUFFER_LEN]) -> usize {
        let first_doc = self.doc;
        if first_doc == TERMINATED {
            return 0;
        }
        let block_len = buffer.len();
        if first_doc + (block_len as u32) < self.max_doc {
            // The whole block fits below `max_doc`: no termination check is needed per doc.
            for (slot, doc) in buffer.iter_mut().zip(first_doc..) {
                *slot = doc;
            }
            self.doc = first_doc + block_len as u32;
            return block_len;
        }
        // Close to the end: go one doc at a time and stop as soon as we terminate.
        for (num_filled, slot) in buffer.iter_mut().enumerate() {
            *slot = self.doc;
            if self.advance() == TERMINATED {
                return num_filled + 1;
            }
        }
        block_len
    }

    /// Returns the current document.
    #[inline(always)]
    fn doc(&self) -> DocId {
        self.doc
    }

    /// Returns `max_doc`.
    fn size_hint(&self) -> u32 {
        self.max_doc
    }
}

impl Scorer for AllScorer {
    /// Every document gets the same constant score.
    #[inline]
    fn score(&mut self) -> Score {
        const MATCH_ALL_SCORE: Score = 1.0;
        MATCH_ALL_SCORE
    }
}

#[cfg(test)]
mod tests {
    use super::AllQuery;
    use crate::docset::{DocSet, COLLECT_BLOCK_BUFFER_LEN, TERMINATED};
    use crate::query::{AllScorer, EnableScoring, Query};
    use crate::schema::{Schema, TEXT};
    use crate::{Index, IndexWriter};

    /// Builds an in-RAM index with two commits: two documents in the first
    /// and one document in the second.
    fn create_test_index() -> crate::Result<Index> {
        let mut schema_builder = Schema::builder();
        let field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        // First commit.
        index_writer.add_document(doc!(field=>"aaa"))?;
        index_writer.add_document(doc!(field=>"bbb"))?;
        index_writer.commit()?;
        // Second commit.
        index_writer.add_document(doc!(field=>"ccc"))?;
        index_writer.commit()?;
        Ok(index)
    }

    #[test]
    fn test_all_query() -> crate::Result<()> {
        let index = create_test_index()?;
        let index_reader = index.reader()?;
        let searcher = index_reader.searcher();
        let weight = AllQuery.weight(EnableScoring::disabled_from_schema(&index.schema()))?;
        // (segment ordinal, number of docs expected in that segment)
        for (segment_ord, num_docs) in [(0u32, 2u32), (1u32, 1u32)] {
            let segment_reader = searcher.segment_reader(segment_ord);
            let mut scorer = weight.scorer(segment_reader, 1.0)?;
            for expected_doc in 0..num_docs {
                assert_eq!(scorer.doc(), expected_doc);
                if expected_doc + 1 < num_docs {
                    assert_eq!(scorer.advance(), expected_doc + 1);
                }
            }
            assert_eq!(scorer.advance(), TERMINATED);
        }
        Ok(())
    }

    #[test]
    fn test_all_query_with_boost() -> crate::Result<()> {
        let index = create_test_index()?;
        let index_reader = index.reader()?;
        let searcher = index_reader.searcher();
        let weight = AllQuery.weight(EnableScoring::disabled_from_schema(searcher.schema()))?;
        let segment_reader = searcher.segment_reader(0);
        // The score of the first document must be exactly the boost.
        for boost in [2.0, 1.5] {
            let mut scorer = weight.scorer(segment_reader, boost)?;
            assert_eq!(scorer.doc(), 0u32);
            assert_eq!(scorer.score(), boost);
        }
        Ok(())
    }

    #[test]
    pub fn test_fill_buffer() {
        let block_len = COLLECT_BLOCK_BUFFER_LEN as u32;
        // Two full blocks followed by a partial block of 9 docs.
        let mut postings = AllScorer {
            doc: 0u32,
            max_doc: block_len * 2 + 9,
        };
        let mut buffer = [0u32; COLLECT_BLOCK_BUFFER_LEN];

        assert_eq!(postings.fill_buffer(&mut buffer), COLLECT_BLOCK_BUFFER_LEN);
        for (i, &doc) in buffer.iter().enumerate() {
            assert_eq!(doc, i as u32);
        }

        assert_eq!(postings.fill_buffer(&mut buffer), COLLECT_BLOCK_BUFFER_LEN);
        for (i, &doc) in buffer.iter().enumerate() {
            assert_eq!(doc, i as u32 + block_len);
        }

        assert_eq!(postings.fill_buffer(&mut buffer), 9);
    }
}


================================================
FILE: src/query/automaton_weight.rs
================================================
use std::io;
use std::sync::Arc;

use common::BitSet;
use tantivy_fst::Automaton;

use super::phrase_prefix_query::prefix_end;
use crate::index::SegmentReader;
use crate::postings::TermInfo;
use crate::query::{BitSetDocSet, ConstScorer, Explanation, Scorer, Weight};
use crate::schema::{Field, IndexRecordOption};
use crate::termdict::{TermDictionary, TermStreamer};
use crate::{DocId, Score, TantivyError};

/// A weight struct for Fuzzy Term and Regex Queries
pub struct AutomatonWeight<A> {
    field: Field,
    automaton: Arc<A>,
    // For JSON fields, the term dictionary include terms from all paths.
    // We apply additional filtering based on the given JSON path, when searching within the term
    // dictionary. This prevents terms from unrelated paths from matching the search criteria.
    json_path_bytes: Option<Box<[u8]>>,
}

impl<A> AutomatonWeight<A>
where
    A: Automaton + Send + Sync + 'static,
    A::State: Clone,
{
    /// Create a new `AutomatonWeight` without any JSON path restriction.
    pub fn new<IntoArcA: Into<Arc<A>>>(field: Field, automaton: IntoArcA) -> AutomatonWeight<A> {
        let automaton: Arc<A> = automaton.into();
        AutomatonWeight {
            field,
            automaton,
            json_path_bytes: None,
        }
    }

    /// Create a new `AutomatonWeight` for a json path.
    ///
    /// `json_path_bytes` is copied and later used to bound the term dictionary search.
    pub fn new_for_json_path<IntoArcA: Into<Arc<A>>>(
        field: Field,
        automaton: IntoArcA,
        json_path_bytes: &[u8],
    ) -> AutomatonWeight<A> {
        let owned_path: Box<[u8]> = Box::from(json_path_bytes);
        AutomatonWeight {
            field,
            automaton: automaton.into(),
            json_path_bytes: Some(owned_path),
        }
    }

    /// Streams the terms of `term_dict` accepted by the automaton.
    ///
    /// When a JSON path is set, the stream is restricted to terms greater than or equal to
    /// the path bytes and, if `prefix_end` yields an upper bound, strictly below that bound.
    fn automaton_stream<'a>(
        &'a self,
        term_dict: &'a TermDictionary,
    ) -> io::Result<TermStreamer<'a, &'a A>> {
        let automaton: &A = self.automaton.as_ref();
        let unbounded = term_dict.search(automaton);

        let bounded = match self.json_path_bytes.as_deref() {
            None => unbounded,
            Some(path) => {
                let lower_bounded = unbounded.ge(path);
                match prefix_end(path) {
                    Some(end) => lower_bounded.lt(&end),
                    None => lower_bounded,
                }
            }
        };

        bounded.into_stream()
    }

    /// Returns the term infos that match the automaton
    pub fn get_match_term_infos(&self, reader: &SegmentReader) -> crate::Result<Vec<TermInfo>> {
        let inverted_index = reader.inverted_index(self.field)?;
        let mut matching_terms = self.automaton_stream(inverted_index.terms())?;
        let mut term_infos = Vec::new();
        while matching_terms.advance() {
            let term_info = matching_terms.value();
            term_infos.push(term_info.clone());
        }
        Ok(term_infos)
    }
}

impl<A> Weight for AutomatonWeight<A>
where
    A: Automaton + Send + Sync + 'static,
    A::State: Clone,
{
    /// Collects the docs of every term accepted by the automaton into a bitset, and
    /// returns a scorer over that bitset that scores every doc with `boost`.
    fn scorer(&self, reader: &SegmentReader, boost: Score) -> crate::Result<Box<dyn Scorer>> {
        let mut matching_docs = BitSet::with_max_value(reader.max_doc());
        let inverted_index = reader.inverted_index(self.field)?;
        let mut matching_terms = self.automaton_stream(inverted_index.terms())?;
        while matching_terms.advance() {
            let mut block_postings = inverted_index
                .read_block_postings_from_terminfo(matching_terms.value(), IndexRecordOption::Basic)?;
            // An empty block marks the end of the posting list.
            let mut block_docs = block_postings.docs();
            while !block_docs.is_empty() {
                for &doc in block_docs {
                    matching_docs.insert(doc);
                }
                block_postings.advance();
                block_docs = block_postings.docs();
            }
        }
        let docset = BitSetDocSet::from(matching_docs);
        Ok(Box::new(ConstScorer::new(docset, boost)))
    }

    /// Explains the match of `doc`, or fails with an `InvalidArgument` error if the
    /// scorer does not land on `doc` when seeking to it.
    fn explain(&self, reader: &SegmentReader, doc: DocId) -> crate::Result<Explanation> {
        let mut scorer = self.scorer(reader, 1.0)?;
        if scorer.seek(doc) != doc {
            return Err(TantivyError::InvalidArgument(
                "Document does not exist".to_string(),
            ));
        }
        Ok(Explanation::new("AutomatonScorer", 1.0))
    }
}

#[cfg(test)]
mod tests {
    use tantivy_fst::Automaton;

    use super::AutomatonWeight;
    use crate::docset::TERMINATED;
    use crate::query::Weight;
    use crate::schema::{Schema, STRING};
    use crate::{Index, IndexWriter};

    /// Builds a single-commit index whose `title` values are "abc", "bcd" and "abcd".
    fn create_index() -> crate::Result<Index> {
        let mut schema_builder = Schema::builder();
        let title = schema_builder.add_text_field("title", STRING);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        index_writer.add_document(doc!(title=>"abc"))?;
        index_writer.add_document(doc!(title=>"bcd"))?;
        index_writer.add_document(doc!(title=>"abcd"))?;
        index_writer.commit()?;
        Ok(index)
    }

    #[derive(Clone, Copy)]
    enum State {
        Start,
        NotMatching,
        AfterA,
    }

    /// Automaton accepting every byte string that starts with `a`.
    struct PrefixedByA;

    impl Automaton for PrefixedByA {
        type State = State;

        fn start(&self) -> Self::State {
            State::Start
        }

        fn is_match(&self, state: &Self::State) -> bool {
            matches!(*state, State::AfterA)
        }

        fn accept(&self, state: &Self::State, byte: u8) -> Self::State {
            match (*state, byte) {
                // Only the very first byte decides; both other states are absorbing.
                (State::Start, b'a') | (State::AfterA, _) => State::AfterA,
                (State::Start, _) | (State::NotMatching, _) => State::NotMatching,
            }
        }
    }

    #[test]
    fn test_automaton_weight() -> crate::Result<()> {
        let index = create_index()?;
        let title = index.schema().get_field("title").unwrap();
        let weight = AutomatonWeight::new(title, PrefixedByA);
        let index_reader = index.reader()?;
        let searcher = index_reader.searcher();
        let mut scorer = weight.scorer(searcher.segment_reader(0u32), 1.0)?;
        // "abc" (doc 0) and "abcd" (doc 2) start with 'a'; "bcd" (doc 1) does not.
        assert_eq!(scorer.doc(), 0u32);
        assert_eq!(scorer.score(), 1.0);
        assert_eq!(scorer.advance(), 2u32);
        assert_eq!(scorer.doc(), 2u32);
        assert_eq!(scorer.score(), 1.0);
        assert_eq!(scorer.advance(), TERMINATED);
        Ok(())
    }

    #[test]
    fn test_automaton_weight_boost() -> crate::Result<()> {
        let index = create_index()?;
        let title = index.schema().get_field("title").unwrap();
        let weight = AutomatonWeight::new(title, PrefixedByA);
        let index_reader = index.reader()?;
        let searcher = index_reader.searcher();
        let mut scorer = weight.scorer(searcher.segment_reader(0u32), 1.32)?;
        assert_eq!(scorer.doc(), 0u32);
        assert_eq!(scorer.score(), 1.32);
        Ok(())
    }
}


================================================
FILE: src/query/bitset/mod.rs
================================================
use common::{BitSet, TinySet};

use crate::docset::{DocSet, TERMINATED};
use crate::DocId;

/// A `BitSetDocSet` makes it possible to iterate through a bitset as if it was a `DocSet`.
///
/// # Implementation detail
///
/// Skipping is relatively fast here as we can directly point to the
/// right tiny bitset bucket.
///
/// TODO: Consider implementing a `BitTreeSet` in order to advance faster
/// when the bitset is sparse
pub struct BitSetDocSet {
    docs: BitSet,
    // Index of the bucket (tiny bitset) the cursor currently sits in.
    cursor_bucket: u32,
    // Copy of the current bucket from which the docs already returned have been popped.
    cursor_tinybitset: TinySet,
    // Current document, or `TERMINATED`.
    doc: u32,
}

impl BitSetDocSet {
    /// Points the cursor at `bucket_addr` and reloads that bucket's tiny bitset in full.
    fn go_to_bucket(&mut self, bucket_addr: u32) {
        self.cursor_tinybitset = self.docs.tinyset(bucket_addr);
        self.cursor_bucket = bucket_addr;
    }
}

impl From<BitSet> for BitSetDocSet {
    /// Wraps `docs` and positions the doc set on its first document
    /// (or on `TERMINATED` when the bitset holds no value).
    fn from(docs: BitSet) -> BitSetDocSet {
        // A bitset with `max_value() == 0` is not asked for its first bucket.
        let cursor_tinybitset = match docs.max_value() {
            0 => TinySet::empty(),
            _ => docs.tinyset(0),
        };
        let mut docset = BitSetDocSet {
            docs,
            cursor_bucket: 0,
            cursor_tinybitset,
            doc: 0u32,
        };
        // Move onto the first set bit, if any.
        docset.advance();
        docset
    }
}

impl DocSet for BitSetDocSet {
    /// Moves to the next set bit, looking into the following non-empty bucket once the
    /// current one is exhausted. Returns `TERMINATED` when no bit is left.
    #[inline]
    fn advance(&mut self) -> DocId {
        let lower = match self.cursor_tinybitset.pop_lowest() {
            Some(lower) => lower,
            None => {
                let next_bucket = self.docs.first_non_empty_bucket(self.cursor_bucket + 1);
                match next_bucket {
                    Some(bucket) => {
                        self.go_to_bucket(bucket);
                        // The bucket was reported as non-empty, so it holds at least one bit.
                        self.cursor_tinybitset.pop_lowest().unwrap()
                    }
                    None => {
                        self.doc = TERMINATED;
                        return TERMINATED;
                    }
                }
            }
        };
        self.doc = (self.cursor_bucket * 64u32) | lower;
        self.doc
    }

    /// Moves to the first document greater than or equal to `target`.
    fn seek(&mut self, target: DocId) -> DocId {
        if target >= self.docs.max_value() {
            self.doc = TERMINATED;
            return TERMINATED;
        }
        let target_bucket = target / 64u32;
        if target_bucket <= self.cursor_bucket {
            // The target is in the current bucket (or behind us): step doc by doc.
            let mut doc = self.doc();
            while doc < target {
                doc = self.advance();
            }
            return doc;
        }
        // Jump straight to the target's bucket and mask out the bits below the target.
        self.go_to_bucket(target_bucket);
        let at_or_after_target: TinySet = TinySet::range_greater_or_equal(target);
        self.cursor_tinybitset = self.cursor_tinybitset.intersect(at_or_after_target);
        self.advance()
    }

    /// Returns the current document
    fn doc(&self) -> DocId {
        self.doc
    }

    /// Returns the number of values set in the underlying bitset.
    fn size_hint(&self) -> u32 {
        let num_docs = self.docs.len();
        num_docs as u32
    }
}

#[cfg(test)]
mod tests {
    use std::collections::BTreeSet;

    use common::BitSet;

    use super::BitSetDocSet;
    use crate::docset::{DocSet, TERMINATED};
    use crate::tests::generate_nonunique_unsorted;
    use crate::DocId;

    /// Builds a `BitSetDocSet` containing `docs`, backed by a bitset created
    /// with `max_doc` as its max value.
    fn create_docbitset(docs: &[DocId], max_doc: DocId) -> BitSetDocSet {
        let mut docset = BitSet::with_max_value(max_doc);
        for &doc in docs {
            docset.insert(doc);
        }
        BitSetDocSet::from(docset)
    }

    /// Compares a `BitSet` (and the doc set built from it) against a `BTreeSet`
    /// holding the same generated values.
    #[test]
    fn test_bitset_large() {
        let arr = generate_nonunique_unsorted(100_000, 5_000);
        let mut btreeset: BTreeSet<u32> = BTreeSet::new();
        let mut bitset = BitSet::with_max_value(100_000);
        for el in arr {
            btreeset.insert(el);
            bitset.insert(el);
        }
        // Membership and cardinality must agree with the reference set.
        for i in 0..100_000 {
            assert_eq!(btreeset.contains(&i), bitset.contains(i));
        }
        assert_eq!(btreeset.len(), bitset.len());
        let mut bitset_docset = BitSetDocSet::from(bitset);
        // Iterating the doc set must yield the reference set's elements in ascending order,
        // and terminate exactly after the last one.
        let mut remaining = true;
        for el in btreeset.into_iter() {
            assert!(remaining);
            assert_eq!(bitset_docset.doc(), el);
            remaining = bitset_docset.advance() != TERMINATED;
        }
        assert!(!remaining);
    }

    /// Advancing a doc set built from an empty bitset yields `TERMINATED`.
    #[test]
    fn test_empty() {
        let bitset = BitSet::with_max_value(1000);
        let mut empty = BitSetDocSet::from(bitset);
        assert_eq!(empty.advance(), TERMINATED)
    }

    /// Seeking to `TERMINATED` yields `TERMINATED`.
    #[test]
    fn test_seek_terminated() {
        let bitset = BitSet::with_max_value(1000);
        let mut empty = BitSetDocSet::from(bitset);
        assert_eq!(empty.seek(TERMINATED), TERMINATED)
    }

    /// Checks that advancing through a doc set built from `docs` visits exactly
    /// `docs`, in order. `docs` is expected to be sorted and without duplicates.
    fn test_go_through_sequential(docs: &[DocId]) {
        let mut docset = create_docbitset(docs, 1_000u32);
        for &doc in docs {
            assert_eq!(doc, docset.doc());
            docset.advance();
        }
        assert_eq!(docset.advance(), TERMINATED);
    }

    #[test]
    fn test_docbitset_sequential() {
        test_go_through_sequential(&[1, 2, 3]);
        // 63 / 64 straddle the boundary between the first two 64-bit buckets.
        test_go_through_sequential(&[1, 2, 3, 4, 5, 63, 64, 65]);
        test_go_through_sequential(&[63, 64, 65]);
        test_go_through_sequential(&[1, 2, 3, 4, 95, 96, 97, 98, 99]);
    }

    #[test]
    fn test_docbitset_skip() {
        {
            // Seek to a doc of the first bucket, then advance into a far-away bucket.
            let mut docset = create_docbitset(&[1, 5, 6, 7, 5112], 10_000);
            assert_eq!(docset.seek(7), 7);
            assert_eq!(docset.doc(), 7);
            assert_eq!(docset.advance(), 5112);
            assert_eq!(docset.doc(), 5112);
            assert_eq!(docset.advance(), TERMINATED);
        }
        {
            // Seeking to an absent doc lands on the next present one.
            let mut docset = create_docbitset(&[1, 5, 6, 7, 5112], 10_000);
            assert_eq!(docset.seek(3), 5);
            assert_eq!(docset.doc(), 5);
            assert_eq!(docset.advance(), 6);
        }
        {
            // Seek exactly onto the only doc.
            let mut docset = create_docbitset(&[5112], 10_000);
            assert_eq!(docset.seek(5112), 5112);
            assert_eq!(docset.doc(), 5112);
            assert_eq!(docset.advance(), TERMINATED);
        }
        {
            // Seek just past the only doc.
            let mut docset = create_docbitset(&[5112], 10_000);
            assert_eq!(docset.seek(5113), TERMINATED);
            assert_eq!(docset.advance(), TERMINATED);
        }
        {
            // Seek just before the only doc.
            let mut docset = create_docbitset(&[5112], 10_000);
            assert_eq!(docset.seek(5111), 5112);
            assert_eq!(docset.doc(), 5112);
            assert_eq!(docset.advance(), TERMINATED);
        }
        {
            // Seek onto a doc of a later bucket, then keep advancing across buckets.
            let mut docset = create_docbitset(&[1, 5, 6, 7, 5112, 5500, 6666], 10_000);
            assert_eq!(docset.seek(5112), 5112);
            assert_eq!(docset.doc(), 5112);
            assert_eq!(docset.advance(), 5500);
            assert_eq!(docset.doc(), 5500);
            assert_eq!(docset.advance(), 6666);
            assert_eq!(docset.doc(), 6666);
            assert_eq!(docset.advance(), TERMINATED);
        }
        {
            // Same as above, but the seek target is one below the doc it lands on.
            let mut docset = create_docbitset(&[1, 5, 6, 7, 5112, 5500, 6666], 10_000);
            assert_eq!(docset.seek(5111), 5112);
            assert_eq!(docset.doc(), 5112);
            assert_eq!(docset.advance(), 5500);
            assert_eq!(docset.doc(), 5500);
            assert_eq!(docset.advance(), 6666);
            assert_eq!(docset.doc(), 6666);
            assert_eq!(docset.advance(), TERMINATED);
        }
        {
            // Variant of the previous case with 5513 instead of 5500.
            let mut docset = create_docbitset(&[1, 5, 6, 7, 5112, 5513, 6666], 10_000);
            assert_eq!(docset.seek(5111), 5112);
            assert_eq!(docset.doc(), 5112);
            assert_eq!(docset.advance(), 5513);
            assert_eq!(docset.doc(), 5513);
            assert_eq!(docset.advance(), 6666);
            assert_eq!(docset.doc(), 6666);
            assert_eq!(docset.advance(), TERMINATED);
        }
    }
}

#[cfg(all(test, feature = "unstable"))]
mod bench {

    use super::{BitSet, BitSetDocSet};
    use crate::docset::TERMINATED;
    use crate::{test, tests, DocSet};

    /// Builds a bitset with a max value of 1_000_000 holding every element of `els`.
    fn filled_bitset(els: impl IntoIterator<Item = u32>) -> BitSet {
        let mut bitset = BitSet::with_max_value(1_000_000);
        for el in els {
            bitset.insert(el);
        }
        bitset
    }

    /// Measures creating a bitset and inserting the generated elements into it.
    #[bench]
    fn bench_bitset_1pct_insert(b: &mut test::Bencher) {
        let els = tests::generate_nonunique_unsorted(1_000_000u32, 10_000);
        b.iter(|| {
            let _bitset = filled_bitset(els.iter().cloned());
        });
    }

    /// Measures cloning an already populated bitset.
    #[bench]
    fn bench_bitset_1pct_clone(b: &mut test::Bencher) {
        let els = tests::generate_nonunique_unsorted(1_000_000u32, 10_000);
        let bitset = filled_bitset(els);
        b.iter(|| bitset.clone());
    }

    /// Measures cloning a populated bitset and iterating over it as a `DocSet`.
    #[bench]
    fn bench_bitset_1pct_clone_iterate(b: &mut test::Bencher) {
        let els = tests::sample(1_000_000u32, 0.01);
        let bitset = filled_bitset(els);
        b.iter(|| {
            let mut docset = BitSetDocSet::from(bitset.clone());
            while docset.advance() != TERMINATED {}
        });
    }
}


================================================
FILE: src/query/bm25.rs
================================================
use std::sync::Arc;

use crate::fieldnorm::FieldNormReader;
use crate::query::Explanation;
use crate::schema::Field;
use crate::{Score, Searcher, Term};

/// `k1`, the term saturation parameter of the BM25 formula.
const K1: Score = 1.2;
/// `b`, the length normalization parameter of the BM25 formula.
const B: Score = 0.75;

/// An interface to compute the statistics needed in BM25 scoring.
///
/// The standard implementation is a [Searcher] but you can also
/// create your own to adjust the statistics.
///
/// Every method returns a `crate::Result`, so an implementation may report a failure
/// instead of a statistic.
pub trait Bm25StatisticsProvider {
    /// The total number of tokens in a given field across all documents in
    /// the index.
    fn total_num_tokens(&self, field: Field) -> crate::Result<u64>;

    /// The total number of documents in the index.
    fn total_num_docs(&self) -> crate::Result<u64>;

    /// The number of documents containing the given term.
    fn doc_freq(&self, term: &Term) -> crate::Result<u64>;
}

impl Bm25StatisticsProvider for Searcher {
    fn total_num_tokens(&self, field: Field) -> crate::Result<u64> {
        let mut total_num_tokens = 0u64;

        for segment_reader in self.segment_readers() {
            let inverted_index = segment_reader.inverted_index(field)?;
            total_num_tokens += inverted_index.total_num_tokens();
        }
        Ok(total_num_tokens)
    }

    fn total_num_docs(&self) -> crate::Result<u64> {
        let mut total_num_docs = 0u64;

        for segment_reader in self.segment_readers() {
            total_num_docs += u64::from(segment_reader.max_doc());
        }
        Ok(total_num_docs)
    }

    fn doc_freq(&self, term: &Term) -> crate::Result<u64> {
        self.doc_freq(term)
    }
}

/// Inverse document frequency, computed as `ln(1 + (N - n + 0.5) / (n + 0.5))` where
/// `N` is `doc_count` and `n` is `doc_freq`.
///
/// # Panics
///
/// Panics if `doc_freq` is greater than `doc_count`.
pub(crate) fn idf(doc_freq: u64, doc_count: u64) -> Score {
    assert!(doc_count >= doc_freq, "{doc_count} >= {doc_freq}");
    let docs_without_term = (doc_count - doc_freq) as Score;
    let docs_with_term = doc_freq as Score;
    let ratio = (docs_without_term + 0.5) / (docs_with_term + 0.5);
    (1.0 + ratio).ln()
}

/// Computes `K1 * (1 - B + B * fieldnorm / average_fieldnorm)`, the part of the
/// term-frequency denominator that depends only on the field norm.
fn cached_tf_component(fieldnorm: u32, average_fieldnorm: Score) -> Score {
    let length_term = B * fieldnorm as Score / average_fieldnorm;
    K1 * (1.0 - B + length_term)
}

/// Precomputes `cached_tf_component` for each of the 256 possible fieldnorm ids.
fn compute_tf_cache(average_fieldnorm: Score) -> Arc<[Score; 256]> {
    let mut cache: [Score; 256] = [0.0; 256];
    for fieldnorm_id in 0..=u8::MAX {
        let fieldnorm = FieldNormReader::id_to_fieldnorm(fieldnorm_id);
        cache[usize::from(fieldnorm_id)] = cached_tf_component(fieldnorm, average_fieldnorm);
    }
    Arc::new(cache)
}

/// A struct used for computing BM25 scores.
#[derive(Clone)]
pub struct Bm25Weight {
    idf_explain: Option<Explanation>,
    weight: Score,
    cache: Arc<[Score; 256]>,
    average_fieldnorm: Score,
}

impl Bm25Weight {
    /// Increase the weight by a multiplicative factor.
    pub fn boost_by(&self, boost: Score) -> Bm25Weight {
        if boost == 1.0f32 {
            return self.clone();
        }
        Bm25Weight {
            idf_explain: self.idf_explain.clone(),
            weight: self.weight * boost,
            cache: self.cache.clone(),
            average_fieldnorm: self.average_fieldnorm,
        }
    }

    /// Construct a [Bm25Weight] for a phrase of terms.
    pub fn for_terms(
        statistics: &dyn Bm25StatisticsProvider,
        terms: &[Term],
    ) -> crate::Result<Bm25Weight> {
        assert!(!terms.is_empty(), "Bm25 requires at least one term");
        let field = terms[0].field();
        for term in &terms[1..] {
            assert_eq!(
                term.field(),
                field,
                "All terms must belong to the same field."
            );
        }

        let total_num_tokens = statistics.total_num_tokens(field)?;
        let total_num_docs = statistics.total_num_docs()?;
        let average_fieldnorm = total_num_tokens as Score / total_num_docs as Score;

        if terms.len() == 1 {
            let term_doc_freq = statistics.doc_freq(&terms[0])?;
            Ok(Bm25Weight::for_one_term(
                term_doc_freq,
                total_num_docs,
                average_fieldnorm,
            ))
        } else {
            let mut idf_sum: Score = 0.0;
            for term in terms {
                let term_doc_freq = statistics.doc_freq(term)?;
                idf_sum += idf(term_doc_freq, total_num_docs);
            }
            let idf_explain = Explanation::new("idf", idf_sum);
            Ok(Bm25Weight::new(idf_explain, average_fieldnorm))
        }
    }

    /// Construct a [Bm25Weight] for a single term.
    pub fn for_one_term(
        term_doc_freq: u64,
        total_num_docs: u64,
        avg_fieldnorm: Score,
    ) -> Bm25Weight {
        let idf = idf(term_doc_freq, total_num_docs);
        let mut idf_explain =
            Explanation::new("idf, computed as log(1 + (N - n + 0.5) / (n + 0.5))", idf);
        idf_explain.add_const(
            "n, number of docs containing this term",
            term_doc_freq as Score,
        );
        idf_explain.add_const("N, total number of docs", total_num_docs as Score);
        Bm25Weight::new(idf_explain, avg_fieldnorm)
    }
    /// Construct a [Bm25Weight] for a single term.
    /// This method does not carry the [Explanation] for the idf.
    pub fn for_one_term_without_explain(
        term_doc_freq: u64,
        total_num_docs: u64,
        avg_fieldnorm: Score,
    ) -> Bm25Weight {
        let idf = idf(term_doc_freq, total_num_docs);
        Bm25Weight::new_without_explain(idf, avg_fieldnorm)
    }

    pub(crate) fn new(idf_explain: Explanation, average_fieldnorm: Score) -> Bm25Weight {
        let weight = idf_explain.value() * (1.0 + K1);
        Bm25Weight {
            idf_explain: Some(idf_explain),
            weight,
            cache: compute_tf_cache(average_fieldnorm),
            average_fieldnorm,
        }
    }
    pub(crate) fn new_without_explain(idf: f32, average_fieldnorm: Score) -> Bm25Weight {
        let weight = idf * (1.0 + K1);
        Bm25Weight {
            idf_explain: None,
            weight,
            cache: compute_tf_cache(average_fieldnorm),
            average_fieldnorm,
        }
    }

    /// Compute the BM25 score of a single document.
    #[inline]
    pub fn score(&self, fieldnorm_id: u8, term_freq: u32) -> Score {
        self.weight * self.tf_factor(fieldnorm_id, term_freq)
    }

    /// Compute the maximum possible BM25 score given this weight.
    pub fn max_score(&self) -> Score {
        self.score(255u8, 2_013_265_944)
    }

    #[inline]
    pub(crate) fn tf_factor(&self, fieldnorm_id: u8, term_freq: u32) -> Score {
        let term_freq = term_freq as Score;
        let norm = self.cache[fieldnorm_id as usize];
        term_freq / (term_freq + norm)
    }

    /// Produce an [Explanation] of a BM25 score.
    pub fn explain(&self, fieldnorm_id: u8, term_freq: u32) -> Explanation {
        // The explain format is directly copied from Lucene's.
        // (So, Kudos to Lucene)
        let score = self.score(fieldnorm_id, term_freq);

        let norm = self.cache[fieldnorm_id as usize];
        let term_freq = term_freq as Score;
        let right_factor = term_freq / (term_freq + norm);

        let mut tf_explanation = Explanation::new(
            "freq / (freq + k1 * (1 - b + b * dl / avgdl))",
            right_factor,
        );

        tf_explanation.add_const("freq, occurrences of term within document", term_freq);
        tf_explanation.add_const("k1, term saturation parameter", K1);
        tf_explanation.add_const("b, length normalization parameter", B);
        tf_explanation.add_const(
            "dl, length of field",
            FieldNormReader::id_to_fieldnorm(fieldnorm_id) as Score,
        );
        tf_explanation.add_const("avgdl, average length of field", self.average_fieldnorm);

        let mut explanation = Explanation::new("TermQuery, product of...", score);
        explanation.add_detail(Explanation::new("(K1+1)", K1 + 1.0));
        if let Some(idf_explain) = &self.idf_explain {
            explanation.add_detail(idf_explain.clone());
        }
        explanation.add_detail(tf_explanation);
        explanation
    }
}

#[cfg(test)]
mod tests {

    use super::idf;
    use crate::{assert_nearly_equals, Score};

    /// With 1 matching doc out of 2: `ln(1 + (2 - 1 + 0.5) / (1 + 0.5)) = ln(2)`.
    #[test]
    fn test_idf() {
        let expected_idf: Score = Score::ln(2.0);
        assert_nearly_equals!(idf(1, 2), expected_idf);
    }
}


================================================
FILE: src/query/boolean_query/block_wand.rs
================================================
use std::ops::{Deref, DerefMut};

use crate::query::term_query::TermScorer;
use crate::query::Scorer;
use crate::{DocId, DocSet, Score, TERMINATED};

/// Locates the pivot among `term_scorers`, which must be sorted by their current `doc()`.
///
/// Scorers are visited in order while their `max_score` is accumulated; the pivot scorer is
/// the first one for which the accumulated sum exceeds (>) `threshold`.
///
/// Returns `Some((before_pivot_len, pivot_len, pivot_doc))` where:
/// - `pivot_doc` is the lowest document that has a chance of exceeding the threshold score,
/// - `before_pivot_len` is the ordinal of the pivot scorer, i.e. the number of scorers
///   that precede it in the slice,
/// - `pivot_len` is the number of term_scorers such that `term_scorer.doc() <= pivot_doc`.
///
/// We always have `before_pivot_len < pivot_len`.
///
/// `None` is returned if we establish that no document can exceed the threshold, that is
/// when the accumulated sum never exceeds it or when the pivot scorer is `TERMINATED`.
fn find_pivot_doc(
    term_scorers: &[TermScorerWithMaxScore],
    threshold: Score,
) -> Option<(usize, usize, DocId)> {
    let mut score_upper_bound: Score = 0.0;
    // `position` stops on the first scorer that pushes the upper bound above the threshold.
    let before_pivot_len = term_scorers.iter().position(|term_scorer| {
        score_upper_bound += term_scorer.max_score;
        score_upper_bound > threshold
    })?;
    let pivot_doc = term_scorers[before_pivot_len].doc();
    if pivot_doc == TERMINATED {
        return None;
    }
    // Scorers right after the pivot may be positioned on the very same document.
    let trailing_on_pivot = term_scorers[before_pivot_len + 1..]
        .iter()
        .take_while(|term_scorer| term_scorer.doc() == pivot_doc)
        .count();
    // `before_pivot_len` is an ordinal: +1 turns it into a length.
    let pivot_len = before_pivot_len + 1 + trailing_on_pivot;
    Some((before_pivot_len, pivot_len, pivot_doc))
}

/// Seeks a single scorer forward when the pivot could not be scored.
///
/// The scorer that gets moved is the one with the highest `max_score` among
/// `scorers[..pivot_len]` (on ties, the one with the highest ordinal). It is sought to the
/// next candidate doc, defined as the min of
/// - the smallest `last_doc_in_block()` over `scorers[..pivot_len]`, plus one (the +1 is
///   skipped when that value is `TERMINATED`),
/// - `scorer.doc()` for every scorer in `scorers[pivot_len..]`.
///
/// Note: before and after calling this method, scorers need to be sorted by their `.doc()`.
fn block_max_was_too_low_advance_one_scorer(
    scorers: &mut [TermScorerWithMaxScore],
    pivot_len: usize,
) {
    debug_assert!(is_sorted(scorers.iter().map(|scorer| scorer.doc())));
    let pivot_ord = pivot_len - 1;
    let mut best_ord = pivot_ord;
    let mut best_max_score = scorers[pivot_ord].max_score;
    let mut seek_target = scorers[pivot_ord].last_doc_in_block();
    for ord in (0..pivot_ord).rev() {
        let candidate = &scorers[ord];
        seek_target = seek_target.min(candidate.last_doc_in_block());
        // Strict comparison: an equal score never replaces a scorer picked earlier.
        if candidate.max_score > best_max_score {
            best_max_score = candidate.max_score;
            best_ord = ord;
        }
    }
    // Add +1 to go to the next block unless we are already at the end.
    if seek_target != TERMINATED {
        seek_target += 1;
    }
    // A scorer past the pivot may sit on a closer document.
    for scorer in &scorers[pivot_len..] {
        seek_target = seek_target.min(scorer.doc());
    }
    scorers[best_ord].seek(seek_target);

    restore_ordering(scorers, best_ord);
    debug_assert!(is_sorted(scorers.iter().map(|scorer| scorer.doc())));
}

// Given `term_scorers` sorted by `doc()` except for `term_scorers[ord]`, which may be
// ahead of its rank, swaps that scorer towards the end of the slice until the ordering
// is restored.
fn restore_ordering(term_scorers: &mut [TermScorerWithMaxScore], ord: usize) {
    let displaced_doc = term_scorers[ord].doc();
    let mut pos = ord;
    // Stop as soon as the next scorer is not strictly behind the displaced one.
    while pos + 1 < term_scorers.len() && term_scorers[pos + 1].doc() < displaced_doc {
        term_scorers.swap(pos, pos + 1);
        pos += 1;
    }
    debug_assert!(is_sorted(term_scorers.iter().map(|scorer| scorer.doc())));
}

// Attempts to seek every scorer of `&term_scorers[0..before_pivot_len]` to `pivot_doc`,
// starting from the one closest to the pivot.
// Returns `true` if all of them landed on `pivot_doc`.
// As soon as one scorer lands somewhere else (it does not contain `pivot_doc`), the
// function stops and returns `false`: the scorer is removed if it reached `TERMINATED`,
// and the ordering of `term_scorers` is restored before returning.
fn align_scorers(
    term_scorers: &mut Vec<TermScorerWithMaxScore>,
    pivot_doc: DocId,
    before_pivot_len: usize,
) -> bool {
    debug_assert_ne!(pivot_doc, TERMINATED);
    for ord in (0..before_pivot_len).rev() {
        let reached_doc = term_scorers[ord].seek(pivot_doc);
        if reached_doc == pivot_doc {
            continue;
        }
        if reached_doc == TERMINATED {
            // The last scorer takes the vacated slot and is re-ranked just below.
            term_scorers.swap_remove(ord);
        }
        // We went past the pivot.
        // We just go through the outer loop mechanic (Note that pivot is
        // still a possible candidate).
        //
        // Termination is still guaranteed since we can only consider the same
        // pivot at most term_scorers.len() - 1 times.
        restore_ordering(term_scorers, ord);
        return false;
    }
    true
}

// Assumes term_scorers[..pivot_len] are all positioned on the same doc (the pivot doc).
// Advances each of them, drops every scorer that is `TERMINATED` afterwards, and sorts
// the remaining scorers by `doc()` again.
fn advance_all_scorers_on_pivot(term_scorers: &mut Vec<TermScorerWithMaxScore>, pivot_len: usize) {
    term_scorers[..pivot_len].iter_mut().for_each(|term_scorer| {
        term_scorer.advance();
    });
    // TODO use drain_filter when available.
    let mut ord = 0;
    while ord < term_scorers.len() {
        if term_scorers[ord].doc() != TERMINATED {
            ord += 1;
            continue;
        }
        // The last scorer takes the vacated slot, so `ord` has to be examined again.
        term_scorers.swap_remove(ord);
    }
    term_scorers.sort_by_key(|term_scorer| term_scorer.doc());
}

/// Implements the WAND (Weak AND) algorithm for dynamic pruning
/// described in the paper "Faster Top-k Document Retrieval Using Block-Max Indexes".
/// Link: <http://engineering.nyu.edu/~suel/papers/bmw.pdf>
///
/// - `scorers`: the term scorers whose scores are summed for each document.
/// - `threshold`: a document is reported only if its score is strictly greater than the
///   current threshold.
/// - `callback`: called with `(doc, score)` for every reported document; the value it
///   returns becomes the new threshold.
pub fn block_wand(
    mut scorers: Vec<TermScorer>,
    mut threshold: Score,
    callback: &mut dyn FnMut(u32, Score) -> Score,
) {
    // Wrap each scorer together with its `max_score()`, read once here.
    let mut scorers: Vec<TermScorerWithMaxScore> = scorers
        .iter_mut()
        .map(TermScorerWithMaxScore::from)
        .collect();
    scorers.sort_by_key(|scorer| scorer.doc());
    // At this point we need to ensure that the scorers are sorted!
    debug_assert!(is_sorted(scorers.iter().map(|scorer| scorer.doc())));
    // The loop ends when `find_pivot_doc` establishes that no document can exceed the
    // threshold anymore.
    while let Some((before_pivot_len, pivot_len, pivot_doc)) =
        find_pivot_doc(&scorers[..], threshold)
    {
        debug_assert!(is_sorted(scorers.iter().map(|scorer| scorer.doc())));
        debug_assert_ne!(pivot_doc, TERMINATED);
        debug_assert!(before_pivot_len < pivot_len);

        // Sum of the block max scores once every scorer up to the pivot has been
        // shallow-advanced (`seek_block`) to the pivot doc.
        let block_max_score_upperbound: Score = scorers[..pivot_len]
            .iter_mut()
            .map(|scorer| {
                scorer.seek_block(pivot_doc);
                scorer.block_max_score()
            })
            .sum();

        // Beware after shallow advance, skip readers can be in advance compared to
        // the segment posting lists.
        //
        // `block_segment_postings.load_block()` need to be called separately.
        if block_max_score_upperbound <= threshold {
            // Block max condition was not reached
            // We could get away by simply advancing the scorers to DocId + 1 but it would
            // be inefficient. The optimization requires proper explanation and was
            // isolated in a different function.
            block_max_was_too_low_advance_one_scorer(&mut scorers, pivot_len);
            continue;
        }

        // Block max condition is observed.
        //
        // Let's try and advance all scorers before the pivot to the pivot.
        if !align_scorers(&mut scorers, pivot_doc, before_pivot_len) {
            // At least one of the scorers does not contain the pivot.
            //
            // Let's stop scoring this pivot and go through the pivot selection again.
            // Note that the current pivot is not necessarily a bad candidate and it
            // may be picked again.
            continue;
        }

        // At this point, all scorers are positioned on the doc.
        let score = scorers[..pivot_len]
            .iter_mut()
            .map(|scorer| scorer.score())
            .sum();

        if score > threshold {
            threshold = callback(pivot_doc, score);
        }
        // let's advance all of the scorers that are currently positioned on the pivot.
        advance_all_scorers_on_pivot(&mut scorers, pivot_len);
    }
}

/// Specialized version of [`block_wand`] for a single scorer.
/// In this case, the algorithm is simple, readable and faster (~ x3)
/// than the generic algorithm.
/// The algorithm behaves as follows:
/// - While we don't hit the end of the docset:
///   - While the block max score is under the `threshold`, go to the next block.
///   - On a block, advance until the end and execute `callback` when the doc score is
///     strictly greater than the `threshold`.
///
/// The value returned by `callback` becomes the new `threshold`.
pub fn block_wand_single_scorer(
    mut scorer: TermScorer,
    mut threshold: Score,
    callback: &mut dyn FnMut(u32, Score) -> Score,
) {
    let mut doc = scorer.doc();
    loop {
        // We position the scorer on a block that can reach
        // the threshold.
        while scorer.block_max_score() < threshold {
            let last_doc_in_block = scorer.last_doc_in_block();
            if last_doc_in_block == TERMINATED {
                // There is no block after this one.
                return;
            }
            doc = last_doc_in_block + 1;
            scorer.seek_block(doc);
        }
        // Seek will effectively load that block.
        doc = scorer.seek(doc);
        if doc == TERMINATED {
            break;
        }
        // Score the documents of the current block, one by one.
        loop {
            let score = scorer.score();
            if score > threshold {
                threshold = callback(doc, score);
            }
            debug_assert!(doc <= scorer.last_doc_in_block());
            if doc == scorer.last_doc_in_block() {
                // End of the block: go back to the block selection above.
                break;
            }
            doc = scorer.advance();
            if doc == TERMINATED {
                return;
            }
        }
        // Shallow-advance to the block holding the first doc after the current block.
        doc += 1;
        scorer.seek_block(doc);
    }
}

/// A mutable borrow of a `TermScorer` paired with the value that its `max_score()`
/// returned when the wrapper was built, so that this value can be read as a plain field.
struct TermScorerWithMaxScore<'a> {
    // The wrapped scorer; the `Deref`/`DerefMut` impls of the wrapper expose it.
    scorer: &'a mut TermScorer,
    // Value of `scorer.max_score()` captured at construction.
    max_score: Score,
}

impl<'a> From<&'a mut TermScorer> for TermScorerWithMaxScore<'a> {
    fn from(scorer: &'a mut TermScorer) -> Self {
        let max_score = scorer.max_score();
        TermScorerWithMaxScore { scorer, max_score }
    }
}

impl Deref for TermScorerWithMaxScore<'_> {
    type Target = TermScorer;

    /// Gives shared access to the wrapped scorer.
    fn deref(&self) -> &TermScorer {
        &*self.scorer
    }
}

impl DerefMut for TermScorerWithMaxScore<'_> {
    fn deref_mut(&mut self) -> &mut Self::Target {
        self.scorer
    }
}

/// Returns `true` if the docs yielded by `it` never decrease (equal neighbours are
/// accepted). An empty or single-element iterator is considered sorted.
fn is_sorted<I: Iterator<Item = DocId>>(mut it: I) -> bool {
    let Some(mut previous) = it.next() else {
        return true;
    };
    // `all` stops at the first pair that is out of order.
    it.all(|current| {
        let in_order = previous <= current;
        previous = current;
        in_order
    })
}
#[cfg(test)]
mod tests {
    use std::cmp::Ordering;
    use std::collections::BinaryHeap;

    use proptest::prelude::*;

    use crate::query::score_combiner::SumCombiner;
    use crate::query::term_query::TermScorer;
    use crate::query::{Bm25Weight, BufferedUnionScorer, Scorer};
    use crate::{DocId, DocSet, Score, TERMINATED};

    /// Score wrapper with a total order that is the reverse of the numeric order, so that
    /// the greatest element of a `BinaryHeap<Float>` is the smallest score.
    /// Scores that cannot be compared (NaN) are treated as equal.
    struct Float(Score);

    impl Ord for Float {
        fn cmp(&self, other: &Self) -> Ordering {
            // Operands are swapped on purpose: this is what reverses the order.
            match other.0.partial_cmp(&self.0) {
                Some(ordering) => ordering,
                None => Ordering::Equal,
            }
        }
    }

    impl PartialOrd for Float {
        fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
            Some(Ord::cmp(self, other))
        }
    }

    impl PartialEq for Float {
        fn eq(&self, other: &Self) -> bool {
            matches!(Ord::cmp(self, other), Ordering::Equal)
        }
    }

    impl Eq for Float {}

    /// Relative comparison: `true` when the gap between the two scores is strictly below
    /// `0.0001 * |left + right|`. Two zeros are therefore not "nearly equal".
    fn nearly_equals(left: Score, right: Score) -> bool {
        let tolerance = 0.0001 * (left + right).abs();
        let gap = (left - right).abs();
        gap < tolerance
    }

    /// Runs the pruning collection (`block_wand_single_scorer` when there is exactly one
    /// scorer, `block_wand` otherwise) while keeping the `n` best scores in a heap.
    ///
    /// Every reported `(doc, score)` whose score is not nearly equal to the limit in force
    /// after the heap update is recorded as a checkpoint. The limit stays at `0.0` until the
    /// heap holds `n` scores, then it is the lowest of the retained scores.
    fn compute_checkpoints_for_each_pruning(
        mut term_scorers: Vec<TermScorer>,
        n: usize,
    ) -> Vec<(DocId, Score)> {
        let mut top_scores: BinaryHeap<Float> = BinaryHeap::with_capacity(n);
        let mut recorded: Vec<(DocId, Score)> = Vec::new();
        let mut current_limit: Score = 0.0;

        let on_hit = &mut |doc, score| {
            top_scores.push(Float(score));
            // `Float` reverses the order: `pop` evicts the lowest score.
            if top_scores.len() > n {
                top_scores.pop().unwrap();
            }
            if top_scores.len() == n {
                current_limit = top_scores.peek().unwrap().0;
            }
            if !nearly_equals(score, current_limit) {
                recorded.push((doc, score));
            }
            current_limit
        };

        match term_scorers.len() {
            1 => {
                let single_scorer = term_scorers.pop().unwrap();
                super::block_wand_single_scorer(single_scorer, Score::MIN, on_hit);
            }
            _ => super::block_wand(term_scorers, Score::MIN, on_hit),
        }
        recorded
    }

    /// Reference implementation: walks the union of `term_scorers` document by document
    /// (no pruning) and records checkpoints with the same top-`n` heap logic as
    /// `compute_checkpoints_for_each_pruning`. Only documents scoring strictly above the
    /// current limit are considered.
    fn compute_checkpoints_manual(
        term_scorers: Vec<TermScorer>,
        n: usize,
        max_doc: u32,
    ) -> Vec<(DocId, Score)> {
        let mut top_scores: BinaryHeap<Float> = BinaryHeap::with_capacity(n);
        let mut recorded: Vec<(DocId, Score)> = Vec::new();
        let mut merged = BufferedUnionScorer::build(term_scorers, SumCombiner::default, max_doc);

        let mut current_limit = Score::MIN;
        while merged.doc() != TERMINATED {
            let doc = merged.doc();
            let score = merged.score();
            if score > current_limit {
                top_scores.push(Float(score));
                // `Float` reverses the order: `pop` evicts the lowest score.
                if top_scores.len() > n {
                    top_scores.pop().unwrap();
                }
                if top_scores.len() == n {
                    current_limit = top_scores.peek().unwrap().0;
                }
                if !nearly_equals(score, current_limit) {
                    recorded.push((doc, score));
                }
            }
            merged.advance();
        }
        recorded
    }

    /// Exclusive upper bound of the term frequencies drawn by `posting_list`
    /// (`1u32..MAX_TERM_FREQ`); `gen_term_scorers` also uses it to size the range of the
    /// fieldnorms it draws (`2u32..10u32 * MAX_TERM_FREQ`).
    const MAX_TERM_FREQ: u32 = 100u32;

    /// Strategy producing a posting list as a vector of `(doc, term_freq)` pairs.
    ///
    /// A `doc_freq` is drawn in `1..max_doc + 1` first. A bitset is then sampled with
    /// `doc_freq` as its size argument over `0..max_doc`, along with `doc_freq` term
    /// frequencies in `1u32..MAX_TERM_FREQ`. The docs of the bitset are finally zipped with
    /// the term frequencies.
    /// NOTE(review): presumably the bitset holds exactly `doc_freq` docs in increasing
    /// order — confirm against the proptest `bitset::sampled` documentation.
    fn posting_list(max_doc: u32) -> BoxedStrategy<Vec<(DocId, u32)>> {
        (1..max_doc + 1)
            .prop_flat_map(move |doc_freq| {
                (
                    proptest::bits::bitset::sampled(doc_freq as usize, 0..max_doc as usize),
                    proptest::collection::vec(1u32..MAX_TERM_FREQ, doc_freq as usize),
                )
            })
            .prop_map(|(docset, term_freqs)| {
                // `zip` stops at the shorter of the two sequences.
                docset
                    .iter()
                    .map(|doc| doc as u32)
                    .zip(term_freqs.iter().cloned())
                    .collect::<Vec<_>>()
            })
            .boxed()
    }

    /// Strategy producing the input of `test_block_wand_aux`: `num_scorers` posting lists
    /// and one fieldnorm per document.
    ///
    /// `max_doc` is drawn in `1u32..100u32`; the posting lists come from
    /// `posting_list(max_doc)` and the `max_doc` fieldnorms are drawn in
    /// `2u32..10u32 * MAX_TERM_FREQ`.
    #[expect(clippy::type_complexity)]
    fn gen_term_scorers(num_scorers: usize) -> BoxedStrategy<(Vec<Vec<(DocId, u32)>>, Vec<u32>)> {
        (1u32..100u32)
            .prop_flat_map(move |max_doc: u32| {
                (
                    proptest::collection::vec(posting_list(max_doc), num_scorers),
                    proptest::collection::vec(2u32..10u32 * MAX_TERM_FREQ, max_doc as usize),
                )
            })
            .boxed()
    }

    /// Checks, for `top_k` in `1..4`, that the pruning collection and the exhaustive union
    /// walk produce the same checkpoints (same docs, nearly equal scores).
    ///
    /// `posting_lists` holds one `(doc, term_freq)` list per term and `fieldnorms` one
    /// value per document.
    fn test_block_wand_aux(posting_lists: &[Vec<(DocId, u32)>], fieldnorms: &[u32]) {
        // We virtually repeat all docs 64 times in order to emulate blocks of 2 documents
        // and surface bugs more easily.
        const REPEAT: usize = 64;
        let fieldnorms_expanded: Vec<u32> = fieldnorms
            .iter()
            .flat_map(|&fieldnorm| std::iter::repeat_n(fieldnorm, REPEAT))
            .collect();

        // Only the first copy of a doc keeps the original term frequency; the other
        // copies get a term frequency of 1.
        let postings_lists_expanded: Vec<Vec<(DocId, u32)>> = posting_lists
            .iter()
            .map(|posting_list| {
                let mut expanded = Vec::with_capacity(posting_list.len() * REPEAT);
                for &(doc, term_freq) in posting_list {
                    for offset in 0_u32..REPEAT as u32 {
                        let expanded_term_freq = if offset == 0 { term_freq } else { 1 };
                        expanded.push((doc * (REPEAT as u32) + offset, expanded_term_freq));
                    }
                }
                expanded
            })
            .collect();

        let max_doc = fieldnorms_expanded.len();
        let total_fieldnorms: u64 = fieldnorms_expanded
            .iter()
            .map(|&fieldnorm| u64::from(fieldnorm))
            .sum();
        let average_fieldnorm = (total_fieldnorms as Score) / (max_doc as Score);

        let term_scorers: Vec<TermScorer> = postings_lists_expanded
            .iter()
            .map(|postings| {
                let doc_freq = postings.len() as u64;
                let bm25_weight =
                    Bm25Weight::for_one_term(doc_freq, max_doc as u64, average_fieldnorm);
                TermScorer::create_for_test(postings, &fieldnorms_expanded[..], bm25_weight)
            })
            .collect();

        for top_k in 1..4 {
            let pruned = compute_checkpoints_for_each_pruning(term_scorers.clone(), top_k);
            let manual = compute_checkpoints_manual(term_scorers.clone(), top_k, max_doc as u32);
            assert_eq!(pruned.len(), manual.len());
            for (left, right) in pruned.iter().zip(manual.iter()) {
                assert_eq!(left.0, right.0);
                assert!(nearly_equals(left.1, right.1));
            }
        }
    }

    // Property test (500 cases): pruning and exhaustive collection must agree for two
    // term scorers, which goes through `block_wand`.
    proptest! {
        #![proptest_config(ProptestConfig::with_cases(500))]
        #[test]
        fn test_block_wand_two_term_scorers((posting_lists, fieldnorms) in gen_term_scorers(2)) {
            test_block_wand_aux(&posting_lists[..], &fieldnorms[..]);
        }
    }

    // Property test (500 cases): pruning and exhaustive collection must agree for a
    // single term scorer, which goes through `block_wand_single_scorer`.
    proptest! {
        #![proptest_config(ProptestConfig::with_cases(500))]
        #[test]
        fn test_block_wand_single_term_scorer((posting_lists, fieldnorms) in gen_term_scorers(1)) {
            test_block_wand_aux(&posting_lists[..], &fieldnorms[..]);
        }
    }

    /// Fixed input with three posting lists and 48 fieldnorms, checked with
    /// `test_block_wand_aux`.
    /// NOTE(review): judging by its name, this input was captured from a failing proptest
    /// case — confirm before altering the data.
    #[test]
    fn test_fn_reproduce_proptest() {
        // One `(doc, term_freq)` list per term.
        let postings_lists = &[
            vec![
                (0, 1),
                (1, 1),
                (2, 1),
                (3, 1),
                (4, 1),
                (6, 1),
                (7, 7),
                (8, 1),
                (10, 1),
                (12, 1),
                (13, 1),
                (14, 1),
                (15, 1),
                (16, 1),
                (19, 1),
                (20, 1),
                (21, 1),
                (22, 1),
                (24, 1),
                (25, 1),
                (26, 1),
                (28, 1),
                (30, 1),
                (31, 1),
                (33, 1),
                (34, 1),
                (35, 1),
                (36, 95),
                (37, 1),
                (39, 1),
                (41, 1),
                (44, 1),
                (46, 1),
            ],
            vec![
                (0, 5),
                (2, 1),
                (4, 1),
                (5, 84),
                (6, 47),
                (7, 26),
                (8, 50),
                (9, 34),
                (11, 73),
                (12, 11),
                (13, 51),
                (14, 45),
                (15, 18),
                (18, 60),
                (19, 80),
                (20, 63),
                (23, 79),
                (24, 69),
                (26, 35),
                (28, 82),
                (29, 19),
                (30, 2),
                (31, 7),
                (33, 40),
                (34, 1),
                (35, 33),
                (36, 27),
                (37, 24),
                (38, 65),
                (39, 32),
                (40, 85),
                (41, 1),
                (42, 69),
                (43, 11),
                (45, 45),
                (47, 97),
            ],
            vec![
                (2, 1),
                (4, 1),
                (7, 94),
                (8, 1),
                (9, 1),
                (10, 1),
                (12, 1),
                (15, 1),
                (22, 1),
                (23, 1),
                (26, 1),
                (27, 1),
                (32, 1),
                (33, 1),
                (34, 1),
                (36, 96),
                (39, 1),
                (41, 1),
            ],
        ];
        // One fieldnorm per document (docs 0 to 47).
        let fieldnorms = &[
            685, 239, 780, 564, 664, 827, 5, 56, 930, 887, 263, 665, 167, 127, 120, 919, 292, 92,
            489, 734, 814, 724, 700, 304, 128, 779, 311, 877, 774, 15, 866, 368, 894, 371, 982,
            502, 507, 669, 680, 76, 594, 626, 578, 331, 170, 639, 665, 186,
        ][..];
        test_block_wand_aux(postings_lists, fieldnorms);
    }

    // Property test (500 cases): pruning and exhaustive collection must agree for three
    // term scorers. The test is ignored by default; `cargo test -- --ignored` runs it.
    proptest! {
        #![proptest_config(ProptestConfig::with_cases(500))]
        #[test]
        #[ignore]
        fn test_block_wand_three_term_scorers((posting_lists, fieldnorms) in gen_term_scorers(3)) {
            test_block_wand_aux(&posting_lists[..], &fieldnorms[..]);
        }
    }
}


================================================
FILE: src/query/boolean_query/boolean_query.rs
================================================
use super::boolean_weight::BooleanWeight;
use crate::query::{EnableScoring, Occur, Query, SumCombiner, TermQuery, Weight};
use crate::schema::{IndexRecordOption, Term};

/// The boolean query returns a set of documents
/// that matches the Boolean combination of constituent subqueries.
///
/// The documents matched by the boolean query are those which
/// - match all of the sub queries associated with the `Must` occurrence
/// - match none of the sub queries associated with the `MustNot` occurrence.
/// - match at least one of the sub queries associated with the `Must` or `Should` occurrence.
///
/// You can combine other query types and their `Occur`ances into one `BooleanQuery`
///
/// ```rust
/// use tantivy::collector::Count;
/// use tantivy::doc;
/// use tantivy::query::{BooleanQuery, Occur, PhraseQuery, Query, TermQuery};
/// use tantivy::schema::{IndexRecordOption, Schema, TEXT};
/// use tantivy::Term;
/// use tantivy::Index;
/// use tantivy::IndexWriter;
///
/// fn main() -> tantivy::Result<()> {
///    let mut schema_builder = Schema::builder();
///    let title = schema_builder.add_text_field("title", TEXT);
///    let body = schema_builder.add_text_field("body", TEXT);
///    let schema = schema_builder.build();
///    let index = Index::create_in_ram(schema);
///    {
///        let mut index_writer: IndexWriter = index.writer(15_000_000)?;
///        index_writer.add_document(doc!(
///            title => "The Name of the Wind",
///        ))?;
///        index_writer.add_document(doc!(
///            title => "The Diary of Muadib",
///        ))?;
///        index_writer.add_document(doc!(
///            title => "A Dairy Cow",
///            body => "hidden",
///        ))?;
///        index_writer.add_document(doc!(
///            title => "A Dairy Cow",
///            body => "found",
///        ))?;
///        index_writer.add_document(doc!(
///            title => "The Diary of a Young Girl",
///        ))?;
///        index_writer.commit()?;
///    }
///
///    let reader = index.reader()?;
///    let searcher = reader.searcher();
///
///    // Make TermQuery's for "girl" and "diary" in the title
///    let girl_term_query: Box<dyn Query> = Box::new(TermQuery::new(
///        Term::from_field_text(title, "girl"),
///        IndexRecordOption::Basic,
///    ));
///    let diary_term_query: Box<dyn Query> = Box::new(TermQuery::new(
///        Term::from_field_text(title, "diary"),
///        IndexRecordOption::Basic,
///    ));
///    let cow_term_query: Box<dyn Query> = Box::new(TermQuery::new(
///        Term::from_field_text(title, "cow"),
///        IndexRecordOption::Basic
///    ));
///    // A TermQuery with "found" in the body
///    let body_term_query: Box<dyn Query> = Box::new(TermQuery::new(
///        Term::from_field_text(body, "found"),
///        IndexRecordOption::Basic,
///    ));
///    // TermQuery "diary" must and "girl" must not be present
///    let queries_with_occurs1 = vec![
///        (Occur::Must, diary_term_query.box_clone()),
///        (Occur::MustNot, girl_term_query.box_clone()),
///    ];
///    // Make a BooleanQuery equivalent to
///    // title:+diary title:-girl
///    let diary_must_and_girl_mustnot = BooleanQuery::new(queries_with_occurs1);
///    let count1 = searcher.search(&diary_must_and_girl_mustnot, &Count)?;
///    assert_eq!(count1, 1);
///
///    // "title:diary OR title:cow"
///    let title_diary_or_cow = BooleanQuery::new(vec![
///        (Occur::Should, diary_term_query.box_clone()),
///        (Occur::Should, cow_term_query.box_clone()),
///    ]);
///    let count2 = searcher.search(&title_diary_or_cow, &Count)?;
///    assert_eq!(count2, 4);
///
///    // Make a `PhraseQuery` from a vector of `Term`s
///    let phrase_query: Box<dyn Query> = Box::new(PhraseQuery::new(vec![
///        Term::from_field_text(title, "dairy"),
///        Term::from_field_text(title, "cow"),
///    ]));
///    // You can combine subqueries of different types into 1 BooleanQuery:
///    // `TermQuery` and `PhraseQuery`
///    // title:diary OR "dairy cow"
///    let term_of_phrase_query = BooleanQuery::new(vec![
///        (Occur::Should, diary_term_query.box_clone()),
///        (Occur::Should, phrase_query.box_clone()),
///    ]);
///    let count3 = searcher.search(&term_of_phrase_query, &Count)?;
///    assert_eq!(count3, 4);
///
///    // You can nest one BooleanQuery inside another
///    // body:found AND (title:diary OR "dairy cow")
///    let nested_query = BooleanQuery::new(vec![
///        (Occur::Must, body_term_query),
///        (Occur::Must, Box::new(term_of_phrase_query))
///    ]);
///    let count4 = searcher.search(&nested_query, &Count)?;
///    assert_eq!(count4, 1);
///
///    // You may call `with_minimum_required_clauses` to
///    // specify the number of should clauses the returned documents must match.
///    let minimum_required_query = BooleanQuery::with_minimum_required_clauses(vec![
///         (Occur::Should, cow_term_query.box_clone()),
///         (Occur::Should, girl_term_query.box_clone()),
///         (Occur::Should, diary_term_query.box_clone()),
///    ], 2);
///    // Returns the documents that contain at least two of "cow", "girl" and "diary".
///    // Notice: "Diary" isn't "Dairy". ;-)
///    let count5 = searcher.search(&minimum_required_query, &Count)?;
///    assert_eq!(count5, 1);
///    Ok(())
/// }
/// ```
#[derive(Debug)]
pub struct BooleanQuery {
    /// The sub-queries, each paired with the `Occur` it is associated with.
    subqueries: Vec<(Occur, Box<dyn Query>)>,
    /// Minimum number of should clauses a document is required to match. `weight` hands
    /// it over to `BooleanWeight::with_minimum_number_should_match`.
    minimum_number_should_match: usize,
}

impl Clone for BooleanQuery {
    fn clone(&self) -> Self {
        let subqueries = self
            .subqueries
            .iter()
            .map(|(occur, subquery)| (*occur, subquery.box_clone()))
            .collect::<Vec<_>>();
        Self {
            subqueries,
            minimum_number_should_match: self.minimum_number_should_match,
        }
    }
}

impl From<Vec<(Occur, Box<dyn Query>)>> for BooleanQuery {
    /// Same as [`BooleanQuery::new`].
    fn from(subqueries: Vec<(Occur, Box<dyn Query>)>) -> BooleanQuery {
        Self::new(subqueries)
    }
}

impl Query for BooleanQuery {
    /// Builds the weight of every sub-query, stopping at the first error, and wraps them
    /// in a `BooleanWeight` that combines scores with `SumCombiner`.
    fn weight(&self, enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let sub_weights = self
            .subqueries
            .iter()
            .map(|(occur, subquery)| {
                let sub_weight = subquery.weight(enable_scoring)?;
                Ok((*occur, sub_weight))
            })
            .collect::<crate::Result<_>>()?;
        let boolean_weight = BooleanWeight::with_minimum_number_should_match(
            sub_weights,
            self.minimum_number_should_match,
            enable_scoring.is_scoring_enabled(),
            Box::new(SumCombiner::default),
        );
        Ok(Box::new(boolean_weight))
    }

    /// Forwards `visitor` to every sub-query, whatever its `Occur`.
    fn query_terms<'a>(&'a self, visitor: &mut dyn FnMut(&'a Term, bool)) {
        for (_, clause) in self.subqueries.iter() {
            clause.query_terms(visitor);
        }
    }
}

impl BooleanQuery {
    /// Creates a new boolean query.
    pub fn new(subqueries: Vec<(Occur, Box<dyn Query>)>) -> BooleanQuery {
        // If the bool query includes at least one should clause
        // and no Must or MustNot clauses, the default value is 1. Otherwise, the default value is
        // 0. Keep compatible with Elasticsearch.
        let mut minimum_required = 0;
        for (occur, _) in &subqueries {
            match occur {
                Occur::Should => minimum_required = 1,
                Occur::Must | Occur::MustNot => {
                    minimum_required = 0;
                    break;
                }
            }
        }
        Self::with_minimum_required_clauses(subqueries, minimum_required)
    }

    /// Create a new boolean query with minimum number of required should clauses specified.
    pub fn with_minimum_required_clauses(
        subqueries: Vec<(Occur, Box<dyn Query>)>,
        minimum_number_should_match: usize,
    ) -> BooleanQuery {
        BooleanQuery {
            subqueries,
            minimum_number_should_match,
        }
    }

    /// Getter for `minimum_number_should_match`
    pub fn get_minimum_number_should_match(&self) -> usize {
        self.minimum_number_should_match
    }

    /// Setter for `minimum_number_should_match`
    pub fn set_minimum_number_should_match(&mut self, minimum_number_should_match: usize) {
        self.minimum_number_should_match = minimum_number_should_match;
    }

    /// Returns the intersection of the queries.
    pub fn intersection(queries: Vec<Box<dyn Query>>) -> BooleanQuery {
        let subqueries = queries.into_iter().map(|s| (Occur::Must, s)).collect();
        BooleanQuery::new(subqueries)
    }

    /// Returns the union of the queries.
    pub fn union(queries: Vec<Box<dyn Query>>) -> BooleanQuery {
        let subqueries = queries.into_iter().map(|s| (Occur::Should, s)).collect();
        BooleanQuery::new(subqueries)
    }

    /// Returns the union of the queries with minimum required clause.
    pub fn union_with_minimum_required_clauses(
        queries: Vec<Box<dyn Query>>,
        minimum_required_clauses: usize,
    ) -> BooleanQuery {
        let subqueries = queries
            .into_iter()
            .map(|sub_query| (Occur::Should, sub_query))
            .collect();
        BooleanQuery::with_minimum_required_clauses(subqueries, minimum_required_clauses)
    }

    /// Helper method to create a boolean query matching a given list of terms.
    /// The resulting query is a disjunction of the terms.
    pub fn new_multiterms_query(terms: Vec<Term>) -> BooleanQuery {
        let occur_term_queries: Vec<(Occur, Box<dyn Query>)> = terms
            .into_iter()
            .map(|term| {
                let term_query: Box<dyn Query> =
                    Box::new(TermQuery::new(term, IndexRecordOption::WithFreqs));
                (Occur::Should, term_query)
            })
            .collect();
        BooleanQuery::new(occur_term_queries)
    }

    /// Deconstructed view of the clauses making up this query.
    pub fn clauses(&self) -> &[(Occur, Box<dyn Query>)] {
        &self.subqueries[..]
    }
}

#[cfg(test)]
mod tests {
    use std::collections::HashSet;

    use super::BooleanQuery;
    use crate::collector::{Count, DocSetCollector};
    use crate::query::{Query, QueryClone, QueryParser, TermQuery};
    use crate::schema::{Field, IndexRecordOption, Schema, TEXT};
    use crate::{DocAddress, DocId, Index, Term};

    /// Builds an in-RAM index with a single `text` field and four committed documents:
    /// "b c", "a c", "a b" and "a d" (doc ids 0 to 3 in the assertions below).
    fn create_test_index() -> crate::Result<Index> {
        let mut schema_builder = Schema::builder();
        let text = schema_builder.add_text_field("text", TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests()?;
        writer.add_document(doc!(text=>"b c"))?;
        writer.add_document(doc!(text=>"a c"))?;
        writer.add_document(doc!(text=>"a b"))?;
        writer.add_document(doc!(text=>"a d"))?;
        writer.commit()?;
        Ok(index)
    }

    /// Checks `union_with_minimum_required_clauses` for several minimum values.
    #[test]
    fn test_minimum_required() -> crate::Result<()> {
        // Builds an in-RAM index with one `text` field and one document per given string.
        fn create_test_index_with<T: IntoIterator<Item = &'static str>>(
            docs: T,
        ) -> crate::Result<Index> {
            let mut schema_builder = Schema::builder();
            let text = schema_builder.add_text_field("text", TEXT);
            let schema = schema_builder.build();
            let index = Index::create_in_ram(schema);
            let mut writer = index.writer_for_tests()?;
            for doc in docs {
                writer.add_document(doc!(text => doc))?;
            }
            writer.commit()?;
            Ok(index)
        }
        // Builds a union of term queries on `field`, of which at least `mr` must match.
        fn create_boolean_query_with_mr<T: IntoIterator<Item = &'static str>>(
            queries: T,
            field: Field,
            mr: usize,
        ) -> BooleanQuery {
            let terms = queries
                .into_iter()
                .map(|t| Term::from_field_text(field, t))
                .map(|t| TermQuery::new(t, IndexRecordOption::Basic))
                .map(|q| -> Box<dyn Query> { Box::new(q) })
                .collect();
            BooleanQuery::union_with_minimum_required_clauses(terms, mr)
        }
        // Asserts that `actually` holds exactly the `expected` doc ids of segment `seg`.
        fn check_doc_id<T: IntoIterator<Item = DocId>>(
            expected: T,
            actually: HashSet<DocAddress>,
            seg: u32,
        ) {
            assert_eq!(
                actually,
                expected
                    .into_iter()
                    .map(|id| DocAddress::new(seg, id))
                    .collect()
            );
        }
        let index = create_test_index_with(["a b c", "a c e", "d f g", "z z z", "c i b"])?;
        let searcher = index.reader()?.searcher();
        let text = index.schema().get_field("text").unwrap();
        // Documents containing at least two of the terms, i.e. 'a c', 'a z', 'a i', 'c z',
        // 'c i' or 'z i', shall be returned.
        let q1 = create_boolean_query_with_mr(["a", "c", "z", "i"], text, 2);
        let docs = searcher.search(&q1, &DocSetCollector)?;
        check_doc_id([0, 1, 4], docs, 0);
        // Documents containing at least three of the terms, i.e. 'a b c', 'a b e', 'a c e'
        // or 'b c e', shall be returned.
        let q2 = create_boolean_query_with_mr(["a", "b", "c", "e"], text, 3);
        let docs = searcher.search(&q2, &DocSetCollector)?;
        check_doc_id([0, 1], docs, 0);
        // No document matches since minimum_required exceeds the number of clauses.
        let q3 = create_boolean_query_with_mr(["a", "b"], text, 3);
        let docs = searcher.search(&q3, &DocSetCollector)?;
        assert!(docs.is_empty());
        // When mr is set to zero or one, the result is the same as with `BooleanQuery::union`.
        let q4 = create_boolean_query_with_mr(["a", "z"], text, 1);
        let docs = searcher.search(&q4, &DocSetCollector)?;
        check_doc_id([0, 1, 3], docs, 0);
        let q5 = create_boolean_query_with_mr(["a", "b"], text, 0);
        let docs = searcher.search(&q5, &DocSetCollector)?;
        check_doc_id([0, 1, 4], docs, 0);
        Ok(())
    }

    /// `BooleanQuery::union` returns the documents matching at least one of the term queries.
    #[test]
    fn test_union() -> crate::Result<()> {
        let index = create_test_index()?;
        let searcher = index.reader()?.searcher();
        let text = index.schema().get_field("text").unwrap();
        let term_a = TermQuery::new(Term::from_field_text(text, "a"), IndexRecordOption::Basic);
        let term_d = TermQuery::new(Term::from_field_text(text, "d"), IndexRecordOption::Basic);
        let union_ad = BooleanQuery::union(vec![term_a.box_clone(), term_d.box_clone()]);
        let docs = searcher.search(&union_ad, &DocSetCollector)?;
        assert_eq!(
            docs,
            vec![
                DocAddress::new(0u32, 1u32),
                DocAddress::new(0u32, 2u32),
                DocAddress::new(0u32, 3u32)
            ]
            .into_iter()
            .collect()
        );
        Ok(())
    }

    /// `BooleanQuery::intersection` returns only the documents matching every term query.
    #[test]
    fn test_intersection() -> crate::Result<()> {
        let index = create_test_index()?;
        let searcher = index.reader()?.searcher();
        let text = index.schema().get_field("text").unwrap();
        let term_a = TermQuery::new(Term::from_field_text(text, "a"), IndexRecordOption::Basic);
        let term_b = TermQuery::new(Term::from_field_text(text, "b"), IndexRecordOption::Basic);
        let term_c = TermQuery::new(Term::from_field_text(text, "c"), IndexRecordOption::Basic);
        let intersection_ab =
            BooleanQuery::intersection(vec![term_a.box_clone(), term_b.box_clone()]);
        let intersection_ac =
            BooleanQuery::intersection(vec![term_a.box_clone(), term_c.box_clone()]);
        let intersection_bc =
            BooleanQuery::intersection(vec![term_b.box_clone(), term_c.box_clone()]);
        {
            let docs = searcher.search(&intersection_ab, &DocSetCollector)?;
            assert_eq!(
                docs,
                vec![DocAddress::new(0u32, 2u32)].into_iter().collect()
            );
        }
        {
            let docs = searcher.search(&intersection_ac, &DocSetCollector)?;
            assert_eq!(
                docs,
                vec![DocAddress::new(0u32, 1u32)].into_iter().collect()
            );
        }
        {
            let docs = searcher.search(&intersection_bc, &DocSetCollector)?;
            assert_eq!(
                docs,
                vec![DocAddress::new(0u32, 0u32)].into_iter().collect()
            );
        }
        Ok(())
    }

    /// Documents the pitfall of querying JSON arrays: the objects of an array are not
    /// matched as independent nested documents.
    #[test]
    pub fn test_json_array_pitfall_bag_of_terms() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        {
            let mut index_writer = index.writer_for_tests()?;
            index_writer.add_document(doc!(json_field=>json!({
                "cart": [
                    {"product_type": "sneakers", "attributes": {"color": "white"}},
                    {"product_type": "t-shirt", "attributes": {"color": "red"}},
                    {"product_type": "cd", "attributes": {"genre": "blues"}},
                ]
            })))?;
            index_writer.commit()?;
        }
        let searcher = index.reader()?.searcher();
        // Returns true if the parsed query matches exactly one document.
        let doc_matches = |query: &str| {
            let query_parser = QueryParser::for_index(&index, vec![json_field]);
            let query = query_parser.parse_query(query).unwrap();
            searcher.search(&query, &Count).unwrap() == 1
        };
        // As expected
        assert!(doc_matches(
            r#"cart.product_type:sneakers AND cart.attributes.color:white"#
        ));
        // Unexpected match, due to the fact that arrays do not act as nested docs.
        assert!(doc_matches(
            r#"cart.product_type:sneakers AND cart.attributes.color:red"#
        ));
        // However, obviously this works...
        assert!(!doc_matches(
            r#"cart.product_type:sneakers AND cart.attributes.color:blues"#
        ));
        Ok(())
    }
}


================================================
FILE: src/query/boolean_query/boolean_weight.rs
================================================
use std::collections::HashMap;

use crate::docset::COLLECT_BLOCK_BUFFER_LEN;
use crate::index::SegmentReader;
use crate::postings::FreqReadingOption;
use crate::query::disjunction::Disjunction;
use crate::query::explanation::does_not_match;
use crate::query::score_combiner::{DoNothingCombiner, ScoreCombiner};
use crate::query::term_query::TermScorer;
use crate::query::weight::{for_each_docset_buffered, for_each_pruning_scorer, for_each_scorer};
use crate::query::{
    intersect_scorers, AllScorer, BufferedUnionScorer, EmptyScorer, Exclude, Explanation, Occur,
    RequiredOptionalScorer, Scorer, Weight,
};
use crate::{DocId, Score};

/// Scorer produced by `complex_scorer`.
///
/// Unions made only of term scorers are kept apart from every other scorer so that
/// callers can handle them specifically.
enum SpecializedScorer {
    /// Term scorers that all read term frequencies (see `scorer_union`).
    /// `for_each_pruning` hands them to `block_wand`.
    TermUnion(Vec<TermScorer>),
    /// Any other scorer, already boxed.
    Other(Box<dyn Scorer>),
}

/// Wraps `scorers` into a `Disjunction` configured with `minimum_match_required`.
///
/// A lone scorer is returned as is. Debug builds assert that `scorers` is not empty and
/// that `minimum_match_required` is greater than one.
fn scorer_disjunction<TScoreCombiner>(
    mut scorers: Vec<Box<dyn Scorer>>,
    score_combiner: TScoreCombiner,
    minimum_match_required: usize,
) -> Box<dyn Scorer>
where
    TScoreCombiner: ScoreCombiner,
{
    debug_assert!(!scorers.is_empty());
    debug_assert!(minimum_match_required > 1);
    match scorers.len() {
        // Safe unwrap: the vector holds exactly one element.
        1 => scorers.pop().unwrap(),
        _ => Box::new(Disjunction::new(
            scorers,
            score_combiner,
            minimum_match_required,
        )),
    }
}

/// Builds the union of `scorers`.
///
/// - A single scorer is returned untouched.
/// - If every scorer is a `TermScorer` reading frequencies, the term scorers are returned as
///   a `SpecializedScorer::TermUnion`.
/// - Otherwise the scorers are merged into a `BufferedUnionScorer`.
///
/// `num_docs` is the number of documents in the segment.
///
/// Panics if `scorers` is empty.
fn scorer_union<TScoreCombiner>(
    mut scorers: Vec<Box<dyn Scorer>>,
    score_combiner_fn: impl Fn() -> TScoreCombiner,
    num_docs: u32,
) -> SpecializedScorer
where
    TScoreCombiner: ScoreCombiner,
{
    assert!(!scorers.is_empty());
    if scorers.len() == 1 {
        // The length was checked just above, so there is an element to pop.
        return SpecializedScorer::Other(scorers.pop().unwrap());
    }

    let has_non_term_scorer = scorers.iter().any(|scorer| !scorer.is::<TermScorer>());
    if has_non_term_scorer {
        let union_scorer = BufferedUnionScorer::build(scorers, score_combiner_fn, num_docs);
        return SpecializedScorer::Other(Box::new(union_scorer));
    }

    // Every scorer is a `TermScorer`: unbox them to work on the concrete type.
    let term_scorers: Vec<TermScorer> = scorers
        .into_iter()
        .map(|scorer| {
            let term_scorer = scorer.downcast::<TermScorer>().map_err(|_| ()).unwrap();
            *term_scorer
        })
        .collect();
    let all_read_freqs = term_scorers
        .iter()
        .all(|term_scorer| term_scorer.freq_reading_option() == FreqReadingOption::ReadFreq);
    if all_read_freqs {
        // Block wand is only available if we read frequencies.
        SpecializedScorer::TermUnion(term_scorers)
    } else {
        let union_scorer = BufferedUnionScorer::build(term_scorers, score_combiner_fn, num_docs);
        SpecializedScorer::Other(Box::new(union_scorer))
    }
}

/// Turns a `SpecializedScorer` into a plain boxed scorer.
///
/// A `TermUnion` is materialized as a `BufferedUnionScorer` built with `score_combiner_fn`
/// and `num_docs`; any other scorer is already boxed and is returned unchanged.
fn into_box_scorer<TScoreCombiner: ScoreCombiner>(
    scorer: SpecializedScorer,
    score_combiner_fn: impl Fn() -> TScoreCombiner,
    num_docs: u32,
) -> Box<dyn Scorer> {
    let term_scorers = match scorer {
        SpecializedScorer::Other(boxed_scorer) => return boxed_scorer,
        SpecializedScorer::TermUnion(term_scorers) => term_scorers,
    };
    Box::new(BufferedUnionScorer::build(
        term_scorers,
        score_combiner_fn,
        num_docs,
    ))
}

/// Computes the scorer standing for the MUST clauses once AllScorers have been stripped.
///
/// - Remaining MUST scorers are intersected.
/// - With no scorer left but at least one removed AllScorer, every document matches, so
///   an `AllScorer` over `max_doc` is returned.
/// - With neither, there is no MUST constraint at all and `None` is returned.
fn effective_must_scorer(
    must_scorers: Vec<Box<dyn Scorer>>,
    removed_all_scorer_count: usize,
    max_doc: DocId,
    num_docs: u32,
) -> Option<Box<dyn Scorer>> {
    if !must_scorers.is_empty() {
        return Some(intersect_scorers(must_scorers, num_docs));
    }
    if removed_all_scorer_count == 0 {
        // No MUST constraint at all.
        return None;
    }
    // Only AllScorer(s) were present: restore the "match all" semantics.
    Some(Box::new(AllScorer::new(max_doc)))
}

/// Restores the "match all" contribution of AllScorers removed from the SHOULD clauses.
///
/// With union (OR) semantics, a single AllScorer among the SHOULD clauses makes every
/// document match:
/// - if none was removed, `should_scorer` is returned unchanged;
/// - if scoring is disabled, an `AllScorer` alone is enough, as no score contribution is
///   needed from `should_scorer`;
/// - otherwise `should_scorer` is unioned with an `AllScorer` so both contribute to the score.
fn effective_should_scorer_for_union<TScoreCombiner: ScoreCombiner>(
    should_scorer: SpecializedScorer,
    removed_all_scorer_count: usize,
    max_doc: DocId,
    num_docs: u32,
    score_combiner_fn: impl Fn() -> TScoreCombiner,
    scoring_enabled: bool,
) -> SpecializedScorer {
    if removed_all_scorer_count == 0 {
        return should_scorer;
    }
    if !scoring_enabled {
        // Scoring disabled - AllScorer alone is sufficient.
        return SpecializedScorer::Other(Box::new(AllScorer::new(max_doc)));
    }
    // Scoring enabled - union both to keep the score contributions of each side.
    let boxed_should_scorer = into_box_scorer(should_scorer, &score_combiner_fn, num_docs);
    let match_all_scorer: Box<dyn Scorer> = Box::new(AllScorer::new(max_doc));
    let union_scorer = BufferedUnionScorer::build(
        vec![boxed_should_scorer, match_all_scorer],
        score_combiner_fn,
        num_docs,
    );
    SpecializedScorer::Other(Box::new(union_scorer))
}

/// How the SHOULD scorers take part in the final scorer built by `complex_scorer`.
enum ShouldScorersCombinationMethod {
    /// Should scorers are irrelevant: there are none left, or they were all moved
    /// into the MUST scorers.
    Ignored,
    /// Only contributes to final score.
    Optional(SpecializedScorer),
    /// Regardless of score, the should scorers may impact whether a document is matching or not.
    Required(SpecializedScorer),
}

/// Weight associated to the `BooleanQuery`.
pub struct BooleanWeight<TScoreCombiner: ScoreCombiner> {
    /// Weights of the clauses, each paired with its `Occur`.
    weights: Vec<(Occur, Box<dyn Weight>)>,
    /// Minimum number of SHOULD clauses to match; `new` sets it to 1.
    minimum_number_should_match: usize,
    /// Whether the scorers built by this weight combine the scores of their clauses.
    scoring_enabled: bool,
    /// Factory called whenever a score combiner is needed to combine scorers.
    score_combiner_fn: Box<dyn Fn() -> TScoreCombiner + Sync + Send>,
}

impl<TScoreCombiner: ScoreCombiner> BooleanWeight<TScoreCombiner> {
    /// Creates a new boolean weight.
    ///
    /// `minimum_number_should_match` is set to 1.
    pub fn new(
        weights: Vec<(Occur, Box<dyn Weight>)>,
        scoring_enabled: bool,
        score_combiner_fn: Box<dyn Fn() -> TScoreCombiner + Sync + Send + 'static>,
    ) -> BooleanWeight<TScoreCombiner> {
        BooleanWeight {
            weights,
            scoring_enabled,
            score_combiner_fn,
            minimum_number_should_match: 1,
        }
    }

    /// Create a new boolean weight with minimum number of required should clauses specified.
    pub fn with_minimum_number_should_match(
        weights: Vec<(Occur, Box<dyn Weight>)>,
        minimum_number_should_match: usize,
        scoring_enabled: bool,
        score_combiner_fn: Box<dyn Fn() -> TScoreCombiner + Sync + Send + 'static>,
    ) -> BooleanWeight<TScoreCombiner> {
        BooleanWeight {
            weights,
            minimum_number_should_match,
            scoring_enabled,
            score_combiner_fn,
        }
    }

    /// Builds the scorer of every clause for `reader` and groups the scorers by `Occur`.
    ///
    /// Returns the first error reported by a sub-weight, if any.
    fn per_occur_scorers(
        &self,
        reader: &SegmentReader,
        boost: Score,
    ) -> crate::Result<HashMap<Occur, Vec<Box<dyn Scorer>>>> {
        let mut per_occur_scorers: HashMap<Occur, Vec<Box<dyn Scorer>>> = HashMap::new();
        for (occur, subweight) in &self.weights {
            let sub_scorer: Box<dyn Scorer> = subweight.scorer(reader, boost)?;
            per_occur_scorers
                .entry(*occur)
                .or_default()
                .push(sub_scorer);
        }
        Ok(per_occur_scorers)
    }

    /// Builds the scorer combining the MUST, SHOULD and MUST_NOT clauses of this weight.
    ///
    /// AllScorers and EmptyScorers are first stripped from each group and counted, which
    /// allows several shortcuts:
    /// - an empty MUST scorer, or a match-all MUST_NOT scorer, yields an `EmptyScorer`;
    /// - each match-all SHOULD scorer lowers the number of SHOULD scorers still to match.
    ///
    /// The SHOULD scorers are then either ignored, optional (score only) or required,
    /// combined with the MUST scorers, and finally wrapped in an `Exclude` if any
    /// MUST_NOT scorer is left.
    fn complex_scorer<TComplexScoreCombiner: ScoreCombiner>(
        &self,
        reader: &SegmentReader,
        boost: Score,
        score_combiner_fn: impl Fn() -> TComplexScoreCombiner,
    ) -> crate::Result<SpecializedScorer> {
        let num_docs = reader.num_docs();
        let mut per_occur_scorers = self.per_occur_scorers(reader, boost)?;

        // Indicate how should clauses are combined with must clauses.
        let mut must_scorers: Vec<Box<dyn Scorer>> =
            per_occur_scorers.remove(&Occur::Must).unwrap_or_default();
        let must_special_scorer_counts = remove_and_count_all_and_empty_scorers(&mut must_scorers);

        if must_special_scorer_counts.num_empty_scorers > 0 {
            // A MUST clause matching nothing makes the whole query match nothing.
            return Ok(SpecializedScorer::Other(Box::new(EmptyScorer)));
        }

        let mut should_scorers = per_occur_scorers.remove(&Occur::Should).unwrap_or_default();
        let should_special_scorer_counts =
            remove_and_count_all_and_empty_scorers(&mut should_scorers);

        let mut exclude_scorers: Vec<Box<dyn Scorer>> = per_occur_scorers
            .remove(&Occur::MustNot)
            .unwrap_or_default();
        let exclude_special_scorer_counts =
            remove_and_count_all_and_empty_scorers(&mut exclude_scorers);

        if exclude_special_scorer_counts.num_all_scorers > 0 {
            // We exclude all documents at one point.
            return Ok(SpecializedScorer::Other(Box::new(EmptyScorer)));
        }

        // Each removed match-all SHOULD scorer is counted as one matched SHOULD clause.
        let effective_minimum_number_should_match = self
            .minimum_number_should_match
            .saturating_sub(should_special_scorer_counts.num_all_scorers);

        let should_scorers: ShouldScorersCombinationMethod = {
            let num_of_should_scorers = should_scorers.len();
            if effective_minimum_number_should_match > num_of_should_scorers {
                // We don't have enough scorers to satisfy the minimum number of should matches.
                // The request will match no documents.
                return Ok(SpecializedScorer::Other(Box::new(EmptyScorer)));
            }
            match effective_minimum_number_should_match {
                0 if num_of_should_scorers == 0 => ShouldScorersCombinationMethod::Ignored,
                0 => ShouldScorersCombinationMethod::Optional(scorer_union(
                    should_scorers,
                    &score_combiner_fn,
                    num_docs,
                )),
                1 => ShouldScorersCombinationMethod::Required(scorer_union(
                    should_scorers,
                    &score_combiner_fn,
                    num_docs,
                )),
                n if num_of_should_scorers == n => {
                    // When the minimum number of should matches equals the number of
                    // should scorers, all of them have to match: they are no different
                    // from must clauses.
                    must_scorers.append(&mut should_scorers);
                    ShouldScorersCombinationMethod::Ignored
                }
                _ => ShouldScorersCombinationMethod::Required(SpecializedScorer::Other(
                    scorer_disjunction(
                        should_scorers,
                        score_combiner_fn(),
                        effective_minimum_number_should_match,
                    ),
                )),
            }
        };

        let include_scorer = match (should_scorers, must_scorers) {
            (ShouldScorersCombinationMethod::Ignored, must_scorers) => {
                // No SHOULD clauses (or they were absorbed into MUST).
                // Result depends entirely on MUST + any removed AllScorers.
                let combined_all_scorer_count = must_special_scorer_counts.num_all_scorers
                    + should_special_scorer_counts.num_all_scorers;
                let boxed_scorer: Box<dyn Scorer> = effective_must_scorer(
                    must_scorers,
                    combined_all_scorer_count,
                    reader.max_doc(),
                    num_docs,
                )
                .unwrap_or_else(|| Box::new(EmptyScorer));
                SpecializedScorer::Other(boxed_scorer)
            }
            (ShouldScorersCombinationMethod::Optional(should_scorer), must_scorers) => {
                // Optional SHOULD: contributes to scoring but not required for matching.
                match effective_must_scorer(
                    must_scorers,
                    must_special_scorer_counts.num_all_scorers,
                    reader.max_doc(),
                    num_docs,
                ) {
                    None => {
                        // No MUST constraint: promote SHOULD to required.
                        // Must preserve any removed AllScorers from SHOULD via union.
                        effective_should_scorer_for_union(
                            should_scorer,
                            should_special_scorer_counts.num_all_scorers,
                            reader.max_doc(),
                            num_docs,
                            &score_combiner_fn,
                            self.scoring_enabled,
                        )
                    }
                    Some(must_scorer) => {
                        // Has MUST constraint: SHOULD only affects scoring.
                        if self.scoring_enabled {
                            SpecializedScorer::Other(Box::new(RequiredOptionalScorer::<
                                _,
                                _,
                                TScoreCombiner,
                            >::new(
                                must_scorer,
                                into_box_scorer(should_scorer, &score_combiner_fn, num_docs),
                            )))
                        } else {
                            // Without scoring, the optional SHOULD scorer has no effect.
                            SpecializedScorer::Other(must_scorer)
                        }
                    }
                }
            }
            (ShouldScorersCombinationMethod::Required(should_scorer), must_scorers) => {
                // Required SHOULD: at least `minimum_number_should_match` must match.
                // Semantics: (MUST constraint) AND (SHOULD constraint)
                match effective_must_scorer(
                    must_scorers,
                    must_special_scorer_counts.num_all_scorers,
                    reader.max_doc(),
                    num_docs,
                ) {
                    None => {
                        // No MUST constraint: SHOULD alone determines matching.
                        should_scorer
                    }
                    Some(must_scorer) => {
                        // Has MUST constraint: intersect MUST with SHOULD.
                        let should_boxed =
                            into_box_scorer(should_scorer, &score_combiner_fn, num_docs);
                        SpecializedScorer::Other(intersect_scorers(
                            vec![must_scorer, should_boxed],
                            num_docs,
                        ))
                    }
                }
            }
        };
        if exclude_scorers.is_empty() {
            return Ok(include_scorer);
        }

        // MUST_NOT scorers are left: wrap the included documents in an `Exclude`.
        let include_scorer_boxed = into_box_scorer(include_scorer, &score_combiner_fn, num_docs);
        let scorer: Box<dyn Scorer> = if exclude_scorers.len() == 1 {
            let exclude_scorer = exclude_scorers.pop().unwrap();
            match exclude_scorer.downcast::<TermScorer>() {
                // Cast to TermScorer succeeded
                Ok(exclude_scorer) => Box::new(Exclude::new(include_scorer_boxed, *exclude_scorer)),
                // We get back the original Box<dyn Scorer>
                Err(exclude_scorer) => Box::new(Exclude::new(include_scorer_boxed, exclude_scorer)),
            }
        } else {
            Box::new(Exclude::new(include_scorer_boxed, exclude_scorers))
        };
        Ok(SpecializedScorer::Other(scorer))
    }
}

/// Number of `AllScorer`s and `EmptyScorer`s removed from a list of scorers by
/// `remove_and_count_all_and_empty_scorers`.
#[derive(Default, Copy, Clone, Debug)]
struct AllAndEmptyScorerCounts {
    /// Number of removed `AllScorer`s.
    num_all_scorers: usize,
    /// Number of removed `EmptyScorer`s.
    num_empty_scorers: usize,
}

fn remove_and_count_all_and_empty_scorers(
    scorers: &mut Vec<Box<dyn Scorer>>,
) -> AllAndEmptyScorerCounts {
    let mut counts = AllAndEmptyScorerCounts::default();
    scorers.retain(|scorer| {
        if scorer.is::<AllScorer>() {
            counts.num_all_scorers += 1;
            false
        } else if scorer.is::<EmptyScorer>() {
            counts.num_empty_scorers += 1;
            false
        } else {
            true
        }
    });
    counts
}

impl<TScoreCombiner: ScoreCombiner + Sync> Weight for BooleanWeight<TScoreCombiner> {
    /// Builds the scorer of this weight for the segment behind `reader`.
    ///
    /// - No clause, or a single `MustNot` clause: an `EmptyScorer`.
    /// - A single `Must` or `Should` clause: the scorer of that clause.
    /// - Otherwise: the result of `complex_scorer`, built with a `DoNothingCombiner` when
    ///   scoring is disabled.
    fn scorer(&self, reader: &SegmentReader, boost: Score) -> crate::Result<Box<dyn Scorer>> {
        let num_docs = reader.num_docs();
        if self.weights.is_empty() {
            Ok(Box::new(EmptyScorer))
        } else if self.weights.len() == 1 {
            // NOTE(review): this shortcut does not look at `minimum_number_should_match`,
            // whereas `complex_scorer` (used by the `for_each*` methods) does — confirm
            // that the difference is intended.
            let (occur, weight) = &self.weights[0];
            if *occur == Occur::MustNot {
                Ok(Box::new(EmptyScorer))
            } else {
                weight.scorer(reader, boost)
            }
        } else if self.scoring_enabled {
            self.complex_scorer(reader, boost, &self.score_combiner_fn)
                .map(|specialized_scorer| {
                    into_box_scorer(specialized_scorer, &self.score_combiner_fn, num_docs)
                })
        } else {
            self.complex_scorer(reader, boost, DoNothingCombiner::default)
                .map(|specialized_scorer| {
                    into_box_scorer(specialized_scorer, DoNothingCombiner::default, num_docs)
                })
        }
    }

    /// Explains the score of `doc`.
    ///
    /// Returns a `does_not_match` error if the scorer does not match `doc`. When scoring is
    /// disabled, a constant explanation is returned. Otherwise the explanation carries the
    /// score of the document and, as details, the explanations of the `Must` and `Should`
    /// clauses that can explain it; clauses failing to explain `doc` are skipped.
    fn explain(&self, reader: &SegmentReader, doc: DocId) -> crate::Result<Explanation> {
        let mut scorer = self.scorer(reader, 1.0)?;
        if scorer.seek(doc) != doc {
            return Err(does_not_match(doc));
        }
        if !self.scoring_enabled {
            return Ok(Explanation::new("BooleanQuery with no scoring", 1.0));
        }

        let mut explanation = Explanation::new("BooleanClause. sum of ...", scorer.score());
        for (occur, subweight) in &self.weights {
            if !is_include_occur(*occur) {
                continue;
            }
            if let Ok(child_explanation) = subweight.explain(reader, doc) {
                explanation.add_detail(child_explanation);
            }
        }
        Ok(explanation)
    }

    /// Calls `callback` with the `(doc, score)` of every matching document of the segment.
    fn for_each(
        &self,
        reader: &SegmentReader,
        callback: &mut dyn FnMut(DocId, Score),
    ) -> crate::Result<()> {
        let scorer = self.complex_scorer(reader, 1.0, &self.score_combiner_fn)?;
        match scorer {
            SpecializedScorer::TermUnion(term_scorers) => {
                let mut union_scorer = BufferedUnionScorer::build(
                    term_scorers,
                    &self.score_combiner_fn,
                    reader.num_docs(),
                );
                for_each_scorer(&mut union_scorer, callback);
            }
            SpecializedScorer::Other(mut scorer) => {
                for_each_scorer(scorer.as_mut(), callback);
            }
        }
        Ok(())
    }

    /// Calls `callback` with buffers of matching doc ids, without computing any score.
    fn for_each_no_score(
        &self,
        reader: &SegmentReader,
        callback: &mut dyn FnMut(&[DocId]),
    ) -> crate::Result<()> {
        let scorer = self.complex_scorer(reader, 1.0, || DoNothingCombiner)?;
        let mut buffer = [0u32; COLLECT_BLOCK_BUFFER_LEN];

        match scorer {
            SpecializedScorer::TermUnion(term_scorers) => {
                // Scores are never read on this path, so the union uses the same no-op
                // combiner as the rest of the scorer tree rather than the scoring combiner.
                let mut union_scorer = BufferedUnionScorer::build(
                    term_scorers,
                    DoNothingCombiner::default,
                    reader.num_docs(),
                );
                for_each_docset_buffered(&mut union_scorer, &mut buffer, callback);
            }
            SpecializedScorer::Other(mut scorer) => {
                for_each_docset_buffered(scorer.as_mut(), &mut buffer, callback);
            }
        }
        Ok(())
    }

    /// Calls `callback` with all of the `(doc, score)` for which score
    /// is exceeding a given threshold.
    ///
    /// This method is useful for the TopDocs collector.
    /// For all docsets, the blanket implementation has the benefit
    /// of prefiltering (doc, score) pairs, avoiding the
    /// virtual dispatch cost.
    ///
    /// More importantly, it makes it possible for scorers to implement
    /// important optimization (e.g. BlockWAND for union).
    fn for_each_pruning(
        &self,
        threshold: Score,
        reader: &SegmentReader,
        callback: &mut dyn FnMut(DocId, Score) -> Score,
    ) -> crate::Result<()> {
        let scorer = self.complex_scorer(reader, 1.0, &self.score_combiner_fn)?;
        match scorer {
            SpecializedScorer::TermUnion(term_scorers) => {
                // Unions of term scorers reading frequencies go through block wand.
                super::block_wand(term_scorers, threshold, callback);
            }
            SpecializedScorer::Other(mut scorer) => {
                for_each_pruning_scorer(scorer.as_mut(), threshold, callback);
            }
        }
        Ok(())
    }
}

/// Returns `true` for the occurrences that include documents (`Must` and `Should`)
/// and `false` for the excluding one (`MustNot`).
fn is_include_occur(occur: Occur) -> bool {
    match occur {
        Occur::MustNot => false,
        Occur::Should => true,
        Occur::Must => true,
    }
}


================================================
FILE: src/query/boolean_query/mod.rs
================================================
mod block_wand;
mod boolean_query;
mod boolean_weight;

pub(crate) use self::block_wand::{block_wand, block_wand_single_scorer};
pub use self::boolean_query::BooleanQuery;
pub use self::boolean_weight::BooleanWeight;

#[cfg(test)]
mod tests {

    use std::ops::Bound;

    use super::*;
    use crate::collector::tests::TEST_COLLECTOR_WITH_SCORE;
    use crate::collector::{Count, TopDocs};
    use crate::query::term_query::TermScorer;
    use crate::query::{
        AllScorer, EmptyScorer, EnableScoring, Intersection, Occur, Query, QueryParser, RangeQuery,
        RequiredOptionalScorer, Scorer, SumCombiner, TermQuery,
    };
    use crate::schema::*;
    use crate::{assert_nearly_equals, DocAddress, DocId, Index, IndexWriter, Score};

    /// Builds an in-RAM index with a single `text` field and five committed documents,
    /// returning the index together with the field handle.
    ///
    /// Documents are added in this order: "a b c", "a c", "b c", "a b c d", "d".
    fn aux_test_helper() -> crate::Result<(Index, Field)> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        {
            // The writer only lives for this scope: add the documents, then commit.
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            for text in ["a b c", "a c", "b c", "a b c d", "d"] {
                index_writer.add_document(doc!(text_field => text))?;
            }
            index_writer.commit()?;
        }
        Ok((index, text_field))
    }

    /// A disjunction mixing a nested conjunction with a plain term: `(+a +b) d`
    /// is expected to match three documents of the helper index.
    #[test]
    pub fn test_boolean_non_all_term_disjunction() -> crate::Result<()> {
        let (index, text_field) = aux_test_helper()?;
        let searcher = index.reader()?.searcher();
        let parser = QueryParser::for_index(&index, vec![text_field]);
        let parsed_query = parser.parse_query("(+a +b) d")?;
        let num_hits = parsed_query.count(&searcher)?;
        assert_eq!(num_hits, 3);
        Ok(())
    }

    /// A query made of a single required term (`+a`) should produce a plain `TermScorer`.
    #[test]
    pub fn test_boolean_single_must_clause() -> crate::Result<()> {
        let (index, text_field) = aux_test_helper()?;
        let searcher = index.reader()?.searcher();
        let parser = QueryParser::for_index(&index, vec![text_field]);
        let parsed_query = parser.parse_query("+a")?;
        let scoring = EnableScoring::enabled_from_searcher(&searcher);
        let weight = parsed_query.weight(scoring)?;
        let segment_scorer = weight.scorer(searcher.segment_reader(0u32), 1.0)?;
        assert!(segment_scorer.is::<TermScorer>());
        Ok(())
    }

    /// Checks which intersection type is built: only-term conjunctions get
    /// `Intersection<TermScorer>`, while a conjunction containing a nested
    /// sub-query falls back to `Intersection<Box<dyn Scorer>>`.
    #[test]
    pub fn test_boolean_termonly_intersection() -> crate::Result<()> {
        let (index, text_field) = aux_test_helper()?;
        let query_parser = QueryParser::for_index(&index, vec![text_field]);
        let searcher = index.reader()?.searcher();

        // Parses `query_str` and builds its scorer (scoring enabled) on segment 0.
        let build_scorer = |query_str: &str| -> crate::Result<Box<dyn Scorer>> {
            let query = query_parser.parse_query(query_str)?;
            let weight = query.weight(EnableScoring::enabled_from_searcher(&searcher))?;
            weight.scorer(searcher.segment_reader(0u32), 1.0)
        };

        let term_only = build_scorer("+a +b +c")?;
        assert!(term_only.is::<Intersection<TermScorer>>());

        let with_nested_union = build_scorer("+a +(b c)")?;
        assert!(with_nested_union.is::<Intersection<Box<dyn Scorer>>>());
        Ok(())
    }

    /// For `+a b`, a `RequiredOptionalScorer` is expected when scoring is enabled,
    /// and a bare `TermScorer` when scoring is disabled.
    #[test]
    pub fn test_boolean_reqopt() -> crate::Result<()> {
        let (index, text_field) = aux_test_helper()?;
        let query_parser = QueryParser::for_index(&index, vec![text_field]);
        let searcher = index.reader()?.searcher();
        let query = query_parser.parse_query("+a b")?;
        let segment_reader = searcher.segment_reader(0u32);

        // Scoring enabled.
        let scoring_weight = query.weight(EnableScoring::enabled_from_searcher(&searcher))?;
        let scoring_scorer = scoring_weight.scorer(segment_reader, 1.0)?;
        let is_required_optional = scoring_scorer
            .is::<RequiredOptionalScorer<Box<dyn Scorer>, Box<dyn Scorer>, SumCombiner>>();
        assert!(is_required_optional);

        // Scoring disabled.
        let plain_weight = query.weight(EnableScoring::disabled_from_schema(searcher.schema()))?;
        let plain_scorer = plain_weight.scorer(segment_reader, 1.0)?;
        assert!(plain_scorer.is::<TermScorer>());
        Ok(())
    }

    /// Exercises the basic `Must` / `Should` / `MustNot` combinations against the
    /// helper index and checks the exact list of matching doc ids.
    #[test]
    pub fn test_boolean_query() -> crate::Result<()> {
        let (index, text_field) = aux_test_helper()?;

        let term = |text: &str| -> Box<dyn Query> {
            Box::new(TermQuery::new(
                Term::from_field_text(text_field, text),
                IndexRecordOption::Basic,
            ))
        };

        let reader = index.reader()?;

        // Runs a boolean query made of `clauses` and returns the collected doc ids.
        let matching_docs = |clauses: Vec<(Occur, Box<dyn Query>)>| -> Vec<DocId> {
            let boolean_query = BooleanQuery::new(clauses);
            reader
                .searcher()
                .search(&boolean_query, &TEST_COLLECTOR_WITH_SCORE)
                .unwrap()
                .docs()
                .iter()
                .map(|doc_address| doc_address.doc_id)
                .collect()
        };

        assert_eq!(matching_docs(vec![(Occur::Must, term("a"))]), vec![0, 1, 3]);
        assert_eq!(
            matching_docs(vec![(Occur::Should, term("a"))]),
            vec![0, 1, 3]
        );
        assert_eq!(
            matching_docs(vec![(Occur::Should, term("a")), (Occur::Should, term("b"))]),
            vec![0, 1, 2, 3]
        );
        assert_eq!(
            matching_docs(vec![(Occur::Must, term("a")), (Occur::Should, term("b"))]),
            vec![0, 1, 3]
        );
        assert_eq!(
            matching_docs(vec![
                (Occur::Must, term("a")),
                (Occur::Should, term("b")),
                (Occur::MustNot, term("d")),
            ]),
            vec![0, 1]
        );
        // A lone exclusion clause matches nothing.
        assert_eq!(
            matching_docs(vec![(Occur::MustNot, term("d"))]),
            Vec::<DocId>::new()
        );
        Ok(())
    }

    /// Two `MustNot` clauses must filter documents out without altering the score
    /// of the documents that remain.
    #[test]
    pub fn test_boolean_query_two_excluded() -> crate::Result<()> {
        let (index, text_field) = aux_test_helper()?;

        let term = |text: &str| -> Box<dyn Query> {
            Box::new(TermQuery::new(
                Term::from_field_text(text_field, text),
                IndexRecordOption::Basic,
            ))
        };

        let reader = index.reader()?;

        let top_docs = |query: &dyn Query| {
            reader
                .searcher()
                .search(query, &TopDocs::with_limit(3).order_by_score())
                .unwrap()
        };

        // Reference run without exclusion: the score of doc 4 should not be
        // influenced by exclusion.
        let score_doc_4: Score = {
            let without_exclusion = BooleanQuery::new(vec![(Occur::Must, term("d"))]);
            let hits = top_docs(&without_exclusion);
            assert_eq!(hits.len(), 2);
            let (best_score, best_doc) = hits[0];
            assert_eq!(best_doc, DocAddress::new(0, 4));
            // Only the address of doc 3 is checked; its score is ignored.
            assert_eq!(hits[1].1, DocAddress::new(0, 3));
            best_score
        };

        let with_two_exclusions = BooleanQuery::new(vec![
            (Occur::Must, term("d")),
            (Occur::MustNot, term("a")),
            (Occur::MustNot, term("b")),
        ]);
        let hits = top_docs(&with_two_exclusions);
        assert_eq!(hits.len(), 1);
        let (best_score, best_doc) = hits[0];
        assert_eq!(best_doc, DocAddress::new(0, 4));
        assert_eq!(best_score, score_doc_4);
        Ok(())
    }

    /// Checks that the boost passed to `Weight::scorer` scales the score of a
    /// two-clause `Should` query: the score of doc 0 with boost `2.0` is twice
    /// the score obtained with boost `1.0`.
    #[test]
    pub fn test_boolean_query_with_weight() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            index_writer.add_document(doc!(text_field => "a b c"))?;
            index_writer.add_document(doc!(text_field => "a c"))?;
            index_writer.add_document(doc!(text_field => "b c"))?;
            index_writer.commit()?;
        }
        let term_a: Box<dyn Query> = Box::new(TermQuery::new(
            Term::from_field_text(text_field, "a"),
            IndexRecordOption::WithFreqs,
        ));
        let term_b: Box<dyn Query> = Box::new(TermQuery::new(
            Term::from_field_text(text_field, "b"),
            IndexRecordOption::WithFreqs,
        ));
        // The test returns a `Result`, so failures are propagated with `?`
        // instead of panicking through `unwrap()`.
        let reader = index.reader()?;
        let searcher = reader.searcher();
        let boolean_query =
            BooleanQuery::new(vec![(Occur::Should, term_a), (Occur::Should, term_b)]);
        let boolean_weight =
            boolean_query.weight(EnableScoring::enabled_from_searcher(&searcher))?;
        {
            // Boost 1.0: baseline score for doc 0.
            let mut boolean_scorer = boolean_weight.scorer(searcher.segment_reader(0u32), 1.0)?;
            assert_eq!(boolean_scorer.doc(), 0u32);
            assert_nearly_equals!(boolean_scorer.score(), 0.84163445);
        }
        {
            // Boost 2.0: the score of doc 0 doubles.
            let mut boolean_scorer = boolean_weight.scorer(searcher.segment_reader(0u32), 2.0)?;
            assert_eq!(boolean_scorer.doc(), 0u32);
            assert_nearly_equals!(boolean_scorer.score(), 1.6832689);
        }
        Ok(())
    }

    /// Pins the scores produced by the intersection `+a +b` on the helper index.
    #[test]
    pub fn test_intersection_score() -> crate::Result<()> {
        let (index, text_field) = aux_test_helper()?;

        let term = |text: &str| -> Box<dyn Query> {
            Box::new(TermQuery::new(
                Term::from_field_text(text_field, text),
                IndexRecordOption::Basic,
            ))
        };
        let reader = index.reader()?;

        let a_and_b = BooleanQuery::new(vec![(Occur::Must, term("a")), (Occur::Must, term("b"))]);
        let scores = reader
            .searcher()
            .search(&a_and_b, &TEST_COLLECTOR_WITH_SCORE)
            .unwrap()
            .scores()
            .to_vec();

        assert_nearly_equals!(scores[0], 0.977973);
        assert_nearly_equals!(scores[1], 0.84699446);
        Ok(())
    }

    /// The explanation of a two-clause `Should` query on the first document is
    /// expected to carry a value of `ln(2)`.
    #[test]
    pub fn test_explain() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text = schema_builder.add_text_field("text", STRING);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        for value in ["a", "b"] {
            index_writer.add_document(doc!(text=>value))?;
        }
        index_writer.commit()?;
        let searcher = index.reader()?.searcher();

        let basic_term = |value: &str| -> Box<dyn Query> {
            Box::new(TermQuery::new(
                Term::from_field_text(text, value),
                IndexRecordOption::Basic,
            ))
        };
        let a_or_b = BooleanQuery::from(vec![
            (Occur::Should, basic_term("a")),
            (Occur::Should, basic_term("b")),
        ]);
        let explanation = a_or_b.explain(&searcher, DocAddress::new(0, 0u32))?;
        assert_nearly_equals!(explanation.value(), std::f32::consts::LN_2);
        Ok(())
    }

    /// With scoring disabled, checks the concrete scorer type chosen for several
    /// combinations of a term matching every document ("hello"), a term matching
    /// some documents ("happy") and a term matching none ("tax").
    #[test]
    pub fn test_boolean_weight_optimization() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        for text in ["hello", "hello happy"] {
            index_writer.add_document(doc!(text_field=>text))?;
        }
        index_writer.commit()?;
        let searcher = index.reader()?.searcher();

        let basic_term = |text: &str| -> Box<dyn Query> {
            Box::new(TermQuery::new(
                Term::from_field_text(text_field, text),
                IndexRecordOption::Basic,
            ))
        };
        let term_match_all = basic_term("hello");
        let term_match_some = basic_term("happy");
        let term_match_none = basic_term("tax");

        // Builds the scorer of a boolean query over `clauses` on segment 0,
        // with scoring disabled.
        let unscored_scorer =
            |clauses: Vec<(Occur, Box<dyn Query>)>| -> crate::Result<Box<dyn Scorer>> {
                let query = BooleanQuery::from(clauses);
                let weight = query.weight(EnableScoring::disabled_from_searcher(&searcher))?;
                weight.scorer(searcher.segment_reader(0u32), 1.0f32)
            };

        let all_and_some = unscored_scorer(vec![
            (Occur::Must, term_match_all.box_clone()),
            (Occur::Must, term_match_some.box_clone()),
        ])?;
        assert!(all_and_some.is::<TermScorer>());

        let all_and_some_and_none = unscored_scorer(vec![
            (Occur::Must, term_match_all.box_clone()),
            (Occur::Must, term_match_some.box_clone()),
            (Occur::Must, term_match_none.box_clone()),
        ])?;
        assert!(all_and_some_and_none.is::<EmptyScorer>());

        let all_or_none = unscored_scorer(vec![
            (Occur::Should, term_match_all.box_clone()),
            (Occur::Should, term_match_none.box_clone()),
        ])?;
        assert!(all_or_none.is::<AllScorer>());

        let some_or_none = unscored_scorer(vec![
            (Occur::Should, term_match_some.box_clone()),
            (Occur::Should, term_match_none.box_clone()),
        ])?;
        assert!(some_or_none.is::<TermScorer>());
        Ok(())
    }

    /// `minimum_number_should_match` must keep counting all-matching clauses.
    ///
    /// Five `Should` clauses are used: two range queries matching every document
    /// and three copies of a term query matching only "apple". Requiring four
    /// matches must therefore select exactly the "apple" document.
    #[test]
    pub fn test_min_should_match_with_all_query() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let num_options = NumericOptions::default().set_fast().set_indexed();
        let num_field = schema_builder.add_i64_field("num", num_options);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests()?;

        for (text, num) in [("apple", 10i64), ("banana", 20i64)] {
            index_writer.add_document(doc!(text_field => text, num_field => num))?;
        }
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();

        let effective_all_match_query: Box<dyn Query> = Box::new(RangeQuery::new(
            Bound::Excluded(Term::from_field_i64(num_field, 0)),
            Bound::Unbounded,
        ));
        let apple_query: Box<dyn Query> = Box::new(TermQuery::new(
            Term::from_field_text(text_field, "apple"),
            IndexRecordOption::Basic,
        ));

        // In some previous version, the 2 all-matching clauses were removed while
        // still requiring *4* matches out of the 3 remaining term queries, which
        // matched nothing.
        let clauses: Vec<(Occur, Box<dyn Query>)> = vec![
            (Occur::Should, effective_all_match_query.box_clone()),
            (Occur::Should, effective_all_match_query.box_clone()),
            (Occur::Should, apple_query.box_clone()),
            (Occur::Should, apple_query.box_clone()),
            (Occur::Should, apple_query.box_clone()),
        ];
        let mut bool_query = BooleanQuery::new(clauses);
        bool_query.set_minimum_number_should_match(4);
        let num_hits = searcher.search(&bool_query, &Count)?;
        assert_eq!(num_hits, 1);

        Ok(())
    }

    // =========================================================================
    // AllScorer Preservation Regression Tests
    // =========================================================================
    //
    // These tests verify the fix for a bug where AllScorer instances (produced by
    // queries matching all documents, such as range queries covering all values)
    // were incorrectly removed from Boolean query processing, causing documents
    // to be unexpectedly excluded from results.
    //
    // The bug manifested in several scenarios:
    // 1. SHOULD + SHOULD where one clause is AllScorer
    // 2. MUST (AllScorer) + SHOULD
    // 3. Range queries in Boolean clauses when all documents match the range

    /// Regression test: a SHOULD clause producing an AllScorer, combined with
    /// another SHOULD clause.
    ///
    /// When one SHOULD clause matches every document (e.g. a range query covering
    /// all values), the Boolean query as a whole must still match every document,
    /// whatever the order of the clauses.
    ///
    /// Bug before fix: the AllScorer was dropped during optimization, so only the
    /// remaining SHOULD clauses were evaluated and documents were wrongly excluded.
    #[test]
    pub fn test_should_with_all_scorer_regression() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let num_options = NumericOptions::default().set_fast().set_indexed();
        let num_field = schema_builder.add_i64_field("num", num_options);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests()?;

        // All docs have num > 0, so the range query below will return AllScorer.
        let rows = [
            ("hello", 10i64),
            ("world", 20i64),
            ("hello world", 30i64),
            ("foo", 40i64),
            ("bar", 50i64),
            ("baz", 60i64),
        ];
        for (text, num) in rows {
            index_writer.add_document(doc!(text_field => text, num_field => num))?;
        }
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();

        // Range query matching all docs (returns AllScorer).
        let range_over_all: Box<dyn Query> = Box::new(RangeQuery::new(
            Bound::Excluded(Term::from_field_i64(num_field, 0)),
            Bound::Unbounded,
        ));
        let hello_query: Box<dyn Query> = Box::new(TermQuery::new(
            Term::from_field_text(text_field, "hello"),
            IndexRecordOption::Basic,
        ));

        // Precondition: the range alone matches all 6 docs.
        let range_only_count = searcher.search(range_over_all.as_ref(), &Count)?;
        assert_eq!(range_only_count, 6);

        // RangeQuery(all) OR TermQuery should match all 6 docs.
        let range_then_term = BooleanQuery::new(vec![
            (Occur::Should, range_over_all.box_clone()),
            (Occur::Should, hello_query.box_clone()),
        ]);
        let count = searcher.search(&range_then_term, &Count)?;
        assert_eq!(count, 6, "SHOULD with AllScorer should match all docs");

        // Same clauses, reversed: the order should not matter.
        let term_then_range = BooleanQuery::new(vec![
            (Occur::Should, hello_query.box_clone()),
            (Occur::Should, range_over_all.box_clone()),
        ]);
        let count_reversed = searcher.search(&term_then_range, &Count)?;
        assert_eq!(
            count_reversed, 6,
            "Order of SHOULD clauses should not matter"
        );

        Ok(())
    }

    /// Regression test: a MUST clause producing an AllScorer, combined with a
    /// SHOULD clause.
    ///
    /// When the MUST clause matches every document, every document satisfies the
    /// MUST constraint; the SHOULD clause should then only affect scoring, not
    /// filtering.
    ///
    /// Bug before fix: the AllScorer was removed, leaving an empty must_scorers
    /// vector. intersect_scorers([]) incorrectly returned EmptyScorer, matching
    /// 0 documents.
    #[test]
    pub fn test_must_all_with_should_regression() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let num_options = NumericOptions::default().set_fast().set_indexed();
        let num_field = schema_builder.add_i64_field("num", num_options);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests()?;

        // All docs have num > 0, so the range query below will return AllScorer.
        let rows = [
            ("apple", 10i64),
            ("banana", 20i64),
            ("cherry", 30i64),
            ("date", 40i64),
        ];
        for (text, num) in rows {
            index_writer.add_document(doc!(text_field => text, num_field => num))?;
        }
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();

        // Range query matching all docs (returns AllScorer).
        let range_over_all: Box<dyn Query> = Box::new(RangeQuery::new(
            Bound::Excluded(Term::from_field_i64(num_field, 0)),
            Bound::Unbounded,
        ));
        let apple_query: Box<dyn Query> = Box::new(TermQuery::new(
            Term::from_field_text(text_field, "apple"),
            IndexRecordOption::Basic,
        ));

        // Precondition: the range alone matches all 4 docs.
        let range_only_count = searcher.search(range_over_all.as_ref(), &Count)?;
        assert_eq!(range_only_count, 4);

        // MUST(range matching all) AND SHOULD(term) should match all 4 docs.
        let must_and_should = BooleanQuery::new(vec![
            (Occur::Must, range_over_all.box_clone()),
            (Occur::Should, apple_query.box_clone()),
        ]);
        let count = searcher.search(&must_and_should, &Count)?;
        assert_eq!(count, 4, "MUST AllScorer + SHOULD should match all docs");

        Ok(())
    }

    /// Regression test: range queries inside Boolean clauses when every document
    /// falls within the range.
    ///
    /// Range queries can return AllScorer as an optimization when all indexed
    /// values are within the range. This test makes sure such queries behave
    /// correctly in Boolean combinations.
    ///
    /// This is the most common real-world manifestation of the bug, occurring in
    /// queries like: (age > 50 OR name = 'Alice') AND status = 'active'
    /// when all documents have age > 50.
    #[test]
    pub fn test_range_query_all_match_in_boolean() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let name_field = schema_builder.add_text_field("name", TEXT);
        let age_options = NumericOptions::default().set_fast().set_indexed();
        let age_field = schema_builder.add_i64_field("age", age_options);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests()?;

        // All documents have age > 50, so the range query will return AllScorer.
        let people = [
            ("alice", 55_i64),
            ("bob", 60_i64),
            ("charlie", 70_i64),
            ("diana", 80_i64),
        ];
        for (name, age) in people {
            index_writer.add_document(doc!(name_field => name, age_field => age))?;
        }
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();

        let older_than_50: Box<dyn Query> = Box::new(RangeQuery::new(
            Bound::Excluded(Term::from_field_i64(age_field, 50)),
            Bound::Unbounded,
        ));
        let named_alice: Box<dyn Query> = Box::new(TermQuery::new(
            Term::from_field_text(name_field, "alice"),
            IndexRecordOption::Basic,
        ));

        // Preconditions: the range matches everyone, the term matches one person.
        assert_eq!(searcher.search(older_than_50.as_ref(), &Count)?, 4);
        assert_eq!(searcher.search(named_alice.as_ref(), &Count)?, 1);

        // SHOULD(range) OR SHOULD(term): range matches all, so result is 4.
        let should_query = BooleanQuery::new(vec![
            (Occur::Should, older_than_50.box_clone()),
            (Occur::Should, named_alice.box_clone()),
        ]);
        let should_count = searcher.search(&should_query, &Count)?;
        assert_eq!(should_count, 4, "SHOULD range OR term should match all");

        // MUST(range) AND SHOULD(term): range matches all, term is optional.
        let must_should_query = BooleanQuery::new(vec![
            (Occur::Must, older_than_50.box_clone()),
            (Occur::Should, named_alice.box_clone()),
        ]);
        let must_should_count = searcher.search(&must_should_query, &Count)?;
        assert_eq!(
            must_should_count, 4,
            "MUST range + SHOULD term should match all"
        );

        Ok(())
    }

    /// Tests several AllScorer instances spread over different clause types.
    ///
    /// Checks that results stay correct when all-matching queries show up in more
    /// than one position of the same Boolean query.
    #[test]
    pub fn test_multiple_all_scorers() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let num_options = NumericOptions::default().set_fast().set_indexed();
        let num_field = schema_builder.add_i64_field("num", num_options);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests()?;

        // All docs have num > 0, so the range queries below will return AllScorer.
        for (text, num) in [("doc1", 10i64), ("doc2", 20i64), ("doc3", 30i64)] {
            index_writer.add_document(doc!(text_field => text, num_field => num))?;
        }
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();

        // Range query `num > lower_bound`; both bounds used below are under every
        // indexed value, so each query matches all docs (returns AllScorer).
        let greater_than = |lower_bound: i64| -> Box<dyn Query> {
            Box::new(RangeQuery::new(
                Bound::Excluded(Term::from_field_i64(num_field, lower_bound)),
                Bound::Unbounded,
            ))
        };
        let all_query1 = greater_than(0);
        let all_query2 = greater_than(5);
        let doc1_query: Box<dyn Query> = Box::new(TermQuery::new(
            Term::from_field_text(text_field, "doc1"),
            IndexRecordOption::Basic,
        ));

        // Multiple AllScorers in SHOULD.
        let multi_all_should = BooleanQuery::new(vec![
            (Occur::Should, all_query1.box_clone()),
            (Occur::Should, all_query2.box_clone()),
            (Occur::Should, doc1_query.box_clone()),
        ]);
        let multi_all_should_count = searcher.search(&multi_all_should, &Count)?;
        assert_eq!(multi_all_should_count, 3, "Multiple AllScorers in SHOULD");

        // AllScorer in both MUST and SHOULD.
        let all_must_and_should = BooleanQuery::new(vec![
            (Occur::Must, all_query1.box_clone()),
            (Occur::Should, all_query2.box_clone()),
        ]);
        let all_must_and_should_count = searcher.search(&all_must_and_should, &Count)?;
        assert_eq!(
            all_must_and_should_count, 3,
            "AllScorer in both MUST and SHOULD"
        );

        Ok(())
    }
}

/// A proptest which generates arbitrary permutations of a simple boolean AST, and then matches
/// the result against an index which contains all permutations of documents with N fields.
#[cfg(test)]
mod proptest_boolean_query {
    use std::collections::{BTreeMap, HashSet};
    use std::ops::{Bound, Range};

    use proptest::collection::vec;
    use proptest::prelude::*;

    use crate::collector::DocSetCollector;
    use crate::query::{AllQuery, BooleanQuery, Occur, Query, RangeQuery, TermQuery};
    use crate::schema::{Field, NumericOptions, OwnedValue, Schema, TEXT};
    use crate::{DocId, Index, Term};

    /// Minimal boolean query AST used both to build a real tantivy query (`to_query`) and
    /// to compute the expected matches directly from a doc id (`matches`).
    #[derive(Debug, Clone)]
    enum BooleanQueryAST {
        /// Matches all documents via AllQuery (wraps AllScorer in BoostScorer)
        All,
        /// Matches all documents via RangeQuery (returns bare AllScorer)
        /// This is the actual trigger for the AllScorer preservation bug
        RangeAll,
        /// Matches documents where the field has value "true"
        Leaf {
            /// Index into the list of text fields; also the bit of the doc id that decides
            /// whether the document carries the value.
            field_idx: usize,
        },
        /// Matches documents matched by at least one child (children become `Occur::Should`).
        Union(Vec<BooleanQueryAST>),
        /// Matches documents matched by every child (children become `Occur::Must`).
        Intersection(Vec<BooleanQueryAST>),
    }

    impl BooleanQueryAST {
        /// Reference oracle: tells whether the document `doc_id` is expected to match this AST,
        /// without going through the index.
        fn matches(&self, doc_id: DocId) -> bool {
            match self {
                Self::All | Self::RangeAll => true,
                Self::Leaf { field_idx } => Self::matches_field(doc_id, *field_idx),
                Self::Union(branches) => branches.iter().any(|branch| branch.matches(doc_id)),
                Self::Intersection(branches) => {
                    branches.iter().all(|branch| branch.matches(doc_id))
                }
            }
        }

        /// A document carries the value "true" in field `field_idx` iff bit `field_idx` of its
        /// doc id is set.
        fn matches_field(doc_id: DocId, field_idx: usize) -> bool {
            let shifted = (doc_id as usize) >> field_idx;
            shifted & 1 == 1
        }

        /// Translates the AST into the tantivy query under test.
        ///
        /// `fields` are the text fields addressed by `Leaf::field_idx`; `range_field` is the
        /// numeric field used by `RangeAll`.
        fn to_query(&self, fields: &[Field], range_field: Field) -> Box<dyn Query> {
            match self {
                Self::All => Box::new(AllQuery),
                Self::RangeAll => {
                    // Range query that matches all docs (all have value >= 0)
                    // This returns bare AllScorer, triggering the bug we fixed
                    let lower_bound = Bound::Included(Term::from_field_i64(range_field, 0));
                    Box::new(RangeQuery::new(lower_bound, Bound::Unbounded))
                }
                Self::Leaf { field_idx } => {
                    let term = Term::from_field_text(fields[*field_idx], "true");
                    Box::new(TermQuery::new(
                        term,
                        crate::schema::IndexRecordOption::Basic,
                    ))
                }
                Self::Union(branches) => {
                    let mut clauses = Vec::with_capacity(branches.len());
                    for branch in branches {
                        clauses.push((Occur::Should, branch.to_query(fields, range_field)));
                    }
                    Box::new(BooleanQuery::new(clauses))
                }
                Self::Intersection(branches) => {
                    let mut clauses = Vec::with_capacity(branches.len());
                    for branch in branches {
                        clauses.push((Occur::Must, branch.to_query(fields, range_field)));
                    }
                    Box::new(BooleanQuery::new(clauses))
                }
            }
        }
    }

    fn doc_ids(num_docs: usize, num_fields: usize) -> Range<DocId> {
        let permutations = 1 << num_fields;
        let copies = (num_docs as f32 / permutations as f32).ceil() as u32;
        0..(permutations * copies)
    }

    /// Builds an in-RAM index holding one document per id in `doc_ids(num_docs, num_fields)`.
    ///
    /// Text field `field_{i}` of a document holds "true" iff bit `i` of its doc id is set, and
    /// the numeric `range_field` holds the doc id itself. Returns the index, the text fields
    /// (in index order) and the range field.
    fn create_index_with_boolean_permutations(
        num_docs: usize,
        num_fields: usize,
    ) -> (Index, Vec<Field>, Field) {
        let mut builder = Schema::builder();
        let mut fields: Vec<Field> = Vec::with_capacity(num_fields);
        for i in 0..num_fields {
            fields.push(builder.add_text_field(&format!("field_{i}"), TEXT));
        }
        // Add a numeric field for RangeQuery tests - all docs have value = doc_id
        let range_options = NumericOptions::default().set_fast().set_indexed();
        let range_field = builder.add_i64_field("range_field", range_options);
        let index = Index::create_in_ram(builder.build());
        let mut writer = index.writer_for_tests().unwrap();

        for doc_id in doc_ids(num_docs, num_fields) {
            let mut doc: BTreeMap<_, OwnedValue> = BTreeMap::new();
            let set_fields = fields
                .iter()
                .enumerate()
                .filter(|&(field_idx, _)| (doc_id >> field_idx) & 1 == 1);
            for (_, &field) in set_fields {
                doc.insert(field, "true".into());
            }
            // All docs have non-negative values, so RangeQuery(>=0) matches all
            doc.insert(range_field, (doc_id as i64).into());
            writer.add_document(doc).unwrap();
        }
        writer.commit().unwrap();
        (index, fields, range_field)
    }

    fn arb_boolean_query_ast(num_fields: usize) -> impl Strategy<Value = BooleanQueryAST> {
        // Leaf strategies: term queries, AllQuery, and RangeQuery matching all docs
        let leaf = prop_oneof![
            (0..num_fields).prop_map(|field_idx| BooleanQueryAST::Leaf { field_idx }),
            Just(BooleanQueryAST::All),
            Just(BooleanQueryAST::RangeAll),
        ];
        leaf.prop_recursive(
            8,   // 8 levels of recursion
            256, // 256 nodes max
            10,  // 10 items per collection
            |inner| {
                prop_oneof![
                    vec(inner.clone(), 1..10).prop_map(BooleanQueryAST::Union),
                    vec(inner, 1..10).prop_map(BooleanQueryAST::Intersection),
                ]
            },
        )
    }

    /// Checks that, for arbitrary boolean ASTs, searching the index returns exactly the doc ids
    /// predicted by `BooleanQueryAST::matches`.
    #[test]
    fn proptest_boolean_query() {
        // In the presence of optimizations around buffering, it can take large numbers of
        // documents to uncover some issues.
        let num_fields = 8;
        let num_docs = 1 << num_fields;
        let (index, fields, range_field) =
            create_index_with_boolean_permutations(num_docs, num_fields);
        let searcher = index.reader().unwrap().searcher();
        proptest!(|(ast in arb_boolean_query_ast(num_fields))| {
            // Expected result, computed from the AST alone.
            let matching_docs: HashSet<DocId> = doc_ids(num_docs, num_fields)
                .filter(|&doc_id| ast.matches(doc_id as DocId))
                .collect();

            // Actual result, computed by running the query against the index.
            let query = ast.to_query(&fields, range_field);
            let result_docs: HashSet<DocId> = searcher
                .search(&*query, &DocSetCollector)
                .unwrap()
                .into_iter()
                .map(|doc_address| doc_address.doc_id)
                .collect();

            prop_assert_eq!(result_docs, matching_docs);
        });
    }
}


================================================
FILE: src/query/boost_query.rs
================================================
use std::fmt;

use crate::docset::{SeekDangerResult, COLLECT_BLOCK_BUFFER_LEN};
use crate::fastfield::AliveBitSet;
use crate::query::{EnableScoring, Explanation, Query, Scorer, Weight};
use crate::{DocId, DocSet, Score, SegmentReader, Term};

/// `BoostQuery` is a wrapper over a query used to boost its score.
///
/// The document set matched by the `BoostQuery` is strictly the same as the underlying query.
/// The score of each document is the score of the underlying query multiplied by the `boost`
/// factor.
pub struct BoostQuery {
    /// The wrapped query, which decides which documents match.
    query: Box<dyn Query>,
    /// Multiplicative factor applied to the wrapped query's scores.
    boost: Score,
}

impl BoostQuery {
    /// Wraps `query` so that its scores are multiplied by `boost`.
    pub fn new(query: Box<dyn Query>, boost: Score) -> BoostQuery {
        Self { query, boost }
    }
}

impl Clone for BoostQuery {
    /// Clones the wrapped query through `box_clone` and copies the boost factor.
    fn clone(&self) -> Self {
        let query = self.query.box_clone();
        let boost = self.boost;
        BoostQuery { query, boost }
    }
}

impl fmt::Debug for BoostQuery {
    /// Formats as `Boost(query=<inner debug>, boost=<factor>)`.
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let Self { query, boost } = self;
        write!(f, "Boost(query={:?}, boost={})", query, boost)
    }
}

impl Query for BoostQuery {
    /// Builds the weight of the wrapped query and, only when scoring is enabled, wraps it in a
    /// `BoostWeight`. Without scoring the boost is irrelevant, so the inner weight is returned
    /// as is.
    fn weight(&self, enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let inner_weight = self.query.weight(enable_scoring)?;
        if !enable_scoring.is_scoring_enabled() {
            return Ok(inner_weight);
        }
        Ok(Box::new(BoostWeight::new(inner_weight, self.boost)))
    }

    /// Forwards the term visitor to the wrapped query.
    fn query_terms<'a>(&'a self, visitor: &mut dyn FnMut(&'a Term, bool)) {
        self.query.query_terms(visitor);
    }
}

/// Weight associated with the `BoostQuery`.
pub struct BoostWeight {
    /// Weight of the wrapped query.
    weight: Box<dyn Weight>,
    /// Factor multiplied into the boost handed to the wrapped weight's scorer.
    boost: Score,
}

impl BoostWeight {
    /// Creates a new `BoostWeight` applying `boost` on top of `weight`.
    pub fn new(weight: Box<dyn Weight>, boost: Score) -> Self {
        Self { weight, boost }
    }
}

impl Weight for BoostWeight {
    /// Returns the wrapped weight's scorer, built with the incoming `boost` multiplied by this
    /// weight's own factor.
    fn scorer(&self, reader: &SegmentReader, boost: Score) -> crate::Result<Box<dyn Scorer>> {
        let combined_boost = boost * self.boost;
        self.weight.scorer(reader, combined_boost)
    }

    /// Explains the boosted score: the wrapped explanation's value times the boost, with the
    /// wrapped explanation attached as a detail.
    fn explain(&self, reader: &SegmentReader, doc: u32) -> crate::Result<Explanation> {
        let inner = self.weight.explain(reader, doc)?;
        let boosted_score = inner.value() * self.boost;
        let description = format!("Boost x{} of ...", self.boost);
        let mut explanation = Explanation::new_with_string(description, boosted_score);
        explanation.add_detail(inner);
        Ok(explanation)
    }

    /// Boosting does not change which documents match, so the count is the wrapped weight's.
    fn count(&self, reader: &SegmentReader) -> crate::Result<u32> {
        self.weight.count(reader)
    }
}

/// Scorer wrapper that yields the same documents as `underlying` and multiplies each of its
/// scores by `boost`.
pub(crate) struct BoostScorer<S: Scorer> {
    /// The wrapped scorer; all `DocSet` operations are delegated to it.
    underlying: S,
    /// Factor applied to every score returned by `underlying`.
    boost: Score,
}

impl<S: Scorer> BoostScorer<S> {
    /// Wraps `underlying`, scaling its scores by `boost`.
    pub fn new(underlying: S, boost: Score) -> BoostScorer<S> {
        Self { underlying, boost }
    }
}

// Boosting only affects scores, so every `DocSet` operation is forwarded unchanged to the
// wrapped scorer.
impl<S: Scorer> DocSet for BoostScorer<S> {
    fn advance(&mut self) -> DocId {
        self.underlying.advance()
    }

    fn seek(&mut self, target: DocId) -> DocId {
        self.underlying.seek(target)
    }
    fn seek_danger(&mut self, target: DocId) -> SeekDangerResult {
        self.underlying.seek_danger(target)
    }

    fn fill_buffer(&mut self, buffer: &mut [DocId; COLLECT_BLOCK_BUFFER_LEN]) -> usize {
        self.underlying.fill_buffer(buffer)
    }

    fn doc(&self) -> u32 {
        self.underlying.doc()
    }

    fn size_hint(&self) -> u32 {
        self.underlying.size_hint()
    }

    fn cost(&self) -> u64 {
        self.underlying.cost()
    }

    fn count(&mut self, alive_bitset: &AliveBitSet) -> u32 {
        self.underlying.count(alive_bitset)
    }

    fn count_including_deleted(&mut self) -> u32 {
        self.underlying.count_including_deleted()
    }
}

impl<S: Scorer> Scorer for BoostScorer<S> {
    /// Score of the current document: the wrapped scorer's score times the boost.
    #[inline]
    fn score(&mut self) -> Score {
        let base_score = self.underlying.score();
        base_score * self.boost
    }
}

#[cfg(test)]
mod tests {
    use super::BoostQuery;
    use crate::query::{AllQuery, Query};
    use crate::schema::Schema;
    use crate::{DocAddress, Index, IndexWriter, TantivyDocument};

    /// Explaining a boosted `AllQuery` reports the boosted value and nests the inner explanation.
    #[test]
    fn test_boost_query_explain() -> crate::Result<()> {
        let index = Index::create_in_ram(Schema::builder().build());
        let mut writer: IndexWriter = index.writer_for_tests()?;
        writer.add_document(TantivyDocument::new())?;
        writer.commit()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();

        let boosted = BoostQuery::new(Box::new(AllQuery), 0.2);
        let only_doc = DocAddress::new(0, 0u32);
        let explanation = boosted.explain(&searcher, only_doc).unwrap();

        let expected_json = "{\n  \"value\": 0.2,\n  \"description\": \"Boost x0.2 of ...\",\n  \"details\": [\n    {\n      \"value\": 1.0,\n      \"description\": \"AllQuery\"\n    }\n  ]\n}";
        assert_eq!(explanation.to_pretty_json(), expected_json);
        Ok(())
    }
}


================================================
FILE: src/query/const_score_query.rs
================================================
use std::fmt;

use crate::docset::COLLECT_BLOCK_BUFFER_LEN;
use crate::query::{EnableScoring, Explanation, Query, Scorer, Weight};
use crate::{DocId, DocSet, Score, SegmentReader, TantivyError, Term};

/// `ConstScoreQuery` is a wrapper over a query to provide a constant score.
/// It can avoid unnecessary score computation on the wrapped query.
///
/// The document set matched by the `ConstScoreQuery` is strictly the same as the underlying query.
/// The configured score is used for each document.
pub struct ConstScoreQuery {
    /// The wrapped query, which decides which documents match.
    query: Box<dyn Query>,
    /// The score assigned to every matching document.
    score: Score,
}

impl ConstScoreQuery {
    /// Wraps `query` so that every document it matches gets the score `score`.
    pub fn new(query: Box<dyn Query>, score: Score) -> ConstScoreQuery {
        Self { query, score }
    }
}

impl Clone for ConstScoreQuery {
    /// Clones the wrapped query through `box_clone` and copies the constant score.
    fn clone(&self) -> Self {
        let query = self.query.box_clone();
        let score = self.score;
        ConstScoreQuery { query, score }
    }
}

impl fmt::Debug for ConstScoreQuery {
    /// Formats as `Const(score=<score>, query=<inner debug>)`.
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let Self { query, score } = self;
        write!(f, "Const(score={}, query={:?})", score, query)
    }
}

impl Query for ConstScoreQuery {
    /// Builds the wrapped query's weight and, only when scoring is enabled, wraps it in a
    /// `ConstWeight`. Without scoring the inner weight is returned as is.
    fn weight(&self, enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let wrapped_weight = self.query.weight(enable_scoring)?;
        if !enable_scoring.is_scoring_enabled() {
            return Ok(wrapped_weight);
        }
        Ok(Box::new(ConstWeight::new(wrapped_weight, self.score)))
    }

    /// Forwards the term visitor to the wrapped query.
    fn query_terms<'a>(&'a self, visitor: &mut dyn FnMut(&'a Term, bool)) {
        self.query.query_terms(visitor)
    }
}

/// Weight of a `ConstScoreQuery`: delegates matching to the wrapped weight and assigns `score`
/// to the documents it matches.
struct ConstWeight {
    /// Weight of the wrapped query.
    weight: Box<dyn Weight>,
    /// Constant score given to matching documents (before applying the scorer's boost).
    score: Score,
}

impl ConstWeight {
    /// Creates a weight giving `score` to every document matched by `weight`.
    pub fn new(weight: Box<dyn Weight>, score: Score) -> Self {
        Self { weight, score }
    }
}

impl Weight for ConstWeight {
    /// Wraps the inner scorer in a `ConstScorer` whose score is `boost * self.score`.
    fn scorer(&self, reader: &SegmentReader, boost: Score) -> crate::Result<Box<dyn Scorer>> {
        let wrapped_scorer = self.weight.scorer(reader, boost)?;
        let constant_score = boost * self.score;
        Ok(Box::new(ConstScorer::new(wrapped_scorer, constant_score)))
    }

    /// Explains the constant score of `doc`, attaching the wrapped weight's explanation.
    ///
    /// Returns `TantivyError::InvalidArgument` when `doc` is not matched.
    fn explain(&self, reader: &SegmentReader, doc: u32) -> crate::Result<Explanation> {
        let mut scorer = self.scorer(reader, 1.0)?;
        let reached_doc = scorer.seek(doc);
        if reached_doc != doc {
            let message = format!("Document #({doc}) does not match");
            return Err(TantivyError::InvalidArgument(message));
        }
        let mut explanation = Explanation::new("Const", self.score);
        let inner_explanation = self.weight.explain(reader, doc)?;
        explanation.add_detail(inner_explanation);
        Ok(explanation)
    }

    /// The constant score does not change which documents match.
    fn count(&self, reader: &SegmentReader) -> crate::Result<u32> {
        self.weight.count(reader)
    }
}

/// Wraps a `DocSet` and turns it into a `Scorer` that returns the same constant score for
/// every document.
/// The `ConstScorer` is useful if you have a `DocSet` where
/// you need a scorer.
///
/// The constant score is fixed at construction: pass it to `ConstScorer::new`, or use the
/// `From<TDocSet>` conversion, which uses a score of `1.0`.
pub struct ConstScorer<TDocSet: DocSet> {
    /// The wrapped doc set; all `DocSet` operations are delegated to it.
    docset: TDocSet,
    /// The score returned for every document.
    score: Score,
}

impl<TDocSet: DocSet> ConstScorer<TDocSet> {
    /// Creates a new `ConstScorer` returning `score` for every document of `docset`.
    pub fn new(docset: TDocSet, score: Score) -> ConstScorer<TDocSet> {
        Self { docset, score }
    }
}

impl<TDocSet: DocSet> From<TDocSet> for ConstScorer<TDocSet> {
    /// Converts a doc set into a scorer with a constant score of `1.0`.
    fn from(docset: TDocSet) -> Self {
        let default_score = 1.0;
        Self::new(docset, default_score)
    }
}

// The constant score only affects `Scorer::score`, so every `DocSet` operation is forwarded
// unchanged to the wrapped doc set.
impl<TDocSet: DocSet> DocSet for ConstScorer<TDocSet> {
    fn advance(&mut self) -> DocId {
        self.docset.advance()
    }

    fn seek(&mut self, target: DocId) -> DocId {
        self.docset.seek(target)
    }

    fn fill_buffer(&mut self, buffer: &mut [DocId; COLLECT_BLOCK_BUFFER_LEN]) -> usize {
        self.docset.fill_buffer(buffer)
    }

    fn doc(&self) -> DocId {
        self.docset.doc()
    }

    fn size_hint(&self) -> u32 {
        self.docset.size_hint()
    }

    fn cost(&self) -> u64 {
        self.docset.cost()
    }

    // Forwarded (as `BoostScorer` does) so that a wrapped doc set providing its own counting
    // implementation is not bypassed by the trait's default.
    fn count_including_deleted(&mut self) -> u32 {
        self.docset.count_including_deleted()
    }
}

impl<TDocSet: DocSet + 'static> Scorer for ConstScorer<TDocSet> {
    /// Returns the constant score, regardless of the current document.
    #[inline]
    fn score(&mut self) -> Score {
        self.score
    }
}

#[cfg(test)]
mod tests {
    use super::ConstScoreQuery;
    use crate::query::{AllQuery, Query};
    use crate::schema::Schema;
    use crate::{DocAddress, Index, IndexWriter, TantivyDocument};

    /// Explaining a const-scored `AllQuery` reports the constant value and nests the inner
    /// explanation.
    #[test]
    fn test_const_score_query_explain() -> crate::Result<()> {
        let index = Index::create_in_ram(Schema::builder().build());
        let mut writer: IndexWriter = index.writer_for_tests()?;
        writer.add_document(TantivyDocument::new())?;
        writer.commit()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();

        let const_query = ConstScoreQuery::new(Box::new(AllQuery), 0.42);
        let only_doc = DocAddress::new(0, 0u32);
        let explanation = const_query.explain(&searcher, only_doc).unwrap();

        let expected_json = r#"{
  "value": 0.42,
  "description": "Const",
  "details": [
    {
      "value": 1.0,
      "description": "AllQuery"
    }
  ]
}"#;
        assert_eq!(explanation.to_pretty_json(), expected_json);
        Ok(())
    }
}


================================================
FILE: src/query/disjunction.rs
================================================
use std::cmp::Ordering;
use std::collections::BinaryHeap;

use crate::docset::SeekDangerResult;
use crate::query::score_combiner::DoNothingCombiner;
use crate::query::{ScoreCombiner, Scorer};
use crate::{DocId, DocSet, Score, TERMINATED};

/// `Disjunction` is responsible for merging `DocSet`s from multiple
/// sources. Specifically, it takes the union of two or more `DocSet`s
/// and then filters out the documents that appear in fewer of them than a
/// specified threshold.
pub struct Disjunction<TScorer, TScoreCombiner = DoNothingCombiner> {
    /// Underlying scorers, kept in a heap ordered by their current doc (smallest on top).
    chains: BinaryHeap<ScorerWrapper<TScorer>>,
    /// Minimum number of underlying scorers that must contain a doc for it to be emitted.
    minimum_matches_required: usize,
    /// Accumulates the scores of the scorers matching the current doc.
    score_combiner: TScoreCombiner,

    /// Doc the disjunction is currently positioned on (`TERMINATED` when exhausted).
    current_doc: DocId,
    /// Combined score cached by `advance`.
    current_score: Score,
}

/// A wrapper around a `Scorer` that caches the current `doc_id` and implements the `DocSet` trait.
/// The `Ord` trait and its family are implemented in reverse order on the cached doc id, so
/// that `std::collections::BinaryHeap<ScorerWrapper<T>>` (a max-heap) behaves as a min-heap
/// keyed by the current doc id.
struct ScorerWrapper<T> {
    /// The wrapped scorer.
    scorer: T,
    /// Doc id the wrapped scorer was last known to be positioned on.
    current_doc: DocId,
}

impl<T: Scorer> ScorerWrapper<T> {
    /// Wraps `scorer`, caching the doc it is currently positioned on.
    fn new(scorer: T) -> Self {
        Self {
            current_doc: scorer.doc(),
            scorer,
        }
    }
}

impl<T: Scorer> PartialEq for ScorerWrapper<T> {
    /// Two wrappers are equal when they are positioned on the same doc.
    fn eq(&self, other: &Self) -> bool {
        self.current_doc == other.current_doc
    }
}

// Marker impl required by `Ord`; equality itself is defined by the `PartialEq` impl.
impl<T: Scorer> Eq for ScorerWrapper<T> {}

impl<T: Scorer> PartialOrd for ScorerWrapper<T> {
    /// Total order, delegated to the `Ord` implementation.
    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
        Some(Ord::cmp(self, other))
    }
}

impl<T: Scorer> Ord for ScorerWrapper<T> {
    /// Reversed comparison of the current doc ids: the wrapper on the smaller doc compares as
    /// greater, which turns a max-heap into a min-heap on doc ids.
    fn cmp(&self, other: &Self) -> Ordering {
        other.current_doc.cmp(&self.current_doc)
    }
}

// Delegates to the wrapped scorer while keeping the cached `current_doc` in sync.
impl<T: Scorer> DocSet for ScorerWrapper<T> {
    fn advance(&mut self) -> DocId {
        self.current_doc = self.scorer.advance();
        self.current_doc
    }
    fn seek(&mut self, target: DocId) -> DocId {
        self.current_doc = self.scorer.seek(target);
        self.current_doc
    }
    fn seek_danger(&mut self, target: DocId) -> SeekDangerResult {
        let outcome = self.scorer.seek_danger(target);
        // The cache is only refreshed when the target was actually found.
        if matches!(outcome, SeekDangerResult::Found) {
            self.current_doc = target;
        }
        outcome
    }

    /// Returns the cached doc id without querying the wrapped scorer.
    fn doc(&self) -> DocId {
        self.current_doc
    }

    fn size_hint(&self) -> u32 {
        self.scorer.size_hint()
    }

    fn cost(&self) -> u64 {
        self.scorer.cost()
    }
}

impl<TScorer: Scorer, TScoreCombiner: ScoreCombiner> Disjunction<TScorer, TScoreCombiner> {
    pub fn new<T: IntoIterator<Item = TScorer>>(
        docsets: T,
        score_combiner: TScoreCombiner,
        minimum_matches_required: usize,
    ) -> Self {
        debug_assert!(
            minimum_matches_required > 1,
            "union scorer works better if just one matches required"
        );
        let chains = docsets
            .into_iter()
            .map(|doc| ScorerWrapper::new(doc))
            .collect();
        let mut disjunction = Self {
            chains,
            score_combiner,
            current_doc: TERMINATED,
            minimum_matches_required,
            current_score: 0.0,
        };
        if minimum_matches_required > disjunction.chains.len() {
            return disjunction;
        }
        disjunction.advance();
        disjunction
    }
}

impl<TScorer: Scorer, TScoreCombiner: ScoreCombiner> DocSet
    for Disjunction<TScorer, TScoreCombiner>
{
    /// Moves to the next doc contained in at least `minimum_matches_required` chains and
    /// returns it, or `TERMINATED` if there is none. The combined score of the returned doc is
    /// cached in `current_score`.
    fn advance(&mut self) -> DocId {
        // Number of chains seen so far that are positioned on `self.current_doc`.
        let mut current_num_matches = 0;
        // Chains are popped in increasing order of their current doc.
        while let Some(mut candidate) = self.chains.pop() {
            let next = candidate.doc();
            // Exhausted chains are simply dropped: they are not pushed back onto the heap.
            if next != TERMINATED {
                // Peek next doc.
                if self.current_doc != next {
                    // All chains on `current_doc` have been consumed. If enough of them
                    // matched, put the candidate back untouched and emit `current_doc`.
                    if current_num_matches >= self.minimum_matches_required {
                        self.chains.push(candidate);
                        self.current_score = self.score_combiner.score();
                        return self.current_doc;
                    }
                    // Reset current_num_matches and scores.
                    current_num_matches = 0;
                    self.current_doc = next;
                    self.score_combiner.clear();
                }
                // The candidate is on `current_doc`: record its score, then move it forward
                // and re-insert it at its new position in the heap.
                current_num_matches += 1;
                self.score_combiner.update(&mut candidate.scorer);
                candidate.advance();
                self.chains.push(candidate);
            }
        }
        // Every chain is exhausted: the last candidate doc is only valid if it reached the
        // threshold.
        if current_num_matches < self.minimum_matches_required {
            self.current_doc = TERMINATED;
        }
        self.current_score = self.score_combiner.score();
        self.current_doc
    }

    #[inline]
    fn doc(&self) -> DocId {
        self.current_doc
    }

    /// Largest size hint among the chains still in the heap (0 if there are none).
    fn size_hint(&self) -> u32 {
        self.chains
            .iter()
            .map(|docset| docset.size_hint())
            .max()
            .unwrap_or(0u32)
    }

    /// Largest cost among the chains still in the heap (0 if there are none).
    fn cost(&self) -> u64 {
        self.chains
            .iter()
            .map(|docset| docset.cost())
            .max()
            .unwrap_or(0u64)
    }
}

impl<TScorer: Scorer, TScoreCombiner: ScoreCombiner> Scorer
    for Disjunction<TScorer, TScoreCombiner>
{
    /// Returns the combined score cached by the last call to `advance`.
    #[inline]
    fn score(&mut self) -> Score {
        self.current_score
    }
}

#[cfg(test)]
mod tests {
    use std::collections::BTreeMap;

    use super::Disjunction;
    use crate::query::score_combiner::DoNothingCombiner;
    use crate::query::{ConstScorer, Scorer, SumCombiner, VecDocSet};
    use crate::{DocId, DocSet, Score, TERMINATED};

    /// Reference implementation: returns, in ascending order, the elements occurring at least
    /// `pass_line` times across all `arrays` (repeats within one array count too).
    fn conjunct<T: Ord + Copy>(arrays: &[Vec<T>], pass_line: usize) -> Vec<T> {
        let mut occurrences: BTreeMap<T, usize> = BTreeMap::new();
        for &value in arrays.iter().flatten() {
            *occurrences.entry(value).or_insert(0) += 1;
        }
        occurrences
            .into_iter()
            .filter(|&(_, seen)| seen >= pass_line)
            .map(|(value, _)| value)
            .collect()
    }

    /// Checks that a `Disjunction` over `vals` with threshold `min_match` yields exactly the
    /// docs computed by `conjunct`, and that `count_including_deleted` agrees with iteration.
    fn aux_test_conjunction(vals: Vec<Vec<u32>>, min_match: usize) {
        let mut expected_docs = VecDocSet::from(conjunct(&vals, min_match));
        let build_disjunction = || -> Disjunction<_, DoNothingCombiner> {
            let scorers = vals
                .iter()
                .map(|docs| ConstScorer::new(VecDocSet::from(docs.clone()), 1.0));
            Disjunction::new(scorers, DoNothingCombiner, min_match)
        };
        let mut scorer = build_disjunction();
        let mut num_docs = 0;
        while scorer.doc() != TERMINATED {
            assert_eq!(expected_docs.doc(), scorer.doc());
            assert_eq!(expected_docs.advance(), scorer.advance());
            num_docs += 1;
        }
        assert_eq!(expected_docs.advance(), TERMINATED);
        // A fresh disjunction must report the same number of docs when counted in one go.
        assert_eq!(num_docs, build_disjunction().count_including_deleted());
    }

    // A threshold of 0 violates the `minimum_matches_required > 1` debug assertion of
    // `Disjunction::new`, so this only panics when debug assertions are enabled.
    #[should_panic]
    #[test]
    fn test_arg_check1() {
        aux_test_conjunction(vec![], 0);
    }

    // A threshold of 1 violates the `minimum_matches_required > 1` debug assertion of
    // `Disjunction::new`, so this only panics when debug assertions are enabled.
    #[should_panic]
    #[test]
    fn test_arg_check2() {
        aux_test_conjunction(vec![], 1);
    }

    // Degenerate inputs: no scorers, only empty scorers, a threshold larger than the number of
    // scorers, and many single-doc scorers with no doc in common.
    #[test]
    fn test_corner_case() {
        aux_test_conjunction(vec![], 2);
        aux_test_conjunction(vec![vec![]; 1000], 2);
        aux_test_conjunction(vec![vec![]; 100], usize::MAX);
        aux_test_conjunction(vec![vec![0xC0FFEE]; 10000], usize::MAX);
        aux_test_conjunction((1..10000u32).map(|i| vec![i]).collect::<Vec<_>>(), 2);
    }

    // Regular inputs with thresholds of 2 and 3, including a case where no doc reaches the
    // threshold.
    #[test]
    fn test_conjunction() {
        aux_test_conjunction(
            vec![
                vec![1, 3333, 100000000u32],
                vec![1, 2, 100000000u32],
                vec![1, 2, 100000000u32],
            ],
            2,
        );
        // No doc appears in two lists: the disjunction must be empty.
        aux_test_conjunction(
            vec![vec![8], vec![3, 4, 0xC0FFEEu32], vec![1, 2, 100000000u32]],
            2,
        );
        aux_test_conjunction(
            vec![
                vec![1, 3333, 100000000u32],
                vec![1, 2, 100000000u32],
                vec![1, 2, 100000000u32],
            ],
            3,
        )
    }

    // This dummy scorer does nothing but yield the given doc ids in order,
    // each with the score it was paired with at construction.
    #[derive(Clone)]
    struct DummyScorer {
        // Index of the current entry in `foo`.
        cursor: usize,
        // (doc id, score) pairs, in the order they are yielded.
        foo: Vec<(DocId, f32)>,
    }

    impl DummyScorer {
        // Creates a scorer positioned on the first `(doc, score)` pair.
        fn new(doc_score: Vec<(DocId, f32)>) -> Self {
            Self {
                foo: doc_score,
                cursor: 0,
            }
        }
    }

    impl DocSet for DummyScorer {
        // Steps to the next pair and reports the doc now under the cursor.
        fn advance(&mut self) -> DocId {
            self.cursor += 1;
            self.doc()
        }

        // Doc of the pair under the cursor, or `TERMINATED` once past the end.
        fn doc(&self) -> DocId {
            match self.foo.get(self.cursor) {
                Some(&(doc, _)) => doc,
                None => TERMINATED,
            }
        }

        fn size_hint(&self) -> u32 {
            let num_pairs = self.foo.len();
            num_pairs as u32
        }
    }

    impl Scorer for DummyScorer {
        // Score of the pair under the cursor, or 0.0 once past the end.
        #[inline]
        fn score(&mut self) -> Score {
            match self.foo.get(self.cursor) {
                Some(&(_, score)) => score,
                None => 0.0,
            }
        }
    }

    // With a threshold of 3 and a summing combiner: doc 1 is in all five scorers (score 5.0),
    // doc 2 is in three of them (score 3.0).
    #[test]
    fn test_score_calculate() {
        let mut scorer = Disjunction::new(
            vec![
                DummyScorer::new(vec![(1, 1f32), (2, 1f32)]),
                DummyScorer::new(vec![(1, 1f32), (3, 1f32)]),
                DummyScorer::new(vec![(1, 1f32), (4, 1f32)]),
                DummyScorer::new(vec![(1, 1f32), (2, 1f32)]),
                DummyScorer::new(vec![(1, 1f32), (2, 1f32)]),
            ],
            SumCombiner::default(),
            3,
        );
        assert_eq!(scorer.score(), 5.0);
        assert_eq!(scorer.advance(), 2);
        assert_eq!(scorer.score(), 3.0);
    }

    // With a threshold of 2: doc 2 is in a single scorer and must be skipped, and its score
    // must not leak into the score of doc 3 (found in two scorers, score 2.0).
    #[test]
    fn test_score_calculate_corner_case() {
        let mut scorer = Disjunction::new(
            vec![
                DummyScorer::new(vec![(1, 1f32), (2, 1f32)]),
                DummyScorer::new(vec![(1, 1f32), (3, 1f32)]),
                DummyScorer::new(vec![(1, 1f32), (3, 1f32)]),
            ],
            SumCombiner::default(),
            2,
        );
        assert_eq!(scorer.doc(), 1);
        assert_eq!(scorer.score(), 3.0);
        assert_eq!(scorer.advance(), 3);
        assert_eq!(scorer.score(), 2.0);
    }
}


================================================
FILE: src/query/disjunction_max_query.rs
================================================
use crate::query::{BooleanWeight, DisjunctionMaxCombiner, EnableScoring, Occur, Query, Weight};
use crate::{Score, Term};

/// The disjunction max query returns documents matching one or more wrapped queries,
/// called query clauses or clauses.
///
/// If a returned document matches multiple query clauses,
/// the `DisjunctionMaxQuery` assigns the document the highest relevance score from any matching
/// clause, plus a tie breaking increment for any additional matching subqueries.
///
/// ```rust
/// use tantivy::collector::TopDocs;
/// use tantivy::doc;
/// use tantivy::query::{DisjunctionMaxQuery, Query, QueryClone, TermQuery};
/// use tantivy::schema::{IndexRecordOption, Schema, TEXT};
/// use tantivy::Term;
/// use tantivy::Index;
/// use tantivy::IndexWriter;
///
/// fn main() -> tantivy::Result<()> {
///    let mut schema_builder = Schema::builder();
///    let title = schema_builder.add_text_field("title", TEXT);
///    let body = schema_builder.add_text_field("body", TEXT);
///    let schema = schema_builder.build();
///    let index = Index::create_in_ram(schema);
///    {
///        let mut index_writer: IndexWriter = index.writer(15_000_000)?;
///        index_writer.add_document(doc!(
///            title => "The Name of Girl",
///        ))?;
///        index_writer.add_document(doc!(
///            title => "The Diary of Muadib",
///        ))?;
///        index_writer.add_document(doc!(
///            title => "The Diary of Girl",
///        ))?;
///        index_writer.commit()?;
///    }
///
///    let reader = index.reader()?;
///    let searcher = reader.searcher();
///
///    // Make TermQuery's for "girl" and "diary" in the title
///    let girl_term_query: Box<dyn Query> = Box::new(TermQuery::new(
///        Term::from_field_text(title, "girl"),
///        IndexRecordOption::Basic,
///    ));
///    let diary_term_query: Box<dyn Query> = Box::new(TermQuery::new(
///        Term::from_field_text(title, "diary"),
///        IndexRecordOption::Basic,
///    ));
///
///    // TermQuery "diary" and "girl" should be present and only one should be accounted in score
///    let queries1 = vec![diary_term_query.box_clone(), girl_term_query.box_clone()];
///    let diary_and_girl = DisjunctionMaxQuery::new(queries1);
///    let documents = searcher.search(&diary_and_girl, &TopDocs::with_limit(3).order_by_score())?;
///    assert_eq!(documents[0].0, documents[1].0);
///    assert_eq!(documents[1].0, documents[2].0);
///
///    // TermQuery "diary" and "girl" should be present
///    // and one should be accounted with multiplier 0.7
///    let queries2 = vec![diary_term_query.box_clone(), girl_term_query.box_clone()];
///    let tie_breaker = 0.7;
///    let diary_and_girl_with_tie_breaker = DisjunctionMaxQuery::with_tie_breaker(queries2, tie_breaker);
///    let documents = searcher.search(&diary_and_girl_with_tie_breaker, &TopDocs::with_limit(3).order_by_score())?;
///    assert_eq!(documents[1].0, documents[2].0);
///    // For this test all terms brings the same score. So we can do easy math and assume that
///    // `DisjunctionMaxQuery` with tie breakers score should be equal
///    // to term1 score + `tie_breaker` * term2 score or (1.0 + tie_breaker) * term score
///    assert!(f32::abs(documents[0].0 - documents[1].0 * (1.0 + tie_breaker)) < 0.001);
///    Ok(())
/// }
/// ```
#[derive(Debug)]
pub struct DisjunctionMaxQuery {
    /// The query clauses; each one is turned into an `Occur::Should` clause when weighting.
    disjuncts: Vec<Box<dyn Query>>,
    /// Tie-breaking factor handed to `DisjunctionMaxCombiner` (0.0 when built with `new`).
    tie_breaker: Score,
}

impl Clone for DisjunctionMaxQuery {
    fn clone(&self) -> Self {
        DisjunctionMaxQuery::with_tie_breaker(
            self.disjuncts
                .iter()
                .map(|disjunct| disjunct.box_clone())
                .collect::<Vec<_>>(),
            self.tie_breaker,
        )
    }
}

impl Query for DisjunctionMaxQuery {
    /// Builds a `BooleanWeight` in which every clause is a `Should` clause and scores are
    /// combined by a `DisjunctionMaxCombiner` configured with this query's tie breaker.
    ///
    /// Fails with the first error returned while building a clause's weight.
    fn weight(&self, enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let tie_breaker = self.tie_breaker;
        let should_clauses = self
            .disjuncts
            .iter()
            .map(|clause| {
                clause
                    .weight(enable_scoring)
                    .map(|clause_weight| (Occur::Should, clause_weight))
            })
            .collect::<crate::Result<_>>()?;
        let boolean_weight = BooleanWeight::new(
            should_clauses,
            enable_scoring.is_scoring_enabled(),
            Box::new(move || DisjunctionMaxCombiner::with_tie_breaker(tie_breaker)),
        );
        Ok(Box::new(boolean_weight))
    }

    /// Visits the terms of every clause, in clause order.
    fn query_terms<'a>(&'a self, visitor: &mut dyn FnMut(&'a Term, bool)) {
        for clause in self.disjuncts.iter() {
            clause.query_terms(visitor);
        }
    }
}

impl DisjunctionMaxQuery {
    /// Builds a `DisjunctionMaxQuery` over `disjuncts` using the given `tie_breaker`.
    pub fn with_tie_breaker(
        disjuncts: Vec<Box<dyn Query>>,
        tie_breaker: Score,
    ) -> DisjunctionMaxQuery {
        Self {
            disjuncts,
            tie_breaker,
        }
    }

    /// Builds a `DisjunctionMaxQuery` over `disjuncts` with no tie breaker
    /// (i.e. a tie breaker of `0.0`).
    pub fn new(disjuncts: Vec<Box<dyn Query>>) -> DisjunctionMaxQuery {
        let no_tie_breaker: Score = 0.0;
        Self::with_tie_breaker(disjuncts, no_tie_breaker)
    }
}


================================================
FILE: src/query/empty_query.rs
================================================
use super::Scorer;
use crate::docset::TERMINATED;
use crate::index::SegmentReader;
use crate::query::explanation::does_not_match;
use crate::query::{EnableScoring, Explanation, Query, Weight};
use crate::{DocId, DocSet, Score, Searcher};

/// `EmptyQuery` is a dummy `Query` in which no document matches.
///
/// It is useful for tests and handling edge cases.
///
/// Its weight is an `EmptyWeight`, and `count` always reports `0`.
#[derive(Clone, Debug)]
pub struct EmptyQuery;

impl Query for EmptyQuery {
    /// Returns an [`EmptyWeight`]; the scoring mode is ignored.
    fn weight(&self, _enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let weight: Box<dyn Weight> = Box::new(EmptyWeight);
        Ok(weight)
    }

    /// Always returns `0` without looking at the searcher.
    fn count(&self, _searcher: &Searcher) -> crate::Result<usize> {
        let num_matches: usize = 0;
        Ok(num_matches)
    }
}

/// `EmptyWeight` is a dummy `Weight` in which no document matches.
///
/// It is useful for tests and handling edge cases: every segment gets an
/// [`EmptyScorer`], and explaining any document fails.
pub struct EmptyWeight;

impl Weight for EmptyWeight {
    /// Returns an [`EmptyScorer`], ignoring both the segment and the boost.
    fn scorer(&self, _reader: &SegmentReader, _boost: Score) -> crate::Result<Box<dyn Scorer>> {
        let scorer: Box<dyn Scorer> = Box::new(EmptyScorer);
        Ok(scorer)
    }

    /// Always fails with the "does not match" error built for `doc`.
    fn explain(&self, _reader: &SegmentReader, doc: DocId) -> crate::Result<Explanation> {
        let no_match_error = does_not_match(doc);
        Err(no_match_error)
    }
}

/// `EmptyScorer` is a dummy `Scorer` in which no document matches.
///
/// It is useful for tests and handling edge cases.
pub struct EmptyScorer;

impl DocSet for EmptyScorer {
    /// There is nothing to advance to: always returns `TERMINATED`.
    fn advance(&mut self) -> DocId {
        TERMINATED
    }

    /// The docset is exhausted from the start: always returns `TERMINATED`.
    fn doc(&self) -> DocId {
        TERMINATED
    }

    /// No document matches, so the hint is `0`.
    fn size_hint(&self) -> u32 {
        0
    }
}

impl Scorer for EmptyScorer {
    /// Returns a constant `0.0`.
    #[inline]
    fn score(&mut self) -> Score {
        0.0
    }
}

#[cfg(test)]
mod tests {
    use crate::docset::TERMINATED;
    use crate::query::EmptyScorer;
    use crate::DocSet;

    /// An `EmptyScorer` reports `TERMINATED` before, during and after advancing.
    #[test]
    fn test_empty_scorer() {
        let mut empty_scorer = EmptyScorer;
        assert_eq!(empty_scorer.doc(), TERMINATED);
        assert_eq!(empty_scorer.advance(), TERMINATED);
        assert_eq!(empty_scorer.doc(), TERMINATED);
    }
}


================================================
FILE: src/query/exclude.rs
================================================
use crate::docset::{DocSet, SeekDangerResult, TERMINATED};
use crate::query::Scorer;
use crate::{DocId, Score};

/// An exclusion set is a set of documents
/// that should be excluded from a given DocSet.
///
/// It can be a single DocSet, or a Vec of DocSets.
pub trait ExclusionSet: Send {
    /// Returns `true` if the given `doc` is in the exclusion set.
    ///
    /// Takes `&mut self` because the docset-backed implementations answer by
    /// calling `seek_danger`, which needs mutable access to the docset.
    fn contains(&mut self, doc: DocId) -> bool;
}

impl<TDocSet: DocSet> ExclusionSet for TDocSet {
    /// A single docset contains `doc` when `seek_danger(doc)` reports `Found`.
    #[inline]
    fn contains(&mut self, doc: DocId) -> bool {
        let seek_result = self.seek_danger(doc);
        matches!(seek_result, SeekDangerResult::Found)
    }
}

impl<TDocSet: DocSet> ExclusionSet for Vec<TDocSet> {
    /// A list of docsets contains `doc` as soon as one of them reports `Found`.
    ///
    /// Docsets are probed in order and probing stops at the first hit, so the
    /// docsets located after the hit are not touched.
    #[inline]
    fn contains(&mut self, doc: DocId) -> bool {
        self.iter_mut()
            .any(|excluded| excluded.seek_danger(doc) == SeekDangerResult::Found)
    }
}

/// Filters a given `DocSet` by removing the docs from an exclusion set.
///
/// The excluding docsets have no impact on scoring.
pub struct Exclude<TDocSet, TExclusionSet> {
    /// Source of the candidate documents (and of the score when it is a `Scorer`).
    underlying_docset: TDocSet,
    /// Documents that must be filtered out of `underlying_docset`.
    exclusion_set: TExclusionSet,
}

impl<TDocSet, TExclusionSet> Exclude<TDocSet, TExclusionSet>
where
    TDocSet: DocSet,
    TExclusionSet: ExclusionSet,
{
    /// Creates a new `Exclude`.
    ///
    /// The underlying docset is moved forward until it is either exhausted or
    /// positioned on a document that is not part of the exclusion set, so that
    /// `doc()` is valid right after construction.
    pub fn new(
        mut underlying_docset: TDocSet,
        mut exclusion_set: TExclusionSet,
    ) -> Exclude<TDocSet, TExclusionSet> {
        loop {
            let head = underlying_docset.doc();
            if head == TERMINATED || !exclusion_set.contains(head) {
                break;
            }
            underlying_docset.advance();
        }
        Self {
            underlying_docset,
            exclusion_set,
        }
    }
}

impl<TDocSet, TExclusionSet> DocSet for Exclude<TDocSet, TExclusionSet>
where
    TDocSet: DocSet,
    TExclusionSet: ExclusionSet,
{
    /// Moves to the next document of the underlying docset that is not excluded.
    fn advance(&mut self) -> DocId {
        let mut candidate = self.underlying_docset.advance();
        while candidate != TERMINATED && self.exclusion_set.contains(candidate) {
            candidate = self.underlying_docset.advance();
        }
        candidate
    }

    /// Seeks the underlying docset to `target`, then skips forward while the
    /// document it landed on is excluded.
    fn seek(&mut self, target: DocId) -> DocId {
        let candidate = self.underlying_docset.seek(target);
        if candidate != TERMINATED && self.exclusion_set.contains(candidate) {
            self.advance()
        } else {
            candidate
        }
    }

    /// Current document, as reported by the underlying docset.
    fn doc(&self) -> DocId {
        self.underlying_docset.doc()
    }

    /// `.size_hint()` directly returns the size hint
    /// of the underlying docset, without taking into account
    /// the fact that some of its docs might be excluded.
    fn size_hint(&self) -> u32 {
        self.underlying_docset.size_hint()
    }
}

impl<TScorer, TExclusionSet> Scorer for Exclude<TScorer, TExclusionSet>
where
    TScorer: Scorer,
    TExclusionSet: ExclusionSet + 'static,
{
    /// Returns the score of the underlying scorer; the exclusion set is not consulted.
    #[inline]
    fn score(&mut self) -> Score {
        self.underlying_docset.score()
    }
}

#[cfg(test)]
mod tests {

    use super::*;
    use crate::postings::tests::test_skip_against_unoptimized;
    use crate::query::VecDocSet;
    use crate::tests::sample_with_seed;

    /// Small fixture shared by the deterministic tests: docs `[1, 2, 5, 8, 10, 15, 24]`
    /// minus the exclusion set `[1, 2, 3, 10, 16, 24]`.
    fn small_exclude() -> Exclude<VecDocSet, VecDocSet> {
        let included = VecDocSet::from(vec![1, 2, 5, 8, 10, 15, 24]);
        let excluded = VecDocSet::from(vec![1, 2, 3, 10, 16, 24]);
        Exclude::new(included, excluded)
    }

    /// Iterating with `advance` only yields the non-excluded documents.
    #[test]
    fn test_exclude() {
        let mut exclude_scorer = small_exclude();
        let mut els = Vec::new();
        loop {
            let doc = exclude_scorer.doc();
            if doc == TERMINATED {
                break;
            }
            els.push(doc);
            exclude_scorer.advance();
        }
        assert_eq!(els, vec![5, 8, 15]);
    }

    /// Seeking on the small fixture agrees with the unoptimized reference.
    #[test]
    fn test_exclude_skip() {
        let skip_targets = vec![5, 8, 10, 15, 24];
        test_skip_against_unoptimized(|| Box::new(small_exclude()), skip_targets);
    }

    /// Seeking on randomly sampled docsets agrees with the unoptimized reference.
    #[test]
    fn test_exclude_skip_random() {
        let sample_include = sample_with_seed(10_000, 0.1, 1);
        let sample_exclude = sample_with_seed(10_000, 0.05, 2);
        let sample_skip = sample_with_seed(10_000, 0.005, 3);
        let build_docset = || {
            let included = VecDocSet::from(sample_include.clone());
            let excluded = VecDocSet::from(sample_exclude.clone());
            Box::new(Exclude::new(included, excluded))
        };
        test_skip_against_unoptimized(build_docset, sample_skip);
    }
}


================================================
FILE: src/query/exist_query.rs
================================================
use core::fmt::Debug;

use columnar::{ColumnIndex, DynamicColumn};
use common::BitSet;

use super::{ConstScorer, EmptyScorer};
use crate::docset::{DocSet, TERMINATED};
use crate::index::SegmentReader;
use crate::query::all_query::AllScorer;
use crate::query::boost_query::BoostScorer;
use crate::query::explanation::does_not_match;
use crate::query::{BitSetDocSet, EnableScoring, Explanation, Query, Scorer, Weight};
use crate::schema::Type;
use crate::{DocId, Score, TantivyError};

/// Query that matches all documents with a non-null value in the specified
/// field.
///
/// When querying inside a JSON field, "exists" queries can be executed strictly
/// on the field name or check all the subpaths. In that second case a document
/// will be matched if a non-null value exists in any subpath. For example,
/// assuming the following document where `myfield` is a JSON fast field:
/// ```json
/// {
///   "myfield": {
///     "mysubfield": "hello"
///   }
/// }
/// ```
/// With `json_subpaths` enabled, queries on either `myfield` or
/// `myfield.mysubfield` will match the document. If it is set to false, only
/// `myfield.mysubfield` will match it.
///
/// All of the matched documents get the score 1.0.
#[derive(Clone, Debug)]
pub struct ExistsQuery {
    /// Name of the field (possibly including a JSON path) whose presence is tested.
    field_name: String,
    /// Whether columns stored under subpaths of a JSON field are also considered.
    json_subpaths: bool,
}

impl ExistsQuery {
    /// Creates a new `ExistsQuery` from the given field, with JSON subpath
    /// matching disabled.
    ///
    /// This query matches all documents with at least one non-null value in the specified field.
    /// This constructor never fails, but executing the search with this query will return an
    /// error if the specified field doesn't exist or is not a fast field.
    ///
    /// Equivalent to `ExistsQuery::new(field, false)`.
    #[deprecated]
    pub fn new_exists_query(field: String) -> ExistsQuery {
        Self::new(field, false)
    }

    /// Creates a new `ExistsQuery` from the given field.
    ///
    /// This query matches all documents with at least one non-null value in the
    /// specified field. If `json_subpaths` is set to true, documents with
    /// non-null values in any JSON subpath will also be matched.
    ///
    /// This constructor never fails, but executing the search with this query will
    /// return an error if the specified field doesn't exist or is not a fast
    /// field.
    pub fn new(field: String, json_subpaths: bool) -> Self {
        ExistsQuery {
            field_name: field,
            json_subpaths,
        }
    }
}

impl Query for ExistsQuery {
    /// Resolves the field in the schema and builds the matching `ExistsWeight`.
    ///
    /// # Errors
    ///
    /// - `TantivyError::FieldNotFound` if the schema has no field for `field_name`.
    /// - `TantivyError::SchemaError` if the field is not a fast field.
    fn weight(&self, enable_scoring: EnableScoring) -> crate::Result<Box<dyn Weight>> {
        let schema = enable_scoring.schema();
        let (field, _path) = schema
            .find_field(&self.field_name)
            .ok_or_else(|| TantivyError::FieldNotFound(self.field_name.clone()))?;
        let field_type = schema.get_field_entry(field).field_type();
        if field_type.is_fast() {
            let weight = ExistsWeight {
                field_name: self.field_name.clone(),
                field_type: field_type.value_type(),
                json_subpaths: self.json_subpaths,
            };
            return Ok(Box::new(weight));
        }
        Err(TantivyError::SchemaError(format!(
            "Field {} is not a fast field.",
            self.field_name
        )))
    }
}

/// Weight associated with the `ExistsQuery` query.
pub struct ExistsWeight {
    /// Name of the field (possibly including a JSON path) whose columns are inspected.
    field_name: String,
    /// Value type of the field in the schema; subpaths are only expanded for `Type::Json`.
    field_type: Type,
    /// Whether columns stored under subpaths of a JSON field are also considered.
    json_subpaths: bool,
}

impl Weight for ExistsWeight {
    /// Builds the scorer matching every document of the segment that has at least one
    /// value in one of the columns associated with the field.
    ///
    /// Depending on the columns found, the scorer is:
    /// - an `EmptyScorer` if there is no non-empty column,
    /// - an `AllScorer` (boosted if needed) if one column is full,
    /// - a `ConstScorer` over an `ExistsDocSet` if there are fewer than 4 columns,
    /// - a `ConstScorer` over a precomputed bitset otherwise.
    fn scorer(&self, reader: &SegmentReader, boost: Score) -> crate::Result<Box<dyn Scorer>> {
        let fast_fields = reader.fast_fields();
        let mut handles = fast_fields.dynamic_column_handles(&self.field_name)?;
        if self.field_type == Type::Json && self.json_subpaths {
            // Also look at every column stored under a subpath of the JSON field.
            let subpath_handles = fast_fields.dynamic_subpath_column_handles(&self.field_name)?;
            handles.extend(subpath_handles);
        }

        // Open every column first (failing on the first I/O error), then drop the empty ones.
        let mut non_empty_columns: Vec<DynamicColumn> = handles
            .into_iter()
            .map(|handle| handle.open().map_err(|io_error| io_error.into()))
            .collect::<crate::Result<_>>()?;
        non_empty_columns.retain(|column| !matches!(column.column_index(), ColumnIndex::Empty { .. }));
        if non_empty_columns.is_empty() {
            return Ok(Box::new(EmptyScorer));
        }

        // If any column is full, all docs match.
        let max_doc = reader.max_doc();
        let has_full_column = non_empty_columns
            .iter()
            .any(|column| matches!(column.column_index(), ColumnIndex::Full));
        if has_full_column {
            let all_scorer = AllScorer::new(max_doc);
            if boost == 1.0f32 {
                return Ok(Box::new(all_scorer));
            }
            return Ok(Box::new(BoostScorer::new(all_scorer, boost)));
        }

        // With only a few columns (fewer than 4), probe them lazily through ExistsDocSet.
        // NOTE: A lower number may be better for very sparse columns
        if non_empty_columns.len() < 4 {
            let lazy_docset = ExistsDocSet::new(non_empty_columns, max_doc);
            return Ok(Box::new(ConstScorer::new(lazy_docset, boost)));
        }

        // If we have many dynamic columns, precompute a bitset of matching docs
        let mut doc_bitset = BitSet::with_max_value(max_doc);
        for column in non_empty_columns.iter() {
            match column.column_index() {
                // Empty columns were filtered out and a full column already returned an
                // AllScorer above, so there is nothing to record for these two variants.
                ColumnIndex::Empty { .. } | ColumnIndex::Full => {}
                ColumnIndex::Optional(optional_index) => {
                    for doc in optional_index.iter_non_null_docs() {
                        doc_bitset.insert(doc);
                    }
                }
                ColumnIndex::Multivalued(multi_idx) => {
                    for doc in multi_idx.iter_non_null_docs() {
                        doc_bitset.insert(doc);
                    }
                }
            }
        }
        let bitset_docset = BitSetDocSet::from(doc_bitset);
        Ok(Box::new(ConstScorer::new(bitset_docset, boost)))
    }

    /// Explains `doc` with a constant score of `1.0`, or fails with the
    /// "does not match" error if the scorer does not land exactly on `doc`.
    fn explain(&self, reader: &SegmentReader, doc: DocId) -> crate::Result<Explanation> {
        let mut scorer = self.scorer(reader, 1.0)?;
        if scorer.seek(doc) == doc {
            Ok(Explanation::new("ExistsQuery", 1.0))
        } else {
            Err(does_not_match(doc))
        }
    }
}

/// `DocSet` over the documents that have a value in at least one of `columns`.
///
/// Documents are tested one by one against the column indexes as the docset moves forward.
pub(crate) struct ExistsDocSet {
    /// Columns probed with `has_value` for every candidate document.
    columns: Vec<DynamicColumn>,
    /// Current document, or `TERMINATED` once the docset is exhausted.
    doc: DocId,
    /// Exclusive upper bound of the doc ids that are probed.
    max_doc: DocId,
}

impl ExistsDocSet {
    pub(crate) fn new(columns: Vec<DynamicColumn>, max_doc: DocId) -> Self {
        let mut set = Self {
            columns,
            doc: 0u32,
            max_doc,
        };
        set.find_next();
        set
    }

    fn find_next(&mut self) -> DocId {
        while self.doc < self.max_doc {
            if self
                .columns
                .iter()
                .any(|col| col.column_index().has_value(self.doc))
            {
                return self.doc;
            }
            self.doc += 1;
        }
        self.doc = TERMINATED;
        TERMINATED
    }
}

impl DocSet for ExistsDocSet {
    /// Moves to the first matching document strictly after the current one.
    fn advance(&mut self) -> DocId {
        let next_target = self.doc + 1;
        self.seek(next_target)
    }

    /// No estimate is computed: the hint is a constant `0`.
    fn size_hint(&self) -> u32 {
        0
    }

    /// Current document, or `TERMINATED` once exhausted.
    fn doc(&self) -> DocId {
        self.doc
    }

    /// Jumps to `target` and returns the first matching document at or after it.
    #[inline(always)]
    fn seek(&mut self, target: DocId) -> DocId {
        self.doc = target;
        let landed_on = self.find_next();
        landed_on
    }
}

#[cfg(test)]
mod tests {
    use std::net::Ipv6Addr;
    use std::ops::Bound;

    use common::DateTime;
    use time::OffsetDateTime;

    use crate::collector::Count;
    use crate::query::exist_query::ExistsQuery;
    use crate::query::{BooleanQuery, RangeQuery};
    use crate::schema::{Facet, FacetOptions, Schema, FAST, INDEXED, STRING, TEXT};
    use crate::{Index, Searcher, Term};

    /// Counts matches on plain fast fields that are present in all, half, a tenth or none
    /// of the 100 documents, then intersects with range queries to exercise `seek`.
    #[test]
    fn test_exists_query_simple() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let all_field = schema_builder.add_u64_field("all", INDEXED | FAST);
        let even_field = schema_builder.add_u64_field("even", INDEXED | FAST);
        let odd_field = schema_builder.add_text_field("odd", STRING | FAST);
        let multi_field = schema_builder.add_text_field("multi", FAST);
        let _never_field = schema_builder.add_u64_field("never", INDEXED | FAST);
        let schema = schema_builder.build();

        let index = Index::create_in_ram(schema);
        {
            let mut index_writer = index.writer_for_tests()?;
            for i in 0u64..100u64 {
                if i % 2 == 0 {
                    if i % 10 == 0 {
                        // Multiples of 10 additionally get two values in `multi`.
                        index_writer.add_document(doc!(all_field => i, even_field => i, multi_field => i.to_string(), multi_field => (i + 1).to_string()))?;
                    } else {
                        index_writer.add_document(doc!(all_field => i, even_field => i))?;
                    }
                } else {
                    index_writer.add_document(doc!(all_field => i, odd_field => i.to_string()))?;
                }
            }
            index_writer.commit()?;
        }
        let reader = index.reader()?;
        let searcher = reader.searcher();

        assert_eq!(count_existing_fields(&searcher, "all", false)?, 100);
        assert_eq!(count_existing_fields(&searcher, "odd", false)?, 50);
        assert_eq!(count_existing_fields(&searcher, "even", false)?, 50);
        assert_eq!(count_existing_fields(&searcher, "multi", false)?, 10);
        assert_eq!(count_existing_fields(&searcher, "multi", true)?, 10);
        assert_eq!(count_existing_fields(&searcher, "never", false)?, 0);

        // exercise seek
        let query = BooleanQuery::intersection(vec![
            Box::new(RangeQuery::new(
                Bound::Included(Term::from_field_u64(all_field, 50)),
                Bound::Unbounded,
            )),
            Box::new(ExistsQuery::new("even".to_string(), false)),
        ]);
        assert_eq!(searcher.search(&query, &Count)?, 25);

        let query = BooleanQuery::intersection(vec![
            Box::new(RangeQuery::new(
                Bound::Included(Term::from_field_u64(all_field, 0)),
                Bound::Included(Term::from_field_u64(all_field, 50)),
            )),
            Box::new(ExistsQuery::new("odd".to_string(), false)),
        ]);
        assert_eq!(searcher.search(&query, &Count)?, 25);

        Ok(())
    }

    /// Checks JSON paths, the effect of `json_subpaths` on the root field, and the
    /// handling of absent paths and absent fields.
    #[test]
    fn test_exists_query_json() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let json = schema_builder.add_json_field("json", TEXT | FAST);
        let schema = schema_builder.build();

        let index = Index::create_in_ram(schema);
        {
            let mut index_writer = index.writer_for_tests()?;
            for i in 0u64..100u64 {
                if i % 2 == 0 {
                    index_writer.add_document(doc!(json => json!({"all": i, "even": true})))?;
                } else {
                    // `all` is stored as a string here, as a number in the even documents.
                    index_writer
                        .add_document(doc!(json => json!({"all": i.to_string(), "odd": true})))?;
                }
            }
            index_writer.commit()?;
        }
        let reader = index.reader()?;
        let searcher = reader.searcher();

        assert_eq!(count_existing_fields(&searcher, "json.all", false)?, 100);
        assert_eq!(count_existing_fields(&searcher, "json.even", false)?, 50);
        assert_eq!(count_existing_fields(&searcher, "json.even", true)?, 50);
        assert_eq!(count_existing_fields(&searcher, "json.odd", false)?, 50);
        assert_eq!(count_existing_fields(&searcher, "json", false)?, 0);
        assert_eq!(count_existing_fields(&searcher, "json", true)?, 100);

        // Handling of non-existing fields:
        assert_eq!(count_existing_fields(&searcher, "json.absent", false)?, 0);
        assert_eq!(count_existing_fields(&searcher, "json.absent", true)?, 0);
        assert_does_not_exist(&searcher, "does_not_exists.absent", true);
        assert_does_not_exist(&searcher, "does_not_exists.absent", false);

        Ok(())
    }

    /// The root JSON field must match every document through the union of its subpaths,
    /// even when no single subpath is present in all documents.
    #[test]
    fn test_exists_query_json_union_no_single_full_subpath() -> crate::Result<()> {
        // Build docs where no single subpath exists for all docs, but the union does.
        let mut schema_builder = Schema::builder();
        let json = schema_builder.add_json_field("json", TEXT | FAST);
        let schema = schema_builder.build();

        let index = Index::create_in_ram(schema);
        {
            let mut index_writer = index.writer_for_tests()?;
            for i in 0u64..100u64 {
                if i % 2 == 0 {
                    // only subpath `a`
                    index_writer.add_document(doc!(json => json!({"a": i})))?;
                } else {
                    // only subpath `b`
                    index_writer.add_document(doc!(json => json!({"b": i})))?;
                }
            }
            index_writer.commit()?;
        }
        let reader = index.reader()?;
        let searcher = reader.searcher();

        // No single subpath is full
        assert_eq!(count_existing_fields(&searcher, "json.a", false)?, 50);
        assert_eq!(count_existing_fields(&searcher, "json.b", false)?, 50);

        // Root exists with subpaths disabled is zero
        assert_eq!(count_existing_fields(&searcher, "json", false)?, 0);

        // Root exists with subpaths enabled should match all docs via union
        assert_eq!(count_existing_fields(&searcher, "json", true)?, 100);

        Ok(())
    }

    /// Exists queries on bool, bytes, date, f64, ip address and facet fast fields.
    #[test]
    fn test_exists_query_misc_supported_types() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let bool = schema_builder.add_bool_field("bool", FAST);
        let bytes = schema_builder.add_bytes_field("bytes", FAST);
        let date = schema_builder.add_date_field("date", FAST);
        let f64 = schema_builder.add_f64_field("f64", FAST);
        let ip_addr = schema_builder.add_ip_addr_field("ip_addr", FAST);
        let facet = schema_builder.add_facet_field("facet", FacetOptions::default());
        let schema = schema_builder.build();

        let index = Index::create_in_ram(schema);
        {
            let mut index_writer = index.writer_for_tests()?;
            let now = OffsetDateTime::now_utc().unix_timestamp();
            for i in 0u8..100u8 {
                if i % 2 == 0 {
                    // Even documents carry the bool, bytes and date fields.
                    let date_val = DateTime::from_utc(OffsetDateTime::from_unix_timestamp(
                        now + i as i64 * 100,
                    )?);
                    index_writer.add_document(
                        doc!(bool => i % 3 == 0, bytes => vec![i, i + 1,  i + 2], date => date_val),
                    )?;
                } else {
                    // Odd documents carry the f64, ip address and (two-valued) facet fields.
                    let ip_addr_v6 = Ipv6Addr::new(0, 0, 0, 0, 0, 0xffff, 0xc00a, i.into());
                    index_writer
                        .add_document(doc!(f64 => i as f64 * 0.5, ip_addr => ip_addr_v6, facet => Facet::from("/facet/foo"), facet => Facet::from("/facet/bar")))?;
                }
            }
            index_writer.commit()?;
        }
        let reader = index.reader()?;
        let searcher = reader.searcher();

        assert_eq!(count_existing_fields(&searcher, "bool", false)?, 50);
        assert_eq!(count_existing_fields(&searcher, "bool", true)?, 50);
        assert_eq!(count_existing_fields(&searcher, "bytes", false)?, 50);
        assert_eq!(count_existing_fields(&searcher, "date", false)?, 50);
        assert_eq!(count_existing_fields(&searcher, "f64", false)?, 50);
        assert_eq!(count_existing_fields(&searcher, "ip_addr", false)?, 50);
        assert_eq!(count_existing_fields(&searcher, "facet", false)?, 50);

        Ok(())
    }

    /// A non-fast field yields a schema error, and an unknown field a "does not exist" error.
    #[test]
    fn test_exists_query_unsupported_types() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let not_fast = schema_builder.add_text_field("not_fast", TEXT);
        let schema = schema_builder.build();

        let index = Index::create_in_ram(schema);
        {
            let mut index_writer = index.writer_for_tests()?;
            index_writer.add_document(doc!(
                not_fast => "slow",
            ))?;
            index_writer.commit()?;
        }
        let reader = index.reader()?;
        let searcher = reader.searcher();

        assert_eq!(
            searcher
                .search(&ExistsQuery::new("not_fast".to_string(), false), &Count)
                .unwrap_err()
                .to_string(),
            "Schema error: 'Field not_fast is not a fast field.'"
        );

        assert_does_not_exist(&searcher, "does_not_exists", false);

        Ok(())
    }

    /// Runs an `ExistsQuery` on `field` and returns the number of matching documents.
    fn count_existing_fields(
        searcher: &Searcher,
        field: &str,
        json_subpaths: bool,
    ) -> crate::Result<usize> {
        let query = ExistsQuery::new(field.to_string(), json_subpaths);
        searcher.search(&query, &Count)
    }

    /// Asserts that searching on `field` fails with the "field does not exist" error.
    fn assert_does_not_exist(searcher: &Searcher, field: &str, json_subpaths: bool) {
        assert_eq!(
            searcher
                .search(&ExistsQuery::new(field.to_string(), json_subpaths), &Count)
                .unwrap_err()
                .to_string(),
            format!("The field does not exist: '{field}'")
        );
    }
}


================================================
FILE: src/query/explanation.rs
================================================
use std::borrow::Cow;
use std::fmt;

use serde::Serialize;

use crate::{DocId, Score, TantivyError};

/// Builds the `InvalidArgument` error reported when `doc` is not matched by a query.
pub(crate) fn does_not_match(doc: DocId) -> TantivyError {
    let message = format!("Document #({doc}) does not match");
    TantivyError::InvalidArgument(message)
}

/// Object describing the score of a given document.
/// It is organized in trees.
///
/// `.to_pretty_json()` can be useful to print out a human readable
/// representation of this tree when debugging a given score.
#[derive(Clone, Serialize)]
pub struct Explanation {
    /// Score value associated with this node.
    value: Score,
    /// Human readable label of this node; borrowed when it is a static string.
    description: Cow<'static, str>,
    /// Child explanations; left out of the serialized form while it is `None`.
    #[serde(skip_serializing_if = "Option::is_none")]
    details: Option<Vec<Explanation>>,
    /// Free-form context strings; left out of the serialized form while it is `None`.
    #[serde(skip_serializing_if = "Option::is_none")]
    context: Option<Vec<String>>,
}
impl fmt::Debug for Explanation {
    /// Prints the pretty JSON form of the tree, wrapped as `Explanation(...)`.
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let pretty_json = self.to_pretty_json();
        write!(f, "Explanation({})", pretty_json)
    }
}

impl Explanation {
    /// Creates a new explanation object from an owned description.
    pub fn new_with_string(description: String, value: Score) -> Explanation {
        Self {
            value,
            description: Cow::Owned(description),
            details: None,
            context: None,
        }
    }

    /// Creates a new explanation object from a static description.
    pub fn new(description: &'static str, value: Score) -> Explanation {
        Self {
            value,
            description: Cow::Borrowed(description),
            details: None,
            context: None,
        }
    }

    /// Returns the value associated with the current node.
    pub fn value(&self) -> Score {
        self.value
    }

    /// Add some detail, explaining some part of the current node formula.
    ///
    /// Details are treated as child of the current node.
    pub fn add_detail(&mut self, child_explanation: Explanation) {
        // The list of children is only allocated once the first detail is added.
        let children = self.details.get_or_insert_with(Vec::new);
        children.push(child_explanation);
    }

    /// Adds some extra context to the explanation.
    pub fn add_context(&mut self, context: String) {
        let contexts = self.context.get_or_insert_with(Vec::new);
        contexts.push(context);
    }

    /// Shortcut for adding `Explanation::new(name, value)` as a detail.
    pub fn add_const(&mut self, name: &'static str, value: Score) {
        self.add_detail(Explanation::new(name, value));
    }

    /// Returns an indented json representation of the explanation tree for debug usage.
    ///
    /// Panics if the serialization fails.
    pub fn to_pretty_json(&self) -> String {
        let serialized = serde_json::to_string_pretty(self);
        serialized.unwrap()
    }
}


================================================
FILE: src/query/fuzzy_query.rs
================================================
use levenshtein_automata::{Distance, LevenshteinAutomatonBuilder, DFA};
use once_cell::sync::OnceCell;
use tantivy_fst::Automaton;

use crate::query::{AutomatonWeight, EnableScoring, Query, Weight};
use crate::schema::{Term, Type};
use crate::TantivyError::InvalidArgument;

/// Newtype around a Levenshtein `DFA` so that it can implement `tantivy_fst::Automaton`.
pub(crate) struct DfaWrapper(pub DFA);

impl Automaton for DfaWrapper {
    type State = u32;

    fn start(&self) -> Self::State {
        self.0.initial_state()
    }

    fn is_match(&self, state: &Self::State) -> bool {
        match self.0.distance(*state) {
            Distance::Exact(_) => true,
            Distance::AtLeast(_) => false,
        }
    }

    fn can_match(&self, state: &u32) -> bool {
        *state != levenshtein_automata::SINK_STATE
    }

    fn accept(&self, state: &Self::State, byte: u8) -> Self::State {
        self.0.transition(*state, byte)
    }
}

/// A Fuzzy Query matches all of the documents
/// containing a term that is within a given
/// Levenshtein distance of a specific term.
///
/// ```rust
/// use tantivy::collector::{Count, TopDocs};
/// use tantivy::query::FuzzyTermQuery;
/// use tantivy::schema::{Schema, TEXT};
/// use tantivy::{doc, Index, IndexWriter, Term};
///
/// fn example() -> tantivy::Result<()> {
///     let mut schema_builder = Schema::builder();
///     let title = schema_builder.add_text_field("title", TEXT);
///     let schema = schema_builder.build();
///     let index = Index::create_in_ram(schema);
///     {
///         let mut index_writer: IndexWriter = index.writer(15_000_000)?;
///         index_writer.add_document(doc!(
///             title => "The Name of the Wind",
///         ))?;
///         index_writer.add_document(doc!(
///             title => "The Diary of Muadib",
///         ))?;
///         index_writer.add_document(doc!(
///             title => "A Dairy Cow",
///         ))?;
///         index_writer.add_document(doc!(
///             title => "The Diary of a Young Girl",
///         ))?;
///         index_writer.commit()?;
///     }
///     let reader = index.reader()?;
///     let searcher = reader.searcher();
///
///     {
///         let term = Term::from_field_text(title, "Diary");
///         let query = FuzzyTermQuery::new(term, 1, true);
///         let (top_docs, count) = searcher.search(&query, &(TopDocs::with_limit(2).order_by_score(), Count)).unwrap();
///         assert_eq!(count, 2);
///         assert_eq!(top_docs.len(), 2);
///     }
///
///     Ok(())
/// }
/// # assert!(example().is_ok());
/// ```
#[derive(Debug, Clone)]
pub struct FuzzyTermQuery {
    /// What term are we searching
    term: Term,
    /// How many changes are we going to allow.
    ///
    /// Only values below 3 have an automaton builder; larger values are rejected with
    /// an `InvalidArgument` error when the specialized weight is built.
    distance: u8,
    /// Should a transposition cost 1 or 2?
    transposition_cost_one: bool,
    /// Whether this is a prefix ("starts with") query.
    prefix: bool,
}

impl FuzzyTermQuery {
    /// Creates a new Fuzzy Query
    pub fn new(term: Term, distance: u8, transposition_cost_one: bool) -> FuzzyTermQuery {
        FuzzyTermQuery {
            term,
            distance,
            transposition_cost_one,
            prefix: false,
        }
    }

    /// Creates a new Fuzzy Query of the Term prefix
    pub fn new_prefix(term: Term, distance: u8, transposition_cost_one: bool) -> FuzzyTermQuery {
        FuzzyTermQuery {
            term,
            distance,
            transposition_cost_one,
            prefix: true,
        }
    }

    fn specialized_weight(&self) -> crate::Result<AutomatonWeight<DfaWrapper>> {
        static AUTOMATON_BUILDER: [[OnceCell<LevenshteinAutomatonBuilder>; 2]; 3] = [
            [OnceCell::new(), OnceCell::new()],
            [OnceCell::new(), OnceCell::new()],
            [OnceCell::new(), OnceCell::new()],
        ];

        let automaton_builder = AUTOMATON_BUILDER
            .get(self.distance as usize)
            .ok_or_else(|| {
                InvalidArgument(format!(
                    "Levenshtein distance of {} is not allowed. Choose a value less than {}",
                    self.distance,
                    AUTOMATON_BUILDER.len()
                ))
            })?
            .get(self.transposition_cost_one as usize)
            .unwrap()
            .get_or_init(|| {
                LevenshteinAutomatonBuilder::new(self.distance, self.transposition_cost_one)
            });

        let term_value = self.term.value();

        let term_text = if term_value.typ() == Type::Json {
            if let Some(json_path_type) = term_value.json_path_type() {
                if json_path_type != Type::Str {
                    return Err(InvalidArgument(format!(
                        "The fuzzy term query requires a string path type for a json term. Found \
                         {json_path_type:?}"
                    )));
                }
            }

            std::str::from_utf8(self.term.serialized_value_bytes()).map_err(|_| {
                InvalidArgument(
                    "Failed to convert json term value bytes to utf8 string.".to_string(),
                )
            })?
        } else {
            term_value.as_str().ok_or_else(|| {
                InvalidArgument("The fuzzy term query requires a string term.".to_string())
            })?
        };
        let automaton = if self.prefix {
            automaton_builder.build_prefix_dfa(term_text)
        } else {
            automaton_builder.build_dfa(term_text)
        };

        if let Some((json_path_bytes, _)) = term_value.as_json() {
            Ok(AutomatonWeight::new_for_json_path(
                self.term.field(),
                DfaWrapper(automaton),
                json_path_bytes,
            ))
        } else {
            Ok(AutomatonWeight::new(
                self.term.field(),
                DfaWrapper(automaton),
            ))
        }
    }
}

impl Query for FuzzyTermQuery {
    /// Builds the boxed weight for this query; the scoring mode is ignored.
    fn weight(&self, _enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let automaton_weight = self.specialized_weight()?;
        Ok(Box::new(automaton_weight))
    }
}

#[cfg(test)]
mod test {
    use super::FuzzyTermQuery;
    use crate::collector::{Count, TopDocs};
    use crate::indexer::NoMergePolicy;
    use crate::query::QueryParser;
    use crate::schema::{Schema, STORED, TEXT};
    use crate::{assert_nearly_equals, Index, IndexWriter, TantivyDocument, Term};

    // Checks that a fuzzy query on a JSON field only matches terms under the same JSON path,
    // and that the Levenshtein distance limit is still enforced on the value.
    #[test]
    pub fn test_fuzzy_json_path() -> crate::Result<()> {
        // # Defining the schema
        let mut schema_builder = Schema::builder();
        let attributes = schema_builder.add_json_field("attributes", TEXT | STORED);
        let schema = schema_builder.build();

        // # Indexing documents
        let index = Index::create_in_ram(schema.clone());

        let mut index_writer = index.writer_for_tests()?;
        index_writer.set_merge_policy(Box::new(NoMergePolicy));
        let doc = TantivyDocument::parse_json(
            &schema,
            r#"{
            "attributes": {
                "a": "japan"
            }
        }"#,
        )?;
        index_writer.add_document(doc)?;
        let doc = TantivyDocument::parse_json(
            &schema,
            r#"{
            "attributes": {
                "aa": "japan"
            }
        }"#,
        )?;
        index_writer.add_document(doc)?;
        index_writer.commit()?;

        let reader = index.reader()?;
        let searcher = reader.searcher();

        // # Fuzzy search
        let query_parser = QueryParser::for_index(&index, vec![attributes]);

        // Parses `query` and returns the first term it produces.
        let get_json_path_term = |query: &str| -> crate::Result<Term> {
            let query = query_parser.parse_query(query)?;
            let mut terms = Vec::new();
            query.query_terms(&mut |term, _| {
                terms.push(term.clone());
            });

            Ok(terms[0].clone())
        };

        // shall not match the first document due to json path mismatch
        {
            let term = get_json_path_term("attributes.aa:japan")?;
            let fuzzy_query = FuzzyTermQuery::new(term, 2, true);
            let top_docs =
                searcher.search(&fuzzy_query, &TopDocs::with_limit(2).order_by_score())?;
            assert_eq!(top_docs.len(), 1, "Expected only 1 document");
            assert_eq!(top_docs[0].1.doc_id, 1, "Expected the second document");
        }

        // shall match the first document because Levenshtein distance is 1 (substitute 'o' with
        // 'a')
        {
            let term = get_json_path_term("attributes.a:japon")?;

            let fuzzy_query = FuzzyTermQuery::new(term, 1, true);
            let top_docs =
                searcher.search(&fuzzy_query, &TopDocs::with_limit(2).order_by_score())?;
            assert_eq!(top_docs.len(), 1, "Expected only 1 document");
            assert_eq!(top_docs[0].1.doc_id, 0, "Expected the first document");
        }

        // shall not match because non-prefix Levenshtein distance is more than 1 (add 'a' and 'n')
        {
            let term = get_json_path_term("attributes.a:jap")?;

            let fuzzy_query = FuzzyTermQuery::new(term, 1, true);
            let top_docs =
                searcher.search(&fuzzy_query, &TopDocs::with_limit(2).order_by_score())?;
            assert_eq!(top_docs.len(), 0, "Expected no document");
        }

        Ok(())
    }

    // Checks whole-term and prefix fuzzy matching on a plain text field.
    #[test]
    pub fn test_fuzzy_term() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let country_field = schema_builder.add_text_field("country", TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            index_writer.add_document(doc!(
                country_field => "japan",
            ))?;
            index_writer.add_document(doc!(
                country_field => "korea",
            ))?;
            index_writer.commit()?;
        }
        let reader = index.reader()?;
        let searcher = reader.searcher();

        // passes because Levenshtein distance is 1 (substitute 'o' with 'a')
        {
            let term = Term::from_field_text(country_field, "japon");
            let fuzzy_query = FuzzyTermQuery::new(term, 1, true);
            let top_docs =
                searcher.search(&fuzzy_query, &TopDocs::with_limit(2).order_by_score())?;
            assert_eq!(top_docs.len(), 1, "Expected only 1 document");
            let (score, _) = top_docs[0];
            assert_nearly_equals!(1.0, score);
        }

        // fails because non-prefix Levenshtein distance is more than 1 (add 'a' and 'n')
        {
            let term = Term::from_field_text(country_field, "jap");

            let fuzzy_query = FuzzyTermQuery::new(term, 1, true);
            let top_docs =
                searcher.search(&fuzzy_query, &TopDocs::with_limit(2).order_by_score())?;
            assert_eq!(top_docs.len(), 0, "Expected no document");
        }

        // passes because prefix Levenshtein distance is 0
        {
            let term = Term::from_field_text(country_field, "jap");
            let fuzzy_query = FuzzyTermQuery::new_prefix(term, 1, true);
            let top_docs =
                searcher.search(&fuzzy_query, &TopDocs::with_limit(2).order_by_score())?;
            assert_eq!(top_docs.len(), 1, "Expected only 1 document");
            let (score, _) = top_docs[0];
            assert_nearly_equals!(1.0, score);
        }
        Ok(())
    }

    // "jaapn" is one transposition away from "japan": it must match at distance 1 only when a
    // transposition is counted as a single edit.
    #[test]
    pub fn test_fuzzy_term_transposition_cost_one() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let country_field = schema_builder.add_text_field("country", TEXT);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        index_writer.add_document(doc!(country_field => "japan"))?;
        index_writer.commit()?;
        let searcher = index.reader()?.searcher();
        let term_jaapn = Term::from_field_text(country_field, "jaapn");
        for (transposition_cost_one, expected_count) in [(true, 1), (false, 0)] {
            let fuzzy_query_transposition =
                FuzzyTermQuery::new(term_jaapn.clone(), 1, transposition_cost_one);
            let count = searcher.search(&fuzzy_query_transposition, &Count)?;
            assert_eq!(count, expected_count);
        }
        Ok(())
    }
}


================================================
FILE: src/query/intersection.rs
================================================
use super::size_hint::estimate_intersection;
use crate::docset::{DocSet, SeekDangerResult, TERMINATED};
use crate::query::term_query::TermScorer;
use crate::query::{EmptyScorer, Scorer};
use crate::{DocId, Score};

/// Builds a scorer over the intersection of the given scorers.
///
/// The score of a matching document is the sum of the scores of all the
/// `Scorer`s passed as argument.
///
/// Scorers are ordered by their estimated cost. When the two cheapest ones are
/// both `TermScorer`s, a specialized (statically typed) intersection is used
/// for better performance.
///
/// `num_docs_segment` is the number of documents in the segment. It is used for estimating the
/// `size_hint` of the intersection.
pub fn intersect_scorers(
    mut scorers: Vec<Box<dyn Scorer>>,
    num_docs_segment: u32,
) -> Box<dyn Scorer> {
    match scorers.len() {
        0 => return Box::new(EmptyScorer),
        1 => return scorers.pop().unwrap(),
        _ => {}
    }
    // Order by estimated cost to drive each scorer.
    scorers.sort_by_key(|scorer| scorer.cost());
    if go_to_first_doc(&mut scorers[..]) == TERMINATED {
        return Box::new(EmptyScorer);
    }
    // At least two scorers are left at this point.
    let left = scorers.remove(0);
    let right = scorers.remove(0);
    let others = scorers;
    if left.is::<TermScorer>() && right.is::<TermScorer>() {
        // Both downcasts are guaranteed to succeed thanks to the check above.
        let left_term = left.downcast::<TermScorer>().map_err(|_| ()).unwrap();
        let right_term = right.downcast::<TermScorer>().map_err(|_| ()).unwrap();
        return Box::new(Intersection {
            left: *left_term,
            right: *right_term,
            others,
            num_docs: num_docs_segment,
        });
    }
    Box::new(Intersection {
        left,
        right,
        others,
        num_docs: num_docs_segment,
    })
}

/// A `DocSet` that iterates through the intersection of two or more `DocSet`s.
///
/// The first two docsets (`left` and `right`) share the type `TDocSet`; any
/// additional docsets are stored in `others` with the type `TOtherDocSet`.
pub struct Intersection<TDocSet: DocSet, TOtherDocSet: DocSet = Box<dyn Scorer>> {
    // First docset; `doc()` and `cost()` of the intersection are read from it.
    left: TDocSet,
    // Second docset.
    right: TDocSet,
    // Remaining docsets, if any.
    others: Vec<TOtherDocSet>,
    // Number of documents in the segment, used for the `size_hint` estimate.
    num_docs: u32,
}

/// Advances all `docsets` until they are positioned on the same document, and returns it.
///
/// The search starts from the largest current document. Whenever a docset seeks past the
/// candidate, its new position becomes the candidate and the pass restarts from the first
/// docset.
///
/// # Panics
///
/// Panics if `docsets` is empty.
fn go_to_first_doc<TDocSet: DocSet>(docsets: &mut [TDocSet]) -> DocId {
    assert!(!docsets.is_empty());
    let mut candidate = docsets
        .iter()
        .map(|docset| docset.doc())
        .max()
        .unwrap();
    loop {
        // First docset that overshoots the candidate, if any; later docsets are left untouched.
        let overshoot = docsets
            .iter_mut()
            .find_map(|docset| (docset.seek(candidate) > candidate).then(|| docset.doc()));
        match overshoot {
            Some(next_candidate) => candidate = next_candidate,
            None => return candidate,
        }
    }
}

impl<TDocSet: DocSet> Intersection<TDocSet, TDocSet> {
    /// Builds the intersection of `docsets`, positioned on its first document.
    ///
    /// The docsets are sorted by cost before being aligned on their first common document.
    ///
    /// `num_docs` is the number of documents in the segment.
    ///
    /// # Panics
    ///
    /// Panics if fewer than two docsets are given.
    pub(crate) fn new(mut docsets: Vec<TDocSet>, num_docs: u32) -> Intersection<TDocSet, TDocSet> {
        assert!(docsets.len() >= 2);
        docsets.sort_by_key(|docset| docset.cost());
        go_to_first_doc(&mut docsets);
        let left = docsets.remove(0);
        // Unless the intersection is empty, every remaining docset must sit on left's document.
        debug_assert!({
            let aligned_doc = left.doc();
            aligned_doc == TERMINATED || docsets.iter().all(|docset| docset.doc() == aligned_doc)
        });
        let right = docsets.remove(0);
        Self {
            left,
            right,
            others: docsets,
            num_docs,
        }
    }
}

impl<TDocSet: DocSet> Intersection<TDocSet, TDocSet> {
    /// Returns a mutable reference to the docset at position `ord`.
    ///
    /// Position 0 is `left`, position 1 is `right`, and positions 2 and above index into
    /// `others`.
    ///
    /// # Panics
    ///
    /// Panics if `ord - 2` is out of bounds for `others`.
    pub(crate) fn docset_mut_specialized(&mut self, ord: usize) -> &mut TDocSet {
        if ord == 0 {
            return &mut self.left;
        }
        if ord == 1 {
            return &mut self.right;
        }
        &mut self.others[ord - 2]
    }
}

impl<TDocSet: DocSet, TOtherDocSet: DocSet> DocSet for Intersection<TDocSet, TOtherDocSet> {
    /// Moves to the next document present in all docsets and returns it, or `TERMINATED` if
    /// there is none.
    #[inline]
    fn advance(&mut self) -> DocId {
        let (left, right) = (&mut self.left, &mut self.right);

        // Invariant:
        // - candidate is always <= to the next document in the intersection.
        // - candidate strictly increases at every iteration of the loop.
        let mut candidate = left.doc() + 1;

        // Termination: candidate strictly increases.
        'outer: while candidate < TERMINATED {
            // As we enter the loop, we should always have candidate < next_doc.

            candidate = left.seek(candidate);

            // Left is positioned on `candidate`.
            debug_assert_eq!(left.doc(), candidate);

            if let SeekDangerResult::SeekLowerBound(seek_lower_bound) = right.seek_danger(candidate)
            {
                debug_assert!(
                    seek_lower_bound == TERMINATED || seek_lower_bound > candidate,
                    "seek_lower_bound {seek_lower_bound} must be greater than candidate \
                     {candidate}"
                );
                candidate = seek_lower_bound;
                continue;
            }

            // Left and right are positioned on `candidate`.
            debug_assert_eq!(right.doc(), candidate);

            for other in &mut self.others {
                if let SeekDangerResult::SeekLowerBound(seek_lower_bound) =
                    other.seek_danger(candidate)
                {
                    // One of the scorers does not match, let's restart at the top of the loop.
                    debug_assert!(
                        seek_lower_bound == TERMINATED || seek_lower_bound > candidate,
                        "seek_lower_bound {seek_lower_bound} must be greater than candidate \
                         {candidate}"
                    );
                    candidate = seek_lower_bound;
                    continue 'outer;
                }
            }

            // At this point all scorers are in a valid state, aligned on the next document in the
            // intersection.
            debug_assert!(self.others.iter().all(|docset| docset.doc() == candidate));
            return candidate;
        }

        // We make sure our docset is in a valid state.
        // In particular, we want .doc() to return TERMINATED.
        left.seek(TERMINATED);

        TERMINATED
    }

    /// Seeks `left` to `target`, then aligns every docset on the first document they all
    /// contain, and returns that document.
    fn seek(&mut self, target: DocId) -> DocId {
        self.left.seek(target);
        // Gather all docsets behind a common trait object so they can be aligned together.
        let mut docsets: Vec<&mut dyn DocSet> = vec![&mut self.left, &mut self.right];
        for docset in &mut self.others {
            docsets.push(docset);
        }
        let doc = go_to_first_doc(&mut docsets[..]);
        debug_assert!(docsets.iter().all(|docset| docset.doc() == doc));
        debug_assert!(doc >= target);
        doc
    }

    /// Seeks to the target if necessary and checks if the target is an exact match.
    ///
    /// Some implementations may choose to advance past the target if beneficial for performance.
    ///
    /// Returns `SeekDangerResult::Found` if every docset reports the target as found. Otherwise
    /// returns the first `SeekDangerResult::SeekLowerBound` reported, checking `left`, then
    /// `right`, then `others` in order; docsets after the one that reported it are not seeked.
    fn seek_danger(&mut self, target: DocId) -> SeekDangerResult {
        if let SeekDangerResult::SeekLowerBound(new_target) = self.left.seek_danger(target) {
            return SeekDangerResult::SeekLowerBound(new_target);
        }
        if let SeekDangerResult::SeekLowerBound(new_target) = self.right.seek_danger(target) {
            return SeekDangerResult::SeekLowerBound(new_target);
        }
        for docset in &mut self.others {
            if let SeekDangerResult::SeekLowerBound(new_target) = docset.seek_danger(target) {
                return SeekDangerResult::SeekLowerBound(new_target);
            }
        }
        SeekDangerResult::Found
    }

    /// Returns the current document, which is the current document of `left`.
    #[inline]
    fn doc(&self) -> DocId {
        self.left.doc()
    }

    /// Estimates the size of the intersection from the size hints of all docsets and the
    /// number of documents in the segment.
    fn size_hint(&self) -> u32 {
        estimate_intersection(
            [self.left.size_hint(), self.right.size_hint()]
                .into_iter()
                .chain(self.others.iter().map(DocSet::size_hint)),
            self.num_docs,
        )
    }

    /// Returns the cost of `left`, the docset driving the intersection.
    fn cost(&self) -> u64 {
        // What's the best way to compute the cost of an intersection?
        // For now we take the cost of the docset driver, which is the first docset.
        // If there are docsets that are bad at skipping, they should also influence the cost.
        self.left.cost()
    }
}

impl<TScorer, TOtherScorer> Scorer for Intersection<TScorer, TOtherScorer>
where
    TScorer: Scorer,
    TOtherScorer: Scorer,
{
    /// Returns the sum of the scores of all the underlying scorers.
    #[inline]
    fn score(&mut self) -> Score {
        let left_score = self.left.score();
        let right_score = self.right.score();
        let others_score: Score = self.others.iter_mut().map(|scorer| scorer.score()).sum();
        left_score + right_score + others_score
    }
}

#[cfg(test)]
mod tests {
    use proptest::prelude::*;

    use super::Intersection;
    use crate::collector::Count;
    use crate::docset::{DocSet, TERMINATED};
    use crate::postings::tests::test_skip_against_unoptimized;
    use crate::query::{QueryParser, VecDocSet};
    use crate::schema::{Schema, TEXT};
    use crate::Index;

    // Checks the documents produced by intersections of two and three docsets.
    #[test]
    fn test_intersection() {
        // Two docsets: the common documents are 3 and 9.
        {
            let left = VecDocSet::from(vec![1, 3, 9]);
            let right = VecDocSet::from(vec![3, 4, 9, 18]);
            let mut intersection = Intersection::new(vec![left, right], 10);
            assert_eq!(intersection.doc(), 3);
            assert_eq!(intersection.advance(), 9);
            assert_eq!(intersection.doc(), 9);
            assert_eq!(intersection.advance(), TERMINATED);
        }
        // Three docsets: the only common document is 9.
        {
            let a = VecDocSet::from(vec![1, 3, 9]);
            let b = VecDocSet::from(vec![3, 4, 9, 18]);
            let c = VecDocSet::from(vec![1, 5, 9, 111]);
            let mut intersection = Intersection::new(vec![a, b, c], 10);
            assert_eq!(intersection.doc(), 9);
            assert_eq!(intersection.advance(), TERMINATED);
        }
    }

    // Document 0 must be reported as the first (and only) document of the intersection.
    #[test]
    fn test_intersection_zero() {
        let docsets = vec![VecDocSet::from(vec![0]), VecDocSet::from(vec![0])];
        let mut intersection = Intersection::new(docsets, 10);
        assert_eq!(intersection.doc(), 0);
        assert_eq!(intersection.advance(), TERMINATED);
    }

    // Seeking to a document present in both docsets must land exactly on it.
    #[test]
    fn test_intersection_skip() {
        let docsets = vec![
            VecDocSet::from(vec![0, 1, 2, 4]),
            VecDocSet::from(vec![2, 5]),
        ];
        let mut intersection = Intersection::new(docsets, 10);
        let reached_doc = intersection.seek(2);
        assert_eq!(reached_doc, 2);
        assert_eq!(intersection.doc(), 2);
    }

    // Runs the shared `test_skip_against_unoptimized` helper on several intersections, each
    // with a list of seek targets.
    #[test]
    fn test_intersection_skip_against_unoptimized() {
        // Two docsets with no common document.
        test_skip_against_unoptimized(
            || {
                let left = VecDocSet::from(vec![4]);
                let right = VecDocSet::from(vec![2, 5]);
                Box::new(Intersection::new(vec![left, right], 10))
            },
            vec![0, 2, 4, 5, 6],
        );
        // Two docsets that were already advanced before building the intersection.
        test_skip_against_unoptimized(
            || {
                let mut left = VecDocSet::from(vec![1, 4, 5, 6]);
                let mut right = VecDocSet::from(vec![2, 5, 10]);
                left.advance();
                right.advance();
                Box::new(Intersection::new(vec![left, right], 10))
            },
            vec![0, 1, 2, 3, 4, 5, 6, 7, 10, 11],
        );
        // Five docsets, so that `others` is populated as well.
        test_skip_against_unoptimized(
            || {
                Box::new(Intersection::new(
                    vec![
                        VecDocSet::from(vec![1, 4, 5, 6]),
                        VecDocSet::from(vec![1, 2, 5, 6]),
                        VecDocSet::from(vec![1, 4, 5, 6]),
                        VecDocSet::from(vec![1, 5, 6]),
                        VecDocSet::from(vec![2, 4, 5, 7, 8]),
                    ],
                    10,
                ))
            },
            vec![0, 1, 2, 3, 4, 5, 6, 7, 10, 11],
        );
    }

    // No document is shared by all three docsets, so the intersection starts terminated.
    #[test]
    fn test_intersection_empty() {
        let docsets = vec![
            VecDocSet::from(vec![1, 3]),
            VecDocSet::from(vec![1, 4]),
            VecDocSet::from(vec![3, 9]),
        ];
        let intersection = Intersection::new(docsets, 10);
        assert_eq!(intersection.doc(), TERMINATED);
    }

    // Collects every document of a three-way intersection; only document 3 is shared.
    #[test]
    fn test_intersection_abc() {
        let a = VecDocSet::from(vec![2, 3, 6]);
        let b = VecDocSet::from(vec![1, 3, 5]);
        let c = VecDocSet::from(vec![1, 3, 5]);
        let mut intersection = Intersection::new(vec![c, b, a], 10);
        let mut docs = Vec::new();
        loop {
            let current_doc = intersection.doc();
            if current_doc == TERMINATED {
                break;
            }
            docs.push(current_doc);
            intersection.advance();
        }
        assert_eq!(&docs, &[3]);
    }

    // Checks that iterating an intersection whose `others` contain a buffered union and a
    // mismatching scorer reaches TERMINATED (the final loop must end).
    #[test]
    fn test_intersection_termination() {
        use crate::query::score_combiner::DoNothingCombiner;
        use crate::query::{BufferedUnionScorer, ConstScorer, VecDocSet};

        let a1 = ConstScorer::new(VecDocSet::from(vec![0u32, 10000]), 1.0);
        let a2 = ConstScorer::new(VecDocSet::from(vec![0u32, 10000]), 1.0);

        let mut b_scorers = vec![];
        for _ in 0..2 {
            // Union matches 0 and 10000.
            b_scorers.push(ConstScorer::new(VecDocSet::from(vec![0, 10000]), 1.0));
        }
        // That's the union of two scorers matching 0 and 10_000.
        let union = BufferedUnionScorer::build(b_scorers, DoNothingCombiner::default, 30000);

        // Mismatching scorer: matches 0 and 20000. We then append more docs at the end to ensure it
        // is last.
        let mut m_docs = vec![0, 20000];
        for i in 30000..30100 {
            m_docs.push(i);
        }
        let m = ConstScorer::new(VecDocSet::from(m_docs), 1.0);

        // Costs: A1=2, A2=2, Union=4, M=102.
        // Sorted: A1, A2, Union, M.
        // Left=A1, Right=A2, Others=[Union, M].
        let mut intersection = crate::query::intersect_scorers(
            vec![Box::new(a1), Box::new(a2), Box::new(union), Box::new(m)],
            40000,
        );

        while intersection.doc() != TERMINATED {
            intersection.advance();
        }
    }

    // Proptest strategy producing strictly increasing vectors of u32 document IDs: up to
    // `max_size` (exclusive) values below `max_val` are drawn, then sorted and deduplicated.
    fn sorted_deduped_vec(max_val: u32, max_size: usize) -> impl Strategy<Value = Vec<u32>> {
        let raw_docs = prop::collection::vec(0..max_val, 0..max_size);
        raw_docs.prop_map(|mut doc_ids| {
            doc_ids.sort_unstable();
            doc_ids.dedup();
            doc_ids
        })
    }

    proptest! {
        // For any two sorted, deduplicated docsets, iterating the intersection must yield
        // exactly the documents of `a` that are also in `b`, in order, then TERMINATED.
        #[test]
        fn prop_test_intersection_consistency(
            a in sorted_deduped_vec(100, 10),
            b in sorted_deduped_vec(100, 10),
            num_docs in 100u32..500u32
        ) {
            let left = VecDocSet::from(a.clone());
            let right = VecDocSet::from(b.clone());
            let mut intersection = Intersection::new(vec![left, right], num_docs);

            // Reference result computed naively.
            let expected: Vec<u32> = a.iter()
                .cloned()
                .filter(|doc| b.contains(doc))
                .collect();

            for expected_doc in expected {
                assert_eq!(intersection.doc(), expected_doc);
                intersection.advance();
            }
            assert_eq!(intersection.doc(), TERMINATED);
        }
    }

    // Regression test for bug 2811: a required term combined with a required phrase must
    // match only the single document containing both.
    #[test]
    fn test_bug_2811_intersection_candidate_should_increase() {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let schema = schema_builder.build();

        let index = Index::create_in_ram(schema);
        let mut writer = index.writer_for_tests().unwrap();
        writer
            .add_document(doc!(text_field=>"hello happy tax"))
            .unwrap();
        writer.add_document(doc!(text_field=>"hello")).unwrap();
        writer.add_document(doc!(text_field=>"hello")).unwrap();
        writer.add_document(doc!(text_field=>"happy tax")).unwrap();

        writer.commit().unwrap();
        let query_parser = QueryParser::for_index(&index, Vec::new());
        let query = query_parser
            .parse_query(r#"+text:hello +text:"happy tax""#)
            .unwrap();
        let searcher = index.reader().unwrap().searcher();
        let c = searcher.search(&*query, &Count).unwrap();
        // Only the first document contains both "hello" and the phrase "happy tax".
        assert_eq!(c, 1);
    }
}


================================================
FILE: src/query/mod.rs
================================================
mod all_query;
mod automaton_weight;
mod bitset;
mod bm25;
mod boolean_query;
mod boost_query;
mod const_score_query;
mod disjunction;
mod disjunction_max_query;
mod empty_query;
mod exclude;
mod exist_query;
mod explanation;
mod fuzzy_query;
mod intersection;
mod more_like_this;
mod phrase_prefix_query;
mod phrase_query;
mod query;
mod query_parser;
mod range_query;
mod regex_query;
mod reqopt_scorer;
mod scorer;
mod set_query;
mod size_hint;
mod term_query;
mod union;
mod weight;

#[cfg(test)]
mod vec_docset;

pub(crate) mod score_combiner;
pub use query_grammar::Occur;

pub use self::all_query::{AllQuery, AllScorer, AllWeight};
pub use self::automaton_weight::AutomatonWeight;
pub use self::bitset::BitSetDocSet;
pub use self::bm25::{Bm25StatisticsProvider, Bm25Weight};
pub use self::boolean_query::{BooleanQuery, BooleanWeight};
pub use self::boost_query::{BoostQuery, BoostWeight};
pub use self::const_score_query::{ConstScoreQuery, ConstScorer};
pub use self::disjunction_max_query::DisjunctionMaxQuery;
pub use self::empty_query::{EmptyQuery, EmptyScorer, EmptyWeight};
pub use self::exclude::{Exclude, ExclusionSet};
pub use self::exist_query::ExistsQuery;
pub use self::explanation::Explanation;
#[cfg(test)]
pub(crate) use self::fuzzy_query::DfaWrapper;
pub use self::fuzzy_query::FuzzyTermQuery;
pub use self::intersection::{intersect_scorers, Intersection};
pub use self::more_like_this::{MoreLikeThisQuery, MoreLikeThisQueryBuilder};
pub use self::phrase_prefix_query::PhrasePrefixQuery;
pub use self::phrase_query::regex_phrase_query::{wildcard_query_to_regex_str, RegexPhraseQuery};
pub use self::phrase_query::PhraseQuery;
pub use self::query::{EnableScoring, Query, QueryClone};
pub use self::query_parser::{QueryParser, QueryParserError};
pub use self::range_query::*;
pub use self::regex_query::RegexQuery;
pub use self::reqopt_scorer::RequiredOptionalScorer;
pub use self::score_combiner::{DisjunctionMaxCombiner, ScoreCombiner, SumCombiner};
pub use self::scorer::Scorer;
pub use self::set_query::TermSetQuery;
pub use self::term_query::TermQuery;
pub use self::union::BufferedUnionScorer;
#[cfg(test)]
pub use self::vec_docset::VecDocSet;
pub use self::weight::Weight;

#[cfg(test)]
mod tests {
    use crate::collector::TopDocs;
    use crate::query::phrase_query::tests::create_index;
    use crate::query::QueryParser;
    use crate::schema::{Schema, TEXT};
    use crate::{DocAddress, Index, Term};

    // Checks queries that mix intersections (AND) and unions (OR) on a small index.
    #[test]
    pub fn test_mixed_intersection_and_union() -> crate::Result<()> {
        let index = create_index(&["a b", "a c", "a b c", "b"])?;
        let schema = index.schema();
        let text_field = schema.get_field("text").unwrap();
        let searcher = index.reader()?.searcher();

        // Runs the query and returns the doc ids of the top 10 documents, ordered by score.
        let do_search = |term: &str| {
            let query = QueryParser::for_index(&index, vec![text_field])
                .parse_query(term)
                .unwrap();
            let top_docs: Vec<(f32, DocAddress)> = searcher
                .search(&query, &TopDocs::with_limit(10).order_by_score())
                .unwrap();

            top_docs.iter().map(|el| el.1.doc_id).collect::<Vec<_>>()
        };

        assert_eq!(do_search("a AND b"), vec![0, 2]);
        assert_eq!(do_search("(a OR b) AND C"), vec![2, 1]);
        // The intersection code has a special code path for more than 2 docsets:
        // left, right + others.
        // This query places a union in the "others" part of the intersection, so that
        // seek_into_the_danger_zone is called on it.
        assert_eq!(
            do_search("(a OR b) AND (c OR a) AND (b OR c)"),
            vec![2, 1, 0]
        );

        Ok(())
    }

    // Same queries as the small mixed intersection/union test, but with 5000 filler documents
    // between the interesting ones to exercise the 4096 skip in BufferedUnionScorer.
    #[test]
    pub fn test_mixed_intersection_and_union_with_skip() -> crate::Result<()> {
        let filler = std::iter::repeat("z z").take(5000);
        let data: Vec<&str> = std::iter::once("a b")
            .chain(filler.clone())
            .chain(std::iter::once("a c"))
            .chain(filler)
            .chain(["a b c", "b"])
            .collect();
        let index = create_index(&data)?;
        let text_field = index.schema().get_field("text").unwrap();
        let searcher = index.reader()?.searcher();

        // Runs the query and returns the doc ids of the top 10 documents, ordered by score.
        let do_search = |query_str: &str| {
            let query_parser = QueryParser::for_index(&index, vec![text_field]);
            let query = query_parser.parse_query(query_str).unwrap();
            let top_docs: Vec<(f32, DocAddress)> = searcher
                .search(&query, &TopDocs::with_limit(10).order_by_score())
                .unwrap();

            top_docs
                .iter()
                .map(|(_score, doc_address)| doc_address.doc_id)
                .collect::<Vec<_>>()
        };

        assert_eq!(do_search("a AND b"), vec![0, 10002]);
        assert_eq!(do_search("(a OR b) AND C"), vec![10002, 5001]);
        // The intersection code has a special code path for more than 2 docsets:
        // left, right + others.
        // This query places a union in the "others" part of the intersection, so that
        // seek_into_the_danger_zone is called on it.
        assert_eq!(
            do_search("(a OR b) AND (c OR a) AND (b OR c)"),
            vec![10002, 5001, 0]
        );

        Ok(())
    }

    // Checks the (term, flag) pairs reported by `Query::query_terms` for several parsed
    // queries. In these cases the flag is `true` only for phrase terms.
    #[test]
    fn test_query_terms() {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let query_parser = QueryParser::for_index(&index, vec![text_field]);
        let term_a = Term::from_field_text(text_field, "a");
        let term_b = Term::from_field_text(text_field, "b");
        // Single term.
        {
            let query = query_parser.parse_query("a").unwrap();
            let mut terms = Vec::new();
            query.query_terms(&mut |term, pos| terms.push((term, pos)));
            assert_eq!(vec![(&term_a, false)], terms);
        }
        // Two terms.
        {
            let query = query_parser.parse_query("a b").unwrap();
            let mut terms = Vec::new();
            query.query_terms(&mut |term, pos| terms.push((term, pos)));
            assert_eq!(vec![(&term_a, false), (&term_b, false)], terms);
        }
        // Phrase query: the flag is set for both terms.
        {
            let query = query_parser.parse_query("\"a b\"").unwrap();
            let mut terms = Vec::new();
            query.query_terms(&mut |term, pos| terms.push((term, pos)));
            assert_eq!(vec![(&term_a, true), (&term_b, true)], terms);
        }
        // A repeated term is reported only once.
        {
            let query = query_parser.parse_query("a a a a a").unwrap();
            let mut terms = Vec::new();
            query.query_terms(&mut |term, pos| terms.push((term, pos)));
            assert_eq!(vec![(&term_a, false); 1], terms);
        }
        // An excluded term is still reported.
        {
            let query = query_parser.parse_query("a -b").unwrap();
            let mut terms = Vec::new();
            query.query_terms(&mut |term, pos| terms.push((term, pos)));
            assert_eq!(vec![(&term_a, false), (&term_b, false)], terms);
        }
    }
}


================================================
FILE: src/query/more_like_this/mod.rs
================================================
mod more_like_this;

/// Module containing the different query implementations.
mod query;

pub use self::more_like_this::MoreLikeThis;
pub use self::query::{MoreLikeThisQuery, MoreLikeThisQueryBuilder};


================================================
FILE: src/query/more_like_this/more_like_this.rs
================================================
use std::cmp::Reverse;
use std::collections::{BinaryHeap, HashMap};

use tokenizer_api::Token;

use crate::query::bm25::idf;
use crate::query::{BooleanQuery, BoostQuery, Occur, Query, TermQuery};
use crate::schema::document::{Document, Value};
use crate::schema::{Field, FieldType, IndexRecordOption, Term};
use crate::tokenizer::{FacetTokenizer, PreTokenizedStream, TokenStream, Tokenizer};
use crate::{DocAddress, Result, Searcher, TantivyDocument, TantivyError};

/// A candidate query term paired with the score computed for it.
///
/// The `Ord` implementation of this type compares the `score` only, whereas the derived
/// `PartialEq` compares both fields.
#[derive(Debug, PartialEq)]
struct ScoreTerm {
    /// The term that may end up in the generated query.
    pub term: Term,
    /// Score assigned to the term; higher means more significant.
    pub score: f32,
}

impl ScoreTerm {
    fn new(term: Term, score: f32) -> Self {
        Self { term, score }
    }
}

// `f32` does not implement `Eq`, so it cannot be derived here; this marker impl is needed
// because `Ord` requires `Eq`.
impl Eq for ScoreTerm {}

impl PartialOrd for ScoreTerm {
    /// Delegates to the total order defined by `Ord`, so the result is always `Some`.
    fn partial_cmp(&self, other: &Self) -> Option<std::cmp::Ordering> {
        Some(Ord::cmp(self, other))
    }
}

impl Ord for ScoreTerm {
    /// Orders by `score` only; scores that cannot be compared (NaN) count as equal.
    fn cmp(&self, other: &Self) -> std::cmp::Ordering {
        match self.score.partial_cmp(&other.score) {
            Some(ordering) => ordering,
            None => std::cmp::Ordering::Equal,
        }
    }
}

/// Helper used to build a [`MoreLikeThisQuery`](crate::query::MoreLikeThisQuery).
///
/// This more-like-this implementation is inspired by Apache Lucene and closely follows
/// its implementation, adapted to Tantivy's vocabulary and API.
///
/// Every `Option` setting is a filter or limit that is skipped when it is `None`.
///
/// [MoreLikeThis](https://github.com/apache/lucene/blob/main/lucene/queries/src/java/org/apache/lucene/queries/mlt/MoreLikeThis.java#L147)
/// [MoreLikeThisQuery](https://github.com/apache/lucene/blob/main/lucene/queries/src/java/org/apache/lucene/queries/mlt/MoreLikeThisQuery.java#L36)
#[derive(Debug, Clone)]
pub struct MoreLikeThis {
    /// Ignore words which do not occur in at least this many docs.
    pub min_doc_frequency: Option<u64>,
    /// Ignore words which occur in more than this many docs.
    pub max_doc_frequency: Option<u64>,
    /// Ignore words that occur fewer than this many times in the source field values.
    pub min_term_frequency: Option<usize>,
    /// Don't return a query longer than this.
    pub max_query_terms: Option<usize>,
    /// Ignore words shorter than this length (measured in bytes of the word).
    pub min_word_length: Option<usize>,
    /// Ignore words longer than this length (measured in bytes of the word).
    pub max_word_length: Option<usize>,
    /// Boost factor to use when boosting the terms.
    ///
    /// When set, every term query is boosted by `score * boost_factor / best_score`;
    /// when `None`, the term queries are not boosted.
    pub boost_factor: Option<f32>,
    /// Current set of stop words; a word is ignored when it exactly equals one of them.
    pub stop_words: Vec<String>,
}

impl Default for MoreLikeThis {
    fn default() -> Self {
        Self {
            min_doc_frequency: Some(5),
            max_doc_frequency: None,
            min_term_frequency: Some(2),
            max_query_terms: Some(25),
            min_word_length: None,
            max_word_length: None,
            boost_factor: Some(1.0),
            stop_words: vec![],
        }
    }
}

impl MoreLikeThis {
    /// Builds a [`BooleanQuery`] from the terms of the stored document found at
    /// `doc_address`.
    ///
    /// # Errors
    ///
    /// Fails when the terms cannot be retrieved from the document.
    pub fn query_with_document(
        &self,
        searcher: &Searcher,
        doc_address: DocAddress,
    ) -> Result<BooleanQuery> {
        self.retrieve_terms_from_doc_address(searcher, doc_address)
            .map(|score_terms| self.create_query(score_terms))
    }

    /// Builds a [`BooleanQuery`] from the terms found in the given field values.
    ///
    /// # Errors
    ///
    /// Fails when the terms cannot be retrieved from `doc_fields`, for instance when
    /// `doc_fields` is empty.
    pub fn query_with_document_fields<'a, V: Value<'a>>(
        &self,
        searcher: &Searcher,
        doc_fields: &[(Field, Vec<V>)],
    ) -> Result<BooleanQuery> {
        self.retrieve_terms_from_doc_fields(searcher, doc_fields)
            .map(|score_terms| self.create_query(score_terms))
    }

    /// Creates a [`BooleanQuery`] from an ascendingly sorted list of ScoreTerm
    /// This will map the list of ScoreTerm to a list of [`TermQuery`]  and compose a
    /// BooleanQuery using that list as sub queries.
    fn create_query(&self, mut score_terms: Vec<ScoreTerm>) -> BooleanQuery {
        score_terms.sort_by(|left_ts, right_ts| right_ts.cmp(left_ts));
        let best_score = score_terms.first().map_or(1f32, |x| x.score);
        let mut queries = Vec::new();

        for ScoreTerm { term, score } in score_terms {
            let mut query: Box<dyn Query> =
                Box::new(TermQuery::new(term, IndexRecordOption::Basic));
            if let Some(factor) = self.boost_factor {
                query = Box::new(BoostQuery::new(query, score * factor / best_score));
            }
            queries.push((Occur::Should, query));
        }
        BooleanQuery::from(queries)
    }

    /// Finds the terms for a more-like-this query from a stored document.
    ///
    /// The document at `doc_address` is loaded from the doc store and its field values
    /// are handed to `retrieve_terms_from_doc_fields`.
    fn retrieve_terms_from_doc_address(
        &self,
        searcher: &Searcher,
        doc_address: DocAddress,
    ) -> Result<Vec<ScoreTerm>> {
        let stored_doc: TantivyDocument = searcher.doc(doc_address)?;
        let sorted_field_values = stored_doc.get_sorted_field_values();
        self.retrieve_terms_from_doc_fields(searcher, &sorted_field_values)
    }

    /// Finds terms for a more-like-this query.
    /// field_to_field_values is a mapping from field to possible values of that field.
    fn retrieve_terms_from_doc_fields<'a, V: Value<'a>>(
        &self,
        searcher: &Searcher,
        field_to_values: &[(Field, Vec<V>)],
    ) -> Result<Vec<ScoreTerm>> {
        if field_to_values.is_empty() {
            return Err(TantivyError::InvalidArgument(
                "Cannot create more like this query on empty field values. The document may not \
                 have stored fields"
                    .to_string(),
            ));
        }
        let mut field_to_term_freq_map = HashMap::new();
        for (field, values) in field_to_values {
            self.add_term_frequencies(searcher, *field, values, &mut field_to_term_freq_map)?;
        }
        self.create_score_term(searcher, field_to_term_freq_map)
    }

    /// Extracts the terms of `values` for `field` and adds their counts to
    /// `term_frequencies`.
    ///
    /// A single field value can produce several terms. Terms considered noise by
    /// `is_noise_word` are not counted. Depending on the field type:
    ///
    /// - fields that are not indexed are skipped entirely;
    /// - facet values go through the [`FacetTokenizer`];
    /// - text values go through the tokenizer configured for the field (text values are
    ///   skipped when no tokenizer is found), pre-tokenized values contribute their tokens;
    /// - `u64`, `i64` and `f64` values become one term each, the noise check being applied
    ///   to their `to_string()` form;
    /// - date values become one term each, without any noise check;
    /// - every other field type is ignored.
    ///
    /// # Errors
    ///
    /// Returns [`TantivyError::InvalidArgument`] when a value does not have the type
    /// expected by a facet, `u64`, `i64`, `f64` or date field.
    fn add_term_frequencies<'a, V: Value<'a>>(
        &self,
        searcher: &Searcher,
        field: Field,
        values: &[V],
        term_frequencies: &mut HashMap<Term, usize>,
    ) -> Result<()> {
        let schema = searcher.schema();
        let tokenizer_manager = searcher.index().tokenizers();

        let field_entry = schema.get_field_entry(field);
        if !field_entry.is_indexed() {
            return Ok(());
        }

        // extract the raw value, possibly tokenizing & filtering to update the term frequency map
        match field_entry.field_type() {
            FieldType::Facet(_) => {
                let facets: Vec<&str> = values
                    .iter()
                    .map(|value| {
                        value.as_facet().ok_or_else(|| {
                            TantivyError::InvalidArgument("invalid field value".to_string())
                        })
                    })
                    .collect::<Result<Vec<_>>>()?;
                for fake_str in facets {
                    FacetTokenizer::default()
                        .token_stream(fake_str)
                        .process(&mut |token| {
                            // Count the tokens that are NOT noise, like every other branch
                            // does. The condition used to be inverted, which dropped all
                            // the meaningful facet tokens.
                            if !self.is_noise_word(token.text.clone()) {
                                let term = Term::from_field_text(field, &token.text);
                                *term_frequencies.entry(term).or_default() += 1;
                            }
                        });
                }
            }
            FieldType::Str(text_options) => {
                let mut tokenizer_opt = text_options
                    .get_indexing_options()
                    .map(|options| options.tokenizer())
                    .and_then(|tokenizer_name| tokenizer_manager.get(tokenizer_name));

                // Shared by the tokenized and the pre-tokenized paths below.
                let sink = &mut |token: &Token| {
                    if !self.is_noise_word(token.text.clone()) {
                        let term = Term::from_field_text(field, &token.text);
                        *term_frequencies.entry(term).or_default() += 1;
                    }
                };

                // TODO: Validate these changes align with the HEAD branch.
                for value in values {
                    if let Some(text) = value.as_str() {
                        // Without a tokenizer there is nothing to extract from raw text.
                        let tokenizer = match &mut tokenizer_opt {
                            None => continue,
                            Some(tokenizer) => tokenizer,
                        };

                        let mut token_stream = tokenizer.token_stream(text);
                        token_stream.process(sink);
                    } else if let Some(tok_str) = value.as_pre_tokenized_text() {
                        let mut token_stream = PreTokenizedStream::from(*tok_str.clone());
                        token_stream.process(sink);
                    }
                }
            }
            FieldType::U64(_) => {
                for value in values {
                    let val = value.as_u64().ok_or_else(|| {
                        TantivyError::InvalidArgument("invalid value".to_string())
                    })?;
                    if !self.is_noise_word(val.to_string()) {
                        let term = Term::from_field_u64(field, val);
                        *term_frequencies.entry(term).or_default() += 1;
                    }
                }
            }
            FieldType::Date(_) => {
                for value in values {
                    let timestamp = value.as_datetime().ok_or_else(|| {
                        TantivyError::InvalidArgument("invalid value".to_string())
                    })?;
                    let term = Term::from_field_date_for_search(field, timestamp);
                    *term_frequencies.entry(term).or_default() += 1;
                }
            }
            FieldType::I64(_) => {
                for value in values {
                    let val = value.as_i64().ok_or_else(|| {
                        TantivyError::InvalidArgument("invalid value".to_string())
                    })?;
                    if !self.is_noise_word(val.to_string()) {
                        let term = Term::from_field_i64(field, val);
                        *term_frequencies.entry(term).or_default() += 1;
                    }
                }
            }
            FieldType::F64(_) => {
                for value in values {
                    let val = value.as_f64().ok_or_else(|| {
                        TantivyError::InvalidArgument("invalid value".to_string())
                    })?;
                    if !self.is_noise_word(val.to_string()) {
                        let term = Term::from_field_f64(field, val);
                        *term_frequencies.entry(term).or_default() += 1;
                    }
                }
            }
            // The remaining field types do not contribute any term.
            _ => {}
        }
        Ok(())
    }

    /// Returns `true` when `word` must be ignored according to the "more-like-this"
    /// settings.
    ///
    /// A word is noise when it is empty, when its byte length is below `min_word_length`
    /// or above `max_word_length` (bounds that are `None` are not checked), or when it is
    /// one of the `stop_words`.
    fn is_noise_word(&self, word: String) -> bool {
        let word_length = word.len();
        let too_short = matches!(self.min_word_length, Some(min) if word_length < min);
        let too_long = matches!(self.max_word_length, Some(max) if word_length > max);
        word_length == 0 || too_short || too_long || self.stop_words.contains(&word)
    }

    /// Scores the collected terms and keeps the most significant ones.
    ///
    /// A term is dropped when its frequency is below `min_term_frequency`, when its
    /// document frequency is below `min_doc_frequency`, above `max_doc_frequency`, or
    /// zero. The score of a remaining term is `term_frequency * idf(doc_freq, num_docs)`,
    /// where `num_docs` is summed over all the segments of `searcher`.
    ///
    /// When `max_query_terms` is set, at most that many terms are returned: once the limit
    /// is reached, a new term only gets in by replacing the lowest-scored retained term,
    /// and only if its own score is strictly higher. A limit of `0` yields no term.
    ///
    /// The returned terms are in no particular order.
    ///
    /// # Errors
    ///
    /// Forwards any error raised while reading a document frequency.
    fn create_score_term(
        &self,
        searcher: &Searcher,
        per_field_term_frequencies: HashMap<Term, usize>,
    ) -> Result<Vec<ScoreTerm>> {
        // `Reverse` turns the max-heap into a min-heap: the root is the least significant
        // term retained so far.
        let mut score_terms: BinaryHeap<Reverse<ScoreTerm>> = BinaryHeap::new();
        let num_docs = searcher
            .segment_readers()
            .iter()
            .map(|segment_reader| segment_reader.num_docs() as u64)
            .sum::<u64>();

        // The map is owned, so the terms can be moved out of it rather than cloned.
        for (term, term_frequency) in per_field_term_frequencies {
            // ignore terms with less than min_term_frequency
            if self
                .min_term_frequency
                .is_some_and(|min_term_frequency| term_frequency < min_term_frequency)
            {
                continue;
            }

            let doc_freq = searcher.doc_freq(&term)?;

            // ignore terms with less than min_doc_frequency
            if self
                .min_doc_frequency
                .is_some_and(|min_doc_frequency| doc_freq < min_doc_frequency)
            {
                continue;
            }

            // ignore terms with more than max_doc_frequency
            if self
                .max_doc_frequency
                .is_some_and(|max_doc_frequency| doc_freq > max_doc_frequency)
            {
                continue;
            }

            // ignore terms with zero frequency
            if doc_freq == 0 {
                continue;
            }

            // compute similarity & score
            let score = (term_frequency as f32) * idf(doc_freq, num_docs);
            let candidate = Reverse(ScoreTerm::new(term, score));
            match self.max_query_terms {
                // The heap is full (`>=`, not `>`, otherwise it would hold `limit + 1`
                // terms): the candidate may only replace the least significant term.
                Some(limit) if score_terms.len() >= limit => {
                    // `peek_mut` is `None` only for a limit of 0, in which case no term
                    // is kept at all.
                    if let Some(mut least_significant) = score_terms.peek_mut() {
                        if least_significant.0.score < score {
                            *least_significant = candidate;
                        }
                    }
                }
                _ => score_terms.push(candidate),
            }
        }

        let score_terms_vec: Vec<ScoreTerm> = score_terms
            .into_iter()
            .map(|Reverse(score_term)| score_term)
            .collect();

        Ok(score_terms_vec)
    }
}


================================================
FILE: src/query/more_like_this/query.rs
================================================
use std::fmt::Debug;

use super::MoreLikeThis;
use crate::query::{EnableScoring, Query, Weight};
use crate::schema::{Field, OwnedValue};
use crate::DocAddress;

/// A query that matches all of the documents similar to a document
/// or a set of field values provided.
///
/// The query is turned into a boolean query when its weight is created, which requires
/// scoring to be enabled: creating the weight with scoring disabled returns an error.
///
/// # Examples
///
/// ```
/// use tantivy::DocAddress;
/// use tantivy::query::MoreLikeThisQuery;
///
/// let query = MoreLikeThisQuery::builder()
///     .with_min_doc_frequency(1)
///     .with_max_doc_frequency(10)
///     .with_min_term_frequency(1)
///     .with_min_word_length(2)
///     .with_max_word_length(5)
///     .with_boost_factor(1.0)
///     .with_stop_words(vec!["for".to_string()])
///     .with_document(DocAddress::new(2, 1));
/// ```
#[derive(Debug, Clone)]
pub struct MoreLikeThisQuery {
    // Settings used to select and score the terms.
    mlt: MoreLikeThis,
    // Where the terms are taken from.
    target: TargetDocument,
}

/// The source of the terms of a [`MoreLikeThisQuery`].
#[derive(Debug, Clone, PartialEq)]
enum TargetDocument {
    /// Use the document found at this address.
    DocumentAddress(DocAddress),
    /// Use these field values, given as `(field, values)` pairs.
    DocumentFields(Vec<(Field, Vec<OwnedValue>)>),
}

impl MoreLikeThisQuery {
    /// Creates a new builder.
    pub fn builder() -> MoreLikeThisQueryBuilder {
        MoreLikeThisQueryBuilder::default()
    }
}

impl Query for MoreLikeThisQuery {
    fn weight(&self, enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let searcher = match enable_scoring {
            EnableScoring::Enabled { searcher, .. } => searcher,
            EnableScoring::Disabled { .. } => {
                let err = "MoreLikeThisQuery requires to enable scoring.".to_string();
                return Err(crate::TantivyError::InvalidArgument(err));
            }
        };
        match &self.target {
            TargetDocument::DocumentAddress(doc_address) => self
                .mlt
                .query_with_document(searcher, *doc_address)?
                .weight(enable_scoring),
            TargetDocument::DocumentFields(doc_fields) => {
                let values = doc_fields
                    .iter()
                    .map(|(field, values)| (*field, values.iter().collect::<Vec<&OwnedValue>>()))
                    .collect::<Vec<_>>();

                self.mlt
                    .query_with_document_fields(searcher, &values)?
                    .weight(enable_scoring)
            }
        }
    }
}

/// The builder for a more-like-this query.
///
/// The `with_*` setters adjust the settings; `with_document` and `with_document_fields`
/// finish the build and return the [`MoreLikeThisQuery`].
#[derive(Debug, Clone, Default)]
pub struct MoreLikeThisQueryBuilder {
    // Settings accumulated so far, starting from `MoreLikeThis::default()`.
    mlt: MoreLikeThis,
}

impl MoreLikeThisQueryBuilder {
    /// Sets the minimum document frequency.
    ///
    /// The resulting query will ignore words which do not occur
    /// in at least this many docs.
    #[must_use]
    pub fn with_min_doc_frequency(mut self, value: u64) -> Self {
        self.mlt.min_doc_frequency = Some(value);
        self
    }

    /// Sets the maximum document frequency.
    ///
    /// The resulting query will ignore words which occur
    /// in more than this many docs.
    #[must_use]
    pub fn with_max_doc_frequency(mut self, value: u64) -> Self {
        self.mlt.max_doc_frequency = Some(value);
        self
    }

    /// Sets the minimum term frequency.
    ///
    /// The resulting query will ignore words less
    /// frequent that this number.
    #[must_use]
    pub fn with_min_term_frequency(mut self, value: usize) -> Self {
        self.mlt.min_term_frequency = Some(value);
        self
    }

    /// Sets the maximum query terms.
    ///
    /// The resulting query will not return a query with more clause than this.
    #[must_use]
    pub fn with_max_query_terms(mut self, value: usize) -> Self {
        self.mlt.max_query_terms = Some(value);
        self
    }

    /// Sets the minimum word length.
    ///
    /// The resulting query will ignore words shorter than this length.
    #[must_use]
    pub fn with_min_word_length(mut self, value: usize) -> Self {
        self.mlt.min_word_length = Some(value);
        self
    }

    /// Sets the maximum word length.
    ///
    /// The resulting query will ignore words longer than this length.
    #[must_use]
    pub fn with_max_word_length(mut self, value: usize) -> Self {
        self.mlt.max_word_length = Some(value);
        self
    }

    /// Sets the boost factor
    ///
    /// The boost factor used by the resulting query for boosting terms.
    #[must_use]
    pub fn with_boost_factor(mut self, value: f32) -> Self {
        self.mlt.boost_factor = Some(value);
        self
    }

    /// Sets the set of stop words
    ///
    /// The resulting query will ignore these set of words.
    #[must_use]
    pub fn with_stop_words(mut self, value: Vec<String>) -> Self {
        self.mlt.stop_words = value;
        self
    }

    /// Sets the document address
    /// Returns the constructed [`MoreLikeThisQuery`]
    ///
    /// This document will be used to collect field values, extract frequent terms
    /// needed for composing the query.
    ///
    /// Note that field values will only be collected from stored fields in the index.
    /// You can construct your own field values from any source.
    pub fn with_document(self, doc_address: DocAddress) -> MoreLikeThisQuery {
        MoreLikeThisQuery {
            mlt: self.mlt,
            target: TargetDocument::DocumentAddress(doc_address),
        }
    }

    /// Sets the document fields
    /// Returns the constructed [`MoreLikeThisQuery`]
    ///
    /// This represents the list field values possibly collected from multiple documents
    /// that will be used to compose the resulting query.
    /// This interface is meant to be used when you want to provide your own set of fields
    /// not necessarily from a specific document.
    pub fn with_document_fields(
        self,
        doc_fields: Vec<(Field, Vec<OwnedValue>)>,
    ) -> MoreLikeThisQuery {
        MoreLikeThisQuery {
            mlt: self.mlt,
            target: TargetDocument::DocumentFields(doc_fields),
        }
    }
}

#[cfg(test)]
mod tests {
    use super::{MoreLikeThisQuery, TargetDocument};
    use crate::collector::TopDocs;
    use crate::schema::{Schema, STORED, TEXT};
    use crate::{DocAddress, DocId, Index, IndexWriter, Searcher};

    /// Builds an in-RAM index of five documents with an indexed `title` and an indexed
    /// and stored `body`.
    fn create_test_index() -> crate::Result<Index> {
        let mut schema_builder = Schema::builder();
        let title = schema_builder.add_text_field("title", TEXT);
        let body = schema_builder.add_text_field("body", TEXT | STORED);
        let index = Index::create_in_ram(schema_builder.build());

        let documents = [
            ("aaa", "the old man and the sea"),
            ("bbb", "an old man sailing on the sea"),
            ("ccc", "send this message to alice"),
            ("ddd", "a lady was riding and old bike"),
            ("eee", "Yes, my lady."),
        ];
        let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
        for (title_text, body_text) in documents {
            index_writer.add_document(doc!(title => title_text, body => body_text))?;
        }
        index_writer.commit()?;
        Ok(index)
    }

    /// Runs `query` (top 5 by score) and returns the ids of the matching docs, sorted.
    fn sorted_matching_doc_ids(
        searcher: &Searcher,
        query: &MoreLikeThisQuery,
    ) -> crate::Result<Vec<DocId>> {
        let top_docs = searcher.search(query, &TopDocs::with_limit(5).order_by_score())?;
        let mut doc_ids: Vec<DocId> = top_docs
            .iter()
            .map(|(_score, doc_address)| doc_address.doc_id)
            .collect();
        doc_ids.sort_unstable();
        Ok(doc_ids)
    }

    #[test]
    fn test_more_like_this_query_builder() {
        // default settings
        let default_query = MoreLikeThisQuery::builder().with_document_fields(vec![]);
        let mlt = &default_query.mlt;

        assert_eq!(mlt.min_doc_frequency, Some(5));
        assert_eq!(mlt.max_doc_frequency, None);
        assert_eq!(mlt.min_term_frequency, Some(2));
        assert_eq!(mlt.max_query_terms, Some(25));
        assert_eq!(mlt.min_word_length, None);
        assert_eq!(mlt.max_word_length, None);
        assert_eq!(mlt.boost_factor, Some(1.0));
        assert_eq!(mlt.stop_words, Vec::<String>::new());
        assert_eq!(
            default_query.target,
            TargetDocument::DocumentFields(vec![])
        );

        // custom settings
        let stop_words = vec!["all".to_string(), "for".to_string()];
        let custom_query = MoreLikeThisQuery::builder()
            .with_min_doc_frequency(2)
            .with_max_doc_frequency(5)
            .with_min_term_frequency(2)
            .with_min_word_length(2)
            .with_max_word_length(4)
            .with_boost_factor(0.5)
            .with_stop_words(stop_words.clone())
            .with_document(DocAddress::new(1, 2));
        let mlt = &custom_query.mlt;

        assert_eq!(mlt.min_doc_frequency, Some(2));
        assert_eq!(mlt.max_doc_frequency, Some(5));
        assert_eq!(mlt.min_term_frequency, Some(2));
        assert_eq!(mlt.min_word_length, Some(2));
        assert_eq!(mlt.max_word_length, Some(4));
        assert_eq!(mlt.boost_factor, Some(0.5));
        assert_eq!(mlt.stop_words, stop_words);
        assert_eq!(
            custom_query.target,
            TargetDocument::DocumentAddress(DocAddress::new(1, 2))
        );
    }

    #[test]
    fn test_more_like_this_query() -> crate::Result<()> {
        let index = create_test_index()?;
        let searcher = index.reader()?.searcher();

        // search base 1st doc with words [sea, and] skipping [old]
        let query = MoreLikeThisQuery::builder()
            .with_min_doc_frequency(1)
            .with_max_doc_frequency(10)
            .with_min_term_frequency(1)
            .with_min_word_length(2)
            .with_max_word_length(5)
            .with_boost_factor(1.0)
            .with_stop_words(vec!["old".to_string()])
            .with_document(DocAddress::new(0, 0));
        let doc_ids = sorted_matching_doc_ids(&searcher, &query)?;
        assert_eq!(doc_ids.len(), 3);
        assert_eq!(doc_ids, vec![0, 1, 3]);

        // search base 5th doc with words [lady]
        let query = MoreLikeThisQuery::builder()
            .with_min_doc_frequency(1)
            .with_max_doc_frequency(10)
            .with_min_term_frequency(1)
            .with_min_word_length(2)
            .with_max_word_length(5)
            .with_boost_factor(1.0)
            .with_document(DocAddress::new(0, 4));
        let doc_ids = sorted_matching_doc_ids(&searcher, &query)?;
        assert_eq!(doc_ids.len(), 2);
        assert_eq!(doc_ids, vec![3, 4]);
        Ok(())
    }
}


================================================
FILE: src/query/phrase_prefix_query/mod.rs
================================================
mod phrase_prefix_query;
mod phrase_prefix_scorer;
mod phrase_prefix_weight;

pub use phrase_prefix_query::PhrasePrefixQuery;
pub use phrase_prefix_scorer::PhrasePrefixScorer;
pub use phrase_prefix_weight::PhrasePrefixWeight;

/// Returns the smallest byte string greater than every byte string starting with
/// `prefix_start`, i.e. the exclusive upper bound of the prefix range.
///
/// Trailing `0xff` bytes are dropped and the last remaining byte is incremented.
/// Returns `None` when no such bound exists, that is when `prefix_start` is empty or
/// made only of `0xff` bytes.
pub(crate) fn prefix_end(prefix_start: &[u8]) -> Option<Vec<u8>> {
    // Index of the last byte that can be incremented without overflowing.
    let last_incrementable = prefix_start.iter().rposition(|&byte| byte != u8::MAX)?;
    let mut end = prefix_start[..=last_incrementable].to_vec();
    end[last_incrementable] += 1;
    Some(end)
}

#[cfg(test)]
mod tests {
    use super::*;

    /// `prefix_end` increments the last byte that is not `0xff`, dropping what follows.
    #[test]
    fn test_prefix_end() {
        let cases: [(&[u8], Option<Vec<u8>>); 4] = [
            (b"aaa", Some(b"aab".to_vec())),
            (b"aa\xff", Some(b"ab".to_vec())),
            (b"a\xff\xff", Some(b"b".to_vec())),
            (b"\xff\xff\xff", None),
        ];
        for (prefix, expected_end) in cases {
            assert_eq!(prefix_end(prefix), expected_end);
        }
    }
}


================================================
FILE: src/query/phrase_prefix_query/phrase_prefix_query.rs
================================================
use std::ops::Bound;

use super::{prefix_end, PhrasePrefixWeight};
use crate::query::bm25::Bm25Weight;
use crate::query::{EnableScoring, InvertedIndexRangeWeight, Query, Weight};
use crate::schema::{Field, IndexRecordOption, Term};

/// Value given to `max_expansions` when a `PhrasePrefixQuery` is created; it can be
/// changed afterwards with `set_max_expansions`.
const DEFAULT_MAX_EXPANSIONS: u32 = 50;

/// `PhrasePrefixQuery` matches a specific sequence of words followed by a term of which
/// only a prefix is known.
///
/// For instance the phrase prefix query for `"part t"` will match
/// the sentence
///
/// **Alan just got a part time job.**
///
/// On the other hand it will not match the sentence.
///
/// **This is my favorite part of the job.**
///
/// Using a `PhrasePrefixQuery` on a field requires positions
/// to be indexed for this field.
#[derive(Clone, Debug)]
pub struct PhrasePrefixQuery {
    // Field shared by all the terms.
    field: Field,
    // `(offset, term)` pairs of the complete terms, sorted by offset. The prefix term is
    // not part of this list.
    phrase_terms: Vec<(usize, Term)>,
    // `(offset, term)` of the term with the highest offset, which is treated as a prefix.
    prefix: (usize, Term),
    // Maximum number of terms to which the prefix will expand.
    max_expansions: u32,
}

impl PhrasePrefixQuery {
    /// Creates a new `PhrasePrefixQuery` from a list of terms.
    ///
    /// Each term gets its index in `terms` as offset, and the last term is a prefix
    /// rather than a full value. All terms must belong to the same field.
    ///
    /// # Panics
    ///
    /// Panics if `terms` is empty or if the terms do not all belong to the same field.
    pub fn new(terms: Vec<Term>) -> PhrasePrefixQuery {
        let terms_with_offset: Vec<(usize, Term)> = terms.into_iter().enumerate().collect();
        Self::new_with_offset(terms_with_offset)
    }

    /// Creates a new `PhrasePrefixQuery` from a list of terms and their offsets.
    ///
    /// Can be used to provide a custom offset for each term. The terms are sorted by
    /// offset, and the term with the highest offset is used as the prefix.
    ///
    /// # Panics
    ///
    /// Panics if `terms` is empty or if the terms do not all belong to the same field.
    pub fn new_with_offset(mut terms: Vec<(usize, Term)>) -> PhrasePrefixQuery {
        assert!(
            !terms.is_empty(),
            "A phrase prefix query is required to have at least one term."
        );
        terms.sort_by_key(|(offset, _)| *offset);
        let field = terms[0].1.field();
        assert!(
            terms.iter().skip(1).all(|(_, term)| term.field() == field),
            "All terms from a phrase query must belong to the same field"
        );
        // The emptiness check above guarantees that there is a last term.
        let prefix = terms.pop().unwrap();
        PhrasePrefixQuery {
            field,
            phrase_terms: terms,
            prefix,
            max_expansions: DEFAULT_MAX_EXPANSIONS,
        }
    }

    /// Sets the maximum number of terms to which the last provided term will expand.
    pub fn set_max_expansions(&mut self, value: u32) {
        self.max_expansions = value;
    }

    /// The [`Field`] this `PhrasePrefixQuery` is targeting.
    pub fn field(&self) -> Field {
        self.field
    }

    /// The complete `Term`s of the phrase, without their offsets.
    ///
    /// The prefix term is not part of the returned list.
    pub fn phrase_terms(&self) -> Vec<Term> {
        // TODO should we include the last term too?
        self.phrase_terms
            .iter()
            .map(|offset_and_term| offset_and_term.1.clone())
            .collect()
    }

    /// Returns the [`PhrasePrefixWeight`] of this query.
    ///
    /// This function is the same as [`Query::weight()`] except it returns the specialized
    /// type [`PhrasePrefixWeight`] instead of a boxed trait object.
    /// If the query only holds the prefix term, this returns `None`, whereas
    /// [`Query::weight`] returns a boxed [`InvertedIndexRangeWeight`].
    ///
    /// # Errors
    ///
    /// Returns a schema error when the field does not have positions indexed, and
    /// forwards any error raised while computing the BM25 weight.
    pub(crate) fn phrase_prefix_query_weight(
        &self,
        enable_scoring: EnableScoring<'_>,
    ) -> crate::Result<Option<PhrasePrefixWeight>> {
        if self.phrase_terms.is_empty() {
            return Ok(None);
        }

        let field_entry = enable_scoring.schema().get_field_entry(self.field);
        let has_positions = field_entry
            .field_type()
            .get_index_record_option()
            .is_some_and(|record_option| record_option.has_positions());
        if !has_positions {
            let field_name = field_entry.name();
            return Err(crate::TantivyError::SchemaError(format!(
                "Applied phrase query on field {field_name:?}, which does not have positions \
                 indexed"
            )));
        }

        // The BM25 weight is only needed when scoring is enabled.
        let bm25_weight_opt = if let EnableScoring::Enabled { searcher, .. } = enable_scoring {
            let terms = self.phrase_terms();
            Some(Bm25Weight::for_terms(searcher, &terms)?)
        } else {
            None
        };

        Ok(Some(PhrasePrefixWeight::new(
            self.phrase_terms.clone(),
            self.prefix.clone(),
            bm25_weight_opt,
            self.max_expansions,
        )))
    }
}

impl Query for PhrasePrefixQuery {
    /// Creates the weight associated with this query.
    ///
    /// When the query holds complete terms, this is a [`PhrasePrefixWeight`]. Otherwise
    /// the query is only a prefix, and the weight is a range over the terms starting at
    /// the prefix (included) and ending at `prefix_end` of the prefix (excluded, or
    /// unbounded when there is no such end), limited to `max_expansions` terms.
    ///
    /// See [`Weight`].
    fn weight(&self, enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        if let Some(phrase_weight) = self.phrase_prefix_query_weight(enable_scoring)? {
            return Ok(Box::new(phrase_weight));
        }

        // There are no complete terms: only the prefix term has to be matched.
        let (_, prefix_term) = &self.prefix;
        let upper_bound = match prefix_end(prefix_term.serialized_value_bytes()) {
            Some(end_value) => {
                let mut end_term = Term::with_capacity(end_value.len());
                end_term.set_field_and_type(self.field, prefix_term.typ());
                end_term.append_bytes(&end_value);
                Bound::Excluded(end_term)
            }
            None => Bound::Unbounded,
        };
        let lower_bound = Bound::Included(prefix_term.clone());

        let range_weight = InvertedIndexRangeWeight::new(
            self.field,
            &lower_bound,
            &upper_bound,
            Some(u64::from(self.max_expansions)),
        );
        Ok(Box::new(range_weight))
    }

    /// Visits the complete terms of the phrase, each with the flag set to `true`.
    ///
    /// The prefix term is not visited.
    fn query_terms<'a>(&'a self, visitor: &mut dyn FnMut(&'a Term, bool)) {
        self.phrase_terms
            .iter()
            .for_each(|(_, term)| visitor(term, true));
    }
}


================================================
FILE: src/query/phrase_prefix_query/phrase_prefix_scorer.rs
================================================
use crate::docset::{DocSet, SeekDangerResult, TERMINATED};
use crate::fieldnorm::FieldNormReader;
use crate::postings::Postings;
use crate::query::bm25::Bm25Weight;
use crate::query::phrase_query::{intersection_count, PhraseScorer};
use crate::query::Scorer;
use crate::{DocId, Score};

// Scorer for the part of a phrase-prefix query that precedes the prefix term.
//
// MultiPrefix is the larger variant, and also the one we expect most often. PhraseScorer is > 1kB
// though, it would be interesting to slim it down if possible.
#[expect(clippy::large_enum_variant)]
enum PhraseKind<TPostings: Postings> {
    // A single term precedes the prefix: its postings are read directly.
    SinglePrefix {
        // Offset passed to `positions_with_offset` when loading the positions of `postings`.
        position_offset: u32,
        // Postings of the single phrase term.
        postings: TPostings,
        // Positions of the current document, loaded lazily by `get_intersection` and cleared
        // whenever the postings move to another document.
        positions: Vec<u32>,
    },
    // Several terms precede the prefix: the work is delegated to a regular `PhraseScorer`.
    MultiPrefix(PhraseScorer<TPostings>),
}

impl<TPostings: Postings> PhraseKind<TPostings> {
    /// Returns the positions matched by the phrase part in the current document.
    ///
    /// For the single-term variant, the positions are loaded on first access (with
    /// `position_offset` applied) and then served from the cached buffer.
    fn get_intersection(&mut self) -> &[u32] {
        match self {
            Self::MultiPrefix(phrase_scorer) => phrase_scorer.get_intersection(),
            Self::SinglePrefix {
                position_offset,
                postings,
                positions,
            } => {
                // An empty buffer means the positions were not loaded for this document yet.
                let needs_loading = positions.is_empty();
                if needs_loading {
                    postings.positions_with_offset(*position_offset, positions);
                }
                positions
            }
        }
    }
}

impl<TPostings: Postings> DocSet for PhraseKind<TPostings> {
    /// Moves to the next document, dropping any cached positions.
    fn advance(&mut self) -> DocId {
        match self {
            Self::MultiPrefix(phrase_scorer) => phrase_scorer.advance(),
            Self::SinglePrefix {
                postings,
                positions,
                ..
            } => {
                // The cached positions belong to the document we are leaving.
                positions.clear();
                postings.advance()
            }
        }
    }

    /// Returns the current document.
    fn doc(&self) -> DocId {
        match self {
            Self::MultiPrefix(phrase_scorer) => phrase_scorer.doc(),
            Self::SinglePrefix { postings, .. } => postings.doc(),
        }
    }

    /// Forwards the size hint of the underlying docset.
    fn size_hint(&self) -> u32 {
        match self {
            Self::MultiPrefix(phrase_scorer) => phrase_scorer.size_hint(),
            Self::SinglePrefix { postings, .. } => postings.size_hint(),
        }
    }

    /// Seeks the underlying docset to `target`, dropping any cached positions.
    fn seek(&mut self, target: DocId) -> DocId {
        match self {
            Self::MultiPrefix(phrase_scorer) => phrase_scorer.seek(target),
            Self::SinglePrefix {
                postings,
                positions,
                ..
            } => {
                // The cached positions belong to the document we are leaving.
                positions.clear();
                postings.seek(target)
            }
        }
    }
}

impl<TPostings: Postings> Scorer for PhraseKind<TPostings> {
    /// Scores the current document.
    ///
    /// The single-term variant has no similarity weight: it yields `1.0` once positions have
    /// been loaded for the current document and `0.0` otherwise.
    #[inline]
    fn score(&mut self) -> Score {
        match self {
            Self::MultiPrefix(phrase_scorer) => phrase_scorer.score(),
            Self::SinglePrefix { positions, .. } if positions.is_empty() => 0.0,
            Self::SinglePrefix { .. } => 1.0,
        }
    }
}

/// Scorer of a phrase-prefix query.
///
/// A document matches when the positions matched by the leading phrase terms line up with
/// the positions of at least one of the terms the prefix was expanded into.
pub struct PhrasePrefixScorer<TPostings: Postings> {
    // Scorer over the terms preceding the prefix; it drives the iteration over documents.
    phrase_scorer: PhraseKind<TPostings>,
    // Postings of the candidate terms the prefix was expanded into.
    suffixes: Vec<TPostings>,
    // Offset applied to the suffix positions before intersecting them with the phrase positions.
    suffix_offset: u32,
    // Number of matches counted for the current document by the last `matches_prefix` call.
    phrase_count: u32,
    // Scratch buffer receiving the positions of the suffix currently being checked.
    suffix_position_buffer: Vec<u32>,
}

impl<TPostings: Postings> PhrasePrefixScorer<TPostings> {
    /// Creates a scorer from the postings of the phrase terms and of the expanded prefix terms.
    ///
    /// * `term_postings` - `(offset, postings)` of every term preceding the prefix.
    /// * `similarity_weight_opt` - BM25 weight; `None` disables scoring.
    /// * `fieldnorm_reader` - fieldnorms handed to the inner phrase scorer.
    /// * `suffixes` - postings of the terms the prefix was expanded into.
    /// * `suffix_pos` - offset of the prefix term within the phrase.
    ///
    /// The returned scorer is already positioned on its first matching document, if any.
    ///
    /// # Panics
    ///
    /// Panics if `term_postings` is empty.
    pub fn new(
        mut term_postings: Vec<(usize, TPostings)>,
        similarity_weight_opt: Option<Bm25Weight>,
        fieldnorm_reader: FieldNormReader,
        suffixes: Vec<TPostings>,
        suffix_pos: usize,
    ) -> PhrasePrefixScorer<TPostings> {
        // The inner phrase scorer is unaware of the suffix term, so suffix positions have to be
        // shifted relative to the largest offset of the whole phrase, suffix included.
        let max_offset = term_postings
            .iter()
            .fold(suffix_pos, |largest, (pos, _)| largest.max(*pos));
        let suffix_offset = (max_offset - suffix_pos) as u32;

        let phrase_scorer = if term_postings.len() <= 1 {
            let (pos, postings) = term_postings
                .pop()
                .expect("PhrasePrefixScorer must have at least two terms");
            PhraseKind::SinglePrefix {
                position_offset: (suffix_pos - pos) as u32,
                postings,
                positions: Vec::with_capacity(100),
            }
        } else {
            let inner_scorer = PhraseScorer::new_with_offset(
                term_postings,
                similarity_weight_opt,
                fieldnorm_reader,
                0,
                1,
            );
            PhraseKind::MultiPrefix(inner_scorer)
        };

        let mut scorer = PhrasePrefixScorer {
            phrase_scorer,
            suffixes,
            suffix_offset,
            phrase_count: 0,
            suffix_position_buffer: Vec::with_capacity(100),
        };
        // The phrase scorer may start on a document that no suffix completes: skip ahead.
        let on_live_doc = scorer.doc() != TERMINATED;
        if on_live_doc && !scorer.matches_prefix() {
            scorer.advance();
        }
        scorer
    }

    /// Number of matches counted in the current document.
    pub fn phrase_count(&self) -> u32 {
        self.phrase_count
    }

    /// Checks whether at least one suffix completes the phrase in the current document.
    ///
    /// As a side effect, `phrase_count` is updated with the number of matches found.
    fn matches_prefix(&mut self) -> bool {
        let target_doc = self.doc();
        let phrase_positions = self.phrase_scorer.get_intersection();
        let mut total = 0;
        for suffix_postings in self.suffixes.iter_mut() {
            // A suffix already positioned past this document cannot match it.
            if suffix_postings.doc() > target_doc {
                continue;
            }
            if suffix_postings.seek(target_doc) != target_doc {
                continue;
            }
            suffix_postings
                .positions_with_offset(self.suffix_offset, &mut self.suffix_position_buffer);
            total += intersection_count(phrase_positions, &self.suffix_position_buffer);
        }
        self.phrase_count = total as u32;
        total != 0
    }
}

impl<TPostings: Postings> DocSet for PhrasePrefixScorer<TPostings> {
    /// Moves to the next document matched by both the phrase part and some suffix.
    fn advance(&mut self) -> DocId {
        let mut candidate = self.phrase_scorer.advance();
        while candidate != TERMINATED && !self.matches_prefix() {
            candidate = self.phrase_scorer.advance();
        }
        candidate
    }

    /// Moves to the first matching document reached by seeking the phrase part to `target`.
    fn seek(&mut self, target: DocId) -> DocId {
        let candidate = self.phrase_scorer.seek(target);
        if candidate != TERMINATED && !self.matches_prefix() {
            // The phrase part matched but no suffix did: fall back to a regular advance.
            return self.advance();
        }
        candidate
    }

    /// Tests whether `target` matches, without guaranteeing a valid position on a miss.
    fn seek_danger(&mut self, target: DocId) -> SeekDangerResult {
        match self.phrase_scorer.seek_danger(target) {
            // The phrase part matched `target`; the suffixes still have to agree.
            SeekDangerResult::Found => {
                if self.matches_prefix() {
                    SeekDangerResult::Found
                } else {
                    SeekDangerResult::SeekLowerBound(target + 1)
                }
            }
            miss => miss,
        }
    }

    /// Returns the current document of the phrase part.
    fn doc(&self) -> DocId {
        self.phrase_scorer.doc()
    }

    /// Forwards the size hint of the phrase part.
    fn size_hint(&self) -> u32 {
        self.phrase_scorer.size_hint()
    }

    /// Forwards the cost of the phrase part.
    fn cost(&self) -> u64 {
        self.phrase_scorer.cost()
    }
}

impl<TPostings: Postings> Scorer for PhrasePrefixScorer<TPostings> {
    /// Returns the score computed by the phrase part for the current document.
    ///
    /// The matched suffix terms do not take part in the score.
    #[inline]
    fn score(&mut self) -> Score {
        // TODO modify score??
        self.phrase_scorer.score()
    }
}


================================================
FILE: src/query/phrase_prefix_query/phrase_prefix_weight.rs
================================================
use super::{prefix_end, PhrasePrefixScorer};
use crate::fieldnorm::FieldNormReader;
use crate::index::SegmentReader;
use crate::postings::SegmentPostings;
use crate::query::bm25::Bm25Weight;
use crate::query::explanation::does_not_match;
use crate::query::{EmptyScorer, Explanation, Scorer, Weight};
use crate::schema::{IndexRecordOption, Term};
use crate::{DocId, DocSet, Score};

/// Weight of a phrase-prefix query: the phrase terms, the prefix term to expand and the
/// optional BM25 weight used for scoring.
pub struct PhrasePrefixWeight {
    // `(offset, term)` of every term preceding the prefix.
    phrase_terms: Vec<(usize, Term)>,
    // `(offset, term)` of the prefix that gets expanded against the term dictionary.
    prefix: (usize, Term),
    // BM25 weight; `None` means scoring is disabled.
    similarity_weight_opt: Option<Bm25Weight>,
    // Maximum number of dictionary terms the prefix may be expanded into.
    max_expansions: u32,
}

impl PhrasePrefixWeight {
    /// Creates a new phrase weight.
    /// If `similarity_weight_opt` is None, then scoring is disabled
    pub fn new(
        phrase_terms: Vec<(usize, Term)>,
        prefix: (usize, Term),
        similarity_weight_opt: Option<Bm25Weight>,
        max_expansions: u32,
    ) -> PhrasePrefixWeight {
        PhrasePrefixWeight {
            phrase_terms,
            prefix,
            similarity_weight_opt,
            max_expansions,
        }
    }

    fn fieldnorm_reader(&self, reader: &SegmentReader) -> crate::Result<FieldNormReader> {
        let field = self.phrase_terms[0].1.field();
        if self.similarity_weight_opt.is_some() {
            if let Some(fieldnorm_reader) = reader.fieldnorms_readers().get_field(field)? {
                return Ok(fieldnorm_reader);
            }
        }
        Ok(FieldNormReader::constant(reader.max_doc(), 1))
    }

    pub(crate) fn phrase_scorer(
        &self,
        reader: &SegmentReader,
        boost: Score,
    ) -> crate::Result<Option<PhrasePrefixScorer<SegmentPostings>>> {
        let similarity_weight_opt = self
            .similarity_weight_opt
            .as_ref()
            .map(|similarity_weight| similarity_weight.boost_by(boost));
        let fieldnorm_reader = self.fieldnorm_reader(reader)?;
        let mut term_postings_list = Vec::new();
        for &(offset, ref term) in &self.phrase_terms {
            if let Some(postings) = reader
                .inverted_index(term.field())?
                .read_postings(term, IndexRecordOption::WithFreqsAndPositions)?
            {
                term_postings_list.push((offset, postings));
            } else {
                return Ok(None);
            }
        }

        let inv_index = reader.inverted_index(self.prefix.1.field())?;
        let mut stream = inv_index
            .terms()
            .range()
            .ge(self.prefix.1.serialized_value_bytes());
        if let Some(end) = prefix_end(self.prefix.1.serialized_value_bytes()) {
            stream = stream.lt(&end);
        }

        #[cfg(feature = "quickwit")]
        {
            // We don't have this on the fst, hence  we end up needing a feature flag.
            //
            // This is not a problem however as we enforce the limit below too.
            // The point of `stream.limit` is to limit the number of term dictionary
            // blocks being downloaded.
            stream = stream.limit(self.max_expansions as u64);
        }

        let mut stream = stream.into_stream()?;

        let mut suffixes = Vec::with_capacity(self.max_expansions as usize);
        let mut new_term = self.prefix.1.clone();
        while stream.advance() && (suffixes.len() as u32) < self.max_expansions {
            new_term.clear_with_type(new_term.typ());
            new_term.append_bytes(stream.key());
            if reader.has_deletes() {
                if let Some(postings) =
                    inv_index.read_postings(&new_term, IndexRecordOption::WithFreqsAndPositions)?
                {
                    suffixes.push(postings);
                }
            } else if let Some(postings) =
                inv_index.read_postings(&new_term, IndexRecordOption::WithFreqsAndPositions)?
            {
                suffixes.push(postings);
            }
        }

        Ok(Some(PhrasePrefixScorer::new(
            term_postings_list,
            similarity_weight_opt,
            fieldnorm_reader,
            suffixes,
            self.prefix.0,
        )))
    }
}

impl Weight for PhrasePrefixWeight {
    /// Returns the scorer for `reader`, or an [`EmptyScorer`] when the segment cannot match.
    fn scorer(&self, reader: &SegmentReader, boost: Score) -> crate::Result<Box<dyn Scorer>> {
        if let Some(scorer) = self.phrase_scorer(reader, boost)? {
            Ok(Box::new(scorer))
        } else {
            Ok(Box::new(EmptyScorer))
        }
    }

    /// Explains the score of `doc`.
    ///
    /// # Errors
    ///
    /// Returns a "does not match" error when `doc` is not matched by the query.
    fn explain(&self, reader: &SegmentReader, doc: DocId) -> crate::Result<Explanation> {
        let Some(mut scorer) = self.phrase_scorer(reader, 1.0)? else {
            return Err(does_not_match(doc));
        };
        if scorer.seek(doc) != doc {
            return Err(does_not_match(doc));
        }
        let fieldnorm_reader = self.fieldnorm_reader(reader)?;
        let fieldnorm_id = fieldnorm_reader.fieldnorm_id(doc);
        let phrase_count = scorer.phrase_count();
        let mut explanation = Explanation::new("Phrase Prefix Scorer", scorer.score());
        // The BM25 detail is only available when scoring is enabled.
        if let Some(similarity_weight) = self.similarity_weight_opt.as_ref() {
            explanation.add_detail(similarity_weight.explain(fieldnorm_id, phrase_count));
        }
        Ok(explanation)
    }
}

#[cfg(test)]
mod tests {
    use crate::docset::TERMINATED;
    use crate::index::Index;
    use crate::query::{EnableScoring, PhrasePrefixQuery, Query};
    use crate::schema::{Schema, TEXT};
    use crate::{DocSet, IndexWriter, Term};

    /// Builds an in-RAM index with a single `text` field, holding one document per entry of
    /// `texts`.
    pub fn create_index(texts: &[&'static str]) -> crate::Result<Index> {
        let mut builder = Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());
        {
            let mut writer: IndexWriter = index.writer_for_tests()?;
            for text in texts.iter().copied() {
                writer.add_document(doc!(text_field=>text))?;
            }
            writer.commit()?;
        }
        Ok(index)
    }

    /// Two phrase terms followed by the prefix.
    #[test]
    pub fn test_phrase_count_long() -> crate::Result<()> {
        let index = create_index(&[
            "aa bb dd cc",
            "aa aa bb c dd aa bb cc aa bb dc",
            " aa bb cd",
        ])?;
        let text_field = index.schema().get_field("text").unwrap();
        let searcher = index.reader()?.searcher();
        let terms: Vec<Term> = ["aa", "bb", "c"]
            .iter()
            .map(|word| Term::from_field_text(text_field, word))
            .collect();
        let query = PhrasePrefixQuery::new(terms);
        let weight = query
            .phrase_prefix_query_weight(EnableScoring::enabled_from_searcher(&searcher))
            .unwrap()
            .unwrap();
        let mut scorer = weight
            .phrase_scorer(searcher.segment_reader(0u32), 1.0)?
            .unwrap();
        assert_eq!(scorer.doc(), 1);
        assert_eq!(scorer.phrase_count(), 2);
        assert_eq!(scorer.advance(), 2);
        assert_eq!(scorer.doc(), 2);
        assert_eq!(scorer.phrase_count(), 1);
        assert_eq!(scorer.advance(), TERMINATED);
        Ok(())
    }

    /// A single phrase term followed by the prefix.
    #[test]
    pub fn test_phrase_count_mid() -> crate::Result<()> {
        let index = create_index(&["aa dd cc", "aa aa bb c dd aa bb cc aa dc", " aa bb cd"])?;
        let text_field = index.schema().get_field("text").unwrap();
        let searcher = index.reader()?.searcher();
        let terms: Vec<Term> = ["aa", "b"]
            .iter()
            .map(|word| Term::from_field_text(text_field, word))
            .collect();
        let query = PhrasePrefixQuery::new(terms);
        let weight = query
            .phrase_prefix_query_weight(EnableScoring::enabled_from_searcher(&searcher))
            .unwrap()
            .unwrap();
        let mut scorer = weight
            .phrase_scorer(searcher.segment_reader(0u32), 1.0)?
            .unwrap();
        assert_eq!(scorer.doc(), 1);
        assert_eq!(scorer.phrase_count(), 2);
        assert_eq!(scorer.advance(), 2);
        assert_eq!(scorer.doc(), 2);
        assert_eq!(scorer.phrase_count(), 1);
        assert_eq!(scorer.advance(), TERMINATED);
        Ok(())
    }

    /// Only the prefix: no phrase-prefix weight is built and the generic weight is used.
    #[test]
    pub fn test_phrase_count_short() -> crate::Result<()> {
        let index = create_index(&["aa dd", "aa aa bb c dd aa bb cc aa dc", " aa bb cd"])?;
        let text_field = index.schema().get_field("text").unwrap();
        let searcher = index.reader()?.searcher();
        let query = PhrasePrefixQuery::new(vec![Term::from_field_text(text_field, "c")]);
        let enable_scoring = EnableScoring::enabled_from_searcher(&searcher);
        let specialized_weight = query.phrase_prefix_query_weight(enable_scoring).unwrap();
        assert!(specialized_weight.is_none());
        let weight = query.weight(enable_scoring).unwrap();
        let mut scorer = weight.scorer(searcher.segment_reader(0u32), 1.0)?;
        assert_eq!(scorer.doc(), 1);
        assert_eq!(scorer.advance(), 2);
        assert_eq!(scorer.doc(), 2);
        assert_eq!(scorer.advance(), TERMINATED);
        Ok(())
    }

    /// The phrase part never occurs, so the scorer is exhausted right away.
    #[test]
    pub fn test_phrase_no_match() -> crate::Result<()> {
        let index = create_index(&["aa dd", "aa aa bb c dd aa bb cc aa dc", " aa bb cd"])?;
        let text_field = index.schema().get_field("text").unwrap();
        let searcher = index.reader()?.searcher();
        let terms: Vec<Term> = ["aa", "cc", "d"]
            .iter()
            .map(|word| Term::from_field_text(text_field, word))
            .collect();
        let query = PhrasePrefixQuery::new(terms);
        let weight = query
            .weight(EnableScoring::enabled_from_searcher(&searcher))
            .unwrap();
        let mut scorer = weight.scorer(searcher.segment_reader(0u32), 1.0)?;
        assert_eq!(scorer.advance(), TERMINATED);
        Ok(())
    }
}


================================================
FILE: src/query/phrase_query/mod.rs
================================================
mod phrase_query;
mod phrase_scorer;
mod phrase_weight;
pub mod regex_phrase_query;
mod regex_phrase_weight;

pub use self::phrase_query::PhraseQuery;
pub(crate) use self::phrase_scorer::intersection_count;
pub use self::phrase_scorer::PhraseScorer;
pub use self::phrase_weight::PhraseWeight;

#[cfg(test)]
pub(crate) mod tests {

    use serde_json::json;

    use super::*;
    use crate::collector::tests::{TEST_COLLECTOR_WITHOUT_SCORE, TEST_COLLECTOR_WITH_SCORE};
    use crate::index::Index;
    use crate::query::{EnableScoring, QueryParser, Weight};
    use crate::schema::{Schema, Term, TEXT};
    use crate::{assert_nearly_equals, DocAddress, DocId, IndexWriter, TERMINATED};

    /// Builds an in-RAM index with a single `text` field, holding one document per entry of
    /// `texts`.
    pub fn create_index<S: AsRef<str>>(texts: &[S]) -> crate::Result<Index> {
        let mut builder = Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());
        {
            let mut writer: IndexWriter = index.writer_for_tests()?;
            for text in texts.iter().map(AsRef::as_ref) {
                writer.add_document(doc!(text_field=>text))?;
            }
            writer.commit()?;
        }
        Ok(index)
    }

    /// Runs the phrase query made of `texts` with the given `slop` and returns the scores of
    /// the matching documents.
    fn test_query(slop: u32, index: &Index, texts: Vec<&str>) -> Vec<f32> {
        let text_field = index.schema().get_field("text").unwrap();
        let searcher = index.reader().unwrap().searcher();
        let terms: Vec<Term> = texts
            .iter()
            .map(|word| Term::from_field_text(text_field, word))
            .collect();
        let mut query = PhraseQuery::new(terms);
        query.set_slop(slop);
        let fruits = searcher
            .search(&query, &TEST_COLLECTOR_WITH_SCORE)
            .expect("search should succeed");
        fruits.scores().to_vec()
    }

    #[test]
    pub fn test_phrase_query() -> crate::Result<()> {
        let index = create_index(&[
            "b b b d c g c",
            "a b b d c g c",
            "a b a b c",
            "c a b a d ga a",
            "a b c",
        ])?;
        let text_field = index.schema().get_field("text").unwrap();
        let searcher = index.reader()?.searcher();
        let matching_doc_ids = |words: Vec<&str>| {
            let terms: Vec<Term> = words
                .iter()
                .map(|word| Term::from_field_text(text_field, word))
                .collect();
            let query = PhraseQuery::new(terms);
            let fruits = searcher
                .search(&query, &TEST_COLLECTOR_WITH_SCORE)
                .unwrap();
            fruits
                .docs()
                .iter()
                .map(|address| address.doc_id)
                .collect::<Vec<_>>()
        };
        assert_eq!(matching_doc_ids(vec!["a", "b"]), vec![1, 2, 3, 4]);
        assert_eq!(matching_doc_ids(vec!["a", "b", "c"]), vec![2, 4]);
        assert_eq!(matching_doc_ids(vec!["b", "b"]), vec![0, 1]);
        assert!(matching_doc_ids(vec!["g", "ewrwer"]).is_empty());
        assert!(matching_doc_ids(vec!["g", "a"]).is_empty());
        Ok(())
    }

    #[test]
    pub fn test_phrase_query_simple() -> crate::Result<()> {
        let index = create_index(&["a b b d c g c", "a b a b c"])?;
        let text_field = index.schema().get_field("text").unwrap();
        let searcher = index.reader()?.searcher();
        let terms: Vec<Term> = ["a", "b", "c"]
            .iter()
            .map(|word| Term::from_field_text(text_field, word))
            .collect();
        let query = PhraseQuery::new(terms);
        let scoring = EnableScoring::disabled_from_schema(searcher.schema());
        let weight = query.phrase_weight(scoring)?;
        let mut scorer = weight.scorer(searcher.segment_reader(0), 1.0)?;
        assert_eq!(scorer.doc(), 1);
        assert_eq!(scorer.advance(), TERMINATED);
        Ok(())
    }

    #[test]
    pub fn test_phrase_query_no_score() -> crate::Result<()> {
        let index = create_index(&[
            "b b b d c g c",
            "a b b d c g c",
            "a b a b c",
            "c a b a d ga a",
            "a b c",
        ])?;
        let text_field = index.schema().get_field("text").unwrap();
        let searcher = index.reader()?.searcher();
        let matching_doc_ids = |words: Vec<&str>| {
            let terms: Vec<Term> = words
                .iter()
                .map(|word| Term::from_field_text(text_field, word))
                .collect();
            let query = PhraseQuery::new(terms);
            let fruits = searcher
                .search(&query, &TEST_COLLECTOR_WITHOUT_SCORE)
                .unwrap();
            fruits
                .docs()
                .iter()
                .map(|address| address.doc_id)
                .collect::<Vec<_>>()
        };
        assert_eq!(matching_doc_ids(vec!["a", "b", "c"]), vec![2, 4]);
        assert_eq!(matching_doc_ids(vec!["a", "b"]), vec![1, 2, 3, 4]);
        assert_eq!(matching_doc_ids(vec!["b", "b"]), vec![0, 1]);
        assert!(matching_doc_ids(vec!["g", "ewrwer"]).is_empty());
        assert!(matching_doc_ids(vec!["g", "a"]).is_empty());
        Ok(())
    }

    /// A phrase query on a field indexed without positions must fail with a schema error.
    #[test]
    pub fn test_phrase_query_no_positions() -> crate::Result<()> {
        use crate::schema::{IndexRecordOption, TextFieldIndexing, TextOptions};

        let mut builder = Schema::builder();
        let indexing = TextFieldIndexing::default().set_index_option(IndexRecordOption::WithFreqs);
        let no_positions = TextOptions::default().set_indexing_options(indexing);
        let text_field = builder.add_text_field("text", no_positions);
        let index = Index::create_in_ram(builder.build());
        {
            let mut writer: IndexWriter = index.writer_for_tests()?;
            writer.add_document(doc!(text_field=>"a b c"))?;
            writer.commit()?;
        }
        let searcher = index.reader()?.searcher();
        let query = PhraseQuery::new(vec![
            Term::from_field_text(text_field, "a"),
            Term::from_field_text(text_field, "b"),
        ]);

        let search_error = searcher.search(&query, &TEST_COLLECTOR_WITH_SCORE).err();
        assert!(matches!(
            search_error,
            Some(crate::TantivyError::SchemaError(msg))
            if msg == "Applied phrase query on field \"text\", which does not have positions \
            indexed"
        ));
        Ok(())
    }

    #[test]
    pub fn test_phrase_score() -> crate::Result<()> {
        let index = create_index(&["a b c", "a b c a b"])?;
        let scores = test_query(0, &index, vec!["a", "b"]);
        assert_nearly_equals!(scores[0], 0.40618482);
        assert_nearly_equals!(scores[1], 0.46844664);
        Ok(())
    }

    #[ignore]
    #[test]
    pub fn test_phrase_score_with_slop() -> crate::Result<()> {
        let index = create_index(&["a c b", "a b c a b"])?;
        let scores = test_query(1, &index, vec!["a", "b"]);
        assert_nearly_equals!(scores[0], 0.40618482);
        assert_nearly_equals!(scores[1], 0.46844664);
        Ok(())
    }

    #[test]
    pub fn test_phrase_score_with_slop_bug() -> crate::Result<()> {
        let index = create_index(&["asdf asdf Captain Subject Wendy", "Captain"])?;
        let scores = test_query(1, &index, vec!["captain", "wendy"]);
        assert_eq!(scores.len(), 1);
        Ok(())
    }

    #[test]
    pub fn test_phrase_score_with_slop_bug_2() -> crate::Result<()> {
        // NOTE(review): this case used to be annotated `fails` - TODO confirm whether that
        // remark is still relevant.
        let index = create_index(&["a x b x c", "a a c"])?;
        let scores = test_query(2, &index, vec!["a", "b", "c"]);
        assert_eq!(scores.len(), 1);

        let index = create_index(&["a x b x c", "b c c"])?;
        let scores = test_query(2, &index, vec!["a", "b", "c"]);
        assert_eq!(scores.len(), 1);

        Ok(())
    }

    #[test]
    pub fn test_phrase_score_with_slop_repeating() -> crate::Result<()> {
        let index = create_index(&["wendy subject subject captain", "Captain"])?;
        let scores = test_query(1, &index, vec!["wendy", "subject", "captain"]);
        assert_eq!(scores.len(), 1);
        Ok(())
    }

    #[test]
    pub fn test_phrase_score_with_slop_size() -> crate::Result<()> {
        let index = create_index(&["a b e c", "a e e e c", "a e e e e c"])?;
        let scores = test_query(3, &index, vec!["a", "c"]);
        assert_eq!(scores.len(), 2);
        assert_nearly_equals!(scores[0], 0.29086056);
        assert_nearly_equals!(scores[1], 0.26706287);
        Ok(())
    }

    #[test]
    pub fn test_phrase_slop() -> crate::Result<()> {
        // One extra token fits within a slop of 1.
        let index = create_index(&["a x b c"])?;
        assert_eq!(test_query(1, &index, vec!["a", "b", "c"]).len(), 1);

        // Two extra tokens do not.
        let index = create_index(&["a x b x c"])?;
        assert_eq!(test_query(1, &index, vec!["a", "b", "c"]).len(), 0);

        // Swapped terms are not matched with a slop of 1...
        let index = create_index(&["a b"])?;
        assert_eq!(test_query(1, &index, vec!["b", "a"]).len(), 0);

        // ...but they are with a slop of 2.
        let index = create_index(&["a b"])?;
        assert_eq!(test_query(2, &index, vec!["b", "a"]).len(), 1);

        Ok(())
    }

    #[test]
    pub fn test_phrase_score_with_slop_ordering() -> crate::Result<()> {
        let index = create_index(&[
            "a e b e c",
            "a e e e e e b e e e e c",
            "a c b", // also matches
            "a c e b e",
            "a e c b",
            "a e b c",
        ])?;
        let scores = test_query(3, &index, vec!["a", "b", "c"]);
        // The first and last matches.
        assert_nearly_equals!(scores[0], 0.23091172);
        assert_nearly_equals!(scores[1], 0.27310878);
        assert_nearly_equals!(scores[3], 0.25024384);
        Ok(())
    }

    #[test] // motivated by #234
    pub fn test_phrase_query_docfreq_order() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());
        {
            let mut writer: IndexWriter = index.writer_for_tests()?;
            for text in ["b", "a b", "b a"] {
                writer.add_document(doc!(text_field=>text))?;
            }
            writer.commit()?;
        }

        let searcher = index.reader()?.searcher();
        let matching_docs = |words: Vec<&str>| {
            let terms: Vec<Term> = words
                .iter()
                .map(|word| Term::from_field_text(text_field, word))
                .collect();
            let query = PhraseQuery::new(terms);
            let fruits = searcher
                .search(&query, &TEST_COLLECTOR_WITH_SCORE)
                .expect("search should succeed");
            fruits.docs().to_vec()
        };
        assert_eq!(matching_docs(vec!["a", "b"]), vec![DocAddress::new(0, 1)]);
        assert_eq!(matching_docs(vec!["b", "a"]), vec![DocAddress::new(0, 2)]);
        Ok(())
    }

    #[test] // motivated by #234
    pub fn test_phrase_query_non_trivial_offsets() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let text_field = builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(builder.build());
        {
            let mut writer: IndexWriter = index.writer_for_tests()?;
            writer.add_document(doc!(text_field=>"a b c d e f g h"))?;
            writer.commit()?;
        }
        let searcher = index.reader().unwrap().searcher();
        let matching_doc_ids = |words: Vec<(usize, &str)>| {
            let terms: Vec<(usize, Term)> = words
                .iter()
                .map(|(offset, word)| (*offset, Term::from_field_text(text_field, word)))
                .collect();
            let query = PhraseQuery::new_with_offset(terms);
            let fruits = searcher
                .search(&query, &TEST_COLLECTOR_WITH_SCORE)
                .expect("search should succeed");
            fruits
                .docs()
                .iter()
                .map(|address| address.doc_id)
                .collect::<Vec<DocId>>()
        };
        assert_eq!(matching_doc_ids(vec![(0, "a"), (1, "b")]), vec![0]);
        assert_eq!(matching_doc_ids(vec![(1, "b"), (0, "a")]), vec![0]);
        assert!(matching_doc_ids(vec![(0, "a"), (2, "b")]).is_empty());
        assert_eq!(matching_doc_ids(vec![(0, "a"), (2, "c")]), vec![0]);
        assert_eq!(matching_doc_ids(vec![(0, "a"), (2, "c"), (3, "d")]), vec![0]);
        assert_eq!(matching_doc_ids(vec![(0, "a"), (2, "c"), (4, "e")]), vec![0]);
        assert_eq!(matching_doc_ids(vec![(4, "e"), (0, "a"), (2, "c")]), vec![0]);
        assert!(matching_doc_ids(vec![(0, "a"), (2, "d")]).is_empty());
        assert_eq!(matching_doc_ids(vec![(1, "a"), (3, "c")]), vec![0]);
        Ok(())
    }

    #[test]
    pub fn test_phrase_query_on_json() -> crate::Result<()> {
        let mut builder = Schema::builder();
        let json_field = builder.add_json_field("json", TEXT);
        let index = Index::create_in_ram(builder.build());
        {
            let mut writer: IndexWriter = index.writer_for_tests()?;
            writer.add_document(doc!(json_field=>json!({
                "text": "elliot smith the happy who"
            })))?;
            writer.add_document(doc!(json_field=>json!({
                "text": "the who elliot smith"
            })))?;
            writer.add_document(doc!(json_field=>json!({
                "arr": [{"text":"the who"}, {"text":"elliot smith"}]
            })))?;
            writer.add_document(doc!(json_field=>json!({
                "text2": "the smith"
            })))?;
            writer.commit()?;
        }
        let searcher = index.reader()?.searcher();
        // Parses `query` and collects the documents its scorer yields on the first segment.
        let matching_docs = |query: &str| {
            let parser = QueryParser::for_index(&index, vec![json_field]);
            let parsed_query = parser.parse_query(query).unwrap();
            let weight = parsed_query
                .weight(EnableScoring::disabled_from_schema(searcher.schema()))
                .unwrap();
            let mut scorer = weight
                .scorer(searcher.segment_reader(0), 1.0f32)
                .unwrap();
            let mut docs = Vec::new();
            while scorer.doc() != TERMINATED {
                docs.push(scorer.doc());
                scorer.advance();
            }
            docs
        };
        assert!(matching_docs(r#"text:"the smith""#).is_empty());
        assert_eq!(&matching_docs(r#"text:the"#), &[0u32, 1u32]);
        assert_eq!(&matching_docs(r#"text:"the""#), &[0u32, 1u32]);
        assert_eq!(&matching_docs(r#"text:"smith""#), &[0u32, 1u32]);
        assert_eq!(&matching_docs(r#"text:"elliot smith""#), &[0u32, 1u32]);
        assert_eq!(&matching_docs(r#"text2:"the smith""#), &[3u32]);
        assert!(&matching_docs(r#"arr.text:"the smith""#).is_empty());
        assert_eq!(&matching_docs(r#"arr.text:"elliot smith""#), &[2]);
        Ok(())
    }
}


================================================
FILE: src/query/phrase_query/phrase_query.rs
================================================
use super::PhraseWeight;
use crate::query::bm25::Bm25Weight;
use crate::query::{EnableScoring, Query, Weight};
use crate::schema::{Field, IndexRecordOption, Term};

/// `PhraseQuery` matches a specific sequence of words.
///
/// For instance, the phrase query for `"part time"` will match
/// the sentence:
///
/// **Alan just got a part time job.**
///
/// On the other hand, it will not match the sentence:
///
/// **This is my favorite part of the job.**
///
/// [Slop](PhraseQuery::set_slop) allows leniency in term proximity
/// for some performance trade-off.
///
/// Using a `PhraseQuery` on a field requires positions
/// to be indexed for this field.
#[derive(Clone, Debug)]
pub struct PhraseQuery {
    /// Field shared by every term of the phrase.
    field: Field,
    /// `(offset, term)` pairs, kept sorted by offset by the constructor.
    phrase_terms: Vec<(usize, Term)>,
    /// Slop budget of the phrase; `0` unless set through a constructor or `set_slop`.
    slop: u32,
}

impl PhraseQuery {
    /// Creates a new `PhraseQuery` given a list of terms.
    ///
    /// There must be at least two terms, and all terms
    /// must belong to the same field.
    /// The offset of each term is its index in `terms`.
    ///
    /// # Panics
    ///
    /// Panics if fewer than two terms are given, or if the terms do not all
    /// belong to the same field.
    pub fn new(terms: Vec<Term>) -> PhraseQuery {
        let terms_with_offset = terms.into_iter().enumerate().collect();
        PhraseQuery::new_with_offset(terms_with_offset)
    }

    /// Creates a new `PhraseQuery` given a list of terms and their offsets.
    ///
    /// Can be used to provide a custom offset for each term.
    ///
    /// # Panics
    ///
    /// Panics if fewer than two terms are given, or if the terms do not all
    /// belong to the same field.
    pub fn new_with_offset(terms: Vec<(usize, Term)>) -> PhraseQuery {
        PhraseQuery::new_with_offset_and_slop(terms, 0)
    }

    /// Creates a new `PhraseQuery` given a list of terms, their offsets and a slop.
    ///
    /// The terms are sorted by offset before being stored.
    ///
    /// # Panics
    ///
    /// Panics if fewer than two terms are given, or if the terms do not all
    /// belong to the same field.
    pub fn new_with_offset_and_slop(mut terms: Vec<(usize, Term)>, slop: u32) -> PhraseQuery {
        assert!(
            terms.len() > 1,
            "A phrase query is required to have strictly more than one term."
        );
        terms.sort_by_key(|&(offset, _)| offset);
        let field = terms[0].1.field();
        assert!(
            terms[1..].iter().all(|term| term.1.field() == field),
            "All terms from a phrase query must belong to the same field"
        );
        PhraseQuery {
            field,
            phrase_terms: terms,
            slop,
        }
    }

    /// Slop allowed for the phrase.
    ///
    /// The query will match if its terms are separated by `slop` terms at most.
    /// The slop can be considered a budget between all terms.
    /// E.g. "A B C" with slop 1 allows "A X B C", "A B X C", but not "A X B X C".
    ///
    /// Transposition costs 2, e.g. "A B" with slop 1 will not match "B A" but it would with slop 2
    /// Transposition is not a special case, in the example above A is moved 1 position and B is
    /// moved 1 position, so the slop is 2.
    ///
    /// As a result slop works in both directions, so the order of the terms may change as long
    /// as they respect the slop.
    ///
    /// By default the slop is 0 meaning query terms need to be adjacent.
    pub fn set_slop(&mut self, value: u32) {
        self.slop = value;
    }

    /// The [`Field`] this `PhraseQuery` is targeting.
    pub fn field(&self) -> Field {
        self.field
    }

    /// `Term`s in the phrase without the associated offsets.
    ///
    /// Every term is cloned into the returned vector.
    pub fn phrase_terms(&self) -> Vec<Term> {
        self.phrase_terms
            .iter()
            .map(|(_, term)| term.clone())
            .collect::<Vec<Term>>()
    }

    /// Returns the [`PhraseWeight`] for the given phrase query given a specific `searcher`.
    ///
    /// This function is the same as [`Query::weight()`] except it returns
    /// a specialized type [`PhraseWeight`] instead of a Boxed trait.
    ///
    /// # Errors
    ///
    /// Returns a `SchemaError` if the targeted field does not index positions, and forwards
    /// any error raised while building the BM25 weight.
    pub(crate) fn phrase_weight(
        &self,
        enable_scoring: EnableScoring<'_>,
    ) -> crate::Result<PhraseWeight> {
        let schema = enable_scoring.schema();
        let field_entry = schema.get_field_entry(self.field);
        let has_positions = field_entry
            .field_type()
            .get_index_record_option()
            .map(IndexRecordOption::has_positions)
            .unwrap_or(false);
        if !has_positions {
            let field_name = field_entry.name();
            return Err(crate::TantivyError::SchemaError(format!(
                "Applied phrase query on field {field_name:?}, which does not have positions \
                 indexed"
            )));
        }
        let bm25_weight_opt = match enable_scoring {
            EnableScoring::Enabled {
                statistics_provider,
                ..
            } => {
                // The offset-free copy of the terms is only needed to compute the BM25
                // statistics, so it is built only when scoring is enabled.
                let terms = self.phrase_terms();
                Some(Bm25Weight::for_terms(statistics_provider, &terms)?)
            }
            EnableScoring::Disabled { .. } => None,
        };
        let mut weight = PhraseWeight::new(self.phrase_terms.clone(), bm25_weight_opt);
        if self.slop > 0 {
            weight.slop(self.slop);
        }
        Ok(weight)
    }
}

impl Query for PhraseQuery {
    /// Builds the phrase weight and returns it as a boxed [`Weight`].
    ///
    /// See [`Weight`].
    fn weight(&self, enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let boxed_weight: Box<dyn Weight> = Box::new(self.phrase_weight(enable_scoring)?);
        Ok(boxed_weight)
    }

    /// Visits every term of the phrase, in stored order, always passing `true` as the flag.
    fn query_terms<'a>(&'a self, visitor: &mut dyn FnMut(&'a Term, bool)) {
        self.phrase_terms
            .iter()
            .for_each(|(_, term)| visitor(term, true));
    }
}


================================================
FILE: src/query/phrase_query/phrase_scorer.rs
================================================
use std::cmp::Ordering;

use crate::docset::{DocSet, SeekDangerResult, TERMINATED};
use crate::fieldnorm::FieldNormReader;
use crate::postings::Postings;
use crate::query::bm25::Bm25Weight;
use crate::query::{Intersection, Scorer};
use crate::{DocId, Score};

/// Postings of a single phrase term, paired with the offset that is handed to
/// `positions_with_offset` whenever the positions of the current document are read.
struct PostingsWithOffset<TPostings> {
    /// Offset passed to `positions_with_offset` when reading positions.
    offset: u32,
    /// Underlying postings every `DocSet` operation is delegated to.
    postings: TPostings,
}

impl<TPostings: Postings> PostingsWithOffset<TPostings> {
    /// Wraps `segment_postings` together with the `offset` used when reading positions.
    pub fn new(segment_postings: TPostings, offset: u32) -> Self {
        Self {
            postings: segment_postings,
            offset,
        }
    }

    /// Reads the positions of the current document into `output`, forwarding the stored
    /// offset to the underlying postings.
    pub fn positions(&mut self, output: &mut Vec<u32>) {
        let position_offset = self.offset;
        self.postings.positions_with_offset(position_offset, output)
    }
}

// Every `DocSet` operation is forwarded unchanged to the wrapped postings;
// the offset only matters when positions are read.
impl<TPostings: Postings> DocSet for PostingsWithOffset<TPostings> {
    /// Current document of the wrapped postings.
    fn doc(&self) -> DocId {
        self.postings.doc()
    }

    /// Advances the wrapped postings and returns their result.
    fn advance(&mut self) -> DocId {
        self.postings.advance()
    }

    /// Seeks the wrapped postings to `target` and returns their result.
    fn seek(&mut self, target: DocId) -> DocId {
        self.postings.seek(target)
    }

    /// Size hint of the wrapped postings.
    fn size_hint(&self) -> u32 {
        self.postings.size_hint()
    }
}

/// Scorer for phrase queries: iterates over the documents containing all terms and keeps
/// only those whose term positions line up as a phrase (within `slop`, if any).
pub struct PhraseScorer<TPostings: Postings> {
    /// Intersection of the postings of all phrase terms.
    intersection_docset: Intersection<PostingsWithOffset<TPostings>, PostingsWithOffset<TPostings>>,
    /// Number of term postings handed to the constructor.
    num_terms: usize,
    /// Scratch buffer: positions accumulated from the terms processed so far.
    left_positions: Vec<u32>,
    /// Scratch buffer: positions of the term currently being intersected.
    right_positions: Vec<u32>,
    /// Phrase count of the current document; only updated when scoring is enabled.
    phrase_count: u32,
    /// Fieldnorm reader used when computing the score.
    fieldnorm_reader: FieldNormReader,
    /// BM25 weight; `None` means scoring is disabled.
    similarity_weight_opt: Option<Bm25Weight>,
    /// Slop budget; `0` means no slop.
    slop: u32,
    /// Slop recorded for the entries of `left_positions` (slop-carrying intersection only).
    left_slops: Vec<u8>,
    /// Scratch output buffer for positions in the slop-carrying intersection.
    positions_buffer: Vec<u32>,
    /// Scratch output buffer for slops in the slop-carrying intersection.
    slops_buffer: Vec<u8>,
}

/// Tells whether the two sorted slices share at least one value.
///
/// Both cursors walk forward in lockstep; the scan stops at the first shared value
/// or as soon as either slice is exhausted.
fn intersection_exists(left: &[u32], right: &[u32]) -> bool {
    let (mut left_cursor, mut right_cursor) = (0usize, 0usize);
    while let (Some(&left_val), Some(&right_val)) = (left.get(left_cursor), right.get(right_cursor))
    {
        if left_val == right_val {
            return true;
        }
        // Move past whichever side currently holds the smaller value.
        if left_val < right_val {
            left_cursor += 1;
        } else {
            right_cursor += 1;
        }
    }
    false
}

/// Counts the values shared by the two sorted slices.
///
/// A shared value consumes one element on each side, so duplicates are only counted
/// as often as they appear on both sides.
pub(crate) fn intersection_count(left: &[u32], right: &[u32]) -> usize {
    let mut left_rest = left;
    let mut right_rest = right;
    let mut num_common = 0;
    while let (Some((&left_head, left_tail)), Some((&right_head, right_tail))) =
        (left_rest.split_first(), right_rest.split_first())
    {
        match left_head.cmp(&right_head) {
            Ordering::Less => left_rest = left_tail,
            Ordering::Greater => right_rest = right_tail,
            Ordering::Equal => {
                num_common += 1;
                left_rest = left_tail;
                right_rest = right_tail;
            }
        }
    }
    num_common
}

/// Intersects the two sorted arrays `left` and `right` in place.
///
/// On return `left` holds only the values also present in `right`; nothing is returned.
#[inline]
fn intersection(left: &mut Vec<u32>, right: &[u32]) {
    let mut read_cursor = 0;
    let mut right_cursor = 0;
    // Index of the next slot of `left` that receives a kept value.
    let mut write_cursor = 0;
    while read_cursor < left.len() && right_cursor < right.len() {
        let candidate = left[read_cursor];
        let other = right[right_cursor];
        if candidate < other {
            read_cursor += 1;
        } else if candidate > other {
            right_cursor += 1;
        } else {
            left[write_cursor] = candidate;
            write_cursor += 1;
            read_cursor += 1;
            right_cursor += 1;
        }
    }
    left.truncate(write_cursor);
}

/// Intersects the two sorted arrays `left_positions` and `right_positions`, treating two
/// positions as a match when their distance is less than or equal to `slop`.
///
/// When `update_left` is true, `left_positions` is overwritten with the right-hand position
/// of every match and truncated to the number of matches; otherwise it is left untouched.
///
/// Returns the number of matches.
#[inline]
fn intersection_count_with_slop(
    left_positions: &mut Vec<u32>,
    right_positions: &[u32],
    slop: u32,
    update_left: bool,
) -> usize {
    let num_left = left_positions.len();
    let num_right = right_positions.len();
    let mut left_cursor = 0;
    let mut right_cursor = 0;
    let mut num_matches = 0;
    while left_cursor < num_left && right_cursor < num_right {
        let left_pos = left_positions[left_cursor];
        let right_pos = right_positions[right_cursor];

        if left_pos.abs_diff(right_pos) > slop {
            // Too far apart: step past the smaller position.
            if left_pos < right_pos {
                left_cursor += 1;
            } else {
                right_cursor += 1;
            }
            continue;
        }

        // Skip every following left position that does not exceed the right position:
        // those are consumed by this match as well.
        while left_cursor + 1 < num_left && left_positions[left_cursor + 1] <= right_pos {
            left_cursor += 1;
        }

        // Matches are recorded in the already consumed prefix of `left_positions`.
        if update_left {
            left_positions[num_matches] = right_pos;
        }
        num_matches += 1;
        left_cursor += 1;
        right_cursor += 1;
    }
    if update_left {
        left_positions.truncate(num_matches);
    }

    num_matches
}

/// Tells whether some pair of positions, one from each sorted slice, lies within `slop`
/// of each other (in either direction).
fn intersection_exists_with_slop(
    left_positions: &[u32],
    right_positions: &[u32],
    slop: u32,
) -> bool {
    let (mut left_cursor, mut right_cursor) = (0usize, 0usize);
    while let (Some(&left_pos), Some(&right_pos)) = (
        left_positions.get(left_cursor),
        right_positions.get(right_cursor),
    ) {
        if left_pos.abs_diff(right_pos) <= slop {
            return true;
        }
        // Too far apart: step past the smaller position.
        if left_pos < right_pos {
            left_cursor += 1;
        } else {
            right_cursor += 1;
        }
    }
    false
}

/// Intersection variant for multi term searches that keeps track of the slop spent so far.
///
/// In contrast to the regular algorithm this solves some issues:
/// - Keep track of the slop so far. Slop is a budget that is spent on the distance between terms.
/// - When encountering a match between two positions, which position is the best match is unclear
///   and depends on intersections afterwards, therefore this algorithm keeps left and right as
///   matches, but only counts one.
///
/// This algorithm may return an incorrect count in some cases (e.g. a match is expanded to both
/// its left and right position, and both then match on the following term).
/// I think to fix this we would need to iterate all positions simultaneously,
/// but not sure if that's worth it. (It may be considerably slower - untested)
///
/// `left_slops` is allowed to be empty, which equals to a slop of 0 so far.
///
/// When `update_left` is true, `left_positions` and `left_slops` are replaced by the surviving
/// positions and the slop spent to reach them; `positions_buffer` and `slops_buffer` are scratch
/// space and are left empty. When `update_left` is false nothing is modified.
///
/// Spent slops are stored as `u8`. A slop larger than `u8::MAX` is saturated to `u8::MAX`
/// instead of wrapping around, so an expensive match is never recorded as a cheap one.
///
/// Returns the number of matches counted.
#[inline]
fn intersection_count_with_carrying_slop(
    left_positions: &mut Vec<u32>,
    left_slops: &mut Vec<u8>,
    right_positions: &[u32],
    max_slop: u32,
    update_left: bool,
    positions_buffer: &mut Vec<u32>,
    slops_buffer: &mut Vec<u8>,
) -> u32 {
    /// Converts a spent slop to its stored representation, saturating at `u8::MAX`.
    fn saturate_slop(slop: u32) -> u8 {
        slop.min(u32::from(u8::MAX)) as u8
    }

    let mut left_index = 0;
    let mut right_index = 0;
    let mut count = 0;

    if left_positions.is_empty() || right_positions.is_empty() {
        if update_left {
            left_positions.clear();
            left_slops.clear();
        }
        return 0;
    }

    // Appends `(slop, position)` to the output. If the position was just pushed, only the
    // smaller of the two slops is kept.
    let add_val = |val: (u8, u32), new_left: &mut Vec<u32>, new_slops: &mut Vec<u8>| {
        if update_left {
            let pos_exists = new_left.last().map(|v| *v == val.1).unwrap_or(false);
            if pos_exists {
                let last_slop = new_slops.last_mut().unwrap();
                *last_slop = (*last_slop).min(val.0);
            } else {
                new_left.push(val.1);
                new_slops.push(val.0);
            }
        }
    };
    loop {
        let left_val = left_positions[left_index];
        let slop_so_far = left_slops.get(left_index).cloned().unwrap_or(0);
        let right_val = right_positions[right_index];

        let distance = slop_so_far as u32 + left_val.abs_diff(right_val);
        if distance <= max_slop {
            let (smaller_val, larger_val, mut smaller_val_idx, smaller_val_positions) =
                if left_val < right_val {
                    (left_val, right_val, left_index, left_positions.as_slice())
                } else {
                    (right_val, left_val, right_index, right_positions)
                };

            let mut new_slop = distance;
            add_val(
                (saturate_slop(new_slop), smaller_val),
                positions_buffer,
                slops_buffer,
            );
            while smaller_val_idx + 1 < smaller_val_positions.len() {
                // there could be a better match
                let next_val = smaller_val_positions[smaller_val_idx + 1];
                if next_val > larger_val {
                    // the next value is outside the range, so current one is the best.
                    break;
                }
                let distance = next_val.abs_diff(larger_val);

                // the next value is better.
                smaller_val_idx += 1;
                // better slop
                new_slop = slop_so_far as u32 + distance;
                add_val(
                    (saturate_slop(new_slop), next_val),
                    positions_buffer,
                    slops_buffer,
                );
            }

            add_val(
                (saturate_slop(new_slop), larger_val),
                positions_buffer,
                slops_buffer,
            );
            count += 1;
            left_index += 1;
            right_index += 1;
        } else if left_val < right_val {
            left_index += 1;
        } else {
            right_index += 1;
        }

        if left_index >= left_positions.len() || right_index >= right_positions.len() {
            // finish rest
            if left_index >= left_positions.len() {
                let left_val = *left_positions.last().unwrap();
                let slop_so_far: u8 = *left_slops.last().unwrap_or(&0);
                for right_val in &right_positions[right_index..] {
                    let new_slop = left_val.abs_diff(*right_val) + slop_so_far as u32;
                    if new_slop <= max_slop {
                        add_val(
                            (saturate_slop(new_slop), *right_val),
                            positions_buffer,
                            slops_buffer,
                        );
                    }
                }
            } else {
                let right_val = *right_positions.last().unwrap();
                for left_idx in left_index..left_positions.len() {
                    let left_val = left_positions[left_idx];
                    let slop_so_far = *left_slops.get(left_idx).unwrap_or(&0);
                    let new_slop = left_val.abs_diff(right_val) + slop_so_far as u32;
                    if new_slop <= max_slop {
                        add_val(
                            (saturate_slop(new_slop), left_val),
                            positions_buffer,
                            slops_buffer,
                        );
                    }
                }
            };

            break;
        }
    }
    if update_left {
        std::mem::swap(left_positions, positions_buffer);
        std::mem::swap(left_slops, slops_buffer);
        positions_buffer.clear();
        slops_buffer.clear();
    }

    count
}

impl<TPostings: Postings> PhraseScorer<TPostings> {
    /// Creates a phrase scorer from `(offset, postings)` pairs, without any extra offset.
    ///
    /// If `similarity_weight_opt` is `None`, then scoring is disabled.
    pub fn new(
        term_postings: Vec<(usize, TPostings)>,
        similarity_weight_opt: Option<Bm25Weight>,
        fieldnorm_reader: FieldNormReader,
        slop: u32,
    ) -> PhraseScorer<TPostings> {
        Self::new_with_offset(
            term_postings,
            similarity_weight_opt,
            fieldnorm_reader,
            slop,
            0,
        )
    }

    /// Creates a phrase scorer from `(offset, postings)` pairs.
    ///
    /// Each postings list is read with the position offset `max_offset - term_offset`, where
    /// `max_offset` is the largest term offset plus `offset`. The scorer is positioned on
    /// its first matching document (or is terminated) when this function returns.
    pub(crate) fn new_with_offset(
        term_postings_with_offset: Vec<(usize, TPostings)>,
        similarity_weight_opt: Option<Bm25Weight>,
        fieldnorm_reader: FieldNormReader,
        slop: u32,
        offset: usize,
    ) -> PhraseScorer<TPostings> {
        let num_docs = fieldnorm_reader.num_docs();
        let max_offset = term_postings_with_offset
            .iter()
            .map(|&(offset, _)| offset)
            .max()
            .unwrap_or(0)
            + offset;
        let num_docsets = term_postings_with_offset.len();
        let postings_with_offsets = term_postings_with_offset
            .into_iter()
            .map(|(offset, postings)| {
                PostingsWithOffset::new(postings, (max_offset - offset) as u32)
            })
            .collect::<Vec<_>>();
        let intersection_docset = Intersection::new(postings_with_offsets, num_docs);
        let mut scorer = PhraseScorer {
            intersection_docset,
            num_terms: num_docsets,
            left_positions: Vec::with_capacity(100),
            right_positions: Vec::with_capacity(100),
            phrase_count: 0u32,
            similarity_weight_opt,
            fieldnorm_reader,
            slop,
            left_slops: Vec::with_capacity(100),
            slops_buffer: Vec::with_capacity(100),
            positions_buffer: Vec::with_capacity(100),
        };
        // The first document of the intersection is only a candidate: move on if it does not
        // contain the phrase.
        if scorer.doc() != TERMINATED && !scorer.phrase_match() {
            scorer.advance();
        }
        scorer
    }

    /// Phrase count recorded for the current document.
    ///
    /// It is only updated when scoring is enabled.
    pub fn phrase_count(&self) -> u32 {
        self.phrase_count
    }

    /// Intersects the left positions with the right positions in place and returns the result.
    pub(crate) fn get_intersection(&mut self) -> &[u32] {
        intersection(&mut self.left_positions, &self.right_positions);
        &self.left_positions
    }

    /// Checks whether the current document contains the phrase.
    ///
    /// With scoring enabled the phrase count is computed and stored; otherwise only the
    /// existence of a match is checked.
    fn phrase_match(&mut self) -> bool {
        if self.similarity_weight_opt.is_some() {
            let count = self.compute_phrase_count();
            self.phrase_count = count;
            count > 0u32
        } else {
            self.phrase_exists()
        }
    }

    /// Checks whether the current document contains the phrase, without counting matches.
    fn phrase_exists(&mut self) -> bool {
        self.compute_phrase_match();
        if !self.has_slop() {
            return intersection_exists(&self.left_positions, &self.right_positions[..]);
        }
        if self.num_terms > 2 {
            // The slop already spent on the previous terms is recorded in `left_slops` and
            // must be charged against the budget for the last term too. Otherwise a document
            // is accepted here that `compute_phrase_count` rejects, i.e. the matching
            // documents would depend on whether scoring is enabled.
            intersection_count_with_carrying_slop(
                &mut self.left_positions,
                &mut self.left_slops,
                &self.right_positions[..],
                self.slop,
                false,
                &mut self.positions_buffer,
                &mut self.slops_buffer,
            ) > 0
        } else {
            intersection_exists_with_slop(
                &self.left_positions,
                &self.right_positions[..],
                self.slop,
            )
        }
    }

    /// Counts the phrase matches in the current document.
    fn compute_phrase_count(&mut self) -> u32 {
        self.compute_phrase_match();
        if self.has_slop() {
            if self.num_terms > 2 {
                intersection_count_with_carrying_slop(
                    &mut self.left_positions,
                    &mut self.left_slops,
                    &self.right_positions[..],
                    self.slop,
                    false,
                    &mut self.positions_buffer,
                    &mut self.slops_buffer,
                )
            } else {
                intersection_count_with_slop(
                    &mut self.left_positions,
                    &self.right_positions[..],
                    self.slop,
                    false,
                ) as u32
            }
        } else {
            intersection_count(&self.left_positions, &self.right_positions[..]) as u32
        }
    }

    /// Prepares `left_positions` and `right_positions` for the final intersection.
    ///
    /// The positions of the first term are intersected with those of every term but the last
    /// one; the positions of the last term are then loaded into `right_positions`.
    /// Returns early, without loading the last term, as soon as `left_positions` is empty.
    fn compute_phrase_match(&mut self) {
        self.intersection_docset
            .docset_mut_specialized(0)
            .positions(&mut self.left_positions);
        if self.has_slop() {
            // No slop has been spent yet: an empty `left_slops` stands for a slop of 0.
            self.left_slops.clear();
        }
        // This loop only runs when there are more than two terms, so the slop variant
        // needed here is always the slop-carrying one.
        for i in 1..self.num_terms - 1 {
            self.intersection_docset
                .docset_mut_specialized(i)
                .positions(&mut self.right_positions);
            if self.has_slop() {
                intersection_count_with_carrying_slop(
                    &mut self.left_positions,
                    &mut self.left_slops,
                    &self.right_positions[..],
                    self.slop,
                    true,
                    &mut self.positions_buffer,
                    &mut self.slops_buffer,
                );
            } else {
                intersection(&mut self.left_positions, &self.right_positions);
            }
            if self.left_positions.is_empty() {
                return;
            }
        }
        self.intersection_docset
            .docset_mut_specialized(self.num_terms - 1)
            .positions(&mut self.right_positions);
    }

    /// Whether a non-zero slop was requested.
    fn has_slop(&self) -> bool {
        self.slop > 0
    }
}

impl<TPostings: Postings> DocSet for PhraseScorer<TPostings> {
    /// Moves to the next document of the intersection that contains the phrase.
    fn advance(&mut self) -> DocId {
        let mut candidate = self.intersection_docset.advance();
        while candidate != TERMINATED && !self.phrase_match() {
            candidate = self.intersection_docset.advance();
        }
        candidate
    }

    /// Seeks the intersection to `target`, then moves on until a document contains the phrase.
    fn seek(&mut self, target: DocId) -> DocId {
        debug_assert!(target >= self.doc());
        let candidate = self.intersection_docset.seek(target);
        if candidate != TERMINATED && !self.phrase_match() {
            self.advance()
        } else {
            candidate
        }
    }

    /// Seeks the intersection with `seek_danger` and, when it reports `Found`, additionally
    /// checks the phrase itself.
    fn seek_danger(&mut self, target: DocId) -> SeekDangerResult {
        debug_assert!(
            target >= self.doc(),
            "target ({}) should be greater than or equal to doc ({})",
            target,
            self.doc()
        );
        let intersection_result = self.intersection_docset.seek_danger(target);
        if intersection_result == SeekDangerResult::Found {
            // All terms are present in the document. Now check that they form the phrase.
            if self.phrase_match() {
                SeekDangerResult::Found
            } else {
                SeekDangerResult::SeekLowerBound(target + 1)
            }
        } else {
            intersection_result
        }
    }

    /// Current document of the underlying intersection.
    fn doc(&self) -> DocId {
        self.intersection_docset.doc()
    }

    fn size_hint(&self) -> u32 {
        // The intersection estimate is scaled down, since actual phrase hits are much rarer
        // than documents in which all the terms merely appear.
        // The estimate should depend on the average field length, e.g. if the field is really
        // short a phrase hit is more likely.
        let scale_down = 10 * self.num_terms as u32;
        self.intersection_docset.size_hint() / scale_down
    }

    /// Returns a best-effort hint of the
    /// cost to drive the docset.
    fn cost(&self) -> u64 {
        // While determining a potential hit is cheap for phrases, evaluating an actual hit is
        // expensive since it requires loading the positions of a doc and checking whether they
        // are next to each other.
        // So the cost estimate is the number of docs we need to check * 10 * self.num_terms.
        let num_candidates = self.intersection_docset.size_hint() as u64;
        num_candidates * 10 * self.num_terms as u64
    }
}

impl<TPostings: Postings> Scorer for PhraseScorer<TPostings> {
    /// Scores the current document from its fieldnorm id and phrase count, or returns `1.0`
    /// when scoring is disabled.
    #[inline]
    fn score(&mut self) -> Score {
        let fieldnorm_id = self.fieldnorm_reader.fieldnorm_id(self.doc());
        match &self.similarity_weight_opt {
            Some(similarity_weight) => similarity_weight.score(fieldnorm_id, self.phrase_count),
            None => 1.0f32,
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Checks the slop-free intersection of `left` and `right` in both argument orders.
    fn test_intersection_sym(left: &[u32], right: &[u32], expected: &[u32]) {
        test_intersection_aux(left, right, expected, 0);
        test_intersection_aux(right, left, expected, 0);
    }

    /// Checks `intersection` / `intersection_count` when `slop` is 0, and
    /// `intersection_count_with_slop` (updating the left side) otherwise.
    fn test_intersection_aux(left: &[u32], right: &[u32], expected: &[u32], slop: u32) {
        let mut left_vec = Vec::from(left);
        if slop == 0 {
            assert_eq!(intersection_count(&left_vec, right), expected.len());
            intersection(&mut left_vec, right);
            assert_eq!(&left_vec, expected);
        } else {
            let mut right_vec = Vec::from(right);
            let right_mut = &mut right_vec[..];
            intersection_count_with_slop(&mut left_vec, right_mut, slop, true);
            assert_eq!(&left_vec, expected);
        }
    }

    #[test]
    fn test_intersection() {
        test_intersection_sym(&[1], &[1], &[1]);
        test_intersection_sym(&[1], &[2], &[]);
        test_intersection_sym(&[], &[2], &[]);
        test_intersection_sym(&[5, 7], &[1, 5, 10, 12], &[5]);
        test_intersection_sym(&[1, 5, 6, 9, 10, 12], &[6, 8, 9, 12], &[6, 9, 12]);
    }
    #[test]
    fn test_slop() {
        // `intersection_count_with_slop` compares positions with `abs_diff`, so the right
        // position may lie before or after the left one (e.g. left 11 matches right 10 below).
        // The expected output holds the right-hand position of every match.
        test_intersection_aux(&[1], &[2], &[2], 1);
        test_intersection_aux(&[1], &[3], &[], 1);
        test_intersection_aux(&[1], &[3], &[3], 2);
        test_intersection_aux(&[], &[2], &[], 100000);
        test_intersection_aux(&[5, 7, 11], &[1, 5, 10, 12], &[5, 10], 1);
        test_intersection_aux(&[1, 5, 6, 9, 10, 12], &[6, 8, 9, 12], &[6, 8, 9, 12], 1);
        test_intersection_aux(&[1, 5, 6, 9, 10, 12], &[6, 8, 9, 12], &[6, 8, 9, 12], 10);
        test_intersection_aux(&[1, 3, 5], &[2, 4, 6], &[2, 4, 6], 1);
        test_intersection_aux(&[1, 3, 5], &[2, 4, 6], &[], 0);
    }

    /// Runs `intersection_count_with_slop` with `update_left` set and checks the updated left
    /// side.
    fn test_merge(left: &[u32], right: &[u32], expected_left: &[u32], slop: u32) {
        let mut left_vec = Vec::from(left);
        let mut right_vec = Vec::from(right);
        let right_mut = &mut right_vec[..];
        intersection_count_with_slop(&mut left_vec, right_mut, slop, true);
        assert_eq!(&left_vec, expected_left);
    }

    #[test]
    fn test_merge_slop() {
        test_merge(&[1, 2], &[1], &[1], 1);
        test_merge(&[3], &[4], &[4], 2);
        test_merge(&[3], &[4], &[4], 2);
        test_merge(&[1, 5, 6, 9, 10, 12], &[6, 8, 9, 12], &[6, 8, 9, 12], 10);
    }

    /// Folds `right[1..]` into `right[0]` with `intersection_count_with_carrying_slop`.
    ///
    /// `expected` lists the resulting `(slop, position)` pairs and `expected_count` is the
    /// count returned by the last intersection.
    fn test_carry_slop_intersection_aux(
        right: &[&[u32]],
        expected: &[(u8, u32)],
        slop: u32,
        expected_count: u32,
    ) {
        let mut left_vec = right[0].to_vec();
        let mut slops = vec![0; left_vec.len()];
        let mut count = 0;
        for right in &right[1..] {
            count = intersection_count_with_carrying_slop(
                &mut left_vec,
                &mut slops,
                right,
                slop,
                true,
                &mut Vec::new(),
                &mut Vec::new(),
            );
        }
        let out: Vec<(u8, u32)> = slops
            .iter()
            .cloned()
            .zip(left_vec.iter().cloned())
            .collect();
        assert_eq!(&out, expected);
        assert_eq!(count, expected_count);
    }

    #[test]
    fn test_carry_slop_intersection() {
        test_carry_slop_intersection_aux(&[&[1], &[]], &[], 1, 0);
        test_carry_slop_intersection_aux(&[&[1], &[2]], &[(1, 1), (1, 2)], 1, 1);
        test_carry_slop_intersection_aux(&[&[1], &[3]], &[], 1, 0);
        test_carry_slop_intersection_aux(&[&[1], &[2]], &[(1, 1), (1, 2)], 1, 1);

        // The order may still matter
        test_carry_slop_intersection_aux(&[&[1], &[2], &[2]], &[(1, 2)], 1, 1);
        test_carry_slop_intersection_aux(&[&[2], &[1], &[2]], &[(1, 2)], 1, 1);
        test_carry_slop_intersection_aux(&[&[2], &[2], &[1]], &[(1, 1), (1, 2)], 1, 1);

        test_carry_slop_intersection_aux(&[&[2], &[2], &[1], &[2]], &[(1, 2)], 1, 1);
        test_carry_slop_intersection_aux(&[&[1], &[2], &[2], &[2]], &[(1, 2)], 1, 1);

        test_carry_slop_intersection_aux(&[&[1], &[2], &[1]], &[(1, 1)], 1, 1);

        test_carry_slop_intersection_aux(&[&[11], &[10, 12]], &[(1, 10), (1, 11), (1, 12)], 1, 1);
        test_carry_slop_intersection_aux(&[&[10, 12], &[11]], &[(1, 10), (1, 11), (1, 12)], 1, 1);

        test_carry_slop_intersection_aux(
            &[&[5, 7, 11], &[1, 5, 10, 12]],
            &[(0, 5), (1, 10), (1, 11), (1, 12)],
            1,
            2,
        );
    }
}

#[cfg(all(test, feature = "unstable"))]
mod bench {

    use test::Bencher;

    use super::*;

    /// Plain intersection followed by a slop-carrying intersection on short inputs.
    #[bench]
    fn bench_intersection_short_slop_carrying(b: &mut Bencher) {
        let mut left = Vec::new();
        let mut left_slops = Vec::new();
        let mut buffer = Vec::new();
        let mut slop_buffer = Vec::new();
        b.iter(|| {
            left.clear();
            left.extend_from_slice(&[1, 5, 10, 12]);
            // Reset the slops as well: the previous iteration left its output in here.
            left_slops.clear();
            left_slops.extend_from_slice(&[0, 0, 0, 0]);
            let right = [5, 7];
            intersection(&mut left, &right);

            intersection_count_with_carrying_slop(
                &mut left,
                &mut left_slops,
                &right,
                2,
                true,
                &mut buffer,
                &mut slop_buffer,
            )
        });
    }

    /// Plain in-place intersection on short inputs.
    #[bench]
    fn bench_intersection_short(b: &mut Bencher) {
        let mut left = Vec::new();
        b.iter(|| {
            left.clear();
            left.extend_from_slice(&[1, 5, 10, 12]);
            let right = [5, 7];
            intersection(&mut left, &right);
        });
    }

    /// Slop-carrying intersection of 100 left positions with 4 right positions.
    #[bench]
    fn bench_intersection_medium_slop_carrying(b: &mut Bencher) {
        let mut left = Vec::new();
        let mut left_slops: Vec<u8> = Vec::new();
        let mut buffer = Vec::new();
        let mut slop_buffer = Vec::new();
        let left_data: Vec<u32> = (0..100).collect();
        let left_slop_data: Vec<u8> = (0..100).map(|_| 0).collect();

        b.iter(|| {
            left.clear();
            left.extend_from_slice(&left_data);
            left_slops.clear();
            left_slops.extend_from_slice(&left_slop_data);
            let right = [5, 7, 55, 200];

            intersection_count_with_carrying_slop(
                &mut left,
                &mut left_slops,
                &right,
                2,
                true,
                &mut buffer,
                &mut slop_buffer,
            )
        });
    }

    /// Slop intersection (without carried slop) of 100 left positions with 4 right positions.
    #[bench]
    fn bench_intersection_medium_slop(b: &mut Bencher) {
        let mut left = Vec::new();
        let left_data: Vec<u32> = (0..100).collect();

        b.iter(|| {
            left.clear();
            left.extend_from_slice(&left_data);
            let right = [5, 7, 55, 200];
            intersection_count_with_slop(&mut left, &right[..], 2, true) as u32
        });
    }

    /// Plain in-place intersection of 100 left positions with 4 right positions.
    #[bench]
    fn bench_intersection_medium(b: &mut Bencher) {
        let mut left = Vec::new();
        let left_data: Vec<u32> = (0..100).collect();
        b.iter(|| {
            left.clear();
            left.extend_from_slice(&left_data);
            let right = [5, 7, 55, 200];
            intersection(&mut left, &right);
        });
    }

    /// Counting intersection on short inputs.
    #[bench]
    fn bench_intersection_count_short(b: &mut Bencher) {
        b.iter(|| {
            let left = [1, 5, 10, 12];
            let right = [5, 7];
            // Return the count so that the computation is not discarded as dead code.
            intersection_count(&left, &right)
        });
    }
}


================================================
FILE: src/query/phrase_query/phrase_weight.rs
================================================
use super::PhraseScorer;
use crate::fieldnorm::FieldNormReader;
use crate::index::SegmentReader;
use crate::postings::SegmentPostings;
use crate::query::bm25::Bm25Weight;
use crate::query::explanation::does_not_match;
use crate::query::{EmptyScorer, Explanation, Scorer, Weight};
use crate::schema::{IndexRecordOption, Term};
use crate::{DocId, DocSet, Score};

/// Weight associated with a phrase query.
///
/// It builds a `PhraseScorer` from the postings of each phrase term.
pub struct PhraseWeight {
    /// `(offset, term)` pairs making up the phrase.
    phrase_terms: Vec<(usize, Term)>,
    /// BM25 weight used for scoring; `None` means scoring is disabled.
    similarity_weight_opt: Option<Bm25Weight>,
    /// Slop handed to the `PhraseScorer`; 0 unless changed through `slop()`.
    slop: u32,
}

impl PhraseWeight {
    /// Builds a `PhraseWeight` for the given `(offset, term)` pairs.
    ///
    /// Passing `None` as `similarity_weight_opt` disables scoring.
    pub fn new(
        phrase_terms: Vec<(usize, Term)>,
        similarity_weight_opt: Option<Bm25Weight>,
    ) -> PhraseWeight {
        PhraseWeight {
            phrase_terms,
            similarity_weight_opt,
            // A fresh weight starts without slop; `slop()` can raise it afterwards.
            slop: 0,
        }
    }

    /// Returns the fieldnorm reader of the phrase's field for this segment.
    ///
    /// The field is taken from the first phrase term. When scoring is disabled, or when the
    /// segment has no fieldnorms for that field, a constant reader with value 1 is returned.
    fn fieldnorm_reader(&self, reader: &SegmentReader) -> crate::Result<FieldNormReader> {
        let field = self.phrase_terms[0].1.field();
        // Fieldnorms are only looked up when scoring is enabled.
        let segment_fieldnorms = if self.similarity_weight_opt.is_some() {
            reader.fieldnorms_readers().get_field(field)?
        } else {
            None
        };
        Ok(match segment_fieldnorms {
            Some(fieldnorm_reader) => fieldnorm_reader,
            None => FieldNormReader::constant(reader.max_doc(), 1),
        })
    }

    pub(crate) fn phrase_scorer(
        &self,
        reader: &SegmentReader,
        boost: Score,
    ) -> crate::Result<Option<PhraseScorer<SegmentPostings>>> {
        let similarity_weight_opt = self
            .similarity_weight_opt
            .as_ref()
            .map(|similarity_weight| similarity_weight.boost_by(boost));
        let fieldnorm_reader = self.fieldnorm_reader(reader)?;
        let mut term_postings_list = Vec::new();
        for &(offset, ref term) in &self.phrase_terms {
            if let Some(postings) = reader
                .inverted_index(term.field())?
                .read_postings(term, IndexRecordOption::WithFreqsAndPositions)?
            {
                term_postings_list.push((offset, postings));
            } else {
                return Ok(None);
            }
        }
        Ok(Some(PhraseScorer::new(
            term_postings_list,
            similarity_weight_opt,
            fieldnorm_reader,
            self.slop,
        )))
    }

    /// Sets the slop that is handed to the `PhraseScorer` built by this weight.
    pub fn slop(&mut self, slop: u32) {
        self.slop = slop;
    }
}

impl Weight for PhraseWeight {
    /// Returns the phrase scorer for this segment, or an `EmptyScorer` when
    /// `phrase_scorer` reports that nothing can match.
    fn scorer(&self, reader: &SegmentReader, boost: Score) -> crate::Result<Box<dyn Scorer>> {
        let boxed_scorer: Box<dyn Scorer> = match self.phrase_scorer(reader, boost)? {
            Some(phrase_scorer) => Box::new(phrase_scorer),
            None => Box::new(EmptyScorer),
        };
        Ok(boxed_scorer)
    }

    /// Explains the score of `doc` for this phrase weight.
    ///
    /// The scorer is built with a boost of `1.0`. When scoring is enabled, the BM25
    /// explanation for the document's fieldnorm id and phrase count is attached as a detail.
    ///
    /// # Errors
    /// Returns a "does not match" error when no phrase scorer can be built for this segment
    /// or when seeking the scorer to `doc` lands on another document. Errors from building
    /// the scorer or reading the fieldnorms are propagated.
    fn explain(&self, reader: &SegmentReader, doc: DocId) -> crate::Result<Explanation> {
        // Bind the scorer directly instead of checking `is_none()` and unwrapping afterwards.
        let mut scorer = match self.phrase_scorer(reader, 1.0)? {
            Some(scorer) => scorer,
            None => return Err(does_not_match(doc)),
        };
        if scorer.seek(doc) != doc {
            return Err(does_not_match(doc));
        }
        let fieldnorm_reader = self.fieldnorm_reader(reader)?;
        let fieldnorm_id = fieldnorm_reader.fieldnorm_id(doc);
        let phrase_count = scorer.phrase_count();
        let mut explanation = Explanation::new("Phrase Scorer", scorer.score());
        if let Some(similarity_weight) = self.similarity_weight_opt.as_ref() {
            explanation.add_detail(similarity_weight.explain(fieldnorm_id, phrase_count));
        }
        Ok(explanation)
    }
}

#[cfg(test)]
mod tests {
    use super::super::tests::create_index;
    use crate::docset::TERMINATED;
    use crate::query::{EnableScoring, PhraseQuery};
    use crate::{DocSet, Term};

    /// The phrase "a b" matches doc 1 twice and doc 2 once; doc 0 does not match.
    #[test]
    pub fn test_phrase_count() -> crate::Result<()> {
        let index = create_index(&["a c", "a a b d a b c", " a b"])?;
        let text_field = index.schema().get_field("text").unwrap();
        let searcher = index.reader()?.searcher();
        let phrase_query = PhraseQuery::new(vec![
            Term::from_field_text(text_field, "a"),
            Term::from_field_text(text_field, "b"),
        ]);
        let phrase_weight = phrase_query
            .phrase_weight(EnableScoring::enabled_from_searcher(&searcher))
            .unwrap();
        let mut phrase_scorer = phrase_weight
            .phrase_scorer(searcher.segment_reader(0u32), 1.0)?
            .unwrap();

        // (current doc, phrase count in that doc, doc returned by the following `advance`)
        let expected_steps = [(1, 2, 2), (2, 1, TERMINATED)];
        for &(doc, phrase_count, next_doc) in &expected_steps {
            assert_eq!(phrase_scorer.doc(), doc);
            assert_eq!(phrase_scorer.phrase_count(), phrase_count);
            assert_eq!(phrase_scorer.advance(), next_doc);
        }
        Ok(())
    }
}


================================================
FILE: src/query/phrase_query/regex_phrase_query.rs
================================================
use super::regex_phrase_weight::RegexPhraseWeight;
use crate::query::bm25::Bm25Weight;
use crate::query::{EnableScoring, Query, Weight};
use crate::schema::{Field, IndexRecordOption, Term, Type};

/// `RegexPhraseQuery` matches a specific sequence of regex queries.
///
/// For instance, the phrase query for `"pa.* time"` will match
/// the sentence:
///
/// **Alan just got a part time job.**
///
/// On the other hand, it will not match the sentence:
///
/// **This is my favorite part of the job.**
///
/// [Slop](RegexPhraseQuery::set_slop) allows leniency in term proximity
/// for some performance trade-off.
///
/// Using a `RegexPhraseQuery` on a field requires positions
/// to be indexed for this field.
#[derive(Clone, Debug)]
pub struct RegexPhraseQuery {
    /// Field targeted by every regex of the phrase.
    field: Field,
    /// `(offset, regex)` pairs, kept sorted by offset by the constructor.
    phrase_terms: Vec<(usize, String)>,
    /// Slop allowed for the phrase, see `set_slop`.
    slop: u32,
    /// Limit on the number of terms the regexes may expand to, see `set_max_expansions`.
    max_expansions: u32,
}

/// Converts a wildcard query into a regex string.
///
/// Every `*` becomes `.*`, e.g. `AB*CD` is converted to `AB.*CD`.
///
/// All other characters are regex escaped.
pub fn wildcard_query_to_regex_str(term: &str) -> String {
    // Escaping turns each `*` into `\*`; those escaped stars are then rewritten to `.*`.
    let escaped = regex::escape(term);
    escaped.replace(r"\*", ".*")
}

impl RegexPhraseQuery {
    /// Creates a new `RegexPhraseQuery` given a list of terms.
    ///
    /// There must be at least two terms, and all terms
    /// must belong to the same field.
    ///
    /// Offset for each term will be same as index in the Vector
    pub fn new(field: Field, terms: Vec<String>) -> RegexPhraseQuery {
        let terms_with_offset = terms.into_iter().enumerate().collect();
        RegexPhraseQuery::new_with_offset(field, terms_with_offset)
    }

    /// Creates a new `RegexPhraseQuery` given a list of terms and their offsets.
    ///
    /// Can be used to provide custom offset for each term.
    pub fn new_with_offset(field: Field, terms: Vec<(usize, String)>) -> RegexPhraseQuery {
        RegexPhraseQuery::new_with_offset_and_slop(field, terms, 0)
    }

    /// Creates a new `RegexPhraseQuery` from regex terms, their offsets and a slop.
    ///
    /// The terms are sorted by offset, and the maximum number of expansions defaults to
    /// `1 << 14`.
    ///
    /// # Panics
    /// Panics if fewer than two terms are given.
    pub fn new_with_offset_and_slop(
        field: Field,
        mut terms: Vec<(usize, String)>,
        slop: u32,
    ) -> RegexPhraseQuery {
        let num_terms = terms.len();
        assert!(
            num_terms > 1,
            "A phrase query is required to have strictly more than one term."
        );
        terms.sort_by_key(|entry| entry.0);
        let max_expansions = 1 << 14;
        RegexPhraseQuery {
            field,
            phrase_terms: terms,
            slop,
            max_expansions,
        }
    }

    /// Slop allowed for the phrase.
    ///
    /// The query will match if its terms are separated by `slop` terms at most.
    /// The slop can be considered a budget between all terms.
    /// E.g. "A B C" with slop 1 allows "A X B C", "A B X C", but not "A X B X C".
    ///
    /// Transposition costs 2, e.g. "A B" with slop 1 will not match "B A" but it would with
    /// slop 2. Transposition is not a special case: in the example above A is moved 1 position
    /// and B is moved 1 position, so the slop is 2.
    ///
    /// As a result slop works in both directions, so the order of the terms may change as long
    /// as they respect the slop.
    ///
    /// By default the slop is 0, meaning query terms need to be adjacent.
    pub fn set_slop(&mut self, value: u32) {
        self.slop = value;
    }

    /// Sets the maximum number of terms the regexes of the phrase may expand to.
    ///
    /// The limit applies to the total over all regex terms of the phrase.
    /// Once the limit is exceeded, an error is returned.
    pub fn set_max_expansions(&mut self, value: u32) {
        self.max_expansions = value;
    }

    /// Returns the [`Field`] this `RegexPhraseQuery` is targeting.
    pub fn field(&self) -> Field {
        self.field
    }

    /// Returns one text `Term` per regex of the phrase, without the associated offsets.
    ///
    /// Each term is built from the raw regex string on the query's field.
    pub fn phrase_terms(&self) -> Vec<Term> {
        let mut terms = Vec::with_capacity(self.phrase_terms.len());
        for (_, pattern) in &self.phrase_terms {
            terms.push(Term::from_field_text(self.field, pattern));
        }
        terms
    }

    /// Returns the [`RegexPhraseWeight`] for the given phrase query given a specific `searcher`.
    ///
    /// This function is the same as [`Query::weight()`] except it returns
    /// a specialized type [`RegexPhraseWeight`] instead of a Boxed trait.
    ///
    /// # Errors
    /// Returns a `SchemaError` if the field is not of type `Str` or does not have positions
    /// indexed. Errors raised while computing the BM25 weight are propagated.
    pub(crate) fn regex_phrase_weight(
        &self,
        enable_scoring: EnableScoring<'_>,
    ) -> crate::Result<RegexPhraseWeight> {
        let schema = enable_scoring.schema();
        // Look the field entry up once; both validations below rely on it.
        let field_entry = schema.get_field_entry(self.field);
        let field_type = field_entry.field_type().value_type();
        if field_type != Type::Str {
            return Err(crate::TantivyError::SchemaError(format!(
                "RegexPhraseQuery can only be used with a field of type text currently, but got \
                 {field_type:?}"
            )));
        }

        let has_positions = field_entry
            .field_type()
            .get_index_record_option()
            .map(IndexRecordOption::has_positions)
            .unwrap_or(false);
        if !has_positions {
            let field_name = field_entry.name();
            return Err(crate::TantivyError::SchemaError(format!(
                "Applied phrase query on field {field_name:?}, which does not have positions \
                 indexed"
            )));
        }
        let bm25_weight_opt = match enable_scoring {
            EnableScoring::Enabled {
                statistics_provider,
                ..
            } => {
                // The terms only serve the BM25 statistics, so they are not built when
                // scoring is disabled.
                let terms = self.phrase_terms();
                Some(Bm25Weight::for_terms(statistics_provider, &terms)?)
            }
            EnableScoring::Disabled { .. } => None,
        };
        let weight = RegexPhraseWeight::new(
            self.field,
            self.phrase_terms.clone(),
            bm25_weight_opt,
            self.max_expansions,
            self.slop,
        );
        Ok(weight)
    }
}

impl Query for RegexPhraseQuery {
    /// Creates the weight associated with this query.
    ///
    /// The specialized weight from `regex_phrase_weight` is boxed as a [`Weight`].
    fn weight(&self, enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let boxed_weight: Box<dyn Weight> = Box::new(self.regex_phrase_weight(enable_scoring)?);
        Ok(boxed_weight)
    }
}


================================================
FILE: src/query/phrase_query/regex_phrase_weight.rs
================================================
use std::sync::Arc;

use common::BitSet;
use tantivy_fst::Regex;

use super::PhraseScorer;
use crate::fieldnorm::FieldNormReader;
use crate::index::SegmentReader;
use crate::postings::{LoadedPostings, Postings, SegmentPostings, TermInfo};
use crate::query::bm25::Bm25Weight;
use crate::query::explanation::does_not_match;
use crate::query::union::{BitSetPostingUnion, SimpleUnion};
use crate::query::{AutomatonWeight, BitSetDocSet, EmptyScorer, Explanation, Scorer, Weight};
use crate::schema::{Field, IndexRecordOption};
use crate::{DocId, DocSet, InvertedIndexReader, Score};

/// Postings type fed to the `PhraseScorer` for each regex term: a union over boxed `Postings`.
type UnionType = SimpleUnion<Box<dyn Postings + 'static>>;

/// The `RegexPhraseWeight` is the weight associated to a regex phrase query.
/// See `RegexPhraseWeight::get_union_from_term_infos` for some design decisions.
pub struct RegexPhraseWeight {
    /// Field targeted by every regex of the phrase.
    field: Field,
    /// `(offset, regex)` pairs making up the phrase.
    phrase_terms: Vec<(usize, String)>,
    /// BM25 weight used for scoring; `None` means scoring is disabled.
    similarity_weight_opt: Option<Bm25Weight>,
    /// Slop handed to the `PhraseScorer`.
    slop: u32,
    /// Maximum number of matched terms, summed over all regexes, before an error is returned.
    max_expansions: u32,
}

impl RegexPhraseWeight {
    /// Creates a new phrase weight.
    /// If `similarity_weight_opt` is None, then scoring is disabled
    pub fn new(
        field: Field,
        phrase_terms: Vec<(usize, String)>,
        similarity_weight_opt: Option<Bm25Weight>,
        max_expansions: u32,
        slop: u32,
    ) -> RegexPhraseWeight {
        RegexPhraseWeight {
            field,
            phrase_terms,
            similarity_weight_opt,
            slop,
            max_expansions,
        }
    }

    /// Returns the fieldnorm reader of the phrase's field for this segment.
    ///
    /// When scoring is disabled, or when the segment has no fieldnorms for the field, a
    /// constant reader with value 1 is returned.
    fn fieldnorm_reader(&self, reader: &SegmentReader) -> crate::Result<FieldNormReader> {
        // Without a similarity weight the fieldnorms are never looked up.
        if self.similarity_weight_opt.is_none() {
            return Ok(FieldNormReader::constant(reader.max_doc(), 1));
        }
        match reader.fieldnorms_readers().get_field(self.field)? {
            Some(fieldnorm_reader) => Ok(fieldnorm_reader),
            None => Ok(FieldNormReader::constant(reader.max_doc(), 1)),
        }
    }

    /// Builds the `PhraseScorer` for one segment.
    ///
    /// Each regex of the phrase is expanded to the terms it matches in the segment, and the
    /// postings of those terms are merged into one union per regex.
    ///
    /// Returns `Ok(None)` as soon as one regex matches no term, since the phrase cannot match.
    ///
    /// # Errors
    /// Returns an `InvalidArgument` error if a regex is invalid or if the number of matched
    /// terms, summed over the regexes, exceeds `max_expansions`.
    pub(crate) fn phrase_scorer(
        &self,
        reader: &SegmentReader,
        boost: Score,
    ) -> crate::Result<Option<PhraseScorer<UnionType>>> {
        let boosted_weight_opt = self
            .similarity_weight_opt
            .as_ref()
            .map(|weight| weight.boost_by(boost));
        let fieldnorm_reader = self.fieldnorm_reader(reader)?;
        let inverted_index = reader.inverted_index(self.field)?;
        let max_expansions = self.max_expansions as usize;
        let mut posting_lists = Vec::new();
        // Running total of matched terms across all regexes of the phrase.
        let mut num_terms = 0;
        for (offset, pattern) in &self.phrase_terms {
            let regex = Regex::new(pattern)
                .map_err(|e| crate::TantivyError::InvalidArgument(format!("Invalid regex: {e}")))?;
            let automaton: AutomatonWeight<Regex> =
                AutomatonWeight::new(self.field, Arc::new(regex));
            let term_infos = automaton.get_match_term_infos(reader)?;
            // A regex without any matching term rules out every phrase match.
            if term_infos.is_empty() {
                return Ok(None);
            }
            num_terms += term_infos.len();
            if num_terms > max_expansions {
                return Err(crate::TantivyError::InvalidArgument(format!(
                    "Phrase query exceeded max expansions {num_terms}"
                )));
            }
            let union = Self::get_union_from_term_infos(&term_infos, reader, &inverted_index)?;
            posting_lists.push((*offset, union));
        }

        let scorer = PhraseScorer::new(
            posting_lists,
            boosted_weight_opt,
            fieldnorm_reader,
            self.slop,
        );
        Ok(Some(scorer))
    }

    /// Inserts every doc id of the term described by `term_info` into `doc_bitset`.
    ///
    /// The postings are read block by block with `IndexRecordOption::Basic`; an empty block
    /// marks the end of the postings.
    fn add_to_bitset(
        inverted_index: &InvertedIndexReader,
        term_info: &TermInfo,
        doc_bitset: &mut BitSet,
    ) -> crate::Result<()> {
        let mut block_segment_postings = inverted_index
            .read_block_postings_from_terminfo(term_info, IndexRecordOption::Basic)?;
        loop {
            let block_docs = block_segment_postings.docs();
            if block_docs.is_empty() {
                return Ok(());
            }
            block_docs.iter().for_each(|&doc| {
                doc_bitset.insert(doc);
            });
            block_segment_postings.advance();
        }
    }

    /// This function generates a union of document sets from multiple term information
    /// (`TermInfo`).
    ///
    /// It uses bucketing based on term frequency to optimize query performance and memory usage.
    /// The terms are divided into buckets based on their document frequency (the number of
    /// documents they appear in).
    ///
    /// ### Bucketing Strategy:
    /// Once a bucket reaches 512 terms, it is moved to the end of the list and replaced
    /// with a new empty bucket.
    ///
    /// - **Sparse Term Buckets**: Terms with document frequency `< 100`.
    ///
    ///   Each sparse bucket contains:
    ///   - A `BitSet` to efficiently track which document IDs are present in the bucket, which is
    ///     used to drive the `DocSet`.
    ///   - A `Vec<LoadedPostings>` to store the postings for each term in that bucket.
    ///
    /// - **Other Term Buckets**:
    ///   - **Bucket 0**: Terms appearing in less than `0.1%` of documents.
    ///   - **Bucket 1**: Terms appearing in `0.1%` to `1%` of documents.
    ///   - **Bucket 2**: Terms appearing in `1%` to `10%` of documents.
    ///   - **Bucket 3**: Terms appearing in `10%` or more of documents.
    ///
    ///   Each bucket contains:
    ///   - A `BitSet` to efficiently track which document IDs are present in the bucket.
    ///   - A `Vec<SegmentPostings>` to store the postings for each term in that bucket.
    ///
    /// ### Design Choices:
    /// The main cost for an _unbucketed_ regex phrase query with a medium/high amount of terms is
    /// the `append_positions_with_offset` from `Postings`.
    /// We don't know which docsets hit, so we need to scan all of them to check if they contain the
    /// docid.
    /// The bucketing strategy groups less common DocSets together, so we can rule out the
    /// whole docset group in many cases.
    ///
    /// E.g. consider the phrase "th* world"
    /// It contains the term "the", which may occur in almost all documents.
    /// It may also contain 10_000s of very rare terms like "theologian".
    ///
    /// For very low-frequency terms (sparse terms), we use `LoadedPostings` and aggregate
    /// their document IDs into a `BitSet`, which is more memory-efficient than using
    /// `SegmentPostings`. E.g. 100_000 terms with SegmentPostings would consume 184MB.
    /// `SegmentPostings` uses memory equivalent to 460 docids. The 100 docs limit should be
    /// fine as long as a term doesn't have too many positions per doc.
    ///
    /// ### Future Optimization:
    /// A larger performance improvement would be an additional partitioning of the space
    /// vertically of u16::MAX blocks, where we mark which docset ord has values in each block.
    /// E.g. partitioning in an index with 5 million documents this would reduce the number of
    /// docsets to scan to around 1/20 in the sparse term bucket where the terms only have a few
    /// docs. For higher cardinality buckets this is irrelevant as they are in most blocks.
    ///
    /// Use Roaring Bitmaps for sparse terms. The full bitvec is main memory consumer currently.
    pub(crate) fn get_union_from_term_infos(
        term_infos: &[TermInfo],
        reader: &SegmentReader,
        inverted_index: &InvertedIndexReader,
    ) -> crate::Result<UnionType> {
        let max_doc = reader.max_doc();

        // Buckets for sparse terms.
        // Index 0 is always the bucket currently being filled; full buckets are swapped to the
        // end of the list.
        let mut sparse_buckets: Vec<(BitSet, Vec<LoadedPostings>)> =
            vec![(BitSet::with_max_value(max_doc), Vec::new())];

        // Buckets for other terms based on document frequency percentages:
        // - Bucket 0: Terms appearing in less than 0.1% of documents
        // - Bucket 1: Terms appearing in 0.1% to 1% of documents
        // - Bucket 2: Terms appearing in 1% to 10% of documents
        // - Bucket 3: Terms appearing in 10% or more of documents
        // Indices 0..4 always hold the buckets currently being filled; full buckets are swapped
        // to positions 4 and above.
        let mut buckets: Vec<(BitSet, Vec<SegmentPostings>)> = (0..4)
            .map(|_| (BitSet::with_max_value(max_doc), Vec::new()))
            .collect();

        const SPARSE_TERM_DOC_THRESHOLD: u32 = 100;

        for term_info in term_infos {
            let mut term_posting = inverted_index
                .read_postings_from_terminfo(term_info, IndexRecordOption::WithFreqsAndPositions)?;
            let num_docs = term_posting.doc_freq();

            if num_docs < SPARSE_TERM_DOC_THRESHOLD {
                let current_bucket = &mut sparse_buckets[0];
                Self::add_to_bitset(inverted_index, term_info, &mut current_bucket.0)?;
                let docset = LoadedPostings::load(&mut term_posting);
                current_bucket.1.push(docset);

                // Move the bucket to the end if the term limit is reached
                if current_bucket.1.len() == 512 {
                    sparse_buckets.push((BitSet::with_max_value(max_doc), Vec::new()));
                    let end_index = sparse_buckets.len() - 1;
                    sparse_buckets.swap(0, end_index);
                }
            } else {
                // Calculate the percentage of documents the term appears in
                let doc_freq_percentage = (num_docs as f32) / (max_doc as f32) * 100.0;

                // Determine the appropriate bucket based on percentage thresholds
                let bucket_index = if doc_freq_percentage < 0.1 {
                    0
                } else if doc_freq_percentage < 1.0 {
                    1
                } else if doc_freq_percentage < 10.0 {
                    2
                } else {
                    3
                };
                let bucket = &mut buckets[bucket_index];

                // Add term postings to the appropriate bucket
                Self::add_to_bitset(inverted_index, term_info, &mut bucket.0)?;
                bucket.1.push(term_posting);

                // Move the bucket to the end if the term limit is reached
                if bucket.1.len() == 512 {
                    buckets.push((BitSet::with_max_value(max_doc), Vec::new()));
                    let end_index = buckets.len() - 1;
                    buckets.swap(bucket_index, end_index);
                }
            }
        }

        // Build unions for sparse term buckets (buckets left empty are dropped)
        let sparse_term_docsets: Vec<_> = sparse_buckets
            .into_iter()
            .filter(|(_, postings)| !postings.is_empty())
            .map(|(bitset, postings)| {
                BitSetPostingUnion::build(postings, BitSetDocSet::from(bitset))
            })
            .collect();
        let sparse_term_unions = SimpleUnion::build(sparse_term_docsets);

        // Build unions for other term buckets (buckets left empty are dropped)
        let bitset_unions_per_bucket: Vec<_> = buckets
            .into_iter()
            .filter(|(_, postings)| !postings.is_empty())
            .map(|(bitset, postings)| {
                BitSetPostingUnion::build(postings, BitSetDocSet::from(bitset))
            })
            .collect();
        let other_union = SimpleUnion::build(bitset_unions_per_bucket);

        // The two unions have different concrete types, so they are boxed as `dyn Postings`.
        let union: SimpleUnion<Box<dyn Postings + 'static>> =
            SimpleUnion::build(vec![Box::new(sparse_term_unions), Box::new(other_union)]);

        // Return a union of sparse term unions and other term unions
        Ok(union)
    }
}

impl Weight for RegexPhraseWeight {
    /// Returns the regex phrase scorer for this segment, or an `EmptyScorer` when
    /// `phrase_scorer` reports that nothing can match.
    fn scorer(&self, reader: &SegmentReader, boost: Score) -> crate::Result<Box<dyn Scorer>> {
        let boxed_scorer: Box<dyn Scorer> = match self.phrase_scorer(reader, boost)? {
            Some(phrase_scorer) => Box::new(phrase_scorer),
            None => Box::new(EmptyScorer),
        };
        Ok(boxed_scorer)
    }

    /// Explains the score of `doc` for this regex phrase weight.
    ///
    /// The scorer is built with a boost of `1.0`. When scoring is enabled, the BM25
    /// explanation for the document's fieldnorm id and phrase count is attached as a detail.
    ///
    /// # Errors
    /// Returns a "does not match" error when no phrase scorer can be built for this segment
    /// or when seeking the scorer to `doc` lands on another document. Errors from building
    /// the scorer or reading the fieldnorms are propagated.
    fn explain(&self, reader: &SegmentReader, doc: DocId) -> crate::Result<Explanation> {
        // Bind the scorer directly instead of checking `is_none()` and unwrapping afterwards.
        let mut scorer = match self.phrase_scorer(reader, 1.0)? {
            Some(scorer) => scorer,
            None => return Err(does_not_match(doc)),
        };
        if scorer.seek(doc) != doc {
            return Err(does_not_match(doc));
        }
        let fieldnorm_reader = self.fieldnorm_reader(reader)?;
        let fieldnorm_id = fieldnorm_reader.fieldnorm_id(doc);
        let phrase_count = scorer.phrase_count();
        let mut explanation = Explanation::new("Phrase Scorer", scorer.score());
        if let Some(similarity_weight) = self.similarity_weight_opt.as_ref() {
            explanation.add_detail(similarity_weight.explain(fieldnorm_id, phrase_count));
        }
        Ok(explanation)
    }
}

#[cfg(test)]
mod tests {
    use proptest::prelude::*;
    use rand::seq::SliceRandom;

    use super::super::tests::create_index;
    use crate::docset::TERMINATED;
    use crate::query::{wildcard_query_to_regex_str, EnableScoring, RegexPhraseQuery};
    use crate::DocSet;

    // Property test: documents equal to "aaa ccc" are mixed with random documents, and the
    // regex phrase `a.* c.*` must return exactly the "aaa ccc" documents, in order.
    proptest! {
        #![proptest_config(ProptestConfig::with_cases(50))]
        #[test]
        fn test_phrase_regex_with_random_strings(mut random_strings in proptest::collection::vec("[c-z ]{0,10}", 1..100), num_occurrences in 1..150_usize) {
            let mut rng = rand::rng();

            // Insert "aaa ccc" the specified number of times into the list.
            // The random strings are drawn from `[c-z ]`, so none of them contains an 'a'.
            for _ in 0..num_occurrences {
                random_strings.push("aaa ccc".to_string());
            }
            // Shuffle the list, which now contains random strings and the inserted "aaa ccc"
            random_strings.shuffle(&mut rng);

            // Compute the positions of "aaa ccc" after the shuffle
            let aaa_ccc_positions: Vec<usize> = random_strings
                .iter()
                .enumerate()
                .filter_map(|(idx, s)| if s == "aaa ccc" { Some(idx) } else { None })
                .collect();

            // Create the index with random strings and the fixed string "aaa ccc"
            let index = create_index(&random_strings.iter().map(AsRef::as_ref).collect::<Vec<&str>>())?;
            let schema = index.schema();
            let text_field = schema.get_field("text").unwrap();
            let searcher = index.reader()?.searcher();

            let phrase_query = RegexPhraseQuery::new(text_field, vec![wildcard_query_to_regex_str("a*"), wildcard_query_to_regex_str("c*")]);

            let enable_scoring = EnableScoring::enabled_from_searcher(&searcher);
            let phrase_weight = phrase_query.regex_phrase_weight(enable_scoring).unwrap();
            let mut phrase_scorer = phrase_weight
                .phrase_scorer(searcher.segment_reader(0u32), 1.0)?
                .unwrap();

            // Check that the scorer visits exactly the documents holding "aaa ccc", each with a
            // single phrase match
            for expected_doc in aaa_ccc_positions {
                prop_assert_eq!(phrase_scorer.doc(), expected_doc as u32);
                prop_assert_eq!(phrase_scorer.phrase_count(), 1);
                phrase_scorer.advance();
            }
            // No further document may match once every expected one has been visited
            prop_assert_eq!(phrase_scorer.advance(), TERMINATED);
        }
    }

    /// Literal patterns `a` and `b`: doc 1 matches twice and doc 2 once; doc 0 does not match.
    #[test]
    pub fn test_phrase_count() -> crate::Result<()> {
        let index = create_index(&["a c", "a a b d a b c", " a b"])?;
        let text_field = index.schema().get_field("text").unwrap();
        let searcher = index.reader()?.searcher();
        let patterns: Vec<String> = vec!["a".into(), "b".into()];
        let phrase_query = RegexPhraseQuery::new(text_field, patterns);
        let phrase_weight = phrase_query
            .regex_phrase_weight(EnableScoring::enabled_from_searcher(&searcher))
            .unwrap();
        let mut phrase_scorer = phrase_weight
            .phrase_scorer(searcher.segment_reader(0u32), 1.0)?
            .unwrap();

        // (current doc, phrase count in that doc, doc returned by the following `advance`)
        let expected_steps = [(1, 2, 2), (2, 1, TERMINATED)];
        for &(doc, phrase_count, next_doc) in &expected_steps {
            assert_eq!(phrase_scorer.doc(), doc);
            assert_eq!(phrase_scorer.phrase_count(), phrase_count);
            assert_eq!(phrase_scorer.advance(), next_doc);
        }
        Ok(())
    }

    /// The prefix pattern `a.*` followed by `b`: doc 1 matches twice and doc 2 once, while
    /// docs 0 and 3 do not match.
    #[test]
    pub fn test_phrase_wildcard() -> crate::Result<()> {
        let index = create_index(&["a c", "a aa b d ad b c", " ac b", "bac b"])?;
        let text_field = index.schema().get_field("text").unwrap();
        let searcher = index.reader()?.searcher();
        let patterns: Vec<String> = vec!["a.*".into(), "b".into()];
        let phrase_query = RegexPhraseQuery::new(text_field, patterns);
        let phrase_weight = phrase_query
            .regex_phrase_weight(EnableScoring::enabled_from_searcher(&searcher))
            .unwrap();
        let mut phrase_scorer = phrase_weight
            .phrase_scorer(searcher.segment_reader(0u32), 1.0)?
            .unwrap();

        // (current doc, phrase count in that doc, doc returned by the following `advance`)
        let expected_steps = [(1, 2, 2), (2, 1, TERMINATED)];
        for &(doc, phrase_count, next_doc) in &expected_steps {
            assert_eq!(phrase_scorer.doc(), doc);
            assert_eq!(phrase_scorer.phrase_count(), phrase_count);
            assert_eq!(phrase_scorer.advance(), next_doc);
        }

        Ok(())
    }

    /// The pattern `b?a.*` followed by `b` matches all three docs, with phrase counts
    /// 1, 2 and 1.
    #[test]
    pub fn test_phrase_regex() -> crate::Result<()> {
        let index = create_index(&["ba b", "a aa b d ad b c", "bac b"])?;
        let text_field = index.schema().get_field("text").unwrap();
        let searcher = index.reader()?.searcher();
        let patterns: Vec<String> = vec!["b?a.*".into(), "b".into()];
        let regex_query = RegexPhraseQuery::new(text_field, patterns);
        let regex_weight = regex_query
            .regex_phrase_weight(EnableScoring::enabled_from_searcher(&searcher))
            .unwrap();
        let mut scorer = regex_weight
            .phrase_scorer(searcher.segment_reader(0u32), 1.0)?
            .unwrap();

        // Doc 0: "ba b"
        assert_eq!(scorer.doc(), 0);
        assert_eq!(scorer.phrase_count(), 1);
        // Doc 1: "a aa b d ad b c"
        assert_eq!(scorer.advance(), 1);
        assert_eq!(scorer.phrase_count(), 2);
        // Doc 2: "bac b"
        assert_eq!(scorer.advance(), 2);
        assert_eq!(scorer.doc(), 2);
        assert_eq!(scorer.phrase_count(), 1);
        assert_eq!(scorer.advance(), TERMINATED);

        Ok(())
    }

    /// With `a.*` followed by `c.*` on a single document, a slop of 1 yields one phrase match
    /// and a slop of 2 yields two.
    #[test]
    pub fn test_phrase_regex_with_slop() -> crate::Result<()> {
        let index = create_index(&["aaa bbb ccc ___ abc ddd bbb ccc"])?;
        let text_field = index.schema().get_field("text").unwrap();
        let searcher = index.reader()?.searcher();
        let patterns: Vec<String> = vec!["a.*".into(), "c.*".into()];
        let mut phrase_query = RegexPhraseQuery::new(text_field, patterns);

        // (slop, expected phrase count in doc 0)
        for &(slop, expected_count) in &[(1, 1), (2, 2)] {
            phrase_query.set_slop(slop);
            let enable_scoring = EnableScoring::enabled_from_searcher(&searcher);
            let phrase_weight = phrase_query.regex_phrase_weight(enable_scoring).unwrap();
            let mut phrase_scorer = phrase_weight
                .phrase_scorer(searcher.segment_reader(0u32), 1.0)?
                .unwrap();
            assert_eq!(phrase_scorer.doc(), 0);
            assert_eq!(phrase_scorer.phrase_count(), expected_count);
            assert_eq!(phrase_scorer.advance(), TERMINATED);
        }

        Ok(())
    }

    /// Wildcards on both sides of a character (`*a*`, `*c*`) match terms that contain it
    /// anywhere: the single document "baaab bccccb" matches once.
    #[test]
    pub fn test_phrase_regex_double_wildcard() -> crate::Result<()> {
        let index = create_index(&["baaab bccccb"])?;
        let text_field = index.schema().get_field("text").unwrap();
        let searcher = index.reader()?.searcher();
        let patterns: Vec<String> = ["*a*", "*c*"]
            .iter()
            .map(|wildcard| wildcard_query_to_regex_str(wildcard))
            .collect();
        let phrase_query = RegexPhraseQuery::new(text_field, patterns);
        let phrase_weight = phrase_query
            .regex_phrase_weight(EnableScoring::enabled_from_searcher(&searcher))
            .unwrap();
        let mut phrase_scorer = phrase_weight
            .phrase_scorer(searcher.segment_reader(0u32), 1.0)?
            .unwrap();
        assert_eq!(phrase_scorer.doc(), 0);
        assert_eq!(phrase_scorer.phrase_count(), 1);
        assert_eq!(phrase_scorer.advance(), TERMINATED);
        Ok(())
    }
}


================================================
FILE: src/query/query.rs
================================================
use std::fmt;

use downcast_rs::impl_downcast;

use super::bm25::Bm25StatisticsProvider;
use super::Weight;
use crate::core::searcher::Searcher;
use crate::query::Explanation;
use crate::schema::Schema;
use crate::{DocAddress, Term};

/// Argument used in `Query::weight(..)`
///
/// It tells the query whether scores have to be computed, and carries the
/// context (searcher, schema, statistics) available for building the weight.
#[derive(Copy, Clone)]
pub enum EnableScoring<'a> {
    /// Pass this to enable scoring.
    Enabled {
        /// The searcher to use during scoring.
        searcher: &'a Searcher,

        /// A [Bm25StatisticsProvider] used to compute BM25 scores.
        ///
        /// Normally this should be the [Searcher], but you can specify a custom
        /// one to adjust the statistics.
        statistics_provider: &'a dyn Bm25StatisticsProvider,
    },
    /// Pass this to disable scoring.
    /// This can improve performance.
    Disabled {
        /// Schema is required.
        schema: &'a Schema,
        /// Searcher should be provided if available.
        ///
        /// It is `None` when the value was built from a schema alone.
        searcher_opt: Option<&'a Searcher>,
    },
}

impl<'a> EnableScoring<'a> {
    /// Enables scoring, using the [Searcher] both as searcher and as the
    /// source of BM25 statistics.
    pub fn enabled_from_searcher(searcher: &'a Searcher) -> EnableScoring<'a> {
        Self::Enabled {
            searcher,
            statistics_provider: searcher,
        }
    }

    /// Enables scoring with BM25 statistics coming from a custom
    /// [Bm25StatisticsProvider] rather than from the searcher.
    pub fn enabled_from_statistics_provider(
        statistics_provider: &'a dyn Bm25StatisticsProvider,
        searcher: &'a Searcher,
    ) -> EnableScoring<'a> {
        Self::Enabled {
            searcher,
            statistics_provider,
        }
    }

    /// Disables scoring while keeping the [Searcher] (and its schema) available.
    pub fn disabled_from_searcher(searcher: &'a Searcher) -> EnableScoring<'a> {
        let schema = searcher.schema();
        Self::Disabled {
            schema,
            searcher_opt: Some(searcher),
        }
    }

    /// Disables scoring when only a [Schema] is at hand (no searcher).
    pub fn disabled_from_schema(schema: &'a Schema) -> EnableScoring<'a> {
        EnableScoring::Disabled {
            schema,
            searcher_opt: None,
        }
    }

    /// Returns the searcher if available.
    ///
    /// This is `None` only for a value created with
    /// [`EnableScoring::disabled_from_schema`].
    pub fn searcher(&self) -> Option<&Searcher> {
        // All fields are plain references, so they can be copied out of `*self`.
        match *self {
            EnableScoring::Disabled { searcher_opt, .. } => searcher_opt,
            EnableScoring::Enabled { searcher, .. } => Some(searcher),
        }
    }

    /// Returns the schema, taken from the searcher when scoring is enabled.
    pub fn schema(&self) -> &Schema {
        match *self {
            EnableScoring::Disabled { schema, .. } => schema,
            EnableScoring::Enabled { searcher, .. } => searcher.schema(),
        }
    }

    /// Returns true if the scoring is enabled.
    pub fn is_scoring_enabled(&self) -> bool {
        match self {
            EnableScoring::Enabled { .. } => true,
            EnableScoring::Disabled { .. } => false,
        }
    }
}

/// The `Query` trait defines a set of documents and a scoring method
/// for those documents.
///
/// The `Query` trait is in charge of defining :
///
/// - a set of documents
/// - a way to score these documents
///
/// When performing a [search](Searcher::search), these documents are
/// pushed to a [`Collector`](crate::collector::Collector),
/// which is in turn in charge of deciding what to do with them.
///
/// Concretely, this scored docset is represented by the
/// [`Scorer`] trait.
///
/// Because the index is split into segments, the query does not directly
/// create a [`DocSet`](crate::DocSet) object.
/// Instead, the query creates a [`Weight`] object for a given searcher.
///
/// The weight object, in turn, makes it possible to create
/// a scorer for a specific [`SegmentReader`].
///
/// So to sum it up :
/// - a `Query` is a recipe to define a set of documents as well as the way to score them.
/// - a [`Weight`] is this recipe tied to a specific [`Searcher`]. It may for instance hold
///   statistics about the different terms of the query. It is created by the query.
/// - a [`Scorer`] is a cursor over the set of matching documents, for a specific [`SegmentReader`].
///   It is created by the [`Weight`].
///
/// When implementing a new type of `Query`, it is normal to implement a
/// dedicated `Query`, [`Weight`] and [`Scorer`].
///
/// [`Scorer`]: crate::query::Scorer
/// [`SegmentReader`]: crate::SegmentReader
pub trait Query: QueryClone + Send + Sync + downcast_rs::Downcast + fmt::Debug {
    /// Create the weight associated with a query.
    ///
    /// If scoring is not required, passing an [`EnableScoring::Disabled`]
    /// value can improve performance.
    ///
    /// See [`Weight`].
    fn weight(&self, enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>>;

    /// Returns an `Explanation` for the score of the document.
    ///
    /// The default implementation builds a scoring-enabled weight and asks it
    /// to explain the document within its segment.
    fn explain(&self, searcher: &Searcher, doc_address: DocAddress) -> crate::Result<Explanation> {
        let scoring = EnableScoring::enabled_from_searcher(searcher);
        let weight = self.weight(scoring)?;
        weight.explain(
            searcher.segment_reader(doc_address.segment_ord),
            doc_address.doc_id,
        )
    }

    /// Returns the number of documents matching the query.
    ///
    /// The default implementation builds a weight with scoring disabled and
    /// adds up the per-segment counts, stopping at the first error.
    fn count(&self, searcher: &Searcher) -> crate::Result<usize> {
        let weight = self.weight(EnableScoring::disabled_from_searcher(searcher))?;
        searcher
            .segment_readers()
            .iter()
            .map(|segment_reader| weight.count(segment_reader).map(|hits| hits as usize))
            .sum::<crate::Result<usize>>()
    }

    /// Extract all of the terms associated with the query and pass them to the
    /// given closure.
    ///
    /// Each term is associated with a boolean indicating whether
    /// positions are required or not.
    ///
    /// Note that there can be multiple instances of any given term
    /// in a query and deduplication must be handled by the visitor.
    ///
    /// The default implementation visits nothing.
    fn query_terms<'a>(&'a self, _visitor: &mut dyn FnMut(&'a Term, bool)) {}
}

/// Implements `box_clone`.
///
/// This is a supertrait of [`Query`], which makes cloning available on
/// `dyn Query` trait objects. A blanket implementation covers every
/// `'static + Query + Clone` type.
pub trait QueryClone {
    /// Returns a boxed clone of `self`.
    fn box_clone(&self) -> Box<dyn Query>;
}

/// Blanket implementation: any clonable `'static` query can be cloned into a box.
impl<T> QueryClone for T
where T: 'static + Query + Clone
{
    fn box_clone(&self) -> Box<dyn Query> {
        let duplicate: T = self.clone();
        Box::new(duplicate)
    }
}

impl Query for Box<dyn Query> {
    fn weight(&self, enabled_scoring: EnableScoring) -> crate::Result<Box<dyn Weight>> {
        self.as_ref().weight(enabled_scoring)
    }

    fn count(&self, searcher: &Searcher) -> crate::Result<usize> {
        self.as_ref().count(searcher)
    }

    fn query_terms<'a>(&'a self, visitor: &mut dyn FnMut(&'a Term, bool)) {
        self.as_ref().query_terms(visitor);
    }
}

/// Cloning a boxed query clones the query it holds.
impl QueryClone for Box<dyn Query> {
    fn box_clone(&self) -> Box<dyn Query> {
        // Go through the trait object itself rather than through the box.
        let inner: &dyn Query = &**self;
        inner.box_clone()
    }
}

// Expands `downcast_rs::impl_downcast!` for `Query`, which declares
// `downcast_rs::Downcast` as a supertrait.
// NOTE(review): presumably this is what lets callers downcast a `dyn Query`
// to a concrete query type — confirm against the downcast-rs documentation.
impl_downcast!(Query);


================================================
FILE: src/query/query_parser/logical_ast.rs
================================================
use std::fmt;
use std::ops::Bound;
use std::sync::Arc;

use tantivy_fst::Regex;

use crate::query::Occur;
use crate::schema::{Field, Term};
use crate::Score;

/// A leaf of the [`LogicalAst`]: one elementary search condition.
#[derive(Clone)]
pub enum LogicalLiteral {
    /// A single term.
    Term(Term),
    /// A sequence of terms.
    Phrase {
        /// The terms of the phrase, each paired with a `usize`.
        // NOTE(review): the `usize` is presumably the position offset of the term within the
        // phrase — confirm where the phrase is built.
        terms: Vec<(usize, Term)>,
        /// Slop of the phrase; displayed as `~slop` when greater than zero.
        slop: u32,
        /// Whether this is a phrase-prefix literal; displayed as a trailing `*`.
        prefix: bool,
    },
    /// A range of terms delimited by a lower and an upper bound.
    Range {
        /// Lower bound of the range.
        lower: Bound<Term>,
        /// Upper bound of the range.
        upper: Bound<Term>,
    },
    /// A set of terms; displayed as `IN [...]`.
    Set {
        /// The terms of the set.
        elements: Vec<Term>,
    },
    /// The "all" literal; displayed as `*`.
    All,
    /// A regular expression applied to a field.
    Regex {
        /// The compiled pattern.
        pattern: Arc<Regex>,
        /// The field the pattern applies to.
        field: Field,
    },
}

/// Tree form of a query, made of boolean clauses, boosts and literals.
pub enum LogicalAst {
    /// A list of sub-trees, each tagged with its [`Occur`].
    Clause(Vec<(Occur, LogicalAst)>),
    /// A single literal.
    Leaf(Box<LogicalLiteral>),
    /// A sub-tree together with a boost factor; displayed as `ast^boost`.
    Boost(Box<LogicalAst>, Score),
}

impl LogicalAst {
    /// Wraps `self` into a [`LogicalAst::Boost`] node.
    ///
    /// A boost within `Score::EPSILON` of `1.0` is a no-op: `self` is returned
    /// unchanged.
    pub fn boost(self, boost: Score) -> LogicalAst {
        let distance_from_neutral = (boost - 1.0).abs();
        if distance_from_neutral < Score::EPSILON {
            return self;
        }
        LogicalAst::Boost(Box::new(self), boost)
    }

    // TODO: Move to rewrite_ast in query_grammar
    /// Flattens nested clauses.
    ///
    /// Children are simplified first. A child clause is then merged into its
    /// parent when it is attached with `Should` or `Must` and all of its own
    /// entries carry that same `Occur`. Leaves and boosts are returned as is.
    pub fn simplify(self) -> LogicalAst {
        let clauses = match self {
            LogicalAst::Clause(clauses) => clauses,
            untouched @ (LogicalAst::Leaf(_) | LogicalAst::Boost(_, _)) => return untouched,
        };

        let mut flattened: Vec<(Occur, LogicalAst)> = Vec::new();
        for (occur, child) in clauses {
            match child.simplify() {
                // Same `Occur` on both levels: the nested entries can be pulled up.
                LogicalAst::Clause(grandchildren)
                    if matches!(occur, Occur::Should | Occur::Must)
                        && grandchildren.iter().all(|(inner, _)| *inner == occur) =>
                {
                    flattened.extend(grandchildren);
                }
                simplified_child => flattened.push((occur, simplified_child)),
            }
        }
        LogicalAst::Clause(flattened)
    }
}

/// Prefix used when displaying a clause entry: `+` for `Must`, `-` for
/// `MustNot`, and nothing for `Should`.
fn occur_letter(occur: Occur) -> &'static str {
    match occur {
        Occur::Should => "",
        Occur::Must => "+",
        Occur::MustNot => "-",
    }
}

/// Compact, query-like rendering of the tree.
///
/// Clauses are parenthesized and space separated, each entry prefixed by its
/// occur letter; an empty clause is rendered as `<emptyclause>`.
impl fmt::Debug for LogicalAst {
    fn fmt(&self, formatter: &mut fmt::Formatter<'_>) -> Result<(), fmt::Error> {
        match self {
            LogicalAst::Leaf(literal) => write!(formatter, "{literal:?}"),
            LogicalAst::Boost(ast, boost) => write!(formatter, "{ast:?}^{boost}"),
            LogicalAst::Clause(clause) => match clause.split_first() {
                None => write!(formatter, "<emptyclause>"),
                Some(((occur, subquery), remaining)) => {
                    // The first entry opens the parenthesis, the others are space prefixed.
                    write!(formatter, "({}{subquery:?}", occur_letter(*occur))?;
                    for (occur, subquery) in remaining {
                        write!(formatter, " {}{subquery:?}", occur_letter(*occur))?;
                    }
                    formatter.write_str(")")
                }
            },
        }
    }
}

/// A literal converts into a tree made of a single leaf.
impl From<LogicalLiteral> for LogicalAst {
    fn from(literal: LogicalLiteral) -> LogicalAst {
        let boxed_literal = Box::new(literal);
        LogicalAst::Leaf(boxed_literal)
    }
}

/// Compact, query-like rendering of a literal.
impl fmt::Debug for LogicalLiteral {
    fn fmt(&self, formatter: &mut fmt::Formatter<'_>) -> Result<(), fmt::Error> {
        match self {
            LogicalLiteral::All => write!(formatter, "*"),
            LogicalLiteral::Term(term) => write!(formatter, "{term:?}"),
            LogicalLiteral::Regex { pattern, field } => {
                write!(formatter, "Regex({field:?}, {pattern:?})")
            }
            LogicalLiteral::Range { lower, upper } => {
                write!(formatter, "({lower:?} TO {upper:?})")
            }
            LogicalLiteral::Phrase {
                terms,
                slop,
                prefix,
            } => {
                write!(formatter, "\"{terms:?}\"")?;
                // A non-zero slop takes precedence over the prefix marker.
                if *slop > 0 {
                    return write!(formatter, "~{slop:?}");
                }
                if *prefix {
                    return write!(formatter, "*");
                }
                Ok(())
            }
            LogicalLiteral::Set { elements } => {
                const MAX_DISPLAYED: usize = 10;
                // Index of the last element that gets printed before eliding the rest.
                const LAST_DISPLAYED: usize = MAX_DISPLAYED - 1;

                write!(formatter, "IN [")?;
                for (i, element) in elements.iter().enumerate() {
                    match i {
                        0 => write!(formatter, "{element:?}")?,
                        LAST_DISPLAYED => {
                            write!(
                                formatter,
                                ", {element:?}, ... ({} more)",
                                elements.len() - i - 1
                            )?;
                            break;
                        }
                        _ => write!(formatter, ", {element:?}")?,
                    }
                }
                write!(formatter, "]")
            }
        }
    }
}


================================================
FILE: src/query/query_parser/mod.rs
================================================
mod query_parser;

pub mod logical_ast;
pub use self::query_parser::{QueryParser, QueryParserError};


================================================
FILE: src/query/query_parser/query_parser.rs
================================================
use std::net::{AddrParseError, IpAddr};
use std::num::{ParseFloatError, ParseIntError};
use std::ops::Bound;
use std::str::{FromStr, ParseBoolError};
use std::sync::Arc;

use base64::engine::general_purpose::STANDARD as BASE64;
use base64::Engine;
use itertools::Itertools;
use query_grammar::{UserInputAst, UserInputBound, UserInputLeaf, UserInputLiteral};
use rustc_hash::FxHashMap;
use tantivy_fst::Regex;

use super::logical_ast::*;
use crate::index::Index;
use crate::json_utils::convert_to_fast_value_and_append_to_json_term;
use crate::query::range_query::{is_type_valid_for_fastfield_range_query, RangeQuery};
use crate::query::{
    AllQuery, BooleanQuery, BoostQuery, EmptyQuery, FuzzyTermQuery, Occur, PhrasePrefixQuery,
    PhraseQuery, Query, RegexQuery, TermQuery, TermSetQuery,
};
use crate::schema::{
    Facet, FacetParseError, Field, FieldType, IndexRecordOption, IntoIpv6Addr, JsonObjectOptions,
    Schema, Term, TextFieldIndexing, Type,
};
use crate::time::format_description::well_known::Rfc3339;
use crate::time::OffsetDateTime;
use crate::tokenizer::{TextAnalyzer, TokenizerManager};
use crate::{DateTime, Score};

/// Possible error that may happen when parsing a query.
#[derive(Debug, PartialEq, Eq, Error)]
pub enum QueryParserError {
    /// Error in the query syntax
    #[error("Syntax Error: {0}")]
    SyntaxError(String),
    /// This query is unsupported.
    #[error("Unsupported query: {0}")]
    UnsupportedQuery(String),
    /// The query references a field that is not in the schema
    #[error("Field does not exist: '{0}'")]
    FieldDoesNotExist(String),
    /// The query contains a term for a `u64` or `i64`-field, but the value
    /// is neither.
    #[error("Expected a valid integer: '{0:?}'")]
    ExpectedInt(#[from] ParseIntError),
    /// The query contains a term for a bytes field, but the value is not valid
    /// base64.
    #[error("Expected base64: '{0:?}'")]
    ExpectedBase64(#[from] base64::DecodeError),
    /// The query contains a term for a `f64`-field, but the value
    /// is not a f64.
    #[error("Invalid query: Only excluding terms given")]
    ExpectedFloat(#[from] ParseFloatError),
    /// The query contains a term for a bool field, but the value
    /// is not a bool.
    #[error("Expected a bool value: '{0:?}'")]
    ExpectedBool(#[from] ParseBoolError),
    /// It is forbidden queries that are only "excluding". (e.g. -title:pop)
    #[error("Invalid query: Only excluding terms given")]
    AllButQueryForbidden,
    /// If no default field is declared, running a query without any
    /// field specified is forbidden.
    #[error("No default field declared and no field specified in query")]
    NoDefaultFieldDeclared,
    /// The field searched for is not declared
    /// as indexed in the schema.
    #[error("The field '{0}' is not declared as indexed")]
    FieldNotIndexed(String),
    /// A phrase query was requested for a field that does not
    /// have any positions indexed.
    #[error("The field '{0}' does not have positions indexed")]
    FieldDoesNotHavePositionsIndexed(String),
    /// A phrase-prefix query requires at least two terms
    #[error(
        "The phrase '{phrase:?}' does not produce at least two terms using the tokenizer \
         '{tokenizer:?}'"
    )]
    PhrasePrefixRequiresAtLeastTwoTerms {
        /// The phrase which triggered the issue
        phrase: String,
        /// The tokenizer configured for the field
        tokenizer: String,
    },
    /// The tokenizer for the given field is unknown
    /// The two argument strings are the name of the field, the name of the tokenizer
    #[error("The tokenizer '{tokenizer:?}' for the field '{field:?}' is unknown")]
    UnknownTokenizer {
        /// The name of the tokenizer
        tokenizer: String,
        /// The field name
        field: String,
    },
    /// The query contains a range query with a phrase as one of the bounds.
    /// Only terms can be used as bounds.
    #[error("A range query cannot have a phrase as one of the bounds")]
    RangeMustNotHavePhrase,
    /// The format for the date field is not RFC 3339 compliant.
    #[error("The date field has an invalid format")]
    DateFormatError(#[from] time::error::Parse),
    /// The format for the facet field is invalid.
    #[error("The facet field is malformed: {0}")]
    FacetFormatError(#[from] FacetParseError),
    /// The format for the ip field is invalid.
    #[error("The ip field is malformed: {0}")]
    IpFormatError(#[from] AddrParseError),
}

/// Recursively removes empty clauses from the AST.
///
/// Returns `None` if and only if the `logical_ast` ended up being empty.
/// Leaves and boosts are never trimmed.
fn trim_ast(logical_ast: LogicalAst) -> Option<LogicalAst> {
    match logical_ast {
        LogicalAst::Clause(children) => {
            // Keep only the children that still hold something once trimmed.
            let kept: Vec<_> = children
                .into_iter()
                .filter_map(|(occur, child)| Some((occur, trim_ast(child)?)))
                .collect();
            (!kept.is_empty()).then(|| LogicalAst::Clause(kept))
        }
        other => Some(other),
    }
}

/// Tantivy's Query parser
///
/// The language covered by the current parser is extremely simple.
///
/// * simple terms: e.g. `Barack Obama` will be seen as a sequence of two tokens Barack and Obama.
///   By default, the query parser will interpret this as a disjunction (see
///   `.set_conjunction_by_default()`) and will match all documents that contain either "Barack" or
///   "Obama" or both. Since we did not target a specific field, the query parser will look into the
///   so-called default fields (as set up in the constructor).
///
///   Assuming that the default fields are `body` and `title`, and the query parser is set with
///   conjunction as a default, our query will be interpreted as
///   `(body:Barack OR title:Barack) AND (title:Obama OR body:Obama)`.
///   By default, all tokenized and indexed fields are default fields.
///
///   It is possible to explicitly target a field by prefixing the text by the `fieldname:`.
///   Note this only applies to the term directly following.
///   For instance, assuming the query parser is configured to use conjunction by default,
///   `body:Barack Obama` is not interpreted as `body:Barack AND body:Obama` but as
///   `body:Barack AND (body:Obama OR title:Obama)`.
///
/// * boolean operators `AND`, `OR`. `AND` takes precedence over `OR`, so that `a AND b OR c` is
///   interpreted as `(a AND b) OR c`.
///
/// * In addition to the boolean operators, the `-` and `+` prefixes are available. These
///   operators are sufficient to express all queries using boolean operators. For instance
///   `x AND y OR z` can be written (`(+x +y) z`). In addition, these operators can help define
///   "required optional" queries. `(+x y)` matches the same document set as simply `x`, but `y`
///   will help refine the score.
///
/// * negative terms: By prepending a term by a `-`, a term can be excluded from the search. This is
///   useful for disambiguating a query. e.g. `apple -fruit`
///
/// * must terms: By prepending a term by a `+`, a term can be made required for the search.
///
/// * phrase terms: Quoted terms become phrase searches on fields that have positions indexed. e.g.,
///   `title:"Barack Obama"` will only find documents that have "barack" immediately followed by
///   "obama". Single quotes can also be used. If the text to be searched contains quotation marks,
///   it is possible to escape them with a `\`.
///
/// * range terms: Range searches can be done by specifying the start and end bound. These can be
///   inclusive or exclusive. e.g., `title:[a TO c}` will find all documents whose title contains a
///   word lexicographically between `a` and `c` (inclusive lower bound, exclusive upper bound).
///   Inclusive bounds are `[]`, exclusive are `{}`.
///
/// * set terms: Using the `IN` operator, a field can be matched against a set of literals, e.g.
///   `title: IN [a b cd]` will match documents where `title` is either `a`, `b` or `cd`, but do so
///   more efficiently than the alternative query `title:a OR title:b OR title:cd` does.
///
/// * date values: The query parser supports rfc3339 formatted dates. For example
///   `"2002-10-02T15:00:00.05Z"` or `some_date_field:[2002-10-02T15:00:00Z TO
///   2002-10-02T18:00:00Z}`
///
/// * all docs query: A plain `*` will match all documents in the index.
///
/// Parts of the queries can be boosted by appending `^boostfactor`.
/// For instance, `"SRE"^2.0 OR devops^0.4` will favor documents containing `SRE` over documents
/// containing `devops`. Negative boosts are not allowed.
///
/// It is also possible to define a boost for a specific field, at the query parser level.
/// (See [`set_field_boost(...)`](QueryParser::set_field_boost)). Typically you may want to boost a
/// title field.
///
/// Additionally, specific fields can be marked to use fuzzy term queries for each literal
/// via the [`QueryParser::set_field_fuzzy`] method.
///
/// Phrase terms support the `~` slop operator which allows setting the phrase's matching
/// distance in words. `"big wolf"~1` will return documents containing the phrase `"big bad wolf"`.
///
/// Phrase terms also support the `*` prefix operator which switches the phrase's matching
/// to consider all documents which contain the last term as a prefix, e.g. `"big bad wo"*` will
/// match `"big bad wolf"`.
#[derive(Clone)]
pub struct QueryParser {
    schema: Schema,
    default_fields: Vec<Field>,
    conjunction_by_default: bool,
    tokenizer_manager: TokenizerManager,
    boost: FxHashMap<Field, Score>,
    fuzzy: FxHashMap<Field, Fuzzy>,
    regexes_allowed: bool,
}

/// Fuzzy matching parameters recorded for one field by
/// [`QueryParser::set_field_fuzzy`].
///
/// See [`FuzzyTermQuery::new`] and [`FuzzyTermQuery::new_prefix`] for the
/// meaning of the individual parameters.
#[derive(Clone)]
struct Fuzzy {
    // NOTE(review): presumably selects `FuzzyTermQuery::new_prefix` over
    // `FuzzyTermQuery::new` — confirm at the use site.
    prefix: bool,
    // NOTE(review): presumably the maximum edit distance — confirm at the use site.
    distance: u8,
    transpose_cost_one: bool,
}

/// Tells whether `ast` only excludes documents.
///
/// A leaf is never negative, a boost is as negative as the tree it wraps, and
/// a clause is negative when each entry is either `MustNot` or itself
/// negative. Note that an empty clause is therefore reported as negative.
fn all_negative(ast: &LogicalAst) -> bool {
    match ast {
        LogicalAst::Clause(children) => {
            let has_positive_entry = children
                .iter()
                .any(|(occur, child)| *occur != Occur::MustNot && !all_negative(child));
            !has_positive_entry
        }
        LogicalAst::Boost(boosted, _) => all_negative(boosted),
        LogicalAst::Leaf(_) => false,
    }
}

// Turns an all-negative ast into a regular one by adding a `Should` "all" literal
// to its clause (looking through boosts). Must not be used on an already okay ast.
fn make_non_negative(ast: &mut LogicalAst) {
    match ast {
        LogicalAst::Clause(children) => {
            let match_all: LogicalAst = LogicalLiteral::All.into();
            children.push((Occur::Should, match_all));
        }
        LogicalAst::Boost(boosted, _) => make_non_negative(boosted),
        LogicalAst::Leaf(_) => {}
    }
}

/// Counterpart of the try/? operator for functions returning `(Option<T>, Vec<Error>)`:
/// evaluates to the `Ok` value, or returns `(None, vec![error])` from the enclosing
/// function, converting the error with `Into`.
macro_rules! try_tuple {
    ($fallible:expr) => {{
        match $fallible {
            Err(failure) => return (None, vec![failure.into()]),
            Ok(success) => success,
        }
    }};
}

impl QueryParser {
    /// Creates a `QueryParser`, given
    /// * schema - index Schema
    /// * default_fields - fields used to search if no field is specifically defined in the query.
    pub fn new(
        schema: Schema,
        default_fields: Vec<Field>,
        tokenizer_manager: TokenizerManager,
    ) -> QueryParser {
        QueryParser {
            schema,
            default_fields,
            tokenizer_manager,
            conjunction_by_default: false,
            boost: Default::default(),
            fuzzy: Default::default(),
            regexes_allowed: false,
        }
    }

    // Splits a full_path as written in a query, into a field name and a
    // json path.
    //
    // This simply delegates to `Schema::find_field`.
    // NOTE(review): presumably `None` means that no field of the schema matches
    // `full_path` — confirm against `Schema::find_field`.
    pub(crate) fn split_full_path<'a>(&self, full_path: &'a str) -> Option<(Field, &'a str)> {
        self.schema.find_field(full_path)
    }

    /// Creates a `QueryParser`, given
    ///  * an index
    ///  * a set of default fields used to search if no field is specifically defined in the query.
    ///
    /// The schema and a clone of the tokenizer manager are taken from the index.
    pub fn for_index(index: &Index, default_fields: Vec<Field>) -> QueryParser {
        let schema = index.schema();
        let tokenizer_manager = index.tokenizers().clone();
        QueryParser::new(schema, default_fields, tokenizer_manager)
    }

    /// Set the default way to compose queries to a conjunction.
    ///
    /// By default, the query `happy tax payer` is equivalent to the query
    /// `happy OR tax OR payer`. After calling `.set_conjunction_by_default()`
    /// `happy tax payer` will be interpreted by the parser as `happy AND tax AND payer`.
    ///
    /// A parser created with [`QueryParser::new`] starts in disjunction mode.
    pub fn set_conjunction_by_default(&mut self) {
        self.conjunction_by_default = true;
    }

    /// Sets a boost for a specific field.
    ///
    /// The parsed query will automatically boost this field.
    ///
    /// If the query defines a query boost through the query language (e.g: `country:France^3.0`),
    /// the two boosts (the one defined in the query, and the one defined in the `QueryParser`)
    /// are multiplied together.
    ///
    /// Setting a boost again for the same field replaces the previous value.
    pub fn set_field_boost(&mut self, field: Field, boost: Score) {
        self.boost.insert(field, boost);
    }

    /// Sets the given [field][`Field`] to use [fuzzy term queries][`FuzzyTermQuery`]
    ///
    /// If set, the parser will produce queries using fuzzy term queries
    /// with the given parameters for each literal matched against the given field.
    /// Calling this again for the same field replaces its previous settings.
    ///
    /// See the [`FuzzyTermQuery::new`] and [`FuzzyTermQuery::new_prefix`] methods
    /// for the meaning of the individual parameters.
    pub fn set_field_fuzzy(
        &mut self,
        field: Field,
        prefix: bool,
        distance: u8,
        transpose_cost_one: bool,
    ) {
        let settings = Fuzzy {
            prefix,
            distance,
            transpose_cost_one,
        };
        self.fuzzy.insert(field, settings);
    }

    /// Allow regexes in queries
    ///
    /// Regexes are disallowed on a parser freshly created with [`QueryParser::new`].
    pub fn allow_regexes(&mut self) {
        self.regexes_allowed = true;
    }

    /// Parse a query
    ///
    /// Note that `parse_query` returns an error if the input
    /// is not a valid query. See [`QueryParser::parse_query_lenient`] for a
    /// best-effort variant.
    pub fn parse_query(&self, query: &str) -> Result<Box<dyn Query>, QueryParserError> {
        self.parse_query_to_logical_ast(query)
            .map(|logical_ast| convert_to_query(&self.fuzzy, logical_ast))
    }

    /// Parse a query leniently
    ///
    /// This variant parses an invalid query on a best-effort basis. If some part of the query
    /// can't reasonably be executed (range query without field, searching on a non-existing
    /// field, searching without specifying a field when no default field is provided...), it may
    /// get turned into a "match-nothing" subquery.
    ///
    /// The issues encountered along the way are reported as a Vec of errors.
    pub fn parse_query_lenient(&self, query: &str) -> (Box<dyn Query>, Vec<QueryParserError>) {
        let (logical_ast, errors) = self.parse_query_to_logical_ast_lenient(query);
        let parsed_query = convert_to_query(&self.fuzzy, logical_ast);
        (parsed_query, errors)
    }

    /// Build a query from an already parsed user input AST
    ///
    /// This can be useful if the user input AST parsed using [`query_grammar`]
    /// needs to be inspected before the query is re-interpreted w.r.t.
    /// index specifics like field names and tokenizers.
    ///
    /// If any error was found, the first one is returned and no query is built.
    pub fn build_query_from_user_input_ast(
        &self,
        user_input_ast: UserInputAst,
    ) -> Result<Box<dyn Query>, QueryParserError> {
        let (logical_ast, errors) = self.compute_logical_ast_lenient(user_input_ast);
        match errors.into_iter().next() {
            Some(first_error) => Err(first_error),
            None => Ok(convert_to_query(&self.fuzzy, logical_ast)),
        }
    }

    /// Leniently build a query from an already parsed user input AST.
    ///
    /// The query is always built; the errors found on the way are returned next to it.
    ///
    /// See also [`QueryParser::build_query_from_user_input_ast`]
    pub fn build_query_from_user_input_ast_lenient(
        &self,
        user_input_ast: UserInputAst,
    ) -> (Box<dyn Query>, Vec<QueryParserError>) {
        let (logical_ast, errors) = self.compute_logical_ast_lenient(user_input_ast);
        let built_query = convert_to_query(&self.fuzzy, logical_ast);
        (built_query, errors)
    }

    /// Parse the user query into a simplified AST.
    ///
    /// A query rejected by the grammar yields a `SyntaxError` carrying the whole
    /// query string. Otherwise the first error found while computing the logical
    /// AST, if any, is returned.
    fn parse_query_to_logical_ast(&self, query: &str) -> Result<LogicalAst, QueryParserError> {
        let user_input_ast = query_grammar::parse_query(query)
            .map_err(|_| QueryParserError::SyntaxError(query.to_string()))?;
        let (ast, errors) = self.compute_logical_ast_lenient(user_input_ast);
        match errors.into_iter().next() {
            Some(first_error) => Err(first_error),
            None => Ok(ast.simplify()),
        }
    }

    /// Leniently parse the user query into an AST.
    ///
    /// The returned errors list the grammar errors first (as `SyntaxError`s
    /// mentioning their position), followed by the errors found while
    /// computing the logical AST.
    fn parse_query_to_logical_ast_lenient(
        &self,
        query: &str,
    ) -> (LogicalAst, Vec<QueryParserError>) {
        let (user_input_ast, syntax_errors) = query_grammar::parse_query_lenient(query);

        let mut errors: Vec<QueryParserError> = Vec::new();
        for error in syntax_errors {
            let message = format!("{} at position {}", error.message, error.pos);
            errors.push(QueryParserError::SyntaxError(message));
        }

        let (ast, ast_errors) = self.compute_logical_ast_lenient(user_input_ast);
        errors.extend(ast_errors);
        (ast, errors)
    }

    /// Computes the logical AST of a user input AST, collecting errors instead of failing.
    ///
    /// A non-empty AST that only excludes documents is reported with
    /// `AllButQueryForbidden` and then patched with `make_non_negative`.
    fn compute_logical_ast_lenient(
        &self,
        user_input_ast: UserInputAst,
    ) -> (LogicalAst, Vec<QueryParserError>) {
        let (mut ast, mut errors) = self.compute_logical_ast_with_occur_lenient(user_input_ast);

        // An empty clause would count as "all negative", but it is left untouched.
        let is_empty_clause = matches!(&ast, LogicalAst::Clause(children) if children.is_empty());
        if !is_empty_clause && all_negative(&ast) {
            errors.push(QueryParserError::AllButQueryForbidden);
            make_non_negative(&mut ast);
        }
        (ast, errors)
    }

    fn compute_boundary_term(
        &self,
        field: Field,
        json_path: &str,
        phrase: &str,
    ) -> Result<Term, QueryParserError> {
        let field_entry = self.schema.get_field_entry(field);
        let field_type = field_entry.field_type();
        let field_supports_ff_range_queries = field_type.is_fast()
            && is_type_valid_for_fastfield_range_query(field_type.value_type());

        if !field_type.is_indexed() && !field_supports_ff_range_queries {
            return Err(QueryParserError::FieldNotIndexed(
                field_entry.name().to_string(),
            ));
        }
        if !json_path.is_empty() && field_type.value_type() != Type::Json {
            return Err(QueryParserError::UnsupportedQuery(format!(
                "Json path is not supported for field {:?}",
                field_entry.name()
            )));
        }
        match *field_type {
            FieldType::U64(_) => {
                let val: u64 = u64::from_str(phrase)?;
                Ok(Term::from_field_u64(field, val))
            }
            FieldType::I64(_) => {
                let val: i64 = i64::from_str(phrase)?;
                Ok(Term::from_field_i64(field, val))
            }
            FieldType::F64(_) => {
                let val: f64 = f64::from_str(phrase)?;
                Ok(Term::from_field_f64(field, val))
            }
            FieldType::Bool(_) => {
                let val: bool = bool::from_str(phrase)?;
                Ok(Term::from_field_bool(field, val))
            }
            FieldType::Date(_) => {
                let dt = OffsetDateTime::parse(phrase, &Rfc3339)?;
                Ok(Term::from_field_date(field, DateTime::from_utc(dt)))
            }
            FieldType::Str(ref str_options) => {
                let option = str_options.get_indexing_options().ok_or_else(|| {
                    // This should have been seen earlier really.
                    QueryParserError::FieldNotIndexed(field_entry.name().to_string())
                })?;
                let mut text_analyzer =
                    self.tokenizer_manager
                        .get(option.tokenizer())
                        .ok_or_else(|| QueryParserError::UnknownTokenizer {
                            field: field_entry.name().to_string(),
                            tokenizer: option.tokenizer().to_string(),
                        })?;
                let mut terms: Vec<Term> = Vec::new();
                let mut token_stream = text_analyzer.token_stream(phrase);
                token_stream.process(&mut |token| {
                    let term = Term::from_field_text(field, &token.text);
                    terms.push(term);
                });
                if terms.len() != 1 {
                    return Err(QueryParserError::UnsupportedQuery(format!(
                        "Range query boundary cannot have multiple tokens: {phrase:?} [{terms:?}]."
                    )));
                }
                Ok(terms.into_iter().next().unwrap())
            }
            FieldType::JsonObject(ref json_options) => {
                let mut term = Term::from_field_json_path(
                    field,
                    json_path,
                    json_options.is_expand_dots_enabled(),
                );
                if let Some(term) =
                    // Try to convert the phrase to a fast value
                    convert_to_fast_value_and_append_to_json_term(&term, phrase, false)
                {
                    Ok(term)
                } else {
                    term.append_type_and_str(phrase);
                    Ok(term)
                }
            }
            FieldType::Facet(_) => match Facet::from_text(phrase) {
                Ok(facet) => Ok(Term::from_facet(field, &facet)),
                Err(e) => Err(QueryParserError::from(e)),
            },
            FieldType::Bytes(_) => {
                let bytes = BASE64
                    .decode(phrase)
                    .map_err(QueryParserError::ExpectedBase64)?;
                Ok(Term::from_field_bytes(field, &bytes))
            }
            FieldType::IpAddr(_) => {
                let ip_v6 = IpAddr::from_str(phrase)?.into_ipv6_addr();
                Ok(Term::from_field_ip_addr(field, ip_v6))
            }
        }
    }

    fn compute_logical_ast_for_leaf(
        &self,
        field: Field,
        json_path: &str,
        phrase: &str,
        slop: u32,
        prefix: bool,
    ) -> Result<Vec<LogicalLiteral>, QueryParserError> {
        let field_entry = self.schema.get_field_entry(field);
        let field_type = field_entry.field_type();
        let field_name = field_entry.name();
        if !field_type.is_indexed() {
            return Err(QueryParserError::FieldNotIndexed(field_name.to_string()));
        }
        if field_type.value_type() != Type::Json && !json_path.is_empty() {
            let field_name = self.schema.get_field_name(field);
            return Err(QueryParserError::FieldDoesNotExist(format!(
                "{field_name}.{json_path}"
            )));
        }
        match *field_type {
            FieldType::U64(_) => {
                let val: u64 = u64::from_str(phrase)?;
                let i64_term = Term::from_field_u64(field, val);
                Ok(vec![LogicalLiteral::Term(i64_term)])
            }
            FieldType::I64(_) => {
                let val: i64 = i64::from_str(phrase)?;
                let i64_term = Term::from_field_i64(field, val);
                Ok(vec![LogicalLiteral::Term(i64_term)])
            }
            FieldType::F64(_) => {
                let val: f64 = f64::from_str(phrase)?;
                let f64_term = Term::from_field_f64(field, val);
                Ok(vec![LogicalLiteral::Term(f64_term)])
            }
            FieldType::Bool(_) => {
                let val: bool = bool::from_str(phrase)?;
                let bool_term = Term::from_field_bool(field, val);
                Ok(vec![LogicalLiteral::Term(bool_term)])
            }
            FieldType::Date(_) => {
                let dt = OffsetDateTime::parse(phrase, &Rfc3339)?;
                let dt_term = Term::from_field_date_for_search(field, DateTime::from_utc(dt));
                Ok(vec![LogicalLiteral::Term(dt_term)])
            }
            FieldType::Str(ref str_options) => {
                let indexing_options = str_options.get_indexing_options().ok_or_else(|| {
                    // This should have been seen earlier really.
                    QueryParserError::FieldNotIndexed(field_name.to_string())
                })?;
                let mut text_analyzer = self
                    .tokenizer_manager
                    .get(indexing_options.tokenizer())
                    .ok_or_else(|| QueryParserError::UnknownTokenizer {
                        field: field_name.to_string(),
                        tokenizer: indexing_options.tokenizer().to_string(),
                    })?;
                Ok(generate_literals_for_str(
                    field_name,
                    field,
                    phrase,
                    slop,
                    prefix,
                    indexing_options,
                    &mut text_analyzer,
                )?
                .into_iter()
                .collect())
            }
            FieldType::JsonObject(ref json_options) => generate_literals_for_json_object(
                field_name,
                field,
                json_path,
                phrase,
                &self.tokenizer_manager,
                json_options,
            ),
            FieldType::Facet(_) => match Facet::from_text(phrase) {
                Ok(facet) => {
                    let facet_term = Term::from_facet(field, &facet);
                    Ok(vec![LogicalLiteral::Term(facet_term)])
                }
                Err(e) => Err(QueryParserError::from(e)),
            },
            FieldType::Bytes(_) => {
                let bytes = BASE64
                    .decode(phrase)
                    .map_err(QueryParserError::ExpectedBase64)?;
                let bytes_term = Term::from_field_bytes(field, &bytes);
                Ok(vec![LogicalLiteral::Term(bytes_term)])
            }
            FieldType::IpAddr(_) => {
                let ip_v6 = IpAddr::from_str(phrase)?.into_ipv6_addr();
                let term = Term::from_field_ip_addr(field, ip_v6);
                Ok(vec![LogicalLiteral::Term(term)])
            }
        }
    }

    /// Returns the `Occur` applied to sub-queries that carry no explicit occurrence:
    /// `Must` when the parser is in conjunction-by-default mode, `Should` otherwise.
    fn default_occur(&self) -> Occur {
        match self.conjunction_by_default {
            true => Occur::Must,
            false => Occur::Should,
        }
    }

    /// Converts a user supplied range bound into a `Bound<Term>` for the given field.
    ///
    /// A bound whose textual form is `*` is treated as unbounded. Any other bound has its text
    /// converted into a term with `compute_boundary_term`, whose error is propagated as is.
    fn resolve_bound(
        &self,
        field: Field,
        json_path: &str,
        bound: &UserInputBound,
    ) -> Result<Bound<Term>, QueryParserError> {
        let bound_text = bound.term_str();
        if bound_text == "*" {
            return Ok(Bound::Unbounded);
        }
        let boundary_term = self.compute_boundary_term(field, json_path, bound_text)?;
        let resolved = match bound {
            UserInputBound::Inclusive(_) => Bound::Included(boundary_term),
            UserInputBound::Exclusive(_) => Bound::Excluded(boundary_term),
            UserInputBound::Unbounded => Bound::Unbounded,
        };
        Ok(resolved)
    }

    /// Recursively converts a `UserInputAst` into a `LogicalAst`, collecting errors instead of
    /// failing on the first one.
    ///
    /// - Clauses are converted sub-query by sub-query; a sub-query without an explicit
    ///   occurrence receives `default_occur()`. Errors of all sub-queries are concatenated in
    ///   order.
    /// - Boosts are applied on top of the converted inner AST.
    /// - Leaves that could not be converted are replaced by an empty clause.
    fn compute_logical_ast_with_occur_lenient(
        &self,
        user_input_ast: UserInputAst,
    ) -> (LogicalAst, Vec<QueryParserError>) {
        match user_input_ast {
            UserInputAst::Leaf(leaf) => {
                let (ast_opt, errors) = self.compute_logical_ast_from_leaf_lenient(*leaf);
                // An unrecoverable leaf becomes an empty clause, which gets trimmed later on.
                let ast = match ast_opt {
                    Some(ast) => ast,
                    None => LogicalAst::Clause(Vec::new()),
                };
                (ast, errors)
            }
            UserInputAst::Boost(inner_ast, boost) => {
                let (logical_ast, errors) = self.compute_logical_ast_with_occur_lenient(*inner_ast);
                let boosted_ast = logical_ast.boost(boost.into_inner() as Score);
                (boosted_ast, errors)
            }
            UserInputAst::Clause(sub_queries) => {
                let default_occur = self.default_occur();
                let mut errors = Vec::new();
                let logical_sub_queries: Vec<(Occur, LogicalAst)> = sub_queries
                    .into_iter()
                    .map(|(occur_opt, sub_ast)| {
                        let (logical_sub_ast, sub_errors) =
                            self.compute_logical_ast_with_occur_lenient(sub_ast);
                        errors.extend(sub_errors);
                        (occur_opt.unwrap_or(default_occur), logical_sub_ast)
                    })
                    .collect();
                (LogicalAst::Clause(logical_sub_queries), errors)
            }
        }
    }

    /// Returns the boost registered for `field`, or the neutral boost `1.0` if there is none.
    fn field_boost(&self, field: Field) -> Score {
        match self.boost.get(&field) {
            Some(boost) => *boost,
            None => 1.0,
        }
    }

    /// Iterates over the default fields that are both JSON fields and indexed.
    fn default_indexed_json_fields(&self) -> impl Iterator<Item = Field> + '_ {
        // The closure owns its own handle on the schema.
        let schema = self.schema.clone();
        let is_indexed_json = move |field: &Field| {
            let field_type = schema.get_field_entry(*field).field_type();
            field_type.is_indexed() && field_type.value_type() == Type::Json
        };
        self.default_fields.iter().cloned().filter(is_indexed_json)
    }

    /// Given a literal, returns the list of terms that should be searched.
    ///
    /// Each target is described by a triplet:
    /// - the tantivy field,
    /// - the field path: tantivy has JSON fields, and a member of a JSON object is targeted by
    ///   extending the JSON field name with a "."-separated path,
    /// - the phrase that is being searched.
    ///
    /// The literal identifies the targeted field by a so-called *full field path*,
    /// specified before the ":" (e.g. `identity.username:fulmicoton`).
    ///
    /// Splitting the full field path into (field name, field path) can be ambiguous,
    /// because field names can contain "." themselves.
    /// For instance, if a field is named `one.two` and another one is named `one`,
    /// should `one.two:three` target `one.two` with an empty field path, or `one` with
    /// the field path `two`?
    ///
    /// In this case tantivy just picks the solution with the longest field name.
    ///
    /// Quirk: as a hack for quickwit, we do not split over a dot that appears escaped (`\.`).
    ///
    /// Resolution order:
    /// 1. no field specified: every default field is targeted with an empty path;
    /// 2. the full path resolves to a schema field: that single field is targeted;
    /// 3. otherwise the full path is used as a JSON path on every default indexed JSON field.
    ///
    /// # Errors
    /// - `NoDefaultFieldDeclared` if no field is specified and there are no default fields.
    /// - `FieldDoesNotExist` if the path matches neither a field nor any default JSON field.
    fn compute_path_triplets_for_literal<'a>(
        &self,
        literal: &'a UserInputLiteral,
    ) -> Result<Vec<(Field, &'a str, &'a str)>, QueryParserError> {
        let phrase: &'a str = literal.phrase.as_str();
        let Some(full_path) = &literal.field_name else {
            // The user did not specify any path...
            // We simply target default fields.
            if self.default_fields.is_empty() {
                return Err(QueryParserError::NoDefaultFieldDeclared);
            }
            let default_triplets: Vec<(Field, &str, &str)> = self
                .default_fields
                .iter()
                .map(|default_field| (*default_field, "", phrase))
                .collect();
            return Ok(default_triplets);
        };
        if let Some((field, path)) = self.split_full_path(full_path) {
            return Ok(vec![(field, path, phrase)]);
        }
        // No schema field matches: fall back on the default JSON fields, using the whole
        // path as a JSON path.
        let json_triplets: Vec<(Field, &str, &str)> = self
            .default_indexed_json_fields()
            .map(|json_field| (json_field, full_path.as_str(), phrase))
            .collect();
        if json_triplets.is_empty() {
            Err(QueryParserError::FieldDoesNotExist(full_path.to_string()))
        } else {
            Ok(json_triplets)
        }
    }

    /// Converts a single `UserInputLeaf` into a `LogicalAst`, leniently.
    ///
    /// Returns the converted AST (or `None` when nothing usable could be produced) together
    /// with the errors met along the way. Both can be non-empty at once: for instance a range
    /// with one unparsable bound still yields a half-open range plus the parsing error.
    ///
    /// Per leaf kind:
    /// - `Literal`: resolved against every targeted field. If at least one field succeeds, the
    ///   errors of the other fields are discarded.
    /// - `All`: matches everything.
    /// - `Range`: requires an explicit field; a bound that fails to parse degrades to
    ///   unbounded, and a range unbounded on both sides is dropped.
    /// - `Set`: requires an explicit field; elements that fail to parse are reported and left
    ///   out of the set.
    /// - `Exists`: always rejected with an `UnsupportedQuery` error.
    /// - `Regex`: requires regexes to be enabled, an explicit text field without JSON path,
    ///   and a valid pattern.
    fn compute_logical_ast_from_leaf_lenient(
        &self,
        leaf: UserInputLeaf,
    ) -> (Option<LogicalAst>, Vec<QueryParserError>) {
        match leaf {
            UserInputLeaf::Literal(literal) => {
                let term_phrases: Vec<(Field, &str, &str)> =
                    try_tuple!(self.compute_path_triplets_for_literal(&literal));
                let mut asts: Vec<LogicalAst> = Vec::new();
                let mut errors: Vec<QueryParserError> = Vec::new();
                for (field, json_path, phrase) in term_phrases {
                    let unboosted_asts = match self.compute_logical_ast_for_leaf(
                        field,
                        json_path,
                        phrase,
                        literal.slop,
                        literal.prefix,
                    ) {
                        Ok(asts) => asts,
                        Err(e) => {
                            errors.push(e);
                            continue;
                        }
                    };
                    // Apply some field specific boost defined at the query parser level.
                    // The boost only depends on the field, so it is looked up once per field.
                    let boost = self.field_boost(field);
                    asts.extend(
                        unboosted_asts
                            .into_iter()
                            .map(|ast| LogicalAst::Leaf(Box::new(ast)).boost(boost)),
                    );
                }
                if !asts.is_empty() {
                    // if some fields failed but other succeeded, we consider this a success, it
                    // probably means the default_fields contains
                    // text and non-text fields, and the non-text ones failed
                    errors.clear();
                }
                let result_ast: LogicalAst = if asts.len() == 1 {
                    asts.into_iter().next().unwrap()
                } else {
                    LogicalAst::Clause(asts.into_iter().map(|ast| (Occur::Should, ast)).collect())
                };
                (Some(result_ast), errors)
            }
            UserInputLeaf::All => (
                Some(LogicalAst::Leaf(Box::new(LogicalLiteral::All))),
                Vec::new(),
            ),
            UserInputLeaf::Range {
                field: full_field_opt,
                lower,
                upper,
            } => {
                let Some(full_path) = full_field_opt else {
                    return (
                        None,
                        vec![QueryParserError::UnsupportedQuery(
                            "Range query need to target a specific field.".to_string(),
                        )],
                    );
                };
                let (field, json_path) = try_tuple!(self
                    .split_full_path(&full_path)
                    .ok_or_else(|| QueryParserError::FieldDoesNotExist(full_path.clone())));
                let mut errors = Vec::new();
                // A bound that cannot be resolved is reported and degraded to unbounded.
                let lower = match self.resolve_bound(field, json_path, &lower) {
                    Ok(bound) => bound,
                    Err(error) => {
                        errors.push(error);
                        Bound::Unbounded
                    }
                };
                let upper = match self.resolve_bound(field, json_path, &upper) {
                    Ok(bound) => bound,
                    Err(error) => {
                        errors.push(error);
                        Bound::Unbounded
                    }
                };
                if lower == Bound::Unbounded && upper == Bound::Unbounded {
                    // this range is useless, either because a user requested [* TO *], or because
                    // we failed to parse something. Either way, there is no point emitting it
                    return (None, errors);
                }
                let logical_ast =
                    LogicalAst::Leaf(Box::new(LogicalLiteral::Range { lower, upper }));
                (Some(logical_ast), errors)
            }
            UserInputLeaf::Set {
                field: full_field_opt,
                elements,
            } => {
                let full_path = try_tuple!(full_field_opt.ok_or_else(|| {
                    QueryParserError::UnsupportedQuery(
                        "Set query need to target a specific field.".to_string(),
                    )
                }));
                let (field, json_path) = try_tuple!(self
                    .split_full_path(&full_path)
                    .ok_or_else(|| QueryParserError::FieldDoesNotExist(full_path.clone())));
                // Valid elements go into the set, invalid ones are reported as errors.
                let (elements, errors) = elements
                    .into_iter()
                    .map(|element| self.compute_boundary_term(field, json_path, &element))
                    .partition_result();
                let logical_ast = LogicalAst::Leaf(Box::new(LogicalLiteral::Set { elements }));
                (Some(logical_ast), errors)
            }
            UserInputLeaf::Exists { .. } => (
                None,
                vec![QueryParserError::UnsupportedQuery(
                    "Exists queries are not supported by the query parser.".to_string(),
                )],
            ),
            UserInputLeaf::Regex { field, pattern } => {
                if !self.regexes_allowed {
                    return (
                        None,
                        vec![QueryParserError::UnsupportedQuery(
                            "Regex queries are not allowed.".to_string(),
                        )],
                    );
                }
                let full_path = try_tuple!(field.ok_or_else(|| {
                    QueryParserError::UnsupportedQuery(
                        "Regex query need to target a specific field.".to_string(),
                    )
                }));
                let (field, json_path) = try_tuple!(self
                    .split_full_path(&full_path)
                    .ok_or_else(|| QueryParserError::FieldDoesNotExist(full_path.clone())));
                if !json_path.is_empty() {
                    return (
                        None,
                        vec![QueryParserError::UnsupportedQuery(
                            "Regex query does not support json paths.".to_string(),
                        )],
                    );
                }
                if !matches!(
                    self.schema.get_field_entry(field).field_type(),
                    FieldType::Str(_)
                ) {
                    return (
                        None,
                        vec![QueryParserError::UnsupportedQuery(
                            "Regex query only supported on text fields".to_string(),
                        )],
                    );
                }
                let pattern = try_tuple!(Regex::new(&pattern).map_err(|e| {
                    QueryParserError::UnsupportedQuery(format!("Invalid regex: {e}"))
                }));
                let logical_ast = LogicalAst::Leaf(Box::new(LogicalLiteral::Regex {
                    pattern: Arc::new(pattern),
                    field,
                }));
                (Some(logical_ast), Vec::new())
            }
        }
    }
}

/// Builds the executable query matching a single logical literal.
///
/// `fuzzy` maps fields to their fuzzy search settings: a term targeting such a field is
/// turned into a (possibly prefix) `FuzzyTermQuery` instead of a plain `TermQuery`.
fn convert_literal_to_query(
    fuzzy: &FxHashMap<Field, Fuzzy>,
    logical_literal: LogicalLiteral,
) -> Box<dyn Query> {
    match logical_literal {
        LogicalLiteral::All => Box::new(AllQuery),
        LogicalLiteral::Regex { pattern, field } => {
            Box::new(RegexQuery::from_regex(pattern, field))
        }
        LogicalLiteral::Set { elements, .. } => Box::new(TermSetQuery::new(elements)),
        LogicalLiteral::Range { lower, upper } => Box::new(RangeQuery::new(lower, upper)),
        LogicalLiteral::Phrase {
            terms,
            slop,
            prefix,
        } => match prefix {
            true => Box::new(PhrasePrefixQuery::new_with_offset(terms)),
            false => Box::new(PhraseQuery::new_with_offset_and_slop(terms, slop)),
        },
        LogicalLiteral::Term(term) => match fuzzy.get(&term.field()) {
            Some(fuzzy_settings) if fuzzy_settings.prefix => {
                Box::new(FuzzyTermQuery::new_prefix(
                    term,
                    fuzzy_settings.distance,
                    fuzzy_settings.transpose_cost_one,
                ))
            }
            Some(fuzzy_settings) => Box::new(FuzzyTermQuery::new(
                term,
                fuzzy_settings.distance,
                fuzzy_settings.transpose_cost_one,
            )),
            None => Box::new(TermQuery::new(term, IndexRecordOption::WithFreqs)),
        },
    }
}

/// Tokenizes `phrase` with `text_analyzer` and builds the matching literal for a text field.
///
/// - No token: returns `Ok(None)`.
/// - One token: returns a term literal.
/// - Several tokens: returns a phrase literal carrying `slop` and `prefix`.
///
/// # Errors
/// - `PhrasePrefixRequiresAtLeastTwoTerms` if `prefix` is set and fewer than two tokens were
///   produced.
/// - `FieldDoesNotHavePositionsIndexed` if several tokens were produced but the field does not
///   index positions.
fn generate_literals_for_str(
    field_name: &str,
    field: Field,
    phrase: &str,
    slop: u32,
    prefix: bool,
    indexing_options: &TextFieldIndexing,
    text_analyzer: &mut TextAnalyzer,
) -> Result<Option<LogicalLiteral>, QueryParserError> {
    let mut positioned_terms: Vec<(usize, Term)> = Vec::new();
    let mut token_stream = text_analyzer.token_stream(phrase);
    token_stream.process(&mut |token| {
        positioned_terms.push((token.position, Term::from_field_text(field, &token.text)));
    });

    if positioned_terms.len() > 1 {
        // Several tokens make a phrase, which can only be matched using positions.
        if !indexing_options.index_option().has_positions() {
            return Err(QueryParserError::FieldDoesNotHavePositionsIndexed(
                field_name.to_string(),
            ));
        }
        return Ok(Some(LogicalLiteral::Phrase {
            terms: positioned_terms,
            slop,
            prefix,
        }));
    }

    if prefix {
        return Err(QueryParserError::PhrasePrefixRequiresAtLeastTwoTerms {
            phrase: phrase.to_owned(),
            tokenizer: indexing_options.tokenizer().to_owned(),
        });
    }
    // At most one term is left at this point.
    Ok(positioned_terms
        .pop()
        .map(|(_, term)| LogicalLiteral::Term(term)))
}

/// Builds the literals to search for `phrase` under `json_path` of a JSON field.
///
/// Two interpretations of the phrase are combined:
/// 1. if the phrase can be converted to a fast value, a term for that value is emitted;
/// 2. the phrase is tokenized with the text tokenizer of the JSON field; a single token
///    yields a term, several tokens yield a phrase (with no slop and no prefix matching).
///
/// # Errors
/// - `FieldNotIndexed` if the JSON field has no text indexing options.
/// - `UnknownTokenizer` if the configured tokenizer is not registered.
/// - `FieldDoesNotHavePositionsIndexed` if several tokens were produced but the field does not
///   index positions.
fn generate_literals_for_json_object(
    field_name: &str,
    field: Field,
    json_path: &str,
    phrase: &str,
    tokenizer_manager: &TokenizerManager,
    json_options: &JsonObjectOptions,
) -> Result<Vec<LogicalLiteral>, QueryParserError> {
    let text_options = json_options.get_text_indexing_options().ok_or_else(|| {
        // This should have been seen earlier really.
        QueryParserError::FieldNotIndexed(field_name.to_string())
    })?;
    let mut text_analyzer = tokenizer_manager
        .get(text_options.tokenizer())
        .ok_or_else(|| QueryParserError::UnknownTokenizer {
            field: field_name.to_string(),
            tokenizer: text_options.tokenizer().to_string(),
        })?;
    let index_record_option = text_options.index_option();
    let mut logical_literals = Vec::new();

    // Every term starts from the same (field, json path) prefix.
    let get_term_with_path =
        || Term::from_field_json_path(field, json_path, json_options.is_expand_dots_enabled());

    // Try to convert the phrase to a fast value
    if let Some(term) =
        convert_to_fast_value_and_append_to_json_term(&get_term_with_path(), phrase, true)
    {
        logical_literals.push(LogicalLiteral::Term(term));
    }

    // Try to tokenize the phrase and create Terms.
    let mut positions_and_terms = Vec::<(usize, Term)>::new();
    let mut token_stream = text_analyzer.token_stream(phrase);
    token_stream.process(&mut |token| {
        let mut term = get_term_with_path();
        term.append_type_and_str(&token.text);
        // The term is not used afterwards: move it instead of cloning it.
        positions_and_terms.push((token.position, term));
    });

    if positions_and_terms.len() <= 1 {
        logical_literals.extend(
            positions_and_terms
                .into_iter()
                .map(|(_, term)| LogicalLiteral::Term(term)),
        );
        return Ok(logical_literals);
    }
    // Several tokens make a phrase, which can only be matched using positions.
    if !index_record_option.has_positions() {
        return Err(QueryParserError::FieldDoesNotHavePositionsIndexed(
            field_name.to_string(),
        ));
    }
    logical_literals.push(LogicalLiteral::Phrase {
        terms: positions_and_terms,
        slop: 0,
        prefix: false,
    });
    Ok(logical_literals)
}

/// Recursively converts a logical AST into an executable query.
///
/// The AST is trimmed first; if nothing is left, an `EmptyQuery` is returned.
///
/// # Panics
/// Panics if a clause is still empty after trimming.
fn convert_to_query(fuzzy: &FxHashMap<Field, Fuzzy>, logical_ast: LogicalAst) -> Box<dyn Query> {
    let Some(trimmed_ast) = trim_ast(logical_ast) else {
        return Box::new(EmptyQuery);
    };
    match trimmed_ast {
        LogicalAst::Leaf(literal) => convert_literal_to_query(fuzzy, *literal),
        LogicalAst::Boost(inner_ast, boost) => {
            let inner_query = convert_to_query(fuzzy, *inner_ast);
            Box::new(BoostQuery::new(inner_query, boost))
        }
        LogicalAst::Clause(clause) => {
            let mut occur_subqueries = Vec::with_capacity(clause.len());
            for (occur, sub_ast) in clause {
                occur_subqueries.push((occur, convert_to_query(fuzzy, sub_ast)));
            }
            assert!(
                !occur_subqueries.is_empty(),
                "Should not be empty after trimming"
            );
            Box::new(BooleanQuery::new(occur_subqueries))
        }
    }
}

#[cfg(test)]
mod test {
    use matches::assert_matches;

    use super::super::logical_ast::*;
    use super::{QueryParser, QueryParserError};
    use crate::query::Query;
    use crate::schema::{
        FacetOptions, Field, IndexRecordOption, Schema, Term, TextFieldIndexing, TextOptions, FAST,
        INDEXED, STORED, STRING, TEXT,
    };
    use crate::tokenizer::{
        LowerCaser, SimpleTokenizer, StopWordFilter, TextAnalyzer, TokenizerManager,
    };
    use crate::Index;

    /// Builds the schema shared by the query parser tests.
    ///
    /// Fields are numbered in declaration order and the tests hard-code those ids in their
    /// expected output (e.g. `title` is 0, `text` is 1, `nottokenized` is 7, `facet` is 11):
    /// do not reorder the declarations.
    fn make_schema() -> Schema {
        let mut builder = Schema::builder();
        // Text options relying on the custom "en_with_stop_words" tokenizer.
        let stop_words_indexing = TextFieldIndexing::default()
            .set_tokenizer("en_with_stop_words")
            .set_index_option(IndexRecordOption::WithFreqsAndPositions);
        let stop_words_options = TextOptions::default()
            .set_indexing_options(stop_words_indexing)
            .set_stored();
        builder.add_text_field("title", TEXT);
        builder.add_text_field("text", TEXT);
        builder.add_i64_field("signed", INDEXED);
        builder.add_u64_field("unsigned", INDEXED);
        builder.add_text_field("notindexed_text", STORED);
        // NOTE(review): despite their names, the two fields below are declared as text
        // fields -- confirm whether this is intended.
        builder.add_text_field("notindexed_u64", STORED);
        builder.add_text_field("notindexed_i64", STORED);
        builder.add_text_field("nottokenized", STRING);
        builder.add_text_field("with_stop_words", stop_words_options);
        builder.add_date_field("date", INDEXED);
        builder.add_f64_field("float", INDEXED);
        builder.add_facet_field("facet", FacetOptions::default());
        builder.add_bytes_field("bytes", INDEXED);
        builder.add_bytes_field("bytes_not_indexed", STORED);
        builder.add_json_field("json", TEXT);
        builder.add_json_field("json_not_indexed", STORED);
        builder.add_bool_field("bool", INDEXED);
        builder.add_bool_field("notindexed_bool", STORED);
        builder.add_u64_field("u64_ff", FAST);
        builder.build()
    }

    /// Creates a query parser over the test schema, using the given default fields.
    ///
    /// Names that do not match any schema field are silently ignored. The
    /// "en_with_stop_words" tokenizer (lowercasing, drops "the") is registered on top of the
    /// default tokenizers.
    fn make_query_parser_with_default_fields(default_fields: &[&'static str]) -> QueryParser {
        let schema = make_schema();
        let default_fields: Vec<Field> = default_fields
            .iter()
            .filter_map(|field_name| schema.get_field(field_name).ok())
            .collect();
        let en_with_stop_words = TextAnalyzer::builder(SimpleTokenizer::default())
            .filter(LowerCaser)
            .filter(StopWordFilter::remove(vec!["the".to_string()]))
            .build();
        let tokenizer_manager = TokenizerManager::default();
        tokenizer_manager.register("en_with_stop_words", en_with_stop_words);
        QueryParser::new(schema, default_fields, tokenizer_manager)
    }

    /// Creates a query parser over the test schema with `title` and `text` as default fields.
    fn make_query_parser() -> QueryParser {
        const DEFAULT_FIELDS: [&str; 2] = ["title", "text"];
        make_query_parser_with_default_fields(&DEFAULT_FIELDS)
    }

    /// Parses `query` into a logical AST with a parser configured as requested:
    /// the given default fields, optional conjunction-by-default, optional regex support.
    fn parse_query_to_logical_ast_with_default_fields(
        query: &str,
        default_conjunction: bool,
        default_fields: &[&'static str],
        allow_regexes: bool,
    ) -> Result<LogicalAst, QueryParserError> {
        let mut parser = make_query_parser_with_default_fields(default_fields);
        if default_conjunction {
            parser.set_conjunction_by_default();
        }
        if allow_regexes {
            parser.allow_regexes();
        }
        let logical_ast_res = parser.parse_query_to_logical_ast(query);
        logical_ast_res
    }

    /// Parses `query` into a logical AST using the `title` and `text` default fields, with
    /// regexes allowed.
    fn parse_query_to_logical_ast(
        query: &str,
        default_conjunction: bool,
    ) -> Result<LogicalAst, QueryParserError> {
        let default_fields = ["title", "text"];
        let allow_regexes = true;
        parse_query_to_logical_ast_with_default_fields(
            query,
            default_conjunction,
            &default_fields,
            allow_regexes,
        )
    }

    /// Asserts that `query` parses (regexes allowed) into a logical AST whose debug
    /// representation is exactly `expected`. Panics if parsing fails.
    #[track_caller]
    fn test_parse_query_to_logical_ast_helper_with_default_fields(
        query: &str,
        expected: &str,
        default_conjunction: bool,
        default_fields: &[&'static str],
    ) {
        let allow_regexes = true;
        let logical_ast = parse_query_to_logical_ast_with_default_fields(
            query,
            default_conjunction,
            default_fields,
            allow_regexes,
        )
        .unwrap();
        assert_eq!(format!("{logical_ast:?}"), expected);
    }

    /// Same as `test_parse_query_to_logical_ast_helper_with_default_fields`, using the
    /// `title` and `text` default fields.
    #[track_caller]
    fn test_parse_query_to_logical_ast_helper(
        query: &str,
        expected: &str,
        default_conjunction: bool,
    ) {
        let default_fields = ["title", "text"];
        test_parse_query_to_logical_ast_helper_with_default_fields(
            query,
            expected,
            default_conjunction,
            &default_fields,
        )
    }

    /// A facet path targeting a facet field is parsed into a single term query.
    #[test]
    pub fn test_parse_query_facet() {
        let parser = make_query_parser();
        let parsed_query = parser.parse_query("facet:/root/branch/leaf").unwrap();
        let debug_repr = format!("{parsed_query:?}");
        assert_eq!(
            debug_repr,
            r#"TermQuery(Term(field=11, type=Facet, Facet(/root/branch/leaf)))"#
        );
    }

    /// A boost registered on a field wraps the queries targeting that field.
    #[test]
    pub fn test_parse_query_with_boost() {
        let text_field = make_schema().get_field("text").unwrap();
        let mut parser = make_query_parser();
        parser.set_field_boost(text_field, 2.0);
        let parsed_query = parser.parse_query("text:hello").unwrap();
        let debug_repr = format!("{parsed_query:?}");
        assert_eq!(
            debug_repr,
            r#"Boost(query=TermQuery(Term(field=1, type=Str, "hello")), boost=2)"#
        );
    }

    /// A range on a text field yields a range query whose bounds went through the field
    /// tokenizer (note the lowercased terms).
    #[test]
    pub fn test_parse_query_range_with_boost() {
        let parser = make_query_parser();
        let parsed_query = parser.parse_query("title:[A TO B]").unwrap();
        let debug_repr = format!("{parsed_query:?}");
        assert_eq!(
            debug_repr,
            "RangeQuery { bounds: BoundsRange { lower_bound: Included(Term(field=0, type=Str, \
             \"a\")), upper_bound: Included(Term(field=0, type=Str, \"b\")) } }"
        );
    }

    /// A boost written in the query (`^2`) is stacked on top of the field level boost.
    #[test]
    pub fn test_parse_query_with_default_boost_and_custom_boost() {
        let text_field = make_schema().get_field("text").unwrap();
        let mut parser = make_query_parser();
        parser.set_field_boost(text_field, 2.0);
        let parsed_query = parser.parse_query("text:hello^2").unwrap();
        let debug_repr = format!("{parsed_query:?}");
        assert_eq!(
            debug_repr,
            r#"Boost(query=Boost(query=TermQuery(Term(field=1, type=Str, "hello")), boost=2), boost=2)"#
        );
    }

    /// Querying a field that is stored but not indexed fails with `FieldNotIndexed`, naming
    /// the offending field.
    #[test]
    pub fn test_parse_nonindexed_field_yields_error() {
        let query_parser = make_query_parser();

        // Name carried by the `FieldNotIndexed` error, or `None` for any other outcome.
        let not_indexed_field = |query: &str| -> Option<String> {
            match query_parser.parse_query(query) {
                Err(QueryParserError::FieldNotIndexed(field_name)) => Some(field_name),
                _ => None,
            }
        };

        let cases = [
            ("notindexed_text:titi", "notindexed_text"),
            ("notindexed_u64:23424", "notindexed_u64"),
            ("notindexed_i64:-234324", "notindexed_i64"),
            ("notindexed_bool:true", "notindexed_bool"),
        ];
        for (query, expected_field_name) in cases {
            assert_eq!(
                not_indexed_field(query),
                Some(String::from(expected_field_name))
            );
        }
    }

    /// A quoted value on the `nottokenized` field yields a single term holding the whole phrase.
    #[test]
    pub fn test_parse_query_untokenized() {
        let query = "nottokenized:\"wordone wordtwo\"";
        let expected_ast = r#"Term(field=7, type=Str, "wordone wordtwo")"#;
        test_parse_query_to_logical_ast_helper(query, expected_ast, false);
    }

    /// Empty and whitespace-only input give an empty clause; the built query is `EmptyQuery`.
    #[test]
    pub fn test_parse_query_empty() {
        for blank_query in ["", " "] {
            test_parse_query_to_logical_ast_helper(blank_query, "<emptyclause>", false);
        }
        let parsed = make_query_parser().parse_query("").unwrap();
        let rendered = format!("{parsed:?}");
        assert_eq!(rendered, "EmptyQuery");
    }

    /// Checks which literals are accepted or rejected on the `signed`, `unsigned` and `float`
    /// fields, then the exact terms produced for one value of each kind.
    #[test]
    pub fn test_parse_query_ints() {
        let query_parser = make_query_parser();

        let accepted = [
            "signed:2324",
            "signed:\"22\"",
            "signed:\"-2234\"",
            "signed:\"-9999999999999\"",
            "unsigned:\"2\"",
            "unsigned:\"18446744073709551615\"",
            "float:\"3.1\"",
            "float:\"-2.4\"",
            "float:\"18446744073709551615.0\"",
        ];
        for query in accepted {
            assert!(query_parser.parse_query(query).is_ok());
        }

        let rejected = [
            "signed:\"a\"",
            "signed:\"2a\"",
            "signed:\"18446744073709551615\"",
            "unsigned:\"-2\"",
            "float:\"2.1.2\"",
            "float:\"2.1a\"",
        ];
        for query in rejected {
            assert!(query_parser.parse_query(query).is_err());
        }

        test_parse_query_to_logical_ast_helper(
            "unsigned:2324",
            "Term(field=3, type=U64, 2324)",
            false,
        );

        let signed_term = Term::from_field_i64(Field::from_field_id(2u32), -2324);
        test_parse_query_to_logical_ast_helper(
            "signed:-2324",
            &format!("{signed_term:?}"),
            false,
        );

        let float_term = Term::from_field_f64(Field::from_field_id(10u32), 2.5);
        test_parse_query_to_logical_ast_helper("float:2.5", &format!("{float_term:?}"), false);
    }

    /// An unquoted base64 value on the `bytes` field is decoded into a bytes term.
    #[test]
    fn test_parse_bytes() {
        let query = "bytes:YnVidQ==";
        let expected_ast = "Term(field=12, type=Bytes, [98, 117, 98, 117])";
        test_parse_query_to_logical_ast_helper(query, expected_ast, false);
    }

    /// `bool:true` parses to the same term as `Term::from_field_bool` builds for field 16.
    #[test]
    fn test_parse_bool() {
        let expected_term = Term::from_field_bool(Field::from_field_id(16u32), true);
        let expected_ast = format!("{expected_term:?}");
        test_parse_query_to_logical_ast_helper("bool:true", &expected_ast, false);
    }

    /// Querying the `bytes_not_indexed` field is rejected with `FieldNotIndexed`.
    #[test]
    fn test_parse_bytes_not_indexed() {
        let parse_result = parse_query_to_logical_ast("bytes_not_indexed:aaa", false);
        let parse_error = parse_result.unwrap_err();
        assert!(matches!(
            parse_error,
            QueryParserError::FieldNotIndexed(_)
        ));
    }

    /// A dotted path after the `json` field name becomes the JSON path of the term.
    #[test]
    fn test_json_field() {
        let query = "json.titi:hello";
        let expected_ast = "Term(field=14, type=Json, path=titi, type=Str, \"hello\")";
        test_parse_query_to_logical_ast_helper(query, expected_ast, false);
    }

    /// Parses `query`, expects the result to be a single term leaf, and returns that term's
    /// serialized value bytes as a UTF-8 string.
    ///
    /// Panics if the query does not parse, is not a single term, or the bytes are not UTF-8.
    fn extract_query_term_json_path(query: &str) -> String {
        let leaf = match parse_query_to_logical_ast(query, false).unwrap() {
            LogicalAst::Leaf(literal) => literal,
            _ => panic!(),
        };
        let term = match *leaf {
            LogicalLiteral::Term(term) => term,
            _ => panic!(),
        };
        let serialized = std::str::from_utf8(term.serialized_value_bytes()).unwrap();
        serialized.to_string()
    }

    /// Unescaped dots split the JSON path into segments; backslash-escaped dots stay literal.
    #[test]
    fn test_json_field_query_with_escaped_dot() {
        let cases = [
            (
                r#"json.k8s.node.name:hello"#,
                "k8s\u{1}node\u{1}name\0shello",
            ),
            (r"json.k8s\.node\.name:hello", "k8s.node.name\0shello"),
        ];
        for (query, expected_serialized) in cases {
            assert_eq!(extract_query_term_json_path(query), expected_serialized);
        }
    }

    /// Numeric-looking values on a JSON path produce both a typed numeric term and the
    /// tokenized string form.
    #[test]
    fn test_json_field_possibly_a_number() {
        let cases = [
            (
                "json.titi:5",
                r#"(Term(field=14, type=Json, path=titi, type=I64, 5) Term(field=14, type=Json, path=titi, type=Str, "5"))"#,
            ),
            // Yes this is a bit weird: after going through the tokenizer we lose the "-".
            (
                "json.titi:-5",
                r#"(Term(field=14, type=Json, path=titi, type=I64, -5) Term(field=14, type=Json, path=titi, type=Str, "5"))"#,
            ),
            (
                "json.titi:10000000000000000000",
                r#"(Term(field=14, type=Json, path=titi, type=U64, 10000000000000000000) Term(field=14, type=Json, path=titi, type=Str, "10000000000000000000"))"#,
            ),
            (
                "json.titi:-5.2",
                r#"(Term(field=14, type=Json, path=titi, type=F64, -5.2) "[(0, Term(field=14, type=Json, path=titi, type=Str, "5")), (1, Term(field=14, type=Json, path=titi, type=Str, "2"))]")"#,
            ),
        ];
        for (query, expected_ast) in cases {
            test_parse_query_to_logical_ast_helper(query, expected_ast, true);
        }
    }

    /// A date-looking value on a JSON path produces a date term plus the tokenized phrase.
    #[test]
    fn test_json_field_possibly_a_date() {
        let query = r#"json.date:"2019-10-12T07:20:50.52Z""#;
        let expected_ast = r#"(Term(field=14, type=Json, path=date, type=Date, 2019-10-12T07:20:50Z) "[(0, Term(field=14, type=Json, path=date, type=Str, "2019")), (1, Term(field=14, type=Json, path=date, type=Str, "10")), (2, Term(field=14, type=Json, path=date, type=Str, "12t07")), (3, Term(field=14, type=Json, path=date, type=Str, "20")), (4, Term(field=14, type=Json, path=date, type=Str, "50")), (5, Term(field=14, type=Json, path=date, type=Str, "52z"))]")"#;
        test_parse_query_to_logical_ast_helper(query, expected_ast, true);
    }

    /// A boolean-looking value on a JSON path produces both a bool term and a string term.
    #[test]
    fn test_json_field_possibly_a_bool() {
        let query = "json.titi:true";
        let expected_ast = r#"(Term(field=14, type=Json, path=titi, type=Bool, true) Term(field=14, type=Json, path=titi, type=Str, "true"))"#;
        test_parse_query_to_logical_ast_helper(query, expected_ast, true);
    }

    /// Querying a path under the `json_not_indexed` field is rejected with `FieldNotIndexed`.
    #[test]
    fn test_json_field_not_indexed() {
        let parse_result = parse_query_to_logical_ast("json_not_indexed.titi:hello", false);
        let parse_error = parse_result.unwrap_err();
        assert!(matches!(
            parse_error,
            QueryParserError::FieldNotIndexed(_)
        ));
    }

    /// Parses `query` with `json` as the only default field and asserts that the debug
    /// rendering of the logical AST equals `expected`.
    ///
    /// When `default_conjunction` is true the parser is switched to conjunction-by-default.
    fn test_query_to_logical_ast_with_default_json(
        query: &str,
        expected: &str,
        default_conjunction: bool,
    ) {
        let mut parser = make_query_parser_with_default_fields(&["json"]);
        if default_conjunction {
            parser.set_conjunction_by_default();
        }
        let logical_ast = parser.parse_query_to_logical_ast(query).unwrap();
        let rendered = format!("{logical_ast:?}");
        assert_eq!(rendered, expected);
    }

    /// With `json` as default field, an unknown field name is treated as a JSON path.
    #[test]
    fn test_json_default() {
        let expected_ast = "(Term(field=14, type=Json, path=titi, type=I64, 4) Term(field=14, \
                            type=Json, path=titi, type=Str, \"4\"))";
        test_query_to_logical_ast_with_default_json("titi:4", expected_ast, false);
    }

    /// An explicit, existing field name wins over the default `json` field in both modes.
    #[test]
    fn test_json_default_with_different_field() {
        let query = "text:4";
        let expected_ast = r#"Term(field=1, type=Str, "4")"#;
        for conjunction in [false, true] {
            test_query_to_logical_ast_with_default_json(query, expected_ast, conjunction);
        }
    }

    /// Naming the `json` field itself targets it with an empty path in both modes.
    #[test]
    fn test_json_default_with_same_field() {
        let query = "json:4";
        let expected_ast = r#"(Term(field=14, type=Json, path=, type=I64, 4) Term(field=14, type=Json, path=, type=Str, "4"))"#;
        for conjunction in [false, true] {
            test_query_to_logical_ast_with_default_json(query, expected_ast, conjunction);
        }
    }

    /// A quoted base64 value on the `bytes` field decodes to the same bytes term.
    #[test]
    fn test_parse_bytes_phrase() {
        let query = "bytes:\"YnVidQ==\"";
        let expected_ast = "Term(field=12, type=Bytes, [98, 117, 98, 117])";
        test_parse_query_to_logical_ast_helper(query, expected_ast, false);
    }

    /// A value that is not valid base64 on the `bytes` field fails with `ExpectedBase64`.
    #[test]
    fn test_parse_bytes_invalid_base64() {
        let parse_result = parse_query_to_logical_ast("bytes:aa", false);
        let base64_err: QueryParserError = parse_result.unwrap_err();
        assert!(matches!(base64_err, QueryParserError::ExpectedBase64(_)));
    }

    /// The same grouped query is rendered differently in disjunctive and conjunctive mode.
    #[test]
    fn test_parse_query_to_ast_ab_c() {
        let query = "(+title:a +title:b) title:c";
        let cases = [
            (
                false,
                r#"((+Term(field=0, type=Str, "a") +Term(field=0, type=Str, "b")) Term(field=0, type=Str, "c"))"#,
            ),
            (
                true,
                r#"(+Term(field=0, type=Str, "a") +Term(field=0, type=Str, "b") +Term(field=0, type=Str, "c"))"#,
            ),
        ];
        for (default_conjunction, expected_ast) in cases {
            test_parse_query_to_logical_ast_helper(query, expected_ast, default_conjunction);
        }
    }

    /// Single-term queries, with and without `+`, and a required term with an excluded one.
    #[test]
    pub fn test_parse_query_to_ast_single_term() {
        let cases = [
            ("title:toto", r#"Term(field=0, type=Str, "toto")"#),
            ("+title:toto", r#"Term(field=0, type=Str, "toto")"#),
            (
                "+title:toto -titi",
                r#"(+Term(field=0, type=Str, "toto") -(Term(field=0, type=Str, "titi") Term(field=1, type=Str, "titi")))"#,
            ),
        ];
        for (query, expected_ast) in cases {
            test_parse_query_to_logical_ast_helper(query, expected_ast, false);
        }
    }

    /// A query made only of an excluded term is rejected with `AllButQueryForbidden`.
    #[test]
    fn test_single_negative_term() {
        let parse_result = parse_query_to_logical_ast("-title:toto", false);
        assert_matches!(
            parse_result,
            Err(QueryParserError::AllButQueryForbidden)
        );
    }

    /// An unqualified second word goes to the default fields; a quoted pair becomes a phrase.
    #[test]
    pub fn test_parse_query_to_ast_two_terms() {
        let cases = [
            (
                "title:a b",
                r#"(Term(field=0, type=Str, "a") Term(field=0, type=Str, "b") Term(field=1, type=Str, "b"))"#,
            ),
            (
                r#"title:"a b""#,
                r#""[(0, Term(field=0, type=Str, "a")), (1, Term(field=0, type=Str, "b"))]""#,
            ),
        ];
        for (query, expected_ast) in cases {
            test_parse_query_to_logical_ast_helper(query, expected_ast, false);
        }
    }
    /// `*` parses to the match-all node, which renders as `*`.
    #[test]
    pub fn test_parse_query_all_query() {
        let all_ast = parse_query_to_logical_ast("*", false).unwrap();
        let rendered = format!("{all_ast:?}");
        assert_eq!(rendered, "*");
    }

    /// A range without an explicit field is rejected with an "unsupported query" message.
    #[test]
    pub fn test_parse_query_range_require_a_target_field() {
        let parse_result = parse_query_to_logical_ast("[A TO B]", false);
        let error_message = parse_result.err().unwrap().to_string();
        assert_eq!(
            error_message,
            "Unsupported query: Range query need to target a specific field."
        );
    }

    /// Range syntax: inclusive `[]`, exclusive `{}`, unbounded `*`, on text and numeric fields.
    #[test]
    pub fn test_parse_query_to_ast_ranges() {
        let cases = [
            (
                "title:[a TO b]",
                r#"(Included(Term(field=0, type=Str, "a")) TO Included(Term(field=0, type=Str, "b")))"#,
            ),
            (
                "title:{titi TO toto}",
                r#"(Excluded(Term(field=0, type=Str, "titi")) TO Excluded(Term(field=0, type=Str, "toto")))"#,
            ),
            (
                "title:{* TO toto}",
                r#"(Unbounded TO Excluded(Term(field=0, type=Str, "toto")))"#,
            ),
            (
                "title:{titi TO *}",
                r#"(Excluded(Term(field=0, type=Str, "titi")) TO Unbounded)"#,
            ),
            (
                "signed:{-5 TO 3}",
                r#"(Excluded(Term(field=2, type=I64, -5)) TO Excluded(Term(field=2, type=I64, 3)))"#,
            ),
            (
                "float:{-1.5 TO 1.5}",
                r#"(Excluded(Term(field=10, type=F64, -1.5)) TO Excluded(Term(field=10, type=F64, 1.5)))"#,
            ),
            (
                "u64_ff:[7 TO 77]",
                r#"(Included(Term(field=18, type=U64, 7)) TO Included(Term(field=18, type=U64, 77)))"#,
            ),
        ];
        for (query, expected_ast) in cases {
            test_parse_query_to_logical_ast_helper(query, expected_ast, false);
        }
    }

    /// Querying an unknown field fails with `FieldDoesNotExist` naming that field.
    #[test]
    pub fn test_query_parser_field_does_not_exist() {
        let query_parser = make_query_parser();
        let parse_error = query_parser
            .parse_query("boujou:\"18446744073709551615\"")
            .unwrap_err();
        let expected_error = QueryParserError::FieldDoesNotExist("boujou".to_string());
        assert_eq!(parse_error, expected_error);
    }

    /// A quoted value on a non-indexed text field fails with `FieldNotIndexed`.
    #[test]
    pub fn test_query_parser_field_not_indexed() {
        let query_parser = make_query_parser();
        let parse_result = query_parser.parse_query("notindexed_text:\"18446744073709551615\"");
        assert_matches!(parse_result, Err(QueryParserError::FieldNotIndexed(_)));
    }

    /// A field configured with a tokenizer name that the manager does not know fails with
    /// `UnknownTokenizer` at parse time.
    #[test]
    pub fn test_unknown_tokenizer() {
        let indexing = TextFieldIndexing::default()
            .set_tokenizer("nonexistingtokenizer")
            .set_index_option(IndexRecordOption::Basic);
        let options = TextOptions::default().set_indexing_options(indexing);

        let mut schema_builder = Schema::builder();
        let title = schema_builder.add_text_field("title", options);
        let query_parser = QueryParser::new(
            schema_builder.build(),
            vec![title],
            TokenizerManager::default(),
        );

        let parse_result = query_parser.parse_query("title:\"happy tax payer\"");
        assert_matches!(
            parse_result,
            Err(QueryParserError::UnknownTokenizer { .. })
        );
    }

    /// A phrase query on a field indexed with `IndexRecordOption::Basic` fails with
    /// `FieldDoesNotHavePositionsIndexed`.
    #[test]
    pub fn test_query_parser_no_positions() {
        let indexing = TextFieldIndexing::default()
            .set_tokenizer("customtokenizer")
            .set_index_option(IndexRecordOption::Basic);
        let options = TextOptions::default().set_indexing_options(indexing);

        let mut schema_builder = Schema::builder();
        let title = schema_builder.add_text_field("title", options);
        let index = Index::create_in_ram(schema_builder.build());
        index
            .tokenizers()
            .register("customtokenizer", SimpleTokenizer::default());

        let query_parser = QueryParser::for_index(&index, vec![title]);
        let parse_error = query_parser.parse_query("title:\"happy tax\"").unwrap_err();
        let expected_error =
            QueryParserError::FieldDoesNotHavePositionsIndexed("title".to_string());
        assert_eq!(parse_error, expected_error);
    }

    /// Malformed numbers yield `ExpectedInt` / `ExpectedFloat`; quoted valid numbers parse.
    #[test]
    pub fn test_query_parser_expected_int() {
        let query_parser = make_query_parser();

        for malformed_int in ["unsigned:18a", "signed:18b"] {
            assert_matches!(
                query_parser.parse_query(malformed_int),
                Err(QueryParserError::ExpectedInt(_))
            );
        }
        assert_matches!(
            query_parser.parse_query("float:1.8a"),
            Err(QueryParserError::ExpectedFloat(_))
        );

        for well_formed in ["unsigned:\"18\"", "float:\"1.8\""] {
            assert!(query_parser.parse_query(well_formed).is_ok());
        }
    }

    /// A non-boolean value on the `bool` field yields `ExpectedBool`; quoted booleans parse.
    #[test]
    pub fn test_query_parser_expected_bool() {
        let query_parser = make_query_parser();
        let malformed = query_parser.parse_query("bool:brie");
        assert_matches!(malformed, Err(QueryParserError::ExpectedBool(_)));
        for well_formed in ["bool:\"true\"", "bool:\"false\""] {
            assert!(query_parser.parse_query(well_formed).is_ok());
        }
    }

    /// A malformed date yields `DateFormatError`; valid timestamps are rendered in UTC with
    /// whole seconds.
    #[test]
    pub fn test_query_parser_expected_date() {
        let query_parser = make_query_parser();
        let malformed = query_parser.parse_query("date:18a");
        assert_matches!(malformed, Err(QueryParserError::DateFormatError(_)));

        let cases = [
            (
                r#"date:"2010-11-21T09:55:06.000000000+02:00""#,
                r#"Term(field=9, type=Date, 2010-11-21T07:55:06Z)"#,
            ),
            (
                r#"date:"1985-04-12T23:20:50.52Z""#,
                r#"Term(field=9, type=Date, 1985-04-12T23:20:50Z)"#,
            ),
        ];
        for (query, expected_ast) in cases {
            test_parse_query_to_logical_ast_helper(query, expected_ast, true);
        }
    }

    /// A facet value without a leading `/` is rejected with a descriptive message; a
    /// well-formed quoted facet path parses.
    #[test]
    pub fn test_query_parser_expected_facet() {
        let query_parser = make_query_parser();
        let Err(facet_error) = query_parser.parse_query("facet:INVALID") else {
            panic!("should never succeed");
        };
        assert_eq!(
            "The facet field is malformed: Failed to parse the facet string: 'INVALID'",
            facet_error.to_string()
        );
        assert!(query_parser.parse_query("facet:\"/foo/bar\"").is_ok());
    }

    /// Queries that are non-empty but may tokenize to nothing still parse successfully.
    #[test]
    pub fn test_query_parser_not_empty_but_no_tokens() {
        let query_parser = make_query_parser();
        for query in [" !, ", "with_stop_words:the"] {
            assert!(query_parser.parse_query(query).is_ok());
        }
    }

    /// A lone excluded term is rejected in both conjunctive and disjunctive mode.
    #[test]
    pub fn test_parse_query_single_negative_term_through_error() {
        for default_conjunction in [true, false] {
            let parse_result = parse_query_to_logical_ast("-title:toto", default_conjunction);
            assert_matches!(
                parse_result,
                Err(QueryParserError::AllButQueryForbidden)
            );
        }
    }

    /// Logical AST produced for several queries when conjunction is the default.
    #[test]
    pub fn test_parse_query_to_ast_conjunction() {
        let cases = [
            ("title:toto", r#"Term(field=0, type=Str, "toto")"#),
            ("+title:toto", r#"Term(field=0, type=Str, "toto")"#),
            (
                "+title:toto -titi",
                r#"(+Term(field=0, type=Str, "toto") -(Term(field=0, type=Str, "titi") Term(field=1, type=Str, "titi")))"#,
            ),
            (
                "title:a b",
                r#"(+Term(field=0, type=Str, "a") +(Term(field=0, type=Str, "b") Term(field=1, type=Str, "b")))"#,
            ),
            (
                "title:\"a b\"",
                r#""[(0, Term(field=0, type=Str, "a")), (1, Term(field=0, type=Str, "b"))]""#,
            ),
        ];
        for (query, expected_ast) in cases {
            test_parse_query_to_logical_ast_helper(query, expected_ast, true);
        }
    }

    /// Excluded terms, including a nested all-negative group, in conjunctive mode.
    #[test]
    pub fn test_parse_query_negative() {
        let cases = [
            (
                "title:b -title:a",
                r#"(+Term(field=0, type=Str, "b") -Term(field=0, type=Str, "a"))"#,
            ),
            (
                "title:b -(-title:a -title:c)",
                r#"(+Term(field=0, type=Str, "b") -(-Term(field=0, type=Str, "a") -Term(field=0, type=Str, "c")))"#,
            ),
        ];
        for (query, expected_ast) in cases {
            test_parse_query_to_logical_ast_helper(query, expected_ast, true);
        }
    }

    /// A hyphenated word is tokenized into several terms and turned into a phrase.
    #[test]
    pub fn test_query_parser_hyphen() {
        let query = "title:www-form-encoded";
        let expected_ast = r#""[(0, Term(field=0, type=Str, "www")), (1, Term(field=0, type=Str, "form")), (2, Term(field=0, type=Str, "encoded"))]""#;
        test_parse_query_to_logical_ast_helper(query, expected_ast, false);
    }

    /// An explicit `AND` produces two required terms whatever the default operator is.
    #[test]
    fn test_and_default_regardless_of_default_conjunctive() {
        let query = "title:a AND title:b";
        let expected_ast = r#"(+Term(field=0, type=Str, "a") +Term(field=0, type=Str, "b"))"#;
        for default_conjunction in [false, true] {
            test_parse_query_to_logical_ast_helper(query, expected_ast, default_conjunction);
        }
    }

    /// An explicit `OR` produces two optional terms whatever the default operator is.
    #[test]
    fn test_or_default_conjunctive() {
        let query = "title:a OR title:b";
        let expected_ast = r#"(Term(field=0, type=Str, "a") Term(field=0, type=Str, "b"))"#;
        for default_conjunction in [false, true] {
            test_parse_query_to_logical_ast_helper(query, expected_ast, default_conjunction);
        }
    }

    /// A space between the `field:` prefix and the value is tolerated.
    #[test]
    fn test_space_before_value() {
        let query = "title: a";
        let expected_ast = r#"Term(field=0, type=Str, "a")"#;
        test_parse_query_to_logical_ast_helper(query, expected_ast, false);
    }

    /// A schema field whose name is the raw string `a\.b` can be queried as `a\.b:hello`.
    #[test]
    fn test_escaped_field() {
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field(r"a\.b", STRING);
        let query_parser = QueryParser::new(
            schema_builder.build(),
            Vec::new(),
            TokenizerManager::default(),
        );
        let parsed = query_parser.parse_query(r"a\.b:hello").unwrap();
        let rendered = format!("{parsed:?}");
        assert_eq!(rendered, "TermQuery(Term(field=0, type=Str, \"hello\"))");
    }

    /// `split_full_path` resolves the longest matching field name and returns the remainder
    /// of the path, or `None` when no field matches.
    #[test]
    fn test_split_full_path() {
        let mut schema_builder = Schema::builder();
        for field_name in [
            "second",
            "first",
            "first.toto",
            "first.toto.titi",
            "third.a.b.c",
        ] {
            schema_builder.add_text_field(field_name, STRING);
        }
        let schema = schema_builder.build();
        let query_parser =
            QueryParser::new(schema.clone(), Vec::new(), TokenizerManager::default());

        // (full path, expected field name, expected remaining path)
        let resolved_cases = [
            ("first.toto", "first.toto", ""),
            ("first.toto.bubu", "first.toto", "bubu"),
            ("first.toto.titi", "first.toto.titi", ""),
            ("first.titi", "first", "titi"),
        ];
        for (full_path, field_name, remaining_path) in resolved_cases {
            let field = schema.get_field(field_name).unwrap();
            assert_eq!(
                query_parser.split_full_path(full_path),
                Some((field, remaining_path))
            );
        }

        for unresolved_path in ["third", "hello.toto", "", "firsty"] {
            assert_eq!(query_parser.split_full_path(unresolved_path), None);
        }
    }

    /// The `~N` suffix after a phrase sets its slop; `~` inside the quotes is plain text.
    #[test]
    pub fn test_phrase_slop() {
        let cases = [
            (
                "\"a b\"~0",
                r#"("[(0, Term(field=0, type=Str, "a")), (1, Term(field=0, type=Str, "b"))]" "[(0, Term(field=1, type=Str, "a")), (1, Term(field=1, type=Str, "b"))]")"#,
            ),
            (
                "\"a b\"~2",
                r#"("[(0, Term(field=0, type=Str, "a")), (1, Term(field=0, type=Str, "b"))]"~2 "[(0, Term(field=1, type=Str, "a")), (1, Term(field=1, type=Str, "b"))]"~2)"#,
            ),
            (
                "title:\"a b~4\"~2",
                r#""[(0, Term(field=0, type=Str, "a")), (1, Term(field=0, type=Str, "b")), (2, Term(field=0, type=Str, "4"))]"~2"#,
            ),
        ];
        for (query, expected_ast) in cases {
            test_parse_query_to_logical_ast_helper(query, expected_ast, false);
        }
    }

    /// A phrase followed by `*` becomes a phrase-prefix query on every default field.
    #[test]
    pub fn test_phrase_prefix() {
        let query = "\"big bad wo\"*";
        let expected_ast = r#"("[(0, Term(field=0, type=Str, "big")), (1, Term(field=0, type=Str, "bad")), (2, Term(field=0, type=Str, "wo"))]"* "[(0, Term(field=1, type=Str, "big")), (1, Term(field=1, type=Str, "bad")), (2, Term(field=1, type=Str, "wo"))]"*)"#;
        test_parse_query_to_logical_ast_helper(query, expected_ast, false);

        let parsed = make_query_parser().parse_query(query).unwrap();
        let rendered = format!("{parsed:?}");
        assert_eq!(
            rendered,
            "BooleanQuery { subqueries: [(Should, PhrasePrefixQuery { field: Field(0), \
             phrase_terms: [(0, Term(field=0, type=Str, \"big\")), (1, Term(field=0, type=Str, \
             \"bad\"))], prefix: (2, Term(field=0, type=Str, \"wo\")), max_expansions: 50 }), \
             (Should, PhrasePrefixQuery { field: Field(1), phrase_terms: [(0, Term(field=1, \
             type=Str, \"big\")), (1, Term(field=1, type=Str, \"bad\"))], prefix: (2, \
             Term(field=1, type=Str, \"wo\")), max_expansions: 50 })], \
             minimum_number_should_match: 1 }"
        );
    }

    /// A phrase-prefix with fewer than two terms is rejected, reporting phrase and tokenizer.
    #[test]
    pub fn test_phrase_prefix_too_short() {
        // (query, phrase reported in the error)
        let cases = [("\"wo\"*", "wo"), ("\"\"*", "")];
        for (query, reported_phrase) in cases {
            let err = parse_query_to_logical_ast(query, true).unwrap_err();
            assert_eq!(
                err,
                QueryParserError::PhrasePrefixRequiresAtLeastTwoTerms {
                    phrase: reported_phrase.to_owned(),
                    tokenizer: "default".to_owned()
                }
            );
        }
    }

    /// `field: IN [..]` builds a term set, converting each value to the field's type.
    #[test]
    pub fn test_term_set_query() {
        let cases = [
            (
                "title: IN [a b cd]",
                r#"IN [Term(field=0, type=Str, "a"), Term(field=0, type=Str, "b"), Term(field=0, type=Str, "cd")]"#,
            ),
            (
                "bytes: IN [AA== ABA= ABCD]",
                r#"IN [Term(field=12, type=Bytes, [0]), Term(field=12, type=Bytes, [0, 16]), Term(field=12, type=Bytes, [0, 16, 131])]"#,
            ),
            (
                "signed: IN [1 2 -3]",
                r#"IN [Term(field=2, type=I64, 1), Term(field=2, type=I64, 2), Term(field=2, type=I64, -3)]"#,
            ),
            (
                "float: IN [1.1 2.2 -3.3]",
                r#"IN [Term(field=10, type=F64, 1.1), Term(field=10, type=F64, 2.2), Term(field=10, type=F64, -3.3)]"#,
            ),
        ];
        for (query, expected_ast) in cases {
            test_parse_query_to_logical_ast_helper(query, expected_ast, false);
        }
    }

    /// Enabling fuzzy matching on one default field turns only that field's term query into
    /// a `FuzzyTermQuery` carrying the configured settings.
    #[test]
    pub fn test_set_field_fuzzy() {
        // Fuzzy on `title`.
        {
            let mut parser = make_query_parser();
            let title_field = parser.schema.get_field("title").unwrap();
            parser.set_field_fuzzy(title_field, false, 1, true);
            let parsed = parser.parse_query("abc").unwrap();
            let rendered = format!("{parsed:?}");
            assert_eq!(
                rendered,
                "BooleanQuery { subqueries: [(Should, FuzzyTermQuery { term: Term(field=0, \
                 type=Str, \"abc\"), distance: 1, transposition_cost_one: true, prefix: false }), \
                 (Should, TermQuery(Term(field=1, type=Str, \"abc\")))], \
                 minimum_number_should_match: 1 }"
            );
        }

        // Fuzzy on `text`.
        {
            let mut parser = make_query_parser();
            let text_field = parser.schema.get_field("text").unwrap();
            parser.set_field_fuzzy(text_field, true, 2, false);
            let parsed = parser.parse_query("abc").unwrap();
            let rendered = format!("{parsed:?}");
            assert_eq!(
                rendered,
                "BooleanQuery { subqueries: [(Should, TermQuery(Term(field=0, type=Str, \
                 \"abc\"))), (Should, FuzzyTermQuery { term: Term(field=1, type=Str, \"abc\"), \
                 distance: 2, transposition_cost_one: false, prefix: true })], \
                 minimum_number_should_match: 1 }"
            );
        }
    }

    /// With a text and an integer default field, a non-numeric word only targets the text
    /// field; with the integer field alone it is an `ExpectedInt` error.
    #[test]
    pub fn test_set_default_field_integer() {
        let cases = [
            (
                "2324",
                "(Term(field=0, type=Str, \"2324\") Term(field=2, type=I64, 2324))",
            ),
            ("abc", "Term(field=0, type=Str, \"abc\")"),
        ];
        for (query, expected_ast) in cases {
            test_parse_query_to_logical_ast_helper_with_default_fields(
                query,
                expected_ast,
                false,
                &["title", "signed"],
            );
        }

        let signed_only_parser = make_query_parser_with_default_fields(&["signed"]);
        let parse_result = signed_only_parser.parse_query("abc");
        assert_matches!(parse_result, Err(QueryParserError::ExpectedInt(_)));
    }

    /// A word repeated in the query appears only once per default field in the AST.
    #[test]
    pub fn test_deduplication() {
        let expected_ast = "(Term(field=0, type=Str, \"be\") Term(field=1, type=Str, \"be\"))";
        test_parse_query_to_logical_ast_helper("be be", expected_ast, false);
    }

    /// Regex literals (`/.../`): accepted on a text field, rejected on non-text fields,
    /// without a field, on a sub-path, when malformed, and when regexes are disabled.
    #[test]
    pub fn test_regex() {
        let regex_b = tantivy_fst::Regex::new(r".*b").unwrap();
        let regex_a = tantivy_fst::Regex::new(r".*a").unwrap();

        let single_expected = format!("Regex(Field(0), {regex_b:#?})");
        test_parse_query_to_logical_ast_helper("title:/.*b/", &single_expected, false);

        let union_expected = format!("(Regex(Field(0), {regex_b:#?}) Regex(Field(0), {regex_a:#?}))");
        test_parse_query_to_logical_ast_helper("title:(/.*b/ OR /.*a/)", &union_expected, false);

        // (query, expected error message)
        let rejected = [
            // Invalid field
            (
                "float:/.*b/",
                "Unsupported query: Regex query only supported on text fields",
            ),
            // No field specified
            (
                "/.*b/",
                "Unsupported query: Regex query need to target a specific field.",
            ),
            // Regex on a json path
            (
                "title.subpath:/.*b/",
                "Unsupported query: Regex query does not support json paths.",
            ),
            // Invalid regex
            (
                "title:/[A-Z*b/",
                "Unsupported query: Invalid regex: regex parse error:\n    [A-Z*b\n    ^\nerror: \
                 unclosed character class",
            ),
        ];
        for (query, expected_message) in rejected {
            let err = parse_query_to_logical_ast(query, false).unwrap_err();
            assert_eq!(err.to_string(), expected_message);
        }

        // Regexes not allowed
        let disallowed_err = parse_query_to_logical_ast_with_default_fields(
            "title:/.*b/",
            false,
            &["title", "text"],
            false,
        )
        .unwrap_err();
        assert_eq!(
            disallowed_err.to_string(),
            "Unsupported query: Regex queries are not allowed."
        );
    }
}


================================================
FILE: src/query/range_query/fast_field_range_doc_set.rs
================================================
use core::fmt::Debug;
use std::ops::RangeInclusive;

use columnar::Column;

use crate::{DocId, DocSet, TERMINATED};

/// A read cursor over a reusable buffer of doc ids.
#[derive(Debug)]
struct VecCursor {
    /// Doc ids of the current batch.
    docs: Vec<u32>,
    /// Index into `docs` of the element the cursor points at.
    current_pos: usize,
}

impl VecCursor {
    /// Creates an empty cursor whose buffer has room for 32 doc ids.
    fn new() -> Self {
        let docs = Vec::with_capacity(32);
        Self {
            docs,
            current_pos: 0,
        }
    }

    /// Moves one position forward and returns the doc id found there, or `None` when the
    /// cursor is past the last element.
    fn next(&mut self) -> Option<u32> {
        self.current_pos += 1;
        self.current()
    }

    /// Returns the doc id under the cursor, or `None` when the cursor is past the end.
    #[inline]
    fn current(&self) -> Option<u32> {
        let doc = self.docs.get(self.current_pos)?;
        Some(*doc)
    }

    /// Empties the buffer, rewinds the cursor and hands out the buffer for refilling.
    fn get_cleared_data(&mut self) -> &mut Vec<u32> {
        self.current_pos = 0;
        self.docs.clear();
        &mut self.docs
    }

    /// Returns the last doc id in the buffer, regardless of the cursor position.
    fn last_doc(&self) -> Option<u32> {
        self.docs.last().copied()
    }

    /// Returns true when no element is left at or after the cursor position.
    fn is_empty(&self) -> bool {
        self.current_pos >= self.docs.len()
    }
}

/// State for walking the docs of a column whose values fall inside `value_range`.
///
/// Docs are checked in batches; the matching ones of the current batch are kept in
/// `loaded_docs`.
pub(crate) struct RangeDocSet<T> {
    /// The range filter on the values.
    value_range: RangeInclusive<T>,
    /// The column whose values are tested against `value_range`.
    column: Column<T>,
    /// The next docid start range to fetch (inclusive).
    next_fetch_start: u32,
    /// Number of docs range checked in a batch.
    ///
    /// There are two patterns.
    /// - We do a full scan. => We can load large chunks. We don't know in advance whether a
    ///   seek call will come, so we start with small chunks.
    /// - We load docs, interspersed with seek calls. When there are big jumps in the seek, we
    ///   should load small chunks. When the seeks are small, we can employ the same strategy as
    ///   on a full scan.
    fetch_horizon: u32,
    /// Current batch of loaded docs.
    loaded_docs: VecCursor,
    /// Position of the previous seek, if any; read by `is_last_seek_distance_large`.
    /// NOTE(review): presumably updated on every seek — the code that sets it is not shown
    /// here.
    last_seek_pos_opt: Option<u32>,
}

const DEFAULT_FETCH_HORIZON: u32 = 128;
impl<T: Send + Sync + PartialOrd + Copy + Debug + 'static> RangeDocSet<T> {
    /// Creates a docset over the docs of `column` whose value lies within `value_range`.
    ///
    /// When `value_range` starts above the column's max value or ends below its min value,
    /// nothing is fetched and the docset starts out terminated. Otherwise the first batch of
    /// matching docs is loaded right away.
    pub(crate) fn new(value_range: RangeInclusive<T>, column: Column<T>) -> Self {
        let no_overlap =
            *value_range.start() > column.max_value() || *value_range.end() < column.min_value();
        let mut range_docset = Self {
            value_range,
            column,
            next_fetch_start: if no_overlap { TERMINATED } else { 0 },
            fetch_horizon: DEFAULT_FETCH_HORIZON,
            loaded_docs: VecCursor::new(),
            last_seek_pos_opt: None,
        };
        if no_overlap {
            return range_docset;
        }
        range_docset.reset_fetch_range();
        range_docset.fetch_block();
        range_docset
    }

    /// Shrinks the fetch horizon back to its default size.
    fn reset_fetch_range(&mut self) {
        self.fetch_horizon = DEFAULT_FETCH_HORIZON;
    }

    /// Loads windows of the column until the current batch holds at least one doc or the end
    /// of the column has been reached.
    ///
    /// Does nothing if the fetch position is already at or past the end of the column.
    fn fetch_block(&mut self) {
        const MAX_HORIZON: u32 = 100_000;
        if self.next_fetch_start >= self.column.num_docs() {
            return;
        }
        while self.loaded_docs.is_empty() {
            let reached_end = self.fetch_horizon(self.fetch_horizon);
            if reached_end {
                break;
            }
            // The window came back empty: widen the horizon for the next attempt. The horizon
            // only shrinks again through `reset_fetch_range`.
            self.fetch_horizon = (self.fetch_horizon * 2).min(MAX_HORIZON);
        }
    }

    /// Returns `true` if `new_seek` is at least 128 docs away from the previous seek target,
    /// or if there was no previous seek.
    fn is_last_seek_distance_large(&self, new_seek: DocId) -> bool {
        match self.last_seek_pos_opt {
            Some(last_seek_pos) => (new_seek - last_seek_pos) >= 128,
            None => true,
        }
    }

    /// Replaces the current batch with the matching docs of the window
    /// `next_fetch_start..next_fetch_start + horizon`, clamped to the number of docs of the
    /// column, and moves `next_fetch_start` to the end of that window.
    ///
    /// Returns `true` if the window reached the end of the column.
    fn fetch_horizon(&mut self, horizon: u32) -> bool {
        let num_docs = self.column.num_docs();
        let requested_end = self.next_fetch_start + horizon;
        let finished_to_end = requested_end >= num_docs;
        let fetch_end = if finished_to_end {
            num_docs
        } else {
            requested_end
        };

        // Remember the tail of the previous batch before the buffer gets recycled.
        let previous_last_doc = self.loaded_docs.last_doc();
        let doc_buffer: &mut Vec<DocId> = self.loaded_docs.get_cleared_data();
        self.column.get_docids_for_value_range(
            self.value_range.clone(),
            self.next_fetch_start..fetch_end,
            doc_buffer,
        );
        // Skip leading docs equal to the last doc of the previous batch.
        // NOTE(review): presumably this avoids emitting the same doc twice across batch
        // boundaries; confirm against `get_docids_for_value_range`.
        if let Some(previous_last_doc) = previous_last_doc {
            while self.loaded_docs.current() == Some(previous_last_doc) {
                self.loaded_docs.next();
            }
        }
        self.next_fetch_start = fetch_end;

        finished_to_end
    }
}

impl<T: Send + Sync + PartialOrd + Copy + Debug + 'static> DocSet for RangeDocSet<T> {
    /// Moves to the next matching doc, fetching a new batch when the current one is used up.
    ///
    /// Returns [`TERMINATED`] if no doc is left.
    #[inline]
    fn advance(&mut self) -> DocId {
        match self.loaded_docs.next() {
            Some(docid) => docid,
            None => {
                self.fetch_block();
                self.doc()
            }
        }
    }

    /// Returns the current doc, or [`TERMINATED`] if the current batch holds no doc under the
    /// cursor.
    #[inline]
    fn doc(&self) -> DocId {
        self.loaded_docs.current().unwrap_or(TERMINATED)
    }

    /// Advances the `DocSet` forward until reaching the target, or going to the
    /// lowest [`DocId`] greater than the target.
    ///
    /// If the end of the `DocSet` is reached, [`TERMINATED`] is returned.
    ///
    /// Calling `.seek(target)` on a terminated `DocSet` is legal. Implementation
    /// of `DocSet` should support it.
    ///
    /// Calling `seek(TERMINATED)` is also legal and is the normal way to consume a `DocSet`.
    fn seek(&mut self, target: DocId) -> DocId {
        // A big jump since the previous seek: go back to small fetch windows.
        if self.is_last_seek_distance_large(target) {
            self.reset_fetch_range();
        }
        // Future fetches never need to start before the target.
        self.next_fetch_start = self.next_fetch_start.max(target);

        let mut current = self.doc();
        debug_assert!(current <= target);
        while current < target {
            current = self.advance();
        }
        self.last_seek_pos_opt = Some(target);
        current
    }

    /// Rough estimate: a tenth of the docs of the column.
    fn size_hint(&self) -> u32 {
        // TODO: Implement a better size hint
        let num_docs = self.column.num_docs();
        num_docs / 10
    }

    /// Returns a best-effort hint of the
    /// cost to drive the docset.
    fn cost(&self) -> u64 {
        // Driving this docset is expensive: there is currently no index, so the whole column
        // gets scanned (this will change with a kd-tree). The scan uses SIMD though, so the
        // cost is lowered a bit, assuming that 10% of the docs are hit like in `size_hint`.
        //
        // Returning a cost above `num_docs` would mean that the fast field range query never
        // gets picked as the driver when intersected with a term query. Yet it is the faster
        // choice when the term query matches a lot of docs and the range query does not.
        //
        // Ideally this would take the fast field codec into account.
        let num_docs = f64::from(self.column.num_docs());
        (num_docs * 0.8) as u64
    }
}

#[cfg(test)]
mod tests {
    use std::ops::Bound;

    use crate::collector::Count;
    use crate::directory::RamDirectory;
    use crate::query::RangeQuery;
    use crate::{schema, IndexBuilder, TantivyDocument, Term};

    /// A range query with only a lower bound on an optional fast field must match exactly the
    /// docs that carry a value.
    #[test]
    fn range_query_fast_optional_field_minimum() {
        let mut schema_builder = schema::SchemaBuilder::new();
        let id_field = schema_builder.add_text_field("id", schema::STRING);
        let score_field = schema_builder.add_u64_field("score", schema::FAST | schema::INDEXED);

        let index = IndexBuilder::new()
            .schema(schema_builder.build())
            .open_or_create(RamDirectory::default())
            .unwrap();

        {
            let mut writer = index.writer(15_000_000).unwrap();
            for i in 0..1000 {
                let mut doc = TantivyDocument::new();
                doc.add_text(id_field, format!("doc{i}"));
                // Odd docs get one score, even docs get none.
                if i % 2 == 1 {
                    doc.add_u64(score_field, 80);
                }
                writer.add_document(doc).unwrap();
            }
            writer.commit().unwrap();
        }

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();

        let at_least_70 = RangeQuery::new(
            Bound::Included(Term::from_field_u64(score_field, 70)),
            Bound::Unbounded,
        );
        let num_hits = searcher.search(&at_least_70, &Count).unwrap();
        assert_eq!(num_hits, 500);
    }

    /// Range queries that cannot overlap the values stored in the column must not match any
    /// doc.
    #[test]
    fn range_query_no_overlap_optimization() {
        let mut schema_builder = schema::SchemaBuilder::new();
        let id_field = schema_builder.add_text_field("id", schema::STRING);
        let value_field = schema_builder.add_u64_field("value", schema::FAST | schema::INDEXED);

        let index = IndexBuilder::new()
            .schema(schema_builder.build())
            .open_or_create(RamDirectory::default())
            .unwrap();

        {
            let mut writer = index.writer(15_000_000).unwrap();
            // All indexed values fall within [10, 20].
            for i in 0..100 {
                let mut doc = TantivyDocument::new();
                doc.add_text(id_field, format!("doc{i}"));
                doc.add_u64(value_field, 10 + (i % 11) as u64);
                writer.add_document(doc).unwrap();
            }
            writer.commit().unwrap();
        }

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let count_in_range = |lower: u64, upper: u64| {
            let query = RangeQuery::new(
                Bound::Included(Term::from_field_u64(value_field, lower)),
                Bound::Included(Term::from_field_u64(value_field, upper)),
            );
            searcher.search(&query, &Count).unwrap()
        };

        // [100, 200] lies entirely above the data range [10, 20].
        assert_eq!(count_in_range(100, 200), 0);
        // [0, 5] lies entirely below the data range [10, 20].
        assert_eq!(count_in_range(0, 5), 0);
    }
}


================================================
FILE: src/query/range_query/mod.rs
================================================
use crate::schema::Type;

mod fast_field_range_doc_set;
mod range_query;
mod range_query_fastfield;

pub use common::bounds::BoundsRange;

pub use self::range_query::*;
pub use self::range_query_fastfield::*;

/// Tells whether a fast field range query may be used for values of type `typ`.
///
/// Every type but `Type::Facet` is accepted.
pub(crate) fn is_type_valid_for_fastfield_range_query(typ: Type) -> bool {
    // TODO is this correct?
    //
    // The match is kept exhaustive on purpose: a new `Type` variant has to be classified here.
    match typ {
        Type::Facet => false,
        Type::Str
        | Type::U64
        | Type::I64
        | Type::F64
        | Type::Bool
        | Type::Date
        | Type::Json
        | Type::IpAddr
        | Type::Bytes => true,
    }
}


================================================
FILE: src/query/range_query/range_query.rs
================================================
use std::io;
use std::ops::Bound;

use common::bounds::{map_bound, BoundsRange};
use common::BitSet;

use super::range_query_fastfield::FastFieldRangeWeight;
use crate::index::SegmentReader;
use crate::query::explanation::does_not_match;
use crate::query::range_query::is_type_valid_for_fastfield_range_query;
use crate::query::{BitSetDocSet, ConstScorer, EnableScoring, Explanation, Query, Scorer, Weight};
use crate::schema::{Field, IndexRecordOption, Term, Type};
use crate::termdict::{TermDictionary, TermStreamer};
use crate::{DocId, Score};

/// `RangeQuery` matches all documents that have at least one term within a defined range.
///
/// Matched documents all get a constant `Score` of one.
///
/// # Implementation
///
/// ## Default
/// The default implementation collects all documents _upfront_ into a `BitSet`.
/// This is done by iterating over the terms within the range, loading all docs for each
/// `TermInfo` from the inverted index (posting list) and putting them into a `BitSet`.
/// Depending on the number of terms matched, this is a potentially expensive operation.
///
/// ## Fast field
/// For fast fields of a supported type a custom variant is used, which scans the fast field.
/// Unlike the default variant we can walk over it in a lazy fashion, since the fast field is
/// implicitly ordered by DocId.
///
///
/// # Example
///
/// ```rust
/// use tantivy::collector::Count;
/// use tantivy::query::RangeQuery;
/// use tantivy::Term;
/// use tantivy::schema::{Schema, INDEXED};
/// use tantivy::{doc, Index, IndexWriter};
/// use std::ops::Bound;
/// # fn test() -> tantivy::Result<()> {
/// let mut schema_builder = Schema::builder();
/// let year_field = schema_builder.add_u64_field("year", INDEXED);
/// let schema = schema_builder.build();
///
/// let index = Index::create_in_ram(schema);
/// let mut index_writer: IndexWriter = index.writer_with_num_threads(1, 20_000_000)?;
/// for year in 1950u64..2017u64 {
///     let num_docs_within_year = 10 + (year - 1950) * (year - 1950);
///     for _ in 0..num_docs_within_year {
///       index_writer.add_document(doc!(year_field => year))?;
///     }
/// }
/// index_writer.commit()?;
///
/// let reader = index.reader()?;
/// let searcher = reader.searcher();
/// let docs_in_the_sixties = RangeQuery::new(
///     Bound::Included(Term::from_field_u64(year_field, 1960)),
///     Bound::Excluded(Term::from_field_u64(year_field, 1970)),
/// );
/// let num_60s_books = searcher.search(&docs_in_the_sixties, &Count)?;
/// assert_eq!(num_60s_books, 2285);
/// Ok(())
/// # }
/// # assert!(test().is_ok());
/// ```
#[derive(Clone, Debug)]
pub struct RangeQuery {
    /// Lower and upper bound terms of the range.
    bounds: BoundsRange<Term>,
}

impl RangeQuery {
    /// Creates a new `RangeQuery` from bounded start and end terms.
    ///
    /// If the value type is not correct, something may go terribly wrong when
    /// the `Weight` object is created.
    pub fn new(lower_bound: Bound<Term>, upper_bound: Bound<Term>) -> RangeQuery {
        let bounds = BoundsRange::new(lower_bound, upper_bound);
        Self { bounds }
    }

    /// Field to search over
    ///
    /// # Panics
    ///
    /// Panics if neither bound holds a term.
    pub fn field(&self) -> Field {
        let term = self.get_term();
        term.field()
    }

    /// The value type of the field
    ///
    /// # Panics
    ///
    /// Panics if neither bound holds a term.
    pub fn value_type(&self) -> Type {
        let term = self.get_term();
        term.typ()
    }

    /// Returns the term held by one of the bounds.
    ///
    /// # Panics
    ///
    /// Panics if neither bound holds a term.
    pub(crate) fn get_term(&self) -> &Term {
        let bound_term = self.bounds.get_inner();
        bound_term.expect("At least one bound must be set")
    }
}

impl Query for RangeQuery {
    /// Builds the weight of the query.
    ///
    /// A fast field whose value type is supported gets a [`FastFieldRangeWeight`]. Any other
    /// field falls back to an [`InvertedIndexRangeWeight`] without term limit, except JSON
    /// fields, for which an `InvalidArgument` error is returned.
    fn weight(&self, enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let schema = enable_scoring.schema();
        let field_type = schema.get_field_entry(self.field()).field_type();

        let use_fast_field =
            field_type.is_fast() && is_type_valid_for_fastfield_range_query(self.value_type());
        if use_fast_field {
            return Ok(Box::new(FastFieldRangeWeight::new(self.bounds.clone())));
        }

        if field_type.is_json() {
            return Err(crate::TantivyError::InvalidArgument(
                "RangeQuery on JSON is only supported for fast fields currently".to_string(),
            ));
        }

        let weight = InvertedIndexRangeWeight::new(
            self.field(),
            &self.bounds.lower_bound,
            &self.bounds.upper_bound,
            None,
        );
        Ok(Box::new(weight))
    }
}

/// `InvertedIndexRangeQuery` is the same as [RangeQuery] but only uses the inverted index
#[derive(Clone, Debug)]
pub struct InvertedIndexRangeQuery {
    /// Lower and upper bound terms of the range.
    bounds: BoundsRange<Term>,
    /// Maximum number of terms to go through, if any.
    limit: Option<u64>,
}

impl InvertedIndexRangeQuery {
    /// Create new `InvertedIndexRangeQuery`
    ///
    /// The query starts out without any limit on the number of terms.
    pub fn new(lower_bound: Bound<Term>, upper_bound: Bound<Term>) -> InvertedIndexRangeQuery {
        let bounds = BoundsRange::new(lower_bound, upper_bound);
        Self {
            bounds,
            limit: None,
        }
    }

    /// Limit the number of term the `RangeQuery` will go through.
    ///
    /// This does not limit the number of matching document, only the number of
    /// different terms that get matched.
    pub fn limit(&mut self, limit: u64) {
        let new_limit = Some(limit);
        self.limit = new_limit;
    }
}

impl Query for InvertedIndexRangeQuery {
    /// Builds an [`InvertedIndexRangeWeight`] over the field of the bound terms, carrying over
    /// the term limit of the query.
    ///
    /// # Panics
    ///
    /// Panics if neither bound holds a term.
    fn weight(&self, _enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let bound_term = self
            .bounds
            .get_inner()
            .expect("At least one bound must be set");

        let weight = InvertedIndexRangeWeight::new(
            bound_term.field(),
            &self.bounds.lower_bound,
            &self.bounds.upper_bound,
            self.limit,
        );
        Ok(Box::new(weight))
    }
}

/// Range weight on the inverted index
pub struct InvertedIndexRangeWeight {
    /// Field whose inverted index is searched.
    field: Field,
    /// Lower bound, as the serialized value bytes of the bound term.
    lower_bound: Bound<Vec<u8>>,
    /// Upper bound, as the serialized value bytes of the bound term.
    upper_bound: Bound<Vec<u8>>,
    /// Maximum number of terms to go through, if any.
    limit: Option<u64>,
}

impl InvertedIndexRangeWeight {
    /// Creates a new RangeWeight
    ///
    /// Only the serialized value bytes of the bound terms are retained.
    ///
    /// Note: The limit is only handed to the term stream with the quickwit feature flag. The
    /// scorer of this weight additionally stops after `limit` terms on its own.
    pub fn new(
        field: Field,
        lower_bound: &Bound<Term>,
        upper_bound: &Bound<Term>,
        limit: Option<u64>,
    ) -> Self {
        let to_value_bytes = |term: &Term| term.serialized_value_bytes().to_owned();
        let lower_bound = map_bound(lower_bound, to_value_bytes);
        let upper_bound = map_bound(upper_bound, to_value_bytes);
        Self {
            field,
            lower_bound,
            upper_bound,
            limit,
        }
    }

    /// Opens a stream over the terms of `term_dict` that lie within the bounds of this weight.
    fn term_range<'a>(&self, term_dict: &'a TermDictionary) -> io::Result<TermStreamer<'a>> {
        let builder = term_dict.range();
        let builder = match &self.lower_bound {
            Bound::Included(term_val) => builder.ge(term_val),
            Bound::Excluded(term_val) => builder.gt(term_val),
            Bound::Unbounded => builder,
        };
        let builder = match &self.upper_bound {
            Bound::Included(term_val) => builder.le(term_val),
            Bound::Excluded(term_val) => builder.lt(term_val),
            Bound::Unbounded => builder,
        };
        #[cfg(feature = "quickwit")]
        let builder = match self.limit {
            Some(limit) => builder.limit(limit),
            None => builder,
        };
        builder.into_stream()
    }
}

impl Weight for InvertedIndexRangeWeight {
    /// Collects upfront, into a bitset, the docs of every term within the range, and returns
    /// a constant scorer over that bitset.
    ///
    /// If a limit is set, at most `limit` terms are visited.
    fn scorer(&self, reader: &SegmentReader, boost: Score) -> crate::Result<Box<dyn Scorer>> {
        let mut matching_docs = BitSet::with_max_value(reader.max_doc());

        let inverted_index = reader.inverted_index(self.field)?;
        let mut term_stream = self.term_range(inverted_index.terms())?;
        let mut num_terms_visited = 0;
        while term_stream.advance() {
            let limit_reached =
                matches!(self.limit, Some(limit) if limit <= num_terms_visited);
            if limit_reached {
                break;
            }
            num_terms_visited += 1;

            let mut postings = inverted_index
                .read_block_postings_from_terminfo(term_stream.value(), IndexRecordOption::Basic)?;
            // An empty block marks the end of the posting list.
            while !postings.docs().is_empty() {
                for &doc in postings.docs() {
                    matching_docs.insert(doc);
                }
                postings.advance();
            }
        }

        let docset = BitSetDocSet::from(matching_docs);
        Ok(Box::new(ConstScorer::new(docset, boost)))
    }

    /// Explains the match of `doc`, or returns an error if `doc` does not match.
    fn explain(&self, reader: &SegmentReader, doc: DocId) -> crate::Result<Explanation> {
        let mut scorer = self.scorer(reader, 1.0)?;
        if scorer.seek(doc) == doc {
            Ok(Explanation::new("RangeQuery", 1.0))
        } else {
            Err(does_not_match(doc))
        }
    }
}

#[cfg(test)]
mod tests {

    use std::net::IpAddr;
    use std::ops::Bound;
    use std::str::FromStr;

    use rand::seq::SliceRandom;

    use super::RangeQuery;
    use crate::collector::{Count, TopDocs};
    use crate::indexer::NoMergePolicy;
    use crate::query::range_query::fast_field_range_doc_set::RangeDocSet;
    use crate::query::range_query::range_query::InvertedIndexRangeQuery;
    use crate::query::{AllScorer, ConstScorer, EmptyScorer, EnableScoring, Query, QueryParser};
    use crate::schema::{
        Field, IntoIpv6Addr, Schema, TantivyDocument, FAST, INDEXED, STORED, TEXT,
    };
    use crate::{Index, IndexWriter, Term};

    /// Counts the docs of the sixties with a range query on the inverted index.
    #[test]
    fn test_range_query_simple() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let year_field = schema_builder.add_u64_field("year", INDEXED);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut index_writer = index.writer_for_tests()?;
            for year in 1950u64..2017u64 {
                // The number of docs grows quadratically with the distance to 1950.
                let years_since_1950 = year - 1950;
                let num_docs_within_year = 10 + years_since_1950 * years_since_1950;
                for _ in 0..num_docs_within_year {
                    index_writer.add_document(doc!(year_field => year))?;
                }
            }
            index_writer.commit()?;
        }
        let reader = index.reader()?;
        let searcher = reader.searcher();

        // ... or `1960..=1969` if inclusive range is enabled.
        let lower_bound = Bound::Included(Term::from_field_u64(year_field, 1960));
        let upper_bound = Bound::Excluded(Term::from_field_u64(year_field, 1970));
        let docs_in_the_sixties = InvertedIndexRangeQuery::new(lower_bound, upper_bound);

        let num_docs_in_the_sixties = searcher.search(&docs_in_the_sixties, &Count)?;
        assert_eq!(num_docs_in_the_sixties, 2285);
        Ok(())
    }

    /// Checks that the term limit caps the number of distinct terms visited by the query.
    #[test]
    fn test_range_query_with_limit() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let year_field = schema_builder.add_u64_field("year", INDEXED);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut index_writer = index.writer_for_tests()?;
            // No doc is indexed for 1963.
            for year in (1950u64..2017u64).filter(|&year| year != 1963) {
                let years_since_1950 = year - 1950;
                let num_docs_within_year = 10 + years_since_1950 * years_since_1950;
                for _ in 0..num_docs_within_year {
                    index_writer.add_document(doc!(year_field => year))?;
                }
            }
            index_writer.commit()?;
        }
        let reader = index.reader()?;
        let searcher = reader.searcher();

        let lower_bound = Bound::Included(Term::from_field_u64(year_field, 1960));
        let upper_bound = Bound::Excluded(Term::from_field_u64(year_field, 1970));
        let mut docs_in_the_sixties = InvertedIndexRangeQuery::new(lower_bound, upper_bound);
        docs_in_the_sixties.limit(5);

        // due to the limit and no docs in 1963, it's really only 1960..=1965
        let num_docs = searcher.search(&docs_in_the_sixties, &Count)?;
        assert_eq!(num_docs, 836);
        Ok(())
    }

    /// Range queries on a multivalued i64 field, over two segments.
    ///
    /// Doc `i` (for `i` in `1..100`) holds every divisor of `i` as a value.
    #[test]
    fn test_range_query() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let int_field: Field = schema_builder.add_i64_field("intfield", INDEXED);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut index_writer = index.writer_with_num_threads(1, 60_000_000)?;
            index_writer.set_merge_policy(Box::new(NoMergePolicy));

            for i in 1..100 {
                let mut doc = TantivyDocument::new();
                for j in 1..100 {
                    if i % j == 0 {
                        doc.add_i64(int_field, j as i64);
                    }
                }
                index_writer.add_document(doc)?;
                // Committing here closes the first segment after the first ten docs.
                if i == 10 {
                    index_writer.commit()?;
                }
            }

            index_writer.commit()?;
        }
        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        assert_eq!(searcher.segment_readers().len(), 2);

        let count_multiples =
            |range_query: RangeQuery| searcher.search(&range_query, &Count).unwrap();
        let term = |value: i64| Term::from_field_i64(int_field, value);

        let cases = vec![
            (Bound::Included(term(10)), Bound::Excluded(term(11)), 9),
            (Bound::Included(term(10)), Bound::Included(term(11)), 18),
            (Bound::Excluded(term(9)), Bound::Included(term(10)), 9),
            (Bound::Included(term(9)), Bound::Unbounded, 91),
        ];
        for (lower_bound, upper_bound, expected_count) in cases {
            assert_eq!(
                count_multiples(RangeQuery::new(lower_bound, upper_bound)),
                expected_count
            );
        }
        Ok(())
    }

    /// Range queries on a multivalued f64 field, over two segments filled in random order.
    ///
    /// Doc `i` (for `i` in `1..100`) holds every divisor of `i` as a value.
    #[test]
    fn test_range_float() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let float_field: Field = schema_builder.add_f64_field("floatfield", INDEXED);
        let index = Index::create_in_ram(schema_builder.build());
        {
            let mut index_writer = index.writer_with_num_threads(1, 60_000_000).unwrap();
            let mut docs = Vec::new();
            for i in 1..100 {
                let mut doc = TantivyDocument::new();
                for j in 1..100 {
                    if i % j == 0 {
                        doc.add_f64(float_field, j as f64);
                    }
                }
                docs.push(doc);
            }
            docs.shuffle(&mut rand::rng());

            // The first 50 docs go into a first segment, the remaining ones into a second one.
            let mut remaining_docs = docs.into_iter();
            for doc in remaining_docs.by_ref().take(50) {
                index_writer.add_document(doc)?;
            }
            index_writer.commit()?;
            for doc in remaining_docs {
                index_writer.add_document(doc)?;
            }
            index_writer.commit()?;
        }
        let reader = index.reader()?;
        let searcher = reader.searcher();
        assert_eq!(searcher.segment_readers().len(), 2);

        let count_multiples =
            |range_query: RangeQuery| searcher.search(&range_query, &Count).unwrap();
        let term = |value: f64| Term::from_field_f64(float_field, value);

        let cases = vec![
            (Bound::Included(term(10.0)), Bound::Excluded(term(11.0)), 9),
            (Bound::Included(term(10.0)), Bound::Included(term(11.0)), 18),
            (Bound::Excluded(term(9.0)), Bound::Included(term(10.0)), 9),
            (Bound::Included(term(9.0)), Bound::Unbounded, 91),
        ];
        for (lower_bound, upper_bound, expected_count) in cases {
            assert_eq!(
                count_multiples(RangeQuery::new(lower_bound, upper_bound)),
                expected_count
            );
        }
        Ok(())
    }

    /// A parsed query intersecting a term with an inclusive range must match a doc whose
    /// value sits on the upper bound of the range.
    #[test]
    fn test_bug_reproduce_range_query() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("title", TEXT);
        schema_builder.add_i64_field("year", INDEXED);
        let schema = schema_builder.build();
        let title = schema.get_field("title").unwrap();
        let year = schema.get_field("year").unwrap();

        let index = Index::create_in_ram(schema.clone());
        let mut index_writer = index.writer_for_tests()?;
        index_writer.add_document(doc!(
          title => "hemoglobin blood",
          year => 1990_i64
        ))?;
        index_writer.commit()?;

        let reader = index.reader()?;
        let searcher = reader.searcher();
        let query = QueryParser::for_index(&index, vec![title])
            .parse_query("hemoglobin AND year:[1970 TO 1990]")?;
        let collector = TopDocs::with_limit(10).order_by_score();
        let top_docs = searcher.search(&query, &collector)?;
        assert_eq!(top_docs.len(), 1);
        Ok(())
    }

    /// Runs the IP range checks on a field that is indexed and stored, but not a fast field.
    #[test]
    fn search_ip_range_test_posting_list() {
        search_ip_range_test_opt(false);
    }

    /// Runs the IP range checks on a field that is also declared as a fast field.
    #[test]
    fn search_ip_range_test() {
        search_ip_range_test_opt(true);
    }

    /// Indexes 1000 docs with IP `127.0.0.10` and text `BLUBBER`, followed by 1000 docs with
    /// IP `127.0.0.20` and text `BLOBBER`, then checks the number of hits of a series of parsed
    /// range queries.
    fn search_ip_range_test_opt(with_fast_field: bool) {
        let mut schema_builder = Schema::builder();
        let ip_field = if with_fast_field {
            schema_builder.add_ip_addr_field("ip", INDEXED | STORED | FAST)
        } else {
            schema_builder.add_ip_addr_field("ip", INDEXED | STORED)
        };
        let text_field = schema_builder.add_text_field("text", TEXT | STORED);
        let index = Index::create_in_ram(schema_builder.build());
        let ip_addr_1 = IpAddr::from_str("127.0.0.10").unwrap().into_ipv6_addr();
        let ip_addr_2 = IpAddr::from_str("127.0.0.20").unwrap().into_ipv6_addr();

        {
            let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
            for _ in 0..1_000 {
                index_writer
                    .add_document(doc!(
                        ip_field => ip_addr_1,
                        text_field => "BLUBBER"
                    ))
                    .unwrap();
            }
            for _ in 0..1_000 {
                index_writer
                    .add_document(doc!(
                        ip_field => ip_addr_2,
                        text_field => "BLOBBER"
                    ))
                    .unwrap();
            }
            index_writer.commit().unwrap();
        }
        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        assert_eq!(searcher.segment_readers().len(), 1);

        let get_num_hits = |query| {
            let (_top_docs, count) = searcher
                .search(&query, &(TopDocs::with_limit(10).order_by_score(), Count))
                .unwrap();
            count
        };
        let query_from_text = |text: &str| {
            QueryParser::for_index(&index, vec![])
                .parse_query(text)
                .unwrap()
        };

        // Each case pairs a query with the number of hits it must yield.
        let cases: &[(&str, usize)] = &[
            // Inclusive range
            ("ip:[127.0.0.1 TO 127.0.0.20]", 2000),
            ("ip:[127.0.0.10 TO 127.0.0.20]", 2000),
            ("ip:[127.0.0.11 TO 127.0.0.20]", 1000),
            ("ip:[127.0.0.11 TO 127.0.0.19]", 0),
            ("ip:[127.0.0.11 TO *]", 1000),
            ("ip:[127.0.0.21 TO *]", 0),
            ("ip:[* TO 127.0.0.9]", 0),
            ("ip:[* TO 127.0.0.10]", 1000),
            // Exclusive range
            ("ip:{127.0.0.1 TO 127.0.0.20}", 1000),
            ("ip:{127.0.0.1 TO 127.0.0.21}", 2000),
            ("ip:{127.0.0.10 TO 127.0.0.20}", 0),
            ("ip:{127.0.0.11 TO 127.0.0.20}", 0),
            ("ip:{127.0.0.11 TO 127.0.0.19}", 0),
            ("ip:{127.0.0.11 TO *}", 1000),
            ("ip:{127.0.0.10 TO *}", 1000),
            ("ip:{127.0.0.21 TO *}", 0),
            ("ip:{127.0.0.20 TO *}", 0),
            ("ip:{127.0.0.19 TO *}", 1000),
            ("ip:{* TO 127.0.0.9}", 0),
            ("ip:{* TO 127.0.0.10}", 0),
            ("ip:{* TO 127.0.0.11}", 1000),
            // Inclusive/Exclusive range
            ("ip:[127.0.0.1 TO 127.0.0.20}", 1000),
            ("ip:{127.0.0.1 TO 127.0.0.20]", 2000),
            // Intersection
            ("text:BLUBBER AND ip:[127.0.0.10 TO 127.0.0.10]", 1000),
            ("text:BLOBBER AND ip:[127.0.0.10 TO 127.0.0.10]", 0),
            ("text:BLOBBER AND ip:[127.0.0.20 TO 127.0.0.20]", 1000),
            ("text:BLUBBER AND ip:[127.0.0.20 TO 127.0.0.20]", 0),
        ];
        for &(query_text, expected_num_hits) in cases {
            assert_eq!(
                get_num_hits(query_from_text(query_text)),
                expected_num_hits,
                "unexpected number of hits for query `{query_text}`"
            );
        }
    }

    /// Checks which kind of scorer a range query over a full fast field column ends up with.
    #[test]
    fn test_range_query_simplified() {
        // This test checks that if the targeted column values are entirely
        // within the range, and the column is full, we end up with a AllScorer.
        let mut schema_builder = Schema::builder();
        let u64_field = schema_builder.add_u64_field("u64_field", FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema.clone());
        let mut index_writer = index.writer_for_tests().unwrap();
        for value in [2u64, 4u64] {
            index_writer
                .add_document(doc!(u64_field=> value))
                .unwrap();
        }
        index_writer.commit().unwrap();
        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        assert_eq!(searcher.segment_readers().len(), 1);

        let make_term = |value: u64| Term::from_field_u64(u64_field, value);
        let make_scorer = move |lower_bound: Bound<u64>, upper_bound: Bound<u64>| {
            let range_query =
                RangeQuery::new(lower_bound.map(make_term), upper_bound.map(make_term));
            let range_weight = range_query
                .weight(EnableScoring::disabled_from_schema(&schema))
                .unwrap();
            range_weight
                .scorer(&searcher.segment_readers()[0], 1.0f32)
                .unwrap()
        };

        // The range covers all the values of the column.
        assert!(make_scorer(Bound::Included(1), Bound::Included(4)).is::<AllScorer>());
        // The range covers only part of the values, or lies above all of them.
        assert!(make_scorer(Bound::Included(0), Bound::Included(2))
            .is::<ConstScorer<RangeDocSet<u64>>>());
        assert!(make_scorer(Bound::Included(3), Bound::Included(10))
            .is::<ConstScorer<RangeDocSet<u64>>>());
        assert!(make_scorer(Bound::Included(10), Bound::Included(12))
            .is::<ConstScorer<RangeDocSet<u64>>>());
        // The range lies below all the values.
        assert!(make_scorer(Bound::Included(0), Bound::Included(1)).is::<EmptyScorer>());
        assert!(make_scorer(Bound::Included(0), Bound::Excluded(2)).is::<EmptyScorer>());
    }
}


================================================
FILE: src/query/range_query/range_query_fastfield.rs
================================================
//! Fastfields support efficient scanning for range queries.
//! We use this variant only if the fastfield exists, otherwise the default in `range_query` is
//! used, which uses the term dictionary + postings.

use std::net::Ipv6Addr;
use std::ops::{Bound, RangeInclusive};

use columnar::{
    BytesColumn, Cardinality, Column, ColumnType, MonotonicallyMappableToU128,
    MonotonicallyMappableToU64, NumericalType, StrColumn,
};
use common::bounds::{BoundsRange, TransformBound};

use super::fast_field_range_doc_set::RangeDocSet;
use crate::query::{
    AllScorer, ConstScorer, EmptyScorer, EnableScoring, Explanation, Query, Scorer, Weight,
};
use crate::schema::{Type, ValueBytes};
use crate::{DocId, DocSet, Score, SegmentReader, TantivyError, Term};

/// `FastFieldRangeQuery` behaves like [`RangeQuery`](crate::query::RangeQuery), except that it
/// only ever relies on the fast field to resolve the range.
#[derive(Clone, Debug)]
pub struct FastFieldRangeQuery {
    /// Lower and upper bound of the range, expressed as terms.
    bounds: BoundsRange<Term>,
}

impl FastFieldRangeQuery {
    /// Builds a `FastFieldRangeQuery` from a lower and an upper bound.
    pub fn new(lower_bound: Bound<Term>, upper_bound: Bound<Term>) -> FastFieldRangeQuery {
        let bounds = BoundsRange::new(lower_bound, upper_bound);
        FastFieldRangeQuery { bounds }
    }
}

impl Query for FastFieldRangeQuery {
    /// Creates the [`FastFieldRangeWeight`] for this query.
    ///
    /// The scoring configuration is not consulted: the weight is built from the bounds alone.
    fn weight(&self, _enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let weight = FastFieldRangeWeight::new(self.bounds.clone());
        Ok(Box::new(weight))
    }
}

/// Weight that executes a range query by scanning the fast field.
#[derive(Clone, Debug)]
pub struct FastFieldRangeWeight {
    /// Lower and upper bound of the range, expressed as terms.
    bounds: BoundsRange<Term>,
}

impl FastFieldRangeWeight {
    /// Wraps the given term bounds into a new `FastFieldRangeWeight`.
    pub fn new(bounds: BoundsRange<Term>) -> Self {
        FastFieldRangeWeight { bounds }
    }
}

impl Weight for FastFieldRangeWeight {
    /// Builds the scorer for one segment by scanning the fast field column(s) of the
    /// queried field.
    ///
    /// The strategy depends on the schema type of the field:
    /// - JSON: the value type stored in the term selects a string, numerical or date column.
    /// - IP address: the `Ipv6Addr` column is scanned directly.
    /// - Str / Bytes: the bounds are translated to term ordinals through the column
    ///   dictionary, then the ordinal column is scanned.
    /// - Everything else must map to a u64 fast field (see `maps_to_u64_fastfield`).
    ///
    /// Every match gets the constant score `boost`. A missing column yields an `EmptyScorer`.
    ///
    /// # Panics
    ///
    /// Panics if the term type does not match the field's value type, or if the field type
    /// is not covered by any of the branches above.
    ///
    /// # Errors
    ///
    /// Returns `InvalidArgument` for unsupported JSON value types or terms that cannot be
    /// converted into the column's value space, and forwards fast field access errors.
    fn scorer(&self, reader: &SegmentReader, boost: Score) -> crate::Result<Box<dyn Scorer>> {
        // Both bounds are `Bound::Unbounded`: every document matches.
        // Honor `boost` the same way `search_on_u64_ff` does for its all-docs fast path.
        if self.bounds.is_unbounded() {
            let all_scorer = AllScorer::new(reader.max_doc());
            if boost != 1.0f32 {
                return Ok(Box::new(ConstScorer::new(all_scorer, boost)));
            }
            return Ok(Box::new(all_scorer));
        }

        // Any of the two bounds is enough to learn the field and the value type.
        let term = self
            .bounds
            .get_inner()
            .expect("At least one bound must be set");
        let schema = reader.schema();
        let field_type = schema.get_field_entry(term.field()).field_type();
        assert_eq!(
            term.typ(),
            field_type.value_type(),
            "Field is of type {:?}, but got term of type {:?}",
            field_type,
            term.typ()
        );
        let field_name = term.get_full_path(reader.schema());

        let get_value_bytes = |term: &Term| term.value().value_bytes_payload();

        let term_value = term.value();
        if field_type.is_json() {
            let bounds = self
                .bounds
                .map_bound(|term| term.value().as_json_value_bytes().unwrap().to_owned());
            // Unlike with other field types JSON may have multiple columns of different types
            // under the same name
            //
            // In the JSON case the provided type in term may not exactly match the column type,
            // especially with the numeric type interpolation
            let json_value_bytes = term_value
                .as_json_value_bytes()
                .expect("expected json type in term");
            let typ = json_value_bytes.typ();

            match typ {
                Type::Str => {
                    let Some(str_dict_column): Option<StrColumn> =
                        reader.fast_fields().str(&field_name)?
                    else {
                        return Ok(Box::new(EmptyScorer));
                    };
                    let dict = str_dict_column.dictionary();

                    let bounds = self.bounds.map_bound(get_value_bytes);
                    // Get term ids for terms
                    let (lower_bound, upper_bound) =
                        dict.term_bounds_to_ord(bounds.lower_bound, bounds.upper_bound)?;
                    let fast_field_reader = reader.fast_fields();
                    let Some((column, _col_type)) = fast_field_reader
                        .u64_lenient_for_type(Some(&[ColumnType::Str]), &field_name)?
                    else {
                        return Ok(Box::new(EmptyScorer));
                    };
                    search_on_u64_ff(column, boost, BoundsRange::new(lower_bound, upper_bound))
                }
                Type::U64 | Type::I64 | Type::F64 => {
                    search_on_json_numerical_field(reader, &field_name, typ, bounds, boost)
                }
                Type::Date => {
                    let fast_field_reader = reader.fast_fields();
                    let Some((column, _col_type)) = fast_field_reader
                        .u64_lenient_for_type(Some(&[ColumnType::DateTime]), &field_name)?
                    else {
                        return Ok(Box::new(EmptyScorer));
                    };
                    let bounds = bounds.map_bound(|term| term.as_date().unwrap().to_u64());
                    search_on_u64_ff(
                        column,
                        boost,
                        BoundsRange::new(bounds.lower_bound, bounds.upper_bound),
                    )
                }
                Type::Bool | Type::Facet | Type::Bytes | Type::Json | Type::IpAddr => {
                    Err(crate::TantivyError::InvalidArgument(format!(
                        "unsupported value bytes type in json term value_bytes {:?}",
                        term_value.typ()
                    )))
                }
            }
        } else if field_type.is_ip_addr() {
            let parse_ip_from_bytes = |term: &Term| {
                term.value().as_ip_addr().ok_or_else(|| {
                    crate::TantivyError::InvalidArgument("Expected ip address".to_string())
                })
            };
            let bounds: BoundsRange<Ipv6Addr> = self.bounds.map_bound_res(parse_ip_from_bytes)?;

            let Some(ip_addr_column): Option<Column<Ipv6Addr>> =
                reader.fast_fields().column_opt(&field_name)?
            else {
                return Ok(Box::new(EmptyScorer));
            };
            let value_range = bound_range_inclusive_ip(
                &bounds.lower_bound,
                &bounds.upper_bound,
                ip_addr_column.min_value(),
                ip_addr_column.max_value(),
            );
            let docset = RangeDocSet::new(value_range, ip_addr_column);
            Ok(Box::new(ConstScorer::new(docset, boost)))
        } else if field_type.is_str() {
            let Some(str_dict_column): Option<StrColumn> = reader.fast_fields().str(&field_name)?
            else {
                return Ok(Box::new(EmptyScorer));
            };
            let dict = str_dict_column.dictionary();

            let bounds = self.bounds.map_bound(get_value_bytes);
            // Get term ids for terms
            let (lower_bound, upper_bound) =
                dict.term_bounds_to_ord(bounds.lower_bound, bounds.upper_bound)?;
            let fast_field_reader = reader.fast_fields();
            let Some((column, _col_type)) =
                fast_field_reader.u64_lenient_for_type(None, &field_name)?
            else {
                return Ok(Box::new(EmptyScorer));
            };
            search_on_u64_ff(column, boost, BoundsRange::new(lower_bound, upper_bound))
        } else if field_type.is_bytes() {
            let Some(bytes_column): Option<BytesColumn> =
                reader.fast_fields().bytes(&field_name)?
            else {
                return Ok(Box::new(EmptyScorer));
            };
            let dict = bytes_column.dictionary();

            let bounds = self.bounds.map_bound(get_value_bytes);
            // Get term ids for terms
            let (lower_bound, upper_bound) =
                dict.term_bounds_to_ord(bounds.lower_bound, bounds.upper_bound)?;
            let fast_field_reader = reader.fast_fields();
            let Some((column, _col_type)) =
                fast_field_reader.u64_lenient_for_type(None, &field_name)?
            else {
                return Ok(Box::new(EmptyScorer));
            };
            search_on_u64_ff(column, boost, BoundsRange::new(lower_bound, upper_bound))
        } else {
            assert!(
                maps_to_u64_fastfield(field_type.value_type()),
                "{field_type:?}"
            );

            // Bring the term values into the u64 value space of the fast field.
            // NOTE(review): `maps_to_u64_fastfield` also accepts `Type::Bool`, but no bool
            // accessor is tried here, so a bool term appears to end up in the error branch
            // unless one of the accessors below accepts it -- confirm.
            let bounds = self.bounds.map_bound_res(|term| {
                let value = term.value();
                let val = if let Some(val) = value.as_u64() {
                    val
                } else if let Some(val) = value.as_i64() {
                    val.to_u64()
                } else if let Some(val) = value.as_f64() {
                    val.to_u64()
                } else if let Some(val) = value.as_date() {
                    val.to_u64()
                } else {
                    return Err(TantivyError::InvalidArgument(format!(
                        "Expected term with u64, i64, f64 or date, but got {term:?}"
                    )));
                };
                Ok(val)
            })?;

            let fast_field_reader = reader.fast_fields();
            let Some((column, _col_type)) = fast_field_reader.u64_lenient_for_type(
                Some(&[
                    ColumnType::U64,
                    ColumnType::I64,
                    ColumnType::F64,
                    ColumnType::DateTime,
                ]),
                &field_name,
            )?
            else {
                return Ok(Box::new(EmptyScorer));
            };
            search_on_u64_ff(
                column,
                boost,
                BoundsRange::new(bounds.lower_bound, bounds.upper_bound),
            )
        }
    }

    /// Explains the score of `doc`.
    ///
    /// Builds a scorer with a boost of `1.0` and seeks to `doc`. Returns an
    /// `InvalidArgument` error if the scorer does not land on `doc`, i.e. the document
    /// does not match the range.
    fn explain(&self, reader: &SegmentReader, doc: DocId) -> crate::Result<Explanation> {
        let mut scorer = self.scorer(reader, 1.0)?;
        if scorer.seek(doc) != doc {
            return Err(TantivyError::InvalidArgument(format!(
                "Document #({doc}) does not match"
            )));
        }
        let explanation = Explanation::new("Const", scorer.score());

        Ok(explanation)
    }
}

/// Runs a numerical range query against a JSON path.
///
/// On numerical fields the column type may not match the user provided one: `typ` is the
/// numerical type carried by the query terms, while the column found under `field_name` may
/// be any of F64, I64 or U64. The bounds are first decoded with the term type and then
/// converted into the fast field value space of the actual column before searching.
///
/// Bounds that fall outside of the column type's domain are replaced:
/// - a bound that cannot restrict anything becomes `Bound::Unbounded`,
/// - a bound that can never be satisfied becomes an excluded bound at the edge of the value
///   space, which `search_on_u64_ff` resolves to an empty range.
///
/// Returns an `EmptyScorer` if no numerical column exists for `field_name`.
///
/// # Panics
///
/// Panics if `typ` is not a numerical type, if a bound does not hold a value of type `typ`,
/// or if the column type is not numerical.
fn search_on_json_numerical_field(
    reader: &SegmentReader,
    field_name: &str,
    typ: Type,
    bounds: BoundsRange<ValueBytes<Vec<u8>>>,
    boost: Score,
) -> crate::Result<Box<dyn Scorer>> {
    // Since we don't know which type was interpolated for the internal column we
    // have to check for all numeric types (only one exists)
    let allowed_column_types: Option<&[ColumnType]> =
        Some(&[ColumnType::F64, ColumnType::I64, ColumnType::U64]);
    let fast_field_reader = reader.fast_fields();
    let Some((column, col_type)) =
        fast_field_reader.u64_lenient_for_type(allowed_column_types, field_name)?
    else {
        return Ok(Box::new(EmptyScorer));
    };
    let actual_column_type: NumericalType = col_type
        .numerical_type()
        .unwrap_or_else(|| panic!("internal error: couldn't cast to numerical_type: {col_type:?}"));

    let bounds = match typ.numerical_type().unwrap() {
        NumericalType::I64 => {
            let bounds = bounds.map_bound(|term| term.as_i64().unwrap());
            match actual_column_type {
                NumericalType::I64 => bounds.map_bound(|&term| term.to_u64()),
                NumericalType::U64 => {
                    bounds.transform_inner(
                        |&val| {
                            if val < 0 {
                                // Every u64 is above a negative lower bound.
                                return TransformBound::NewBound(Bound::Unbounded);
                            }
                            TransformBound::Existing(val as u64)
                        },
                        |&val| {
                            if val < 0 {
                                // no hits case
                                return TransformBound::NewBound(Bound::Excluded(0));
                            }
                            TransformBound::Existing(val as u64)
                        },
                    )
                }
                NumericalType::F64 => bounds.map_bound(|&term| (term as f64).to_u64()),
            }
        }
        NumericalType::U64 => {
            let bounds = bounds.map_bound(|term| term.as_u64().unwrap());
            match actual_column_type {
                NumericalType::U64 => bounds.map_bound(|&term| term.to_u64()),
                NumericalType::I64 => {
                    bounds.transform_inner(
                        |&val| {
                            if val > i64::MAX as u64 {
                                // Actual no hits case: nothing in an i64 column is above
                                // `i64::MAX`. The bound has to be expressed in the column's
                                // value space, i.e. go through `to_u64()` like every other
                                // i64 value here; a plain `as u64` cast would not.
                                return TransformBound::NewBound(Bound::Excluded(
                                    i64::MAX.to_u64(),
                                ));
                            }
                            TransformBound::Existing((val as i64).to_u64())
                        },
                        |&val| {
                            if val > i64::MAX as u64 {
                                // Every i64 is below such an upper bound.
                                return TransformBound::NewBound(Bound::Unbounded);
                            }
                            TransformBound::Existing((val as i64).to_u64())
                        },
                    )
                }
                NumericalType::F64 => bounds.map_bound(|&term| (term as f64).to_u64()),
            }
        }
        NumericalType::F64 => {
            let bounds = bounds.map_bound(|term| term.as_f64().unwrap());
            match actual_column_type {
                NumericalType::U64 => transform_from_f64_bounds::<u64>(&bounds),
                NumericalType::I64 => transform_from_f64_bounds::<i64>(&bounds),
                NumericalType::F64 => bounds.map_bound(|&term| term.to_u64()),
            }
        }
    };
    search_on_u64_ff(
        column,
        boost,
        BoundsRange::new(bounds.lower_bound, bounds.upper_bound),
    )
}

/// Integer types that `f64` range bounds can be projected onto.
trait IntType {
    /// Smallest value of the type.
    fn min() -> Self;
    /// Largest value of the type.
    fn max() -> Self;
    /// Converts the value to `f64` with an `as` cast.
    fn to_f64(self) -> f64;
    /// Converts `val` to the integer type with an `as` cast.
    fn from_f64(val: f64) -> Self;
}

/// Implements [`IntType`] for primitive integers via their `MIN`/`MAX` constants and `as`
/// casts.
macro_rules! impl_int_type {
    ($($int:ty),+ $(,)?) => {
        $(
            impl IntType for $int {
                fn min() -> Self {
                    <$int>::MIN
                }
                fn max() -> Self {
                    <$int>::MAX
                }
                fn to_f64(self) -> f64 {
                    self as f64
                }
                fn from_f64(val: f64) -> Self {
                    val as $int
                }
            }
        )+
    };
}

impl_int_type!(i64, u64);

/// Converts `f64` bounds into the u64 fast field value space of an integer column of type
/// `T`.
///
/// - A bound outside of `T`'s domain is replaced: it becomes unbounded when it cannot
///   restrict anything, or an excluded bound at the edge of the value space when it can
///   never be satisfied (the range is then empty).
/// - A bound without a fractional part keeps its kind (included/excluded) and is converted
///   as is.
/// - A bound with a fractional part is rounded towards the inside of the range and becomes
///   an included bound. Lower bounds round up (`x >= 10.5` and `x > 10.5` both mean
///   `x >= 11` for integers); upper bounds round down (`x <= -10.5` means `x <= -11`).
fn transform_from_f64_bounds<T: IntType + MonotonicallyMappableToU64>(
    bounds: &BoundsRange<f64>,
) -> BoundsRange<u64> {
    bounds.transform_inner(
        |&lower_bound| {
            if lower_bound < T::min().to_f64() {
                // Every value of `T` is above the lower bound.
                return TransformBound::NewBound(Bound::Unbounded);
            }
            if lower_bound > T::max().to_f64() {
                // no hits case
                return TransformBound::NewBound(Bound::Excluded(u64::MAX));
            }

            if lower_bound.fract() == 0.0 {
                TransformBound::Existing(T::from_f64(lower_bound).to_u64())
            } else {
                // Truncating would round positive values down and let in an integer that is
                // smaller than the requested lower bound.
                TransformBound::NewBound(Bound::Included(T::from_f64(lower_bound.ceil()).to_u64()))
            }
        },
        |&upper_bound| {
            if upper_bound < T::min().to_f64() {
                // no hits case: no value of `T` is below the smallest value of `T`.
                return TransformBound::NewBound(Bound::Excluded(T::min().to_u64()));
            }
            if upper_bound > T::max().to_f64() {
                // Every value of `T` is below the upper bound, so it does not restrict
                // anything.
                return TransformBound::NewBound(Bound::Included(u64::MAX));
            }
            if upper_bound.fract() == 0.0 {
                TransformBound::Existing(T::from_f64(upper_bound).to_u64())
            } else {
                // Truncating would round negative values up and let in an integer that is
                // larger than the requested upper bound.
                TransformBound::NewBound(Bound::Included(T::from_f64(upper_bound.floor()).to_u64()))
            }
        },
    )
}

/// Builds a scorer matching the documents whose value in `column` lies within `bounds`.
///
/// Every match is scored with `boost`. Shortcuts:
/// - an empty range yields an `EmptyScorer`,
/// - if the range covers all values of a column with `Cardinality::Full`, every document
///   matches and an `AllScorer` is returned (wrapped in a `ConstScorer` unless `boost` is
///   `1.0`).
fn search_on_u64_ff(
    column: Column<u64>,
    boost: Score,
    bounds: BoundsRange<u64>,
) -> crate::Result<Box<dyn Scorer>> {
    let col_min_value = column.min_value();
    let col_max_value = column.max_value();

    // `None` means that the bounds cannot be expressed as an inclusive range, which is the
    // same as an empty range.
    #[expect(clippy::reversed_empty_ranges)]
    let value_range = bound_to_value_range(
        &bounds.lower_bound,
        &bounds.upper_bound,
        col_min_value,
        col_max_value,
    )
    .unwrap_or(1..=0);
    if value_range.is_empty() {
        return Ok(Box::new(EmptyScorer));
    }

    let covers_all_values =
        *value_range.start() <= col_min_value && *value_range.end() >= col_max_value;
    // TODO For the other cardinalities, make it a field presence request for that specific
    // column
    if covers_all_values && column.index.get_cardinality() == Cardinality::Full {
        let all_docs = AllScorer::new(column.num_docs());
        if boost == 1.0f32 {
            return Ok(Box::new(all_docs));
        }
        return Ok(Box::new(ConstScorer::new(all_docs, boost)));
    }

    let matching_docs = RangeDocSet::new(value_range, column);
    Ok(Box::new(ConstScorer::new(matching_docs, boost)))
}

/// Tells whether values of the given type map to a u64 fast field.
///
/// The match is kept exhaustive on purpose, so that a new `Type` variant has to be
/// classified explicitly.
pub(crate) fn maps_to_u64_fastfield(typ: Type) -> bool {
    match typ {
        Type::Str | Type::Facet | Type::Bytes | Type::Json | Type::IpAddr => false,
        Type::U64 | Type::I64 | Type::F64 | Type::Bool | Type::Date => true,
    }
}

/// Converts a pair of IP address bounds into an inclusive range.
///
/// Unbounded sides fall back to `min_value` / `max_value`. Excluded bounds are moved one
/// address inwards.
///
/// An excluded lower bound at the highest address, or an excluded upper bound at the lowest
/// address, cannot match anything. An empty range (`start > end`) is returned in that case
/// instead of overflowing.
fn bound_range_inclusive_ip(
    lower_bound: &Bound<Ipv6Addr>,
    upper_bound: &Bound<Ipv6Addr>,
    min_value: Ipv6Addr,
    max_value: Ipv6Addr,
) -> RangeInclusive<Ipv6Addr> {
    // An inclusive range whose start is greater than its end contains no value.
    let empty_range = || Ipv6Addr::from(1u128)..=Ipv6Addr::from(0u128);

    let start_value = match lower_bound {
        Bound::Included(ip_addr) => *ip_addr,
        Bound::Excluded(ip_addr) => match u128::from(*ip_addr).checked_add(1) {
            Some(next) => Ipv6Addr::from(next),
            // Nothing is greater than the highest address.
            None => return empty_range(),
        },
        Bound::Unbounded => min_value,
    };

    let end_value = match upper_bound {
        Bound::Included(ip_addr) => *ip_addr,
        Bound::Excluded(ip_addr) => match u128::from(*ip_addr).checked_sub(1) {
            Some(previous) => Ipv6Addr::from(previous),
            // Nothing is lower than the lowest address.
            None => return empty_range(),
        },
        Bound::Unbounded => max_value,
    };
    start_value..=end_value
}

/// Converts a pair of bounds into an inclusive value range.
///
/// Unbounded sides fall back to `min_value` / `max_value`, and a start below `min_value` is
/// raised to `min_value`. Excluded bounds are moved one step inwards in u64 space.
///
/// Returns `None` if the range cannot be converted to an inclusive range, i.e. stepping
/// inwards from an excluded bound overflows. This is equivalent to an empty range.
fn bound_to_value_range<T: MonotonicallyMappableToU64>(
    lower_bound: &Bound<T>,
    upper_bound: &Bound<T>,
    min_value: T,
    max_value: T,
) -> Option<RangeInclusive<T>> {
    let requested_start = match lower_bound {
        Bound::Unbounded => min_value,
        Bound::Included(val) => *val,
        Bound::Excluded(val) => {
            let next = val.to_u64().checked_add(1)?;
            T::from_u64(next)
        }
    };
    let starts_below_min = matches!(
        requested_start.partial_cmp(&min_value),
        Some(std::cmp::Ordering::Less)
    );
    let start_value = if starts_below_min {
        min_value
    } else {
        requested_start
    };

    let end_value = match upper_bound {
        Bound::Unbounded => max_value,
        Bound::Included(val) => *val,
        Bound::Excluded(val) => {
            let previous = val.to_u64().checked_sub(1)?;
            T::from_u64(previous)
        }
    };
    Some(start_value..=end_value)
}

#[cfg(test)]
mod tests {
    use std::ops::{Bound, RangeInclusive};

    use common::bounds::BoundsRange;
    use common::DateTime;
    use proptest::prelude::*;
    use rand::rngs::StdRng;
    use rand::seq::IndexedRandom;
    use rand::SeedableRng;
    use time::format_description::well_known::Rfc3339;
    use time::OffsetDateTime;

    use crate::collector::{Count, TopDocs};
    use crate::fastfield::FastValue;
    use crate::query::range_query::range_query_fastfield::FastFieldRangeWeight;
    use crate::query::{QueryParser, RangeQuery, Weight};
    use crate::schema::{
        DateOptions, Field, NumericOptions, Schema, SchemaBuilder, FAST, INDEXED, STORED, STRING,
        TEXT,
    };
    use crate::{Index, IndexWriter, TantivyDocument, Term, TERMINATED};

    #[test]
    fn test_text_field_ff_range_query() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("title", TEXT | FAST);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema.clone());
        let mut index_writer = index.writer_for_tests()?;
        let title = schema.get_field("title").unwrap();
        index_writer.add_document(doc!(
          title => "bbb"
        ))?;
        index_writer.add_document(doc!(
          title => "ddd"
        ))?;
        index_writer.commit()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();
        let query_parser = QueryParser::for_index(&index, vec![title]);

        let test_query = |query, num_hits| {
            let query = query_parser.parse_query(query).unwrap();
            let top_docs = searcher
                .search(&query, &TopDocs::with_limit(10).order_by_score())
                .unwrap();
            assert_eq!(top_docs.len(), num_hits);
        };

        test_query("title:[aaa TO ccc]", 1);
        test_query("title:[aaa TO bbb]", 1);
        test_query("title:[bbb TO bbb]", 1);
        test_query("title:[bbb TO ddd]", 2);
        test_query("title:[bbb TO eee]", 2);
        test_query("title:[bb TO eee]", 2);
        test_query("title:[ccc TO ccc]", 0);
        test_query("title:[ccc TO ddd]", 1);
        test_query("title:[ccc TO eee]", 1);

        test_query("title:[aaa TO *}", 2);
        test_query("title:[bbb TO *]", 2);
        test_query("title:[bb TO *]", 2);
        test_query("title:[ccc TO *]", 1);
        test_query("title:[ddd TO *]", 1);
        test_query("title:[dddd TO *]", 0);

        test_query("title:{aaa TO *}", 2);
        test_query("title:{bbb TO *]", 1);
        test_query("title:{bb TO *]", 2);
        test_query("title:{ccc TO *]", 1);
        test_query("title:{ddd TO *]", 0);
        test_query("title:{dddd TO *]", 0);

        test_query("title:[* TO bb]", 0);
        test_query("title:[* TO bbb]", 1);
        test_query("title:[* TO ccc]", 1);
        test_query("title:[* TO ddd]", 2);
        test_query("title:[* TO ddd}", 1);
        test_query("title:[* TO eee]", 2);

        Ok(())
    }

    #[test]
    fn test_date_range_query() {
        let mut schema_builder = Schema::builder();
        let options = DateOptions::default()
            .set_precision(common::DateTimePrecision::Microseconds)
            .set_fast();
        let date_field = schema_builder.add_date_field("date", options);
        let schema = schema_builder.build();

        let index = Index::create_in_ram(schema.clone());
        {
            let mut index_writer = index.writer_with_num_threads(1, 50_000_000).unwrap();
            // This is added a string and creates a string column!
            index_writer
                .add_document(doc!(date_field => DateTime::from_utc(
                    OffsetDateTime::parse("2022-12-01T00:00:01Z", &Rfc3339).unwrap(),
                )))
                .unwrap();
            index_writer
                .add_document(doc!(date_field => DateTime::from_utc(
                    OffsetDateTime::parse("2023-12-01T00:00:01Z", &Rfc3339).unwrap(),
                )))
                .unwrap();
            index_writer
                .add_document(doc!(date_field => DateTime::from_utc(
                    OffsetDateTime::parse("2015-02-01T00:00:00.001Z", &Rfc3339).unwrap(),
                )))
                .unwrap();
            index_writer.commit().unwrap();
        }

        // Date field
        let dt1 =
            DateTime::from_utc(OffsetDateTime::parse("2022-12-01T00:00:01Z", &Rfc3339).unwrap());
        let dt2 =
            DateTime::from_utc(OffsetDateTime::parse("2023-12-01T00:00:01Z", &Rfc3339).unwrap());
        let dt3 = DateTime::from_utc(
            OffsetDateTime::parse("2015-02-01T00:00:00.001Z", &Rfc3339).unwrap(),
        );
        let dt4 = DateTime::from_utc(
            OffsetDateTime::parse("2015-02-01T00:00:00.002Z", &Rfc3339).unwrap(),
        );

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let query_parser = QueryParser::for_index(&index, vec![date_field]);
        let test_query = |query, num_hits| {
            let query = query_parser.parse_query(query).unwrap();
            let top_docs = searcher
                .search(&query, &TopDocs::with_limit(10).order_by_score())
                .unwrap();
            assert_eq!(top_docs.len(), num_hits);
        };

        test_query(
            "date:[2015-02-01T00:00:00.001Z TO 2015-02-01T00:00:00.001Z]",
            1,
        );
        test_query(
            "date:[2015-02-01T00:00:00.001Z TO 2015-02-01T00:00:00.002Z}",
            1,
        );
        test_query(
            "date:[2015-02-01T00:00:00.001Z TO 2015-02-01T00:00:00.002Z]",
            1,
        );
        test_query(
            "date:{2015-02-01T00:00:00.001Z TO 2015-02-01T00:00:00.002Z]",
            0,
        );

        let count = |range_query: RangeQuery| searcher.search(&range_query, &Count).unwrap();
        assert_eq!(
            count(RangeQuery::new(
                Bound::Included(Term::from_field_date(date_field, dt3)),
                Bound::Excluded(Term::from_field_date(date_field, dt4)),
            )),
            1
        );
        assert_eq!(
            count(RangeQuery::new(
                Bound::Included(Term::from_field_date(date_field, dt3)),
                Bound::Included(Term::from_field_date(date_field, dt4)),
            )),
            1
        );
        assert_eq!(
            count(RangeQuery::new(
                Bound::Included(Term::from_field_date(date_field, dt1)),
                Bound::Included(Term::from_field_date(date_field, dt2)),
            )),
            2
        );
        assert_eq!(
            count(RangeQuery::new(
                Bound::Included(Term::from_field_date(date_field, dt1)),
                Bound::Excluded(Term::from_field_date(date_field, dt2)),
            )),
            1
        );
        assert_eq!(
            count(RangeQuery::new(
                Bound::Excluded(Term::from_field_date(date_field, dt1)),
                Bound::Excluded(Term::from_field_date(date_field, dt2)),
            )),
            0
        );
    }

    fn get_json_term<T: FastValue>(field: Field, path: &str, value: T) -> Term {
        let mut term = Term::from_field_json_path(field, path, true);
        term.append_type_and_fast_value(value);
        term
    }

    #[test]
    fn mixed_numerical_test() {
        let mut schema_builder = Schema::builder();
        schema_builder.add_i64_field("id_i64", STORED | FAST);
        schema_builder.add_u64_field("id_u64", STORED | FAST);
        schema_builder.add_f64_field("id_f64", STORED | FAST);
        let schema = schema_builder.build();

        fn get_json_term<T: FastValue>(schema: &Schema, path: &str, value: T) -> Term {
            let field = schema.get_field(path).unwrap();
            Term::from_fast_value(field, &value)
            // term.append_type_and_fast_value(value);
            // term
        }
        let index = Index::create_in_ram(schema.clone());
        {
            let mut index_writer = index.writer_with_num_threads(1, 50_000_000).unwrap();

            let doc = json!({
                "id_u64": 0,
                "id_i64": 50,
            });
            let doc = TantivyDocument::parse_json(&schema, &serde_json::to_string(&doc).unwrap())
                .unwrap();
            index_writer.add_document(doc).unwrap();
            let doc = json!({
                "id_u64": 10,
                "id_i64": 1000,
            });
            let doc = TantivyDocument::parse_json(&schema, &serde_json::to_string(&doc).unwrap())
                .unwrap();
            index_writer.add_document(doc).unwrap();

            index_writer.commit().unwrap();
        }

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let count = |range_query: RangeQuery| searcher.search(&range_query, &Count).unwrap();

        // u64 on u64
        assert_eq!(
            count(RangeQuery::new(
                Bound::Included(get_json_term(&schema, "id_u64", 10u64)),
                Bound::Included(get_json_term(&schema, "id_u64", 10u64)),
            )),
            1
        );
        assert_eq!(
            count(RangeQuery::new(
                Bound::Included(get_json_term(&schema, "id_u64", 9u64)),
                Bound::Excluded(get_json_term(&schema, "id_u64", 10u64)),
            )),
            0
        );

        // i64 on i64
        assert_eq!(
            count(RangeQuery::new(
                Bound::Included(get_json_term(&schema, "id_i64", 50i64)),
                Bound::Included(get_json_term(&schema, "id_i64", 1000i64)),
            )),
            2
        );
        assert_eq!(
            count(RangeQuery::new(
                Bound::Included(get_json_term(&schema, "id_i64", 50i64)),
                Bound::Excluded(get_json_term(&schema, "id_i64", 1000i64)),
            )),
            1
        );
    }

    #[test]
    fn json_range_mixed_val() {
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", TEXT | STORED | FAST);
        let schema = schema_builder.build();

        let index = Index::create_in_ram(schema);
        {
            let mut index_writer = index.writer_with_num_threads(1, 50_000_000).unwrap();
            let doc = json!({
                "mixed_val": 10000,
            });
            index_writer.add_document(doc!(json_field => doc)).unwrap();
            let doc = json!({
                "mixed_val": 20000,
            });
            index_writer.add_document(doc!(json_field => doc)).unwrap();
            let doc = json!({
                "mixed_val": "1000a",
            });
            index_writer.add_document(doc!(json_field => doc)).unwrap();
            let doc = json!({
                "mixed_val": "2000a",
            });
            index_writer.add_document(doc!(json_field => doc)).unwrap();
            index_writer.commit().unwrap();
        }
        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        let count = |range_query: RangeQuery| searcher.search(&range_query, &Count).unwrap();

        assert_eq!(
            count(RangeQuery::new(
                Bound::Included(get_json_term(json_field, "mixed_val", 10000u64)),
                Bound::Included(get_json_term(json_field, "mixed_val", 20000u64)),
            )),
            2
        );
        fn get_json_term_str(field: Field, path: &str, value: &str) -> Term {
            let mut term = Term::from_field_json_path(field, path, true);
            term.append_type_and_str(value);
            term
        }
        assert_eq!(
            count(RangeQuery::new(
                Bound::Included(get_json_term_str(json_field, "mixed_val", "1000a")),
                Bound::Included(get_json_term_str(json_field, "mixed_val", "2000b")),
            )),
            2
        );
        assert_eq!(
            count(RangeQuery::new(
                Bound::Included(get_json_term_str(json_field, "mixed_val", "1000")),
                Bound::Included(get_json_term_str(json_field, "mixed_val", "2000a")),
            )),
            2
        );
    }

    /// Range queries over a JSON fast field.
    ///
    /// The bounds are given as `u64`, `i64` and `f64` terms against values stored as each of
    /// those numeric types, then date ranges are checked both through the query parser and
    /// through `RangeQuery` directly.
    #[test]
    fn json_range_test() {
        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", TEXT | STORED | FAST);
        let index = Index::create_in_ram(schema_builder.build());

        let u64_val = u64::MAX - 1;
        {
            let mut index_writer = index.writer_with_num_threads(1, 50_000_000).unwrap();

            let small_values = json!({
                "id_u64": 0,
                "id_f64": 10.5,
                "id_i64": -100,
                "date": "2022-12-01T00:00:01Z"
            });
            index_writer
                .add_document(doc!(json_field => small_values))
                .unwrap();

            let large_values = json!({
                "id_u64": u64_val,
                "id_f64": 1000.5,
                "id_i64": 1000,
                "date": "2023-12-01T00:00:01Z"
            });
            index_writer
                .add_document(doc!(json_field => large_values))
                .unwrap();

            let date_only = json!({
                "date": "2015-02-01T00:00:00.001Z"
            });
            index_writer
                .add_document(doc!(json_field => date_only))
                .unwrap();

            index_writer.commit().unwrap();
        }

        let reader = index.reader().unwrap();
        let searcher = reader.searcher();
        // Number of documents matched by the range query `lower..upper`.
        let count_between = |lower: Bound<Term>, upper: Bound<Term>| {
            let range_query = RangeQuery::new(lower, upper);
            searcher.search(&range_query, &Count).unwrap()
        };

        // u64 on u64
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_u64", u64_val)),
                Bound::Included(get_json_term(json_field, "id_u64", u64_val)),
            ),
            1
        );
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_u64", u64_val)),
                Bound::Excluded(get_json_term(json_field, "id_u64", u64_val)),
            ),
            0
        );

        // f64 on u64 field.
        // The lower bound is moved down because the f64 conversion is inexact.
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(
                    json_field,
                    "id_u64",
                    (u64_val - 10000) as f64
                )),
                Bound::Included(get_json_term(json_field, "id_u64", (u64_val) as f64)),
            ),
            1
        );

        // i64 on u64
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_u64", 0_i64)),
                Bound::Included(get_json_term(json_field, "id_u64", 0_i64)),
            ),
            1
        );
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_u64", 1_i64)),
                Bound::Included(get_json_term(json_field, "id_u64", 1_i64)),
            ),
            0
        );

        // u64 on f64
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_f64", 10_u64)),
                Bound::Included(get_json_term(json_field, "id_f64", 11_u64)),
            ),
            1
        );
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_f64", 10_u64)),
                Bound::Included(get_json_term(json_field, "id_f64", 2000_u64)),
            ),
            2
        );

        // i64 on f64
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_f64", 10_i64)),
                Bound::Included(get_json_term(json_field, "id_f64", 2000_i64)),
            ),
            2
        );

        // i64 on i64
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_i64", -1000i64)),
                Bound::Included(get_json_term(json_field, "id_i64", 1000i64)),
            ),
            2
        );
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_i64", 1000i64)),
                Bound::Excluded(get_json_term(json_field, "id_i64", 1001i64)),
            ),
            1
        );

        // u64 on i64
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_i64", 0_u64)),
                Bound::Included(get_json_term(json_field, "id_i64", 1000u64)),
            ),
            1
        );
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_i64", 0_u64)),
                Bound::Included(get_json_term(json_field, "id_i64", 999u64)),
            ),
            0
        );

        // f64 on i64 field
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_i64", -1000.0)),
                Bound::Included(get_json_term(json_field, "id_i64", 1000.0)),
            ),
            2
        );
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_i64", -1000.0f64)),
                Bound::Excluded(get_json_term(json_field, "id_i64", 1000.0f64)),
            ),
            1
        );
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_i64", -1000.0f64)),
                Bound::Included(get_json_term(json_field, "id_i64", 1000.0f64)),
            ),
            2
        );
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_i64", -1000.0f64)),
                Bound::Excluded(get_json_term(json_field, "id_i64", 1000.01f64)),
            ),
            2
        );
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "id_i64", -1000.0f64)),
                Bound::Included(get_json_term(json_field, "id_i64", 999.99f64)),
            ),
            1
        );
        assert_eq!(
            count_between(
                Bound::Excluded(get_json_term(json_field, "id_i64", 999.9)),
                Bound::Excluded(get_json_term(json_field, "id_i64", 1000.1)),
            ),
            1
        );

        // Date ranges expressed as query strings.
        let parser_reader = index.reader().unwrap();
        let parser_searcher = parser_reader.searcher();
        let query_parser = QueryParser::for_index(&index, vec![json_field]);
        let assert_num_hits = |query_text: &str, expected_hits: usize| {
            let parsed_query = query_parser.parse_query(query_text).unwrap();
            let top_docs = parser_searcher
                .search(&parsed_query, &TopDocs::with_limit(10).order_by_score())
                .unwrap();
            assert_eq!(top_docs.len(), expected_hits);
        };
        let parsed_date_cases = [
            (
                "json.date:[2015-02-01T00:00:00.001Z TO 2015-02-01T00:00:00.001Z]",
                1,
            ),
            (
                "json.date:[2015-02-01T00:00:00.001Z TO 2015-02-01T00:00:00.002Z}",
                1,
            ),
            (
                "json.date:[2015-02-01T00:00:00.001Z TO 2015-02-01T00:00:00.002Z]",
                1,
            ),
            (
                "json.date:{2015-02-01T00:00:00.001Z TO 2015-02-01T00:00:00.002Z]",
                0,
            ),
        ];
        for (query_text, expected_hits) in parsed_date_cases {
            assert_num_hits(query_text, expected_hits);
        }

        // Date ranges expressed as terms.
        let parse_date =
            |text: &str| DateTime::from_utc(OffsetDateTime::parse(text, &Rfc3339).unwrap());
        let dt1 = parse_date("2022-12-01T00:00:01Z");
        let dt2 = parse_date("2023-12-01T00:00:01Z");

        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "date", dt1)),
                Bound::Included(get_json_term(json_field, "date", dt2)),
            ),
            2
        );
        assert_eq!(
            count_between(
                Bound::Included(get_json_term(json_field, "date", dt1)),
                Bound::Excluded(get_json_term(json_field, "date", dt2)),
            ),
            1
        );
        assert_eq!(
            count_between(
                Bound::Excluded(get_json_term(json_field, "date", dt1)),
                Bound::Excluded(get_json_term(json_field, "date", dt2)),
            ),
            0
        );

        // Date precision: the two bounds differ by one millisecond and must not be
        // truncated to the same value.
        let dt3 = parse_date("2015-02-01T00:00:00.001Z");
        let dt4 = parse_date("2015-02-01T00:00:00.002Z");
        let millisecond_hits = count_between(
            Bound::Included(get_json_term(json_field, "date", dt3)),
            Bound::Excluded(get_json_term(json_field, "date", dt4)),
        );
        assert_eq!(millisecond_hits, 1);
    }

    /// Test document: a numeric `id` together with a string `id_name`.
    #[derive(Clone, Debug)]
    pub struct Doc {
        /// String identifier; the generators in this module format it as `id_name`
        /// followed by a zero-padded, 10-digit number.
        pub id_name: String,
        /// Numeric identifier the numeric range queries are run against.
        pub id: u64,
    }

    fn operation_strategy() -> impl Strategy<Value = Doc> {
        prop_oneof![
            (0u64..10_000u64).prop_map(doc_from_id_1),
            (1u64..10_000u64).prop_map(doc_from_id_2),
        ]
    }

    /// Builds a document whose `id` is `id * 1000` and whose `id_name` embeds that same
    /// number, zero-padded to 10 digits.
    fn doc_from_id_1(id: u64) -> Doc {
        let scaled_id = id * 1000;
        let id_name = format!("id_name{scaled_id:010}");
        Doc {
            id_name,
            id: scaled_id,
        }
    }
    /// Builds a document whose `id` is `id * 1000` and whose `id_name` embeds
    /// `id * 1000 - 1`, zero-padded to 10 digits, so the name and the number disagree.
    ///
    /// The subtraction underflows for `id == 0`; callers in this module pass `id >= 1`.
    fn doc_from_id_2(id: u64) -> Doc {
        let scaled_id = id * 1000;
        let name_number = scaled_id - 1;
        Doc {
            id_name: format!("id_name{name_number:010}"),
            id: scaled_id,
        }
    }

    proptest! {
        #![proptest_config(ProptestConfig::with_cases(10))]
        // Runs the range-query checks on 1 to 999 generated documents per case.
        #[test]
        fn test_range_for_docs_prop(ops in proptest::collection::vec(operation_strategy(), 1..1000)) {
            let outcome = test_id_range_for_docs(ops);
            assert!(outcome.is_ok());
        }
    }

    /// Regression case: a single document with id 0, typed fields.
    #[test]
    fn range_regression1_test() {
        let outcome = test_id_range_for_docs(vec![doc_from_id_1(0)]);
        assert!(outcome.is_ok());
    }

    /// Regression case: a single document with id 0, stored in a JSON field.
    #[test]
    fn range_regression1_test_json() {
        let outcome = test_id_range_for_docs_json(vec![doc_from_id_1(0)]);
        assert!(outcome.is_ok());
    }

    /// Regression case mixing both document generators, in unsorted id order.
    #[test]
    fn test_range_regression2() {
        let ops: Vec<Doc> = [52, 63, 12]
            .into_iter()
            .map(doc_from_id_1)
            .chain([91, 33].into_iter().map(doc_from_id_2))
            .collect();
        let outcome = test_id_range_for_docs(ops);
        assert!(outcome.is_ok());
    }

    /// Regression case: three documents from `doc_from_id_1`, ids 9, 0 and 13 (times 1000).
    #[test]
    fn test_range_regression3() {
        let ops: Vec<Doc> = [9, 0, 13].into_iter().map(doc_from_id_1).collect();
        let outcome = test_id_range_for_docs(ops);
        assert!(outcome.is_ok());
    }

    /// A fast-field range `[50_000, 50_002]` must match nothing when the only indexed
    /// value is `52_000`: the scorer has to start out terminated.
    #[test]
    fn test_range_regression_simplified() {
        let mut schema_builder = SchemaBuilder::new();
        let field = schema_builder.add_u64_field("test_field", FAST);
        let index = Index::create_in_ram(schema_builder.build());

        let mut writer: IndexWriter = index.writer_for_tests().unwrap();
        writer.add_document(doc!(field=>52_000u64)).unwrap();
        writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let lower_bound = Bound::Included(Term::from_field_u64(field, 50_000));
        let upper_bound = Bound::Included(Term::from_field_u64(field, 50_002));
        let range_weight = FastFieldRangeWeight::new(BoundsRange::new(lower_bound, upper_bound));

        let segment_reader = searcher.segment_reader(0);
        let scorer = range_weight.scorer(segment_reader, 1.0f32).unwrap();
        assert_eq!(scorer.doc(), TERMINATED);
    }

    /// Regression case: three documents from `doc_from_id_1` with consecutive inputs 1, 2, 3.
    #[test]
    fn range_regression3_test() {
        let ops: Vec<Doc> = (1..=3).map(doc_from_id_1).collect();
        let outcome = test_id_range_for_docs(ops);
        assert!(outcome.is_ok());
    }

    /// Regression case: a single document from `doc_from_id_2`, whose name and id differ.
    #[test]
    fn range_regression4_test() {
        let outcome = test_id_range_for_docs(vec![doc_from_id_2(100)]);
        assert!(outcome.is_ok());
    }

    /// Builds an in-RAM index holding one document per entry of `docs`.
    ///
    /// When `json_field` is `true` the index has a single JSON field named `json`
    /// (`TEXT | STORED | FAST`) and every value lives under a path of that field. Otherwise
    /// each value gets its own typed field. In both layouts the names are the same:
    ///
    /// - `id`, `id_f64`, `id_i64`: the id, once, as `u64` / `f64` / `i64`;
    /// - `ids`, `ids_f64`, `ids_i64`: the id, twice, so that the field is multivalued;
    /// - `id_name`, `id_name_fast`: the document's `id_name`.
    ///
    /// # Panics
    ///
    /// Panics if the writer cannot be created or if adding/committing a document fails.
    pub fn create_index_from_docs(docs: &[Doc], json_field: bool) -> Index {
        let mut schema_builder = Schema::builder();
        if json_field {
            let json_field = schema_builder.add_json_field("json", TEXT | STORED | FAST);
            let schema = schema_builder.build();

            let index = Index::create_in_ram(schema);

            {
                let mut index_writer = index.writer_with_num_threads(1, 50_000_000).unwrap();
                for doc in docs {
                    let doc = json!({
                        // A JSON object keeps a single value per key, so repeating a key
                        // does not yield two values. The multivalued paths are written as
                        // arrays to mirror the typed branch, which adds each `ids*` value
                        // twice.
                        "ids_i64": [doc.id as i64, doc.id as i64],
                        "ids_f64": [doc.id as f64, doc.id as f64],
                        "ids": [doc.id, doc.id],
                        "id": doc.id,
                        "id_f64": doc.id as f64,
                        "id_i64": doc.id as i64,
                        "id_name": doc.id_name.to_string(),
                        "id_name_fast": doc.id_name.to_string(),
                    });
                    index_writer.add_document(doc!(json_field => doc)).unwrap();
                }

                index_writer.commit().unwrap();
            }
            index
        } else {
            let id_u64_field = schema_builder.add_u64_field("id", INDEXED | STORED | FAST);
            let ids_u64_field = schema_builder
                .add_u64_field("ids", NumericOptions::default().set_fast().set_indexed());

            let id_f64_field = schema_builder.add_f64_field("id_f64", INDEXED | STORED | FAST);
            let ids_f64_field = schema_builder.add_f64_field(
                "ids_f64",
                NumericOptions::default().set_fast().set_indexed(),
            );

            let id_i64_field = schema_builder.add_i64_field("id_i64", INDEXED | STORED | FAST);
            let ids_i64_field = schema_builder.add_i64_field(
                "ids_i64",
                NumericOptions::default().set_fast().set_indexed(),
            );

            let text_field = schema_builder.add_text_field("id_name", STRING | STORED);
            let text_field2 = schema_builder.add_text_field("id_name_fast", STRING | STORED | FAST);
            let schema = schema_builder.build();

            let index = Index::create_in_ram(schema);

            {
                let mut index_writer = index.writer_with_num_threads(1, 50_000_000).unwrap();
                for doc in docs {
                    // Each `ids*` field is added twice on purpose to make it multivalued.
                    index_writer
                        .add_document(doc!(
                            ids_i64_field => doc.id as i64,
                            ids_i64_field => doc.id as i64,
                            ids_f64_field => doc.id as f64,
                            ids_f64_field => doc.id as f64,
                            ids_u64_field => doc.id,
                            ids_u64_field => doc.id,
                            id_u64_field => doc.id,
                            id_f64_field => doc.id as f64,
                            id_i64_field => doc.id as i64,
                            text_field => doc.id_name.to_string(),
                            text_field2 => doc.id_name.to_string(),
                        ))
                        .unwrap();
                }

                index_writer.commit().unwrap();
            }
            index
        }
    }

    /// Runs the range-query checks against an index with typed fields.
    fn test_id_range_for_docs(docs: Vec<Doc>) -> crate::Result<()> {
        let use_json_field = false;
        test_id_range_for_docs_with_opt(docs, use_json_field)
    }
    /// Runs the range-query checks against an index with a single JSON field.
    fn test_id_range_for_docs_json(docs: Vec<Doc>) -> crate::Result<()> {
        let use_json_field = true;
        test_id_range_for_docs_with_opt(docs, use_json_field)
    }

    /// Indexes `docs` (in a JSON field when `json` is true, in typed fields otherwise) and
    /// compares the hit counts of parsed range queries with counts computed directly from
    /// `docs`.
    ///
    /// Each sample is a pair of documents whose ids / names give the range bounds. The
    /// first document is always paired with itself, and up to three further documents are
    /// drawn with a fixed-seed RNG.
    ///
    /// # Panics
    ///
    /// Panics if `docs` is empty, if a query fails to parse or run, or if a count differs.
    fn test_id_range_for_docs_with_opt(docs: Vec<Doc>, json: bool) -> crate::Result<()> {
        let index = create_index_from_docs(&docs, json);
        let reader = index.reader().unwrap();
        let searcher = reader.searcher();

        let mut rng: StdRng = StdRng::from_seed([1u8; 32]);

        // Parses `query_text` and returns the number of matching documents.
        let num_hits_for = |query_text: &str| {
            let query = QueryParser::for_index(&index, vec![])
                .parse_query(query_text)
                .unwrap();
            searcher.search(&query, &Count).unwrap()
        };

        // In the JSON layout every value lives under the `json` field.
        let path_prefix = if json { "json." } else { "" };
        let field_path = |field: &str| format!("{path_prefix}{field}");

        let inclusive_query = |field: &str, lower: u64, upper: u64| {
            format!("{}:[{lower} TO {upper}]", field_path(field))
        };
        let exclusive_query = |field: &str, lower: u64, upper: u64| {
            format!("{}:{{{lower} TO {upper}}}", field_path(field))
        };

        let check_sample = |sample_docs: [&Doc; 2]| {
            let mut ids = [sample_docs[0].id, sample_docs[1].id];
            ids.sort_unstable();
            let [lower, upper] = ids;

            // Inclusive numeric range, single-valued then multivalued field.
            let inclusive_hits = docs
                .iter()
                .filter(|doc| (lower..=upper).contains(&doc.id))
                .count();
            for field in ["id", "ids"] {
                let query = inclusive_query(field, lower, upper);
                assert_eq!(num_hits_for(&query), inclusive_hits);
            }

            // Inclusive text range, without and with a fast field.
            let mut id_names = [
                sample_docs[0].id_name.as_str(),
                sample_docs[1].id_name.as_str(),
            ];
            id_names.sort_unstable();
            let [first_name, last_name] = id_names;
            let text_hits = docs
                .iter()
                .filter(|doc| (first_name..=last_name).contains(&doc.id_name.as_str()))
                .count();
            for field in ["id_name", "id_name_fast"] {
                let query = format!("{}:[{first_name} TO {last_name}]", field_path(field));
                assert_eq!(num_hits_for(&query), text_hits);
            }

            // Exclusive numeric range.
            let exclusive_bounds = lower.saturating_add(1)..=upper.saturating_sub(1);
            let exclusive_hits = docs
                .iter()
                .filter(|doc| exclusive_bounds.contains(&doc.id))
                .count();
            for field in ["id", "ids"] {
                let query = exclusive_query(field, lower, upper);
                assert_eq!(num_hits_for(&query), exclusive_hits);
            }

            // Range intersected with an exact `id_name` match, first on the single-valued
            // fields and then on the multivalued ones.
            let id_filter = sample_docs[0].id_name.as_str();
            let intersection_hits = docs
                .iter()
                .filter(|doc| (lower..=upper).contains(&doc.id) && doc.id_name == id_filter)
                .count();
            for field in ["id", "id_f64", "id_i64", "ids", "ids_f64", "ids_i64"] {
                let query = format!(
                    "{} AND {}:{id_filter}",
                    inclusive_query(field, lower, upper),
                    field_path("id_name"),
                );
                assert_eq!(num_hits_for(&query), intersection_hits);
            }
        };

        check_sample([&docs[0], &docs[0]]);

        let samples: Vec<&Doc> = docs.choose_multiple(&mut rng, 3).collect();
        if let Some(&second) = samples.get(1) {
            check_sample([samples[0], second]);
            check_sample([second, second]);
            if let Some(&third) = samples.get(2) {
                check_sample([second, third]);
            }
        }

        Ok(())
    }

    /// Range queries on a fast, indexed bytes field follow the lexicographic order of the
    /// byte strings, for inclusive, exclusive and unbounded bounds.
    #[test]
    fn test_bytes_field_ff_range_query() -> crate::Result<()> {
        use crate::schema::BytesOptions;

        let mut schema_builder = Schema::builder();
        let bytes_options = BytesOptions::default().set_fast().set_indexed();
        let bytes_field = schema_builder.add_bytes_field("data", bytes_options);
        let index = Index::create_in_ram(schema_builder.build());
        let mut index_writer: IndexWriter = index.writer_for_tests()?;

        // Two-byte values listed in ascending lexicographic order.
        let values: Vec<Vec<u8>> = vec![
            vec![0x00, 0x10],
            vec![0x00, 0x20],
            vec![0x00, 0x30],
            vec![0x01, 0x00],
            vec![0x01, 0x10],
            vec![0x02, 0x00],
        ];
        for value in &values {
            let mut doc = TantivyDocument::new();
            doc.add_bytes(bytes_field, value);
            index_writer.add_document(doc)?;
        }
        index_writer.commit()?;

        let reader = index.reader()?;
        let searcher = reader.searcher();
        // Number of documents whose value lies between the two bounds.
        let count_between = |lower: Bound<Term>, upper: Bound<Term>| {
            searcher.search(&RangeQuery::new(lower, upper), &Count)
        };

        // [0x00, 0x20] ..= [0x01, 0x00] matches [0x00, 0x20], [0x00, 0x30], [0x01, 0x00].
        let inclusive_count = count_between(
            Bound::Included(Term::from_field_bytes(bytes_field, &[0x00, 0x20])),
            Bound::Included(Term::from_field_bytes(bytes_field, &[0x01, 0x00])),
        )?;
        assert_eq!(
            inclusive_count, 3,
            "Expected 3 documents in range [0x00,0x20] to [0x01,0x00]"
        );

        // Strictly above [0x01, 0x00] matches [0x01, 0x10], [0x02, 0x00].
        let above_count = count_between(
            Bound::Excluded(Term::from_field_bytes(bytes_field, &[0x01, 0x00])),
            Bound::Unbounded,
        )?;
        assert_eq!(above_count, 2, "Expected 2 documents > [0x01,0x00]");

        // Strictly below [0x00, 0x30] matches [0x00, 0x10], [0x00, 0x20].
        let below_count = count_between(
            Bound::Unbounded,
            Bound::Excluded(Term::from_field_bytes(bytes_field, &[0x00, 0x30])),
        )?;
        assert_eq!(below_count, 2, "Expected 2 documents < [0x00,0x30]");

        Ok(())
    }
}

#[cfg(test)]
pub(crate) mod ip_range_tests {
    use proptest::prelude::ProptestConfig;
    use proptest::strategy::Strategy;
    use proptest::{prop_oneof, proptest};

    use super::*;
    use crate::collector::Count;
    use crate::query::QueryParser;
    use crate::schema::{Schema, FAST, INDEXED, STORED, STRING};
    use crate::{Index, IndexWriter};

    /// Test document: a string `id` together with an IPv6 address.
    #[derive(Clone, Debug)]
    pub struct Doc {
        /// String identifier; the generators in this module set it to a decimal number.
        pub id: String,
        /// Address the IP range queries are run against.
        pub ip: Ipv6Addr,
    }

    fn operation_strategy() -> impl Strategy<Value = Doc> {
        prop_oneof![
            (0u64..10_000u64).prop_map(doc_from_id_1),
            (1u64..10_000u64).prop_map(doc_from_id_2),
        ]
    }

    /// Builds a document whose `ip` is the address with numeric value `id * 1000` and whose
    /// `id` is that same number in decimal.
    pub fn doc_from_id_1(id: u64) -> Doc {
        let scaled_id = id * 1000;
        let ip = Ipv6Addr::from_u128(u128::from(scaled_id));
        Doc {
            id: scaled_id.to_string(),
            ip,
        }
    }
    /// Builds a document whose `ip` is the address with numeric value `id * 1000` and whose
    /// `id` is `id * 1000 - 1` in decimal, so the two numbers disagree.
    ///
    /// The subtraction underflows for `id == 0`; callers in this module pass `id >= 1`.
    fn doc_from_id_2(id: u64) -> Doc {
        let scaled_id = id * 1000;
        let shifted_id = scaled_id - 1;
        Doc {
            id: shifted_id.to_string(),
            ip: Ipv6Addr::from_u128(u128::from(scaled_id)),
        }
    }

    proptest! {
        #![proptest_config(ProptestConfig::with_cases(10))]
        // Runs the IP range-query checks on 1 to 999 generated documents per case.
        #[test]
        fn test_ip_range_for_docs_prop(ops in proptest::collection::vec(operation_strategy(), 1..1000)) {
            let outcome = test_ip_range_for_docs(&ops);
            assert!(outcome.is_ok());
        }
    }

    /// Regression case: a single document built from id 0.
    #[test]
    fn test_ip_range_regression1() {
        let ops = vec![doc_from_id_1(0)];
        let outcome = test_ip_range_for_docs(&ops);
        assert!(outcome.is_ok());
    }

    /// Regression case mixing both document generators, in unsorted order.
    #[test]
    fn test_ip_range_regression2() {
        let ops: Vec<Doc> = [52, 63, 12]
            .into_iter()
            .map(doc_from_id_1)
            .chain([91, 33].into_iter().map(doc_from_id_2))
            .collect();
        let outcome = test_ip_range_for_docs(&ops);
        assert!(outcome.is_ok());
    }

    /// Regression case: three documents from `doc_from_id_1` with consecutive inputs 1, 2, 3.
    #[test]
    fn test_ip_range_regression3() {
        let ops: Vec<Doc> = (1..=3).map(doc_from_id_1).collect();
        let outcome = test_ip_range_for_docs(&ops);
        assert!(outcome.is_ok());
    }

    /// Three documents each store their address twice in the multivalued `ips` field; the
    /// inclusive range from the second to the third address must count two documents.
    #[test]
    fn test_ip_range_regression3_simple() {
        let mut schema_builder = Schema::builder();
        let ips_field = schema_builder.add_ip_addr_field("ips", FAST | INDEXED);
        let index = Index::create_in_ram(schema_builder.build());

        let ip_addrs: [Ipv6Addr; 3] = [1000, 2000, 3000].map(Ipv6Addr::from_u128);
        let mut writer: IndexWriter = index.writer_for_tests().unwrap();
        for ip_addr in ip_addrs {
            let doc = doc!(ips_field=>ip_addr, ips_field=>ip_addr);
            writer.add_document(doc).unwrap();
        }
        writer.commit().unwrap();

        let searcher = index.reader().unwrap().searcher();
        let lower_bound = Bound::Included(Term::from_field_ip_addr(ips_field, ip_addrs[1]));
        let upper_bound = Bound::Included(Term::from_field_ip_addr(ips_field, ip_addrs[2]));
        let range_weight = FastFieldRangeWeight::new(BoundsRange::new(lower_bound, upper_bound));

        let segment_reader = searcher.segment_reader(0);
        let count = crate::query::weight::Weight::count(&range_weight, segment_reader).unwrap();
        assert_eq!(count, 2);
    }

    /// Builds an in-RAM index holding one document per entry of `docs`.
    ///
    /// Fields: `ip` (the address once, `STORED | FAST`), `ips` (the address twice,
    /// `FAST | INDEXED`) and `id` (the document's `id`, `STRING | STORED`).
    ///
    /// # Panics
    ///
    /// Panics if the writer cannot be created or if adding/committing a document fails.
    pub fn create_index_from_ip_docs(docs: &[Doc]) -> Index {
        let mut schema_builder = Schema::builder();
        let ip_field = schema_builder.add_ip_addr_field("ip", STORED | FAST);
        let ips_field = schema_builder.add_ip_addr_field("ips", FAST | INDEXED);
        let text_field = schema_builder.add_text_field("id", STRING | STORED);
        let index = Index::create_in_ram(schema_builder.build());

        {
            let mut index_writer = index.writer_with_num_threads(2, 60_000_000).unwrap();
            for doc in docs {
                // `ips` is added twice on purpose to make it multivalued.
                let tantivy_doc = doc!(
                    ips_field => doc.ip,
                    ips_field => doc.ip,
                    ip_field => doc.ip,
                    text_field => doc.id.to_string(),
                );
                index_writer.add_document(tantivy_doc).unwrap();
            }
            index_writer.commit().unwrap();
        }

        index
    }

    /// Indexes `docs` and compares the hit counts of parsed IP range queries with counts
    /// computed directly from `docs`.
    ///
    /// Each sample is a pair of documents whose addresses give the inclusive range bounds.
    /// The pairs are built from the first three documents.
    ///
    /// # Panics
    ///
    /// Panics if `docs` is empty, if a query fails to parse or run, or if a count differs.
    fn test_ip_range_for_docs(docs: &[Doc]) -> crate::Result<()> {
        let index = create_index_from_ip_docs(docs);
        let reader = index.reader().unwrap();
        let searcher = reader.searcher();

        // Parses `query_text` and returns the number of matching documents.
        let num_hits_for = |query_text: &str| {
            let query = QueryParser::for_index(&index, vec![])
                .parse_query(query_text)
                .unwrap();
            searcher.search(&query, &Count).unwrap()
        };

        let check_sample = |sample_docs: [&Doc; 2]| {
            let mut ips = [sample_docs[0].ip, sample_docs[1].ip];
            ips.sort();
            let [lower, upper] = ips;
            let ip_range = lower..=upper;
            let range_query = |field: &str| format!("{field}:[{lower} TO {upper}]");

            // Plain range, single-valued then multivalued field.
            let range_hits = docs
                .iter()
                .filter(|doc| ip_range.contains(&doc.ip))
                .count();
            for field in ["ip", "ips"] {
                assert_eq!(num_hits_for(&range_query(field)), range_hits);
            }

            // Range intersected with an exact `id` match, on both fields.
            let id_filter = sample_docs[0].id.as_str();
            let intersection_hits = docs
                .iter()
                .filter(|doc| ip_range.contains(&doc.ip) && doc.id == id_filter)
                .count();
            for field in ["ip", "ips"] {
                let query = format!("{} AND id:{id_filter}", range_query(field));
                assert_eq!(num_hits_for(&query), intersection_hits);
            }
        };

        check_sample([&docs[0], &docs[0]]);
        if let Some(second) = docs.get(1) {
            check_sample([&docs[0], second]);
            check_sample([second, second]);
            if let Some(third) = docs.get(2) {
                check_sample([second, third]);
            }
        }

        Ok(())
    }
}


================================================
FILE: src/query/regex_query.rs
================================================
use std::clone::Clone;
use std::sync::Arc;

use tantivy_fst::Regex;

use crate::error::TantivyError;
use crate::query::{AutomatonWeight, EnableScoring, Query, Weight};
use crate::schema::Field;

/// A Regex Query matches all of the documents
/// containing a specific term that matches
/// a regex pattern.
///
/// Wildcard queries (e.g. ho*se) can be achieved
/// by converting them to their regex counterparts.
///
/// ```rust
/// use tantivy::collector::Count;
/// use tantivy::query::RegexQuery;
/// use tantivy::schema::{Schema, TEXT};
/// use tantivy::{doc, Index, IndexWriter};
///
/// # fn test() -> tantivy::Result<()> {
/// let mut schema_builder = Schema::builder();
/// let title = schema_builder.add_text_field("title", TEXT);
/// let schema = schema_builder.build();
/// let index = Index::create_in_ram(schema);
/// {
///     let mut index_writer: IndexWriter = index.writer(15_000_000)?;
///     index_writer.add_document(doc!(
///         title => "The Name of the Wind",
///     ))?;
///     index_writer.add_document(doc!(
///         title => "The Diary of Muadib",
///     ))?;
///     index_writer.add_document(doc!(
///         title => "A Dairy Cow",
///     ))?;
///     index_writer.add_document(doc!(
///         title => "The Diary of a Young Girl",
///     ))?;
///     index_writer.commit()?;
/// }
///
/// let reader = index.reader()?;
/// let searcher = reader.searcher();
///
/// // Three titles contain a term matching the pattern:
/// // "Diary" (twice) and "Dairy" (once).
/// let query = RegexQuery::from_pattern("d[ai]{2}ry", title)?;
/// let count = searcher.search(&query, &Count)?;
/// assert_eq!(count, 3);
/// Ok(())
/// # }
/// # assert!(test().is_ok());
/// ```
#[derive(Debug, Clone)]
pub struct RegexQuery {
    // Compiled pattern, behind an `Arc` so the query and the weights built from it
    // share one instance.
    regex: Arc<Regex>,
    // Field whose terms are matched against the pattern.
    field: Field,
}

impl RegexQuery {
    /// Compiles `regex_pattern` and builds a `RegexQuery` targeting `field`.
    ///
    /// # Errors
    ///
    /// Returns `TantivyError::InvalidArgument` (with a message prefixed by
    /// `RegexQueryError: `) if the pattern cannot be compiled.
    pub fn from_pattern(regex_pattern: &str, field: Field) -> crate::Result<Self> {
        match Regex::new(regex_pattern) {
            Ok(compiled) => Ok(Self::from_regex(compiled, field)),
            Err(err) => Err(TantivyError::InvalidArgument(format!(
                "RegexQueryError: {err}"
            ))),
        }
    }

    /// Builds a `RegexQuery` from an already compiled regex.
    ///
    /// Anything convertible into an `Arc<Regex>` is accepted, which makes it
    /// possible to share one compiled regex between several queries.
    pub fn from_regex<T: Into<Arc<Regex>>>(regex: T, field: Field) -> Self {
        let regex: Arc<Regex> = regex.into();
        Self { field, regex }
    }

    /// Builds the concrete (non type-erased) weight for this query.
    fn specialized_weight(&self) -> AutomatonWeight<Regex> {
        // Only the reference count is bumped: the automaton itself is shared.
        let shared_regex = Arc::clone(&self.regex);
        AutomatonWeight::new(self.field, shared_regex)
    }
}

impl Query for RegexQuery {
    /// Returns the automaton-based weight of this query, boxed as a `dyn Weight`.
    ///
    /// The scoring configuration is not consulted.
    fn weight(&self, _enabled_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let automaton_weight = self.specialized_weight();
        Ok(Box::new(automaton_weight))
    }
}

#[cfg(test)]
mod test {
    use std::sync::Arc;

    use tantivy_fst::Regex;

    use super::RegexQuery;
    use crate::collector::TopDocs;
    use crate::schema::{Field, Schema, TEXT};
    use crate::{assert_nearly_equals, Index, IndexReader, IndexWriter};

    /// Builds an in-RAM index with a single text field `country` and two
    /// documents ("japan" and "korea"), and returns a reader on it together
    /// with the field handle.
    fn build_test_index() -> crate::Result<(IndexReader, Field)> {
        let mut schema_builder = Schema::builder();
        let country_field = schema_builder.add_text_field("country", TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        {
            let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
            index_writer.add_document(doc!(
                country_field => "japan",
            ))?;
            index_writer.add_document(doc!(
                country_field => "korea",
            ))?;
            index_writer.commit()?;
        }
        let reader = index.reader()?;

        Ok((reader, country_field))
    }

    /// Runs both queries against `reader` and checks that
    /// `query_matching_one` returns exactly one document with a score of 1.0,
    /// while `query_matching_zero` returns nothing.
    fn verify_regex_query(
        query_matching_one: RegexQuery,
        query_matching_zero: RegexQuery,
        reader: IndexReader,
    ) {
        let searcher = reader.searcher();
        {
            let scored_docs = searcher
                .search(
                    &query_matching_one,
                    &TopDocs::with_limit(2).order_by_score(),
                )
                .unwrap();
            assert_eq!(scored_docs.len(), 1, "Expected only 1 document");
            let (score, _) = scored_docs[0];
            assert_nearly_equals!(1.0, score);
        }
        let top_docs = searcher
            .search(
                &query_matching_zero,
                &TopDocs::with_limit(2).order_by_score(),
            )
            .unwrap();
        assert!(top_docs.is_empty(), "Expected ZERO document");
    }

    /// Queries built from a pattern string.
    #[test]
    pub fn test_regex_query() -> crate::Result<()> {
        let (reader, field) = build_test_index()?;

        let matching_one = RegexQuery::from_pattern("jap[ao]n", field)?;
        let matching_zero = RegexQuery::from_pattern("jap[A-Z]n", field)?;
        verify_regex_query(matching_one, matching_zero, reader);
        Ok(())
    }

    /// Queries built from an owned, already compiled `Regex`.
    #[test]
    pub fn test_construct_from_regex() -> crate::Result<()> {
        let (reader, field) = build_test_index()?;

        let matching_one = RegexQuery::from_regex(Regex::new("jap[ao]n").unwrap(), field);
        let matching_zero = RegexQuery::from_regex(Regex::new("jap[A-Z]n").unwrap(), field);

        verify_regex_query(matching_one, matching_zero, reader);
        Ok(())
    }

    /// Queries built from `Arc<Regex>` values: the same compiled regexes are
    /// used for two successive pairs of queries.
    #[test]
    pub fn test_construct_from_reused_regex() -> crate::Result<()> {
        let r1 = Arc::new(Regex::new("jap[ao]n").unwrap());
        let r2 = Arc::new(Regex::new("jap[A-Z]n").unwrap());

        let (reader, field) = build_test_index()?;

        // First pair of queries works on clones of the `Arc`s...
        let matching_one = RegexQuery::from_regex(r1.clone(), field);
        let matching_zero = RegexQuery::from_regex(r2.clone(), field);

        verify_regex_query(matching_one, matching_zero, reader.clone());

        // ... and the second pair consumes the original `Arc`s.
        let matching_one = RegexQuery::from_regex(r1, field);
        let matching_zero = RegexQuery::from_regex(r2, field);

        verify_regex_query(matching_one, matching_zero, reader);
        Ok(())
    }

    /// An invalid pattern must surface as `TantivyError::InvalidArgument`
    /// carrying the regex compiler's message.
    #[test]
    pub fn test_pattern_error() {
        let (_reader, field) = build_test_index().unwrap();

        match RegexQuery::from_pattern(r"(foo", field) {
            Err(crate::TantivyError::InvalidArgument(msg)) => {
                assert!(msg.contains("error: unclosed group"))
            }
            res => panic!("unexpected result: {res:?}"),
        }
    }
}


================================================
FILE: src/query/reqopt_scorer.rs
================================================
use std::marker::PhantomData;

use crate::docset::{DocSet, SeekDangerResult};
use crate::query::score_combiner::ScoreCombiner;
use crate::query::Scorer;
use crate::{DocId, Score};

/// Given a required scorer and an optional scorer,
/// matches all documents from the required scorer
/// and complements the score using the optional scorer.
///
/// This is useful for queries like `+somethingrequired somethingoptional`.
///
/// Note that `somethingoptional` has no impact on the `DocSet`: iteration
/// (`advance`, `seek`, `doc`, ...) is delegated to the required scorer only.
pub struct RequiredOptionalScorer<TReqScorer, TOptScorer, TScoreCombiner: ScoreCombiner> {
    // Drives the iteration: every document it yields is a match.
    req_scorer: TReqScorer,
    // Only consulted when scoring, to add its contribution when it also
    // matches the current document.
    opt_scorer: TOptScorer,
    // Score already computed for the current document, if any.
    // Reset to `None` whenever the scorer moves to another document.
    score_cache: Option<Score>,
    // The combiner is instantiated on demand when scoring; only its type is needed here.
    _phantom: PhantomData<TScoreCombiner>,
}

impl<TReqScorer, TOptScorer, TScoreCombiner>
    RequiredOptionalScorer<TReqScorer, TOptScorer, TScoreCombiner>
where
    TOptScorer: DocSet,
    TScoreCombiner: ScoreCombiner,
{
    /// Creates a new `RequiredOptionalScorer`.
    ///
    /// `req_scorer` defines the set of matching documents, while `opt_scorer`
    /// only contributes to the score. No score is cached initially.
    pub fn new(
        req_scorer: TReqScorer,
        opt_scorer: TOptScorer,
    ) -> RequiredOptionalScorer<TReqScorer, TOptScorer, TScoreCombiner> {
        Self {
            score_cache: None,
            _phantom: PhantomData,
            req_scorer,
            opt_scorer,
        }
    }
}

impl<TReqScorer, TOptScorer, TScoreCombiner> DocSet
    for RequiredOptionalScorer<TReqScorer, TOptScorer, TScoreCombiner>
where
    TReqScorer: DocSet,
    TOptScorer: DocSet,
    TScoreCombiner: ScoreCombiner,
{
    /// Advances the required scorer; the cached score is dropped first since
    /// it belongs to the document being left.
    fn advance(&mut self) -> DocId {
        let Self {
            req_scorer,
            score_cache,
            ..
        } = self;
        *score_cache = None;
        req_scorer.advance()
    }

    /// Seeks the required scorer to `target`, dropping the cached score.
    fn seek(&mut self, target: DocId) -> DocId {
        let Self {
            req_scorer,
            score_cache,
            ..
        } = self;
        *score_cache = None;
        req_scorer.seek(target)
    }

    /// Forwards `seek_danger` to the required scorer, dropping the cached score.
    fn seek_danger(&mut self, target: DocId) -> SeekDangerResult {
        let Self {
            req_scorer,
            score_cache,
            ..
        } = self;
        *score_cache = None;
        req_scorer.seek_danger(target)
    }

    /// Current document of the required scorer.
    fn doc(&self) -> DocId {
        let required = &self.req_scorer;
        required.doc()
    }

    /// Size hint of the required scorer; the optional scorer is ignored.
    fn size_hint(&self) -> u32 {
        let required = &self.req_scorer;
        required.size_hint()
    }

    /// Cost of the required scorer; the optional scorer is ignored.
    fn cost(&self) -> u64 {
        let required = &self.req_scorer;
        required.cost()
    }
}

impl<TReqScorer, TOptScorer, TScoreCombiner> Scorer
    for RequiredOptionalScorer<TReqScorer, TOptScorer, TScoreCombiner>
where
    TReqScorer: Scorer,
    TOptScorer: Scorer,
    TScoreCombiner: ScoreCombiner,
{
    /// Returns the combined score of the current document.
    ///
    /// The required scorer always contributes. The optional scorer
    /// contributes only if it can be positioned on the very same document.
    /// The result is cached until the scorer moves to another document.
    #[inline]
    fn score(&mut self) -> Score {
        match self.score_cache {
            Some(cached) => cached,
            None => {
                let current_doc = self.doc();
                let mut combiner = TScoreCombiner::default();
                combiner.update(&mut self.req_scorer);
                // The optional scorer is only moved forward: if it already sits
                // past the current document, it cannot match and is left untouched.
                let optional_matches = self.opt_scorer.doc() <= current_doc
                    && self.opt_scorer.seek(current_doc) == current_doc;
                if optional_matches {
                    combiner.update(&mut self.opt_scorer);
                }
                let combined = combiner.score();
                self.score_cache = Some(combined);
                combined
            }
        }
    }
}

#[cfg(test)]
mod tests {
    use super::RequiredOptionalScorer;
    use crate::docset::{DocSet, TERMINATED};
    use crate::postings::tests::test_skip_against_unoptimized;
    use crate::query::score_combiner::{DoNothingCombiner, SumCombiner};
    use crate::query::{ConstScorer, Scorer, VecDocSet};
    use crate::tests::sample_with_seed;

    /// With an empty optional scorer, the doc set is exactly the required one.
    #[test]
    fn test_reqopt_scorer_empty() {
        let required_docs = vec![1, 3, 7];
        let required = ConstScorer::from(VecDocSet::from(required_docs.clone()));
        let optional = ConstScorer::from(VecDocSet::from(vec![]));
        let mut scorer: RequiredOptionalScorer<_, _, SumCombiner> =
            RequiredOptionalScorer::new(required, optional);

        let mut visited = Vec::new();
        loop {
            let doc = scorer.doc();
            if doc == TERMINATED {
                break;
            }
            visited.push(doc);
            scorer.advance();
        }
        assert_eq!(visited, required_docs);
    }

    /// Walks the whole doc set and checks, for each document, that the score
    /// is 2.0 when the optional scorer also matches and 1.0 otherwise.
    #[test]
    fn test_reqopt_scorer() {
        let required = ConstScorer::new(VecDocSet::from(vec![1, 3, 7, 8, 9, 10, 13, 15]), 1.0);
        let optional = ConstScorer::new(VecDocSet::from(vec![1, 2, 7, 11, 12, 15]), 1.0);
        let mut scorer: RequiredOptionalScorer<_, _, SumCombiner> =
            RequiredOptionalScorer::new(required, optional);

        // The scorer starts positioned on the first required document.
        assert_eq!(scorer.doc(), 1);
        assert_eq!(scorer.score(), 2.0);

        // (expected doc, expected score) after each call to `advance`.
        let expected_steps = [
            (3, 1.0),
            (7, 2.0),
            (8, 1.0),
            (9, 1.0),
            (10, 1.0),
            (13, 1.0),
            (15, 2.0),
        ];
        for &(expected_doc, expected_score) in expected_steps.iter() {
            assert_eq!(scorer.advance(), expected_doc);
            assert_eq!(scorer.doc(), expected_doc);
            assert_eq!(scorer.score(), expected_score);
        }
        assert_eq!(scorer.advance(), TERMINATED);
    }

    /// Compares skipping on randomly sampled doc sets against the reference
    /// implementation provided by `test_skip_against_unoptimized`.
    #[test]
    fn test_reqopt_scorer_skip() {
        let required_sample = sample_with_seed(10_000, 0.02, 1);
        let optional_sample = sample_with_seed(10_000, 0.02, 2);
        let skip_targets = sample_with_seed(10_000, 0.001, 3);
        let build_scorer = || {
            Box::new(RequiredOptionalScorer::<_, _, DoNothingCombiner>::new(
                ConstScorer::from(VecDocSet::from(required_sample.clone())),
                ConstScorer::from(VecDocSet::from(optional_sample.clone())),
            ))
        };
        test_skip_against_unoptimized(build_scorer, skip_targets);
    }

    /// Scores must be recomputed after `seek`, and stay stable when `score`
    /// is called repeatedly on the same document.
    #[test]
    fn test_reqopt_scorer_seek() {
        let required = ConstScorer::new(VecDocSet::from(vec![1, 3, 7, 8, 9, 10, 13, 15]), 1.0);
        let optional = ConstScorer::new(VecDocSet::from(vec![2, 7, 11, 12, 15]), 1.0);
        let mut scorer: RequiredOptionalScorer<_, _, SumCombiner> =
            RequiredOptionalScorer::new(required, optional);

        // Doc 1: required only.
        assert_eq!(scorer.score(), 1.0);
        // Doc 7: matched by both scorers.
        assert_eq!(scorer.seek(7), 7);
        assert_eq!(scorer.score(), 2.0);

        // Asking again for the same document yields the same score.
        assert_eq!(scorer.score(), 2.0);
        // 12 is not a required doc: the scorer lands on 13, required only.
        assert_eq!(scorer.seek(12), 13);
        assert_eq!(scorer.score(), 1.0);
    }
}


================================================
FILE: src/query/score_combiner.rs
================================================
use crate::query::Scorer;
use crate::Score;

/// The `ScoreCombiner` trait defines how to compute
/// an overall score given a list of scores.
///
/// A combiner is fed one scorer at a time through [`ScoreCombiner::update`]
/// and the aggregate is read back with [`ScoreCombiner::score`].
pub trait ScoreCombiner: Default + Clone + Send + Copy + 'static {
    /// Aggregates the score combiner with the given scorer.
    ///
    /// The `ScoreCombiner` may decide to call `scorer.score()`
    /// or not.
    fn update<TScorer: Scorer>(&mut self, scorer: &mut TScorer);

    /// Clears the score combiner state back to its initial state.
    fn clear(&mut self);

    /// Returns the aggregate score.
    fn score(&self) -> Score;
}

/// Just ignores scores. The `DoNothingCombiner` does not
/// even call the scorers' `.score()` function.
///
/// It is useful to optimize the case when scoring is disabled.
#[derive(Default, Clone, Copy)] //< these should not be too much work :)
pub struct DoNothingCombiner;

impl ScoreCombiner for DoNothingCombiner {
    /// No-op: the scorer is never asked for its score.
    fn update<TScorer: Scorer>(&mut self, _scorer: &mut TScorer) {}

    /// No-op: this combiner holds no state.
    fn clear(&mut self) {}

    /// Always returns the constant `1.0`.
    #[inline]
    fn score(&self) -> Score {
        1.0
    }
}

/// Sums the scores of the different scorers it is updated with.
#[derive(Default, Clone, Copy)]
pub struct SumCombiner {
    // Running total of the scores seen since creation or the last `clear()`.
    score: Score,
}

impl ScoreCombiner for SumCombiner {
    /// Adds the scorer's current score to the running total.
    fn update<TScorer: Scorer>(&mut self, scorer: &mut TScorer) {
        let contribution = scorer.score();
        self.score += contribution;
    }

    /// Resets the running total to zero.
    fn clear(&mut self) {
        *self = Self::default();
    }

    /// Returns the running total.
    #[inline]
    fn score(&self) -> Score {
        let Self { score } = *self;
        score
    }
}

/// Takes the max score of the different scorers
/// and optionally sums it with the other matches multiplied by `tie_breaker`.
///
/// The resulting score is `max + (sum - max) * tie_breaker`.
#[derive(Default, Clone, Copy)]
pub struct DisjunctionMaxCombiner {
    // Highest score seen so far (starts at 0.0).
    max: Score,
    // Sum of all the scores seen so far, including the highest one.
    sum: Score,
    // Multiplier applied to the scores other than the highest one.
    tie_breaker: Score,
}

impl DisjunctionMaxCombiner {
    /// Creates `DisjunctionMaxCombiner` with tie breaker
    pub fn with_tie_breaker(tie_breaker: Score) -> DisjunctionMaxCombiner {
        DisjunctionMaxCombiner {
            max: 0.0,
            sum: 0.0,
            tie_breaker,
        }
    }
}

impl ScoreCombiner for DisjunctionMaxCombiner {
    /// Records the scorer's current score in both the max and the sum.
    fn update<TScorer: Scorer>(&mut self, scorer: &mut TScorer) {
        let current = scorer.score();
        self.sum += current;
        self.max = current.max(self.max);
    }

    /// Resets the accumulated max and sum, keeping the tie breaker.
    fn clear(&mut self) {
        let tie_breaker = self.tie_breaker;
        *self = Self {
            max: 0.0,
            sum: 0.0,
            tie_breaker,
        };
    }

    /// Returns the max score plus the tie-broken sum of the other scores.
    #[inline]
    fn score(&self) -> Score {
        // `sum` includes the max itself, hence the subtraction.
        let sum_of_others = self.sum - self.max;
        self.max + sum_of_others * self.tie_breaker
    }
}


================================================
FILE: src/query/scorer.rs
================================================
use std::ops::DerefMut;

use downcast_rs::impl_downcast;

use crate::docset::DocSet;
use crate::Score;

/// Scored set of documents matching a query within a specific segment.
///
/// A `Scorer` is a [`DocSet`] that can additionally compute a score for the
/// document it is currently positioned on.
///
/// See [`Query`](crate::query::Query).
pub trait Scorer: downcast_rs::Downcast + DocSet + 'static {
    /// Returns the score.
    ///
    /// This method will perform a bit of computation and is not cached:
    /// callers needing the score several times should keep the result around.
    fn score(&mut self) -> Score;
}

// Lets a `dyn Scorer` be downcast to its concrete type (see `downcast_rs`).
impl_downcast!(Scorer);

impl Scorer for Box<dyn Scorer> {
    /// Forwards the call to the boxed scorer.
    #[inline]
    fn score(&mut self) -> Score {
        let inner = self.deref_mut();
        inner.score()
    }
}


================================================
FILE: src/query/set_query.rs
================================================
use std::collections::HashMap;

use tantivy_fst::raw::CompiledAddr;
use tantivy_fst::{Automaton, Map};

use crate::query::score_combiner::DoNothingCombiner;
use crate::query::{AutomatonWeight, BooleanWeight, EnableScoring, Occur, Query, Weight};
use crate::schema::{Field, Schema};
use crate::Term;

/// A Term Set Query matches all of the documents containing any of the
/// provided terms.
///
/// Terms may target different fields.
#[derive(Debug, Clone)]
pub struct TermSetQuery {
    // Terms grouped by field. Each list is kept sorted and deduplicated,
    // which is what building the per-field term map relies on.
    terms_map: HashMap<Field, Vec<Term>>,
}

impl TermSetQuery {
    /// Create a Term Set Query
    pub fn new<T: IntoIterator<Item = Term>>(terms: T) -> Self {
        let mut terms_map: HashMap<_, Vec<_>> = HashMap::new();
        for term in terms {
            terms_map.entry(term.field()).or_default().push(term);
        }

        for terms in terms_map.values_mut() {
            terms.sort_unstable();
            terms.dedup();
        }

        TermSetQuery { terms_map }
    }

    fn specialized_weight(
        &self,
        schema: &Schema,
    ) -> crate::Result<BooleanWeight<DoNothingCombiner>> {
        let mut sub_queries: Vec<(_, Box<dyn Weight>)> = Vec::with_capacity(self.terms_map.len());

        for (&field, sorted_terms) in self.terms_map.iter() {
            let field_entry = schema.get_field_entry(field);
            let field_type = field_entry.field_type();
            if !field_type.is_indexed() {
                let error_msg = format!("Field {:?} is not indexed.", field_entry.name());
                return Err(crate::TantivyError::SchemaError(error_msg));
            }

            // In practice this won't fail because:
            // - we are writing to memory, so no IoError
            // - Terms are ordered
            let map = Map::from_iter(
                sorted_terms
                    .iter()
                    .map(|key| (key.serialized_value_bytes(), 0)),
            )
            .map_err(std::io::Error::other)?;

            sub_queries.push((
                Occur::Should,
                Box::new(AutomatonWeight::new(field, SetDfaWrapper(map))),
            ));
        }

        Ok(BooleanWeight::new(
            sub_queries,
            false,
            Box::new(|| DoNothingCombiner),
        ))
    }
}

impl Query for TermSetQuery {
    /// Builds the boxed weight of this query using the schema carried by
    /// `enable_scoring`.
    fn weight(&self, enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let schema = enable_scoring.schema();
        let weight = self.specialized_weight(schema)?;
        Ok(Box::new(weight))
    }

    /// Calls `visitor` once per term of the set, passing `false` as its
    /// second argument.
    fn query_terms<'a>(&'a self, visitor: &mut dyn FnMut(&'a Term, bool)) {
        for term in self.terms_map.values().flatten() {
            visitor(term, false);
        }
    }
}

/// Exposes the FST backing a `Map` as an `Automaton`.
///
/// A state is the address of a node of the wrapped FST, or `None` once an
/// input byte had no matching transition.
struct SetDfaWrapper(Map<Vec<u8>>);

impl Automaton for SetDfaWrapper {
    type State = Option<CompiledAddr>;

    /// Starts at the root node of the wrapped FST.
    fn start(&self) -> Option<CompiledAddr> {
        let root = self.0.as_ref().root();
        Some(root.addr())
    }

    /// A state matches when it designates a final node.
    fn is_match(&self, state_opt: &Option<CompiledAddr>) -> bool {
        match *state_opt {
            Some(addr) => self.0.as_ref().node(addr).is_final(),
            None => false,
        }
    }

    /// Follows the transition labelled `byte`, if the current node has one.
    fn accept(&self, state_opt: &Option<CompiledAddr>, byte: u8) -> Option<CompiledAddr> {
        (*state_opt).and_then(|addr| {
            let node = self.0.as_ref().node(addr);
            node.find_input(byte)
                .map(|transition| node.transition_addr(transition))
        })
    }

    /// Only the `None` state can never lead to a match.
    fn can_match(&self, state: &Self::State) -> bool {
        !state.is_none()
    }
}

#[cfg(test)]
mod tests {
    use crate::collector::TopDocs;
    use crate::query::{QueryParser, TermSetQuery};
    use crate::schema::{Schema, TEXT};
    use crate::{assert_nearly_equals, Index, IndexWriter, Term};

    /// Exercises `TermSetQuery` on a small two-field index: single and
    /// multiple terms, absent terms, duplicated terms, terms spanning several
    /// fields, and the absence of crosstalk between fields.
    #[test]
    pub fn test_term_set_query() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let field1 = schema_builder.add_text_field("field1", TEXT);
        let field2 = schema_builder.add_text_field("field2", TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            index_writer.add_document(doc!(
                field1 => "doc1",
                field2 => "val1",
            ))?;
            index_writer.add_document(doc!(
                field1 => "doc2",
                field2 => "val2",
            ))?;
            index_writer.add_document(doc!(
                field1 => "doc3",
                field2 => "val3",
            ))?;
            // Same values as the previous document, but with the fields swapped:
            // used below to check that fields do not leak into each other.
            index_writer.add_document(doc!(
                field1 => "val3",
                field2 => "doc3",
            ))?;
            index_writer.commit()?;
        }
        let reader = index.reader()?;
        let searcher = reader.searcher();

        {
            // single element
            let terms = vec![Term::from_field_text(field1, "doc1")];

            let term_set_query = TermSetQuery::new(terms);
            let top_docs =
                searcher.search(&term_set_query, &TopDocs::with_limit(2).order_by_score())?;
            assert_eq!(top_docs.len(), 1, "Expected 1 document");
            let (score, _) = top_docs[0];
            assert_nearly_equals!(1.0, score);
        }

        {
            // single element, absent
            let terms = vec![Term::from_field_text(field1, "doc4")];

            let term_set_query = TermSetQuery::new(terms);
            let top_docs =
                searcher.search(&term_set_query, &TopDocs::with_limit(1).order_by_score())?;
            assert!(top_docs.is_empty(), "Expected 0 document");
        }

        {
            // multiple elements
            let terms = vec![
                Term::from_field_text(field1, "doc1"),
                Term::from_field_text(field1, "doc2"),
            ];

            let term_set_query = TermSetQuery::new(terms);
            let top_docs =
                searcher.search(&term_set_query, &TopDocs::with_limit(2).order_by_score())?;
            assert_eq!(top_docs.len(), 2, "Expected 2 documents");
            for (score, _) in top_docs {
                assert_nearly_equals!(1.0, score);
            }
        }

        {
            // multiple elements, mixed fields
            // (the duplicated term must not produce a duplicated hit)
            let terms = vec![
                Term::from_field_text(field1, "doc1"),
                Term::from_field_text(field1, "doc1"),
                Term::from_field_text(field2, "val2"),
            ];

            let term_set_query = TermSetQuery::new(terms);
            let top_docs =
                searcher.search(&term_set_query, &TopDocs::with_limit(3).order_by_score())?;

            assert_eq!(top_docs.len(), 2, "Expected 2 document");
            for (score, _) in top_docs {
                assert_nearly_equals!(1.0, score);
            }
        }

        {
            // no field crosstalk
            // "doc3" appears in `field1` of one document and in `field2` of another:
            // each single-field query must only see its own document.
            let terms = vec![Term::from_field_text(field1, "doc3")];

            let term_set_query = TermSetQuery::new(terms);
            let top_docs =
                searcher.search(&term_set_query, &TopDocs::with_limit(3).order_by_score())?;
            assert_eq!(top_docs.len(), 1, "Expected 1 document");

            let terms = vec![Term::from_field_text(field2, "doc3")];

            let term_set_query = TermSetQuery::new(terms);
            let top_docs =
                searcher.search(&term_set_query, &TopDocs::with_limit(3).order_by_score())?;
            assert_eq!(top_docs.len(), 1, "Expected 1 document");

            // Querying both fields at once returns both documents.
            let terms = vec![
                Term::from_field_text(field1, "doc3"),
                Term::from_field_text(field2, "doc3"),
            ];

            let term_set_query = TermSetQuery::new(terms);
            let top_docs =
                searcher.search(&term_set_query, &TopDocs::with_limit(3).order_by_score())?;
            assert_eq!(top_docs.len(), 2, "Expected 2 document");
        }

        Ok(())
    }

    /// Checks the `field: IN [...]` syntax of the query parser end to end:
    /// two of the three indexed values are listed, so two documents match.
    #[test]
    fn test_term_set_query_parser() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("field", TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema.clone());
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        let field = schema.get_field("field").unwrap();
        index_writer.add_document(doc!(
          field => "val1",
        ))?;
        index_writer.add_document(doc!(
          field => "val2",
        ))?;
        index_writer.add_document(doc!(
          field => "val3",
        ))?;
        index_writer.commit()?;
        let reader = index.reader()?;
        let searcher = reader.searcher();
        let query_parser = QueryParser::for_index(&index, vec![]);
        let query = query_parser.parse_query("field: IN [val1 val2]")?;
        let top_docs = searcher.search(&query, &TopDocs::with_limit(3).order_by_score())?;
        assert_eq!(top_docs.len(), 2);
        Ok(())
    }
}


================================================
FILE: src/query/size_hint.rs
================================================
/// Estimates how many documents belong to the intersection of several docsets,
/// knowing only the size of each docset.
///
/// # Arguments
/// * `docset_sizes` - An iterator over the sizes of the docsets (number of documents in each set).
/// * `max_docs` - The maximum number of docs that can hit, usually number of documents in the
///   segment.
///
/// # Returns
/// The estimated number of documents in the intersection. It is `0` when
/// `max_docs` is `0` or when no docset is provided, and it never exceeds the
/// size of the smallest docset.
pub fn estimate_intersection<I>(mut docset_sizes: I, max_docs: u32) -> u32
where I: Iterator<Item = u32> {
    if max_docs == 0u32 {
        return 0u32;
    }

    // Without any docset, there is nothing to intersect.
    let first_size = match docset_sizes.next() {
        Some(size) => f64::from(size),
        None => return 0,
    };
    let segment_size = f64::from(max_docs);

    // State: (running estimate, smallest docset seen, co-location factor).
    //
    // Assuming a random distribution of terms, each additional set scales the
    // estimate by the probability of a document being in that set. Terms tend
    // not to be randomly distributed though, hence a co-location factor
    // (starting at 1.3), diminished for each additional set (down to 1.0) to
    // avoid overestimating.
    let (estimate, smallest_size, _) = docset_sizes.fold(
        (first_size, first_size, 1.3f64),
        |(estimate, smallest_size, co_loc_factor), size| {
            let size = f64::from(size);
            let co_loc_factor = (co_loc_factor - 0.1).max(1.0);
            let scaled = estimate * ((size / segment_size) * co_loc_factor);
            (scaled, smallest_size.min(size), co_loc_factor)
        },
    );

    estimate.round().min(smallest_size) as u32
}

/// Computes the estimated number of documents in the union of multiple docsets
/// given their sizes.
///
/// # Arguments
/// * `docset_sizes` - An iterator over the sizes of the docsets (number of documents in each set).
/// * `max_docs` - The maximum number of docs that can hit, usually number of documents in the
///   segment.
///
/// # Returns
/// The estimated number of documents in the union. It is `0` when `max_docs`
/// is `0` or when no docset is provided, and it never exceeds `max_docs`.
pub fn estimate_union<I>(docset_sizes: I, max_docs: u32) -> u32
where I: Iterator<Item = u32> {
    // An empty segment cannot produce any hit. Handling it explicitly (like
    // `estimate_intersection` does) avoids dividing by zero below.
    if max_docs == 0u32 {
        return 0u32;
    }
    let max_docs = max_docs as f64;

    // Terms tend to be not really randomly distributed.
    // This factor is used to adjust the estimate.
    // Unlike intersection, the co-location reduces the estimate.
    let co_loc_factor = 0.8;

    // The approach for union is to compute the probability of a document not being in any of the
    // sets
    let mut not_in_any_set_prob = 1.0;

    // Assuming random distribution of terms, the probability of a document being in the
    // union is the complement of the probability of it not being in any of the sets.
    for size in docset_sizes {
        // A probability cannot exceed 1.0. Without the clamp, a reported size
        // larger than `max_docs / co_loc_factor` makes `1.0 - prob_in_set`
        // negative: the sign of the product then flips with every such set and
        // the estimate shrinks although the union can only grow.
        let prob_in_set = ((size as f64 / max_docs) * co_loc_factor).min(1.0);
        not_in_any_set_prob *= 1.0 - prob_in_set;
    }

    let union_estimate = (max_docs * (1.0 - not_in_any_set_prob)).round();

    union_estimate.min(max_docs) as u32
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Estimates the intersection of docsets whose sizes are given as a slice.
    fn intersection_of(sizes: &[u32], max_docs: u32) -> u32 {
        estimate_intersection(sizes.iter().copied(), max_docs)
    }

    /// Estimates the union of docsets whose sizes are given as a slice.
    fn union_of(sizes: &[u32], max_docs: u32) -> u32 {
        estimate_union(sizes.iter().copied(), max_docs)
    }

    #[test]
    fn test_estimate_intersection_small1() {
        assert_eq!(intersection_of(&[500, 1000], 10_000), 60);
    }

    #[test]
    fn test_estimate_intersection_small2() {
        assert_eq!(intersection_of(&[500, 1000, 1500], 10_000), 10);
    }

    #[test]
    fn test_estimate_intersection_large_values() {
        assert_eq!(intersection_of(&[100_000, 50_000, 30_000], 1_000_000), 198);
    }

    #[test]
    fn test_estimate_union_small() {
        assert_eq!(union_of(&[500, 1000, 1500], 10000), 2228);
    }

    #[test]
    fn test_estimate_union_large_values() {
        assert_eq!(union_of(&[100000, 50000, 30000], 1000000), 137997);
    }

    #[test]
    fn test_estimate_intersection_large() {
        let sizes = vec![4_000_000u32; 10];
        // Check that it doesn't overflow and returns a reasonable result
        assert_eq!(intersection_of(&sizes, 5_000_000), 708_670);
    }

    #[test]
    fn test_estimate_intersection_overflow_safety() {
        let sizes = vec![4_000_000u32; 100];
        // Check that it doesn't overflow and returns a reasonable result
        assert_eq!(intersection_of(&sizes, 5_000_000), 0);
    }

    #[test]
    fn test_estimate_union_overflow_safety() {
        let sizes = vec![1_000_000u32; 100];
        // Check that it doesn't overflow and returns a reasonable result
        assert_eq!(union_of(&sizes, 20_000_000), 19_662_594);
    }
}


================================================
FILE: src/query/term_query/mod.rs
================================================
mod term_query;
mod term_scorer;
mod term_weight;

pub use self::term_query::TermQuery;
pub use self::term_scorer::TermScorer;
#[cfg(test)]
mod tests {

    use crate::collector::TopDocs;
    use crate::docset::DocSet;
    use crate::postings::compression::COMPRESSION_BLOCK_SIZE;
    use crate::query::term_query::TermScorer;
    use crate::query::{
        AllScorer, EmptyScorer, EnableScoring, Query, QueryParser, Scorer, TermQuery,
    };
    use crate::schema::{Field, IndexRecordOption, Schema, FAST, STRING, TEXT};
    use crate::{assert_nearly_equals, DocAddress, Index, IndexWriter, Term, TERMINATED};

    #[test]
    pub fn test_term_query_no_freq() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", STRING);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        {
            // writing the segment
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            let doc = doc!(text_field => "a");
            index_writer.add_document(doc)?;
            index_writer.commit()?;
        }
        let searcher = index.reader()?.searcher();
        let term_query = TermQuery::new(
            Term::from_field_text(text_field, "a"),
            IndexRecordOption::Basic,
        );
        let term_weight = term_query.weight(EnableScoring::enabled_from_searcher(&searcher))?;
        let segment_reader = searcher.segment_reader(0);
        let mut term_scorer = term_weight.scorer(segment_reader, 1.0)?;
        assert_eq!(term_scorer.doc(), 0);
        assert_nearly_equals!(term_scorer.score(), 0.28768212);
        Ok(())
    }

    /// Indexes exactly `COMPRESSION_BLOCK_SIZE` documents that all contain the
    /// term `"a"`, then walks the term scorer one document at a time and checks
    /// that it ends on `TERMINATED` right after the last document.
    #[test]
    pub fn test_term_query_multiple_of_block_len() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", STRING);
        let index = Index::create_in_ram(schema_builder.build());
        {
            // Write a single segment holding all the documents.
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            for _ in 0..COMPRESSION_BLOCK_SIZE {
                index_writer.add_document(doc!(text_field => "a"))?;
            }
            index_writer.commit()?;
        }
        let searcher = index.reader()?.searcher();
        let term = Term::from_field_text(text_field, "a");
        let term_query = TermQuery::new(term, IndexRecordOption::Basic);
        let term_weight = term_query.weight(EnableScoring::enabled_from_searcher(&searcher))?;
        let mut term_scorer = term_weight.scorer(searcher.segment_reader(0), 1.0)?;

        let num_docs = COMPRESSION_BLOCK_SIZE as u32;
        for doc in 0u32..num_docs {
            assert_eq!(term_scorer.doc(), doc);
            // Advancing from the last document must exhaust the scorer.
            let expected_next = if doc + 1u32 == num_docs {
                TERMINATED
            } else {
                doc + 1
            };
            assert_eq!(term_scorer.advance(), expected_next);
        }
        assert_eq!(term_scorer.doc(), TERMINATED);
        Ok(())
    }

    /// Checks the exact scores produced by term queries (and a parsed two-clause
    /// query) over a two-document index.
    ///
    /// The first document populates the `left`, `right` and `large` fields; the
    /// second one only populates `left`. The expected scores below are pinned
    /// values, so the document contents must not be altered.
    #[test]
    pub fn test_term_weight() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let left_field = schema_builder.add_text_field("left", TEXT);
        let right_field = schema_builder.add_text_field("right", TEXT);
        let large_field = schema_builder.add_text_field("large", TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            // NOTE: the `large` literal spans two source lines, so it contains a newline.
            index_writer.add_document(doc!(
                left_field => "left1 left2 left2 left2f2 left2f2 left3 abcde abcde abcde abcde abcde abcde abcde abcde abcde abcewde abcde abcde",
                right_field => "right1 right2",
                large_field => "large0 large1 large2 large3 large4 large5 large6 large7 large8 large9 large10 large11 large12 large13 large14 large15 large16 large17 large18 large19 large20 large21 large22 large23 large24 large25 large26 large27 large28 large29 large30 large31 large32 large33 large34 large35 large36 large37 large38 large39 large40 large41 large42 large43 large44 large45 large46 large47 large48 large49 large50 large51 large52 large53 large54 large55 large56 large57 large58 large59 large60 large61 large62 large63 large64 large65 large66 large67 large68 large69 large70 large71 large72 large73 large74 large75 large76 large77 large78 large79 large80 large81 large82 large83 large84 large85 large86 large87 large88 large89 large90 large91 large92 large93 large94 large95 large96 large97 large98 large99 large100 large101 large102 large103 large104 large105 large106 large107 large108 large109 large110 large111 large112 large113 large114 large115 large116 large117 large118 large119 large120 large121 large122 large123 large124 large125 large126 large127 large128 large129 large130 large131 large132 large133 large134 large135 large136 large137 large138 large139 large140 large141 large142 large143 large144 large145 large146 large147 large148 large149 large150 large151 large152 large153 large154 large155 large156 large157 large158 large159 large160 large161 large162 large163 large164 large165 large166 large167 large168 large169 large170 large171 large172 large173 large174 large175 large176 large177 large178 large179 large180 large181 large182 large183 large184 large185 large186 large187 large188 large189 large190 large191 large192 large193 large194 large195 large196 large197 large198 large199 large200 large201 large202 large203 large204 large205 large206 large207 large208 large209 large210 large211 large212 large213 large214 large215 large216 large217 large218 large219 large220 large221 large222 large223 large224 large225 large226 large227 large228 large229 
large230 large231 large232 large233 large234 large235 large236 large237 large238 large239 large240 large241 large242 large243 large244 large245 large246 large247 large248 large249 large250 large251 large252 large253 large254 large255 large256 large257 large258 large259 large260 large261 large262 large263 large264 large265 large266 large267 large268 large269 large270 large271 large272 large273 large274 large275 large276 large277 large278 large279 large280 large281 large282 large283 large284 large285 large286"
            ))?;
            index_writer.add_document(doc!(left_field => "left4 left1"))?;
            index_writer.commit()?;
        }
        let searcher = index.reader()?.searcher();
        {
            // "left2" only appears in the first document, so a single hit is expected.
            let term = Term::from_field_text(left_field, "left2");
            let term_query = TermQuery::new(term, IndexRecordOption::WithFreqs);
            let topdocs = searcher.search(&term_query, &TopDocs::with_limit(2).order_by_score())?;
            assert_eq!(topdocs.len(), 1);
            let (score, _) = topdocs[0];
            assert_nearly_equals!(0.77802235, score);
        }
        {
            // "left1" appears in both documents, so two hits with distinct scores are expected.
            let term = Term::from_field_text(left_field, "left1");
            let term_query = TermQuery::new(term, IndexRecordOption::WithFreqs);
            let top_docs =
                searcher.search(&term_query, &TopDocs::with_limit(2).order_by_score())?;
            assert_eq!(top_docs.len(), 2);
            let (score1, _) = top_docs[0];
            assert_nearly_equals!(0.27101856, score1);
            let (score2, _) = top_docs[1];
            assert_nearly_equals!(0.13736556, score2);
        }
        {
            // Same terms, this time combined through the query parser into one query.
            let query_parser = QueryParser::for_index(&index, Vec::new());
            let query = query_parser.parse_query("left:left2 left:left1")?;
            let top_docs = searcher.search(&query, &TopDocs::with_limit(2).order_by_score())?;
            assert_eq!(top_docs.len(), 2);
            let (score1, _) = top_docs[0];
            assert_nearly_equals!(0.9153879, score1);
            let (score2, _) = top_docs[1];
            assert_nearly_equals!(0.27101856, score2);
        }
        Ok(())
    }

    /// `TermQuery::count` must not count documents that were deleted: two
    /// documents contain "a", one of them is removed through a delete on "b",
    /// so a single document is expected.
    #[test]
    fn test_term_query_count_when_there_are_deletes() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());

        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        index_writer.add_document(doc!(text_field=>"a b"))?;
        index_writer.add_document(doc!(text_field=>"a c"))?;
        // Removes the first document, which is the only one containing "b".
        index_writer.delete_term(Term::from_field_text(text_field, "b"));
        index_writer.commit()?;

        let reader = index.reader()?;
        let term_query = TermQuery::new(
            Term::from_field_text(text_field, "a"),
            IndexRecordOption::Basic,
        );
        let num_matches = term_query.count(&reader.searcher())?;
        assert_eq!(num_matches, 1);
        Ok(())
    }

    /// Seeks a non-scoring term scorer from the first matching document to the
    /// second one.
    #[test]
    fn test_term_query_simple_seek() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());

        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        for _ in 0..2 {
            index_writer.add_document(doc!(text_field=>"a"))?;
        }
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();
        let term_query = TermQuery::new(
            Term::from_field_text(text_field, "a"),
            IndexRecordOption::Basic,
        );
        // Scoring is disabled: only the docset behavior is exercised here.
        let scoring = EnableScoring::disabled_from_schema(searcher.schema());
        let term_weight = term_query.weight(scoring)?;
        let mut term_scorer = term_weight.scorer(searcher.segment_reader(0u32), 1.0)?;

        assert_eq!(term_scorer.doc(), 0u32);
        term_scorer.seek(1u32);
        assert_eq!(term_scorer.doc(), 1u32);
        Ok(())
    }

    /// Pins the `Debug` representation of a `TermQuery`: it only shows the
    /// term, not the index record option.
    #[test]
    fn test_term_query_debug() {
        let term = Term::from_field_text(Field::from_field_id(1), "hello");
        let term_query = TermQuery::new(term, IndexRecordOption::WithFreqs);
        let expected_repr = r#"TermQuery(Term(field=1, type=Str, "hello"))"#;
        assert_eq!(format!("{term_query:?}"), expected_repr);
    }

    /// `explain` returns the score explanation for a matching document and an
    /// `InvalidArgument` error for documents that do not contain the term.
    #[test]
    fn test_term_query_explain() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let index = Index::create_in_ram(schema_builder.build());

        // Doc ids 1 and 2 contain "a"; doc ids 0 and 3 contain "b".
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        for text in ["b", "a", "a", "b"] {
            index_writer.add_document(doc!(text_field=>text))?;
        }
        index_writer.commit()?;

        let searcher = index.reader()?.searcher();
        let term_query = TermQuery::new(
            Term::from_field_text(text_field, "a"),
            IndexRecordOption::Basic,
        );

        // Matching document: the explanation carries the expected score.
        let explanation = term_query.explain(&searcher, DocAddress::new(0u32, 1u32))?;
        assert_nearly_equals!(explanation.value(), std::f32::consts::LN_2);

        // Non-matching documents: explaining them is an error.
        for non_matching_doc in [0u32, 3u32] {
            let explanation_err =
                term_query.explain(&searcher, DocAddress::new(0u32, non_matching_doc));
            assert!(matches!(
                explanation_err,
                Err(crate::TantivyError::InvalidArgument(_))
            ));
        }
        Ok(())
    }

    /// A `TermQuery` on a numeric field that is FAST but not indexed must
    /// still count the matching documents (scoring disabled via `Count`).
    #[test]
    fn test_term_query_fallback_to_fastfield() -> crate::Result<()> {
        use crate::collector::Count;
        use crate::schema::FAST;

        // The field is only stored as a fast field: there is no inverted index for it.
        let mut schema_builder = Schema::builder();
        let num_field = schema_builder.add_u64_field("num", FAST);
        let index = Index::create_in_ram(schema_builder.build());

        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            for value in [10u64, 20u64, 10u64] {
                index_writer.add_document(doc!(num_field => value))?;
            }
            index_writer.commit()?;
        }

        let reader = index.reader()?;
        let searcher = reader.searcher();

        // (queried value, number of documents holding that value)
        for (value, expected_count) in [(10u64, 2), (20u64, 1), (30u64, 0)] {
            let term_query = TermQuery::new(
                Term::from_field_u64(num_field, value),
                IndexRecordOption::Basic,
            );
            assert_eq!(searcher.search(&term_query, &Count)?, expected_count);
        }

        Ok(())
    }

    /// Same as the numeric fallback test, but for a text field that is FAST
    /// and not indexed.
    #[test]
    fn test_term_query_fallback_text_fast_only() -> crate::Result<()> {
        use crate::collector::Count;

        // Text field declared with FAST only: no inverted index is available.
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", FAST);
        let index = Index::create_in_ram(schema_builder.build());

        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            for text in ["hello", "world", "hello"] {
                index_writer.add_document(doc!(text_field => text))?;
            }
            index_writer.commit()?;
        }

        let searcher = index.reader()?.searcher();

        // (queried text, number of documents holding exactly that text)
        for (text, expected_count) in [("hello", 2), ("world", 1), ("nope", 0)] {
            let term_query = TermQuery::new(
                Term::from_field_text(text_field, text),
                IndexRecordOption::Basic,
            );
            assert_eq!(searcher.search(&term_query, &Count)?, expected_count);
        }

        Ok(())
    }

    /// Term queries on a JSON field that is FAST and not indexed: both a
    /// numeric path (`a`) and a string path (`b`) must be countable.
    #[test]
    fn test_term_query_fallback_json_fast_only() -> crate::Result<()> {
        use crate::collector::Count;
        use crate::fastfield::FastValue;
        use crate::schema::FAST;

        /// Builds a JSON term for `path` holding the fast value `v`.
        fn json_term_fast<T: FastValue>(field: Field, path: &str, v: T) -> Term {
            let mut term = Term::from_field_json_path(field, path, true);
            term.append_type_and_fast_value(v);
            term
        }
        /// Builds a JSON term for `path` holding the string `v`.
        fn json_term_str(field: Field, path: &str, v: &str) -> Term {
            let mut term = Term::from_field_json_path(field, path, true);
            term.append_type_and_str(v);
            term
        }

        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", FAST);
        let index = Index::create_in_ram(schema_builder.build());

        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            index_writer.add_document(doc!(json_field => json!({"a": 10, "b": "x"})))?;
            index_writer.add_document(doc!(json_field => json!({"a": 20, "b": "y"})))?;
            index_writer.add_document(doc!(json_field => json!({"a": 10, "b": "z"})))?;
            index_writer.commit()?;
        }

        let searcher = index.reader()?.searcher();

        // Numeric path: (value of `a`, expected number of documents).
        for (value, expected_count) in [(10u64, 2), (20u64, 1), (30u64, 0)] {
            let term_query = TermQuery::new(
                json_term_fast(json_field, "a", value),
                IndexRecordOption::Basic,
            );
            assert_eq!(searcher.search(&term_query, &Count)?, expected_count);
        }

        // String path: (value of `b`, expected number of documents).
        for (value, expected_count) in [("x", 1), ("y", 1), ("missing", 0)] {
            let term_query = TermQuery::new(
                json_term_str(json_field, "b", value),
                IndexRecordOption::Basic,
            );
            assert_eq!(searcher.search(&term_query, &Count)?, expected_count);
        }
        Ok(())
    }

    /// Term queries on an IP address field that is FAST and not indexed must
    /// still count the matching documents.
    #[test]
    fn test_term_query_fallback_ip_fast_only() -> crate::Result<()> {
        use std::net::IpAddr;
        use std::str::FromStr;

        use crate::collector::Count;
        use crate::schema::{IntoIpv6Addr, FAST};

        let mut schema_builder = Schema::builder();
        let ip_field = schema_builder.add_ip_addr_field("ip", FAST);
        let index = Index::create_in_ram(schema_builder.build());

        // ip1 is indexed twice, ip2 once, ip3 never.
        let ip1 = IpAddr::from_str("127.0.0.1").unwrap().into_ipv6_addr();
        let ip2 = IpAddr::from_str("127.0.0.2").unwrap().into_ipv6_addr();
        let ip3 = IpAddr::from_str("127.0.0.3").unwrap().into_ipv6_addr();
        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            for ip in [ip1, ip2, ip1] {
                index_writer.add_document(doc!(ip_field => ip))?;
            }
            index_writer.commit()?;
        }

        let searcher = index.reader()?.searcher();
        for (ip, expected_count) in [(ip1, 2), (ip2, 1), (ip3, 0)] {
            let term_query = TermQuery::new(
                Term::from_field_ip_addr(ip_field, ip),
                IndexRecordOption::Basic,
            );
            assert_eq!(searcher.search(&term_query, &Count)?, expected_count);
        }
        Ok(())
    }

    /// When scoring is required, a `TermQuery` on a field that is FAST but not
    /// indexed must fail with a `SchemaError` instead of using the fast field.
    #[test]
    fn test_term_query_fallback_fastfield_with_scores_errors() -> crate::Result<()> {
        use crate::collector::TopDocs;

        // Numeric field declared with FAST only (not indexed).
        let mut schema_builder = Schema::builder();
        let num_field = schema_builder.add_u64_field("num", FAST);
        let index = Index::create_in_ram(schema_builder.build());

        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            for value in [10u64, 20u64] {
                index_writer.add_document(doc!(num_field => value))?;
            }
            index_writer.commit()?;
        }

        let searcher = index.reader()?.searcher();
        let term_query = TermQuery::new(
            Term::from_field_u64(num_field, 10u64),
            IndexRecordOption::Basic,
        );

        // Ordering the top docs by score requires scoring, which is not
        // possible without an inverted index on the field.
        let top_docs_by_score = TopDocs::with_limit(1).order_by_score();
        let search_result = searcher.search(&term_query, &top_docs_by_score);
        assert!(matches!(
            search_result,
            Err(crate::TantivyError::SchemaError(_))
        ));

        Ok(())
    }

    /// With scoring disabled, the scorer type depends on how many documents of
    /// the segment contain the term: all of them, some of them, or none.
    #[test]
    fn test_term_weight_all_query_optimization() {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", crate::schema::TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema.clone());
        let mut index_writer = index.writer_for_tests().unwrap();
        for text in ["hello", "hello happy"] {
            index_writer.add_document(doc!(text_field=>text)).unwrap();
        }
        index_writer.commit().unwrap();
        let searcher = index.reader().unwrap().searcher();

        // Builds the non-scoring scorer of `term` on the only segment.
        let scorer_for = |term: &str| {
            let term_query = TermQuery::new(
                Term::from_field_text(text_field, term),
                IndexRecordOption::Basic,
            );
            let scoring_disabled = EnableScoring::disabled_from_schema(&schema);
            let term_weight = term_query.weight(scoring_disabled).unwrap();
            term_weight
                .scorer(searcher.segment_reader(0u32), 1.0f32)
                .unwrap()
        };

        // "hello" is in every document.
        let match_all_scorer = scorer_for("hello");
        // "happy" is in only one of the two documents.
        let match_some_scorer = scorer_for("happy");
        // "tax" is in no document.
        let empty_scorer = scorer_for("tax");

        assert!(match_all_scorer.is::<AllScorer>());
        assert!(match_some_scorer.is::<TermScorer>());
        assert!(empty_scorer.is::<EmptyScorer>());
    }

    /// With scoring enabled, a term present in every document must still get a
    /// regular `TermScorer` (no `AllScorer` shortcut); an absent term still
    /// gets an `EmptyScorer`.
    #[test]
    fn test_term_weight_all_query_optimization_disable_when_scoring_enabled() {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", crate::schema::TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema.clone());
        let mut index_writer = index.writer_for_tests().unwrap();
        for text in ["hello", "hello happy"] {
            index_writer.add_document(doc!(text_field=>text)).unwrap();
        }
        index_writer.commit().unwrap();
        let searcher = index.reader().unwrap().searcher();

        // Builds the scoring scorer of `term` on the only segment.
        let scorer_for = |term: &str| {
            let term_query = TermQuery::new(
                Term::from_field_text(text_field, term),
                IndexRecordOption::Basic,
            );
            let scoring_enabled = EnableScoring::enabled_from_searcher(&searcher);
            let term_weight = term_query.weight(scoring_enabled).unwrap();
            term_weight
                .scorer(searcher.segment_reader(0u32), 1.0f32)
                .unwrap()
        };

        // "hello" is in every document, yet a term scorer is expected.
        let all_docs_scorer = scorer_for("hello");
        // "happy" is in only one document: a term scorer as well.
        let one_doc_scorer = scorer_for("happy");
        // "tax" is in no document: an empty scorer.
        let empty_scorer = scorer_for("tax");

        assert!(all_docs_scorer.is::<TermScorer>());
        assert!(one_doc_scorer.is::<TermScorer>());
        assert!(empty_scorer.is::<EmptyScorer>());
    }
}


================================================
FILE: src/query/term_query/term_query.rs
================================================
use std::fmt;
use std::ops::Bound;

use super::term_weight::TermWeight;
use crate::query::bm25::Bm25Weight;
use crate::query::range_query::is_type_valid_for_fastfield_range_query;
use crate::query::{EnableScoring, Explanation, Query, RangeQuery, Weight};
use crate::schema::IndexRecordOption;
use crate::Term;

/// A Term query matches all of the documents
/// containing a specific term.
///
/// When scoring is enabled, the score is computed by a `Bm25Weight` built
/// from the statistics of the term (see [`TermQuery::specialized_weight`]).
/// For each matching document, that weight is fed:
/// * `term_freq`    - the term frequency reported by the postings for the document
/// * `fieldnorm_id` - the fieldnorm id of the document for the field.
///
/// When scoring is disabled, a constant placeholder weight is used instead.
///
/// If the field is not indexed but is a fast field of a supported type, and
/// scoring is disabled, the query is executed as a range query over the fast
/// field that matches exactly this term.
///
/// ```rust
/// use tantivy::collector::{Count, TopDocs};
/// use tantivy::query::TermQuery;
/// use tantivy::schema::{Schema, TEXT, IndexRecordOption};
/// use tantivy::{doc, Index, IndexWriter, Term};
/// # fn test() -> tantivy::Result<()> {
/// let mut schema_builder = Schema::builder();
/// let title = schema_builder.add_text_field("title", TEXT);
/// let schema = schema_builder.build();
/// let index = Index::create_in_ram(schema);
/// {
///     let mut index_writer: IndexWriter = index.writer(15_000_000)?;
///     index_writer.add_document(doc!(
///         title => "The Name of the Wind",
///     ))?;
///     index_writer.add_document(doc!(
///         title => "The Diary of Muadib",
///     ))?;
///     index_writer.add_document(doc!(
///         title => "A Dairy Cow",
///     ))?;
///     index_writer.add_document(doc!(
///         title => "The Diary of a Young Girl",
///     ))?;
///     index_writer.commit()?;
/// }
/// let reader = index.reader()?;
/// let searcher = reader.searcher();
/// let query = TermQuery::new(
///     Term::from_field_text(title, "diary"),
///     IndexRecordOption::Basic,
/// );
/// let (top_docs, count) = searcher.search(&query, &(TopDocs::with_limit(2).order_by_score(), Count))?;
/// assert_eq!(count, 2);
/// Ok(())
/// # }
/// # assert!(test().is_ok());
/// ```
#[derive(Clone)]
pub struct TermQuery {
    // The term that documents must contain to match.
    term: Term,
    // Record option requested by the caller. It is only honored when scoring
    // is enabled; otherwise `IndexRecordOption::Basic` is used.
    index_record_option: IndexRecordOption,
}

impl fmt::Debug for TermQuery {
    /// Renders the query as `TermQuery(<term debug representation>)`.
    ///
    /// The index record option is deliberately left out of the output.
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let term = &self.term;
        f.write_fmt(format_args!("TermQuery({term:?})"))
    }
}

impl TermQuery {
    /// Creates a new term query for `term`.
    ///
    /// `segment_postings_options` is the record option used to read the
    /// postings when scoring is enabled.
    pub fn new(term: Term, segment_postings_options: IndexRecordOption) -> TermQuery {
        let index_record_option = segment_postings_options;
        TermQuery {
            term,
            index_record_option,
        }
    }

    /// The `Term` this query is built out of.
    pub fn term(&self) -> &Term {
        &self.term
    }

    /// Returns a weight object.
    ///
    /// While `.weight(...)` returns a boxed trait object,
    /// this method returns the concrete `TermWeight`.
    /// This is useful for optimization purposes.
    ///
    /// # Errors
    ///
    /// Returns a `SchemaError` if the field of the term is not indexed, and
    /// forwards any error raised while building the BM25 weight.
    pub fn specialized_weight(
        &self,
        enable_scoring: EnableScoring<'_>,
    ) -> crate::Result<TermWeight> {
        let field_entry = enable_scoring
            .schema()
            .get_field_entry(self.term.field());
        if !field_entry.is_indexed() {
            return Err(crate::TantivyError::SchemaError(format!(
                "Field {:?} is not indexed.",
                field_entry.name()
            )));
        }

        // Without scoring, a constant placeholder weight is enough.
        let bm25_weight = match enable_scoring {
            EnableScoring::Disabled { .. } => {
                Bm25Weight::new(Explanation::new("<no score>", 1.0f32), 1.0f32)
            }
            EnableScoring::Enabled {
                statistics_provider,
                ..
            } => Bm25Weight::for_terms(statistics_provider, std::slice::from_ref(&self.term))?,
        };

        // The requested record option only matters when scoring: matching
        // alone never needs more than the doc ids.
        let scoring_enabled = enable_scoring.is_scoring_enabled();
        let index_record_option = match scoring_enabled {
            true => self.index_record_option,
            false => IndexRecordOption::Basic,
        };

        let term_weight = TermWeight::new(
            self.term.clone(),
            index_record_option,
            bm25_weight,
            scoring_enabled,
        );
        Ok(term_weight)
    }
}

impl Query for TermQuery {
    /// Builds the weight of this query.
    ///
    /// If the field is not indexed but is a suitable fast field, and scoring
    /// is disabled, this falls back to a range query on the fast field that
    /// matches exactly this term. Otherwise the regular term weight is built
    /// through `specialized_weight`.
    fn weight(&self, enable_scoring: EnableScoring<'_>) -> crate::Result<Box<dyn Weight>> {
        let field_entry = enable_scoring
            .schema()
            .get_field_entry(self.term.field());
        let use_fast_field_fallback = !field_entry.is_indexed()
            && field_entry.is_fast()
            && is_type_valid_for_fastfield_range_query(self.term.typ())
            && !enable_scoring.is_scoring_enabled();
        if !use_fast_field_fallback {
            return Ok(Box::new(self.specialized_weight(enable_scoring)?));
        }

        // Note: This is considerably slower, since it requires scanning the entire fast field.
        // TODO: The range query would gain from having a single-value optimization
        let exact_bound = Bound::Included(self.term.clone());
        let range_query = RangeQuery::new(exact_bound.clone(), exact_bound);
        range_query.weight(enable_scoring)
    }

    /// Reports the single term of this query to `visitor`, with the
    /// accompanying flag set to `false`.
    fn query_terms<'a>(&'a self, visitor: &mut dyn FnMut(&'a Term, bool)) {
        let term = &self.term;
        visitor(term, false);
    }
}

#[cfg(test)]
mod tests {
    use std::net::{IpAddr, Ipv6Addr};
    use std::str::FromStr;

    use columnar::MonotonicallyMappableToU128;

    use crate::collector::{Count, TopDocs};
    use crate::query::{Query, QueryParser, TermQuery};
    use crate::schema::{IndexRecordOption, IntoIpv6Addr, Schema, INDEXED, STORED};
    use crate::{Index, IndexWriter, Term};

    /// Indexes two distinct IP addresses and checks that each of them is found
    /// exactly once, both through a `TermQuery` and through the query parser.
    #[test]
    fn search_ip_test() {
        let mut schema_builder = Schema::builder();
        let ip_field = schema_builder.add_ip_addr_field("ip", INDEXED | STORED);
        let index = Index::create_in_ram(schema_builder.build());
        let ip_addr_1 = IpAddr::from_str("127.0.0.1").unwrap().into_ipv6_addr();
        let ip_addr_2 = Ipv6Addr::from_u128(10);

        {
            let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
            for ip_addr in [ip_addr_1, ip_addr_2] {
                index_writer
                    .add_document(doc!(
                        ip_field => ip_addr
                    ))
                    .unwrap();
            }
            index_writer.commit().unwrap();
        }
        let searcher = index.reader().unwrap().searcher();

        // Query built directly from an IP address.
        let query_from_ip = |ip_addr: Ipv6Addr| -> Box<dyn Query> {
            let term = Term::from_field_ip_addr(ip_field, ip_addr);
            Box::new(TermQuery::new(term, IndexRecordOption::Basic))
        };
        // Query built by parsing user-facing query text.
        let query_from_text = |text: String| -> Box<dyn Query> {
            QueryParser::for_index(&index, vec![ip_field])
                .parse_query(&text)
                .unwrap()
        };

        let queries: Vec<Box<dyn Query>> = vec![
            query_from_ip(ip_addr_1),
            query_from_ip(ip_addr_2),
            query_from_text("127.0.0.1".to_string()),
            query_from_text("\"127.0.0.1\"".to_string()),
            query_from_text(format!("\"{ip_addr_1}\"")),
            query_from_text(format!("\"{ip_addr_2}\"")),
        ];

        // Every query must hit exactly one document.
        for query in queries {
            let collectors = (TopDocs::with_limit(2).order_by_score(), Count);
            let (_top_docs, count) = searcher.search(&query, &collectors).unwrap();
            assert_eq!(count, 1);
        }
    }
}


================================================
FILE: src/query/term_query/term_scorer.rs
================================================
use crate::docset::DocSet;
use crate::fieldnorm::FieldNormReader;
use crate::postings::{FreqReadingOption, Postings, SegmentPostings};
use crate::query::bm25::Bm25Weight;
use crate::query::{Explanation, Scorer};
use crate::{DocId, Score};

/// Scorer for the documents of a single term.
///
/// It iterates over the postings of the term and scores the current document
/// from its fieldnorm id and term frequency, using a BM25 weight.
#[derive(Clone)]
pub struct TermScorer {
    // Postings of the term; they drive the doc iteration and provide term frequencies.
    postings: SegmentPostings,
    // Used to look up the fieldnorm id of the current document.
    fieldnorm_reader: FieldNormReader,
    // Turns a (fieldnorm id, term frequency) pair into a score.
    similarity_weight: Bm25Weight,
}

impl TermScorer {
    pub fn new(
        postings: SegmentPostings,
        fieldnorm_reader: FieldNormReader,
        similarity_weight: Bm25Weight,
    ) -> TermScorer {
        TermScorer {
            postings,
            fieldnorm_reader,
            similarity_weight,
        }
    }

    pub(crate) fn seek_block(&mut self, target_doc: DocId) {
        self.postings.block_cursor.seek_block(target_doc);
    }

    #[cfg(test)]
    pub fn create_for_test(
        doc_and_tfs: &[(DocId, u32)],
        fieldnorms: &[u32],
        similarity_weight: Bm25Weight,
    ) -> TermScorer {
        assert!(!doc_and_tfs.is_empty());
        assert!(
            doc_and_tfs
                .iter()
                .map(|(doc, _tf)| *doc)
                .max()
                .unwrap_or(0u32)
                < fieldnorms.len() as u32
        );
        let segment_postings =
            SegmentPostings::create_from_docs_and_tfs(doc_and_tfs, Some(fieldnorms));
        let fieldnorm_reader = FieldNormReader::for_test(fieldnorms);
        TermScorer::new(segment_postings, fieldnorm_reader, similarity_weight)
    }

    /// See `FreqReadingOption`.
    pub(crate) fn freq_reading_option(&self) -> FreqReadingOption {
        self.postings.block_cursor.freq_reading_option()
    }

    /// Returns the maximum score for the current block.
    ///
    /// In some rare case, the result may not be exact. In this case a lower value is returned,
    /// (and may lead us to return a lesser document).
    ///
    /// At index time, we store the (fieldnorm_id, term frequency) pair that maximizes the
    /// score assuming the average fieldnorm computed on this segment.
    ///
    /// Though extremely rare, it is theoretically possible that the actual average fieldnorm
    /// is different enough from the current segment average fieldnorm that the maximum over a
    /// specific is achieved on a different document.
    ///
    /// (The result is on the other hand guaranteed to be correct if there is only one segment).
    pub fn block_max_score(&mut self) -> Score {
        self.postings
            .block_cursor
            .block_max_score(&self.fieldnorm_reader, &self.similarity_weight)
    }

    pub fn term_freq(&self) -> u32 {
        self.postings.term_freq()
    }

    pub fn fieldnorm_id(&self) -> u8 {
        self.fieldnorm_reader.fieldnorm_id(self.doc())
    }

    pub fn explain(&self) -> Explanation {
        let fieldnorm_id = self.fieldnorm_id();
        let term_freq = self.term_freq();
        self.similarity_weight.explain(fieldnorm_id, term_freq)
    }

    pub fn max_score(&self) -> Score {
        self.similarity_weight.max_score()
    }

    pub fn last_doc_in_block(&self) -> DocId {
        self.postings.block_cursor.skip_reader().last_doc_in_block()
    }
}

// The doc iteration is entirely delegated to the underlying postings.
impl DocSet for TermScorer {
    /// Advances the postings and returns what they return.
    #[inline]
    fn advance(&mut self) -> DocId {
        self.postings.advance()
    }

    /// Forwards the seek to the postings and returns what they return.
    ///
    /// In debug builds, asserts that `target` is not before the current doc.
    #[inline]
    fn seek(&mut self, target: DocId) -> DocId {
        debug_assert!(target >= self.doc());
        self.postings.seek(target)
    }

    /// Current doc of the postings.
    #[inline]
    fn doc(&self) -> DocId {
        self.postings.doc()
    }

    /// Size hint reported by the postings.
    fn size_hint(&self) -> u32 {
        self.postings.size_hint()
    }
}

impl Scorer for TermScorer {
    /// Scores the current document from its fieldnorm id and its term frequency.
    #[inline]
    fn score(&mut self) -> Score {
        self.similarity_weight
            .score(self.fieldnorm_id(), self.term_freq())
    }
}

#[cfg(test)]
mod tests {
    use proptest::prelude::*;

    use crate::index::SegmentId;
    use crate::indexer::index_writer::MEMORY_BUDGET_NUM_BYTES_MIN;
    use crate::merge_policy::NoMergePolicy;
    use crate::postings::compression::COMPRESSION_BLOCK_SIZE;
    use crate::query::term_query::TermScorer;
    use crate::query::{Bm25Weight, EnableScoring, Scorer, TermQuery};
    use crate::schema::{IndexRecordOption, Schema, TEXT};
    use crate::{
        assert_nearly_equals, DocId, DocSet, Index, IndexWriter, Score, Searcher, Term, TERMINATED,
    };

    #[test]
    fn test_term_scorer_max_score() -> crate::Result<()> {
        let doc_and_tfs: [(DocId, u32); 3] = [(2, 3), (3, 12), (7, 8)];
        let fieldnorms: [u32; 8] = [0, 0, 10, 12, 0, 0, 0, 100];
        let mut term_scorer = TermScorer::create_for_test(
            &doc_and_tfs,
            &fieldnorms,
            Bm25Weight::for_one_term(3, 6, 10.0),
        );
        assert_nearly_equals!(term_scorer.max_score(), 1.3990127);

        // The scorer starts positioned on the first document.
        // This is also where we check the block max score.
        assert_eq!(term_scorer.doc(), 2);
        assert_eq!(term_scorer.term_freq(), 3);
        assert_nearly_equals!(term_scorer.block_max_score(), 1.3676447);
        assert_nearly_equals!(term_scorer.score(), 1.0892314);

        // Remaining documents, as (doc, term frequency, score).
        let remaining_docs: [(DocId, u32, Score); 2] = [(3, 12, 1.3676447), (7, 8, 0.72015285)];
        for (expected_doc, expected_term_freq, expected_score) in remaining_docs {
            assert_eq!(term_scorer.advance(), expected_doc);
            assert_eq!(term_scorer.doc(), expected_doc);
            assert_eq!(term_scorer.term_freq(), expected_term_freq);
            assert_nearly_equals!(term_scorer.score(), expected_score);
        }
        assert_eq!(term_scorer.advance(), TERMINATED);
        Ok(())
    }

    #[test]
    fn test_term_scorer_shallow_advance() -> crate::Result<()> {
        // 300 documents (0, 10, 20, ..., 2990), with a term frequency of `1 + doc % 3`.
        let doc_and_tfs: Vec<(u32, u32)> = (0u32..300u32)
            .map(|i| i * 10)
            .map(|doc| (doc, 1u32 + doc % 3u32))
            .collect();
        let fieldnorms: Vec<u32> = vec![10u32; 3_000];
        let bm25_weight = Bm25Weight::for_one_term(300, 1024, 10.0);
        let mut term_scorer = TermScorer::create_for_test(&doc_and_tfs, &fieldnorms, bm25_weight);
        assert_eq!(term_scorer.doc(), 0u32);

        // `seek_block` must not move the current document...
        term_scorer.seek_block(1289);
        assert_eq!(term_scorer.doc(), 0u32);

        // ... while `seek` lands on the first document >= target.
        term_scorer.seek(1289);
        assert_eq!(term_scorer.doc(), 1290);
        Ok(())
    }

    // Property test: for randomly generated posting lists, the block max score
    // reported by the `TermScorer` must match the maximum of the scores of the
    // documents of that block.
    proptest! {
        #[test]
        fn test_term_scorer_block_max_score(term_freqs_fieldnorms in proptest::collection::vec((1u32..10u32, 0u32..100u32), 80..300)) {
        let term_doc_freq = term_freqs_fieldnorms.len();
         // Doc ids are simply the position within the generated vector.
         let doc_tfs: Vec<(u32, u32)> = term_freqs_fieldnorms.iter()
                   .cloned()
                  .enumerate()
                  .map(|(doc, (tf, _))| (doc as u32, tf))
                  .collect();

         // The fieldnorm of a doc is its term frequency plus a number of extra terms,
         // hence it is always >= to the term frequency.
         let mut fieldnorms: Vec<u32> = vec![];
         for item in term_freqs_fieldnorms.iter().take(term_doc_freq) {
             let (tf, num_extra_terms) = item;
             fieldnorms.push(tf + num_extra_terms);
         }
         let average_fieldnorm = fieldnorms
             .iter()
             .cloned()
             .sum::<u32>() as Score / term_doc_freq as Score;
             // In a real index, the average fieldnorm is computed over the entire index,
             // not necessarily the docs that are in the posting list.
             // Here it is simply the average over the docs of the posting list.
         let bm25_weight = Bm25Weight::for_one_term(term_doc_freq as u64,
            term_doc_freq as u64 * 10u64,
            average_fieldnorm);

         let mut term_scorer =
              TermScorer::create_for_test(&doc_tfs[..], &fieldnorms[..], bm25_weight);

         let docs: Vec<DocId> = (0..term_doc_freq).map(|doc| doc as DocId).collect();
         for block in docs.chunks(COMPRESSION_BLOCK_SIZE) {
             // The block max score is read before consuming the docs of the block.
             let block_max_score: Score = term_scorer.block_max_score();
             let mut block_max_score_computed: Score = 0.0;
             for &doc in block {
                assert_eq!(term_scorer.doc(), doc);
                block_max_score_computed = block_max_score_computed.max(term_scorer.score());
                term_scorer.advance();
             }
             assert_nearly_equals!(block_max_score_computed, block_max_score);
         }
        }
    }

    #[test]
    fn test_block_wand() {
        // Docs 0..=258, all with a term frequency of 1,
        // except doc 200 (tf = 2) and doc 257 (tf = 3).
        let doc_tfs: Vec<(u32, u32)> = (0u32..=258u32)
            .map(|doc| {
                let term_freq = match doc {
                    200 => 2u32,
                    257 => 3u32,
                    _ => 1u32,
                };
                (doc, term_freq)
            })
            .collect();
        let fieldnorms: Vec<u32> = vec![20u32; 300];
        let bm25_weight = Bm25Weight::for_one_term(10, 129, 20.0);
        let mut docs = TermScorer::create_for_test(&doc_tfs[..], &fieldnorms[..], bm25_weight);

        assert_nearly_equals!(docs.block_max_score(), 2.5161593);

        docs.seek_block(135);
        assert_nearly_equals!(docs.block_max_score(), 3.4597192);

        docs.seek_block(256);
        // the block is not loaded yet.
        assert_nearly_equals!(docs.block_max_score(), 5.2971773);

        assert_eq!(256, docs.seek(256));
        assert_nearly_equals!(docs.block_max_score(), 3.9539647);
    }

    fn test_block_wand_aux(term_query: &TermQuery, searcher: &Searcher) -> crate::Result<()> {
        let term_weight =
            term_query.specialized_weight(EnableScoring::enabled_from_searcher(searcher))?;
        for reader in searcher.segment_readers() {
            let mut block_max_scores = vec![];
            let mut block_max_scores_b = vec![];
            let mut docs = vec![];
            {
                let mut term_scorer = term_weight.term_scorer_for_test(reader, 1.0)?.unwrap();
                while term_scorer.doc() != TERMINATED {
                    let mut score = term_scorer.score();
                    docs.push(term_scorer.doc());
                    for _ in 0..128 {
                        score = score.max(term_scorer.score());
                        if term_scorer.advance() == TERMINATED {
                            break;
                        }
                    }
                    block_max_scores.push(score);
                }
            }
            {
                let mut term_scorer = term_weight.term_scorer_for_test(reader, 1.0)?.unwrap();
                for d in docs {
                    term_scorer.seek_block(d);
                    block_max_scores_b.push(term_scorer.block_max_score());
                }
            }
            for (l, r) in block_max_scores
                .iter()
                .cloned()
                .zip(block_max_scores_b.iter().cloned())
            {
                assert_nearly_equals!(l, r);
            }
        }
        Ok(())
    }

    // Randomized check of the block max scores (see `test_block_wand_aux`):
    // first on the segments resulting from the commit, and then on the single
    // segment resulting from their merge.
    //
    // The test is marked as `#[ignore]`, so it only runs when explicitly requested.
    #[ignore]
    #[test]
    fn test_block_wand_long_test() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut writer: IndexWriter =
            index.writer_with_num_threads(3, 3 * MEMORY_BUDGET_NUM_BYTES_MIN)?;
        use rand::Rng;
        let mut rng = rand::rng();
        // Merges are disabled: the merge is triggered explicitly further down.
        writer.set_merge_policy(Box::new(NoMergePolicy));
        // 3_000 documents, each of them repeating the same term a random number of times.
        for _ in 0..3_000 {
            let term_freq = rng.random_range(1..10000);
            let words: Vec<&str> = std::iter::repeat_n("bbbb", term_freq).collect();
            let text = words.join(" ");
            writer.add_document(doc!(text_field=>text))?;
        }
        writer.commit()?;
        let term_query = TermQuery::new(
            Term::from_field_text(text_field, "bbbb"),
            IndexRecordOption::WithFreqs,
        );
        let segment_ids: Vec<SegmentId>;
        let reader = index.reader()?;
        {
            // Check on the segments as they are right after the commit.
            let searcher = reader.searcher();
            segment_ids = searcher
                .segment_readers()
                .iter()
                .map(|segment| segment.segment_id())
                .collect();
            test_block_wand_aux(&term_query, &searcher)?;
        }
        // Merge all of the segments, and run the same check on the merged segment.
        writer.merge(&segment_ids[..]).wait().unwrap();
        {
            reader.reload()?;
            let searcher = reader.searcher();
            assert_eq!(searcher.segment_readers().len(), 1);
            test_block_wand_aux(&term_query, &searcher)?;
        }
        Ok(())
    }
}


================================================
FILE: src/query/term_query/term_weight.rs
================================================
use super::term_scorer::TermScorer;
use crate::docset::{DocSet, COLLECT_BLOCK_BUFFER_LEN};
use crate::fieldnorm::FieldNormReader;
use crate::index::SegmentReader;
use crate::postings::SegmentPostings;
use crate::query::bm25::Bm25Weight;
use crate::query::explanation::does_not_match;
use crate::query::weight::{for_each_docset_buffered, for_each_scorer};
use crate::query::{AllScorer, AllWeight, EmptyScorer, Explanation, Scorer, Weight};
use crate::schema::IndexRecordOption;
use crate::{DocId, Score, TantivyError, Term};

/// `Weight` implementation for a query targeting a single term.
pub struct TermWeight {
    /// Term that is looked up in the inverted index of each segment.
    term: Term,
    /// Record option passed along when reading the postings of the term.
    index_record_option: IndexRecordOption,
    /// BM25 weight handed to the `TermScorer`, after applying the boost.
    similarity_weight: Bm25Weight,
    /// When `false`, fieldnorms are replaced by a constant, and a term matching
    /// all of the documents of a segment is served by an `AllScorer`.
    scoring_enabled: bool,
}

/// The different scorers a `TermWeight` can produce for a given segment.
enum TermOrEmptyOrAllScorer {
    /// Regular case: a scorer over the posting list of the term.
    TermScorer(Box<TermScorer>),
    /// The term was not found in the segment.
    Empty,
    /// Scoring is disabled, and the term matches all of the docs of the segment.
    AllMatch(AllScorer),
}

impl TermOrEmptyOrAllScorer {
    /// Converts the specialized scorer into a boxed, type-erased `Scorer`.
    pub fn into_boxed_scorer(self) -> Box<dyn Scorer> {
        match self {
            Self::Empty => Box::new(EmptyScorer),
            Self::AllMatch(all_scorer) => Box::new(all_scorer),
            Self::TermScorer(term_scorer) => term_scorer,
        }
    }
}

impl Weight for TermWeight {
    /// Returns the scorer for the given segment, as a boxed `Scorer`.
    fn scorer(&self, reader: &SegmentReader, boost: Score) -> crate::Result<Box<dyn Scorer>> {
        let specialized_scorer = self.specialized_scorer(reader, boost)?;
        Ok(specialized_scorer.into_boxed_scorer())
    }

    /// Explains the score of `doc`.
    ///
    /// Returns a "does not match" error if the term is absent from `doc`.
    fn explain(&self, reader: &SegmentReader, doc: DocId) -> crate::Result<Explanation> {
        let mut term_scorer = match self.specialized_scorer(reader, 1.0)? {
            TermOrEmptyOrAllScorer::TermScorer(term_scorer) => term_scorer,
            TermOrEmptyOrAllScorer::Empty => return Err(does_not_match(doc)),
            TermOrEmptyOrAllScorer::AllMatch(_) => return AllWeight.explain(reader, doc),
        };
        // The scorer is either already past `doc`, or seeking lands on another doc.
        if term_scorer.doc() > doc || term_scorer.seek(doc) != doc {
            return Err(does_not_match(doc));
        }
        let mut explanation = term_scorer.explain();
        explanation.add_context(format!("Term={:?}", self.term,));
        Ok(explanation)
    }

    /// Counts the documents of the segment matching the term.
    fn count(&self, reader: &SegmentReader) -> crate::Result<u32> {
        let Some(alive_bitset) = reader.alive_bitset() else {
            // Without an alive bitset, the doc freq stored in the term info is the count.
            let inv_index = reader.inverted_index(self.term.field())?;
            let doc_freq = inv_index
                .get_term_info(&self.term)?
                .map_or(0, |term_info| term_info.doc_freq);
            return Ok(doc_freq);
        };
        Ok(self.scorer(reader, 1.0)?.count(alive_bitset))
    }

    /// Iterates through all of the documents matching the term,
    /// and pushes the scored documents to the callback.
    fn for_each(
        &self,
        reader: &SegmentReader,
        callback: &mut dyn FnMut(DocId, Score),
    ) -> crate::Result<()> {
        match self.specialized_scorer(reader, 1.0)? {
            TermOrEmptyOrAllScorer::Empty => {}
            TermOrEmptyOrAllScorer::AllMatch(mut all_scorer) => {
                for_each_scorer(&mut all_scorer, callback);
            }
            TermOrEmptyOrAllScorer::TermScorer(mut term_scorer) => {
                for_each_scorer(&mut *term_scorer, callback);
            }
        }
        Ok(())
    }

    /// Iterates through all of the documents matching the term,
    /// and pushes them to the callback, in batches and without any score.
    fn for_each_no_score(
        &self,
        reader: &SegmentReader,
        callback: &mut dyn FnMut(&[DocId]),
    ) -> crate::Result<()> {
        let specialized_scorer = self.specialized_scorer(reader, 1.0)?;
        let mut buffer = [0u32; COLLECT_BLOCK_BUFFER_LEN];
        match specialized_scorer {
            TermOrEmptyOrAllScorer::Empty => {}
            TermOrEmptyOrAllScorer::AllMatch(mut all_scorer) => {
                for_each_docset_buffered(&mut all_scorer, &mut buffer, callback);
            }
            TermOrEmptyOrAllScorer::TermScorer(mut term_scorer) => {
                for_each_docset_buffered(&mut term_scorer, &mut buffer, callback);
            }
        }
        Ok(())
    }

    /// Calls `callback` with all of the `(doc, score)` for which the score
    /// is exceeding a given threshold.
    ///
    /// This method is useful for the TopDocs collector.
    /// For all docsets, the blanket implementation has the benefit
    /// of prefiltering (doc, score) pairs, avoiding the
    /// virtual dispatch cost.
    ///
    /// More importantly, it makes it possible for scorers to implement
    /// important optimizations (e.g. BlockWAND for union).
    ///
    /// An `InvalidArgument` error is returned if the specialized scorer is
    /// the all-match scorer, which is only produced when scoring is disabled.
    fn for_each_pruning(
        &self,
        threshold: Score,
        reader: &SegmentReader,
        callback: &mut dyn FnMut(DocId, Score) -> Score,
    ) -> crate::Result<()> {
        match self.specialized_scorer(reader, 1.0)? {
            TermOrEmptyOrAllScorer::TermScorer(term_scorer) => {
                crate::query::boolean_query::block_wand_single_scorer(
                    *term_scorer,
                    threshold,
                    callback,
                );
                Ok(())
            }
            TermOrEmptyOrAllScorer::Empty => Ok(()),
            TermOrEmptyOrAllScorer::AllMatch(_) => Err(TantivyError::InvalidArgument(
                "for each pruning should only be called if scoring is enabled".to_string(),
            )),
        }
    }
}

impl TermWeight {
    /// Creates a new `TermWeight` from its different parts.
    pub fn new(
        term: Term,
        index_record_option: IndexRecordOption,
        similarity_weight: Bm25Weight,
        scoring_enabled: bool,
    ) -> TermWeight {
        Self {
            term,
            index_record_option,
            similarity_weight,
            scoring_enabled,
        }
    }

    /// Returns the term targeted by this weight.
    pub fn term(&self) -> &Term {
        &self.term
    }

    /// We need a method to access the actual `TermScorer` implementation
    /// for `white box` tests, checking in particular that the block max
    /// is correct.
    ///
    /// Returns `None` if the specialized scorer is not a `TermScorer`.
    #[cfg(test)]
    pub(crate) fn term_scorer_for_test(
        &self,
        reader: &SegmentReader,
        boost: Score,
    ) -> crate::Result<Option<TermScorer>> {
        match self.specialized_scorer(reader, boost)? {
            TermOrEmptyOrAllScorer::TermScorer(term_scorer) => Ok(Some(*term_scorer)),
            TermOrEmptyOrAllScorer::Empty | TermOrEmptyOrAllScorer::AllMatch(_) => Ok(None),
        }
    }

    /// Builds the scorer best suited for the given segment.
    fn specialized_scorer(
        &self,
        reader: &SegmentReader,
        boost: Score,
    ) -> crate::Result<TermOrEmptyOrAllScorer> {
        let inverted_index = reader.inverted_index(self.term.field())?;
        let term_info = match inverted_index.get_term_info(&self.term)? {
            Some(term_info) => term_info,
            // The term was not found.
            None => return Ok(TermOrEmptyOrAllScorer::Empty),
        };

        // If we don't care about scores, and our posting list matches all docs, we can
        // return the AllMatch scorer.
        if !self.scoring_enabled {
            let max_doc = reader.max_doc();
            if term_info.doc_freq == max_doc {
                return Ok(TermOrEmptyOrAllScorer::AllMatch(AllScorer::new(max_doc)));
            }
        }

        let segment_postings: SegmentPostings =
            inverted_index.read_postings_from_terminfo(&term_info, self.index_record_option)?;
        let fieldnorm_reader = self.fieldnorm_reader(reader)?;
        let similarity_weight = self.similarity_weight.boost_by(boost);
        let term_scorer = TermScorer::new(segment_postings, fieldnorm_reader, similarity_weight);
        Ok(TermOrEmptyOrAllScorer::TermScorer(Box::new(term_scorer)))
    }

    /// Returns the fieldnorm reader of the term's field.
    ///
    /// A constant fieldnorm reader is returned instead if scoring is disabled,
    /// or if the segment has no fieldnorms for the field.
    fn fieldnorm_reader(&self, segment_reader: &SegmentReader) -> crate::Result<FieldNormReader> {
        let constant_reader = || FieldNormReader::constant(segment_reader.max_doc(), 1);
        if !self.scoring_enabled {
            return Ok(constant_reader());
        }
        let fieldnorm_reader_opt = segment_reader
            .fieldnorms_readers()
            .get_field(self.term.field())?;
        Ok(fieldnorm_reader_opt.unwrap_or_else(constant_reader))
    }
}


================================================
FILE: src/query/union/bitset_union.rs
================================================
use std::cell::RefCell;

use crate::docset::DocSet;
use crate::postings::Postings;
use crate::query::BitSetDocSet;
use crate::DocId;

/// A `Postings` implementation that uses the bitset for hits and the docsets for
/// the posting lists.
///
/// It is used for the regex phrase query, where we need the union of a large amount of
/// terms, but need to keep the docsets for the postings.
pub struct BitSetPostingUnion<TDocSet> {
    /// The docsets are required to load positions.
    ///
    /// Wrapped in a `RefCell` because `term_freq` takes `&self`, yet needs to
    /// move the docsets forward.
    docsets: RefCell<Vec<TDocSet>>,
    /// The already unionized BitSet of the docsets.
    bitset: BitSetDocSet,
}

impl<TDocSet: DocSet> BitSetPostingUnion<TDocSet> {
    /// Wraps the `docsets` and their (precomputed) union `bitset`.
    pub(crate) fn build(
        docsets: Vec<TDocSet>,
        bitset: BitSetDocSet,
    ) -> BitSetPostingUnion<TDocSet> {
        let docsets = RefCell::new(docsets);
        Self { docsets, bitset }
    }
}

impl<TDocSet: Postings> Postings for BitSetPostingUnion<TDocSet> {
    /// Sums the term frequencies of all of the docsets positioned on the current doc.
    ///
    /// Docsets lagging behind the current doc are moved forward first.
    fn term_freq(&self) -> u32 {
        let target = self.bitset.doc();
        let mut docsets = self.docsets.borrow_mut();
        let total_term_freq: u32 = docsets
            .iter_mut()
            .map(|docset| {
                if docset.doc() < target {
                    docset.seek(target);
                }
                if docset.doc() == target {
                    docset.term_freq()
                } else {
                    0
                }
            })
            .sum();
        total_term_freq
    }

    /// Appends the positions of all of the docsets positioned on the current doc,
    /// and then sorts and deduplicates `output`.
    fn append_positions_with_offset(&mut self, offset: u32, output: &mut Vec<u32>) {
        let target = self.bitset.doc();
        {
            let mut docsets = self.docsets.borrow_mut();
            for docset in docsets.iter_mut() {
                if docset.doc() < target {
                    docset.seek(target);
                }
                if docset.doc() != target {
                    continue;
                }
                docset.append_positions_with_offset(offset, output);
            }
        }
        debug_assert!(
            !output.is_empty(),
            "this method should only be called if positions are available"
        );
        output.sort_unstable();
        output.dedup();
    }
}

// The iteration itself only relies on the precomputed bitset:
// the docsets are not touched by any of these methods.
impl<TDocSet: DocSet> DocSet for BitSetPostingUnion<TDocSet> {
    fn advance(&mut self) -> DocId {
        let bitset = &mut self.bitset;
        bitset.advance()
    }

    fn seek(&mut self, target: DocId) -> DocId {
        let bitset = &mut self.bitset;
        bitset.seek(target)
    }

    fn doc(&self) -> DocId {
        let bitset = &self.bitset;
        bitset.doc()
    }

    fn size_hint(&self) -> u32 {
        let bitset = &self.bitset;
        bitset.size_hint()
    }

    fn count_including_deleted(&mut self) -> u32 {
        let bitset = &mut self.bitset;
        bitset.count_including_deleted()
    }
}


================================================
FILE: src/query/union/buffered_union.rs
================================================
use common::TinySet;

use crate::docset::{DocSet, SeekDangerResult, TERMINATED};
use crate::query::score_combiner::{DoNothingCombiner, ScoreCombiner};
use crate::query::size_hint::estimate_union;
use crate::query::Scorer;
use crate::{DocId, Score};

// The buffered union looks ahead within a fixed-size sliding window
// of upcoming document IDs (the "horizon").
//
// Number of `TinySet` buckets (each covering 64 doc IDs) required to cover the horizon.
const HORIZON_NUM_TINYBITSETS: usize = HORIZON as usize / 64;
// Width of the horizon, expressed in number of doc IDs.
const HORIZON: u32 = 64u32 * 64u32;

// `drain_filter` is not stable yet.
// This helper plays a similar role, with two differences:
// - it does not keep the original vector ordering,
// - the removed elements are dropped, and not yielded.
fn unordered_drain_filter<T, P>(v: &mut Vec<T>, mut predicate: P)
where P: FnMut(&mut T) -> bool {
    let mut idx = 0;
    // `swap_remove` moves the last element into the freed slot. In that case
    // `idx` is left untouched, so that the swapped-in element gets examined too.
    while let Some(item) = v.get_mut(idx) {
        if predicate(item) {
            v.swap_remove(idx);
        } else {
            idx += 1;
        }
    }
}

/// A `DocSet` that iterates through the union of two or more `DocSet`s.
///
/// The upcoming docs are buffered window by window: see `HORIZON`.
pub struct BufferedUnionScorer<TScorer, TScoreCombiner = DoNothingCombiner> {
    /// Active scorers (already filtered of `TERMINATED`).
    docsets: Vec<TScorer>,
    /// Sliding window presence map for upcoming docs.
    ///
    /// There are `HORIZON_NUM_TINYBITSETS` buckets, each covering
    /// a span of 64 doc IDs. Bucket `i` represents the range
    /// `[window_start_doc + i*64, window_start_doc + (i+1)*64)`.
    bitsets: Box<[TinySet; HORIZON_NUM_TINYBITSETS]>,
    /// Index of the current TinySet bucket within the sliding window.
    ///
    /// It is equal to `HORIZON_NUM_TINYBITSETS` when no bucket is left to be read.
    bucket_idx: usize,
    /// Per-doc score combiners for the current window.
    ///
    /// These accumulators merge contributions from all scorers that
    /// hit the same doc within the buffered window.
    scores: Box<[TScoreCombiner; HORIZON as usize]>,
    /// Start doc ID (inclusive) of the current sliding window.
    window_start_doc: DocId,
    /// Current doc ID of the union.
    doc: DocId,
    /// Combined score for current `doc` as produced by `TScoreCombiner`.
    score: Score,
    /// Number of documents in the segment.
    num_docs: u32,
}

/// Buffers all of the docs of `scorers` falling within `[min_doc, min_doc + HORIZON)`.
///
/// For each of these docs, the matching bit is set in `bitsets`, and the matching
/// score combiner is updated. Scorers that get entirely consumed in the process
/// are removed from `scorers`.
fn refill<TScorer: Scorer, TScoreCombiner: ScoreCombiner>(
    scorers: &mut Vec<TScorer>,
    bitsets: &mut [TinySet; HORIZON_NUM_TINYBITSETS],
    score_combiner: &mut [TScoreCombiner; HORIZON as usize],
    min_doc: DocId,
) {
    let horizon = min_doc + HORIZON;
    unordered_drain_filter(scorers, |scorer| loop {
        let doc = scorer.doc();
        if doc >= horizon {
            // The scorer is past the window: it is kept for the next refill.
            break false;
        }
        // Record this document within the window.
        let delta = doc - min_doc;
        bitsets[(delta / 64) as usize].insert_mut(delta % 64u32);
        score_combiner[delta as usize].update(scorer);
        if scorer.advance() == TERMINATED {
            // The docset has been entirely consumed: it gets removed.
            break true;
        }
    });
}

impl<TScorer: Scorer, TScoreCombiner: ScoreCombiner> BufferedUnionScorer<TScorer, TScoreCombiner> {
    /// Builds the union of the given docsets, positioned on its first doc
    /// (or on `TERMINATED` if the union is empty).
    ///
    /// `num_docs` is the number of documents in the segment.
    pub(crate) fn build(
        docsets: Vec<TScorer>,
        score_combiner_fn: impl FnOnce() -> TScoreCombiner,
        num_docs: u32,
    ) -> BufferedUnionScorer<TScorer, TScoreCombiner> {
        // Docsets that are already exhausted are discarded right away.
        let mut non_empty_docsets = docsets;
        non_empty_docsets.retain(|docset| docset.doc() != TERMINATED);
        let mut union = BufferedUnionScorer {
            docsets: non_empty_docsets,
            bitsets: Box::new([TinySet::empty(); HORIZON_NUM_TINYBITSETS]),
            scores: Box::new([score_combiner_fn(); HORIZON as usize]),
            bucket_idx: HORIZON_NUM_TINYBITSETS,
            window_start_doc: 0,
            doc: 0,
            score: 0.0,
            num_docs,
        };
        if !union.refill() {
            union.doc = TERMINATED;
            return union;
        }
        union.advance();
        union
    }

    /// Moves the sliding window to the smallest doc across all scorers,
    /// and buffers the docs within the horizon.
    ///
    /// Returns `false` if there are no scorers left.
    fn refill(&mut self) -> bool {
        let Some(min_doc) = self.docsets.iter().map(DocSet::doc).min() else {
            return false;
        };
        self.window_start_doc = min_doc;
        self.bucket_idx = 0;
        self.doc = min_doc;
        refill(
            &mut self.docsets,
            &mut self.bitsets,
            &mut self.scores,
            min_doc,
        );
        true
    }

    /// Pops the next buffered doc (if any), and updates `doc` and `score` accordingly.
    ///
    /// Returns `false` if the buffered window is exhausted.
    #[inline]
    fn advance_buffered(&mut self) -> bool {
        while self.bucket_idx < HORIZON_NUM_TINYBITSETS {
            let Some(val) = self.bitsets[self.bucket_idx].pop_lowest() else {
                // This bucket is exhausted, let's move on to the next one.
                self.bucket_idx += 1;
                continue;
            };
            let delta = val + (self.bucket_idx as u32) * 64;
            self.doc = self.window_start_doc + delta;
            let score_combiner = &mut self.scores[delta as usize];
            self.score = score_combiner.score();
            score_combiner.clear();
            return true;
        }
        false
    }

    /// Returns true if `target` falls within the current sliding window.
    fn is_in_horizon(&self, target: DocId) -> bool {
        // wrapping_sub, because target may be < window_start_doc
        target.wrapping_sub(self.window_start_doc) < HORIZON
    }
}

impl<TScorer, TScoreCombiner> DocSet for BufferedUnionScorer<TScorer, TScoreCombiner>
where
    TScorer: Scorer,
    TScoreCombiner: ScoreCombiner,
{
    /// Moves to the next doc of the union.
    ///
    /// The buffered window is consumed first. Once exhausted, it gets refilled
    /// from the underlying docsets.
    #[inline]
    fn advance(&mut self) -> DocId {
        if self.advance_buffered() {
            return self.doc;
        }
        // The window is exhausted: refill it, unless no docset is left.
        if !self.refill() {
            self.doc = TERMINATED;
            return TERMINATED;
        }
        if !self.advance_buffered() {
            return TERMINATED;
        }
        self.doc
    }

    /// Moves to the first doc greater or equal to `target`.
    ///
    /// If the current doc is already >= `target`, the union is left untouched.
    fn seek(&mut self, target: DocId) -> DocId {
        if self.doc >= target {
            return self.doc;
        }
        let gap = target - self.window_start_doc;
        if gap < HORIZON {
            // Our value is within the buffered horizon.

            // Skipping to corresponding bucket.
            let new_bucket_idx = gap as usize / 64;
            for obsolete_tinyset in &mut self.bitsets[self.bucket_idx..new_bucket_idx] {
                obsolete_tinyset.clear();
            }
            for score_combiner in &mut self.scores[self.bucket_idx * 64..new_bucket_idx * 64] {
                score_combiner.clear();
            }
            self.bucket_idx = new_bucket_idx;

            // Advancing until we reach the end of the bucket
            // or we reach a doc greater or equal to the target.
            let mut doc = self.doc();
            while doc < target {
                doc = self.advance();
            }
            doc
        } else {
            // clear the buffered info.
            for obsolete_tinyset in self.bitsets.iter_mut() {
                *obsolete_tinyset = TinySet::empty();
            }
            for score_combiner in self.scores.iter_mut() {
                score_combiner.clear();
            }

            // The target is outside of the buffered horizon.
            // advance all docsets to a doc >= to the target.
            // Docsets reaching `TERMINATED` in the process are removed.
            unordered_drain_filter(&mut self.docsets, |docset| {
                if docset.doc() < target {
                    docset.seek(target);
                }
                docset.doc() == TERMINATED
            });

            // at this point all of the docsets
            // are positioned on a doc >= to the target.
            if !self.refill() {
                self.doc = TERMINATED;
                return TERMINATED;
            }
            self.advance()
        }
    }

    /// Variant of `seek` relying on the `seek_danger` of the underlying docsets
    /// whenever `target` is outside of the buffered horizon.
    fn seek_danger(&mut self, target: DocId) -> SeekDangerResult {
        if target >= TERMINATED {
            return SeekDangerResult::SeekLowerBound(TERMINATED);
        }
        if self.is_in_horizon(target) {
            // Our value is within the buffered horizon and the docset may already have been
            // processed and removed, so we need to use seek, which uses the regular advance.
            let seek_doc = self.seek(target);
            if seek_doc == target {
                return SeekDangerResult::Found;
            } else {
                return SeekDangerResult::SeekLowerBound(seek_doc);
            };
        }

        // The docsets are not in the buffered range, so we can use `seek_danger`
        // of the underlying docsets
        let mut is_hit = false;
        let mut min_new_target = TERMINATED;

        for docset in self.docsets.iter_mut() {
            match docset.seek_danger(target) {
                SeekDangerResult::Found => {
                    // One hit is enough: the remaining docsets are not probed.
                    is_hit = true;
                    break;
                }
                SeekDangerResult::SeekLowerBound(new_target) => {
                    min_new_target = min_new_target.min(new_target);
                }
            }
        }

        // The API requires the DocSet to be in a valid state when `seek_danger`
        // returns Found.
        if is_hit {
            // The doc is found. Let's make sure we position the union on the target
            // to bring it back to a valid state.
            self.seek(target);
            SeekDangerResult::Found
        } else {
            SeekDangerResult::SeekLowerBound(min_new_target)
        }
    }

    /// Returns the current doc of the union.
    #[inline]
    fn doc(&self) -> DocId {
        self.doc
    }

    /// Estimates the size of the union from the size hints of the remaining docsets.
    fn size_hint(&self) -> u32 {
        estimate_union(self.docsets.iter().map(DocSet::size_hint), self.num_docs)
    }

    /// Sum of the costs of the remaining docsets.
    fn cost(&self) -> u64 {
        self.docsets.iter().map(|docset| docset.cost()).sum()
    }

    /// Counts the remaining docs of the union (current doc included), regardless
    /// of deletes. The underlying docsets are consumed in the process.
    ///
    /// NOTE(review): `self.doc` is not set to `TERMINATED` by this method.
    // TODO Also implement `count` with deletes efficiently.
    fn count_including_deleted(&mut self) -> u32 {
        if self.doc == TERMINATED {
            return 0;
        }
        // Docs still buffered in the current window. The `+ 1` accounts for the
        // current doc, which has already been popped from the bitsets.
        let mut count = self.bitsets[self.bucket_idx..HORIZON_NUM_TINYBITSETS]
            .iter()
            .map(|bitset| bitset.len())
            .sum::<u32>()
            + 1;
        for bitset in self.bitsets.iter_mut() {
            bitset.clear();
        }
        // Window after window, count the docs and discard them right away.
        while self.refill() {
            count += self.bitsets.iter().map(|bitset| bitset.len()).sum::<u32>();
            for bitset in self.bitsets.iter_mut() {
                bitset.clear();
            }
        }
        self.bucket_idx = HORIZON_NUM_TINYBITSETS;
        count
    }
}

impl<TScorer, TScoreCombiner> Scorer for BufferedUnionScorer<TScorer, TScoreCombiner>
where
    TScorer: Scorer,
    TScoreCombiner: ScoreCombiner,
{
    /// Returns the combined score of the current doc.
    ///
    /// The score is computed when the union moves onto a doc: this is a plain read.
    #[inline]
    fn score(&mut self) -> Score {
        self.score
    }
}


================================================
FILE: src/query/union/mod.rs
================================================
mod bitset_union;
mod buffered_union;
mod simple_union;

pub use bitset_union::BitSetPostingUnion;
pub use buffered_union::BufferedUnionScorer;
pub use simple_union::SimpleUnion;

#[cfg(test)]
mod tests {

    use std::collections::BTreeSet;

    use common::BitSet;

    use super::{SimpleUnion, *};
    use crate::docset::{DocSet, SeekDangerResult, TERMINATED};
    use crate::postings::tests::test_skip_against_unoptimized;
    use crate::query::score_combiner::DoNothingCombiner;
    use crate::query::union::bitset_union::BitSetPostingUnion;
    use crate::query::{BitSetDocSet, ConstScorer, VecDocSet};
    use crate::{tests, DocId};

    /// Builds one `VecDocSet` per list of docs.
    fn vec_doc_set_from_docs_list(
        docs_list: &[Vec<DocId>],
    ) -> impl Iterator<Item = VecDocSet> + '_ {
        docs_list.iter().map(|docs| VecDocSet::from(docs.clone()))
    }
    /// Builds a `BufferedUnionScorer` over the given lists of docs.
    ///
    /// The largest doc id (0 if there are no docs) is passed as the number of docs.
    fn union_from_docs_list(docs_list: &[Vec<DocId>]) -> Box<dyn DocSet> {
        let max_doc = docs_list.iter().flatten().copied().max().unwrap_or(0);
        let scorers: Vec<ConstScorer<VecDocSet>> = vec_doc_set_from_docs_list(docs_list)
            .map(|docset| ConstScorer::new(docset, 1.0))
            .collect();
        Box::new(BufferedUnionScorer::build(
            scorers,
            DoNothingCombiner::default,
            max_doc,
        ))
    }

    /// Builds a `BitSetPostingUnion` over the given lists of docs.
    fn posting_list_union_from_docs_list(docs_list: &[Vec<DocId>]) -> Box<dyn DocSet> {
        let docsets: Vec<VecDocSet> = vec_doc_set_from_docs_list(docs_list).collect();
        let bitset = bitset_from_docs_list(docs_list);
        Box::new(BitSetPostingUnion::build(docsets, bitset))
    }
    /// Builds a boxed `SimpleUnion` with one `VecDocSet` per doc id list.
    fn simple_union_from_docs_list(docs_list: &[Vec<DocId>]) -> Box<dyn DocSet> {
        let docsets: Vec<VecDocSet> = vec_doc_set_from_docs_list(docs_list).collect();
        Box::new(SimpleUnion::build(docsets))
    }
    /// Builds a `BitSetDocSet` containing every doc id that appears in any of the lists.
    ///
    /// The bitset is created with `largest doc id + 1` as its max value (`1` if all lists
    /// are empty).
    fn bitset_from_docs_list(docs_list: &[Vec<DocId>]) -> BitSetDocSet {
        let largest_doc = docs_list.iter().flatten().copied().max().unwrap_or(0);
        let mut all_docs = BitSet::with_max_value(largest_doc + 1);
        for &doc in docs_list.iter().flatten() {
            all_docs.insert(doc);
        }
        BitSetDocSet::from(all_docs)
    }
    /// Runs `aux_test_union_with_constructor` once for each of the three union
    /// implementations.
    fn aux_test_union(docs_list: &[Vec<DocId>]) {
        let constructors = [
            posting_list_union_from_docs_list,
            simple_union_from_docs_list,
            union_from_docs_list,
        ];
        for build_union in constructors {
            aux_test_union_with_constructor(build_union, docs_list);
        }
    }
    /// Checks the union built by `constructor` against a reference union.
    ///
    /// The reference is the sorted, deduplicated set of all doc ids, wrapped in a
    /// `VecDocSet`. Both docsets are advanced in lockstep, then a freshly built union must
    /// report the same number of docs through `count_including_deleted`.
    fn aux_test_union_with_constructor<F>(constructor: F, docs_list: &[Vec<DocId>])
    where F: Fn(&[Vec<DocId>]) -> Box<dyn DocSet> {
        let expected_docs: BTreeSet<u32> = docs_list.iter().flatten().copied().collect();
        let expected_vec: Vec<u32> = expected_docs.into_iter().collect();
        let mut union_expected = VecDocSet::from(expected_vec);

        let mut union = constructor(docs_list);
        let mut num_docs = 0;
        while union.doc() != TERMINATED {
            assert_eq!(union_expected.doc(), union.doc());
            assert_eq!(union_expected.advance(), union.advance());
            num_docs += 1;
        }
        assert_eq!(union_expected.advance(), TERMINATED);

        // Counting consumes the docset, hence the second, untouched instance.
        let mut fresh_union = constructor(docs_list);
        assert_eq!(num_docs, fresh_union.count_including_deleted());
    }

    use proptest::prelude::*;

    // Property test: generates 1 to 9 doc id lists (each 1 to 9 values drawn from 0..100,
    // then sorted and deduplicated) plus up to 9 sorted seek targets from the same range,
    // and hands them to `test_docid_with_skip`.
    proptest! {
        #[test]
        fn test_union_is_same(vecs in prop::collection::vec(
            prop::collection::vec(0u32..100, 1..10)
                .prop_map(|mut inner| {
                    inner.sort_unstable();
                    inner.dedup();
                    inner
                }),
            1..10
        ),
        seek_docids in prop::collection::vec(0u32..100, 0..10).prop_map(|mut inner| {
            inner.sort_unstable();
            inner
        })) {
            test_docid_with_skip(&vecs, &seek_docids);
        }
    }

    /// Checks that the three union implementations agree with each other.
    ///
    /// First all three are advanced in lockstep until the bitset-based union terminates.
    /// Then fresh instances are sought to each of `skip_targets` in order, and must land on
    /// the same doc after every seek.
    fn test_docid_with_skip(vecs: &[Vec<DocId>], skip_targets: &[DocId]) {
        // Sequential advance.
        let mut bitset_union = posting_list_union_from_docs_list(vecs);
        let mut simple_union = simple_union_from_docs_list(vecs);
        let mut buffered_union = union_from_docs_list(vecs);
        while bitset_union.doc() != TERMINATED {
            assert_eq!(bitset_union.doc(), simple_union.doc());
            assert_eq!(bitset_union.doc(), buffered_union.doc());
            assert_eq!(bitset_union.advance(), simple_union.advance());
            assert_eq!(bitset_union.doc(), buffered_union.advance());
        }

        // Seeking, on fresh instances.
        let mut bitset_union = posting_list_union_from_docs_list(vecs);
        let mut simple_union = simple_union_from_docs_list(vecs);
        let mut buffered_union = union_from_docs_list(vecs);
        for &target in skip_targets {
            bitset_union.seek(target);
            simple_union.seek(target);
            buffered_union.seek(target);

            let reference_doc = buffered_union.doc();
            assert_eq!(reference_doc, bitset_union.doc());
            assert_eq!(reference_doc, simple_union.doc());
        }
    }

    /// Checks all union implementations against the reference union on two inputs.
    #[test]
    fn test_union() {
        // Hand-written lists: overlapping docs, a very large doc id and an empty list.
        // This case used to be run twice with byte-identical input; the duplicate only
        // repeated the same work (including a bitset sized for doc id 100_000_000).
        aux_test_union(&[
            vec![1, 3333, 100000000u32],
            vec![1, 2, 100000000u32],
            vec![1, 2, 100000000u32],
            vec![],
        ]);
        // Lists produced by `tests::sample_with_seed` with different arguments.
        aux_test_union(&[
            tests::sample_with_seed(100_000, 0.01, 1),
            tests::sample_with_seed(100_000, 0.05, 2),
            tests::sample_with_seed(100_000, 0.001, 3),
        ]);
    }

    /// Runs `test_aux_union_skip_with_constructor` once for each of the three union
    /// implementations, each with its own copy of `skip_targets`.
    fn test_aux_union_skip(docs_list: &[Vec<DocId>], skip_targets: Vec<DocId>) {
        let constructors = [
            posting_list_union_from_docs_list,
            simple_union_from_docs_list,
            union_from_docs_list,
        ];
        for build_union in constructors {
            let targets = skip_targets.clone();
            test_aux_union_skip_with_constructor(build_union, docs_list, targets);
        }
    }
    /// Checks a union implementation in two steps.
    ///
    /// First the union is advanced doc by doc and must yield exactly the sorted,
    /// deduplicated doc ids. Then `test_skip_against_unoptimized` is invoked with a factory
    /// producing fresh unions and with `skip_targets`.
    fn test_aux_union_skip_with_constructor<F>(
        constructor: F,
        docs_list: &[Vec<DocId>],
        skip_targets: Vec<DocId>,
    ) where
        F: Fn(&[Vec<DocId>]) -> Box<dyn DocSet>,
    {
        let mut expected_docs = BTreeSet::new();
        expected_docs.extend(docs_list.iter().flatten().copied());

        let mut docset = constructor(docs_list);
        for expected_doc in expected_docs {
            assert_eq!(expected_doc, docset.doc());
            docset.advance();
        }
        assert_eq!(docset.doc(), TERMINATED);

        let fresh_union = || -> Box<dyn DocSet> { constructor(docs_list) };
        test_skip_against_unoptimized(fresh_union, skip_targets);
    }

    /// Seeks to the very first doc of a union whose first list starts far later than the
    /// second one.
    #[test]
    fn test_union_skip_corner_case() {
        let docs_list = [vec![165132u32, 167382], vec![25029, 25091]];
        let skip_targets = vec![25029u32];
        test_aux_union_skip(&docs_list, skip_targets);
    }

    /// Seeks to targets located before, on and right after existing docs.
    #[test]
    fn test_union_skip_corner_case2() {
        let docs_list = [vec![1u32, 1u32 + 100], vec![2u32, 1000u32, 10_000u32]];
        let skip_targets = vec![0u32, 1u32, 2u32, 3u32, 1u32 + 100, 2u32 + 100];
        test_aux_union_skip(&docs_list, skip_targets);
    }

    /// Seeking repeatedly to the doc the union already sits on must not move it.
    #[test]
    fn test_union_skip_corner_case3() {
        let docs_list = [vec![0u32, 5u32], vec![1u32, 4u32]];
        let mut docset = posting_list_union_from_docs_list(&docs_list);
        assert_eq!(docset.doc(), 0u32);
        for _ in 0..2 {
            assert_eq!(docset.seek(0u32), 0u32);
        }
        assert_eq!(docset.doc(), 0u32)
    }

    /// Skip test on a small hand-written input, then on lists and targets produced by
    /// `tests::sample_with_seed`.
    #[test]
    fn test_union_skip_random() {
        let small_docs_list = [
            vec![1, 2, 3, 7],
            vec![1, 3, 9, 10000],
            vec![1, 3, 8, 9, 100],
        ];
        test_aux_union_skip(&small_docs_list, vec![1, 2, 3, 5, 6, 7, 8, 100]);

        let sampled_docs_list = [
            tests::sample_with_seed(100_000, 0.001, 1),
            tests::sample_with_seed(100_000, 0.002, 2),
            tests::sample_with_seed(100_000, 0.005, 3),
        ];
        let sampled_targets = tests::sample_with_seed(100_000, 0.01, 4);
        test_aux_union_skip(&sampled_docs_list, sampled_targets);
    }

    /// Skip test with targets on existing docs, between docs and past the last doc.
    #[test]
    fn test_union_skip_specific() {
        let docs_list = [
            vec![1, 2, 3, 7],
            vec![1, 3, 9, 10000],
            vec![1, 3, 8, 9, 100],
        ];
        let skip_targets = vec![1, 2, 3, 7, 8, 9, 99, 100, 101, 500, 20000];
        test_aux_union_skip(&docs_list, skip_targets);
    }

    /// Once a `BufferedUnionScorer` is exhausted, `seek_danger(TERMINATED)` must answer
    /// `SeekLowerBound(TERMINATED)`.
    #[test]
    fn test_buffered_union_seek_into_danger_zone_terminated() {
        let scorers = vec![
            ConstScorer::new(VecDocSet::from(vec![1, 2]), 1.0),
            ConstScorer::new(VecDocSet::from(vec![2, 3]), 1.0),
        ];
        let mut union_scorer =
            BufferedUnionScorer::build(scorers, DoNothingCombiner::default, 100);

        // Exhaust the union.
        while union_scorer.doc() != TERMINATED {
            union_scorer.advance();
        }
        assert_eq!(union_scorer.doc(), TERMINATED);

        let seek_result = union_scorer.seek_danger(TERMINATED);
        assert_eq!(seek_result, SeekDangerResult::SeekLowerBound(TERMINATED));
    }
}

#[cfg(all(test, feature = "unstable"))]
mod bench {

    use test::Bencher;

    use crate::query::score_combiner::DoNothingCombiner;
    use crate::query::{BufferedUnionScorer, ConstScorer, VecDocSet};
    use crate::{tests, DocId, DocSet, TERMINATED};

    /// Benchmarks building a `BufferedUnionScorer` over two sampled doc id lists and
    /// advancing it until termination.
    // NOTE(review): the name says "3" but only two lists are unioned here; confirm intent.
    #[bench]
    fn bench_union_3_high(bench: &mut Bencher) {
        let doc_id_lists: Vec<Vec<DocId>> = vec![
            tests::sample_with_seed(100_000, 0.1, 0),
            tests::sample_with_seed(100_000, 0.2, 1),
        ];
        bench.iter(|| {
            let scorers = doc_id_lists
                .iter()
                .map(|doc_ids| ConstScorer::new(VecDocSet::from(doc_ids.clone()), 1.0))
                .collect::<Vec<_>>();
            let mut union =
                BufferedUnionScorer::build(scorers, DoNothingCombiner::default, 100_000);
            while union.doc() != TERMINATED {
                union.advance();
            }
        });
    }
    /// Benchmarks building a `BufferedUnionScorer` over three sampled doc id lists and
    /// advancing it until termination.
    #[bench]
    fn bench_union_3_low(bench: &mut Bencher) {
        let doc_id_lists: Vec<Vec<DocId>> = vec![
            tests::sample_with_seed(100_000, 0.01, 0),
            tests::sample_with_seed(100_000, 0.05, 1),
            tests::sample_with_seed(100_000, 0.001, 2),
        ];
        bench.iter(|| {
            let scorers = doc_id_lists
                .iter()
                .map(|doc_ids| ConstScorer::new(VecDocSet::from(doc_ids.clone()), 1.0))
                .collect::<Vec<_>>();
            let mut union =
                BufferedUnionScorer::build(scorers, DoNothingCombiner::default, 100_000);
            while union.doc() != TERMINATED {
                union.advance();
            }
        });
    }
}


================================================
FILE: src/query/union/simple_union.rs
================================================
use crate::docset::{DocSet, TERMINATED};
use crate::postings::Postings;
use crate::DocId;

/// A `SimpleUnion` is a `DocSet` that is the union of multiple `DocSet`s.
/// Unlike `BufferedUnionScorer`, it doesn't do any horizon precomputation.
///
/// For that reason `SimpleUnion` is a good choice for queries that skip a lot.
pub struct SimpleUnion<TDocSet> {
    // Underlying docsets; `build` removes those that are already terminated.
    docsets: Vec<TDocSet>,
    // Doc the union is currently positioned on: the smallest current doc among `docsets`,
    // or `TERMINATED` when there is none.
    doc: DocId,
}

impl<TDocSet: DocSet> SimpleUnion<TDocSet> {
    /// Creates the union of `docsets`.
    ///
    /// Docsets that are already terminated are discarded, and the union is positioned on
    /// the smallest current doc of the remaining ones.
    pub(crate) fn build(mut docsets: Vec<TDocSet>) -> SimpleUnion<TDocSet> {
        docsets.retain(|docset| docset.doc() != TERMINATED);
        let mut union = SimpleUnion { docsets, doc: 0 };
        union.initialize_first_doc_id();
        union
    }

    /// Sets `self.doc` to the smallest current doc among the docsets, or to `TERMINATED`
    /// if there is no docset.
    fn initialize_first_doc_id(&mut self) {
        self.doc = self
            .docsets
            .iter()
            .fold(TERMINATED, |smallest, docset| smallest.min(docset.doc()));
    }

    /// Moves the union to its next doc and returns it.
    ///
    /// Every docset positioned at or before the current doc is advanced once; the new
    /// current doc is the smallest doc among all docsets afterwards.
    fn advance_to_next(&mut self) -> DocId {
        let current_doc = self.doc;
        self.doc = self
            .docsets
            .iter_mut()
            .fold(TERMINATED, |smallest, docset| {
                if docset.doc() <= current_doc {
                    docset.advance();
                }
                smallest.min(docset.doc())
            });
        self.doc
    }
}

impl<TDocSet: Postings> Postings for SimpleUnion<TDocSet> {
    /// Sums the term frequencies of all docsets positioned on the union's current doc.
    fn term_freq(&self) -> u32 {
        self.docsets
            .iter()
            .filter(|docset| docset.doc() == self.doc)
            .map(|docset| docset.term_freq())
            .sum()
    }

    /// Appends the positions of every docset positioned on the current doc to `output`,
    /// then sorts and deduplicates the whole `output` vector.
    fn append_positions_with_offset(&mut self, offset: u32, output: &mut Vec<u32>) {
        let current_doc = self.doc;
        for docset in self.docsets.iter_mut() {
            if docset.doc() != current_doc {
                continue;
            }
            docset.append_positions_with_offset(offset, output);
        }
        output.sort_unstable();
        output.dedup();
    }
}

impl<TDocSet: DocSet> DocSet for SimpleUnion<TDocSet> {
    /// Moves to the next doc of the union and returns it.
    fn advance(&mut self) -> DocId {
        self.advance_to_next()
    }

    /// Seeks every docset that is still before `target`, then positions the union on the
    /// smallest current doc among all docsets (`TERMINATED` if there is none).
    fn seek(&mut self, target: DocId) -> DocId {
        let mut smallest = TERMINATED;
        for docset in self.docsets.iter_mut() {
            if docset.doc() < target {
                docset.seek(target);
            }
            let candidate = docset.doc();
            if candidate < smallest {
                smallest = candidate;
            }
        }
        self.doc = smallest;
        smallest
    }

    /// Returns the doc the union is currently positioned on.
    fn doc(&self) -> DocId {
        self.doc
    }

    /// Returns the largest size hint among the docsets, or `0` without docsets.
    fn size_hint(&self) -> u32 {
        // TODO: use estimate_union
        self.docsets
            .iter()
            .fold(0u32, |largest, docset| largest.max(docset.size_hint()))
    }

    /// Returns the sum of the costs of the docsets.
    fn cost(&self) -> u64 {
        self.docsets.iter().map(|docset| docset.cost()).sum::<u64>()
    }

    /// Counts the remaining docs, current one included, by advancing until termination.
    fn count_including_deleted(&mut self) -> u32 {
        let mut num_docs = 0u32;
        while self.doc != TERMINATED {
            num_docs += 1;
            self.advance_to_next();
        }
        num_docs
    }
}


================================================
FILE: src/query/vec_docset.rs
================================================
#![allow(dead_code)]

use common::HasLen;

use crate::docset::{DocSet, TERMINATED};
use crate::DocId;

/// A `DocSet` backed by an in-memory vector of strictly increasing doc ids.
///
/// This file only implements `DocSet` and `HasLen` for it: no term frequencies or
/// positions are exposed here.
///
/// NOTE(review): it appears to exist mainly for tests and benches (see the file-level
/// `allow(dead_code)`); confirm before relying on it elsewhere.
pub struct VecDocSet {
    // Doc ids in strictly increasing order (asserted in `From<Vec<DocId>>`).
    doc_ids: Vec<DocId>,
    // Index into `doc_ids` of the current doc; equal to `doc_ids.len()` once terminated.
    cursor: usize,
}

impl From<Vec<DocId>> for VecDocSet {
    /// Wraps `doc_ids` in a `VecDocSet` positioned on its first element.
    ///
    /// # Panics
    ///
    /// Panics if `doc_ids` is not strictly increasing (duplicates are rejected too).
    fn from(doc_ids: Vec<DocId>) -> VecDocSet {
        // We do not use `slice::is_sorted`, as we want to check for doc ids to be strictly
        // sorted.
        assert!(doc_ids.windows(2).all(|w| w[0] < w[1]));
        VecDocSet { doc_ids, cursor: 0 }
    }
}

impl DocSet for VecDocSet {
    /// Moves the cursor one step forward, never past the end of the vector, and returns
    /// the doc it lands on (`TERMINATED` at the end).
    fn advance(&mut self) -> DocId {
        let end = self.doc_ids.len();
        self.cursor = (self.cursor + 1).min(end);
        self.doc()
    }

    /// Returns the doc id under the cursor, or `TERMINATED` when the cursor sits at the
    /// end of the vector.
    fn doc(&self) -> DocId {
        // The cursor never exceeds `doc_ids.len()`, so a missing element means "at the end".
        self.doc_ids
            .get(self.cursor)
            .copied()
            .unwrap_or(TERMINATED)
    }

    /// Returns the total number of doc ids in the vector, regardless of the cursor.
    fn size_hint(&self) -> u32 {
        self.len() as u32
    }
}

impl HasLen for VecDocSet {
    /// Returns the total number of doc ids held, independently of the cursor position.
    fn len(&self) -> usize {
        self.doc_ids.len()
    }
}

#[cfg(test)]
pub(crate) mod tests {

    use super::*;
    use crate::docset::COLLECT_BLOCK_BUFFER_LEN;

    /// Exercises `doc`, `advance` and `seek` on the multiples of 3 below 3072.
    #[test]
    pub fn test_vec_postings() {
        let multiples_of_three: Vec<DocId> = (0u32..3072u32).step_by(3).collect();
        let mut docset = VecDocSet::from(multiples_of_three);
        assert_eq!(docset.doc(), 0u32);
        assert_eq!(docset.advance(), 3u32);
        assert_eq!(docset.doc(), 3u32);
        // A target between two docs lands on the next doc.
        assert_eq!(docset.seek(14u32), 15u32);
        assert_eq!(docset.doc(), 15u32);
        // A target that is itself a doc lands exactly on it.
        assert_eq!(docset.seek(300u32), 300u32);
        assert_eq!(docset.doc(), 300u32);
        // A target past the last doc terminates the docset.
        assert_eq!(docset.seek(6000u32), TERMINATED);
    }

    /// Fills the collect buffer three times from a docset holding two full blocks plus
    /// nine docs, and checks the content of the two full blocks.
    #[test]
    pub fn test_fill_buffer() {
        let block_len = COLLECT_BLOCK_BUFFER_LEN as u32;
        let doc_ids: Vec<DocId> = (1u32..=(block_len * 2 + 9)).collect();
        let mut docset = VecDocSet::from(doc_ids);
        let mut buffer = [0u32; COLLECT_BLOCK_BUFFER_LEN];

        // First full block: docs 1..=block_len.
        assert_eq!(docset.fill_buffer(&mut buffer), COLLECT_BLOCK_BUFFER_LEN);
        for (idx, &doc) in buffer.iter().enumerate() {
            assert_eq!(doc, idx as u32 + 1);
        }

        // Second full block: the following block_len docs.
        assert_eq!(docset.fill_buffer(&mut buffer), COLLECT_BLOCK_BUFFER_LEN);
        for (idx, &doc) in buffer.iter().enumerate() {
            assert_eq!(doc, idx as u32 + 1 + block_len);
        }

        // Only the nine trailing docs are left.
        assert_eq!(docset.fill_buffer(&mut buffer), 9);
    }
}


================================================
FILE: src/query/weight.rs
================================================
use super::Scorer;
use crate::docset::COLLECT_BLOCK_BUFFER_LEN;
use crate::index::SegmentReader;
use crate::query::Explanation;
use crate::{DocId, DocSet, Score, TERMINATED};

/// Calls `callback` with every `(doc, score)` pair of `scorer`, starting from its current
/// doc and advancing until it is terminated.
pub(crate) fn for_each_scorer<TScorer: Scorer + ?Sized>(
    scorer: &mut TScorer,
    callback: &mut dyn FnMut(DocId, Score),
) {
    let mut current_doc = scorer.doc();
    loop {
        if current_doc == TERMINATED {
            break;
        }
        let score = scorer.score();
        callback(current_doc, score);
        current_doc = scorer.advance();
    }
}

/// Drains `docset` block by block through `buffer`.
///
/// `callback` receives the filled prefix of `buffer` after each `fill_buffer` call. The
/// loop stops after the first block that is not completely full, so the last slice handed
/// to `callback` may be empty.
#[inline]
pub(crate) fn for_each_docset_buffered<T: DocSet + ?Sized>(
    docset: &mut T,
    buffer: &mut [DocId; COLLECT_BLOCK_BUFFER_LEN],
    mut callback: impl FnMut(&[DocId]),
) {
    let capacity = buffer.len();
    // Starting at `capacity` guarantees at least one `fill_buffer` call.
    let mut num_filled = capacity;
    while num_filled == capacity {
        num_filled = docset.fill_buffer(buffer);
        callback(&buffer[..num_filled]);
    }
}

/// Calls `callback` with every `(doc, score)` whose score strictly exceeds the current
/// threshold.
///
/// The value returned by `callback` becomes the new threshold for the following docs.
///
/// This method is useful for the [`TopDocs`](crate::collector::TopDocs) collector.
/// For all docsets, the blanket implementation has the benefit
/// of prefiltering (doc, score) pairs, avoiding the
/// virtual dispatch cost.
///
/// More importantly, it makes it possible for scorers to implement
/// important optimizations (e.g. BlockWAND for union).
pub(crate) fn for_each_pruning_scorer<TScorer: Scorer + ?Sized>(
    scorer: &mut TScorer,
    mut threshold: Score,
    callback: &mut dyn FnMut(DocId, Score) -> Score,
) {
    let mut current_doc = scorer.doc();
    loop {
        if current_doc == TERMINATED {
            break;
        }
        let score = scorer.score();
        if score > threshold {
            threshold = callback(current_doc, score);
        }
        current_doc = scorer.advance();
    }
}

/// A Weight is the specialization of a `Query`
/// for a given set of segments.
///
/// See [`Query`](crate::query::Query).
pub trait Weight: Send + Sync + 'static {
    /// Returns the scorer for the given segment.
    ///
    /// `boost` is a multiplier to apply to the score.
    ///
    /// See [`Query`](crate::query::Query).
    fn scorer(&self, reader: &SegmentReader, boost: Score) -> crate::Result<Box<dyn Scorer>>;

    /// Returns an [`Explanation`] for the given document.
    fn explain(&self, reader: &SegmentReader, doc: DocId) -> crate::Result<Explanation>;

    /// Returns the number of matching documents within the given [`SegmentReader`].
    ///
    /// When the reader exposes an alive bitset, the count is restricted through it;
    /// otherwise deleted documents are included.
    fn count(&self, reader: &SegmentReader) -> crate::Result<u32> {
        let mut scorer = self.scorer(reader, 1.0)?;
        let num_docs = match reader.alive_bitset() {
            Some(alive_bitset) => scorer.count(alive_bitset),
            None => scorer.count_including_deleted(),
        };
        Ok(num_docs)
    }

    /// Iterates through all of the documents matched by the scorer
    /// and passes each `(doc, score)` pair to `callback`.
    fn for_each(
        &self,
        reader: &SegmentReader,
        callback: &mut dyn FnMut(DocId, Score),
    ) -> crate::Result<()> {
        let mut boxed_scorer = self.scorer(reader, 1.0)?;
        for_each_scorer(&mut *boxed_scorer, callback);
        Ok(())
    }

    /// Iterates through all of the documents matched by the scorer
    /// and passes them to `callback` in blocks of doc ids, without scores.
    fn for_each_no_score(
        &self,
        reader: &SegmentReader,
        callback: &mut dyn FnMut(&[DocId]),
    ) -> crate::Result<()> {
        let mut block_buffer = [0u32; COLLECT_BLOCK_BUFFER_LEN];
        let mut docset = self.scorer(reader, 1.0)?;
        for_each_docset_buffered(&mut docset, &mut block_buffer, callback);
        Ok(())
    }

    /// Calls `callback` with all of the `(doc, score)` for which score
    /// is exceeding a given threshold.
    ///
    /// This method is useful for the [`TopDocs`](crate::collector::TopDocs) collector.
    /// For all docsets, the blanket implementation has the benefit
    /// of prefiltering (doc, score) pairs, avoiding the
    /// virtual dispatch cost.
    ///
    /// More importantly, it makes it possible for scorers to implement
    /// important optimizations (e.g. BlockWAND for union).
    fn for_each_pruning(
        &self,
        threshold: Score,
        reader: &SegmentReader,
        callback: &mut dyn FnMut(DocId, Score) -> Score,
    ) -> crate::Result<()> {
        let mut boxed_scorer = self.scorer(reader, 1.0)?;
        for_each_pruning_scorer(&mut *boxed_scorer, threshold, callback);
        Ok(())
    }
}


================================================
FILE: src/reader/mod.rs
================================================
mod warming;

use std::sync::atomic::AtomicU64;
use std::sync::{atomic, Arc, Weak};

use arc_swap::ArcSwap;
pub use warming::Warmer;

use self::warming::WarmingState;
use crate::core::searcher::{SearcherGeneration, SearcherInner};
use crate::directory::{Directory, WatchCallback, WatchHandle, META_LOCK};
use crate::store::DOCSTORE_CACHE_CAPACITY;
use crate::{Index, Inventory, Searcher, SegmentReader, TrackedObject};

/// Defines when a new version of the index should be reloaded.
///
/// Regardless of whether you search and index in the same process, tantivy does not
/// necessarily reflect the changes that are committed to your index. `ReloadPolicy` lets you
/// define precisely when you want your index to be reloaded.
///
/// The enum is `Copy` and implements `Debug`, `PartialEq` and `Eq`, so a policy can be
/// logged and compared directly.
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
pub enum ReloadPolicy {
    /// The index is entirely reloaded manually.
    /// All updates of the index should be manual.
    ///
    /// No change is reflected automatically. You are required to call [`IndexReader::reload()`]
    /// manually.
    Manual,
    /// The index is reloaded within milliseconds after a new commit is available.
    /// This is made possible by watching changes in the `meta.json` file.
    OnCommitWithDelay, // TODO add NEAR_REAL_TIME(target_ms)
}

/// [`IndexReader`] builder
///
/// It makes it possible to configure:
/// - [`ReloadPolicy`] defining when new index versions are detected
/// - [`Warmer`] implementations
/// - number of warming threads, for parallelizing warming work
/// - The cache size of the underlying doc store readers.
#[derive(Clone)]
pub struct IndexReaderBuilder {
    // Defaults to `ReloadPolicy::OnCommitWithDelay` (see `new`).
    reload_policy: ReloadPolicy,
    // Index the reader is built for.
    index: Index,
    // Warmers handed to the `WarmingState`; held as weak references. Empty by default.
    warmers: Vec<Weak<dyn Warmer>>,
    // Defaults to 1.
    num_warming_threads: usize,
    // Defaults to `DOCSTORE_CACHE_CAPACITY`.
    doc_store_cache_num_blocks: usize,
}

impl IndexReaderBuilder {
    /// Creates a builder for `index` with the default settings:
    /// [`ReloadPolicy::OnCommitWithDelay`], no warmers, a single warming thread and
    /// `DOCSTORE_CACHE_CAPACITY` doc store cache blocks.
    #[must_use]
    pub(crate) fn new(index: Index) -> IndexReaderBuilder {
        Self {
            index,
            reload_policy: ReloadPolicy::OnCommitWithDelay,
            warmers: Vec::new(),
            num_warming_threads: 1,
            doc_store_cache_num_blocks: DOCSTORE_CACHE_CAPACITY,
        }
    }

    /// Builds the reader.
    ///
    /// Building the reader is a non-trivial operation that requires
    /// to open different segment readers. It may take hundreds of milliseconds
    /// of time and it may return an error.
    ///
    /// With [`ReloadPolicy::OnCommitWithDelay`], a watch callback that reloads the reader
    /// is registered on the index directory; reload failures in that callback are logged.
    pub fn try_into(self) -> crate::Result<IndexReader> {
        let IndexReaderBuilder {
            reload_policy,
            index,
            warmers,
            num_warming_threads,
            doc_store_cache_num_blocks,
        } = self;

        let searcher_generation_inventory = Inventory::default();
        let warming_state = WarmingState::new(
            num_warming_threads,
            warmers,
            searcher_generation_inventory.clone(),
        )?;
        let inner = Arc::new(InnerIndexReader::new(
            doc_store_cache_num_blocks,
            index,
            warming_state,
            searcher_generation_inventory,
        )?);

        let watch_handle_opt: Option<WatchHandle> = match reload_policy {
            // Nothing to watch: reloads only happen on explicit `reload()` calls.
            ReloadPolicy::Manual => None,
            ReloadPolicy::OnCommitWithDelay => {
                let reader_for_callback = Arc::clone(&inner);
                let reload_on_commit = move || {
                    if let Err(err) = reader_for_callback.reload() {
                        error!("Error while loading searcher after commit was detected. {err:?}");
                    }
                };
                let watch_callback = WatchCallback::new(reload_on_commit);
                Some(inner.index.directory().watch(watch_callback)?)
            }
        };

        Ok(IndexReader {
            inner,
            _watch_handle_opt: watch_handle_opt,
        })
    }

    /// Sets the reload_policy.
    ///
    /// See [`ReloadPolicy`] for more details.
    #[must_use]
    pub fn reload_policy(self, reload_policy: ReloadPolicy) -> IndexReaderBuilder {
        IndexReaderBuilder {
            reload_policy,
            ..self
        }
    }

    /// Sets the cache size of the doc store readers.
    ///
    /// The doc store readers cache by default DOCSTORE_CACHE_CAPACITY(100) decompressed blocks.
    #[must_use]
    pub fn doc_store_cache_num_blocks(
        self,
        doc_store_cache_num_blocks: usize,
    ) -> IndexReaderBuilder {
        IndexReaderBuilder {
            doc_store_cache_num_blocks,
            ..self
        }
    }

    /// Set the [`Warmer`]s that are invoked when reloading searchable segments.
    ///
    /// Any previously configured list is replaced.
    #[must_use]
    pub fn warmers(self, warmers: Vec<Weak<dyn Warmer>>) -> IndexReaderBuilder {
        IndexReaderBuilder { warmers, ..self }
    }

    /// Sets the number of warming threads.
    ///
    /// This allows parallelizing warming work when there are multiple [`Warmer`] registered with
    /// the [`IndexReader`].
    #[must_use]
    pub fn num_warming_threads(self, num_warming_threads: usize) -> IndexReaderBuilder {
        IndexReaderBuilder {
            num_warming_threads,
            ..self
        }
    }
}

/// Trait counterpart of the inherent [`IndexReaderBuilder::try_into`] method.
impl TryInto<IndexReader> for IndexReaderBuilder {
    type Error = crate::TantivyError;

    /// Delegates to the inherent `IndexReaderBuilder::try_into`.
    fn try_into(self) -> crate::Result<IndexReader> {
        // Fully qualified path: selects the inherent method explicitly.
        IndexReaderBuilder::try_into(self)
    }
}

/// State shared by all clones of an `IndexReader` (it is held behind an `Arc`).
struct InnerIndexReader {
    // Forwarded to every `SearcherInner` created by `create_searcher`.
    doc_store_cache_num_blocks: usize,
    index: Index,
    // Used to warm every newly created searcher.
    warming_state: WarmingState,
    // Most recently loaded searcher; replaced as a whole by `reload`.
    searcher: arc_swap::ArcSwap<SearcherInner>,
    // Incremented once per created searcher to produce its generation id.
    searcher_generation_counter: Arc<AtomicU64>,
    // Inventory in which the generation of every created searcher is tracked.
    searcher_generation_inventory: Inventory<SearcherGeneration>,
}

impl InnerIndexReader {
    fn new(
        doc_store_cache_num_blocks: usize,
        index: Index,
        warming_state: WarmingState,
        // The searcher_generation_inventory is not used as source, but as target to track the
        // loaded segments.
        searcher_generation_inventory: Inventory<SearcherGeneration>,
    ) -> crate::Result<Self> {
        let searcher_generation_counter: Arc<AtomicU64> = Default::default();

        let searcher = Self::create_searcher(
            &index,
            doc_store_cache_num_blocks,
            &warming_state,
            &searcher_generation_counter,
            &searcher_generation_inventory,
        )?;
        Ok(InnerIndexReader {
            doc_store_cache_num_blocks,
            index,
            warming_state,
            searcher: ArcSwap::from(searcher),
            searcher_generation_counter,
            searcher_generation_inventory,
        })
    }
    /// Opens the freshest segments [`SegmentReader`].
    ///
    /// This function acquires a lock to prevent GC from removing files
    /// as we are opening our index.
    fn open_segment_readers(index: &Index) -> crate::Result<Vec<SegmentReader>> {
        // Prevents segment files from getting deleted while we are in the process of opening them
        let _meta_lock = index.directory().acquire_lock(&META_LOCK)?;
        let searchable_segments = index.searchable_segments()?;
        let segment_readers = searchable_segments
            .iter()
            .map(SegmentReader::open)
            .collect::<crate::Result<_>>()?;
        Ok(segment_readers)
    }

    fn track_segment_readers_in_inventory(
        segment_readers: &[SegmentReader],
        searcher_generation_counter: &Arc<AtomicU64>,
        searcher_generation_inventory: &Inventory<SearcherGeneration>,
    ) -> TrackedObject<SearcherGeneration> {
        let generation_id = searcher_generation_counter.fetch_add(1, atomic::Ordering::AcqRel);
        let searcher_generation =
            SearcherGeneration::from_segment_readers(segment_readers, generation_id);
        searcher_generation_inventory.track(searcher_generation)
    }

    fn create_searcher(
        index: &Index,
        doc_store_cache_num_blocks: usize,
        warming_state: &WarmingState,
        searcher_generation_counter: &Arc<AtomicU64>,
        searcher_generation_inventory: &Inventory<SearcherGeneration>,
    ) -> crate::Result<Arc<SearcherInner>> {
        let segment_readers = Self::open_segment_readers(index)?;
        let searcher_generation = Self::track_segment_readers_in_inventory(
            &segment_readers,
            searcher_generation_counter,
            searcher_generation_inventory,
        );

        let schema = index.schema();
        let searcher = Arc::new(SearcherInner::new(
            schema,
            index.clone(),
            segment_readers,
            searcher_generation,
            doc_store_cache_num_blocks,
        )?);

        warming_state.warm_new_searcher_generation(&searcher.clone().into())?;
        Ok(searcher)
    }

    fn reload(&self) -> crate::Result<()> {
        let searcher = Self::create_searcher(
            &self.index,
            self.doc_store_cache_num_blocks,
            &self.warming_state,
            &self.searcher_generation_counter,
            &self.searcher_generation_inventory,
        )?;

        self.searcher.store(searcher);

        Ok(())
    }

    fn searcher(&self) -> Searcher {
        self.searcher.load().clone().into()
    }
}

/// `IndexReader` is your entry point to read and search the index.
///
/// It controls when a new version of the index should be loaded and lends
/// you instances of `Searcher` for the last loaded version.
///
/// `IndexReader` just wraps an `Arc`.
#[derive(Clone)]
pub struct IndexReader {
    // Shared state; cloning the reader clones this `Arc`.
    inner: Arc<InnerIndexReader>,
    // Handle of the directory watch registered under `ReloadPolicy::OnCommitWithDelay`;
    // `None` under `ReloadPolicy::Manual`. Never read, only kept alongside the reader.
    _watch_handle_opt: Option<WatchHandle>,
}

impl IndexReader {
    /// Returns a clone of the index this reader was built for (test-only helper).
    #[cfg(test)]
    pub(crate) fn index(&self) -> Index {
        self.inner.index.clone()
    }

    /// Update searchers so that they reflect the state of the last
    /// `.commit()`.
    ///
    /// If you set up the [`ReloadPolicy::OnCommitWithDelay`] (which is the default)
    /// every commit should be rapidly reflected on your `IndexReader` and you should
    /// not need to call `reload()` at all.
    ///
    /// This automatic reload can take 10s of milliseconds to kick in however, and in unit tests
    /// it can be nice to deterministically force the reload of searchers.
    ///
    /// # Errors
    ///
    /// Returns the error raised while creating the new searcher, if any.
    pub fn reload(&self) -> crate::Result<()> {
        self.inner.reload()
    }

    /// Returns a searcher
    ///
    /// This method should be called every single time a search
    /// query is performed.
    ///
    /// The same searcher must be used for a given query, as it ensures
    /// the use of a consistent segment set.
    pub fn searcher(&self) -> Searcher {
        self.inner.searcher()
    }
}


================================================
FILE: src/reader/warming.rs
================================================
use std::collections::HashSet;
use std::ops::Deref;
use std::sync::{Arc, Mutex, Weak};
use std::thread::JoinHandle;
use std::time::Duration;

use crate::{Executor, Inventory, Searcher, SearcherGeneration, TantivyError};

/// One second.
// NOTE(review): presumably the period of the background GC thread that triggers
// `Warmer::garbage_collect`; its use is not visible in this part of the file, confirm.
pub const GC_INTERVAL: Duration = Duration::from_secs(1);

/// `Warmer` can be used to maintain segment-level state e.g. caches.
///
/// They must be registered with the [`IndexReaderBuilder`](super::IndexReaderBuilder).
///
/// Implementations must be `Send + Sync`.
pub trait Warmer: Sync + Send {
    /// Perform any warming work using the provided [`Searcher`].
    ///
    /// # Errors
    ///
    /// Implementations report a failed warm-up through the returned `crate::Result`.
    fn warm(&self, searcher: &Searcher) -> crate::Result<()>;

    /// Discards internal state for any [`SearcherGeneration`] not provided.
    ///
    /// `live_generations` lists the generations whose state must be kept.
    fn garbage_collect(&self, live_generations: &[&SearcherGeneration]);
}

/// Warming-related state with interior mutability.
///
/// The state lives in an `Arc<Mutex<_>>`, so clones share the same `WarmingStateInner`.
#[derive(Clone)]
pub(crate) struct WarmingState(Arc<Mutex<WarmingStateInner>>);

impl WarmingState {
    pub fn new(
        num_warming_threads: usize,
        warmers: Vec<Weak<dyn Warmer>>,
        searcher_generation_inventory: Inventory<SearcherGeneration>,
    ) -> crate::Result<Self> {
        Ok(Self(Arc::new(Mutex::new(WarmingStateInner {
            num_warming_threads,
            warmers,
            gc_thread: None,
            warmed_generation_ids: Default::default(),
            searcher_generation_inventory,
        }))))
    }

    /// Start tracking a new generation of [`Searcher`], and [`Warmer::warm`] it if there are active
    /// warmers.
    ///
    /// A background GC thread for [`Warmer::garbage_collect`] calls is uniquely created if there
    /// are active warmers.
    pub fn warm_new_searcher_generation(&self, searcher: &Searcher) -> crate::Result<()> {
        self.0
            .lock()
            .unwrap()
            .warm_new_searcher_generation(searcher, &self.0)
    }

    #[cfg(test)]
    fn gc_maybe(&self) -> bool {
        self.0.lock().unwrap().gc_maybe()
    }
}

/// Mutable warming state, guarded by the mutex held in `WarmingState`. The background GC
/// thread only keeps a `Weak` reference to it.
struct WarmingStateInner {
    // Upper bound on the number of threads used to run the warmers.
    num_warming_threads: usize,
    // Registered warmers, held weakly: warmers that can no longer be upgraded are pruned.
    warmers: Vec<Weak<dyn Warmer>>,
    // Handle of the background GC thread; `None` until the thread has been spawned.
    gc_thread: Option<JoinHandle<()>>,
    // Contains all generations that have been warmed up.
    // This set is used to avoid triggering the individual Warmer GCs
    // if no warmed generation needs to be collected.
    warmed_generation_ids: HashSet<u64>,
    // Inventory used to list the searcher generations that are still alive.
    searcher_generation_inventory: Inventory<SearcherGeneration>,
}

impl WarmingStateInner {
    /// Start tracking provided searcher as an exemplar of a new generation.
    ///
    /// If there are active warmers, make sure the background GC thread has been started,
    /// record the searcher's generation id as warmed and run [`Warmer::warm`] on every active
    /// warmer. If there are no active warmers this is a no-op: no thread is spawned and no
    /// generation is recorded.
    ///
    /// `this` is the `Arc` through which `self` is shared; it is only downgraded in order to
    /// hand a weak reference to the GC thread.
    ///
    /// # Errors
    ///
    /// Returns an error if the GC thread cannot be spawned, if the warming executor cannot be
    /// created, or if running the warmers through the executor fails.
    fn warm_new_searcher_generation(
        &mut self,
        searcher: &Searcher,
        this: &Arc<Mutex<Self>>,
    ) -> crate::Result<()> {
        let warmers = self.pruned_warmers();
        // Avoid threads (warming as well as background GC) if there are no warmers
        if warmers.is_empty() {
            return Ok(());
        }
        self.start_gc_thread_maybe(this)?;
        self.warmed_generation_ids
            .insert(searcher.generation().generation_id());
        // Never use more threads than there are warmers to run.
        warming_executor(self.num_warming_threads.min(warmers.len()))?
            .map(|warmer| warmer.warm(searcher), warmers.into_iter())?;
        Ok(())
    }

    /// Attempt to upgrade the weak `Warmer` references, pruning those which cannot be upgraded.
    /// Return the strong references.
    fn pruned_warmers(&mut self) -> Vec<Arc<dyn Warmer>> {
        let strong_warmers = self
            .warmers
            .iter()
            .filter_map(|weak_warmer| weak_warmer.upgrade())
            .collect::<Vec<_>>();
        // Only remember the warmers that are still alive.
        self.warmers = strong_warmers.iter().map(Arc::downgrade).collect();
        strong_warmers
    }

    /// [`Warmer::garbage_collect`] active warmers if some searcher generation is observed to have
    /// been dropped.
    ///
    /// Returns `true` iff the warmers were asked to collect, i.e. iff at least one warmed
    /// generation is no longer listed by the searcher generation inventory.
    fn gc_maybe(&mut self) -> bool {
        let live_generations = self.searcher_generation_inventory.list();
        let live_generation_ids: HashSet<u64> = live_generations
            .iter()
            .map(|searcher_generation| searcher_generation.generation_id())
            .collect();
        let gc_not_required = self
            .warmed_generation_ids
            .iter()
            .all(|warmed_up_generation| live_generation_ids.contains(warmed_up_generation));
        if gc_not_required {
            return false;
        }
        let live_generation_refs = live_generations
            .iter()
            .map(Deref::deref)
            .collect::<Vec<_>>();
        for warmer in self.pruned_warmers() {
            warmer.garbage_collect(&live_generation_refs);
        }
        self.warmed_generation_ids = live_generation_ids;
        true
    }

    /// Start GC thread if one has not already been started.
    ///
    /// Returns `Ok(true)` if a thread was spawned by this call and `Ok(false)` if one was
    /// already registered.
    ///
    /// # Errors
    ///
    /// Returns [`TantivyError::SystemError`] if the thread cannot be spawned.
    fn start_gc_thread_maybe(&mut self, this: &Arc<Mutex<Self>>) -> crate::Result<bool> {
        if self.gc_thread.is_some() {
            return Ok(false);
        }
        // The thread only gets a weak reference so that it does not keep the state alive.
        let weak_inner = Arc::downgrade(this);
        let handle = std::thread::Builder::new()
            .name("tantivy-warm-gc".to_owned())
            .spawn(|| Self::gc_loop(weak_inner))
            .map_err(|_| {
                TantivyError::SystemError("Failed to spawn warmer GC thread".to_owned())
            })?;
        self.gc_thread = Some(handle);
        Ok(true)
    }

    /// Every [`GC_INTERVAL`] attempt to GC, with panics caught and logged using
    /// [`std::panic::catch_unwind`].
    ///
    /// The loop ends as soon as the weak reference can no longer be upgraded, which lets the
    /// GC thread exit once the warming state has been dropped.
    fn gc_loop(inner: Weak<Mutex<WarmingStateInner>>) {
        for _ in crossbeam_channel::tick(GC_INTERVAL) {
            // A failed upgrade is permanent: every strong reference is gone, so there is
            // nothing left to collect and ticking any further would only leak this thread.
            let strong_inner = match inner.upgrade() {
                Some(strong_inner) => strong_inner,
                None => break,
            };
            // rely on deterministic gc in tests
            #[cfg(not(test))]
            if let Err(err) = std::panic::catch_unwind(|| strong_inner.lock().unwrap().gc_maybe())
            {
                error!("Panic in Warmer GC {err:?}");
            }
            // avoid unused var warning in tests
            #[cfg(test)]
            drop(strong_inner);
        }
    }
}

/// Picks the executor used to run the warmers: a single-threaded one for zero or one thread,
/// otherwise a multi-threaded one whose threads are named with the `tantivy-warm-` prefix.
fn warming_executor(num_threads: usize) -> crate::Result<Executor> {
    match num_threads {
        0 | 1 => Ok(Executor::single_thread()),
        _ => Executor::multi_thread(num_threads, "tantivy-warm-"),
    }
}

#[cfg(test)]
mod tests {
    use std::collections::HashSet;
    use std::sync::atomic::{self, AtomicUsize};
    use std::sync::{Arc, RwLock, Weak};

    use super::Warmer;
    use crate::core::searcher::SearcherGeneration;
    use crate::directory::RamDirectory;
    use crate::index::SegmentId;
    use crate::indexer::index_writer::MEMORY_BUDGET_NUM_BYTES_MIN;
    use crate::schema::{Schema, INDEXED};
    use crate::{Index, IndexSettings, ReloadPolicy, Searcher};

    /// Test [`Warmer`] that counts its `warm` / `garbage_collect` calls and remembers the
    /// segment ids it currently considers active.
    #[derive(Default)]
    struct TestWarmer {
        active_segment_ids: RwLock<HashSet<SegmentId>>,
        warm_calls: AtomicUsize,
        gc_calls: AtomicUsize,
    }

    impl TestWarmer {
        /// Snapshot of the segment ids currently recorded as active.
        fn live_segment_ids(&self) -> HashSet<SegmentId> {
            self.active_segment_ids.read().unwrap().clone()
        }

        /// Number of `warm` calls observed so far.
        fn warm_calls(&self) -> usize {
            self.warm_calls.load(atomic::Ordering::Acquire)
        }

        /// Number of `garbage_collect` calls observed so far.
        fn gc_calls(&self) -> usize {
            self.gc_calls.load(atomic::Ordering::Acquire)
        }

        /// Asserts the call counters and the set of active segment ids all at once.
        fn verify(
            &self,
            expected_warm_calls: usize,
            expected_gc_calls: usize,
            expected_segment_ids: HashSet<SegmentId>,
        ) {
            assert_eq!(self.warm_calls(), expected_warm_calls);
            assert_eq!(self.gc_calls(), expected_gc_calls);
            assert_eq!(self.live_segment_ids(), expected_segment_ids);
        }
    }

    impl Warmer for TestWarmer {
        // Counts the call and adds every segment of the searcher to the active set.
        fn warm(&self, searcher: &crate::Searcher) -> crate::Result<()> {
            self.warm_calls.fetch_add(1, atomic::Ordering::SeqCst);
            for reader in searcher.segment_readers() {
                self.active_segment_ids
                    .write()
                    .unwrap()
                    .insert(reader.segment_id());
            }
            Ok(())
        }

        // Counts the call and replaces the active set with the segments of the live
        // generations.
        fn garbage_collect(&self, live_generations: &[&SearcherGeneration]) {
            self.gc_calls
                .fetch_add(1, std::sync::atomic::Ordering::SeqCst);
            let active_segment_ids = live_generations
                .iter()
                .flat_map(|searcher_generation| searcher_generation.segments().keys().copied())
                .collect();
            *self.active_segment_ids.write().unwrap() = active_segment_ids;
        }
    }

    /// Collects the ids of all the segments read by `searcher`.
    fn segment_ids(searcher: &Searcher) -> HashSet<SegmentId> {
        searcher
            .segment_readers()
            .iter()
            .map(|reader| reader.segment_id())
            .collect()
    }

    /// End-to-end warming scenario, parameterized by the number of warming threads: warm a
    /// first generation, reload into a second one, then check that GC only happens once the
    /// old searcher is gone. GC is triggered by hand through `gc_maybe`.
    fn test_warming(num_warming_threads: usize) -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let field = schema_builder.add_u64_field("pk", INDEXED);
        let schema = schema_builder.build();

        let directory = RamDirectory::create();
        let index = Index::create(directory, schema, IndexSettings::default())?;

        let num_writer_threads = 4;
        let mut writer = index
            .writer_with_num_threads(
                num_writer_threads,
                MEMORY_BUDGET_NUM_BYTES_MIN * num_writer_threads,
            )
            .unwrap();

        for i in 0u64..1000u64 {
            writer.add_document(doc!(field => i))?;
        }
        writer.commit()?;

        let warmer1 = Arc::new(TestWarmer::default());
        let warmer2 = Arc::new(TestWarmer::default());
        warmer1.verify(0, 0, HashSet::new());
        warmer2.verify(0, 0, HashSet::new());

        let num_searchers = 4;
        // Manual reload policy: new generations only appear on explicit `reload()` calls.
        let reader = index
            .reader_builder()
            .reload_policy(ReloadPolicy::Manual)
            .num_warming_threads(num_warming_threads)
            .warmers(vec![
                Arc::downgrade(&warmer1) as Weak<dyn Warmer>,
                Arc::downgrade(&warmer2) as Weak<dyn Warmer>,
            ])
            .try_into()?;

        let warming_state = &reader.inner.warming_state;

        let searcher = reader.searcher();
        assert!(
            !warming_state.gc_maybe(),
            "no GC after first searcher generation"
        );
        warmer1.verify(1, 0, segment_ids(&searcher));
        warmer2.verify(1, 0, segment_ids(&searcher));
        assert_eq!(searcher.num_docs(), 1000);

        for i in 1000u64..2000u64 {
            writer.add_document(doc!(field => i))?;
        }
        writer.commit()?;
        writer.wait_merging_threads()?;

        // From here on only `warmer2` is still alive, so only its counters are checked.
        drop(warmer1);

        let old_searcher = searcher;

        reader.reload()?;

        assert!(!warming_state.gc_maybe(), "old searcher still around");

        let searcher = reader.searcher();
        assert_eq!(searcher.num_docs(), 2000);

        // No GC happened yet, so the warmer still tracks the segments of both generations.
        warmer2.verify(
            2,
            0,
            segment_ids(&old_searcher)
                .union(&segment_ids(&searcher))
                .copied()
                .collect(),
        );

        drop(old_searcher);
        for _ in 0..num_searchers {
            // make sure the old searcher is dropped by the pool too
            let _ = reader.searcher();
        }
        assert!(warming_state.gc_maybe(), "old searcher dropped");

        warmer2.verify(2, 1, segment_ids(&searcher));

        Ok(())
    }

    #[test]
    fn warming_single_thread() -> crate::Result<()> {
        test_warming(1)
    }

    #[test]
    fn warming_four_threads() -> crate::Result<()> {
        test_warming(4)
    }
}


================================================
FILE: src/schema/bytes_options.rs
================================================
use std::ops::BitOr;

use serde::{Deserialize, Serialize};

use super::flags::{FastFlag, IndexedFlag, SchemaFlagList, StoredFlag};
/// Define how a bytes field should be handled by tantivy.
///
/// Deserialization goes through the private `BytesOptionsDeser` intermediary
/// (see the `#[serde(from = ...)]` attribute).
#[derive(Clone, Debug, Default, PartialEq, Eq, Serialize, Deserialize)]
#[serde(from = "BytesOptionsDeser")]
pub struct BytesOptions {
    // Whether the field is indexed.
    indexed: bool,
    // Whether the field is normed.
    fieldnorms: bool,
    // Whether the field is a fast field.
    fast: bool,
    // Whether the field is stored.
    stored: bool,
}

/// For backward compatibility we add an intermediary to interpret the
/// lack of fieldnorms attribute as "true" if and only if indexed.
///
/// (Downstream, for the moment, this attribute is not used if not indexed...)
/// Note that newly serialized `BytesOptions` will include the new attribute.
#[derive(Deserialize)]
struct BytesOptionsDeser {
    indexed: bool,
    // `None` when the attribute is absent from the serialized form.
    #[serde(default)]
    fieldnorms: Option<bool>,
    fast: bool,
    stored: bool,
}

impl From<BytesOptionsDeser> for BytesOptions {
    fn from(deser: BytesOptionsDeser) -> Self {
        BytesOptions {
            indexed: deser.indexed,
            fieldnorms: deser.fieldnorms.unwrap_or(deser.indexed),
            fast: deser.fast,
            stored: deser.stored,
        }
    }
}

impl BytesOptions {
    /// Returns true if the value is indexed.
    #[inline]
    pub fn is_indexed(&self) -> bool {
        self.indexed
    }

    /// Returns true if and only if the value is normed.
    #[inline]
    pub fn fieldnorms(&self) -> bool {
        self.fieldnorms
    }

    /// Returns true if the value is a fast field.
    #[inline]
    pub fn is_fast(&self) -> bool {
        self.fast
    }

    /// Returns true if the value is stored.
    #[inline]
    pub fn is_stored(&self) -> bool {
        self.stored
    }

    /// Set the field as indexed.
    ///
    /// Setting an integer as indexed will generate
    /// a posting list for each value taken by the integer.
    #[must_use]
    pub fn set_indexed(mut self) -> BytesOptions {
        self.indexed = true;
        self
    }

    /// Set the field as normed.
    ///
    /// Setting an integer as normed will generate
    /// the fieldnorm data for it.
    #[must_use]
    pub fn set_fieldnorms(mut self) -> BytesOptions {
        self.fieldnorms = true;
        self
    }

    /// Set the field as a fast field.
    ///
    /// Fast fields are designed for random access.
    #[must_use]
    pub fn set_fast(mut self) -> BytesOptions {
        self.fast = true;
        self
    }

    /// Set the field as stored.
    ///
    /// Only the fields that are set as *stored* are
    /// persisted into the Tantivy's store.
    #[must_use]
    pub fn set_stored(mut self) -> BytesOptions {
        self.stored = true;
        self
    }
}

impl<T: Into<BytesOptions>> BitOr<T> for BytesOptions {
    type Output = BytesOptions;

    /// Merges two sets of options: a flag is set in the result if it is set on either side.
    fn bitor(self, other: T) -> BytesOptions {
        let rhs: BytesOptions = other.into();
        BytesOptions {
            indexed: self.indexed || rhs.indexed,
            fieldnorms: self.fieldnorms || rhs.fieldnorms,
            stored: self.stored || rhs.stored,
            fast: self.fast || rhs.fast,
        }
    }
}

impl From<()> for BytesOptions {
    fn from(_: ()) -> Self {
        Self::default()
    }
}

impl From<FastFlag> for BytesOptions {
    fn from(_: FastFlag) -> Self {
        BytesOptions {
            indexed: false,
            fieldnorms: false,
            stored: false,
            fast: true,
        }
    }
}

impl From<StoredFlag> for BytesOptions {
    fn from(_: StoredFlag) -> Self {
        BytesOptions {
            indexed: false,
            fieldnorms: false,
            stored: true,
            fast: false,
        }
    }
}

impl From<IndexedFlag> for BytesOptions {
    fn from(_: IndexedFlag) -> Self {
        BytesOptions {
            indexed: true,
            fieldnorms: true,
            stored: false,
            fast: false,
        }
    }
}

impl<Head, Tail> From<SchemaFlagList<Head, Tail>> for BytesOptions
where
    Head: Clone,
    Tail: Clone,
    Self: BitOr<Output = Self> + From<Head> + From<Tail>,
{
    /// Converts the head and the tail of the flag list separately, then merges both results
    /// with `|`.
    fn from(head_tail: SchemaFlagList<Head, Tail>) -> Self {
        let head_options = Self::from(head_tail.head);
        let tail_options = Self::from(head_tail.tail);
        head_options | tail_options
    }
}

#[cfg(test)]
mod tests {
    use crate::schema::{BytesOptions, FAST, INDEXED, STORED};

    // Each single flag converts to the same options as the matching builder calls.
    #[test]
    fn test_bytes_option_fast_flag() {
        assert_eq!(BytesOptions::default().set_fast(), FAST.into());
        assert_eq!(
            BytesOptions::default().set_indexed().set_fieldnorms(),
            INDEXED.into()
        );
        assert_eq!(BytesOptions::default().set_stored(), STORED.into());
    }
    // Flags combined with `|` convert to the same options as chained builder calls.
    #[test]
    fn test_bytes_option_fast_flag_composition() {
        assert_eq!(
            BytesOptions::default().set_fast().set_stored(),
            (FAST | STORED).into()
        );
        assert_eq!(
            BytesOptions::default()
                .set_indexed()
                .set_fieldnorms()
                .set_fast(),
            (INDEXED | FAST).into()
        );
        assert_eq!(
            BytesOptions::default()
                .set_stored()
                .set_fieldnorms()
                .set_indexed(),
            (STORED | INDEXED).into()
        );
    }

    // Every flag is off by default and each setter turns its own flag on.
    #[test]
    fn test_bytes_option_fast_() {
        assert!(!BytesOptions::default().is_stored());
        assert!(!BytesOptions::default().is_fast());
        assert!(!BytesOptions::default().is_indexed());
        assert!(!BytesOptions::default().fieldnorms());
        assert!(BytesOptions::default().set_stored().is_stored());
        assert!(BytesOptions::default().set_fast().is_fast());
        assert!(BytesOptions::default().set_indexed().is_indexed());
        assert!(BytesOptions::default().set_fieldnorms().fieldnorms());
    }

    // Missing `fieldnorms` + indexed => fieldnorms defaults to true.
    #[test]
    fn test_bytes_options_deser_if_fieldnorm_missing_indexed_true() {
        let json = r#"{
            "indexed": true,
            "fast": false,
            "stored": false
        }"#;
        let bytes_options: BytesOptions = serde_json::from_str(json).unwrap();
        assert_eq!(
            &bytes_options,
            &BytesOptions {
                indexed: true,
                fieldnorms: true,
                fast: false,
                stored: false
            }
        );
    }

    // Missing `fieldnorms` + not indexed => fieldnorms defaults to false.
    #[test]
    fn test_bytes_options_deser_if_fieldnorm_missing_indexed_false() {
        let json = r#"{
            "indexed": false,
            "stored": false,
            "fast": false
        }"#;
        let bytes_options: BytesOptions = serde_json::from_str(json).unwrap();
        assert_eq!(
            &bytes_options,
            &BytesOptions {
                indexed: false,
                fieldnorms: false,
                fast: false,
                stored: false
            }
        );
    }

    // An explicit `fieldnorms: false` is kept even when the field is indexed.
    #[test]
    fn test_bytes_options_deser_if_fieldnorm_false_indexed_true() {
        let json = r#"{
            "indexed": true,
            "fieldnorms": false,
            "fast": false,
            "stored": false
        }"#;
        let bytes_options: BytesOptions = serde_json::from_str(json).unwrap();
        assert_eq!(
            &bytes_options,
            &BytesOptions {
                indexed: true,
                fieldnorms: false,
                fast: false,
                stored: false
            }
        );
    }

    // An explicit `fieldnorms: true` is kept even when the field is not indexed.
    #[test]
    fn test_bytes_options_deser_if_fieldnorm_true_indexed_false() {
        // this one is kind of useless, at least at the moment
        let json = r#"{
            "indexed": false,
            "fieldnorms": true,
            "fast": false,
            "stored": false
        }"#;
        let bytes_options: BytesOptions = serde_json::from_str(json).unwrap();
        assert_eq!(
            &bytes_options,
            &BytesOptions {
                indexed: false,
                fieldnorms: true,
                fast: false,
                stored: false
            }
        );
    }
}


================================================
FILE: src/schema/date_time_options.rs
================================================
use std::ops::BitOr;

pub use common::DateTimePrecision;
use serde::{Deserialize, Serialize};

use crate::schema::flags::{FastFlag, IndexedFlag, SchemaFlagList, StoredFlag};

/// The precision of the indexed date/time values in the inverted index.
///
/// This is fixed to seconds and is independent of the per-field precision stored in
/// `DateOptions`.
pub const DATE_TIME_PRECISION_INDEXED: DateTimePrecision = DateTimePrecision::Seconds;

/// Defines how DateTime field should be handled by tantivy.
#[derive(Clone, Debug, PartialEq, Eq, Serialize, Deserialize, Default)]
pub struct DateOptions {
    // Whether the field is indexed.
    indexed: bool,
    // This boolean has no effect if the field is not marked as indexed true.
    fieldnorms: bool,
    // Optional when deserializing: a missing attribute falls back to the default value.
    #[serde(default)]
    fast: bool,
    // Whether the field is stored.
    stored: bool,
    // Internal storage precision, used to optimize storage
    // compression on fast fields.
    // Optional when deserializing: a missing attribute falls back to the default precision.
    #[serde(default)]
    precision: DateTimePrecision,
}

impl DateOptions {
    /// Returns true iff the value is stored.
    #[inline]
    pub fn is_stored(&self) -> bool {
        self.stored
    }

    /// Returns true iff the value is indexed and therefore searchable.
    #[inline]
    pub fn is_indexed(&self) -> bool {
        self.indexed
    }

    /// Returns true iff the field has fieldnorm.
    ///
    /// The `fieldnorms` flag only counts for indexed fields: this returns `false` whenever
    /// the field is not indexed, whatever the value of the flag.
    #[inline]
    pub fn fieldnorms(&self) -> bool {
        self.fieldnorms && self.indexed
    }

    /// Returns true iff the value is a fast field.
    #[inline]
    pub fn is_fast(&self) -> bool {
        self.fast
    }

    /// Set the field as stored.
    ///
    /// Only the fields that are set as *stored* are
    /// persisted into the Tantivy's store.
    #[must_use]
    pub fn set_stored(mut self) -> DateOptions {
        self.stored = true;
        self
    }

    /// Set the field as indexed.
    ///
    /// Setting a date field as indexed will generate
    /// a posting list for each value taken by the field.
    ///
    /// This is required for the field to be searchable.
    #[must_use]
    pub fn set_indexed(mut self) -> DateOptions {
        self.indexed = true;
        self
    }

    /// Set the field with fieldnorm.
    ///
    /// Setting a date field as fieldnorm will generate
    /// the fieldnorm data for it.
    #[must_use]
    pub fn set_fieldnorm(mut self) -> DateOptions {
        self.fieldnorms = true;
        self
    }

    /// Set the field as a fast field.
    ///
    /// Fast fields are designed for random access.
    #[must_use]
    pub fn set_fast(mut self) -> DateOptions {
        self.fast = true;
        self
    }

    /// Sets the precision for this DateTime field on the fast field.
    /// Indexed precision is always [`DATE_TIME_PRECISION_INDEXED`].
    ///
    /// Internal storage precision, used to optimize storage
    /// compression on fast fields.
    // Like the other builder setters, this consumes `self`: discarding the returned value
    // silently loses the change, hence `#[must_use]`.
    #[must_use]
    pub fn set_precision(mut self, precision: DateTimePrecision) -> DateOptions {
        self.precision = precision;
        self
    }

    /// Returns the storage precision for this DateTime field.
    ///
    /// Internal storage precision, used to optimize storage
    /// compression on fast fields.
    pub fn get_precision(&self) -> DateTimePrecision {
        self.precision
    }
}

impl From<()> for DateOptions {
    fn from(_: ()) -> DateOptions {
        DateOptions::default()
    }
}

impl From<FastFlag> for DateOptions {
    fn from(_: FastFlag) -> Self {
        DateOptions {
            fast: true,
            ..Default::default()
        }
    }
}

impl From<StoredFlag> for DateOptions {
    fn from(_: StoredFlag) -> Self {
        DateOptions {
            stored: true,
            ..Default::default()
        }
    }
}

impl From<IndexedFlag> for DateOptions {
    fn from(_: IndexedFlag) -> Self {
        DateOptions {
            indexed: true,
            fieldnorms: true,
            ..Default::default()
        }
    }
}

impl<T: Into<DateOptions>> BitOr<T> for DateOptions {
    type Output = DateOptions;

    /// Merges two sets of options: a flag is set in the result if it is set on either side.
    ///
    /// The precision is always taken from the left-hand side; the precision of `other` is
    /// ignored.
    fn bitor(self, other: T) -> DateOptions {
        let rhs: DateOptions = other.into();
        DateOptions {
            indexed: self.indexed || rhs.indexed,
            fieldnorms: self.fieldnorms || rhs.fieldnorms,
            stored: self.stored || rhs.stored,
            fast: self.fast || rhs.fast,
            precision: self.precision,
        }
    }
}

impl<Head, Tail> From<SchemaFlagList<Head, Tail>> for DateOptions
where
    Head: Clone,
    Tail: Clone,
    Self: BitOr<Output = Self> + From<Head> + From<Tail>,
{
    /// Converts the head and the tail of the flag list separately, then merges both results
    /// with `|`.
    fn from(head_tail: SchemaFlagList<Head, Tail>) -> Self {
        let head_options = Self::from(head_tail.head);
        let tail_options = Self::from(head_tail.tail);
        head_options | tail_options
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    // `fast` and `precision` may be omitted; the result then equals the default options.
    #[test]
    fn test_date_options_consistent_with_default() {
        let date_time_options: DateOptions = serde_json::from_str(
            r#"{
            "indexed": false,
            "fieldnorms": false,
            "stored": false
        }"#,
        )
        .unwrap();
        assert_eq!(date_time_options, DateOptions::default());
    }

    // Serialization writes every attribute, including the ones omitted from the input.
    #[test]
    fn test_serialize_date_option() {
        let date_options = serde_json::from_str::<DateOptions>(
            r#"
            {
                "indexed": true,
                "fieldnorms": false,
                "stored": false,
                "precision": "milliseconds"
            }"#,
        )
        .unwrap();

        let date_options_json = serde_json::to_value(date_options).unwrap();
        assert_eq!(
            date_options_json,
            serde_json::json!({
                "precision": "milliseconds",
                "indexed": true,
                "fast": false,
                "fieldnorms": false,
                "stored": false
            })
        );
    }

    // Invalid attribute values are rejected with a descriptive error.
    #[test]
    fn test_deserialize_date_options_with_wrong_options() {
        // A non-boolean value for a boolean attribute.
        assert!(serde_json::from_str::<DateOptions>(
            r#"{
            "indexed": true,
            "fieldnorms": false,
            "stored": "wrong_value"
        }"#
        )
        .unwrap_err()
        .to_string()
        .contains("expected a boolean"));

        // An unknown precision variant.
        assert!(serde_json::from_str::<DateOptions>(
            r#"{
            "indexed": true,
            "fieldnorms": false,
            "stored": false,
            "precision": "hours"
        }"#
        )
        .unwrap_err()
        .to_string()
        .contains("unknown variant `hours`"));
    }
}


================================================
FILE: src/schema/document/de.rs
================================================
//! Document binary deserialization API
//!
//! The deserialization API is strongly inspired by serde's API but with
//! some tweaks, mostly around some of the types being concrete (errors)
//! and some more specific types being visited (Ips, datetime, etc...)
//!
//! The motivation behind this API is to provide a easy to implement and
//! efficient way of deserializing a potentially arbitrarily nested object.

use std::collections::{BTreeMap, HashMap};
use std::fmt::Display;
use std::io;
use std::io::Read;
use std::marker::PhantomData;
use std::net::Ipv6Addr;
use std::sync::Arc;

use columnar::MonotonicallyMappableToU128;
use common::{u64_to_f64, BinarySerializable, DateTime, VInt};

use super::se::BinaryObjectSerializer;
use super::{OwnedValue, Value};
use crate::schema::document::type_codes;
use crate::schema::{Facet, Field};
use crate::store::DocStoreVersion;
use crate::tokenizer::PreTokenizedString;

#[derive(Debug, thiserror::Error, Clone)]
/// An error which occurs while attempting to deserialize a given value
/// by using the provided value visitor.
pub enum DeserializeError {
    #[error("Unsupported Type: {0:?} cannot be deserialized from the given visitor")]
    /// The visitor does not support values of the given type.
    UnsupportedType(ValueType),
    #[error("Type Mismatch: Expected {expected:?} but found {actual:?}")]
    /// The type of the value that was read differs from the type that was expected.
    TypeMismatch {
        /// The expected value type.
        expected: ValueType,
        /// The actual value type read.
        actual: ValueType,
    },
    #[error("The value could not be read: {0}")]
    /// The value was unable to be read due to the error.
    ///
    /// The I/O error is kept behind an `Arc`, presumably so that this enum can derive `Clone`.
    CorruptedValue(Arc<io::Error>),
    #[error("{0}")]
    /// A custom error message.
    Custom(String),
    #[error("Version {0}, Max version supported: {1}")]
    /// Unsupported version error: the first value is the version that was found, the second
    /// one is the maximum supported version.
    UnsupportedVersion(u32, u32),
}

impl DeserializeError {
    /// Builds a [`DeserializeError::Custom`] whose message is the `Display` rendering of `msg`.
    pub fn custom(msg: impl Display) -> Self {
        let message = msg.to_string();
        Self::Custom(message)
    }
}

impl From<io::Error> for DeserializeError {
    fn from(error: io::Error) -> Self {
        Self::CorruptedValue(Arc::new(error))
    }
}

/// The core trait for deserializing a document.
///
/// An implementation builds `Self` from the entries exposed by a [`DocumentDeserializer`].
///
/// TODO: Improve docs
pub trait DocumentDeserialize: Sized {
    /// Attempts to deserialize Self from a given document deserializer.
    ///
    /// The deserializer is taken by value.
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: DocumentDeserializer<'de>;
}

/// A deserializer that can walk through each entry in the document.
pub trait DocumentDeserializer<'de> {
    /// An indicator as to how many values are in the document.
    ///
    /// This can be used to pre-allocate entries but should not
    /// be depended on as a fixed size.
    fn size_hint(&self) -> usize;

    /// Attempts to deserialize the next field in the document.
    ///
    /// On success this yields an optional `(Field, V)` pair, where the value has been
    /// deserialized as the requested [`ValueDeserialize`] type `V`.
    fn next_field<V: ValueDeserialize>(&mut self) -> Result<Option<(Field, V)>, DeserializeError>;
}

/// The core trait for deserializing values.
///
/// An implementation builds `Self` from a single value exposed by a [`ValueDeserializer`].
///
/// TODO: Improve docs
pub trait ValueDeserialize: Sized {
    /// Attempts to deserialize Self from a given value deserializer.
    ///
    /// The deserializer is taken by value.
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de>;
}

/// A value deserializer.
///
/// Every method takes `self` by value, so a deserializer can be used for one call only.
pub trait ValueDeserializer<'de> {
    /// Attempts to deserialize a null value from the deserializer.
    fn deserialize_null(self) -> Result<(), DeserializeError>;

    /// Attempts to deserialize a string value from the deserializer.
    fn deserialize_string(self) -> Result<String, DeserializeError>;

    /// Attempts to deserialize a u64 value from the deserializer.
    fn deserialize_u64(self) -> Result<u64, DeserializeError>;

    /// Attempts to deserialize an i64 value from the deserializer.
    fn deserialize_i64(self) -> Result<i64, DeserializeError>;

    /// Attempts to deserialize a f64 value from the deserializer.
    fn deserialize_f64(self) -> Result<f64, DeserializeError>;

    /// Attempts to deserialize a datetime value from the deserializer.
    fn deserialize_datetime(self) -> Result<DateTime, DeserializeError>;

    /// Attempts to deserialize a facet value from the deserializer.
    fn deserialize_facet(self) -> Result<Facet, DeserializeError>;

    /// Attempts to deserialize a bytes value from the deserializer.
    fn deserialize_bytes(self) -> Result<Vec<u8>, DeserializeError>;

    /// Attempts to deserialize an IP address value from the deserializer.
    ///
    /// The address is returned as an [`Ipv6Addr`].
    fn deserialize_ip_address(self) -> Result<Ipv6Addr, DeserializeError>;

    /// Attempts to deserialize a bool value from the deserializer.
    fn deserialize_bool(self) -> Result<bool, DeserializeError>;

    /// Attempts to deserialize a pre-tokenized string value from the deserializer.
    fn deserialize_pre_tokenized_string(self) -> Result<PreTokenizedString, DeserializeError>;

    /// Attempts to deserialize the value using a given visitor.
    ///
    /// The result is whatever value the visitor produces (`V::Value`).
    fn deserialize_any<V>(self, visitor: V) -> Result<V::Value, DeserializeError>
    where V: ValueVisitor;
}

#[derive(Debug, Copy, Clone, Eq, PartialEq)]
/// The type of the value attempting to be deserialized.
pub enum ValueType {
    /// A null value.
    Null,
    /// A string value.
    String,
    /// A u64 value.
    U64,
    /// An i64 value.
    I64,
    /// An f64 value.
    F64,
    /// A datetime value.
    DateTime,
    /// A facet value.
    Facet,
    /// A bytes value.
    Bytes,
    /// An IP address value.
    IpAddr,
    /// A boolean value.
    Bool,
    /// A pre-tokenized string value.
    PreTokStr,
    /// An array of values.
    Array,
    /// A dynamic object value.
    Object,
    /// A JSON object value. Deprecated.
    #[deprecated(note = "We keep this for backwards compatibility, use Object instead")]
    JSONObject,
}

/// A value visitor for deserializing a document value.
///
/// This is strongly inspired by serde but has a few extra types.
///
/// A deserializer calls exactly one `visit_*` method, picked according to the
/// type of the value it encountered. Every method has a default implementation
/// that rejects the value with [`DeserializeError::UnsupportedType`] carrying
/// the matching [`ValueType`], so an implementor only needs to override the
/// methods for the types it is able to handle.
pub trait ValueVisitor {
    /// The value produced by the visitor.
    type Value;

    #[inline]
    /// Called when the deserializer visits a null value.
    fn visit_null(&self) -> Result<Self::Value, DeserializeError> {
        Err(DeserializeError::UnsupportedType(ValueType::Null))
    }

    #[inline]
    /// Called when the deserializer visits a string value.
    fn visit_string(&self, _val: String) -> Result<Self::Value, DeserializeError> {
        Err(DeserializeError::UnsupportedType(ValueType::String))
    }

    #[inline]
    /// Called when the deserializer visits a u64 value.
    fn visit_u64(&self, _val: u64) -> Result<Self::Value, DeserializeError> {
        Err(DeserializeError::UnsupportedType(ValueType::U64))
    }

    #[inline]
    /// Called when the deserializer visits an i64 value.
    fn visit_i64(&self, _val: i64) -> Result<Self::Value, DeserializeError> {
        Err(DeserializeError::UnsupportedType(ValueType::I64))
    }

    #[inline]
    /// Called when the deserializer visits an f64 value.
    fn visit_f64(&self, _val: f64) -> Result<Self::Value, DeserializeError> {
        Err(DeserializeError::UnsupportedType(ValueType::F64))
    }

    #[inline]
    /// Called when the deserializer visits a bool value.
    fn visit_bool(&self, _val: bool) -> Result<Self::Value, DeserializeError> {
        Err(DeserializeError::UnsupportedType(ValueType::Bool))
    }

    #[inline]
    /// Called when the deserializer visits a datetime value.
    fn visit_datetime(&self, _val: DateTime) -> Result<Self::Value, DeserializeError> {
        Err(DeserializeError::UnsupportedType(ValueType::DateTime))
    }

    #[inline]
    /// Called when the deserializer visits an IP address value.
    fn visit_ip_address(&self, _val: Ipv6Addr) -> Result<Self::Value, DeserializeError> {
        Err(DeserializeError::UnsupportedType(ValueType::IpAddr))
    }

    #[inline]
    /// Called when the deserializer visits a facet value.
    fn visit_facet(&self, _val: Facet) -> Result<Self::Value, DeserializeError> {
        Err(DeserializeError::UnsupportedType(ValueType::Facet))
    }

    #[inline]
    /// Called when the deserializer visits a bytes value.
    fn visit_bytes(&self, _val: Vec<u8>) -> Result<Self::Value, DeserializeError> {
        Err(DeserializeError::UnsupportedType(ValueType::Bytes))
    }

    #[inline]
    /// Called when the deserializer visits a pre-tokenized string value.
    fn visit_pre_tokenized_string(
        &self,
        _val: PreTokenizedString,
    ) -> Result<Self::Value, DeserializeError> {
        Err(DeserializeError::UnsupportedType(ValueType::PreTokStr))
    }

    #[inline]
    /// Called when the deserializer visits an array.
    ///
    /// The elements are not deserialized up front: the visitor pulls them
    /// one by one out of `_access`.
    fn visit_array<'de, A>(&self, _access: A) -> Result<Self::Value, DeserializeError>
    where A: ArrayAccess<'de> {
        Err(DeserializeError::UnsupportedType(ValueType::Array))
    }

    #[inline]
    /// Called when the deserializer visits an object value.
    ///
    /// The key-value pairs are not deserialized up front: the visitor pulls
    /// them one by one out of `_access`.
    fn visit_object<'de, A>(&self, _access: A) -> Result<Self::Value, DeserializeError>
    where A: ObjectAccess<'de> {
        Err(DeserializeError::UnsupportedType(ValueType::Object))
    }
}

/// Access to a sequence of values which can be deserialized.
pub trait ArrayAccess<'de> {
    /// An indicator as to how many values are in the array.
    ///
    /// This can be used to pre-allocate entries but should not
    /// be depended on as a fixed size.
    fn size_hint(&self) -> usize;

    /// Attempts to deserialize the next element in the sequence.
    ///
    /// Returns `Ok(None)` once the sequence has no more elements.
    fn next_element<V: ValueDeserialize>(&mut self) -> Result<Option<V>, DeserializeError>;
}

/// Access to a sequence of key-value pairs (an object) which can be deserialized.
///
/// Keys are always `String`s; the type of the values is chosen by the caller
/// of [`ObjectAccess::next_entry`].
pub trait ObjectAccess<'de> {
    /// An indicator as to how many key-value pairs are in the object.
    ///
    /// This can be used to pre-allocate entries but should not
    /// be depended on as a fixed size.
    fn size_hint(&self) -> usize;

    /// Attempts to deserialize the next key-value pair in the object.
    ///
    /// Returns `Ok(None)` once the object has no more entries.
    fn next_entry<V: ValueDeserialize>(&mut self) -> Result<Option<(String, V)>, DeserializeError>;
}

/// The document deserializer used to read the tantivy documents serialized with
/// `BinarySerializable`.
///
/// This acts very similarly to serde's deserialize types and can incrementally
/// deserialize each field of the document from the provided reader (`R`).
///
/// TODO: Switch to slice instead?
pub struct BinaryDocumentDeserializer<'de, R> {
    /// Number of (field, value) entries in the document, as read from the
    /// leading `VInt` of the serialized document.
    length: usize,
    /// Number of entries that have been deserialized so far.
    position: usize,
    /// Version of the doc store format; forwarded to the value deserializers.
    doc_store_version: DocStoreVersion,
    /// The underlying reader the entries are pulled from.
    reader: &'de mut R,
}

impl<'de, R> BinaryDocumentDeserializer<'de, R>
where R: Read
{
    /// Builds a document deserializer on top of `reader`.
    ///
    /// The number of entries of the document is read eagerly (as a `VInt`)
    /// from the reader; the entries themselves are read lazily afterwards.
    pub(crate) fn from_reader(
        reader: &'de mut R,
        doc_store_version: DocStoreVersion,
    ) -> Result<Self, DeserializeError> {
        let num_entries = VInt::deserialize(reader)?.val() as usize;

        let deserializer = Self {
            length: num_entries,
            position: 0,
            doc_store_version,
            reader,
        };
        Ok(deserializer)
    }

    /// Tells whether every entry of the document has already been
    /// deserialized.
    fn is_complete(&self) -> bool {
        self.length <= self.position
    }
}

impl<'de, R> DocumentDeserializer<'de> for BinaryDocumentDeserializer<'de, R>
where R: Read
{
    /// Number of entries announced by the serialized document.
    #[inline]
    fn size_hint(&self) -> usize {
        self.length
    }

    /// Reads the next `(field, value)` entry of the document, or returns
    /// `Ok(None)` when all the entries have been consumed.
    fn next_field<V: ValueDeserialize>(&mut self) -> Result<Option<(Field, V)>, DeserializeError> {
        if self.is_complete() {
            return Ok(None);
        }

        // An entry is laid out as the field id followed by the tagged value.
        let field = Field::deserialize(self.reader)?;
        let value_deserializer =
            BinaryValueDeserializer::from_reader(self.reader, self.doc_store_version)?;
        let value = V::deserialize(value_deserializer)?;

        // Only count the entry once it has been read in full.
        self.position += 1;
        Ok(Some((field, value)))
    }
}

/// A single value deserializer that deserializes a value serialized with `BinarySerializable`.
///
/// The type code of the value is consumed from the reader when the
/// deserializer is created; the payload is read by whichever `deserialize_*`
/// method is subsequently called.
pub struct BinaryValueDeserializer<'de, R> {
    /// The type of the value, decoded from its type code.
    value_type: ValueType,
    /// The reader the payload of the value is read from.
    reader: &'de mut R,
    /// Version of the doc store format; selects the datetime encoding and is
    /// forwarded to nested array/object deserializers.
    doc_store_version: DocStoreVersion,
}

impl<'de, R> BinaryValueDeserializer<'de, R>
where R: Read
{
    /// Attempts to create a new value deserializer from a given reader.
    fn from_reader(
        reader: &'de mut R,
        doc_store_version: DocStoreVersion,
    ) -> Result<Self, DeserializeError> {
        let type_code = <u8 as BinarySerializable>::deserialize(reader)?;

        let value_type = match type_code {
            type_codes::TEXT_CODE => ValueType::String,
            type_codes::U64_CODE => ValueType::U64,
            type_codes::I64_CODE => ValueType::I64,
            type_codes::F64_CODE => ValueType::F64,
            type_codes::BOOL_CODE => ValueType::Bool,
            type_codes::DATE_CODE => ValueType::DateTime,
            type_codes::HIERARCHICAL_FACET_CODE => ValueType::Facet,
            type_codes::BYTES_CODE => ValueType::Bytes,
            type_codes::EXT_CODE => {
                let ext_type_code = <u8 as BinarySerializable>::deserialize(reader)?;

                match ext_type_code {
                    type_codes::TOK_STR_EXT_CODE => ValueType::PreTokStr,
                    _ => {
                        return Err(DeserializeError::from(io::Error::new(
                            io::ErrorKind::InvalidData,
                            format!(
                                "No extended field type is associated with code {ext_type_code:?}"
                            ),
                        )))
                    }
                }
            }
            type_codes::IP_CODE => ValueType::IpAddr,
            type_codes::NULL_CODE => ValueType::Null,
            type_codes::ARRAY_CODE => ValueType::Array,
            type_codes::OBJECT_CODE => ValueType::Object,
            #[expect(deprecated)]
            type_codes::JSON_OBJ_CODE => ValueType::JSONObject,
            _ => {
                return Err(DeserializeError::from(io::Error::new(
                    io::ErrorKind::InvalidData,
                    format!("No field type is associated with code {type_code:?}"),
                )))
            }
        };

        Ok(Self {
            value_type,
            reader,
            doc_store_version,
        })
    }

    fn validate_type(&self, expected_type: ValueType) -> Result<(), DeserializeError> {
        if self.value_type == expected_type {
            Ok(())
        } else {
            Err(DeserializeError::TypeMismatch {
                expected: expected_type,
                actual: self.value_type,
            })
        }
    }
}

impl<'de, R> ValueDeserializer<'de> for BinaryValueDeserializer<'de, R>
where R: Read
{
    /// Succeeds if the value is a null. A null has no payload, so nothing is
    /// read from the reader.
    fn deserialize_null(self) -> Result<(), DeserializeError> {
        self.validate_type(ValueType::Null)?;
        Ok(())
    }

    /// Reads a string payload, failing with a type mismatch if the value is
    /// not a string.
    fn deserialize_string(self) -> Result<String, DeserializeError> {
        self.validate_type(ValueType::String)?;
        <String as BinarySerializable>::deserialize(self.reader).map_err(DeserializeError::from)
    }

    /// Reads a `u64` payload, failing with a type mismatch if the value is
    /// not a `u64`.
    fn deserialize_u64(self) -> Result<u64, DeserializeError> {
        self.validate_type(ValueType::U64)?;
        <u64 as BinarySerializable>::deserialize(self.reader).map_err(DeserializeError::from)
    }

    /// Reads an `i64` payload, failing with a type mismatch if the value is
    /// not an `i64`.
    fn deserialize_i64(self) -> Result<i64, DeserializeError> {
        self.validate_type(ValueType::I64)?;
        <i64 as BinarySerializable>::deserialize(self.reader).map_err(DeserializeError::from)
    }

    /// Reads an `f64` payload, failing with a type mismatch if the value is
    /// not an `f64`.
    ///
    /// The float is stored as a `u64` and converted back with `u64_to_f64`.
    fn deserialize_f64(self) -> Result<f64, DeserializeError> {
        self.validate_type(ValueType::F64)?;
        <u64 as BinarySerializable>::deserialize(self.reader)
            .map(u64_to_f64)
            .map_err(DeserializeError::from)
    }

    /// Reads a datetime payload, failing with a type mismatch if the value is
    /// not a datetime.
    ///
    /// The payload is an `i64` timestamp whose unit depends on the doc store
    /// version: microseconds for `V1`, nanoseconds for `V2`.
    fn deserialize_datetime(self) -> Result<DateTime, DeserializeError> {
        self.validate_type(ValueType::DateTime)?;
        match self.doc_store_version {
            DocStoreVersion::V1 => {
                let timestamp_micros = <i64 as BinarySerializable>::deserialize(self.reader)?;
                Ok(DateTime::from_timestamp_micros(timestamp_micros))
            }
            DocStoreVersion::V2 => {
                let timestamp_nanos = <i64 as BinarySerializable>::deserialize(self.reader)?;
                Ok(DateTime::from_timestamp_nanos(timestamp_nanos))
            }
        }
    }

    /// Reads a facet payload, failing with a type mismatch if the value is
    /// not a facet.
    fn deserialize_facet(self) -> Result<Facet, DeserializeError> {
        self.validate_type(ValueType::Facet)?;
        <Facet as BinarySerializable>::deserialize(self.reader).map_err(DeserializeError::from)
    }

    /// Reads a bytes payload, failing with a type mismatch if the value is
    /// not a bytes value.
    fn deserialize_bytes(self) -> Result<Vec<u8>, DeserializeError> {
        self.validate_type(ValueType::Bytes)?;
        <Vec<u8> as BinarySerializable>::deserialize(self.reader).map_err(DeserializeError::from)
    }

    /// Reads an IP address payload, failing with a type mismatch if the value
    /// is not an IP address.
    ///
    /// The address is stored as a `u128` and converted with
    /// `Ipv6Addr::from_u128`.
    fn deserialize_ip_address(self) -> Result<Ipv6Addr, DeserializeError> {
        self.validate_type(ValueType::IpAddr)?;
        <u128 as BinarySerializable>::deserialize(self.reader)
            .map(Ipv6Addr::from_u128)
            .map_err(DeserializeError::from)
    }

    /// Reads a bool payload, failing with a type mismatch if the value is
    /// not a bool.
    fn deserialize_bool(self) -> Result<bool, DeserializeError> {
        self.validate_type(ValueType::Bool)?;
        <bool as BinarySerializable>::deserialize(self.reader).map_err(DeserializeError::from)
    }

    /// Reads a pre-tokenized string payload, failing with a type mismatch if
    /// the value is not a pre-tokenized string.
    fn deserialize_pre_tokenized_string(self) -> Result<PreTokenizedString, DeserializeError> {
        self.validate_type(ValueType::PreTokStr)?;
        <PreTokenizedString as BinarySerializable>::deserialize(self.reader)
            .map_err(DeserializeError::from)
    }

    /// Deserializes the value, whatever its type, and hands it to the
    /// `visit_*` method of `visitor` that matches the type.
    ///
    /// Leaf values are fully read before the visitor is called. Arrays and
    /// objects are handed over as lazy accessors that the visitor drains
    /// itself.
    fn deserialize_any<V>(self, visitor: V) -> Result<V::Value, DeserializeError>
    where V: ValueVisitor {
        match self.value_type {
            ValueType::Null => visitor.visit_null(),
            ValueType::String => {
                let val = self.deserialize_string()?;
                visitor.visit_string(val)
            }
            ValueType::U64 => {
                let val = self.deserialize_u64()?;
                visitor.visit_u64(val)
            }
            ValueType::I64 => {
                let val = self.deserialize_i64()?;
                visitor.visit_i64(val)
            }
            ValueType::F64 => {
                let val = self.deserialize_f64()?;
                visitor.visit_f64(val)
            }
            ValueType::DateTime => {
                let val = self.deserialize_datetime()?;
                visitor.visit_datetime(val)
            }
            ValueType::Facet => {
                let val = self.deserialize_facet()?;
                visitor.visit_facet(val)
            }
            ValueType::Bytes => {
                let val = self.deserialize_bytes()?;
                visitor.visit_bytes(val)
            }
            ValueType::IpAddr => {
                let val = self.deserialize_ip_address()?;
                visitor.visit_ip_address(val)
            }
            ValueType::Bool => {
                let val = self.deserialize_bool()?;
                visitor.visit_bool(val)
            }
            ValueType::PreTokStr => {
                let val = self.deserialize_pre_tokenized_string()?;
                visitor.visit_pre_tokenized_string(val)
            }
            ValueType::Array => {
                let access =
                    BinaryArrayDeserializer::from_reader(self.reader, self.doc_store_version)?;
                visitor.visit_array(access)
            }
            ValueType::Object => {
                let access =
                    BinaryObjectDeserializer::from_reader(self.reader, self.doc_store_version)?;
                visitor.visit_object(access)
            }
            // The deprecated variant still has to be handled to read old data.
            #[allow(deprecated)]
            ValueType::JSONObject => {
                // This is a compatibility layer
                // The implementation is slow, but is temporary anyways
                //
                // The legacy payload is raw JSON text: parse it, re-encode it
                // in the current binary object format into a temporary buffer,
                // then deserialize that buffer through the regular object path.
                let mut de = serde_json::Deserializer::from_reader(self.reader);
                let json_map =
                    <serde_json::Map<String, serde_json::Value> as serde::Deserialize>::deserialize(
                        &mut de,
                    )
                    .map_err(|err| DeserializeError::Custom(err.to_string()))?;
                let mut out = Vec::new();
                let mut serializer = BinaryObjectSerializer::begin(json_map.len(), &mut out)?;
                for (key, val) in json_map {
                    let val: OwnedValue = val.into();
                    serializer.serialize_entry(&key, (&val).as_value())?;
                }
                serializer.end()?;

                // `&[u8]` implements `Read`, so the buffer can be read in place.
                let mut slice: &[u8] = out.as_slice();
                let access =
                    BinaryObjectDeserializer::from_reader(&mut slice, self.doc_store_version)?;

                visitor.visit_object(access)
            }
        }
    }
}

/// A deserializer for an array of values serialized with `BinarySerializable`.
///
/// The number of elements is read when the deserializer is created; the
/// elements themselves are read lazily, one per call to
/// [`ArrayAccess::next_element`].
pub struct BinaryArrayDeserializer<'de, R> {
    /// Number of elements in the array, as read from its leading `VInt`.
    length: usize,
    /// Number of elements that have been deserialized so far.
    position: usize,
    /// The reader the elements are pulled from.
    reader: &'de mut R,
    /// Version of the doc store format; forwarded to the element deserializers.
    doc_store_version: DocStoreVersion,
}

impl<'de, R> BinaryArrayDeserializer<'de, R>
where R: Read
{
    /// Builds an array deserializer on top of `reader`.
    ///
    /// The number of elements is read eagerly (as a `VInt`) from the reader.
    fn from_reader(
        reader: &'de mut R,
        doc_store_version: DocStoreVersion,
    ) -> Result<Self, DeserializeError> {
        let num_elements = <VInt as BinarySerializable>::deserialize(reader)?.val() as usize;

        let deserializer = Self {
            length: num_elements,
            position: 0,
            reader,
            doc_store_version,
        };
        Ok(deserializer)
    }

    /// Tells whether every element of the array has already been
    /// deserialized.
    fn is_complete(&self) -> bool {
        self.length <= self.position
    }
}

impl<'de, R> ArrayAccess<'de> for BinaryArrayDeserializer<'de, R>
where R: Read
{
    /// Number of elements announced by the serialized array.
    #[inline]
    fn size_hint(&self) -> usize {
        self.length
    }

    /// Reads the next element of the array, or returns `Ok(None)` when all
    /// the elements have been consumed.
    fn next_element<V: ValueDeserialize>(&mut self) -> Result<Option<V>, DeserializeError> {
        if self.is_complete() {
            return Ok(None);
        }

        let element_deserializer =
            BinaryValueDeserializer::from_reader(self.reader, self.doc_store_version)?;
        let element = V::deserialize(element_deserializer)?;

        // Only count the element once it has been read in full.
        self.position += 1;
        Ok(Some(element))
    }
}

/// A deserializer for an object consisting of key-value pairs.
///
/// It is a thin wrapper over [`BinaryArrayDeserializer`] that reads the
/// elements two at a time.
pub struct BinaryObjectDeserializer<'de, R> {
    /// The inner deserializer.
    ///
    /// Internally an object is just represented by an array
    /// in the format of `[key, value, key, value, key, value]`.
    inner: BinaryArrayDeserializer<'de, R>,
}

impl<'de, R> BinaryObjectDeserializer<'de, R>
where R: Read
{
    /// Builds an object deserializer on top of `reader`.
    ///
    /// This simply wraps an array deserializer created from the same reader.
    fn from_reader(
        reader: &'de mut R,
        doc_store_version: DocStoreVersion,
    ) -> Result<Self, DeserializeError> {
        BinaryArrayDeserializer::from_reader(reader, doc_store_version)
            .map(|inner| Self { inner })
    }
}

impl<'de, R> ObjectAccess<'de> for BinaryObjectDeserializer<'de, R>
where R: Read
{
    #[inline]
    /// A indicator as to how many values are in the object.
    ///
    /// This can be used to pre-allocate entries but should not
    /// be depended on as a fixed size.
    fn size_hint(&self) -> usize {
        // We divide by 2 here as we know our elements are going to be
        // in the format of `[key, value, key, value, key, value]`.
        self.inner.size_hint() / 2
    }

    /// Attempts to deserialize the next key-value pair in the object.
    fn next_entry<V: ValueDeserialize>(&mut self) -> Result<Option<(String, V)>, DeserializeError> {
        if self.inner.is_complete() {
            return Ok(None);
        }

        let key = self.inner.next_element::<String>()?.expect(
            "Deserializer should not be empty as it is not marked as complete, this is a bug",
        );
        let value = self.inner.next_element::<V>()?.expect(
            "Deserializer should not be empty as it is not marked as complete, this is a bug",
        );

        Ok(Some((key, value)))
    }
}

// Core type implementations

impl ValueDeserialize for String {
    /// Reads the value as a string.
    #[inline]
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de> {
        D::deserialize_string(deserializer)
    }
}

impl ValueDeserialize for u64 {
    /// Reads the value as a `u64`.
    #[inline]
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de> {
        D::deserialize_u64(deserializer)
    }
}

impl ValueDeserialize for i64 {
    /// Reads the value as an `i64`.
    #[inline]
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de> {
        D::deserialize_i64(deserializer)
    }
}

impl ValueDeserialize for f64 {
    /// Reads the value as an `f64`.
    #[inline]
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de> {
        D::deserialize_f64(deserializer)
    }
}

impl ValueDeserialize for DateTime {
    /// Reads the value as a datetime.
    #[inline]
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de> {
        D::deserialize_datetime(deserializer)
    }
}

impl ValueDeserialize for Ipv6Addr {
    /// Reads the value as an IP address.
    #[inline]
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de> {
        D::deserialize_ip_address(deserializer)
    }
}

impl ValueDeserialize for Facet {
    /// Reads the value as a facet.
    #[inline]
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de> {
        D::deserialize_facet(deserializer)
    }
}

impl ValueDeserialize for Vec<u8> {
    /// Reads the value as a bytes value.
    #[inline]
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de> {
        D::deserialize_bytes(deserializer)
    }
}

impl ValueDeserialize for PreTokenizedString {
    /// Reads the value as a pre-tokenized string.
    #[inline]
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de> {
        D::deserialize_pre_tokenized_string(deserializer)
    }
}

// Collections kind of suck, but can't think of a nicer way of doing this generically
// without quite literally cloning serde entirely...

/// Visitor collecting the elements of an array into a `Vec<T>`.
struct VecVisitor<T: ValueDeserialize>(PhantomData<T>);
impl<T: ValueDeserialize> ValueVisitor for VecVisitor<T> {
    type Value = Vec<T>;

    /// Drains `access` into a vector, deserializing each element as a `T`.
    fn visit_array<'de, A>(&self, mut access: A) -> Result<Self::Value, DeserializeError>
    where A: ArrayAccess<'de> {
        // The size hint comes straight from the serialized data and must not
        // be trusted blindly. Cap the up-front allocation so that a corrupted
        // length cannot trigger a huge allocation; the vector still grows as
        // needed while elements are actually read.
        const MAX_PREALLOC_BYTES: usize = 1024 * 1024;
        let element_size = std::mem::size_of::<T>().max(1);
        let capacity = access.size_hint().min(MAX_PREALLOC_BYTES / element_size);

        let mut entries = Vec::with_capacity(capacity);
        while let Some(value) = access.next_element()? {
            entries.push(value);
        }
        Ok(entries)
    }
}
impl<T: ValueDeserialize> ValueDeserialize for Vec<T> {
    /// Reads the value as an array whose elements are all of type `T`.
    #[inline]
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de> {
        let visitor = VecVisitor::<T>(PhantomData);
        deserializer.deserialize_any(visitor)
    }
}

/// Visitor collecting the entries of an object into a `BTreeMap<String, T>`.
struct BTreeMapVisitor<T: ValueDeserialize>(PhantomData<T>);
impl<T: ValueDeserialize> ValueVisitor for BTreeMapVisitor<T> {
    type Value = BTreeMap<String, T>;

    /// Drains `access` into a map, deserializing each value as a `T`.
    ///
    /// If a key appears several times, the last occurrence wins.
    fn visit_object<'de, A>(&self, mut access: A) -> Result<Self::Value, DeserializeError>
    where A: ObjectAccess<'de> {
        let mut map = BTreeMap::new();
        loop {
            match access.next_entry()? {
                Some((name, item)) => {
                    map.insert(name, item);
                }
                None => return Ok(map),
            }
        }
    }
}
impl<T: ValueDeserialize> ValueDeserialize for BTreeMap<String, T> {
    /// Reads the value as an object whose values are all of type `T`.
    #[inline]
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de> {
        let visitor = BTreeMapVisitor::<T>(PhantomData);
        deserializer.deserialize_any(visitor)
    }
}

/// Visitor collecting the entries of an object into a `HashMap<String, T>`.
struct HashMapVisitor<T: ValueDeserialize>(PhantomData<T>);
impl<T: ValueDeserialize> ValueVisitor for HashMapVisitor<T> {
    type Value = HashMap<String, T>;

    /// Drains `access` into a map, deserializing each value as a `T`.
    ///
    /// If a key appears several times, the last occurrence wins.
    fn visit_object<'de, A>(&self, mut access: A) -> Result<Self::Value, DeserializeError>
    where A: ObjectAccess<'de> {
        // The size hint comes straight from the serialized data and must not
        // be trusted blindly. Cap the up-front allocation so that a corrupted
        // length cannot trigger a huge allocation; the map still grows as
        // needed while entries are actually read.
        const MAX_PREALLOC_BYTES: usize = 1024 * 1024;
        let entry_size = std::mem::size_of::<(String, T)>().max(1);
        let capacity = access.size_hint().min(MAX_PREALLOC_BYTES / entry_size);

        let mut entries = HashMap::with_capacity(capacity);
        while let Some((key, value)) = access.next_entry()? {
            entries.insert(key, value);
        }
        Ok(entries)
    }
}
impl<T: ValueDeserialize> ValueDeserialize for HashMap<String, T> {
    /// Reads the value as an object whose values are all of type `T`.
    #[inline]
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de> {
        let visitor = HashMapVisitor::<T>(PhantomData);
        deserializer.deserialize_any(visitor)
    }
}

/// Visitor collecting the entries of an object into a `Vec<(String, T)>`,
/// in the order in which they are read.
struct KeyValuesVecVisitor<T: ValueDeserialize>(PhantomData<T>);
impl<T: ValueDeserialize> ValueVisitor for KeyValuesVecVisitor<T> {
    type Value = Vec<(String, T)>;

    /// Drains `access` into a vector of key-value pairs, deserializing each
    /// value as a `T`. Duplicate keys are all kept.
    fn visit_object<'de, A>(&self, mut access: A) -> Result<Self::Value, DeserializeError>
    where A: ObjectAccess<'de> {
        // The size hint comes straight from the serialized data and must not
        // be trusted blindly. Cap the up-front allocation so that a corrupted
        // length cannot trigger a huge allocation; the vector still grows as
        // needed while entries are actually read.
        const MAX_PREALLOC_BYTES: usize = 1024 * 1024;
        let entry_size = std::mem::size_of::<(String, T)>().max(1);
        let capacity = access.size_hint().min(MAX_PREALLOC_BYTES / entry_size);

        let mut entries = Vec::with_capacity(capacity);
        while let Some(entry) = access.next_entry()? {
            entries.push(entry);
        }
        Ok(entries)
    }
}
impl<T: ValueDeserialize> ValueDeserialize for Vec<(String, T)> {
    /// Reads the value as an object, keeping its entries as an ordered list
    /// of key-value pairs whose values are all of type `T`.
    #[inline]
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de> {
        let visitor = KeyValuesVecVisitor::<T>(PhantomData);
        deserializer.deserialize_any(visitor)
    }
}

#[cfg(test)]
mod tests {
    use std::io::Cursor;

    use serde_json::Number;
    use tokenizer_api::Token;

    use super::*;
    use crate::schema::document::existing_type_impls::JsonObjectIter;
    use crate::schema::document::se::BinaryValueSerializer;
    use crate::schema::document::{ReferenceValue, ReferenceValueLeaf};
    use crate::store::DOC_STORE_VERSION;

    /// Serializes a value backed by `serde_json::Value` with the binary value
    /// serializer and returns the produced bytes.
    fn serialize_value<'a>(value: ReferenceValue<'a, &'a serde_json::Value>) -> Vec<u8> {
        let mut writer = Vec::new();

        let mut serializer = BinaryValueSerializer::new(&mut writer);
        serializer.serialize_value(value).expect("Serialize value");

        writer
    }

    /// Serializes a value backed by `OwnedValue` with the binary value
    /// serializer and returns the produced bytes.
    fn serialize_owned_value<'a>(value: ReferenceValue<'a, &'a OwnedValue>) -> Vec<u8> {
        let mut writer = Vec::new();

        let mut serializer = BinaryValueSerializer::new(&mut writer);
        serializer.serialize_value(value).expect("Serialize value");

        writer
    }

    /// Deserializes `buffer` into an `OwnedValue` using the binary value
    /// deserializer and the current doc store version.
    fn deserialize_value(buffer: Vec<u8>) -> crate::schema::OwnedValue {
        let mut cursor = Cursor::new(buffer);
        let deserializer =
            BinaryValueDeserializer::from_reader(&mut cursor, DOC_STORE_VERSION).unwrap();
        crate::schema::OwnedValue::deserialize(deserializer).expect("Deserialize value")
    }

    // Round-trips each kind of leaf value through the binary serializer and
    // deserializer and checks that the value comes back unchanged.
    #[test]
    fn test_simple_value_serialize() {
        // Null
        let result = serialize_value(ReferenceValueLeaf::Null.into());
        let value = deserialize_value(result);
        assert_eq!(value, crate::schema::OwnedValue::Null);

        // String
        let result = serialize_value(ReferenceValueLeaf::Str("hello, world").into());
        let value = deserialize_value(result);
        assert_eq!(
            value,
            crate::schema::OwnedValue::Str(String::from("hello, world"))
        );

        // Numeric types
        let result = serialize_value(ReferenceValueLeaf::U64(123).into());
        let value = deserialize_value(result);
        assert_eq!(value, crate::schema::OwnedValue::U64(123));

        let result = serialize_value(ReferenceValueLeaf::I64(-123).into());
        let value = deserialize_value(result);
        assert_eq!(value, crate::schema::OwnedValue::I64(-123));

        let result = serialize_value(ReferenceValueLeaf::F64(123.3845).into());
        let value = deserialize_value(result);
        assert_eq!(value, crate::schema::OwnedValue::F64(123.3845));

        // Bool
        let result = serialize_value(ReferenceValueLeaf::Bool(false).into());
        let value = deserialize_value(result);
        assert_eq!(value, crate::schema::OwnedValue::Bool(false));

        // Datetime
        let result =
            serialize_value(ReferenceValueLeaf::Date(DateTime::from_timestamp_micros(100)).into());
        let value = deserialize_value(result);
        assert_eq!(
            value,
            crate::schema::OwnedValue::Date(DateTime::from_timestamp_micros(100))
        );

        // Facet
        let facet = Facet::from_text("/hello/world").unwrap();
        let result = serialize_value(ReferenceValueLeaf::Facet(facet.encoded_str()).into());
        let value = deserialize_value(result);
        assert_eq!(value, crate::schema::OwnedValue::Facet(facet));

        // Pre-tokenized string
        let pre_tok_str = PreTokenizedString {
            text: "hello, world".to_string(),
            tokens: vec![Token::default(), Token::default()],
        };
        let result =
            serialize_value(ReferenceValueLeaf::PreTokStr(pre_tok_str.clone().into()).into());
        let value = deserialize_value(result);
        assert_eq!(value, crate::schema::OwnedValue::PreTokStr(pre_tok_str));
    }

    // Round-trips arrays through the binary serializer and deserializer.
    #[test]
    fn test_array_serialize() {
        // Array of nulls.
        let elements = [serde_json::Value::Null, serde_json::Value::Null];
        let result = serialize_value(ReferenceValue::Array(elements.iter()));
        let value = deserialize_value(result);
        assert_eq!(
            value,
            crate::schema::OwnedValue::Array(vec![
                crate::schema::OwnedValue::Null,
                crate::schema::OwnedValue::Null,
            ]),
        );

        // Array of strings.
        let elements = [
            serde_json::Value::String("Hello, world".into()),
            serde_json::Value::String("Some demo".into()),
        ];
        let result = serialize_value(ReferenceValue::Array(elements.iter()));
        let value = deserialize_value(result);
        assert_eq!(
            value,
            crate::schema::OwnedValue::Array(vec![
                crate::schema::OwnedValue::Str(String::from("Hello, world")),
                crate::schema::OwnedValue::Str(String::from("Some demo")),
            ]),
        );

        // Empty array.
        let elements = [];
        let result = serialize_value(ReferenceValue::Array(elements.iter()));
        let value = deserialize_value(result);
        assert_eq!(value, crate::schema::OwnedValue::Array(vec![]));

        // Array mixing several value types; the JSON integer comes back as an i64.
        let elements = [
            serde_json::Value::Null,
            serde_json::Value::String("Hello, world".into()),
            serde_json::Value::Number(12345.into()),
        ];
        let result = serialize_value(ReferenceValue::Array(elements.iter()));
        let value = deserialize_value(result);
        assert_eq!(
            value,
            crate::schema::OwnedValue::Array(vec![
                crate::schema::OwnedValue::Null,
                crate::schema::OwnedValue::Str(String::from("Hello, world")),
                crate::schema::OwnedValue::I64(12345),
            ]),
        );
    }

    // Round-trips objects through the binary serializer and deserializer.
    #[test]
    fn test_object_serialize() {
        // Object mixing several value types; the JSON float comes back as an f64.
        let mut object = serde_json::Map::new();
        object.insert(
            "my-first-key".into(),
            serde_json::Value::String("Hello".into()),
        );
        object.insert("my-second-key".into(), serde_json::Value::Null);
        object.insert(
            "my-third-key".into(),
            serde_json::Value::Number(Number::from_f64(123.0).unwrap()),
        );
        let result = serialize_value(ReferenceValue::Object(JsonObjectIter(object.iter())));
        let value = deserialize_value(result);

        let mut expected_object = BTreeMap::new();
        expected_object.insert(
            "my-first-key".to_string(),
            crate::schema::OwnedValue::Str(String::from("Hello")),
        );
        expected_object.insert("my-second-key".to_string(), crate::schema::OwnedValue::Null);
        expected_object.insert(
            "my-third-key".to_string(),
            crate::schema::OwnedValue::F64(123.0),
        );
        assert_eq!(
            value,
            crate::schema::OwnedValue::Object(expected_object.into_iter().collect())
        );

        // Empty object.
        let object = serde_json::Map::new();
        let result = serialize_value(ReferenceValue::Object(JsonObjectIter(object.iter())));
        let value = deserialize_value(result);
        let expected_object = BTreeMap::new();
        assert_eq!(
            value,
            crate::schema::OwnedValue::Object(expected_object.into_iter().collect())
        );

        // Object whose values are all null.
        let mut object = serde_json::Map::new();
        object.insert("my-first-key".into(), serde_json::Value::Null);
        object.insert("my-second-key".into(), serde_json::Value::Null);
        object.insert("my-third-key".into(), serde_json::Value::Null);
        let result = serialize_value(ReferenceValue::Object(JsonObjectIter(object.iter())));
        let value = deserialize_value(result);
        let mut expected_object = BTreeMap::new();
        expected_object.insert("my-first-key".to_string(), crate::schema::OwnedValue::Null);
        expected_object.insert("my-second-key".to_string(), crate::schema::OwnedValue::Null);
        expected_object.insert("my-third-key".to_string(), crate::schema::OwnedValue::Null);
        assert_eq!(
            value,
            crate::schema::OwnedValue::Object(expected_object.into_iter().collect())
        );
    }

    // Checks that a value stored as raw JSON text can still be deserialized.
    #[test]
    fn test_json_compat() {
        // After the leading byte (presumably the legacy JSON object type code
        // -- TODO confirm against `type_codes`), the bytes are the ASCII text
        // `{"keya:":"blub","vals":{"hey":"ho"}}`.
        let data = [
            8, 123, 34, 107, 101, 121, 97, 58, 34, 58, 34, 98, 108, 117, 98, 34, 44, 34, 118, 97,
            108, 115, 34, 58, 123, 34, 104, 101, 121, 34, 58, 34, 104, 111, 34, 125, 125,
        ]
        .to_vec();
        let expected = json!({
            "keya:": "blub",
            "vals": {
                "hey": "ho"
            }
        });
        let expected_val: OwnedValue = expected.clone().into();

        let value = deserialize_value(data);
        assert_eq!(value, expected_val);
    }

    // Checks that a date nested inside an object keeps its nanosecond
    // precision through a round trip.
    #[test]
    fn test_nested_date_precision() {
        // 323456 ns is not a whole number of microseconds, so any truncation
        // to a coarser precision would make the comparison below fail.
        let object = OwnedValue::Object(vec![(
            "my-date".into(),
            OwnedValue::Date(DateTime::from_timestamp_nanos(323456)),
        )]);
        let result = serialize_owned_value((&object).as_value());
        let value = deserialize_value(result);
        assert_eq!(value, object);
    }

    // Round-trips objects containing nested arrays and objects.
    #[test]
    fn test_nested_serialize() {
        // An object holding both an array and another object.
        let mut object = serde_json::Map::new();
        object.insert(
            "my-array".into(),
            serde_json::Value::Array(vec![
                serde_json::Value::Null,
                serde_json::Value::String(String::from("bobby of the sea")),
            ]),
        );
        object.insert(
            "my-object".into(),
            serde_json::Value::Object(
                vec![
                    (
                        "inner-1".to_string(),
                        serde_json::Value::Number((-123i64).into()),
                    ),
                    (
                        "inner-2".to_string(),
                        serde_json::Value::String(String::from("bobby of the sea 2")),
                    ),
                ]
                .into_iter()
                .collect(),
            ),
        );
        let result = serialize_value(ReferenceValue::Object(JsonObjectIter(object.iter())));
        let value = deserialize_value(result);

        let mut expected_object = BTreeMap::new();
        expected_object.insert(
            "my-array".to_string(),
            crate::schema::OwnedValue::Array(vec![
                crate::schema::OwnedValue::Null,
                crate::schema::OwnedValue::Str(String::from("bobby of the sea")),
            ]),
        );
        expected_object.insert(
            "my-object".to_string(),
            crate::schema::OwnedValue::Object(
                vec![
                    (
                        "inner-1".to_string(),
                        crate::schema::OwnedValue::I64(-123i64),
                    ),
                    (
                        "inner-2".to_string(),
                        crate::schema::OwnedValue::Str(String::from("bobby of the sea 2")),
                    ),
                ]
                .into_iter()
                .collect(),
            ),
        );
        assert_eq!(
            value,
            crate::schema::OwnedValue::Object(expected_object.into_iter().collect())
        );

        // Some more extreme nesting that might behave weirdly
        // (arrays nested three levels deep, including an empty one).
        let mut object = serde_json::Map::new();
        object.insert(
            "my-array".into(),
            serde_json::Value::Array(vec![serde_json::Value::Array(vec![
                serde_json::Value::Array(vec![]),
                serde_json::Value::Array(vec![serde_json::Value::Null]),
            ])]),
        );
        let result = serialize_value(ReferenceValue::Object(JsonObjectIter(object.iter())));
        let value = deserialize_value(result);

        let mut expected_object = BTreeMap::new();
        expected_object.insert(
            "my-array".to_string(),
            OwnedValue::Array(vec![OwnedValue::Array(vec![
                OwnedValue::Array(vec![]),
                OwnedValue::Array(vec![OwnedValue::Null]),
            ])]),
        );
        assert_eq!(
            value,
            OwnedValue::Object(expected_object.into_iter().collect())
        );
    }
}


================================================
FILE: src/schema/document/default_document.rs
================================================
use std::collections::{BTreeMap, HashMap, HashSet};
use std::io::{self, Read, Write};
use std::net::Ipv6Addr;

use columnar::MonotonicallyMappableToU128;
use common::{read_u32_vint_no_advance, serialize_vint_u32, BinarySerializable, DateTime, VInt};
use serde_json::Map;
pub use CompactDoc as TantivyDocument;

use super::{ReferenceValue, ReferenceValueLeaf, Value};
use crate::schema::document::{
    DeserializeError, Document, DocumentDeserialize, DocumentDeserializer,
};
use crate::schema::field_type::ValueParsingError;
use crate::schema::{Facet, Field, NamedFieldDocument, OwnedValue, Schema};
use crate::tokenizer::PreTokenizedString;

#[repr(C, packed)]
#[derive(Debug, Clone)]
/// A (field, value) pair in the compact tantivy document.
///
/// Only the type and location of the value are stored here; the payload itself lives in
/// `CompactDoc::node_data` (or is inlined into the address for null and bool values).
struct FieldValueAddr {
    /// Field id, narrowed to `u16` by the `add_*` methods of `CompactDoc`.
    pub field: u16,
    /// Type and address of the value that belongs to `field`.
    pub value_addr: ValueAddr,
}

#[derive(Debug, Clone)]
/// The default document in tantivy. It encodes data in a compact form.
///
/// All payloads are appended to a single byte buffer, and values are referred to by their
/// offset into that buffer.
pub struct CompactDoc {
    /// `node_data` is a vec of bytes, where each value is serialized into bytes and stored. It
    /// includes all the data of the document and also metadata like where the nodes are located
    /// in an object or array.
    pub node_data: Vec<u8>,
    /// The root (Field, Value) pairs, in insertion order.
    field_values: Vec<FieldValueAddr>,
}

impl Default for CompactDoc {
    /// Returns an empty document; identical to [`CompactDoc::new`].
    fn default() -> Self {
        Self::new()
    }
}

impl CompactDoc {
    /// Creates a new, empty document object.
    ///
    /// `bytes` is the capacity reserved up front for `node_data`, i.e. for the total serialized
    /// data of the document. Room for 4 root field values is reserved as well.
    pub fn with_capacity(bytes: usize) -> CompactDoc {
        CompactDoc {
            node_data: Vec::with_capacity(bytes),
            field_values: Vec::with_capacity(4),
        }
    }

    /// Creates a new, empty document object with 1024 bytes reserved for the serialized data.
    pub fn new() -> CompactDoc {
        CompactDoc::with_capacity(1024)
    }

    /// Shrinks the capacity of the document to fit the data.
    ///
    /// Both the serialized data buffer and the list of root field values are shrunk.
    pub fn shrink_to_fit(&mut self) {
        self.node_data.shrink_to_fit();
        self.field_values.shrink_to_fit();
    }

    /// Returns the length of the document, i.e. the number of root (field, value) pairs.
    ///
    /// A field that was added several times is counted once per added value.
    pub fn len(&self) -> usize {
        self.field_values.len()
    }

    /// Adds a facet to the document.
    ///
    /// `path` is anything a `Facet` can be built from; the facet's encoded string is what gets
    /// stored.
    pub fn add_facet<F>(&mut self, field: Field, path: F)
    where Facet: From<F> {
        let facet = Facet::from(path);
        self.add_leaf_field_value(field, ReferenceValueLeaf::Facet(facet.encoded_str()));
    }

    /// Adds a text value for `field`. The text is copied into the document.
    pub fn add_text<S: AsRef<str>>(&mut self, field: Field, text: S) {
        self.add_leaf_field_value(field, ReferenceValueLeaf::Str(text.as_ref()));
    }

    /// Adds a pre-tokenized text value for `field`.
    pub fn add_pre_tokenized_text(&mut self, field: Field, pre_tokenized_text: PreTokenizedString) {
        self.add_leaf_field_value(field, pre_tokenized_text);
    }

    /// Adds a `u64` value for `field`.
    pub fn add_u64(&mut self, field: Field, value: u64) {
        self.add_leaf_field_value(field, value);
    }

    /// Adds an IP address value for `field`. Internally only `Ipv6Addr` is used; the address is
    /// stored as its `u128` representation.
    pub fn add_ip_addr(&mut self, field: Field, value: Ipv6Addr) {
        self.add_leaf_field_value(field, value);
    }

    /// Adds an `i64` value for `field`.
    pub fn add_i64(&mut self, field: Field, value: i64) {
        self.add_leaf_field_value(field, value);
    }

    /// Adds an `f64` value for `field`.
    pub fn add_f64(&mut self, field: Field, value: f64) {
        self.add_leaf_field_value(field, value);
    }

    /// Adds a `bool` value for `field`. Bools are inlined into the value address and take no
    /// space in the serialized data.
    pub fn add_bool(&mut self, field: Field, value: bool) {
        self.add_leaf_field_value(field, value);
    }

    /// Adds a date value with unspecified time zone offset for `field`. The date is stored as
    /// its timestamp in nanoseconds.
    pub fn add_date(&mut self, field: Field, value: DateTime) {
        self.add_leaf_field_value(field, value);
    }

    /// Adds a bytes value for `field`. The bytes are copied into the document.
    pub fn add_bytes(&mut self, field: Field, value: &[u8]) {
        self.add_leaf_field_value(field, value);
    }

    /// Adds a dynamic object value for `field`.
    ///
    /// The map is first converted into an `OwnedValue`, which is then serialized into the
    /// document.
    pub fn add_object(&mut self, field: Field, object: BTreeMap<String, OwnedValue>) {
        self.add_field_value(field, &OwnedValue::from(object));
    }

    /// Appends `value` to the document under `field`.
    ///
    /// Any `Value` implementation is accepted, nested arrays and objects included. Passing an
    /// `OwnedValue` is the most convenient option, though not the most performant one.
    ///
    /// # Panics
    ///
    /// Panics if the id of `field` does not fit into a `u16`.
    pub fn add_field_value<'a, V: Value<'a>>(&mut self, field: Field, value: V) {
        // The field id is narrowed first, so an oversized id panics before anything is written.
        let field_id: u16 = field
            .field_id()
            .try_into()
            .expect("support only up to u16::MAX field ids");
        let value_addr = self.add_value(value);
        self.field_values.push(FieldValueAddr {
            field: field_id,
            value_addr,
        });
    }

    /// Appends a leaf value to the document under `field`.
    ///
    /// Leaf values are the ones without nested values, i.e. everything except arrays and
    /// objects.
    ///
    /// # Panics
    ///
    /// Panics if the id of `field` does not fit into a `u16`.
    pub fn add_leaf_field_value<'a, T: Into<ReferenceValueLeaf<'a>>>(
        &mut self,
        field: Field,
        typed_val: T,
    ) {
        let leaf: ReferenceValueLeaf<'a> = typed_val.into();
        // Narrow the field id before writing, so an oversized id leaves the document untouched.
        let field_id: u16 = field
            .field_id()
            .try_into()
            .expect("support only up to u16::MAX field ids");
        let value_addr = self.add_value_leaf(leaf);
        self.field_values.push(FieldValueAddr {
            field: field_id,
            value_addr,
        });
    }

    /// Iterates over the root (field, value) pairs of the document, in insertion order.
    pub fn field_values(&self) -> impl Iterator<Item = (Field, CompactDocValue<'_>)> {
        self.field_values.iter().map(|entry| {
            (
                Field::from_field_id(entry.field as u32),
                self.get_compact_doc_value(entry.value_addr),
            )
        })
    }

    /// Returns all of the values associated with the given field, in insertion order.
    ///
    /// Every root field value is inspected, so the cost grows with the number of values in
    /// the document.
    pub fn get_all(&self, field: Field) -> impl Iterator<Item = CompactDocValue<'_>> + '_ {
        self.field_values
            .iter()
            .filter(move |field_value| Field::from_field_id(field_value.field as u32) == field)
            .map(|val| self.get_compact_doc_value(val.value_addr))
    }

    /// Returns the first value associated with the given field, or `None` if the document has
    /// no value for it.
    pub fn get_first(&self, field: Field) -> Option<CompactDocValue<'_>> {
        self.get_all(field).next()
    }

    /// Builds a document from a named document.
    ///
    /// Field names are resolved against `schema`. Names the schema does not know are skipped
    /// silently, so this conversion currently always returns `Ok`.
    pub fn convert_named_doc(
        schema: &Schema,
        named_doc: NamedFieldDocument,
    ) -> Result<Self, DocParsingError> {
        let mut document = Self::new();
        for (field_name, values) in named_doc.0 {
            let Ok(field) = schema.get_field(&field_name) else {
                continue;
            };
            for value in values {
                document.add_field_value(field, &value);
            }
        }
        Ok(document)
    }

    /// Builds a document object from the text of a JSON object.
    ///
    /// # Errors
    ///
    /// Returns `DocParsingError::InvalidJson` if `doc_json` cannot be parsed as a JSON object,
    /// and forwards any error reported by [`Self::from_json_object`].
    pub fn parse_json(schema: &Schema, doc_json: &str) -> Result<Self, DocParsingError> {
        let json_obj: Map<String, serde_json::Value> =
            serde_json::from_str(doc_json).map_err(|_| DocParsingError::invalid_json(doc_json))?;
        Self::from_json_object(schema, json_obj)
    }

    /// Builds a document object from an already parsed JSON object.
    ///
    /// Keys that do not name a field of `schema` are skipped. A top-level JSON array adds one
    /// value per element; any other JSON value adds a single value.
    ///
    /// # Errors
    ///
    /// Returns `DocParsingError::ValueError` with the field name if a JSON value cannot be
    /// converted to the type of its field.
    pub fn from_json_object(
        schema: &Schema,
        json_obj: Map<String, serde_json::Value>,
    ) -> Result<Self, DocParsingError> {
        let mut doc = Self::default();
        for (field_name, json_value) in json_obj {
            let Ok(field) = schema.get_field(&field_name) else {
                continue;
            };
            let field_type = schema.get_field_entry(field).field_type();
            // Converts one JSON value to the field's type and appends it to the document.
            let mut push_value = |json_item: serde_json::Value| -> Result<(), DocParsingError> {
                let value = field_type
                    .value_from_json(json_item)
                    .map_err(|e| DocParsingError::ValueError(field_name.clone(), e))?;
                doc.add_field_value(field, &value);
                Ok(())
            };
            match json_value {
                serde_json::Value::Array(json_items) => {
                    for json_item in json_items {
                        push_value(json_item)?;
                    }
                }
                single_value => push_value(single_value)?,
            }
        }
        Ok(doc)
    }

    /// Stores a leaf value and returns its type together with its address.
    ///
    /// Null and bool carry no payload: their value is inlined into the returned address. Every
    /// other leaf is appended to `node_data`, and the address is the position it was written at.
    fn add_value_leaf(&mut self, leaf: ReferenceValueLeaf) -> ValueAddr {
        let type_id = ValueType::from(&leaf);
        let node_data = &mut self.node_data;
        let val_addr = match leaf {
            // Inlined values.
            ReferenceValueLeaf::Null => 0,
            ReferenceValueLeaf::Bool(flag) => u32::from(flag),
            // Length-prefixed byte payloads.
            ReferenceValueLeaf::Str(text) | ReferenceValueLeaf::Facet(text) => {
                write_bytes_into(node_data, text.as_bytes())
            }
            ReferenceValueLeaf::Bytes(bytes) => write_bytes_into(node_data, bytes),
            // Payloads written through `BinarySerializable`.
            ReferenceValueLeaf::U64(num) => write_into(node_data, num),
            ReferenceValueLeaf::I64(num) => write_into(node_data, num),
            ReferenceValueLeaf::F64(num) => write_into(node_data, num),
            ReferenceValueLeaf::Date(date) => write_into(node_data, date.into_timestamp_nanos()),
            ReferenceValueLeaf::IpAddr(ip_addr) => write_into(node_data, ip_addr.to_u128()),
            ReferenceValueLeaf::PreTokStr(pre_tok) => write_into(node_data, *pre_tok),
        };
        ValueAddr { type_id, val_addr }
    }
    /// Adds a value, nested values included, and returns its address in `node_data`.
    ///
    /// Children of arrays and objects are written first. The container itself is then stored
    /// as a length-prefixed list of the serialized child addresses; for objects, each child
    /// address is preceded by the address of its key.
    fn add_value<'a, V: Value<'a>>(&mut self, value: V) -> ValueAddr {
        let reference = value.as_value();
        let type_id = ValueType::from(&reference);
        // Serialized addresses of the children.
        // Reusing a vec would be nicer, but that is not easy because of the recursion.
        let child_addresses: Vec<u8> = match reference {
            ReferenceValue::Leaf(leaf) => return self.add_value_leaf(leaf),
            ReferenceValue::Array(elements) => {
                let mut buffer = Vec::new();
                for element in elements {
                    let element_addr = self.add_value(element);
                    write_into(&mut buffer, element_addr);
                }
                buffer
            }
            ReferenceValue::Object(entries) => {
                let mut buffer = Vec::new();
                for (key, child) in entries {
                    let key_addr = self.add_value_leaf(ReferenceValueLeaf::Str(key));
                    let child_addr = self.add_value(child);
                    write_into(&mut buffer, key_addr);
                    write_into(&mut buffer, child_addr);
                }
                buffer
            }
        };
        ValueAddr {
            type_id,
            val_addr: write_bytes_into(&mut self.node_data, &child_addresses),
        }
    }

    /// Wraps `value_addr` into a `CompactDocValue` that borrows this document.
    ///
    /// Nothing is decoded here; the payload is only read once the value is accessed.
    fn get_compact_doc_value(&self, value_addr: ValueAddr) -> CompactDocValue<'_> {
        CompactDocValue {
            container: self,
            value_addr,
        }
    }

    /// Returns the length-prefixed byte payload stored at `addr` in `node_data`, without
    /// copying it.
    fn extract_bytes(&self, addr: Addr) -> &[u8] {
        binary_deserialize_bytes(self.get_slice(addr))
    }

    /// Returns the string payload stored at `addr` in `node_data`, without copying it.
    ///
    /// The bytes are not checked for UTF-8 validity.
    fn extract_str(&self, addr: Addr) -> &str {
        let data = self.extract_bytes(addr);
        // Utf-8 checks would have a noticeable performance overhead here
        // SAFETY: relies on `addr` pointing at bytes that were written from a `&str`;
        // `add_value_leaf` stores `Str` and `Facet` payloads via `as_bytes()`.
        // NOTE(review): `node_data` is a public field, so code outside this module can
        // overwrite these bytes and break the invariant - confirm this is acceptable.
        unsafe { std::str::from_utf8_unchecked(data) }
    }

    /// Deserializes an owned `T` from the bytes starting at `addr` in `node_data`.
    fn read_from<T: BinarySerializable>(&self, addr: Addr) -> io::Result<T> {
        let mut cursor = std::io::Cursor::new(self.get_slice(addr));
        T::deserialize(&mut cursor)
    }

    /// Returns the part of `node_data` starting at `addr`. The returned slice is open ended: it
    /// runs to the end of the buffer, not to the end of the value.
    ///
    /// # Panics
    ///
    /// Panics if `addr` is greater than the length of `node_data`.
    fn get_slice(&self, addr: Addr) -> &[u8] {
        &self.node_data[addr as usize..]
    }
}

/// Reads a length-prefixed byte payload from the start of `data` and returns it as a
/// sub-slice, i.e. without copying. This is the borrowing counterpart to `BinarySerializable`.
///
/// # Panics
///
/// Panics if `data` is shorter than the length prefix announces.
fn binary_deserialize_bytes(data: &[u8]) -> &[u8] {
    let (payload_len, prefix_len) = read_u32_vint_no_advance(data);
    let payload_end = prefix_len + payload_len as usize;
    &data[prefix_len..payload_end]
}

/// Writes `data` with a vint length prefix and returns the position of the written data.
///
/// This is the `BinarySerializable` alternative for writing references.
///
/// # Panics
///
/// Panics if the current length of `vec` or the length of `data` does not fit into a `u32`.
/// Positions and length prefixes are `u32`, so a silently truncated value would produce a
/// corrupt address or prefix.
fn write_bytes_into(vec: &mut Vec<u8>, data: &[u8]) -> u32 {
    let pos = u32::try_from(vec.len()).expect("document data exceeds the u32 address space");
    let data_len =
        u32::try_from(data.len()).expect("value is too large for a u32 length prefix");
    let mut buf = [0u8; 8];
    let len_vint_bytes = serialize_vint_u32(data_len, &mut buf);
    vec.extend_from_slice(len_vint_bytes);
    vec.extend_from_slice(data);
    pos
}

/// Serializes `value` at the end of `vec` and returns the position it was written at.
///
/// # Panics
///
/// Panics if the current length of `vec` does not fit into a `u32`. Positions are `u32`, so
/// a silently truncated position would be a corrupt address.
fn write_into<T: BinarySerializable>(vec: &mut Vec<u8>, value: T) -> u32 {
    let pos = u32::try_from(vec.len()).expect("document data exceeds the u32 address space");
    value
        .serialize(vec)
        .expect("serializing into a Vec<u8> should not fail");
    pos
}

impl PartialEq for CompactDoc {
    fn eq(&self, other: &Self) -> bool {
        // super slow, but only here for tests
        let convert_to_comparable_map = |doc: &CompactDoc| {
            let mut field_value_set: HashMap<Field, HashSet<String>> = Default::default();
            for field_value in doc.field_values.iter() {
                let value: OwnedValue = doc.get_compact_doc_value(field_value.value_addr).into();
                let value = serde_json::to_string(&value).unwrap();
                field_value_set
                    .entry(Field::from_field_id(field_value.field as u32))
                    .or_default()
                    .insert(value);
            }
            field_value_set
        };
        let self_field_values: HashMap<Field, HashSet<String>> = convert_to_comparable_map(self);
        let other_field_values: HashMap<Field, HashSet<String>> = convert_to_comparable_map(other);
        self_field_values.eq(&other_field_values)
    }
}

// Marker impl: equality is fully defined by the `PartialEq` implementation for `CompactDoc`.
impl Eq for CompactDoc {}

impl DocumentDeserialize for CompactDoc {
    /// Builds a `CompactDoc` by draining every (field, value) pair from `deserializer`.
    ///
    /// Each value is first materialized as an `OwnedValue` and then re-encoded into the
    /// compact form. The first error reported by the deserializer is returned.
    fn deserialize<'de, D>(mut deserializer: D) -> Result<Self, DeserializeError>
    where D: DocumentDeserializer<'de> {
        let mut doc = CompactDoc::default();
        // TODO: Deserializing into OwnedValue is wasteful. The deserializer should be able to work
        // on slices and referenced data.
        while let Some((field, value)) = deserializer.next_field::<OwnedValue>()? {
            doc.add_field_value(field, &value);
        }
        Ok(doc)
    }
}

/// A value of a `CompactDoc`.
///
/// It only holds the type and address of the value, so it needs a reference to the
/// container to extract its payload.
#[derive(Debug, Clone, Copy)]
pub struct CompactDocValue<'a> {
    /// The document whose `node_data` holds the payload.
    container: &'a CompactDoc,
    /// Type and address of the value inside `container`.
    value_addr: ValueAddr,
}
impl PartialEq for CompactDocValue<'_> {
    fn eq(&self, other: &Self) -> bool {
        let value1: OwnedValue = (*self).into();
        let value2: OwnedValue = (*other).into();
        value1 == value2
    }
}
impl From<CompactDocValue<'_>> for OwnedValue {
    /// Decodes the value from its container and converts it into an `OwnedValue`.
    fn from(value: CompactDocValue) -> Self {
        value.as_value().into()
    }
}
impl<'a> Value<'a> for CompactDocValue<'a> {
    type ArrayIter = CompactDocArrayIter<'a>;

    type ObjectIter = CompactDocObjectIter<'a>;

    /// Decodes the value from the container.
    ///
    /// # Panics
    ///
    /// Panics if the payload cannot be read from the container.
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        self.get_ref_value().unwrap()
    }
}
impl<'a> CompactDocValue<'a> {
    fn get_ref_value(&self) -> io::Result<ReferenceValue<'a, CompactDocValue<'a>>> {
        let addr = self.value_addr.val_addr;
        match self.value_addr.type_id {
            ValueType::Null => Ok(ReferenceValueLeaf::Null.into()),
            ValueType::Str => {
                let str_ref = self.container.extract_str(addr);
                Ok(ReferenceValueLeaf::Str(str_ref).into())
            }
            ValueType::Facet => {
                let str_ref = self.container.extract_str(addr);
                Ok(ReferenceValueLeaf::Facet(str_ref).into())
            }
            ValueType::Bytes => {
                let data = self.container.extract_bytes(addr);
                Ok(ReferenceValueLeaf::Bytes(data).into())
            }
            ValueType::U64 => self
                .container
                .read_from::<u64>(addr)
                .map(ReferenceValueLeaf::U64)
                .map(Into::into),
            ValueType::I64 => self
                .container
                .read_from::<i64>(addr)
                .map(ReferenceValueLeaf::I64)
                .map(Into::into),
            ValueType::F64 => self
                .container
                .read_from::<f64>(addr)
                .map(ReferenceValueLeaf::F64)
                .map(Into::into),
            ValueType::Bool => Ok(ReferenceValueLeaf::Bool(addr != 0).into()),
            ValueType::Date => self
                .container
                .read_from::<i64>(addr)
                .map(|ts| ReferenceValueLeaf::Date(DateTime::from_timestamp_nanos(ts)))
                .map(Into::into),
            ValueType::IpAddr => self
                .container
                .read_from::<u128>(addr)
                .map(|num| ReferenceValueLeaf::IpAddr(Ipv6Addr::from_u128(num)))
                .map(Into::into),
            ValueType::PreTokStr => self
                .container
                .read_from::<PreTokenizedString>(addr)
                .map(Into::into)
                .map(ReferenceValueLeaf::PreTokStr)
                .map(Into::into),
            ValueType::Object => Ok(ReferenceValue::Object(CompactDocObjectIter::new(
                self.container,
                addr,
            )?)),
            ValueType::Array => Ok(ReferenceValue::Array(CompactDocArrayIter::new(
                self.container,
                addr,
            )?)),
        }
    }
}

/// The address in the vec, i.e. a byte offset into `CompactDoc::node_data`.
type Addr = u32;

#[derive(Clone, Copy, Default)]
#[repr(C, packed)]
/// The value type and the address to its payload in the container.
struct ValueAddr {
    /// The type of the value; it decides how `val_addr` is interpreted.
    type_id: ValueType,
    /// This is the address to the value in the vec, except for bool and null, which are inlined
    val_addr: Addr,
}
impl BinarySerializable for ValueAddr {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        self.type_id.serialize(writer)?;
        VInt(self.val_addr as u64).serialize(writer)
    }

    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        let type_id = ValueType::deserialize(reader)?;
        let val_addr = VInt::deserialize(reader)?.0 as u32;
        Ok(ValueAddr { type_id, val_addr })
    }
}
impl std::fmt::Debug for ValueAddr {
    /// Formats the address as `<type> at <address>`.
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        // Copy the fields out first: the struct is packed, so they are read by value.
        let (type_id, val_addr) = (self.type_id, self.val_addr);
        write!(f, "{type_id:?} at {val_addr:?}")
    }
}

/// An enum representing the type of a value for tantivy to index.
///
/// ** Any changes need to be reflected in `BinarySerializable` for `ValueType` **
///
/// We can't use [schema::Type] or [columnar::ColumnType] here, because they are missing
/// some items like Array and PreTokStr.
#[derive(Default, Clone, Copy, Debug, PartialEq)]
#[repr(u8)]
pub enum ValueType {
    /// A null value.
    #[default]
    Null = 0,
    /// The str type is used for any text information.
    Str = 1,
    /// Unsigned 64-bits Integer `u64`
    U64 = 2,
    /// Signed 64-bits Integer `i64`
    I64 = 3,
    /// 64-bits Float `f64`
    F64 = 4,
    /// Date/time with nanoseconds precision
    Date = 5,
    /// Facet
    Facet = 6,
    /// Arbitrarily sized byte array
    Bytes = 7,
    /// IpV6 Address. Internally there is no IpV4, it needs to be converted to `Ipv6Addr`.
    IpAddr = 8,
    /// Bool value
    Bool = 9,
    /// Pre-tokenized str type,
    PreTokStr = 10,
    /// Object
    Object = 11,
    /// Array
    Array = 12,
}

impl BinarySerializable for ValueType {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        (*self as u8).serialize(writer)?;
        Ok(())
    }

    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        let num = u8::deserialize(reader)?;
        let type_id = if (0..=12).contains(&num) {
            unsafe { std::mem::transmute::<u8, ValueType>(num) }
        } else {
            return Err(io::Error::new(
                io::ErrorKind::InvalidData,
                format!("Invalid value type id: {num}"),
            ));
        };
        Ok(type_id)
    }
}

impl<'a, V: Value<'a>> From<&ReferenceValue<'a, V>> for ValueType {
    /// Returns the `ValueType` that describes `value`; leaves are delegated to the conversion
    /// from `ReferenceValueLeaf`.
    fn from(value: &ReferenceValue<'a, V>) -> Self {
        match value {
            ReferenceValue::Leaf(leaf) => leaf.into(),
            ReferenceValue::Array(_) => ValueType::Array,
            ReferenceValue::Object(_) => ValueType::Object,
        }
    }
}
impl<'a> From<&ReferenceValueLeaf<'a>> for ValueType {
    /// Returns the `ValueType` with the same name as the variant of the leaf `value`.
    fn from(value: &ReferenceValueLeaf<'a>) -> Self {
        match value {
            ReferenceValueLeaf::Null => ValueType::Null,
            ReferenceValueLeaf::Str(_) => ValueType::Str,
            ReferenceValueLeaf::U64(_) => ValueType::U64,
            ReferenceValueLeaf::I64(_) => ValueType::I64,
            ReferenceValueLeaf::F64(_) => ValueType::F64,
            ReferenceValueLeaf::Bool(_) => ValueType::Bool,
            ReferenceValueLeaf::Date(_) => ValueType::Date,
            ReferenceValueLeaf::IpAddr(_) => ValueType::IpAddr,
            ReferenceValueLeaf::PreTokStr(_) => ValueType::PreTokStr,
            ReferenceValueLeaf::Facet(_) => ValueType::Facet,
            ReferenceValueLeaf::Bytes(_) => ValueType::Bytes,
        }
    }
}

#[derive(Debug, Clone)]
/// The Iterator for the object values in the compact document
pub struct CompactDocObjectIter<'a> {
    /// The document the keys and values are read from.
    container: &'a CompactDoc,
    /// The serialized (key address, value address) pairs that have not been yielded yet.
    node_addresses_slice: &'a [u8],
}

impl<'a> CompactDocObjectIter<'a> {
    /// Creates an iterator over the entries of the object stored at `addr` in `container`.
    fn new(container: &'a CompactDoc, addr: Addr) -> io::Result<Self> {
        // Objects are serialized as a sequence of `ValueAddr`s: for every entry the address of
        // the key, followed by the address of the value.
        let node_addresses_slice = container.extract_bytes(addr);
        Ok(Self {
            container,
            node_addresses_slice,
        })
    }
}

impl<'a> Iterator for CompactDocObjectIter<'a> {
    type Item = (&'a str, CompactDocValue<'a>);

    /// Yields the next (key, value) entry of the object.
    ///
    /// Iteration ends once all addresses are consumed, or as soon as an address cannot be
    /// deserialized.
    fn next(&mut self) -> Option<Self::Item> {
        if self.node_addresses_slice.is_empty() {
            return None;
        }
        // Each entry is stored as the key address followed by the value address.
        let key_addr = ValueAddr::deserialize(&mut self.node_addresses_slice).ok()?;
        let key = self.container.extract_str(key_addr.val_addr);
        let value_addr = ValueAddr::deserialize(&mut self.node_addresses_slice).ok()?;
        Some((
            key,
            CompactDocValue {
                container: self.container,
                value_addr,
            },
        ))
    }
}

#[derive(Debug, Clone)]
/// The Iterator for the array values in the compact document
pub struct CompactDocArrayIter<'a> {
    /// The document the elements are read from.
    container: &'a CompactDoc,
    /// The serialized element addresses that have not been yielded yet.
    node_addresses_slice: &'a [u8],
}

impl<'a> CompactDocArrayIter<'a> {
    /// Creates an iterator over the elements of the array stored at `addr` in `container`.
    fn new(container: &'a CompactDoc, addr: Addr) -> io::Result<Self> {
        // Arrays are &[ValueAddr] serialized into bytes
        let node_addresses_slice = container.extract_bytes(addr);
        Ok(Self {
            container,
            node_addresses_slice,
        })
    }
}

impl<'a> Iterator for CompactDocArrayIter<'a> {
    type Item = CompactDocValue<'a>;

    /// Yields the next element of the array.
    ///
    /// Iteration ends once all addresses are consumed, or as soon as an address cannot be
    /// deserialized.
    fn next(&mut self) -> Option<Self::Item> {
        if self.node_addresses_slice.is_empty() {
            return None;
        }
        let value_addr = ValueAddr::deserialize(&mut self.node_addresses_slice).ok()?;
        Some(CompactDocValue {
            container: self.container,
            value_addr,
        })
    }
}

impl Document for CompactDoc {
    type Value<'a> = CompactDocValue<'a>;
    type FieldsValuesIter<'a> = FieldValueIterRef<'a>;

    /// Returns an iterator over the root (field, value) pairs, in insertion order.
    fn iter_fields_and_values(&self) -> Self::FieldsValuesIter<'_> {
        FieldValueIterRef {
            slice: self.field_values.iter(),
            container: self,
        }
    }
}

/// A helper wrapper for creating an iterator over the field values
pub struct FieldValueIterRef<'a> {
    /// The root field value addresses that have not been yielded yet.
    slice: std::slice::Iter<'a, FieldValueAddr>,
    /// The document the addresses point into.
    container: &'a CompactDoc,
}

impl<'a> Iterator for FieldValueIterRef<'a> {
    type Item = (Field, CompactDocValue<'a>);

    /// Yields the next root (field, value) pair of the document.
    fn next(&mut self) -> Option<Self::Item> {
        let entry = self.slice.next()?;
        let field = Field::from_field_id(entry.field as u32);
        let value = CompactDocValue::<'a> {
            container: self.container,
            value_addr: entry.value_addr,
        };
        Some((field, value))
    }
}

/// Error that may happen when deserializing
/// a document from JSON.
#[derive(Debug, Error, PartialEq)]
pub enum DocParsingError {
    /// The payload given is not valid JSON. Holds a short sample taken from the start of
    /// the payload.
    #[error("The provided string is not valid JSON")]
    InvalidJson(String),
    /// One of the value nodes could not be parsed. Holds the name of the field and the
    /// underlying parsing error.
    #[error("The field '{0:?}' could not be parsed: {1:?}")]
    ValueError(String, ValueParsingError),
}

impl DocParsingError {
    /// Builds an `InvalidJson` DocParsingError.
    ///
    /// Only the first 20 characters of the payload are kept as a sample.
    fn invalid_json(invalid_json: &str) -> Self {
        let sample = invalid_json.chars().take(20).collect();
        DocParsingError::InvalidJson(sample)
    }
}

#[cfg(test)]
mod tests {
    use crate::schema::*;

    /// Adds a single text value and checks that it can be counted, fetched and converted to a
    /// named document.
    #[test]
    fn test_doc() {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("title", TEXT);
        let mut doc = TantivyDocument::default();
        doc.add_text(text_field, "My title");
        assert_eq!(doc.field_values().count(), 1);

        let schema = schema_builder.build();
        let _val = doc.get_first(text_field).unwrap();
        let _json = doc.to_named_doc(&schema);
    }

    /// Round-trips a deeply nested JSON object through the compact document and checks that
    /// the JSON produced from the document matches the input.
    #[test]
    fn test_json_value() {
        let json_str = r#"{
            "toto": "titi",
            "float": -0.2,
            "bool": true,
            "unsigned": 1,
            "signed": -2,
            "complexobject": {
                "field.with.dot": 1
            },
            "date": "1985-04-12T23:20:50.52Z",
            "my_arr": [2, 3, {"my_key": "two tokens"}, 4, {"nested_array": [2, 5, 6, [7, 8, {"a": [{"d": {"e":[99]}}, 9000]}, 9, 10], [5, 5]]}]
        }"#;
        let json_val: std::collections::BTreeMap<String, OwnedValue> =
            serde_json::from_str(json_str).unwrap();

        let mut schema_builder = Schema::builder();
        let json_field = schema_builder.add_json_field("json", TEXT);
        let mut doc = TantivyDocument::default();
        doc.add_object(json_field, json_val);

        let schema = schema_builder.build();
        let json = doc.to_json(&schema);
        let actual_json: serde_json::Value = serde_json::from_str(&json).unwrap();
        let expected_json: serde_json::Value = serde_json::from_str(json_str).unwrap();
        // The document holds a single value for the field, hence index 0.
        assert_eq!(actual_json["json"][0], expected_json);
    }

    // TODO: Should this be re-added with the serialize method
    //       technically this is no longer useful since the doc types
    //       do not implement BinarySerializable due to orphan rules.
    // #[test]
    // fn test_doc_serialization_issue() {
    //     let mut doc = Document::default();
    //     doc.add_json_object(
    //         Field::from_field_id(0),
    //         serde_json::json!({"key": 2u64})
    //             .as_object()
    //             .unwrap()
    //             .clone(),
    //     );
    //     doc.add_text(Field::from_field_id(1), "hello");
    //     assert_eq!(doc.field_values().len(), 2);
    //     let mut payload: Vec<u8> = Vec::new();
    //     doc_binary_wrappers::serialize(&doc, &mut payload).unwrap();
    //     assert_eq!(payload.len(), 26);
    //     doc_binary_wrappers::deserialize::<Document, _>(&mut &payload[..]).unwrap();
    // }
}


================================================
FILE: src/schema/document/existing_type_impls.rs
================================================
//! Implementations of some of the core traits on various types to improve the ergonomics
//! of the API when providing custom documents.
//!
//! This allows users a bit more freedom and ergonomics if they want a simple API
//! and don't care about some of the more specialised types or only want to customise
//! part of the document structure.
use std::collections::{btree_map, hash_map, BTreeMap, HashMap};
use std::iter::Empty;
use std::net::Ipv6Addr;

use common::DateTime;
use serde_json::Number;
use time::format_description::well_known::Rfc3339;
use time::OffsetDateTime;

use super::facet::Facet;
use super::ReferenceValueLeaf;
use crate::schema::document::{
    ArrayAccess, DeserializeError, Document, DocumentDeserialize, DocumentDeserializer,
    ObjectAccess, ReferenceValue, Value, ValueDeserialize, ValueDeserializer, ValueVisitor,
};
use crate::schema::Field;
use crate::tokenizer::PreTokenizedString;

// Serde compatibility support.
/// Cheap pre-filter used before attempting a full RFC 3339 parse.
///
/// Returns `true` only when `text` is non-empty and its first byte is an ASCII digit.
/// A `true` result does not mean the text is a valid timestamp, only that trying to
/// parse it is worthwhile.
pub fn can_be_rfc3339_date_time(text: &str) -> bool {
    matches!(text.as_bytes().first(), Some(leading) if leading.is_ascii_digit())
}

/// Exposes a borrowed [`serde_json::Value`] as a tantivy [`Value`].
///
/// Numbers are surfaced as `i64` when possible, then `u64`, then `f64`.
/// Strings that pass [`can_be_rfc3339_date_time`] and parse as RFC 3339 are surfaced
/// as dates converted to UTC; every other string is surfaced as text.
///
/// # Panics
/// Panics if a JSON number can be read as none of `i64`, `u64` or `f64`.
impl<'a> Value<'a> for &'a serde_json::Value {
    type ArrayIter = std::slice::Iter<'a, serde_json::Value>;
    type ObjectIter = JsonObjectIter<'a>;

    #[inline]
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        match self {
            serde_json::Value::Null => ReferenceValueLeaf::Null.into(),
            serde_json::Value::Bool(flag) => ReferenceValueLeaf::Bool(*flag).into(),
            serde_json::Value::Number(number) => {
                // Probe the integer representations first; floats are the fallback.
                let leaf = if let Some(signed) = number.as_i64() {
                    ReferenceValueLeaf::I64(signed)
                } else if let Some(unsigned) = number.as_u64() {
                    ReferenceValueLeaf::U64(unsigned)
                } else if let Some(float) = number.as_f64() {
                    ReferenceValueLeaf::F64(float)
                } else {
                    panic!("Unsupported serde_json number {number}");
                };
                leaf.into()
            }
            serde_json::Value::String(text) => {
                if can_be_rfc3339_date_time(text) {
                    if let Ok(parsed) = OffsetDateTime::parse(text, &Rfc3339) {
                        let in_utc = parsed.to_offset(time::UtcOffset::UTC);
                        return ReferenceValueLeaf::Date(DateTime::from_utc(in_utc)).into();
                    }
                }
                // Either the pre-filter rejected the text or the parse failed.
                ReferenceValueLeaf::Str(text).into()
            }
            serde_json::Value::Array(elements) => ReferenceValue::Array(elements.iter()),
            serde_json::Value::Object(object) => {
                ReferenceValue::Object(JsonObjectIter(object.iter()))
            }
        }
    }
}

/// A borrowed `String` is always a text leaf; it never yields array or object items.
impl<'a> Value<'a> for &'a String {
    type ArrayIter = Empty<&'a String>;
    type ObjectIter = Empty<(&'a str, &'a String)>;
    #[inline]
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        ReferenceValueLeaf::Str(self.as_str()).into()
    }
}

/// A borrowed [`Facet`] is surfaced as a facet leaf carrying its encoded string.
impl<'a> Value<'a> for &'a Facet {
    type ArrayIter = Empty<&'a Facet>;
    type ObjectIter = Empty<(&'a str, &'a Facet)>;
    #[inline]
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        let encoded = self.encoded_str();
        ReferenceValueLeaf::Facet(encoded).into()
    }
}

/// A borrowed `u64` is surfaced as an unsigned integer leaf.
impl<'a> Value<'a> for &'a u64 {
    type ArrayIter = Empty<&'a u64>;
    type ObjectIter = Empty<(&'a str, &'a u64)>;
    #[inline]
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        let number: u64 = **self;
        ReferenceValueLeaf::U64(number).into()
    }
}

/// A borrowed `i64` is surfaced as a signed integer leaf.
impl<'a> Value<'a> for &'a i64 {
    type ArrayIter = Empty<&'a i64>;
    type ObjectIter = Empty<(&'a str, &'a i64)>;
    #[inline]
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        let number: i64 = **self;
        ReferenceValueLeaf::I64(number).into()
    }
}
/// A borrowed `f64` is surfaced as a float leaf.
impl<'a> Value<'a> for &'a f64 {
    type ArrayIter = Empty<&'a f64>;
    type ObjectIter = Empty<(&'a str, &'a f64)>;
    #[inline]
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        let number: f64 = **self;
        ReferenceValueLeaf::F64(number).into()
    }
}
/// A borrowed `bool` is surfaced as a boolean leaf.
impl<'a> Value<'a> for &'a bool {
    type ArrayIter = Empty<&'a bool>;
    type ObjectIter = Empty<(&'a str, &'a bool)>;
    #[inline]
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        let flag: bool = **self;
        ReferenceValueLeaf::Bool(flag).into()
    }
}
/// A string slice is surfaced as a text leaf borrowing the same data.
impl<'a> Value<'a> for &'a str {
    type ArrayIter = Empty<&'a str>;
    type ObjectIter = Empty<(&'a str, &'a str)>;
    #[inline]
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        let text: &'a str = *self;
        ReferenceValueLeaf::Str(text).into()
    }
}
/// A reference to a string slice is surfaced as a text leaf over the inner slice.
impl<'a> Value<'a> for &'a &'a str {
    type ArrayIter = Empty<&'a &'a str>;
    type ObjectIter = Empty<(&'a str, &'a &'a str)>;
    #[inline]
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        let text: &'a str = **self;
        ReferenceValueLeaf::Str(text).into()
    }
}

/// A byte slice is surfaced as a bytes leaf borrowing the same data.
impl<'a> Value<'a> for &'a [u8] {
    type ArrayIter = Empty<&'a [u8]>;
    type ObjectIter = Empty<(&'a str, &'a [u8])>;
    #[inline]
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        let bytes: &'a [u8] = *self;
        ReferenceValueLeaf::Bytes(bytes).into()
    }
}

/// A reference to a byte slice is surfaced as a bytes leaf over the inner slice.
impl<'a> Value<'a> for &'a &'a [u8] {
    type ArrayIter = Empty<&'a &'a [u8]>;
    type ObjectIter = Empty<(&'a str, &'a &'a [u8])>;
    #[inline]
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        let bytes: &'a [u8] = **self;
        ReferenceValueLeaf::Bytes(bytes).into()
    }
}

/// A borrowed byte vector is surfaced as a bytes leaf over its contents.
impl<'a> Value<'a> for &'a Vec<u8> {
    type ArrayIter = Empty<&'a Vec<u8>>;
    type ObjectIter = Empty<(&'a str, &'a Vec<u8>)>;
    #[inline]
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        ReferenceValueLeaf::Bytes(self.as_slice()).into()
    }
}

/// A borrowed [`DateTime`] is copied into a date leaf.
impl<'a> Value<'a> for &'a DateTime {
    type ArrayIter = Empty<&'a DateTime>;
    type ObjectIter = Empty<(&'a str, &'a DateTime)>;
    #[inline]
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        let date_time: DateTime = **self;
        ReferenceValueLeaf::Date(date_time).into()
    }
}
/// A borrowed [`Ipv6Addr`] is copied into an IP address leaf.
impl<'a> Value<'a> for &'a Ipv6Addr {
    type ArrayIter = Empty<&'a Ipv6Addr>;
    type ObjectIter = Empty<(&'a str, &'a Ipv6Addr)>;
    #[inline]
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        let address: Ipv6Addr = **self;
        ReferenceValueLeaf::IpAddr(address).into()
    }
}
impl<'a> Value<'a> for &'a PreTokenizedString {
    type ArrayIter = Empty<&'a PreTokenizedString>;
    type ObjectIter = Empty<(&'a str, &'a PreTokenizedString)>;
    #[inline]
    fn as_value(&self) -> ReferenceValue<'a, Self> {
        ReferenceValue::Leaf(ReferenceValueLeaf::PreTokStr(Box::new((*self).clone())))
    }
}

/// Rebuilds a [`serde_json::Value`] from a deserializer.
///
/// The visitor below handles null, string, integer, float, bool, array and object
/// inputs. A float for which `Number::from_f64` returns `None` is reported as a
/// [`DeserializeError`].
impl ValueDeserialize for serde_json::Value {
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de> {
        struct JsonValueVisitor;

        impl ValueVisitor for JsonValueVisitor {
            type Value = serde_json::Value;

            fn visit_null(&self) -> Result<Self::Value, DeserializeError> {
                Ok(serde_json::Value::Null)
            }

            fn visit_string(&self, val: String) -> Result<Self::Value, DeserializeError> {
                Ok(serde_json::Value::String(val))
            }

            fn visit_u64(&self, val: u64) -> Result<Self::Value, DeserializeError> {
                Ok(serde_json::Value::Number(Number::from(val)))
            }

            fn visit_i64(&self, val: i64) -> Result<Self::Value, DeserializeError> {
                Ok(serde_json::Value::Number(Number::from(val)))
            }

            fn visit_f64(&self, val: f64) -> Result<Self::Value, DeserializeError> {
                match Number::from_f64(val) {
                    Some(number) => Ok(serde_json::Value::Number(number)),
                    None => Err(DeserializeError::custom(format!(
                        "serde_json::Value cannot deserialize float {val}"
                    ))),
                }
            }

            fn visit_bool(&self, val: bool) -> Result<Self::Value, DeserializeError> {
                Ok(serde_json::Value::Bool(val))
            }

            fn visit_array<'de, A>(&self, mut access: A) -> Result<Self::Value, DeserializeError>
            where A: ArrayAccess<'de> {
                let mut items = Vec::with_capacity(access.size_hint());

                // Pull elements until the accessor is exhausted; errors bubble up via `?`.
                loop {
                    match access.next_element()? {
                        Some(item) => items.push(item),
                        None => break,
                    }
                }

                Ok(serde_json::Value::Array(items))
            }

            fn visit_object<'de, A>(&self, mut access: A) -> Result<Self::Value, DeserializeError>
            where A: ObjectAccess<'de> {
                let mut entries = serde_json::Map::with_capacity(access.size_hint());

                // A repeated key replaces the entry inserted earlier.
                loop {
                    match access.next_entry()? {
                        Some((key, value)) => {
                            entries.insert(key, value);
                        }
                        None => break,
                    }
                }

                Ok(serde_json::Value::Object(entries))
            }
        }

        deserializer.deserialize_any(JsonValueVisitor)
    }
}

/// New-type around a `serde_json` map iterator that yields `(&str, &serde_json::Value)`
/// pairs, i.e. the key as a string slice rather than a `&String`.
pub struct JsonObjectIter<'a>(pub(crate) serde_json::map::Iter<'a>);

impl<'a> Iterator for JsonObjectIter<'a> {
    type Item = (&'a str, &'a serde_json::Value);

    fn next(&mut self) -> Option<Self::Item> {
        self.0.next().map(|(key, value)| (key.as_str(), value))
    }
}

// Custom document types

// BTreeMap based documents
/// Lets a `BTreeMap` from [`Field`] to owned value be used directly as a document.
///
/// Fields are yielded in the map's iteration order, each paired with a reference
/// to its value.
impl Document for BTreeMap<Field, crate::schema::OwnedValue> {
    type Value<'a> = &'a crate::schema::OwnedValue;
    type FieldsValuesIter<'a> = FieldCopyingIterator<
        'a,
        btree_map::Iter<'a, Field, crate::schema::OwnedValue>,
        crate::schema::OwnedValue,
    >;

    fn iter_fields_and_values(&self) -> Self::FieldsValuesIter<'_> {
        let entries = self.iter();
        FieldCopyingIterator(entries)
    }
}
/// Rebuilds a `BTreeMap` document by draining every field from the deserializer.
///
/// When the same field is produced more than once, the last value wins because
/// each entry is inserted into the map.
impl DocumentDeserialize for BTreeMap<Field, crate::schema::OwnedValue> {
    fn deserialize<'de, D>(mut deserializer: D) -> Result<Self, DeserializeError>
    where D: DocumentDeserializer<'de> {
        let mut fields = BTreeMap::new();

        loop {
            match deserializer.next_field()? {
                Some((field, value)) => {
                    fields.insert(field, value);
                }
                None => return Ok(fields),
            }
        }
    }
}

// HashMap based documents
/// Lets a `HashMap` from [`Field`] to owned value be used directly as a document.
///
/// Fields are yielded in the map's iteration order, each paired with a reference
/// to its value.
impl Document for HashMap<Field, crate::schema::OwnedValue> {
    type Value<'a> = &'a crate::schema::OwnedValue;
    type FieldsValuesIter<'a> = FieldCopyingIterator<
        'a,
        hash_map::Iter<'a, Field, crate::schema::OwnedValue>,
        crate::schema::OwnedValue,
    >;

    fn iter_fields_and_values(&self) -> Self::FieldsValuesIter<'_> {
        let entries = self.iter();
        FieldCopyingIterator(entries)
    }
}
/// Rebuilds a `HashMap` document by draining every field from the deserializer.
///
/// The map is pre-sized from the deserializer's size hint. When the same field is
/// produced more than once, the last value wins.
impl DocumentDeserialize for HashMap<Field, crate::schema::OwnedValue> {
    fn deserialize<'de, D>(mut deserializer: D) -> Result<Self, DeserializeError>
    where D: DocumentDeserializer<'de> {
        let expected_len = deserializer.size_hint();
        let mut fields = HashMap::with_capacity(expected_len);

        loop {
            match deserializer.next_field()? {
                Some((field, value)) => {
                    fields.insert(field, value);
                }
                None => return Ok(fields),
            }
        }
    }
}

/// Adapter over an iterator of `(&Field, &V)` pairs that yields `(Field, &V)`:
/// the field is copied out of its reference while the value stays borrowed.
pub struct FieldCopyingIterator<'a, I, V>(I)
where
    V: 'a,
    I: Iterator<Item = (&'a Field, &'a V)>;

impl<'a, I, V> Iterator for FieldCopyingIterator<'a, I, V>
where
    V: 'a,
    I: Iterator<Item = (&'a Field, &'a V)>,
{
    type Item = (Field, &'a V);

    fn next(&mut self) -> Option<Self::Item> {
        self.0.next().map(|(field, value)| (*field, value))
    }
}


================================================
FILE: src/schema/document/mod.rs
================================================
//! Document definition for Tantivy to index and store.
//!
//! A document and its values are defined by a couple core traits:
//! - [Document] which describes your top-level document and its fields.
//! - [Value] which provides tantivy with a way to access the document's values in a common way
//!   without performing any additional allocations.
//! - [DocumentDeserialize] which implements the necessary code to deserialize the document from the
//!   doc store. If you are fine with fetching [TantivyDocument] from the doc store, you can skip
//!   implementing this trait for your type.
//!
//! Tantivy provides a few out-of-box implementations of these core traits to provide
//! some simple usage if you don't want to implement these traits on a custom type yourself.
//!
//! # Out-of-box document implementations
//! - [TantivyDocument] the old document type used by Tantivy before the trait based approach was
//!   implemented. This type is still valid and provides all of the original behaviour you might
//!   expect.
//! - `BTreeMap<Field, OwnedValue>` a mapping of field_ids to their relevant schema value using a
//!   BTreeMap.
//! - `HashMap<Field, OwnedValue>` a mapping of field_ids to their relevant schema value using a
//!   HashMap.
//!
//! # Implementing your custom documents
//! Often in larger projects or higher performance applications you want to avoid the extra overhead
//! of converting your own types to the [TantivyDocument] type, this can often save you a
//! significant amount of time when indexing by avoiding the additional allocations.
//!
//! ### Important Note
//! The implementer of the `Document` trait must be `'static` and safe to send across
//! thread boundaries.
//!
//! ## Reusing existing types
//! The API design of the document traits allows you to reuse as much or as little of the
//! existing trait implementations as you like, this can save quite a bit of boilerplate
//! as shown by the following example.
//!
//! ## A basic custom document
//! ```
//! use std::collections::{btree_map, BTreeMap};
//! use tantivy::schema::{Document, Field};
//! use tantivy::schema::document::{DeserializeError, DocumentDeserialize, DocumentDeserializer};
//!
//! /// Our custom document to let us use a map of `serde_json::Values`.
//! #[allow(dead_code)]
//! pub struct MyCustomDocument {
//!     // Tantivy provides trait implementations for common `serde_json` types.
//!     fields: BTreeMap<Field, serde_json::Value>
//! }
//!
//! impl Document for MyCustomDocument {
//!     // The value type produced by the `iter_fields_and_values` iterator.
//!     // tantivy already implements the Value trait for serde_json::Value.
//!     type Value<'a> = &'a serde_json::Value;
//!     // The iterator which is produced by `iter_fields_and_values`.
//!     // Often this is a simple new-type wrapper unless you like super long generics.
//!     type FieldsValuesIter<'a> = MyCustomIter<'a>;
//!
//!     /// Produces an iterator over the document fields and values.
//!     /// This method will be called multiple times, it's important
//!     /// to not do anything too heavy in this step, any heavy operations
//!     /// should be done before and effectively cached.
//!     fn iter_fields_and_values(&self) -> Self::FieldsValuesIter<'_> {
//!         MyCustomIter(self.fields.iter())
//!     }
//! }
//!
//! // Our document must also provide a way to get the original doc
//! // back when it's deserialized from the doc store.
//! // The API for this is very similar to serde but a little bit
//! // more specialised, giving you access to types like IP addresses, datetime, etc...
//! impl DocumentDeserialize for MyCustomDocument {
//!     fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
//!     where D: DocumentDeserializer<'de>
//!     {
//!         // We're not going to implement the necessary logic for this example
//!         // see the `Deserialization` section of implementing a custom document
//!         // for more information on how this works.
//!         unimplemented!()
//!     }
//! }
//!
//! /// Our custom iterator just helps us to avoid some messy generics.
//! #[allow(dead_code)]
//! pub struct MyCustomIter<'a>(btree_map::Iter<'a, Field, serde_json::Value>);
//! impl<'a> Iterator for MyCustomIter<'a> {
//!     // Here we can see our field-value pairs being produced by the iterator.
//!     // The value returned alongside the field is the same type as `Document::Value<'_>`.
//!     type Item = (Field, &'a serde_json::Value);
//!
//!     fn next(&mut self) -> Option<Self::Item> {
//!         let (field, value) = self.0.next()?;
//!         Some((*field, value))
//!     }
//! }
//! ```
//!
//! You may have noticed in this example that we haven't needed to implement any custom value types,
//! instead we've just used a [serde_json::Value] type which tantivy provides an existing
//! implementation for.
//!
//! ## Implementing custom values
//! In order to allow documents to return custom types, they must implement
//! the [Value] trait which provides a way for Tantivy to get a `ReferenceValue` that it can then
//! index and store.
//! Internally, Tantivy only works with `ReferenceValue`, which is an enum that tries to borrow
//! as much data as it can.
//!
//! Values can just as easily be customised as documents by implementing the `Value` trait.
//!
//! The implementer of this type should not own the data it's returning, instead it should just
//! hold references of the data held by the parent [Document] which can then be passed
//! on to the [ReferenceValue].
//!
//! This is why [Value] is implemented for `&'a serde_json::Value` and
//! [&'a tantivy::schema::document::OwnedValue](OwnedValue) but not for their owned counterparts, as
//! we cannot satisfy the lifetime bounds necessary when indexing the documents.
//!
//! ### A note about returning values
//! The custom value type does not have to be the type stored by the document, instead the
//! implementer of a `Value` can just be used as a way to convert between the owned type
//! kept in the parent document, and the value passed into Tantivy.
//!
//! ```
//! use tantivy::schema::document::ReferenceValue;
//! use tantivy::schema::document::ReferenceValueLeaf;
//! use tantivy::schema::{Value};
//!
//! #[derive(Debug)]
//! /// Our custom value type which has 3 types, a string, float and bool.
//! #[allow(dead_code)]
//! pub enum MyCustomValue<'a> {
//!     // Our string data is owned by the parent document, instead we just
//!     // hold onto a reference of this data.
//!     String(&'a str),
//!     Float(f64),
//!     Bool(bool),
//! }
//!
//! impl<'a> Value<'a> for MyCustomValue<'a> {
//!     // We don't need to worry about these types here as we're not
//!     // working with nested types, but if we wanted to we would
//!     // define our two iterator types, a sequence of ReferenceValues
//!     // for the array iterator and a sequence of key-value pairs for objects.
//!     type ArrayIter = std::iter::Empty<Self>;
//!     type ObjectIter = std::iter::Empty<(&'a str, Self)>;
//!
//!     // The ReferenceValue which Tantivy can use.
//!     fn as_value(&self) -> ReferenceValue<'a, Self> {
//!         // We can support any type that Tantivy itself supports.
//!         match self {
//!             MyCustomValue::String(val) => ReferenceValue::Leaf(ReferenceValueLeaf::Str(*val)),
//!             MyCustomValue::Float(val) => ReferenceValue::Leaf(ReferenceValueLeaf::F64(*val)),
//!             MyCustomValue::Bool(val) => ReferenceValue::Leaf(ReferenceValueLeaf::Bool(*val)),
//!         }
//!     }
//!
//! }
//! ```
//!
//! TODO: Complete this section...

mod de;
mod default_document;
mod existing_type_impls;
mod owned_value;
mod se;
mod value;

use std::collections::BTreeMap;
use std::mem;

pub(crate) use self::de::BinaryDocumentDeserializer;
pub use self::de::{
    ArrayAccess, DeserializeError, DocumentDeserialize, DocumentDeserializer, ObjectAccess,
    ValueDeserialize, ValueDeserializer, ValueType, ValueVisitor,
};
pub use self::default_document::{
    CompactDocArrayIter, CompactDocObjectIter, CompactDocValue, DocParsingError, TantivyDocument,
};
pub use self::owned_value::OwnedValue;
pub(crate) use self::se::BinaryDocumentSerializer;
pub use self::value::{ReferenceValue, ReferenceValueLeaf, Value};
use super::*;

/// The core trait representing a document within the index.
pub trait Document: Send + Sync + 'static {
    /// The value type handed out for each field of the document.
    type Value<'a>: Value<'a> + Clone
    where Self: 'a;

    /// The iterator type yielding every `(field, value)` pair of the document.
    type FieldsValuesIter<'a>: Iterator<Item = (Field, Self::Value<'a>)>
    where Self: 'a;

    /// Returns an iterator over all fields and values in the document.
    fn iter_fields_and_values(&self) -> Self::FieldsValuesIter<'_>;

    /// Groups the document's values by field, with the groups ordered by field.
    ///
    /// The sort is stable, so values of the same field keep the order in which
    /// `iter_fields_and_values` produced them. An empty document yields an empty `Vec`.
    ///
    /// Nothing is cached: the grouping is recomputed on every call.
    fn get_sorted_field_values(&self) -> Vec<(Field, Vec<Self::Value<'_>>)> {
        let mut pairs: Vec<(Field, Self::Value<'_>)> = self.iter_fields_and_values().collect();
        pairs.sort_by_key(|(field, _)| *field);

        let mut groups = Vec::new();
        for (field, value) in pairs {
            match groups.last_mut() {
                // Same field as the group being built: extend it.
                Some((group_field, group)) if *group_field == field => group.push(value),
                // First value overall, or a new field: open a new group.
                _ => groups.push((field, vec![value])),
            }
        }
        groups
    }

    /// Builds a [`NamedFieldDocument`] keyed by the schema's field names.
    ///
    /// Every value is converted into an [`OwnedValue`].
    fn to_named_doc(&self, schema: &Schema) -> NamedFieldDocument {
        let mut named_fields = BTreeMap::new();
        for (field, grouped_values) in self.get_sorted_field_values() {
            let mut owned_values: Vec<OwnedValue> = Vec::with_capacity(grouped_values.len());
            for value in grouped_values {
                owned_values.push(OwnedValue::from(value.as_value()));
            }
            let name = schema.get_field_name(field).to_string();
            named_fields.insert(name, owned_values);
        }
        NamedFieldDocument(named_fields)
    }

    /// Encodes the document as a JSON string, using the schema's field names as keys.
    ///
    /// Encoding is expected to never fail; a failure is treated as a bug and panics.
    fn to_json(&self, schema: &Schema) -> String {
        let named_doc = self.to_named_doc(schema);
        serde_json::to_string(&named_doc).expect("doc encoding failed. This is a bug")
    }
}

/// One-byte codes identifying each value type.
///
/// NOTE(review): presumably these are the type tags written by the binary document
/// (de)serializer, in which case existing values must never be renumbered — confirm
/// against `se.rs` / `de.rs`.
pub(crate) mod type_codes {
    pub const TEXT_CODE: u8 = 0;
    pub const U64_CODE: u8 = 1;
    pub const I64_CODE: u8 = 2;
    pub const HIERARCHICAL_FACET_CODE: u8 = 3;
    pub const BYTES_CODE: u8 = 4;
    pub const DATE_CODE: u8 = 5;
    pub const F64_CODE: u8 = 6;
    /// Marks an extended type; see the extended type codes at the end of this module.
    pub const EXT_CODE: u8 = 7;

    #[deprecated]
    pub const JSON_OBJ_CODE: u8 = 8; // Replaced by the `OBJECT_CODE`.
    pub const BOOL_CODE: u8 = 9;
    pub const IP_CODE: u8 = 10;
    pub const NULL_CODE: u8 = 11;
    pub const ARRAY_CODE: u8 = 12;
    pub const OBJECT_CODE: u8 = 13;

    // Extended type codes
    // These are numbered separately from the codes above, so `0` is reused here.
    pub const TOK_STR_EXT_CODE: u8 = 0;
}


================================================
FILE: src/schema/document/owned_value.rs
================================================
use std::collections::BTreeMap;
use std::fmt;
use std::net::Ipv6Addr;

use base64::engine::general_purpose::STANDARD as BASE64;
use base64::Engine;
use serde::de::{MapAccess, SeqAccess};
use time::format_description::well_known::Rfc3339;
use time::OffsetDateTime;

use super::existing_type_impls::can_be_rfc3339_date_time;
use super::ReferenceValueLeaf;
use crate::schema::document::{
    ArrayAccess, DeserializeError, ObjectAccess, ReferenceValue, Value, ValueDeserialize,
    ValueDeserializer, ValueVisitor,
};
use crate::schema::Facet;
use crate::tokenizer::PreTokenizedString;
use crate::DateTime;

/// This is an owned variant of `Value` that can be passed around without lifetimes.
/// It represents the value of any field, as an enum over all of the possible
/// field types.
#[derive(Debug, Clone, PartialEq)]
pub enum OwnedValue {
    /// A null value.
    Null,
    /// The str type is used for any text information.
    Str(String),
    /// Pre-tokenized str type.
    PreTokStr(PreTokenizedString),
    /// Unsigned 64-bits Integer `u64`
    U64(u64),
    /// Signed 64-bits Integer `i64`
    I64(i64),
    /// 64-bits Float `f64`
    F64(f64),
    /// Bool value
    Bool(bool),
    /// Date/time with nanoseconds precision
    Date(DateTime),
    /// Facet
    Facet(Facet),
    /// Arbitrarily sized byte array
    Bytes(Vec<u8>),
    /// A set of values.
    Array(Vec<Self>),
    /// Dynamic object value, stored as a list of key-value pairs.
    Object(Vec<(String, Self)>),
    /// IpV6 Address. Internally there is no IpV4, it needs to be converted to `Ipv6Addr`.
    IpAddr(Ipv6Addr),
}

/// Identity conversion: an `OwnedValue` can be borrowed as itself, so generic code
/// bounded by `AsRef<OwnedValue>` accepts it directly.
impl AsRef<OwnedValue> for OwnedValue {
    #[inline]
    fn as_ref(&self) -> &OwnedValue {
        self
    }
}

impl OwnedValue {
    /// Returns a u8 discriminant value for the `OwnedValue` variant.
    ///
    /// This can be used to sort `OwnedValue` instances by their type.
    /// The returned number depends only on the variant, never on the payload.
    pub fn discriminant_value(&self) -> u8 {
        match self {
            OwnedValue::Null => 0,
            OwnedValue::Str(_) => 1,
            OwnedValue::PreTokStr(_) => 2,
            // It is key to make sure U64, I64, F64 are grouped together in there, otherwise we
            // might be breaking transitivity.
            OwnedValue::U64(_) => 3,
            OwnedValue::I64(_) => 4,
            OwnedValue::F64(_) => 5,
            OwnedValue::Bool(_) => 6,
            OwnedValue::Date(_) => 7,
            OwnedValue::Facet(_) => 8,
            OwnedValue::Bytes(_) => 9,
            OwnedValue::Array(_) => 10,
            OwnedValue::Object(_) => 11,
            OwnedValue::IpAddr(_) => 12,
        }
    }
}

/// Exposes a borrowed [`OwnedValue`] as a [`Value`].
///
/// Every leaf borrows or copies from the owned value, except the pre-tokenized
/// string, which is cloned into a new `Box` on each call.
impl<'a> Value<'a> for &'a OwnedValue {
    type ArrayIter = std::slice::Iter<'a, OwnedValue>;
    type ObjectIter = ObjectMapIter<'a>;

    fn as_value(&self) -> ReferenceValue<'a, Self> {
        match self {
            OwnedValue::Null => ReferenceValueLeaf::Null.into(),
            OwnedValue::Str(text) => ReferenceValueLeaf::Str(text).into(),
            OwnedValue::PreTokStr(pre_tokenized) => {
                ReferenceValueLeaf::PreTokStr(Box::new(pre_tokenized.clone())).into()
            }
            OwnedValue::U64(number) => ReferenceValueLeaf::U64(*number).into(),
            OwnedValue::I64(number) => ReferenceValueLeaf::I64(*number).into(),
            OwnedValue::F64(number) => ReferenceValueLeaf::F64(*number).into(),
            OwnedValue::Bool(flag) => ReferenceValueLeaf::Bool(*flag).into(),
            OwnedValue::Date(date) => ReferenceValueLeaf::Date(*date).into(),
            OwnedValue::Facet(facet) => ReferenceValueLeaf::Facet(facet.encoded_str()).into(),
            OwnedValue::Bytes(bytes) => ReferenceValueLeaf::Bytes(bytes).into(),
            OwnedValue::Array(elements) => ReferenceValue::Array(elements.iter()),
            OwnedValue::Object(entries) => ReferenceValue::Object(ObjectMapIter(entries.iter())),
            OwnedValue::IpAddr(address) => ReferenceValueLeaf::IpAddr(*address).into(),
        }
    }
}

/// Rebuilds an [`OwnedValue`] from a deserializer.
///
/// Each visited input maps onto the `OwnedValue` variant of the same kind. Objects
/// keep their entries in the order the deserializer yields them, duplicates included.
impl ValueDeserialize for OwnedValue {
    fn deserialize<'de, D>(deserializer: D) -> Result<Self, DeserializeError>
    where D: ValueDeserializer<'de> {
        struct OwnedValueVisitor;

        impl ValueVisitor for OwnedValueVisitor {
            type Value = OwnedValue;

            fn visit_null(&self) -> Result<Self::Value, DeserializeError> {
                Ok(OwnedValue::Null)
            }

            fn visit_string(&self, val: String) -> Result<Self::Value, DeserializeError> {
                Ok(OwnedValue::Str(val))
            }

            fn visit_u64(&self, val: u64) -> Result<Self::Value, DeserializeError> {
                Ok(OwnedValue::U64(val))
            }

            fn visit_i64(&self, val: i64) -> Result<Self::Value, DeserializeError> {
                Ok(OwnedValue::I64(val))
            }

            fn visit_f64(&self, val: f64) -> Result<Self::Value, DeserializeError> {
                Ok(OwnedValue::F64(val))
            }

            fn visit_bool(&self, val: bool) -> Result<Self::Value, DeserializeError> {
                Ok(OwnedValue::Bool(val))
            }

            fn visit_datetime(&self, val: DateTime) -> Result<Self::Value, DeserializeError> {
                Ok(OwnedValue::Date(val))
            }

            fn visit_ip_address(&self, val: Ipv6Addr) -> Result<Self::Value, DeserializeError> {
                Ok(OwnedValue::IpAddr(val))
            }

            fn visit_facet(&self, val: Facet) -> Result<Self::Value, DeserializeError> {
                Ok(OwnedValue::Facet(val))
            }

            fn visit_bytes(&self, val: Vec<u8>) -> Result<Self::Value, DeserializeError> {
                Ok(OwnedValue::Bytes(val))
            }

            fn visit_pre_tokenized_string(
                &self,
                val: PreTokenizedString,
            ) -> Result<Self::Value, DeserializeError> {
                Ok(OwnedValue::PreTokStr(val))
            }

            fn visit_array<'de, A>(&self, mut access: A) -> Result<Self::Value, DeserializeError>
            where A: ArrayAccess<'de> {
                let mut items = Vec::with_capacity(access.size_hint());

                // Pull elements until the accessor is exhausted; errors bubble up via `?`.
                loop {
                    match access.next_element()? {
                        Some(item) => items.push(item),
                        None => break,
                    }
                }

                Ok(OwnedValue::Array(items))
            }

            fn visit_object<'de, A>(&self, mut access: A) -> Result<Self::Value, DeserializeError>
            where A: ObjectAccess<'de> {
                let mut entries = Vec::with_capacity(access.size_hint());

                loop {
                    match access.next_entry()? {
                        Some((key, value)) => entries.push((key, value)),
                        None => break,
                    }
                }

                Ok(OwnedValue::Object(entries))
            }
        }

        deserializer.deserialize_any(OwnedValueVisitor)
    }
}

// NOTE(review): `PartialEq` is derived and the `F64` variant holds an `f64`, so a
// value containing NaN does not compare equal to itself. `Eq` is asserted regardless;
// confirm callers never rely on reflexivity for NaN payloads.
impl Eq for OwnedValue {}

/// Serde serialization of an [`OwnedValue`].
///
/// Dates are written as RFC 3339 strings, bytes as standard base64 strings, objects
/// as maps, and IPv4-mapped addresses in their IPv4 form.
impl serde::Serialize for OwnedValue {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: serde::Serializer {
        use serde::ser::SerializeMap;
        match self {
            OwnedValue::Null => serializer.serialize_unit(),
            OwnedValue::Str(text) => serializer.serialize_str(text),
            OwnedValue::PreTokStr(pre_tokenized) => pre_tokenized.serialize(serializer),
            OwnedValue::U64(number) => serializer.serialize_u64(*number),
            OwnedValue::I64(number) => serializer.serialize_i64(*number),
            OwnedValue::F64(number) => serializer.serialize_f64(*number),
            OwnedValue::Bool(flag) => serializer.serialize_bool(*flag),
            OwnedValue::Date(date) => {
                time::serde::rfc3339::serialize(&date.into_utc(), serializer)
            }
            OwnedValue::Facet(facet) => facet.serialize(serializer),
            OwnedValue::Bytes(bytes) => {
                let encoded = BASE64.encode(bytes);
                serializer.serialize_str(&encoded)
            }
            OwnedValue::Array(elements) => elements.serialize(serializer),
            OwnedValue::Object(entries) => {
                let mut map = serializer.serialize_map(Some(entries.len()))?;
                for (key, value) in entries {
                    map.serialize_entry(key, value)?;
                }
                map.end()
            }
            OwnedValue::IpAddr(ip_v6) => {
                // Ensure IpV4 addresses get serialized as IpV4, but excluding IpV6 loopback.
                match ip_v6.to_ipv4_mapped() {
                    Some(ip_v4) => ip_v4.serialize(serializer),
                    None => ip_v6.serialize(serializer),
                }
            }
        }
    }
}

/// Serde deserialization of an [`OwnedValue`] from any self-describing format.
///
/// The input is mapped by shape: unit to `Null`, bools, integers, floats and strings
/// to their matching variants, sequences to `Array` and maps to `Object`. Map entries
/// are kept in the order the format yields them. Strings are never reinterpreted
/// here: they always become `Str`.
impl<'de> serde::Deserialize<'de> for OwnedValue {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: serde::Deserializer<'de> {
        struct ValueVisitor;

        impl<'de> serde::de::Visitor<'de> for ValueVisitor {
            type Value = OwnedValue;

            fn expecting(&self, formatter: &mut fmt::Formatter<'_>) -> fmt::Result {
                // Shown in serde's "invalid type ..., expected ..." errors, so it must list
                // what this visitor really accepts.
                formatter.write_str("a null, bool, number, string, array or object")
            }

            fn visit_bool<E>(self, v: bool) -> Result<Self::Value, E> {
                Ok(OwnedValue::Bool(v))
            }

            fn visit_i64<E>(self, v: i64) -> Result<Self::Value, E> {
                Ok(OwnedValue::I64(v))
            }

            fn visit_u64<E>(self, v: u64) -> Result<Self::Value, E> {
                Ok(OwnedValue::U64(v))
            }

            fn visit_f64<E>(self, v: f64) -> Result<Self::Value, E> {
                Ok(OwnedValue::F64(v))
            }

            fn visit_str<E>(self, v: &str) -> Result<Self::Value, E> {
                Ok(OwnedValue::Str(v.to_owned()))
            }

            fn visit_string<E>(self, v: String) -> Result<Self::Value, E> {
                Ok(OwnedValue::Str(v))
            }

            fn visit_unit<E>(self) -> Result<Self::Value, E>
            where E: serde::de::Error {
                Ok(OwnedValue::Null)
            }

            fn visit_seq<A>(self, mut seq: A) -> Result<Self::Value, A::Error>
            where A: SeqAccess<'de> {
                // The size hint is optional; start from an empty buffer when it is absent.
                let mut elements = Vec::with_capacity(seq.size_hint().unwrap_or_default());

                while let Some(value) = seq.next_element()? {
                    elements.push(value);
                }

                Ok(OwnedValue::Array(elements))
            }

            fn visit_map<A>(self, mut map: A) -> Result<Self::Value, A::Error>
            where A: MapAccess<'de> {
                let mut object = map.size_hint().map(Vec::with_capacity).unwrap_or_default();
                while let Some((key, value)) = map.next_entry()? {
                    object.push((key, value));
                }
                Ok(OwnedValue::Object(object))
            }
        }

        deserializer.deserialize_any(ValueVisitor)
    }
}

/// Converts a borrowed [`ReferenceValue`] into an [`OwnedValue`].
///
/// Borrowed strings, bytes and facets are copied into owned buffers. Arrays and
/// objects are converted recursively, element by element, preserving order.
impl<'a, V: Value<'a>> From<ReferenceValue<'a, V>> for OwnedValue {
    fn from(val: ReferenceValue<'a, V>) -> OwnedValue {
        match val {
            ReferenceValue::Leaf(leaf) => match leaf {
                ReferenceValueLeaf::Null => OwnedValue::Null,
                ReferenceValueLeaf::Str(val) => OwnedValue::Str(val.to_string()),
                ReferenceValueLeaf::U64(val) => OwnedValue::U64(val),
                ReferenceValueLeaf::I64(val) => OwnedValue::I64(val),
                ReferenceValueLeaf::F64(val) => OwnedValue::F64(val),
                ReferenceValueLeaf::Date(val) => OwnedValue::Date(val),
                ReferenceValueLeaf::Facet(val) => {
                    OwnedValue::Facet(Facet::from_encoded_string(val.to_string()))
                }
                ReferenceValueLeaf::Bytes(val) => OwnedValue::Bytes(val.to_vec()),
                ReferenceValueLeaf::IpAddr(val) => OwnedValue::IpAddr(val),
                ReferenceValueLeaf::Bool(val) => OwnedValue::Bool(val),
                // The leaf is owned here, so the boxed string can be moved out directly
                // instead of being cloned first.
                ReferenceValueLeaf::PreTokStr(val) => OwnedValue::PreTokStr(*val),
            },
            ReferenceValue::Array(val) => {
                OwnedValue::Array(val.map(|v| v.as_value().into()).collect())
            }
            ReferenceValue::Object(val) => OwnedValue::Object(
                val.map(|(k, v)| (k.to_string(), v.as_value().into()))
                    .collect(),
            ),
        }
    }
}

impl From<String> for OwnedValue {
    fn from(s: String) -> OwnedValue {
        OwnedValue::Str(s)
    }
}

impl From<Ipv6Addr> for OwnedValue {
    fn from(v: Ipv6Addr) -> OwnedValue {
        OwnedValue::IpAddr(v)
    }
}

impl From<u64> for OwnedValue {
    fn from(v: u64) -> OwnedValue {
        OwnedValue::U64(v)
    }
}

impl From<i64> for OwnedValue {
    fn from(v: i64) -> OwnedValue {
        OwnedValue::I64(v)
    }
}

impl From<f64> for OwnedValue {
    fn from(v: f64) -> OwnedValue {
        OwnedValue::F64(v)
    }
}

impl From<bool> for OwnedValue {
    fn from(b: bool) -> Self {
        OwnedValue::Bool(b)
    }
}

impl From<DateTime> for OwnedValue {
    fn from(dt: DateTime) -> OwnedValue {
        OwnedValue::Date(dt)
    }
}

impl<'a> From<&'a str> for OwnedValue {
    fn from(s: &'a str) -> OwnedValue {
        OwnedValue::Str(s.to_string())
    }
}

impl<'a> From<&'a [u8]> for OwnedValue {
    fn from(bytes: &'a [u8]) -> OwnedValue {
        OwnedValue::Bytes(bytes.to_vec())
    }
}

impl From<Facet> for OwnedValue {
    fn from(facet: Facet) -> OwnedValue {
        OwnedValue::Facet(facet)
    }
}

impl From<Vec<u8>> for OwnedValue {
    fn from(bytes: Vec<u8>) -> OwnedValue {
        OwnedValue::Bytes(bytes)
    }
}

impl From<PreTokenizedString> for OwnedValue {
    fn from(pretokenized_string: PreTokenizedString) -> OwnedValue {
        OwnedValue::PreTokStr(pretokenized_string)
    }
}

impl From<BTreeMap<String, OwnedValue>> for OwnedValue {
    fn from(object: BTreeMap<String, OwnedValue>) -> OwnedValue {
        let key_values = object.into_iter().collect();
        OwnedValue::Object(key_values)
    }
}

/// Converts a JSON value into an [`OwnedValue`].
///
/// * Numbers are mapped to `I64` when they fit, then `U64`, then `F64`.
/// * Strings that look like, and successfully parse as, RFC 3339 date times
///   become `Date` values normalized to UTC; every other string stays a `Str`.
/// * Arrays and objects are converted recursively.
///
/// # Panics
///
/// Panics if a JSON number can be represented neither as `i64`, `u64` nor `f64`.
impl From<serde_json::Value> for OwnedValue {
    fn from(value: serde_json::Value) -> Self {
        match value {
            serde_json::Value::Null => Self::Null,
            serde_json::Value::Bool(flag) => Self::Bool(flag),
            serde_json::Value::Number(number) => number
                .as_i64()
                .map(Self::I64)
                .or_else(|| number.as_u64().map(Self::U64))
                .or_else(|| number.as_f64().map(Self::F64))
                .unwrap_or_else(|| panic!("Unsupported serde_json number {number}")),
            serde_json::Value::String(text) => {
                // Only attempt the full parse when the cheap pre-check passes.
                let parsed_date = can_be_rfc3339_date_time(&text)
                    .then(|| OffsetDateTime::parse(&text, &Rfc3339).ok())
                    .flatten();
                match parsed_date {
                    Some(date_time) => {
                        let date_time_utc = date_time.to_offset(time::UtcOffset::UTC);
                        Self::Date(DateTime::from_utc(date_time_utc))
                    }
                    // Not a date after all: keep the original text untouched.
                    None => Self::Str(text),
                }
            }
            serde_json::Value::Array(elements) => {
                Self::Array(elements.into_iter().map(Self::from).collect())
            }
            serde_json::Value::Object(object) => Self::from(object),
        }
    }
}

/// Converts a JSON object into an object value, converting every entry's
/// value recursively and keeping the keys as they are.
impl From<serde_json::Map<String, serde_json::Value>> for OwnedValue {
    fn from(map: serde_json::Map<String, serde_json::Value>) -> Self {
        let mut entries: Vec<(String, OwnedValue)> = Vec::with_capacity(map.len());
        for (key, json_value) in map {
            entries.push((key, Self::from(json_value)));
        }
        Self::Object(entries)
    }
}

/// An iterator over the entries of an object stored as a slice of
/// `(String, OwnedValue)` pairs, yielding each key as a `&str` together with a
/// reference to its value.
pub struct ObjectMapIter<'a>(std::slice::Iter<'a, (String, OwnedValue)>);

impl<'a> Iterator for ObjectMapIter<'a> {
    type Item = (&'a str, &'a OwnedValue);

    fn next(&mut self) -> Option<Self::Item> {
        self.0.next().map(|(key, value)| (key.as_str(), value))
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::schema::{BytesOptions, Schema};
    use crate::{Document, TantivyDocument};

    /// Stores `payload` in the `my_bytes` field of a fresh document and returns
    /// that document rendered as JSON.
    fn bytes_doc_json(payload: &[u8]) -> String {
        let mut schema_builder = Schema::builder();
        let bytes_field = schema_builder.add_bytes_field("my_bytes", BytesOptions::default());
        let schema = schema_builder.build();
        let mut doc = TantivyDocument::default();
        doc.add_bytes(bytes_field, payload);
        doc.to_json(&schema)
    }

    /// Parses `rfc3339` into a date value and returns its pretty-printed JSON form.
    fn date_json(rfc3339: &str) -> String {
        let parsed = OffsetDateTime::parse(rfc3339, &Rfc3339).unwrap();
        let value = OwnedValue::from(DateTime::from_utc(parsed));
        serde_json::to_string_pretty(&value).unwrap()
    }

    #[test]
    fn test_parse_bytes_doc() {
        let json_string = bytes_doc_json("this is a test".as_bytes());
        assert_eq!(json_string, r#"{"my_bytes":["dGhpcyBpcyBhIHRlc3Q="]}"#);
    }

    #[test]
    fn test_parse_empty_bytes_doc() {
        let json_string = bytes_doc_json("".as_bytes());
        assert_eq!(json_string, r#"{"my_bytes":[""]}"#);
    }

    #[test]
    fn test_parse_many_bytes_doc() {
        let json_string = bytes_doc_json(
            "A bigger test I guess\nspanning on multiple lines\nhoping this will work".as_bytes(),
        );
        assert_eq!(
            json_string,
            r#"{"my_bytes":["QSBiaWdnZXIgdGVzdCBJIGd1ZXNzCnNwYW5uaW5nIG9uIG11bHRpcGxlIGxpbmVzCmhvcGluZyB0aGlzIHdpbGwgd29yaw=="]}"#
        );
    }

    #[test]
    fn test_serialize_date() {
        assert_eq!(
            date_json("1996-12-20T00:39:57+00:00"),
            r#""1996-12-20T00:39:57Z""#
        );
        // The time zone information gets lost by conversion into `Value::Date` and
        // implicitly becomes UTC.
        assert_eq!(
            date_json("1996-12-20T00:39:57-01:00"),
            r#""1996-12-20T01:39:57Z""#
        );
    }
}


================================================
FILE: src/schema/document/se.rs
================================================
use std::borrow::Cow;
use std::io;
use std::io::Write;

use columnar::MonotonicallyMappableToU128;
use common::{f64_to_u64, BinarySerializable, VInt};

use super::{OwnedValue, ReferenceValueLeaf};
use crate::schema::document::{type_codes, Document, ReferenceValue, Value};
use crate::schema::Schema;

/// Writes documents implementing [`Document`] to a writer in binary form.
///
/// The schema is consulted so that only stored fields end up in the output.
pub struct BinaryDocumentSerializer<'se, W> {
    writer: &'se mut W,
    schema: &'se Schema,
}

impl<'se, W> BinaryDocumentSerializer<'se, W>
where W: Write
{
    /// Builds a serializer that writes to `writer` and uses `schema` to decide
    /// which fields are stored.
    pub(crate) fn new(writer: &'se mut W, schema: &'se Schema) -> Self {
        Self { writer, schema }
    }

    /// Serializes `doc` into the writer.
    ///
    /// The output starts with the number of stored field values as a [`VInt`],
    /// followed by one `(field, value)` pair per stored field value. A
    /// pre-tokenized string at the top level is written as its plain text only.
    ///
    /// # Errors
    ///
    /// Returns any error raised by the writer, or an error if the number of
    /// pairs written differs from the number announced in the header.
    #[inline]
    pub(crate) fn serialize_doc<D>(&mut self, doc: &D) -> io::Result<()>
    where D: Document {
        // The document is walked twice: once to count the stored values for the
        // header and once to write them.
        let stored_field_values = || {
            doc.iter_fields_and_values()
                .filter(|(field, _)| self.schema.get_field_entry(*field).is_stored())
        };
        let num_field_values = stored_field_values().count();
        VInt(num_field_values as u64).serialize(self.writer)?;

        let mut actual_length = 0;
        for (field, value_access) in stored_field_values() {
            field.serialize(self.writer)?;

            let mut serializer = BinaryValueSerializer::new(self.writer);
            match value_access.as_value() {
                ReferenceValue::Leaf(ReferenceValueLeaf::PreTokStr(pre_tokenized_text)) => {
                    // Only the text is stored; the tokens are left out.
                    let text_only = ReferenceValue::Leaf::<&'_ OwnedValue>(
                        ReferenceValueLeaf::Str(&pre_tokenized_text.text),
                    );
                    serializer.serialize_value(text_only)?;
                }
                other => serializer.serialize_value(other)?,
            }

            actual_length += 1;
        }

        if actual_length == num_field_values {
            return Ok(());
        }
        Err(io::Error::other(format!(
            "Unexpected number of entries written to serializer, expected {num_field_values} \
             entries, got {actual_length} entries",
        )))
    }
}

/// A serializer for a single value.
pub struct BinaryValueSerializer<'se, W> {
    writer: &'se mut W,
}

impl<'se, W> BinaryValueSerializer<'se, W>
where W: Write
{
    /// Creates a new serializer with a provided writer.
    pub(crate) fn new(writer: &'se mut W) -> Self {
        Self { writer }
    }

    fn serialize_with_type_code<T: BinarySerializable>(
        &mut self,
        code: u8,
        val: &T,
    ) -> io::Result<()> {
        self.write_type_code(code)?;
        BinarySerializable::serialize(val, self.writer)
    }

    /// Attempts to serialize a given value and write the output
    /// to the writer.
    pub(crate) fn serialize_value<'a, V>(
        &mut self,
        value: ReferenceValue<'a, V>,
    ) -> io::Result<()>
    where
        V: Value<'a>,
    {
        match value {
            ReferenceValue::Leaf(leaf) => match leaf {
                ReferenceValueLeaf::Null => self.write_type_code(type_codes::NULL_CODE),
                ReferenceValueLeaf::Str(val) => {
                    self.serialize_with_type_code(type_codes::TEXT_CODE, &Cow::Borrowed(val))
                }
                ReferenceValueLeaf::U64(val) => {
                    self.serialize_with_type_code(type_codes::U64_CODE, &val)
                }
                ReferenceValueLeaf::I64(val) => {
                    self.serialize_with_type_code(type_codes::I64_CODE, &val)
                }
                ReferenceValueLeaf::F64(val) => {
                    self.serialize_with_type_code(type_codes::F64_CODE, &f64_to_u64(val))
                }
                ReferenceValueLeaf::Date(val) => {
                    self.write_type_code(type_codes::DATE_CODE)?;
                    let timestamp_nanos: i64 = val.into_timestamp_nanos();
                    BinarySerializable::serialize(&timestamp_nanos, self.writer)
                }
                ReferenceValueLeaf::Facet(val) => self.serialize_with_type_code(
                    type_codes::HIERARCHICAL_FACET_CODE,
                    &Cow::Borrowed(val),
                ),
                ReferenceValueLeaf::Bytes(val) => {
                    self.serialize_with_type_code(type_codes::BYTES_CODE, &Cow::Borrowed(val))
                }
                ReferenceValueLeaf::IpAddr(val) => {
                    self.serialize_with_type_code(type_codes::IP_CODE, &val.to_u128())
                }
                ReferenceValueLeaf::Bool(val) => {
                    self.serialize_with_type_code(type_codes::BOOL_CODE, &val)
                }
                ReferenceValueLeaf::PreTokStr(val) => {
                    self.write_type_code(type_codes::EXT_CODE)?;
                    self.serialize_with_type_code(type_codes::TOK_STR_EXT_CODE, &*val)
                }
            },
            ReferenceValue::Array(elements) => {
                self.write_type_code(type_codes::ARRAY_CODE)?;

                // Somewhat unfortunate that we do this here however, writing the
                // length at the end of the complicates things quite considerably.
                let elements: Vec<V> = elements.collect();

                let mut serializer = BinaryArraySerializer::begin(elements.len(), self.writer)?;

                for value in elements {
                    serializer.serialize_value(value.as_value())?;
                }

                serializer.end()
            }
            ReferenceValue::Object(object) => {
                self.write_type_code(type_codes::OBJECT_CODE)?;

                // Somewhat unfortunate that we do this here however, writing the
                // length at the end of the complicates things quite considerably.
                let entries: Vec<(&str, V)> = object.collect();

                let mut serializer = BinaryObjectSerializer::begin(entries.len(), self.writer)?;

                for (key, value) in entries {
                    serializer.serialize_entry(key, value.as_value())?;
                }

                serializer.end()
            }
        }
    }

    fn write_type_code(&mut self, code: u8) -> io::Result<()> {
        code.serialize(self.writer)
    }
}

/// Writes a length-prefixed sequence of values to a writer and checks that the
/// number of values written matches the announced length.
pub struct BinaryArraySerializer<'se, W> {
    writer: &'se mut W,
    expected_length: usize,
    actual_length: usize,
}

impl<'se, W> BinaryArraySerializer<'se, W>
where W: Write
{
    /// Starts a new array by writing `length` to the writer as a [`VInt`].
    pub(crate) fn begin(length: usize, writer: &'se mut W) -> io::Result<Self> {
        let header = VInt(length as u64);
        header.serialize(writer)?;

        Ok(Self {
            actual_length: 0,
            expected_length: length,
            writer,
        })
    }

    /// Serializes `value` as the next element of the array.
    pub(crate) fn serialize_value<'a, V>(
        &mut self,
        value: ReferenceValue<'a, V>,
    ) -> io::Result<()>
    where
        V: Value<'a>,
    {
        BinaryValueSerializer::new(self.writer).serialize_value(value)?;
        self.actual_length += 1;
        Ok(())
    }

    /// Finishes the array.
    ///
    /// # Errors
    ///
    /// Returns an error if the number of serialized elements differs from the
    /// length passed to [`Self::begin`].
    pub(crate) fn end(self) -> io::Result<()> {
        if self.expected_length == self.actual_length {
            return Ok(());
        }
        Err(io::Error::other(format!(
            "Unexpected number of entries written to serializer, expected {} entries, got {} \
             entries",
            self.expected_length, self.actual_length,
        )))
    }
}

/// Writes a length-prefixed set of key-value pairs to a writer and checks that
/// the number of pairs written matches the announced length.
pub struct BinaryObjectSerializer<'se, W> {
    inner: BinaryArraySerializer<'se, W>,
    expected_length: usize,
    actual_length: usize,
}

impl<'se, W> BinaryObjectSerializer<'se, W>
where W: Write
{
    /// Starts a new object of `length` entries and writes its length header.
    pub(crate) fn begin(length: usize, writer: &'se mut W) -> io::Result<Self> {
        // Keys and values are counted separately, hence the factor of two:
        // [("a", 1), ("b", 2)] is actually stored as ["a", 1, "b", 2]
        let flattened_length = length * 2;
        let inner = BinaryArraySerializer::begin(flattened_length, writer)?;

        Ok(Self {
            actual_length: 0,
            expected_length: length,
            inner,
        })
    }

    /// Serializes one entry: `key` as a string value, immediately followed by
    /// `value`.
    pub(crate) fn serialize_entry<'a, V>(
        &mut self,
        key: &'a str,
        value: ReferenceValue<'a, V>,
    ) -> io::Result<()>
    where
        V: Value<'a>,
    {
        // Keys are stored inline with the values, each as a regular string value.
        // Dropping the type code byte of every key would be slightly more
        // compact, but the gain is largely not worth the extra complexity.
        let key_value = ReferenceValue::<'a, V>::Leaf(ReferenceValueLeaf::Str(key));
        self.inner.serialize_value(key_value)?;
        self.inner.serialize_value(value)?;

        self.actual_length += 1;
        Ok(())
    }

    /// Finishes the object.
    ///
    /// # Errors
    ///
    /// Returns an error if the number of serialized entries differs from the
    /// length passed to [`Self::begin`].
    pub(crate) fn end(self) -> io::Result<()> {
        if self.expected_length == self.actual_length {
            // With the entry count verified, the inner check on the flattened
            // key/value count is not expected to fail.
            return self.inner.end();
        }
        Err(io::Error::other(format!(
            "Unexpected number of entries written to serializer, expected {} entries, got {} \
             entries",
            self.expected_length, self.actual_length,
        )))
    }
}

#[cfg(test)]
mod tests {
    use std::collections::BTreeMap;

    use serde_json::Number;
    use tokenizer_api::Token;

    use super::*;
    use crate::schema::document::existing_type_impls::JsonObjectIter;
    use crate::schema::{Facet, Field, FAST, STORED, TEXT};
    use crate::tokenizer::PreTokenizedString;

    /// Serializes `value` with a [`BinaryValueSerializer`] and returns the bytes written.
    fn serialize_value<'a>(value: ReferenceValue<'a, &'a serde_json::Value>) -> Vec<u8> {
        let mut writer = Vec::new();

        let mut serializer = BinaryValueSerializer::new(&mut writer);
        serializer.serialize_value(value).expect("Serialize value");

        writer
    }

    /// A macro for defining the expected binary representation
    /// of the serialized values in a somewhat human readable way.
    macro_rules! binary_repr {
        // Plain form: a sequence of `type_code [, ext_code] => value` entries, each
        // written as its code(s) followed by the serialized value.
        ($( $type_code:expr $(, $ext_code:expr)? => $value:expr $(,)?)*) => {{
            let mut writer = Vec::new();

            $(
                $type_code.serialize(&mut writer).unwrap();

                $(
                    $ext_code.serialize(&mut writer).unwrap();
                )?

                BinarySerializable::serialize(
                    &$value,
                    &mut writer,
                ).unwrap();
            )*

            writer
        }};
        // Collection form: the collection's type code and its length as a `VInt`,
        // followed by the same kind of entries as in the plain form.
        (collection $code:expr, length $len:expr, $( $type_code:expr $(, $ext_code:expr)? => $value:expr $(,)?)*) => {{
            let mut writer = Vec::new();

            $code.serialize(&mut writer).unwrap();
            VInt($len as u64).serialize(&mut writer).unwrap();

            $(
                $type_code.serialize(&mut writer).unwrap();

                $(
                    $ext_code.serialize(&mut writer).unwrap();
                )?

                BinarySerializable::serialize(
                    &$value,
                    &mut writer,
                ).unwrap();
            )*

            writer
        }};
    }

    /// Checks the binary representation of each kind of leaf value exercised below.
    #[test]
    fn test_simple_value_serialize() {
        let result = serialize_value(ReferenceValueLeaf::Null.into());
        let expected = binary_repr!(
            type_codes::NULL_CODE => (),
        );
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );

        let result = serialize_value(ReferenceValueLeaf::Str("hello, world").into());
        let expected = binary_repr!(
            type_codes::TEXT_CODE => String::from("hello, world"),
        );
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );

        let result = serialize_value(ReferenceValueLeaf::U64(123).into());
        let expected = binary_repr!(
            type_codes::U64_CODE => 123u64,
        );
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );

        let result = serialize_value(ReferenceValueLeaf::I64(-123).into());
        let expected = binary_repr!(
            type_codes::I64_CODE => -123i64,
        );
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );

        // Floats are expected to be stored through their `f64_to_u64` mapping.
        let result = serialize_value(ReferenceValueLeaf::F64(123.3845f64).into());
        let expected = binary_repr!(
            type_codes::F64_CODE => f64_to_u64(123.3845f64),
        );
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );

        let result = serialize_value(ReferenceValueLeaf::Bool(false).into());
        let expected = binary_repr!(
            type_codes::BOOL_CODE => false,
        );
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );

        let facet = Facet::from_text("/hello/world").unwrap();
        let result = serialize_value(ReferenceValueLeaf::Facet(facet.encoded_str()).into());
        let expected = binary_repr!(
            type_codes::HIERARCHICAL_FACET_CODE => Facet::from_text("/hello/world").unwrap(),
        );
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );

        // Pre-tokenized strings are an extension type: the generic extension code
        // comes first, then the code of the concrete extension.
        let pre_tok_str = PreTokenizedString {
            text: "hello, world".to_string(),
            tokens: vec![Token::default(), Token::default()],
        };
        let result =
            serialize_value(ReferenceValueLeaf::PreTokStr(pre_tok_str.clone().into()).into());
        let expected = binary_repr!(
            type_codes::EXT_CODE, type_codes::TOK_STR_EXT_CODE => pre_tok_str,
        );
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );
    }

    /// Checks the binary representation of arrays: homogeneous, empty and mixed.
    #[test]
    fn test_array_serialize() {
        let elements = [serde_json::Value::Null, serde_json::Value::Null];
        let result = serialize_value(ReferenceValue::Array(elements.iter()));
        let expected = binary_repr!(
            collection type_codes::ARRAY_CODE,
            length elements.len(),
            type_codes::NULL_CODE => (),
            type_codes::NULL_CODE => (),
        );
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );

        let elements = [
            serde_json::Value::String("Hello, world".into()),
            serde_json::Value::String("Some demo".into()),
        ];
        let result = serialize_value(ReferenceValue::Array(elements.iter()));
        let expected = binary_repr!(
            collection type_codes::ARRAY_CODE,
            length elements.len(),
            type_codes::TEXT_CODE => String::from("Hello, world"),
            type_codes::TEXT_CODE => String::from("Some demo"),
        );
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );

        // An empty array consists of the type code and a zero length only.
        let elements = [];
        let result = serialize_value(ReferenceValue::Array(elements.iter()));
        let expected = binary_repr!(
            collection type_codes::ARRAY_CODE,
            length elements.len(),
        );
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );

        // Mixed element types; the integer JSON number is expected as an i64.
        let elements = [
            serde_json::Value::Null,
            serde_json::Value::String("Hello, world".into()),
            serde_json::Value::Number(12345.into()),
        ];
        let result = serialize_value(ReferenceValue::Array(elements.iter()));
        let expected = binary_repr!(
            collection type_codes::ARRAY_CODE,
            length elements.len(),
            type_codes::NULL_CODE => (),
            type_codes::TEXT_CODE => String::from("Hello, world"),
            type_codes::I64_CODE => 12345i64,
        );
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );
    }

    /// Checks the binary representation of objects, whose keys and values are
    /// stored inline as one flat sequence.
    #[test]
    fn test_object_serialize() {
        let mut object = serde_json::Map::new();
        object.insert(
            "my-first-key".into(),
            serde_json::Value::String("Hello".into()),
        );
        object.insert("my-second-key".into(), serde_json::Value::Null);
        object.insert(
            "my-third-key".into(),
            serde_json::Value::Number(Number::from_f64(123.0).unwrap()),
        );
        let result = serialize_value(ReferenceValue::Object(JsonObjectIter(object.iter())));
        let expected = binary_repr!(
            collection type_codes::OBJECT_CODE,
            length object.len() * 2,  // To account for keys counting towards the length
            type_codes::TEXT_CODE => String::from("my-first-key"),
            type_codes::TEXT_CODE => String::from("Hello"),
            type_codes::TEXT_CODE => String::from("my-second-key"),
            type_codes::NULL_CODE => (),
            type_codes::TEXT_CODE => String::from("my-third-key"),
            type_codes::F64_CODE => f64_to_u64(123.0),
        );
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );

        // An empty object: the length is zero, so no doubling is needed here.
        let object = serde_json::Map::new();
        let result = serialize_value(ReferenceValue::Object(JsonObjectIter(object.iter())));
        let expected = binary_repr!(
            collection type_codes::OBJECT_CODE,
            length object.len(),
        );
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );

        let mut object = serde_json::Map::new();
        object.insert("my-first-key".into(), serde_json::Value::Null);
        object.insert("my-second-key".into(), serde_json::Value::Null);
        object.insert("my-third-key".into(), serde_json::Value::Null);
        let result = serialize_value(ReferenceValue::Object(JsonObjectIter(object.iter())));
        let expected = binary_repr!(
            collection type_codes::OBJECT_CODE,
            length object.len() * 2, // To account for keys counting towards the length
            type_codes::TEXT_CODE => String::from("my-first-key"),
            type_codes::NULL_CODE => (),
            type_codes::TEXT_CODE => String::from("my-second-key"),
            type_codes::NULL_CODE => (),
            type_codes::TEXT_CODE => String::from("my-third-key"),
            type_codes::NULL_CODE => (),
        );
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );
    }

    /// Checks that collections nested inside an object are serialized in place,
    /// each with its own type code and length header.
    #[test]
    fn test_nested_serialize() {
        let mut object = serde_json::Map::new();
        object.insert(
            "my-array".into(),
            serde_json::Value::Array(vec![
                serde_json::Value::Null,
                serde_json::Value::String(String::from("bobby of the sea")),
            ]),
        );
        object.insert(
            "my-object".into(),
            serde_json::Value::Object(
                vec![
                    (
                        "inner-1".to_string(),
                        serde_json::Value::Number((-123i64).into()),
                    ),
                    (
                        "inner-2".to_string(),
                        serde_json::Value::String(String::from("bobby of the sea 2")),
                    ),
                ]
                .into_iter()
                .collect(),
            ),
        );
        let result = serialize_value(ReferenceValue::Object(JsonObjectIter(object.iter())));

        // The expected bytes are assembled piece by piece: the outer object header,
        // then each key followed by the full representation of its nested value.
        let mut expected = Vec::new();
        let header = binary_repr!(
            collection type_codes::OBJECT_CODE,
            length object.len() * 2,
        );
        expected.extend_from_slice(&header);
        expected
            .extend_from_slice(&binary_repr!(type_codes::TEXT_CODE => String::from("my-array")));
        let nested_array = binary_repr!(
            collection type_codes::ARRAY_CODE,
            length 2,
            type_codes::NULL_CODE => (),
            type_codes::TEXT_CODE => String::from("bobby of the sea"),
        );
        expected.extend_from_slice(&nested_array);
        expected
            .extend_from_slice(&binary_repr!(type_codes::TEXT_CODE => String::from("my-object")));
        let nested_object = binary_repr!(
            collection type_codes::OBJECT_CODE,
            length 4,   // 2 keys, 2 values
            type_codes::TEXT_CODE => String::from("inner-1"),
            type_codes::I64_CODE => -123i64,
            type_codes::TEXT_CODE => String::from("inner-2"),
            type_codes::TEXT_CODE => String::from("bobby of the sea 2"),
        );
        expected.extend_from_slice(&nested_object);
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );

        // Some more extreme nesting that might behave weirdly
        let mut object = serde_json::Map::new();
        object.insert(
            "my-array".into(),
            serde_json::Value::Array(vec![serde_json::Value::Array(vec![
                serde_json::Value::Array(vec![]),
                serde_json::Value::Array(vec![serde_json::Value::Null]),
            ])]),
        );
        let result = serialize_value(ReferenceValue::Object(JsonObjectIter(object.iter())));

        let mut expected = Vec::new();
        let header = binary_repr!(
            collection type_codes::OBJECT_CODE,
            length object.len() * 2,
        );
        expected.extend_from_slice(&header);
        expected
            .extend_from_slice(&binary_repr!(type_codes::TEXT_CODE => String::from("my-array")));
        // Outermost array: a single element, which is itself an array.
        let nested_array = binary_repr!(
            collection type_codes::ARRAY_CODE,
            length 1,
        );
        expected.extend_from_slice(&nested_array);
        // Middle array: two elements, both arrays.
        let nested_array = binary_repr!(
            collection type_codes::ARRAY_CODE,
            length 2,
        );
        expected.extend_from_slice(&nested_array);
        // First innermost array: empty.
        let nested_array = binary_repr!(
            collection type_codes::ARRAY_CODE,
            length 0,
        );
        expected.extend_from_slice(&nested_array);
        // Second innermost array: a single null.
        let nested_array = binary_repr!(
            collection type_codes::ARRAY_CODE,
            length 1,
            type_codes::NULL_CODE => (),
        );
        expected.extend_from_slice(&nested_array);
        assert_eq!(
            result, expected,
            "Expected serialized value to match the binary representation"
        );
    }

    /// Serializes `doc` with a [`BinaryDocumentSerializer`] for `schema` and
    /// returns the bytes written.
    #[inline]
    fn serialize_doc<D: Document>(doc: &D, schema: &Schema) -> Vec<u8> {
        let mut writer = Vec::new();

        let mut serializer = BinaryDocumentSerializer::new(&mut writer, schema);
        serializer.serialize_doc(doc).expect("Serialize value");

        writer
    }

    /// A helper macro for generating the expected binary representation of the document.
    macro_rules! expected_doc_data {
        // Header only: the number of field values as a `VInt`.
        (length $len:expr) => {{
            let mut writer = Vec::new();
            VInt($len as u64).serialize(&mut writer).unwrap();
            writer
        }};
        // Header followed by `field_id => value` pairs, each serialized in order.
        (length $len:expr, $( $field_id:expr => $value:expr $(,)?)*) => {{
            let mut writer = Vec::new();

            VInt($len as u64).serialize(&mut writer).unwrap();
            $(
                $field_id.serialize(&mut writer).unwrap();
                $value.serialize(&mut writer).unwrap();
            )*

            writer
        }};
    }

    /// Checks whole-document serialization: all fields stored, one field not
    /// stored, and an empty document.
    #[test]
    fn test_document_serialize() {
        // Both fields are stored, so both are expected in the output.
        let mut builder = Schema::builder();
        let name = builder.add_text_field("name", TEXT | STORED);
        let age = builder.add_u64_field("age", FAST | STORED);
        let schema = builder.build();

        let mut document = BTreeMap::new();
        document.insert(name, crate::schema::OwnedValue::Str("ChillFish8".into()));
        document.insert(age, crate::schema::OwnedValue::U64(20));

        let result = serialize_doc(&document, &schema);
        let mut expected = expected_doc_data!(length document.len());
        name.serialize(&mut expected).unwrap();
        expected
            .extend_from_slice(&binary_repr!(type_codes::TEXT_CODE => String::from("ChillFish8")));
        age.serialize(&mut expected).unwrap();
        expected.extend_from_slice(&binary_repr!(type_codes::U64_CODE => 20u64));
        assert_eq!(
            result, expected,
            "Expected serialized document to match the binary representation"
        );

        let mut builder = Schema::builder();
        let name = builder.add_text_field("name", TEXT | STORED);
        // This should be skipped when serializing.
        let age = builder.add_u64_field("age", FAST);
        let schema = builder.build();

        let mut document = BTreeMap::new();
        document.insert(name, crate::schema::OwnedValue::Str("ChillFish8".into()));
        document.insert(age, crate::schema::OwnedValue::U64(20));

        let result = serialize_doc(&document, &schema);
        // Only the stored `name` field counts towards the length.
        let mut expected = expected_doc_data!(length 1);
        name.serialize(&mut expected).unwrap();
        expected
            .extend_from_slice(&binary_repr!(type_codes::TEXT_CODE => String::from("ChillFish8")));
        assert_eq!(
            result, expected,
            "Expected serialized document to match the binary representation"
        );

        // An empty document against an empty schema: just the zero length header.
        let builder = Schema::builder();
        let schema = builder.build();
        let document = BTreeMap::<Field, crate::schema::OwnedValue>::new();
        let result = serialize_doc(&document, &schema);
        let expected = expected_doc_data!(length document.len());
        assert_eq!(
            result, expected,
            "Expected serialized document to match the binary representation"
        );
    }
}


================================================
FILE: src/schema/document/value.rs
================================================
use std::fmt::Debug;
use std::net::Ipv6Addr;

use common::DateTime;

use crate::tokenizer::PreTokenizedString;

/// A single field value.
///
/// Implementors only have to provide [`Value::as_value`]; every other
/// accessor is derived from it.
pub trait Value<'a>: Send + Sync + Debug {
    /// The iterator for walking through the elements within the array.
    type ArrayIter: Iterator<Item = Self>;
    /// The iterator walking through the key-value pairs within
    /// the object.
    type ObjectIter: Iterator<Item = (&'a str, Self)>;

    /// Returns the field value represented by an enum which borrows its data.
    fn as_value(&self) -> ReferenceValue<'a, Self>;

    /// Returns the leaf if the value is a leaf, `None` otherwise.
    #[inline]
    fn as_leaf(&self) -> Option<ReferenceValueLeaf<'a>> {
        match self.as_value() {
            ReferenceValue::Leaf(leaf) => Some(leaf),
            _ => None,
        }
    }

    /// Returns the str if the value is a string leaf, `None` otherwise.
    #[inline]
    fn as_str(&self) -> Option<&'a str> {
        self.as_leaf()?.as_str()
    }

    /// Returns the integer if the value is a u64 leaf, `None` otherwise.
    #[inline]
    fn as_u64(&self) -> Option<u64> {
        self.as_leaf()?.as_u64()
    }

    /// Returns the integer if the value is an i64 leaf, `None` otherwise.
    #[inline]
    fn as_i64(&self) -> Option<i64> {
        self.as_leaf()?.as_i64()
    }

    /// Returns the float if the value is an f64 leaf, `None` otherwise.
    #[inline]
    fn as_f64(&self) -> Option<f64> {
        self.as_leaf()?.as_f64()
    }

    /// Returns the datetime if the value is a datetime leaf, `None` otherwise.
    #[inline]
    fn as_datetime(&self) -> Option<DateTime> {
        self.as_leaf()?.as_datetime()
    }

    /// Returns the address if the value is an IP address leaf, `None` otherwise.
    #[inline]
    fn as_ip_addr(&self) -> Option<Ipv6Addr> {
        self.as_leaf()?.as_ip_addr()
    }

    /// Returns the boolean if the value is a bool leaf, `None` otherwise.
    #[inline]
    fn as_bool(&self) -> Option<bool> {
        self.as_leaf()?.as_bool()
    }

    /// Returns the pre-tokenized string if the value is a pre-tokenized
    /// string leaf, `None` otherwise.
    #[inline]
    fn as_pre_tokenized_text(&self) -> Option<Box<PreTokenizedString>> {
        self.as_leaf()?.into_pre_tokenized_text()
    }

    /// Returns the bytes if the value is a bytes leaf, `None` otherwise.
    #[inline]
    fn as_bytes(&self) -> Option<&'a [u8]> {
        self.as_leaf()?.as_bytes()
    }

    /// Returns the facet string if the value is a facet leaf, `None` otherwise.
    #[inline]
    fn as_facet(&self) -> Option<&'a str> {
        self.as_leaf()?.as_facet()
    }

    /// Returns the iterator over the array if the value is an array.
    #[inline]
    fn as_array(&self) -> Option<Self::ArrayIter> {
        match self.as_value() {
            ReferenceValue::Array(elements) => Some(elements),
            _ => None,
        }
    }

    /// Returns the iterator over the object if the value is an object.
    #[inline]
    fn as_object(&self) -> Option<Self::ObjectIter> {
        match self.as_value() {
            ReferenceValue::Object(entries) => Some(entries),
            _ => None,
        }
    }
}

/// An enum representing a leaf value for tantivy to index.
///
/// Text, facet and byte payloads are borrowed for the lifetime `'a`;
/// the other variants own their data.
#[derive(Clone, Debug, PartialEq)]
pub enum ReferenceValueLeaf<'a> {
    /// A null value.
    Null,
    /// The str type is used for any text information.
    Str(&'a str),
    /// Unsigned 64-bits Integer `u64`
    U64(u64),
    /// Signed 64-bits Integer `i64`
    I64(i64),
    /// 64-bits Float `f64`
    F64(f64),
    /// Date/time with nanoseconds precision
    Date(DateTime),
    /// Facet string needs to match the format of
    /// [Facet::encoded_str](crate::schema::Facet::encoded_str).
    Facet(&'a str),
    /// Arbitrarily sized byte array
    Bytes(&'a [u8]),
    /// IpV6 Address. Internally there is no IpV4, it needs to be converted to `Ipv6Addr`.
    IpAddr(Ipv6Addr),
    /// Bool value
    Bool(bool),
    /// Pre-tokenized str type.
    PreTokStr(Box<PreTokenizedString>),
}

impl From<u64> for ReferenceValueLeaf<'_> {
    #[inline]
    fn from(value: u64) -> Self {
        ReferenceValueLeaf::U64(value)
    }
}

impl From<i64> for ReferenceValueLeaf<'_> {
    #[inline]
    fn from(value: i64) -> Self {
        ReferenceValueLeaf::I64(value)
    }
}

impl From<f64> for ReferenceValueLeaf<'_> {
    #[inline]
    fn from(value: f64) -> Self {
        ReferenceValueLeaf::F64(value)
    }
}

impl From<bool> for ReferenceValueLeaf<'_> {
    #[inline]
    fn from(value: bool) -> Self {
        ReferenceValueLeaf::Bool(value)
    }
}

impl<'a> From<&'a str> for ReferenceValueLeaf<'a> {
    #[inline]
    fn from(value: &'a str) -> Self {
        ReferenceValueLeaf::Str(value)
    }
}

impl<'a> From<&'a [u8]> for ReferenceValueLeaf<'a> {
    #[inline]
    fn from(value: &'a [u8]) -> Self {
        ReferenceValueLeaf::Bytes(value)
    }
}

impl From<DateTime> for ReferenceValueLeaf<'_> {
    #[inline]
    fn from(value: DateTime) -> Self {
        ReferenceValueLeaf::Date(value)
    }
}

impl From<Ipv6Addr> for ReferenceValueLeaf<'_> {
    #[inline]
    fn from(value: Ipv6Addr) -> Self {
        ReferenceValueLeaf::IpAddr(value)
    }
}

impl From<PreTokenizedString> for ReferenceValueLeaf<'_> {
    #[inline]
    fn from(val: PreTokenizedString) -> Self {
        ReferenceValueLeaf::PreTokStr(Box::new(val))
    }
}

impl<'a, T: Value<'a> + ?Sized> From<ReferenceValueLeaf<'a>> for ReferenceValue<'a, T> {
    #[inline]
    fn from(value: ReferenceValueLeaf<'a>) -> Self {
        match value {
            ReferenceValueLeaf::Null => ReferenceValue::Leaf(ReferenceValueLeaf::Null),
            ReferenceValueLeaf::Str(val) => ReferenceValue::Leaf(ReferenceValueLeaf::Str(val)),
            ReferenceValueLeaf::U64(val) => ReferenceValue::Leaf(ReferenceValueLeaf::U64(val)),
            ReferenceValueLeaf::I64(val) => ReferenceValue::Leaf(ReferenceValueLeaf::I64(val)),
            ReferenceValueLeaf::F64(val) => ReferenceValue::Leaf(ReferenceValueLeaf::F64(val)),
            ReferenceValueLeaf::Date(val) => ReferenceValue::Leaf(ReferenceValueLeaf::Date(val)),
            ReferenceValueLeaf::Facet(val) => ReferenceValue::Leaf(ReferenceValueLeaf::Facet(val)),
            ReferenceValueLeaf::Bytes(val) => ReferenceValue::Leaf(ReferenceValueLeaf::Bytes(val)),
            ReferenceValueLeaf::IpAddr(val) => {
                ReferenceValue::Leaf(ReferenceValueLeaf::IpAddr(val))
            }
            ReferenceValueLeaf::Bool(val) => ReferenceValue::Leaf(ReferenceValueLeaf::Bool(val)),
            ReferenceValueLeaf::PreTokStr(val) => {
                ReferenceValue::Leaf(ReferenceValueLeaf::PreTokStr(val))
            }
        }
    }
}

impl<'a> ReferenceValueLeaf<'a> {
    /// Returns `true` if the leaf is the `Null` variant.
    #[inline]
    pub fn is_null(&self) -> bool {
        matches!(self, Self::Null)
    }

    /// Returns the str if the leaf is a `Str`, `None` otherwise.
    #[inline]
    pub fn as_str(&self) -> Option<&'a str> {
        match self {
            Self::Str(text) => Some(*text),
            _ => None,
        }
    }

    /// Returns the integer if the leaf is a `U64`, `None` otherwise.
    #[inline]
    pub fn as_u64(&self) -> Option<u64> {
        match self {
            Self::U64(number) => Some(*number),
            _ => None,
        }
    }

    /// Returns the integer if the leaf is an `I64`, `None` otherwise.
    #[inline]
    pub fn as_i64(&self) -> Option<i64> {
        match self {
            Self::I64(number) => Some(*number),
            _ => None,
        }
    }

    /// Returns the float if the leaf is an `F64`, `None` otherwise.
    #[inline]
    pub fn as_f64(&self) -> Option<f64> {
        match self {
            Self::F64(number) => Some(*number),
            _ => None,
        }
    }

    /// Returns the datetime if the leaf is a `Date`, `None` otherwise.
    #[inline]
    pub fn as_datetime(&self) -> Option<DateTime> {
        match self {
            Self::Date(date) => Some(*date),
            _ => None,
        }
    }

    /// Returns the address if the leaf is an `IpAddr`, `None` otherwise.
    #[inline]
    pub fn as_ip_addr(&self) -> Option<Ipv6Addr> {
        match self {
            Self::IpAddr(addr) => Some(*addr),
            _ => None,
        }
    }

    /// Returns the boolean if the leaf is a `Bool`, `None` otherwise.
    #[inline]
    pub fn as_bool(&self) -> Option<bool> {
        match self {
            Self::Bool(flag) => Some(*flag),
            _ => None,
        }
    }

    /// Consumes the leaf and returns the pre-tokenized string if it is a
    /// `PreTokStr`, `None` otherwise.
    #[inline]
    pub fn into_pre_tokenized_text(self) -> Option<Box<PreTokenizedString>> {
        match self {
            Self::PreTokStr(pre_tokenized) => Some(pre_tokenized),
            _ => None,
        }
    }

    /// Returns the bytes if the leaf is a `Bytes`, `None` otherwise.
    #[inline]
    pub fn as_bytes(&self) -> Option<&'a [u8]> {
        match self {
            Self::Bytes(bytes) => Some(*bytes),
            _ => None,
        }
    }

    /// Returns the facet string if the leaf is a `Facet`, `None` otherwise.
    #[inline]
    pub fn as_facet(&self) -> Option<&'a str> {
        match self {
            Self::Facet(facet) => Some(*facet),
            _ => None,
        }
    }
}

/// An enum representing a value for tantivy to index.
#[derive(Clone, Debug, PartialEq)]
pub enum ReferenceValue<'a, V>
where V: Value<'a> + ?Sized
{
    /// A leaf value, i.e. anything that is neither an array nor an object
    /// (this includes null).
    Leaf(ReferenceValueLeaf<'a>),
    /// An array containing multiple values.
    Array(V::ArrayIter),
    /// A nested / dynamic object.
    Object(V::ObjectIter),
}

impl<'a, V> ReferenceValue<'a, V>
where V: Value<'a>
{
    /// Returns `true` if the value is the null leaf.
    #[inline]
    pub fn is_null(&self) -> bool {
        matches!(self, Self::Leaf(ReferenceValueLeaf::Null))
    }

    /// Returns a reference to the leaf if the value is a leaf, `None` otherwise.
    #[inline]
    pub fn as_leaf(&self) -> Option<&ReferenceValueLeaf<'a>> {
        match self {
            Self::Leaf(leaf) => Some(leaf),
            _ => None,
        }
    }

    /// Consumes the value and returns the leaf if it is a leaf, `None` otherwise.
    #[inline]
    pub fn into_leaf(self) -> Option<ReferenceValueLeaf<'a>> {
        match self {
            Self::Leaf(leaf) => Some(leaf),
            _ => None,
        }
    }

    /// Returns the str if the value is a string leaf, `None` otherwise.
    #[inline]
    pub fn as_str(&self) -> Option<&'a str> {
        self.as_leaf()?.as_str()
    }

    /// Returns the integer if the value is a u64 leaf, `None` otherwise.
    #[inline]
    pub fn as_u64(&self) -> Option<u64> {
        self.as_leaf()?.as_u64()
    }

    /// Returns the integer if the value is an i64 leaf, `None` otherwise.
    #[inline]
    pub fn as_i64(&self) -> Option<i64> {
        self.as_leaf()?.as_i64()
    }

    /// Returns the float if the value is an f64 leaf, `None` otherwise.
    #[inline]
    pub fn as_f64(&self) -> Option<f64> {
        self.as_leaf()?.as_f64()
    }

    /// Returns the datetime if the value is a datetime leaf, `None` otherwise.
    #[inline]
    pub fn as_datetime(&self) -> Option<DateTime> {
        self.as_leaf()?.as_datetime()
    }

    /// Returns the address if the value is an IP address leaf, `None` otherwise.
    #[inline]
    pub fn as_ip_addr(&self) -> Option<Ipv6Addr> {
        self.as_leaf()?.as_ip_addr()
    }

    /// Returns the boolean if the value is a bool leaf, `None` otherwise.
    #[inline]
    pub fn as_bool(&self) -> Option<bool> {
        self.as_leaf()?.as_bool()
    }

    /// Consumes the value and returns the pre-tokenized string if it is a
    /// pre-tokenized string leaf, `None` otherwise.
    #[inline]
    pub fn into_pre_tokenized_text(self) -> Option<Box<PreTokenizedString>> {
        self.into_leaf()?.into_pre_tokenized_text()
    }

    /// Returns the bytes if the value is a bytes leaf, `None` otherwise.
    #[inline]
    pub fn as_bytes(&self) -> Option<&'a [u8]> {
        self.as_leaf()?.as_bytes()
    }

    /// Returns the facet string if the value is a facet leaf, `None` otherwise.
    #[inline]
    pub fn as_facet(&self) -> Option<&'a str> {
        self.as_leaf()?.as_facet()
    }

    /// Returns `true` if the value is an array.
    #[inline]
    pub fn is_array(&self) -> bool {
        match self {
            Self::Array(_) => true,
            Self::Leaf(_) | Self::Object(_) => false,
        }
    }

    /// Returns `true` if the value is an object.
    #[inline]
    pub fn is_object(&self) -> bool {
        match self {
            Self::Object(_) => true,
            Self::Leaf(_) | Self::Array(_) => false,
        }
    }
}


================================================
FILE: src/schema/facet.rs
================================================
use std::borrow::{Borrow, Cow};
use std::fmt::{self, Debug, Display, Formatter};
use std::io::{self, Read, Write};
use std::str;
use std::string::FromUtf8Error;

use common::*;
use once_cell::sync::Lazy;
use regex::Regex;
use serde::de::Error as _;
use serde::{Deserialize, Deserializer, Serialize, Serializer};

/// Byte separating two levels in the *text* representation of a facet.
const SLASH_BYTE: u8 = b'/';
/// Byte escaping the following character in the *text* representation of a facet.
const ESCAPE_BYTE: u8 = b'\\';

/// BYTE used as a level separation in the binary
/// representation of facets.
pub const FACET_SEP_BYTE: u8 = 0u8;

/// `char` used as a level separation in the binary
/// representation of facets. (It is the null codepoint.)
pub const FACET_SEP_CHAR: char = '\u{0}';

/// An error enum for the facet parser.
#[derive(Debug, PartialEq, Eq, Error)]
pub enum FacetParseError {
    /// The facet text representation is unparsable.
    ///
    /// The payload is the offending input string.
    #[error("Failed to parse the facet string: '{0}'")]
    FacetParseError(String),
}

/// A Facet represents a point in a given hierarchy.
///
/// They are typically represented similarly to a filepath.
/// For instance, an e-commerce website could
/// have a `Facet` for `/electronics/tv_and_video/led_tv`.
///
/// A document can be associated with any number of facets.
/// The hierarchy implies that a document
/// belonging to a facet also belongs to the ancestors of
/// its facet. In the example above, `/electronics/tv_and_video/`
/// and `/electronics`.
///
/// The wrapped `String` holds the encoded form described in
/// `Facet::encoded_str`.
#[derive(Clone, Default, Eq, Hash, PartialEq, Ord, PartialOrd)]
pub struct Facet(pub(crate) String);

impl Facet {
    /// Returns a new instance of the "root facet"
    /// Equivalent to `/`.
    pub fn root() -> Facet {
        Facet("".to_string())
    }

    /// Returns true if the facet is the root facet `/`.
    pub fn is_root(&self) -> bool {
        self.encoded_str().is_empty()
    }

    /// Returns a binary representation of the facet.
    ///
    /// In this representation, `0u8` is used as a separator
    /// and the string parts of the facet are unescaped.
    /// (The first `/` is not encoded at all).
    ///
    /// This representation has the benefit of making it possible to
    /// express "being a child of a given facet" as a range over
    /// the term ordinals.
    pub fn encoded_str(&self) -> &str {
        &self.0
    }

    pub(crate) fn from_encoded_string(facet_string: String) -> Facet {
        Facet(facet_string)
    }

    /// Creates a `Facet` from its binary representation.
    pub fn from_encoded(encoded_bytes: Vec<u8>) -> Result<Facet, FromUtf8Error> {
        // facet bytes validation. `0u8` is used a separator but that is still legal utf-8
        String::from_utf8(encoded_bytes).map(Facet)
    }

    /// Parse a text representation of a facet.
    ///
    /// If one of the segments of this path
    /// contains a `/`, it should be escaped
    /// using an anti-slash `\`.
    pub fn from_text<T>(path: &T) -> Result<Facet, FacetParseError>
    where T: ?Sized + AsRef<str> {
        #[derive(Copy, Clone)]
        enum State {
            Escaped,
            Idle,
        }
        let path_ref = path.as_ref();
        if path_ref.is_empty() {
            return Err(FacetParseError::FacetParseError(path_ref.to_string()));
        }
        if !path_ref.starts_with('/') {
            return Err(FacetParseError::FacetParseError(path_ref.to_string()));
        }
        let mut facet_encoded = String::new();
        let mut state = State::Idle;
        let path_bytes = path_ref.as_bytes();
        let mut last_offset = 1;
        for i in 1..path_bytes.len() {
            let c = path_bytes[i];
            match (state, c) {
                (State::Idle, ESCAPE_BYTE) => {
                    facet_encoded.push_str(&path_ref[last_offset..i]);
                    last_offset = i + 1;
                    state = State::Escaped
                }
                (State::Idle, SLASH_BYTE) => {
                    facet_encoded.push_str(&path_ref[last_offset..i]);
                    facet_encoded.push(FACET_SEP_CHAR);
                    last_offset = i + 1;
                }
                (State::Escaped, _escaped_char) => {
                    state = State::Idle;
                }
                (State::Idle, _any_char) => {}
            }
        }
        facet_encoded.push_str(&path_ref[last_offset..]);
        Ok(Facet(facet_encoded))
    }

    /// Returns a `Facet` from an iterator over the different
    /// steps of the facet path.
    ///
    /// The steps are expected to be unescaped.
    pub fn from_path<Path>(path: Path) -> Facet
    where
        Path: IntoIterator,
        Path::Item: AsRef<str>,
    {
        let mut facet_string: String = String::with_capacity(100);
        let mut step_it = path.into_iter();
        if let Some(step) = step_it.next() {
            facet_string.push_str(step.as_ref());
        }
        for step in step_it {
            facet_string.push(FACET_SEP_CHAR);
            facet_string.push_str(step.as_ref());
        }
        Facet(facet_string)
    }

    /// Returns `true` if other is a `strict` subfacet of `self`.
    ///
    /// Disclaimer: By strict we mean that the relation is not reflexive.
    /// `/happy` is not a prefix of `/happy`.
    pub fn is_prefix_of(&self, other: &Facet) -> bool {
        let self_str = self.encoded_str();
        let other_str = other.encoded_str();

        // Fast path, but also required to ensure that / is not a prefix of /.
        if other_str.len() <= self_str.len() {
            return false;
        }

        // Root is a prefix of every other path.
        // This is not just an optimisation. It is necessary for correctness.
        if self.is_root() {
            return true;
        }

        other_str.starts_with(self_str) && other_str.as_bytes()[self_str.len()] == FACET_SEP_BYTE
    }

    /// Extract path from the `Facet`.
    pub fn to_path(&self) -> Vec<&str> {
        self.encoded_str().split(FACET_SEP_CHAR).collect()
    }

    /// This function is the inverse of Facet::from(&str).
    pub fn to_path_string(&self) -> String {
        format!("{self}")
    }
}

/// Borrows the facet as its encoded string (see `Facet::encoded_str`).
impl Borrow<str> for Facet {
    fn borrow(&self) -> &str {
        self.0.as_str()
    }
}

impl<'a, T: ?Sized + AsRef<str>> From<&'a T> for Facet {
    fn from(path_asref: &'a T) -> Facet {
        Facet::from_text(path_asref).unwrap()
    }
}

/// A facet is (de)serialized exactly like its encoded `String`.
impl BinarySerializable for Facet {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        let encoded: &String = &self.0;
        <String as BinarySerializable>::serialize(encoded, writer)
    }

    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        let encoded = <String as BinarySerializable>::deserialize(reader)?;
        Ok(Facet(encoded))
    }
}

/// Formats the facet as a `/`-separated path, every step being preceded
/// by a `/` and escaped with `escape_slashes`.
impl Display for Facet {
    fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
        self.0
            .split(FACET_SEP_CHAR)
            .try_for_each(|step| write!(f, "/{}", escape_slashes(step)))
    }
}

/// Escapes a single facet step for the text representation.
///
/// Every `/` and every `\` is prefixed with a `\`, so that parsing the
/// result with `Facet::from_text` yields the original step back.
///
/// Returns a borrowed `Cow` when the step contains nothing to escape.
fn escape_slashes(s: &str) -> Cow<'_, str> {
    static SLASH_PTN: Lazy<Regex> = Lazy::new(|| Regex::new(r"[\\/]").unwrap());
    // `${0}` is the matched character. Always emitting `\/` (as was done
    // before) turned a literal backslash into an escaped slash, which does
    // not round-trip through `from_text`.
    SLASH_PTN.replace_all(s, "\\${0}")
}

/// Serializes the facet as its text representation (the `Display` output).
impl Serialize for Facet {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: Serializer {
        let text = self.to_string();
        serializer.serialize_str(&text)
    }
}

impl<'de> Deserialize<'de> for Facet {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: Deserializer<'de> {
        <Cow<'de, str> as Deserialize<'de>>::deserialize(deserializer).and_then(|path| {
            Facet::from_text(&*path).map_err(|err| D::Error::custom(err.to_string()))
        })
    }
}

/// Prints the facet as `Facet(<text representation>)`.
impl Debug for Facet {
    fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
        write!(f, "Facet({self})")
    }
}

#[cfg(test)]
mod tests {

    use super::{Facet, FacetParseError};

    // The root facet is `/` in text form and the empty string once encoded.
    #[test]
    fn test_root() {
        assert_eq!(Facet::root(), Facet::from("/"));
        assert_eq!(format!("{}", Facet::root()), "/");
        assert!(Facet::root().is_root());
        assert_eq!(Facet::root().encoded_str(), "");
    }

    // Building from steps and parsing the text form must agree.
    #[test]
    fn test_from_path() {
        assert_eq!(
            Facet::from_path(vec!["top", "a", "firstdoc"]),
            Facet::from("/top/a/firstdoc")
        );
    }

    // `Display` joins the steps with `/` and escapes slashes inside a step.
    #[test]
    fn test_facet_display() {
        {
            let v = ["first", "second", "third"];
            let facet = Facet::from_path(v.iter());
            assert_eq!(format!("{facet}"), "/first/second/third");
        }
        {
            let v = ["first", "sec/ond", "third"];
            let facet = Facet::from_path(v.iter());
            assert_eq!(format!("{facet}"), "/first/sec\\/ond/third");
        }
    }

    // `Debug` wraps the `Display` output in `Facet(..)`.
    #[test]
    fn test_facet_debug() {
        let v = ["first", "second", "third"];
        let facet = Facet::from_path(v.iter());
        assert_eq!(format!("{facet:?}"), "Facet(/first/second/third)");
    }

    // `to_path` returns the steps verbatim: `from_path` does not interpret
    // escape sequences.
    #[test]
    fn test_to_path() {
        let v = ["first", "second", "third\\/not_fourth"];
        let facet = Facet::from_path(v.iter());
        assert_eq!(facet.to_path(), v);
    }

    // `to_path_string` escapes a slash contained in a step.
    #[test]
    fn test_to_path_string() {
        let v = ["first", "second", "third/not_fourth"];
        let facet = Facet::from_path(v.iter());
        assert_eq!(
            facet.to_path_string(),
            String::from("/first/second/third\\/not_fourth")
        );
    }

    // An empty path is the root facet.
    #[test]
    fn test_to_path_string_empty() {
        let v: Vec<&str> = vec![];
        let facet = Facet::from_path(v.iter());
        assert_eq!(facet.to_path_string(), "/");
    }

    // A text representation not starting with `/` is rejected.
    #[test]
    fn test_from_text() {
        assert_eq!(
            Err(FacetParseError::FacetParseError("INVALID".to_string())),
            Facet::from_text("INVALID")
        );
    }

    // `is_prefix_of` is strict: a facet is not a prefix of itself.
    #[test]
    fn only_proper_prefixes() {
        assert!(Facet::from("/foo").is_prefix_of(&Facet::from("/foo/bar")));

        assert!(!Facet::from("/foo/bar").is_prefix_of(&Facet::from("/foo/bar")));
    }

    // The root is a prefix of every facet but itself.
    #[test]
    fn root_is_a_prefix() {
        assert!(Facet::from("/").is_prefix_of(&Facet::from("/foobar")));
        assert!(!Facet::from("/").is_prefix_of(&Facet::from("/")));
    }

    // No JSON escape in the input: the deserializer can hand out a borrowed str.
    #[test]
    fn deserialize_from_borrowed_string() {
        let facet = serde_json::from_str::<Facet>(r#""/foo/bar""#).unwrap();
        assert_eq!(facet, Facet::from_path(["foo", "bar"]));
    }

    // The JSON escape forces the deserializer to produce an owned string.
    #[test]
    fn deserialize_from_owned_string() {
        let facet = serde_json::from_str::<Facet>(r#""/foo/\u263A""#).unwrap();
        assert_eq!(facet, Facet::from_path(["foo", "☺"]));
    }

    // A parse failure surfaces as a deserialization error with the same message.
    #[test]
    fn deserialize_from_invalid_string() {
        let error = serde_json::from_str::<Facet>(r#""foo/bar""#).unwrap_err();
        assert_eq!(
            error.to_string(),
            "Failed to parse the facet string: 'foo/bar'"
        );
    }
}


================================================
FILE: src/schema/facet_options.rs
================================================
use std::ops::BitOr;

use serde::{Deserialize, Serialize};

use crate::schema::flags::{IndexedFlag, SchemaFlagList, StoredFlag};

/// Define how a facet field should be handled by tantivy.
///
/// Note that a Facet is always indexed and stored as a fastfield.
#[derive(Clone, Debug, PartialEq, Eq, Serialize, Deserialize, Default)]
pub struct FacetOptions {
    // Whether the value is persisted in the store; `false` by default.
    stored: bool,
}

impl FacetOptions {
    /// Returns true if the value is stored.
    #[inline]
    pub fn is_stored(&self) -> bool {
        self.stored
    }

    /// Set the field as stored.
    ///
    /// Only the fields that are set as *stored* are
    /// persisted into the Tantivy's store.
    #[must_use]
    pub fn set_stored(mut self) -> FacetOptions {
        self.stored = true;
        self
    }
}

impl From<()> for FacetOptions {
    fn from(_: ()) -> FacetOptions {
        FacetOptions::default()
    }
}

impl From<StoredFlag> for FacetOptions {
    fn from(_: StoredFlag) -> Self {
        FacetOptions { stored: true }
    }
}

/// Combines two sets of options: the result is stored if either side is.
impl<T: Into<FacetOptions>> BitOr<T> for FacetOptions {
    type Output = FacetOptions;

    fn bitor(self, other: T) -> FacetOptions {
        let rhs: FacetOptions = other.into();
        let stored = self.stored || rhs.stored;
        FacetOptions { stored }
    }
}

/// Converts a flag list by converting its head and its tail separately and
/// combining both results with `|`.
impl<Head, Tail> From<SchemaFlagList<Head, Tail>> for FacetOptions
where
    Head: Clone,
    Tail: Clone,
    Self: BitOr<Output = Self> + From<Head> + From<Tail>,
{
    fn from(head_tail: SchemaFlagList<Head, Tail>) -> Self {
        let head_options = Self::from(head_tail.head);
        let tail_options = Self::from(head_tail.tail);
        head_options | tail_options
    }
}

impl From<IndexedFlag> for FacetOptions {
    fn from(_: IndexedFlag) -> Self {
        FacetOptions { stored: false }
    }
}

#[cfg(test)]
mod tests {
    use crate::schema::{FacetOptions, INDEXED};

    // Converting the `INDEXED` flag must give the default options.
    #[test]
    fn test_from_index_flag() {
        let facet_option = FacetOptions::from(INDEXED);
        assert_eq!(facet_option, FacetOptions::default());
    }
}


================================================
FILE: src/schema/field.rs
================================================
use std::io;
use std::io::{Read, Write};

use common::BinarySerializable;

/// `Field` is represented by an unsigned 32-bit integer type.
/// The schema holds the mapping between field names and `Field` objects.
///
/// The wrapped integer is the field id returned by `Field::field_id`.
#[derive(
    Copy, Clone, Debug, PartialEq, PartialOrd, Eq, Ord, Hash, serde::Serialize, serde::Deserialize,
)]
pub struct Field(u32);

impl Field {
    /// Create a new field object for the given FieldId.
    pub const fn from_field_id(field_id: u32) -> Field {
        Field(field_id)
    }

    /// Returns a u32 identifying uniquely a field within a schema.
    pub const fn field_id(self) -> u32 {
        self.0
    }
}

impl BinarySerializable for Field {
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        self.0.serialize(writer)
    }

    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Field> {
        u32::deserialize(reader).map(Field)
    }
}


================================================
FILE: src/schema/field_entry.rs
================================================
use serde::{Deserialize, Serialize};

use super::ip_options::IpAddrOptions;
use crate::schema::bytes_options::BytesOptions;
use crate::schema::{
    is_valid_field_name, DateOptions, FacetOptions, FieldType, JsonObjectOptions, NumericOptions,
    TextOptions,
};

/// A `FieldEntry` represents a field and its configuration.
/// A `Schema` is a collection of `FieldEntry`.
///
/// It consists of
/// - a field name
/// - a field type, itself wrapping up options describing how the field should be indexed.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
pub struct FieldEntry {
    name: String,
    // Flattened: the field type's own keys are serialized next to `name`
    // instead of being nested under a `field_type` key.
    #[serde(flatten)]
    field_type: FieldType,
}

impl FieldEntry {
    /// Creates a new field entry given a name and a field type
    pub fn new(field_name: String, field_type: FieldType) -> FieldEntry {
        assert!(is_valid_field_name(&field_name));
        FieldEntry {
            name: field_name,
            field_type,
        }
    }

    /// Creates a new text field entry.
    pub fn new_text(field_name: String, text_options: TextOptions) -> FieldEntry {
        Self::new(field_name, FieldType::Str(text_options))
    }

    /// Creates a new u64 field entry.
    pub fn new_u64(field_name: String, int_options: NumericOptions) -> FieldEntry {
        Self::new(field_name, FieldType::U64(int_options))
    }

    /// Creates a new i64 field entry.
    pub fn new_i64(field_name: String, int_options: NumericOptions) -> FieldEntry {
        Self::new(field_name, FieldType::I64(int_options))
    }

    /// Creates a new f64 field entry.
    pub fn new_f64(field_name: String, f64_options: NumericOptions) -> FieldEntry {
        Self::new(field_name, FieldType::F64(f64_options))
    }

    /// Creates a new bool field entry.
    pub fn new_bool(field_name: String, bool_options: NumericOptions) -> FieldEntry {
        Self::new(field_name, FieldType::Bool(bool_options))
    }

    /// Creates a new date field entry.
    pub fn new_date(field_name: String, date_options: DateOptions) -> FieldEntry {
        Self::new(field_name, FieldType::Date(date_options))
    }

    /// Creates a new ip address field entry.
    pub fn new_ip_addr(field_name: String, ip_options: IpAddrOptions) -> FieldEntry {
        Self::new(field_name, FieldType::IpAddr(ip_options))
    }

    /// Creates a field entry for a facet.
    pub fn new_facet(field_name: String, facet_options: FacetOptions) -> FieldEntry {
        Self::new(field_name, FieldType::Facet(facet_options))
    }

    /// Creates a field entry for a bytes field
    pub fn new_bytes(field_name: String, bytes_options: BytesOptions) -> FieldEntry {
        Self::new(field_name, FieldType::Bytes(bytes_options))
    }

    /// Creates a field entry for a json field
    pub fn new_json(field_name: String, json_object_options: JsonObjectOptions) -> FieldEntry {
        Self::new(field_name, FieldType::JsonObject(json_object_options))
    }

    /// Returns the name of the field
    pub fn name(&self) -> &str {
        &self.name
    }

    /// Returns the field type
    pub fn field_type(&self) -> &FieldType {
        &self.field_type
    }

    /// Returns true if the field is indexed.
    ///
    /// An indexed field is searchable.
    pub fn is_indexed(&self) -> bool {
        self.field_type.is_indexed()
    }

    /// Returns true if the field is normed
    pub fn has_fieldnorms(&self) -> bool {
        self.field_type.has_fieldnorms()
    }

    /// Returns true if the field is a fast field
    pub fn is_fast(&self) -> bool {
        self.field_type.is_fast()
    }

    /// Returns true if the field has the expand dots option set (for json fields)
    pub fn is_expand_dots_enabled(&self) -> bool {
        match self.field_type {
            FieldType::JsonObject(ref options) => options.is_expand_dots_enabled(),
            _ => false,
        }
    }

    /// Returns true if the field is stored
    #[inline]
    pub fn is_stored(&self) -> bool {
        match self.field_type {
            FieldType::U64(ref options)
            | FieldType::I64(ref options)
            | FieldType::F64(ref options)
            | FieldType::Bool(ref options) => options.is_stored(),
            FieldType::Date(ref options) => options.is_stored(),
            FieldType::Str(ref options) => options.is_stored(),
            FieldType::Facet(ref options) => options.is_stored(),
            FieldType::Bytes(ref options) => options.is_stored(),
            FieldType::JsonObject(ref options) => options.is_stored(),
            FieldType::IpAddr(ref options) => options.is_stored(),
        }
    }
}

#[cfg(test)]
mod tests {

    use super::*;
    use crate::schema::{Schema, TextFieldIndexing, TEXT};
    use crate::Index;

    // `FieldEntry::new` asserts on the field name; "-hello" is expected to
    // be rejected.
    #[test]
    #[should_panic]
    fn test_invalid_field_name_should_panic() {
        FieldEntry::new_text("-hello".to_string(), TEXT);
    }

    // Pins the exact JSON layout of a text field entry and checks that it
    // deserializes back to a `FieldType::Str`.
    #[test]
    fn test_json_serialization() {
        let field_value = FieldEntry::new_text(String::from("title"), TEXT);

        let expected = r#"{
  "name": "title",
  "type": "text",
  "options": {
    "indexing": {
      "record": "position",
      "fieldnorms": true,
      "tokenizer": "default"
    },
    "stored": false,
    "fast": false
  }
}"#;
        let field_value_json = serde_json::to_string_pretty(&field_value).unwrap();

        assert_eq!(expected, &field_value_json);

        let field_value: FieldEntry = serde_json::from_str(expected).unwrap();

        assert_eq!("title", field_value.name);

        match field_value.field_type {
            FieldType::Str(_) => {}
            _ => panic!("expected FieldType::Str"),
        }
    }

    // Deserialization must accept the keys in a different order (`type`
    // last) and without the `fast` option.
    #[test]
    fn test_json_deserialization() {
        let json_str = r#"{
  "name": "title",
  "options": {
    "indexing": {
      "record": "position",
      "fieldnorms": true,
      "tokenizer": "default"
    },
    "stored": false
  },
  "type": "text"
}"#;
        let field_entry: FieldEntry = serde_json::from_str(json_str).unwrap();
        match field_entry.field_type {
            FieldType::Str(_) => {}
            _ => panic!("expected FieldType::Str"),
        }
    }

    // Requesting the fieldnorms reader of a field indexed without
    // fieldnorms must yield a schema error.
    #[test]
    fn test_missing_fieldnorms() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let no_field_norm = TextOptions::default()
            .set_indexing_options(TextFieldIndexing::default().set_fieldnorms(false));
        let text = schema_builder.add_text_field("text", no_field_norm);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut index_writer = index.writer_for_tests()?;
        index_writer.add_document(doc!(text=>"abc"))?;
        index_writer.commit()?;
        let searcher = index.reader()?.searcher();
        let err = searcher.segment_reader(0u32).get_fieldnorms_reader(text);
        assert!(matches!(err, Err(crate::TantivyError::SchemaError(_))));
        Ok(())
    }
}


================================================
FILE: src/schema/field_type.rs
================================================
use std::net::IpAddr;
use std::str::FromStr;

use base64::engine::general_purpose::STANDARD as BASE64;
use base64::Engine;
use columnar::{ColumnType, NumericalType};
use serde::{Deserialize, Serialize};
use serde_json::Value as JsonValue;
use thiserror::Error;

use super::ip_options::IpAddrOptions;
use super::IntoIpv6Addr;
use crate::schema::bytes_options::BytesOptions;
use crate::schema::facet_options::FacetOptions;
use crate::schema::{
    DateOptions, Facet, IndexRecordOption, JsonObjectOptions, NumericOptions, OwnedValue,
    TextFieldIndexing, TextOptions,
};
use crate::time::format_description::well_known::Rfc3339;
use crate::time::OffsetDateTime;
use crate::tokenizer::PreTokenizedString;
use crate::DateTime;

/// Error that may occur while converting a JSON value into a field value.
///
/// At this point the JSON is known to be valid.
#[derive(Debug, PartialEq, Error)]
pub enum ValueParsingError {
    /// The JSON number cannot be represented in the numeric type of the field.
    #[error("Overflow error. Expected {expected}, got {json}")]
    OverflowError {
        /// Description of the value that was expected.
        expected: &'static str,
        /// The offending JSON value.
        json: serde_json::Value,
    },
    /// The JSON value does not have the type expected by the field.
    ///
    /// Also returned when a string cannot be parsed into the field's type
    /// (coerced numbers and booleans, RFC 3339 dates).
    #[error("Type error. Expected {expected}, got {json}")]
    TypeError {
        /// Description of the value that was expected.
        expected: &'static str,
        /// The offending JSON value.
        json: serde_json::Value,
    },
    /// A JSON string could not be parsed (e.g. an invalid IP address).
    #[error("Parse  error on {json}: {error}")]
    ParseError {
        /// Message of the underlying parse error.
        error: String,
        /// The offending JSON value.
        json: serde_json::Value,
    },
    /// The string given for a bytes field is not valid base64.
    #[error("Invalid base64: {base64}")]
    InvalidBase64 {
        /// The string that failed to decode.
        base64: String,
    },
}

/// Type of the value that a field can take.
///
/// Contrary to FieldType, this does
/// not include the way the field must be indexed.
///
/// The discriminant of each variant is the one-byte code returned by
/// `Type::to_code` and accepted by `Type::from_code`.
#[derive(Copy, Clone, Debug, Eq, PartialEq, Ord, PartialOrd, Hash)]
#[repr(u8)]
pub enum Type {
    /// `&str`
    Str = b's',
    /// `u64`
    U64 = b'u',
    /// `i64`
    I64 = b'i',
    /// `f64`
    F64 = b'f',
    /// `bool`
    Bool = b'o',
    /// `date(i64) timestamp`
    Date = b'd',
    /// `tantivy::schema::Facet`. Passed as a string in JSON.
    Facet = b'h',
    /// `Vec<u8>`
    Bytes = b'b',
    /// Leaf in a Json object.
    Json = b'j',
    /// IpAddr
    IpAddr = b'p',
}

impl From<ColumnType> for Type {
    /// Maps a columnar `ColumnType` to the schema `Type` of the same kind.
    fn from(column_type: ColumnType) -> Self {
        match column_type {
            ColumnType::I64 => Self::I64,
            ColumnType::U64 => Self::U64,
            ColumnType::F64 => Self::F64,
            ColumnType::Bool => Self::Bool,
            ColumnType::DateTime => Self::Date,
            ColumnType::Str => Self::Str,
            ColumnType::Bytes => Self::Bytes,
            ColumnType::IpAddr => Self::IpAddr,
        }
    }
}

/// Every variant of `Type`, in declaration order.
///
/// This list backs `Type::iter_values`: a variant missing from it is not
/// yielded by that iterator.
const ALL_TYPES: [Type; 10] = [
    Type::Str,
    Type::U64,
    Type::I64,
    Type::F64,
    Type::Bool,
    Type::Date,
    Type::Facet,
    Type::Bytes,
    Type::Json,
    Type::IpAddr,
];

impl Type {
    /// Returns the numerical type if applicable.
    ///
    /// No mapping is applied: e.g. `Date` yields `None` although it is also stored as I64 in
    /// the column store.
    pub fn numerical_type(&self) -> Option<NumericalType> {
        match self {
            Self::U64 => Some(NumericalType::U64),
            Self::I64 => Some(NumericalType::I64),
            Self::F64 => Some(NumericalType::F64),
            _ => None,
        }
    }

    /// Returns an iterator over the different values
    /// the Type enum can take.
    pub fn iter_values() -> impl Iterator<Item = Type> {
        ALL_TYPES.iter().copied()
    }

    /// Returns the 1 byte code identifying the type.
    #[inline]
    pub fn to_code(&self) -> u8 {
        // `Type` is `repr(u8)`: the discriminant is the code itself.
        *self as u8
    }

    /// Returns a human readable name for the Type.
    pub fn name(&self) -> &'static str {
        match self {
            Self::Str => "Str",
            Self::U64 => "U64",
            Self::I64 => "I64",
            Self::F64 => "F64",
            Self::Bool => "Bool",
            Self::Date => "Date",
            Self::Facet => "Facet",
            Self::Bytes => "Bytes",
            Self::Json => "Json",
            Self::IpAddr => "IpAddr",
        }
    }

    /// Interprets a 1 byte code as a type.
    /// Returns `None` if the code is invalid.
    #[inline]
    pub fn from_code(code: u8) -> Option<Self> {
        let decoded = match code {
            b's' => Self::Str,
            b'u' => Self::U64,
            b'i' => Self::I64,
            b'f' => Self::F64,
            b'o' => Self::Bool,
            b'd' => Self::Date,
            b'h' => Self::Facet,
            b'b' => Self::Bytes,
            b'j' => Self::Json,
            b'p' => Self::IpAddr,
            _ => return None,
        };
        Some(decoded)
    }
}

/// A `FieldType` describes the type (text, u64) of a field as well as
/// how it should be handled by tantivy.
///
/// It is (de)serialized with the variant name under the `type` key and the
/// options of the variant under the `options` key.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(tag = "type", content = "options")]
#[serde(rename_all = "snake_case")]
pub enum FieldType {
    /// String field type configuration (serialized as `text`)
    #[serde(rename = "text")]
    Str(TextOptions),
    /// Unsigned 64-bit integer field type configuration
    U64(NumericOptions),
    /// Signed 64-bit integer field type configuration
    I64(NumericOptions),
    /// 64-bit float field type configuration
    F64(NumericOptions),
    /// Bool field type configuration
    Bool(NumericOptions),
    /// Date field type configuration
    Date(DateOptions),
    /// Hierarchical Facet
    Facet(FacetOptions),
    /// Bytes (one per document)
    Bytes(BytesOptions),
    /// Json object
    JsonObject(JsonObjectOptions),
    /// IpAddr field
    IpAddr(IpAddrOptions),
}

impl FieldType {
    /// Returns the value type associated for this field.
    pub fn value_type(&self) -> Type {
        match *self {
            FieldType::Str(_) => Type::Str,
            FieldType::U64(_) => Type::U64,
            FieldType::I64(_) => Type::I64,
            FieldType::F64(_) => Type::F64,
            FieldType::Bool(_) => Type::Bool,
            FieldType::Date(_) => Type::Date,
            FieldType::Facet(_) => Type::Facet,
            FieldType::Bytes(_) => Type::Bytes,
            FieldType::JsonObject(_) => Type::Json,
            FieldType::IpAddr(_) => Type::IpAddr,
        }
    }

    /// returns true if this is an json field
    pub fn is_json(&self) -> bool {
        matches!(self, FieldType::JsonObject(_))
    }

    /// returns true if this is an ip address field
    pub fn is_ip_addr(&self) -> bool {
        matches!(self, FieldType::IpAddr(_))
    }

    /// returns true if this is an str field
    pub fn is_str(&self) -> bool {
        matches!(self, FieldType::Str(_))
    }

    /// returns true if this is a bytes field
    pub fn is_bytes(&self) -> bool {
        matches!(self, FieldType::Bytes(_))
    }

    /// returns true if this is an date field
    pub fn is_date(&self) -> bool {
        matches!(self, FieldType::Date(_))
    }

    /// returns true if the field is indexed.
    pub fn is_indexed(&self) -> bool {
        match *self {
            FieldType::Str(ref text_options) => text_options.get_indexing_options().is_some(),
            FieldType::U64(ref int_options)
            | FieldType::I64(ref int_options)
            | FieldType::F64(ref int_options)
            | FieldType::Bool(ref int_options) => int_options.is_indexed(),
            FieldType::Date(ref date_options) => date_options.is_indexed(),
            FieldType::Facet(ref _facet_options) => true,
            FieldType::Bytes(ref bytes_options) => bytes_options.is_indexed(),
            FieldType::JsonObject(ref json_object_options) => json_object_options.is_indexed(),
            FieldType::IpAddr(ref ip_addr_options) => ip_addr_options.is_indexed(),
        }
    }

    /// Returns the index record option for the field.
    ///
    /// If the field is not indexed, returns `None`.
    pub fn index_record_option(&self) -> Option<IndexRecordOption> {
        match self {
            FieldType::Str(text_options) => text_options
                .get_indexing_options()
                .map(|text_indexing| text_indexing.index_option()),
            FieldType::JsonObject(json_object_options) => json_object_options
                .get_text_indexing_options()
                .map(|text_indexing| text_indexing.index_option()),
            field_type => {
                if field_type.is_indexed() {
                    Some(IndexRecordOption::Basic)
                } else {
                    None
                }
            }
        }
    }

    /// returns true if the field is fast.
    pub fn is_fast(&self) -> bool {
        match *self {
            FieldType::Bytes(ref bytes_options) => bytes_options.is_fast(),
            FieldType::Str(ref text_options) => text_options.is_fast(),
            FieldType::U64(ref int_options)
            | FieldType::I64(ref int_options)
            | FieldType::F64(ref int_options)
            | FieldType::Bool(ref int_options) => int_options.is_fast(),
            FieldType::Date(ref date_options) => date_options.is_fast(),
            FieldType::IpAddr(ref ip_addr_options) => ip_addr_options.is_fast(),
            FieldType::Facet(_) => true,
            FieldType::JsonObject(ref json_object_options) => json_object_options.is_fast(),
        }
    }

    /// returns true if the field is normed (see [fieldnorms](crate::fieldnorm)).
    pub fn has_fieldnorms(&self) -> bool {
        match *self {
            FieldType::Str(ref text_options) => text_options
                .get_indexing_options()
                .map(|options| options.fieldnorms())
                .unwrap_or(false),
            FieldType::U64(ref int_options)
            | FieldType::I64(ref int_options)
            | FieldType::F64(ref int_options)
            | FieldType::Bool(ref int_options) => int_options.fieldnorms(),
            FieldType::Date(ref date_options) => date_options.fieldnorms(),
            FieldType::Facet(_) => false,
            FieldType::Bytes(ref bytes_options) => bytes_options.fieldnorms(),
            FieldType::JsonObject(ref _json_object_options) => false,
            FieldType::IpAddr(ref ip_addr_options) => ip_addr_options.fieldnorms(),
        }
    }

    /// Given a field configuration, return the maximal possible
    /// `IndexRecordOption` available.
    ///
    /// For the Json object, this does not necessarily mean it is the index record
    /// option level is available for all terms.
    /// (Non string terms have the Basic indexing option at most.)
    ///
    /// If the field is not indexed, then returns `None`.
    pub fn get_index_record_option(&self) -> Option<IndexRecordOption> {
        match *self {
            FieldType::Str(ref text_options) => text_options
                .get_indexing_options()
                .map(TextFieldIndexing::index_option),
            FieldType::U64(ref int_options)
            | FieldType::I64(ref int_options)
            | FieldType::F64(ref int_options)
            | FieldType::Bool(ref int_options) => {
                if int_options.is_indexed() {
                    Some(IndexRecordOption::Basic)
                } else {
                    None
                }
            }
            FieldType::Date(ref date_options) => {
                if date_options.is_indexed() {
                    Some(IndexRecordOption::Basic)
                } else {
                    None
                }
            }
            FieldType::Facet(ref _facet_options) => Some(IndexRecordOption::Basic),
            FieldType::Bytes(ref bytes_options) => {
                if bytes_options.is_indexed() {
                    Some(IndexRecordOption::Basic)
                } else {
                    None
                }
            }
            FieldType::JsonObject(ref json_obj_options) => json_obj_options
                .get_text_indexing_options()
                .map(TextFieldIndexing::index_option),
            FieldType::IpAddr(ref ip_addr_options) => {
                if ip_addr_options.is_indexed() {
                    Some(IndexRecordOption::Basic)
                } else {
                    None
                }
            }
        }
    }

    /// Parses a field value from json, given the target FieldType.
    ///
    /// Tantivy will try to cast values only with the coerce option.
    /// For instance, If the json value is the integer `3` and the
    /// target field is a `Str`, this method will return an Error if `coerce`
    /// is not enabled.
    pub fn value_from_json(&self, json: JsonValue) -> Result<OwnedValue, ValueParsingError> {
        match json {
            JsonValue::String(field_text) => {
                match self {
                    FieldType::Date(_) => {
                        let dt_with_fixed_tz = OffsetDateTime::parse(&field_text, &Rfc3339)
                            .map_err(|_err| ValueParsingError::TypeError {
                                expected: "rfc3339 format",
                                json: JsonValue::String(field_text),
                            })?;
                        Ok(DateTime::from_utc(dt_with_fixed_tz).into())
                    }
                    FieldType::Str(_) => Ok(OwnedValue::Str(field_text)),
                    FieldType::U64(opt) => {
                        if opt.should_coerce() {
                            Ok(OwnedValue::U64(field_text.parse().map_err(|_| {
                                ValueParsingError::TypeError {
                                    expected: "a u64 or a u64 as string",
                                    json: JsonValue::String(field_text),
                                }
                            })?))
                        } else {
                            Err(ValueParsingError::TypeError {
                                expected: "a u64",
                                json: JsonValue::String(field_text),
                            })
                        }
                    }
                    FieldType::I64(opt) => {
                        if opt.should_coerce() {
                            Ok(OwnedValue::I64(field_text.parse().map_err(|_| {
                                ValueParsingError::TypeError {
                                    expected: "a i64 or a i64 as string",
                                    json: JsonValue::String(field_text),
                                }
                            })?))
                        } else {
                            Err(ValueParsingError::TypeError {
                                expected: "a i64",
                                json: JsonValue::String(field_text),
                            })
                        }
                    }
                    FieldType::F64(opt) => {
                        if opt.should_coerce() {
                            Ok(OwnedValue::F64(field_text.parse().map_err(|_| {
                                ValueParsingError::TypeError {
                                    expected: "a f64 or a f64 as string",
                                    json: JsonValue::String(field_text),
                                }
                            })?))
                        } else {
                            Err(ValueParsingError::TypeError {
                                expected: "a f64",
                                json: JsonValue::String(field_text),
                            })
                        }
                    }
                    FieldType::Bool(opt) => {
                        if opt.should_coerce() {
                            Ok(OwnedValue::Bool(field_text.parse().map_err(|_| {
                                ValueParsingError::TypeError {
                                    expected: "a i64 or a bool as string",
                                    json: JsonValue::String(field_text),
                                }
                            })?))
                        } else {
                            Err(ValueParsingError::TypeError {
                                expected: "a boolean",
                                json: JsonValue::String(field_text),
                            })
                        }
                    }
                    FieldType::Facet(_) => Ok(OwnedValue::Facet(Facet::from(&field_text))),
                    FieldType::Bytes(_) => BASE64
                        .decode(&field_text)
                        .map(OwnedValue::Bytes)
                        .map_err(|_| ValueParsingError::InvalidBase64 { base64: field_text }),
                    FieldType::JsonObject(_) => Err(ValueParsingError::TypeError {
                        expected: "a json object",
                        json: JsonValue::String(field_text),
                    }),
                    FieldType::IpAddr(_) => {
                        let ip_addr: IpAddr = IpAddr::from_str(&field_text).map_err(|err| {
                            ValueParsingError::ParseError {
                                error: err.to_string(),
                                json: JsonValue::String(field_text),
                            }
                        })?;

                        Ok(OwnedValue::IpAddr(ip_addr.into_ipv6_addr()))
                    }
                }
            }
            JsonValue::Number(field_val_num) => match self {
                FieldType::I64(_) | FieldType::Date(_) => {
                    if let Some(field_val_i64) = field_val_num.as_i64() {
                        Ok(OwnedValue::I64(field_val_i64))
                    } else {
                        Err(ValueParsingError::OverflowError {
                            expected: "an i64 int",
                            json: JsonValue::Number(field_val_num),
                        })
                    }
                }
                FieldType::U64(_) => {
                    if let Some(field_val_u64) = field_val_num.as_u64() {
                        Ok(OwnedValue::U64(field_val_u64))
                    } else {
                        Err(ValueParsingError::OverflowError {
                            expected: "u64",
                            json: JsonValue::Number(field_val_num),
                        })
                    }
                }
                FieldType::F64(_) => {
                    if let Some(field_val_f64) = field_val_num.as_f64() {
                        Ok(OwnedValue::F64(field_val_f64))
                    } else {
                        Err(ValueParsingError::OverflowError {
                            expected: "a f64",
                            json: JsonValue::Number(field_val_num),
                        })
                    }
                }
                FieldType::Bool(_) => Err(ValueParsingError::TypeError {
                    expected: "a boolean",
                    json: JsonValue::Number(field_val_num),
                }),
                FieldType::Str(opt) => {
                    if opt.should_coerce() {
                        Ok(OwnedValue::Str(field_val_num.to_string()))
                    } else {
                        Err(ValueParsingError::TypeError {
                            expected: "a string",
                            json: JsonValue::Number(field_val_num),
                        })
                    }
                }
                FieldType::Facet(_) | FieldType::Bytes(_) => Err(ValueParsingError::TypeError {
                    expected: "a string",
                    json: JsonValue::Number(field_val_num),
                }),
                FieldType::JsonObject(_) => Err(ValueParsingError::TypeError {
                    expected: "a json object",
                    json: JsonValue::Number(field_val_num),
                }),
                FieldType::IpAddr(_) => Err(ValueParsingError::TypeError {
                    expected: "a string with an ip addr",
                    json: JsonValue::Number(field_val_num),
                }),
            },
            JsonValue::Object(json_map) => match self {
                FieldType::Str(_) => {
                    if let Ok(tok_str_val) = serde_json::from_value::<PreTokenizedString>(
                        serde_json::Value::Object(json_map.clone()),
                    ) {
                        Ok(OwnedValue::PreTokStr(tok_str_val))
                    } else {
                        Err(ValueParsingError::TypeError {
                            expected: "a string or an pretokenized string",
                            json: JsonValue::Object(json_map),
                        })
                    }
                }
                FieldType::JsonObject(_) => Ok(OwnedValue::from(json_map)),
                _ => Err(ValueParsingError::TypeError {
                    expected: self.value_type().name(),
                    json: JsonValue::Object(json_map),
                }),
            },
            JsonValue::Bool(json_bool_val) => match self {
                FieldType::Bool(_) => Ok(OwnedValue::Bool(json_bool_val)),
                FieldType::Str(opt) => {
                    if opt.should_coerce() {
                        Ok(OwnedValue::Str(json_bool_val.to_string()))
                    } else {
                        Err(ValueParsingError::TypeError {
                            expected: "a string",
                            json: JsonValue::Bool(json_bool_val),
                        })
                    }
                }
                _ => Err(ValueParsingError::TypeError {
                    expected: self.value_type().name(),
                    json: JsonValue::Bool(json_bool_val),
                }),
            },
            // Could also just filter them
            JsonValue::Null => match self {
                FieldType::Str(opt) => {
                    if opt.should_coerce() {
                        Ok(OwnedValue::Str("null".to_string()))
                    } else {
                        Err(ValueParsingError::TypeError {
                            expected: "a string",
                            json: JsonValue::Null,
                        })
                    }
                }
                _ => Err(ValueParsingError::TypeError {
                    expected: self.value_type().name(),
                    json: JsonValue::Null,
                }),
            },
            _ => Err(ValueParsingError::TypeError {
                expected: self.value_type().name(),
                json: json.clone(),
            }),
        }
    }
}

#[cfg(test)]
mod tests {
    use serde_json::json;

    use super::FieldType;
    use crate::schema::field_type::ValueParsingError;
    use crate::schema::{
        Document, NumericOptions, OwnedValue, Schema, TextOptions, Type, COERCE, INDEXED,
    };
    use crate::time::{Date, Month, PrimitiveDateTime, Time};
    use crate::tokenizer::{PreTokenizedString, Token};
    use crate::{DateTime, TantivyDocument};

    /// With `COERCE`, numbers, booleans and `null` are turned into their string
    /// representation when stored in a text field.
    #[test]
    fn test_to_string_coercion() {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("id", COERCE);
        let schema = schema_builder.build();

        let coerced_docs = [
            (r#"{"id": 100}"#, "100"),
            (r#"{"id": true}"#, "true"),
            // Not sure if this null coercion is the best approach
            (r#"{"id": null}"#, "null"),
        ];
        for (doc_json, expected_text) in coerced_docs {
            let doc = TantivyDocument::parse_json(&schema, doc_json).unwrap();
            assert_eq!(
                OwnedValue::Str(expected_text.to_string()),
                doc.get_first(text_field).unwrap().into()
            );
        }
    }

    /// With `COERCE`, numeric fields accept numbers passed as JSON strings.
    #[test]
    fn test_to_number_coercion() {
        let mut schema_builder = Schema::builder();
        let i64_field = schema_builder.add_i64_field("i64", COERCE);
        let u64_field = schema_builder.add_u64_field("u64", COERCE);
        let f64_field = schema_builder.add_f64_field("f64", COERCE);
        let schema = schema_builder.build();

        let doc = TantivyDocument::parse_json(
            &schema,
            r#"{"i64": "100", "u64": "100", "f64": "100"}"#,
        )
        .unwrap();

        assert_eq!(
            OwnedValue::I64(100),
            doc.get_first(i64_field).unwrap().into()
        );
        assert_eq!(
            OwnedValue::U64(100),
            doc.get_first(u64_field).unwrap().into()
        );
        assert_eq!(
            OwnedValue::F64(100.0),
            doc.get_first(f64_field).unwrap().into()
        );
    }

    /// With `COERCE`, a bool field accepts `"true"` and `"false"` passed as strings.
    #[test]
    fn test_to_bool_coercion() {
        let mut schema_builder = Schema::builder();
        let bool_field = schema_builder.add_bool_field("bool", COERCE);
        let schema = schema_builder.build();

        let coerced_docs = [
            (r#"{"bool": "true"}"#, true),
            (r#"{"bool": "false"}"#, false),
        ];
        for (doc_json, expected_bool) in coerced_docs {
            let doc = TantivyDocument::parse_json(&schema, doc_json).unwrap();
            assert_eq!(
                OwnedValue::Bool(expected_bool),
                doc.get_first(bool_field).unwrap().into()
            );
        }
    }

    /// Without `COERCE`, numeric fields reject numbers passed as strings and the
    /// error names the expected type.
    #[test]
    fn test_to_number_no_coercion() {
        let mut schema_builder = Schema::builder();
        schema_builder.add_i64_field("i64", NumericOptions::default());
        schema_builder.add_u64_field("u64", NumericOptions::default());
        schema_builder.add_f64_field("f64", NumericOptions::default());
        let schema = schema_builder.build();

        let rejected_docs = [
            (r#"{"u64": "100"}"#, "a u64"),
            (r#"{"i64": "100"}"#, "a i64"),
            (r#"{"f64": "100"}"#, "a f64"),
        ];
        for (doc_json, expected_fragment) in rejected_docs {
            let error_message = TantivyDocument::parse_json(&schema, doc_json)
                .unwrap_err()
                .to_string();
            assert!(error_message.contains(expected_fragment));
        }
    }

    /// An RFC 3339 date string with a time zone offset is parsed and normalized to UTC.
    #[test]
    fn test_deserialize_json_date() {
        let mut schema_builder = Schema::builder();
        let date_field = schema_builder.add_date_field("date", INDEXED);
        let schema = schema_builder.build();

        let doc =
            TantivyDocument::parse_json(&schema, r#"{"date": "2019-10-12T07:20:50.52+02:00"}"#)
                .unwrap();
        let parsed_date = OwnedValue::from(doc.get_first(date_field).unwrap());

        // Time zone is converted to UTC
        assert_eq!(format!("{parsed_date:?}"), "Date(2019-10-12T05:20:50.52Z)");
    }

    /// A date value is serialized to JSON as an RFC 3339 string in UTC.
    #[test]
    fn test_serialize_json_date() {
        let mut schema_builder = Schema::builder();
        let date_field = schema_builder.add_date_field("date", INDEXED);
        let schema = schema_builder.build();

        let primitive_date_time = PrimitiveDateTime::new(
            Date::from_calendar_date(1982, Month::September, 17).unwrap(),
            Time::from_hms(13, 20, 0).unwrap(),
        );
        let mut doc = TantivyDocument::new();
        doc.add_date(date_field, DateTime::from_primitive(primitive_date_time));

        assert_eq!(
            doc.to_json(&schema),
            r#"{"date":["1982-09-17T13:20:00Z"]}"#
        );
    }

    /// A bytes field decodes base64 strings, and rejects non-string values and
    /// invalid base64.
    #[test]
    fn test_bytes_value_from_json() {
        let bytes_type = FieldType::Bytes(Default::default());

        let decoded = bytes_type
            .value_from_json(json!("dGhpcyBpcyBhIHRlc3Q="))
            .unwrap();
        assert_eq!(decoded, OwnedValue::Bytes(b"this is a test".to_vec()));

        assert!(
            matches!(
                bytes_type.value_from_json(json!(521)),
                Err(ValueParsingError::TypeError { .. })
            ),
            "Expected parse failure for wrong type"
        );

        assert!(
            matches!(
                bytes_type.value_from_json(json!("-")),
                Err(ValueParsingError::InvalidBase64 { .. })
            ),
            "Expected parse failure for invalid base64"
        );
    }

    /// A JSON object holding a serialized pre-tokenized string is accepted by a
    /// text field, and serializing the resulting value gives back the same JSON.
    #[test]
    fn test_pre_tok_str_value_from_json() {
        // The layout of this literal matters: it is compared byte for byte with
        // the pretty-printed serialization at the end of the test.
        let pre_tokenized_string_json = r#"{
  "text": "The Old Man",
  "tokens": [
    {
      "offset_from": 0,
      "offset_to": 3,
      "position": 0,
      "text": "The",
      "position_length": 1
    },
    {
      "offset_from": 4,
      "offset_to": 7,
      "position": 1,
      "text": "Old",
      "position_length": 1
    },
    {
      "offset_from": 8,
      "offset_to": 11,
      "position": 2,
      "text": "Man",
      "position_length": 1
    }
  ]
}"#;

        let expected_value = OwnedValue::PreTokStr(PreTokenizedString {
            text: String::from("The Old Man"),
            tokens: vec![
                Token {
                    offset_from: 0,
                    offset_to: 3,
                    position: 0,
                    text: String::from("The"),
                    position_length: 1,
                },
                Token {
                    offset_from: 4,
                    offset_to: 7,
                    position: 1,
                    text: String::from("Old"),
                    position_length: 1,
                },
                Token {
                    offset_from: 8,
                    offset_to: 11,
                    position: 2,
                    text: String::from("Man"),
                    position_length: 1,
                },
            ],
        });

        // JSON -> value
        let deserialized_value = FieldType::Str(TextOptions::default())
            .value_from_json(serde_json::from_str(pre_tokenized_string_json).unwrap())
            .unwrap();

        assert_eq!(deserialized_value, expected_value);

        // value -> JSON
        let serialized_value_json = serde_json::to_string_pretty(&expected_value).unwrap();

        assert_eq!(serialized_value_json, pre_tokenized_string_json);
    }

    /// Every type round-trips through its one-byte code; an unknown code is rejected.
    #[test]
    fn test_type_codes() {
        for type_val in Type::iter_values() {
            assert_eq!(Type::from_code(type_val.to_code()), Some(type_val));
        }
        assert!(Type::from_code(b'z').is_none());
    }
}


================================================
FILE: src/schema/flags.rs
================================================
use std::ops::BitOr;

use crate::schema::{DateOptions, NumericOptions, TextOptions};

/// Marker type carried by the `STORED` flag.
#[derive(Clone)]
pub struct StoredFlag;
/// Flag to mark the field as stored.
/// This flag can apply to any kind of field.
///
/// The stored fields of a document can be retrieved given its `DocId`.
/// Stored fields are stored together and compressed.
/// Reading the stored fields of a document is relatively slow.
/// (~ 100 microsecs)
///
/// It should not be used during scoring or collection.
pub const STORED: SchemaFlagList<StoredFlag, ()> = SchemaFlagList {
    head: StoredFlag,
    tail: (),
};

/// Marker type carried by the `INDEXED` flag.
#[derive(Clone)]
pub struct IndexedFlag;
/// Flag to mark the field as indexed. An indexed field is searchable and has a fieldnorm.
///
/// The `INDEXED` flag can only be used when building `NumericOptions` (`u64`, `i64`, `f64` and
/// `bool` fields). Of course, text fields can also be indexed, but this is expressed by using
/// either the `STRING` (untokenized) or `TEXT` (tokenized with the english tokenizer) flags.
pub const INDEXED: SchemaFlagList<IndexedFlag, ()> = SchemaFlagList {
    head: IndexedFlag,
    tail: (),
};

/// Marker type carried by the `COERCE` flag.
#[derive(Clone)]
pub struct CoerceFlag;
/// Flag to mark the field as coerced.
///
/// `COERCE` will try to convert values into the field's value type if they don't match.
///
/// For example, when a document is parsed from JSON, a coerced `u64` field accepts the
/// string `"100"` and a coerced text field accepts the number `100`.
pub const COERCE: SchemaFlagList<CoerceFlag, ()> = SchemaFlagList {
    head: CoerceFlag,
    tail: (),
};

/// Marker type carried by the `FAST` flag.
#[derive(Clone)]
pub struct FastFlag;
/// Flag to mark the field as a fast field (similar to Lucene's DocValues).
///
/// Fast fields can be random-accessed rapidly. Fields useful for scoring, filtering
/// or collection should be marked as fast fields.
///
/// See [fast fields](`crate::fastfield`).
pub const FAST: SchemaFlagList<FastFlag, ()> = SchemaFlagList {
    head: FastFlag,
    tail: (),
};

/// Appends a single flag to an existing flag list with the `|` operator.
///
/// The flag on the right-hand side becomes the head of the resulting list, and the whole
/// left-hand side list becomes its tail.
impl<Head, OldHead, OldTail> BitOr<SchemaFlagList<Head, ()>> for SchemaFlagList<OldHead, OldTail>
where
    Head: Clone,
    OldHead: Clone,
    OldTail: Clone,
{
    type Output = SchemaFlagList<Head, SchemaFlagList<OldHead, OldTail>>;

    fn bitor(self, rhs: SchemaFlagList<Head, ()>) -> Self::Output {
        // The right-hand side is a single-flag list: only its head carries information.
        let SchemaFlagList {
            head: new_head,
            tail: (),
        } = rhs;
        SchemaFlagList {
            head: new_head,
            tail: self,
        }
    }
}

/// Combines a single flag on the left with already-built `NumericOptions` on the right.
impl<T: Clone + Into<NumericOptions>> BitOr<NumericOptions> for SchemaFlagList<T, ()> {
    type Output = NumericOptions;

    fn bitor(self, rhs: NumericOptions) -> Self::Output {
        // Turn the lone flag into options first, then let the options merge themselves.
        let lhs: NumericOptions = self.head.into();
        lhs | rhs
    }
}

/// Combines a single flag on the left with already-built `DateOptions` on the right.
impl<T: Clone + Into<DateOptions>> BitOr<DateOptions> for SchemaFlagList<T, ()> {
    type Output = DateOptions;

    fn bitor(self, rhs: DateOptions) -> Self::Output {
        // Turn the lone flag into options first, then let the options merge themselves.
        let lhs: DateOptions = self.head.into();
        lhs | rhs
    }
}

/// Combines a single flag on the left with already-built `TextOptions` on the right.
impl<T: Clone + Into<TextOptions>> BitOr<TextOptions> for SchemaFlagList<T, ()> {
    type Output = TextOptions;

    fn bitor(self, rhs: TextOptions) -> Self::Output {
        // Turn the lone flag into options first, then let the options merge themselves.
        let lhs: TextOptions = self.head.into();
        lhs | rhs
    }
}

/// Type-level list of schema flags, built by chaining flags with the `|` operator.
///
/// A single flag is a list whose `tail` is `()`. Each additional `|` wraps the previous
/// list as the `tail` of a new list whose `head` is the newly added flag.
#[derive(Clone)]
pub struct SchemaFlagList<Head: Clone, Tail: Clone> {
    /// The most recently added flag.
    pub head: Head,
    /// The flags added before `head`, or `()` when there are none.
    pub tail: Tail,
}


================================================
FILE: src/schema/index_record_option.rs
================================================
use serde::{Deserialize, Serialize};

/// `IndexRecordOption` describes the amount of information associated
/// with a given indexed field.
///
/// It is both used to:
///
///  * describe in the schema the amount of information that should be retained during indexing (See
///    [`TextFieldIndexing::set_index_option()`](crate::schema::TextFieldIndexing::set_index_option))
///  * request that a given amount of information be decoded as one goes through a posting list.
///    (See [`InvertedIndexReader::read_postings()`](crate::InvertedIndexReader::read_postings))
#[derive(
    Clone, Copy, Debug, PartialEq, PartialOrd, Ord, Eq, Hash, Serialize, Deserialize, Default,
)]
pub enum IndexRecordOption {
    /// records only the `DocId`s
    #[serde(rename = "basic")]
    #[default]
    Basic,
    /// records the document ids as well as the term frequency.
    /// The term frequency can help giving better scoring of the documents.
    #[serde(rename = "freq")]
    WithFreqs,
    /// records the document id, the term frequency and the positions of
    /// the occurrences in the document.
    /// Positions are required to run a [`PhraseQuery`](crate::query::PhraseQuery).
    #[serde(rename = "position")]
    WithFreqsAndPositions,
}

impl IndexRecordOption {
    /// Returns true if this option includes encoding
    /// term frequencies.
    pub fn has_freq(self) -> bool {
        match self {
            IndexRecordOption::Basic => false,
            IndexRecordOption::WithFreqs | IndexRecordOption::WithFreqsAndPositions => true,
        }
    }

    /// Returns true if this option include encoding
    ///  term positions.
    pub fn has_positions(self) -> bool {
        match self {
            IndexRecordOption::Basic | IndexRecordOption::WithFreqs => false,
            IndexRecordOption::WithFreqsAndPositions => true,
        }
    }

    /// Downgrades to the next level if provided `IndexRecordOption` is unavailable.
    pub fn downgrade(&self, other: IndexRecordOption) -> IndexRecordOption {
        use IndexRecordOption::*;

        match (other, self) {
            (WithFreqsAndPositions, WithFreqsAndPositions) => WithFreqsAndPositions,
            (WithFreqs, WithFreqs) => WithFreqs,
            (WithFreqsAndPositions, WithFreqs) => WithFreqs,
            (WithFreqs, WithFreqsAndPositions) => WithFreqs,
            _ => Basic,
        }
    }
}


================================================
FILE: src/schema/ip_options.rs
================================================
use std::net::{IpAddr, Ipv6Addr};
use std::ops::BitOr;

use serde::{Deserialize, Serialize};

use super::flags::{FastFlag, IndexedFlag, SchemaFlagList, StoredFlag};

/// Conversion of an address-like value into an [`Ipv6Addr`].
pub trait IntoIpv6Addr {
    /// Consumes `self` and yields the corresponding `Ipv6Addr`.
    fn into_ipv6_addr(self) -> Ipv6Addr;
}

impl IntoIpv6Addr for IpAddr {
    /// IPv6 addresses are returned untouched; IPv4 addresses are turned into their
    /// IPv4-mapped IPv6 form.
    fn into_ipv6_addr(self) -> Ipv6Addr {
        let v4 = match self {
            IpAddr::V6(v6) => return v6,
            IpAddr::V4(v4) => v4,
        };
        v4.to_ipv6_mapped()
    }
}

/// Define how an ip field should be handled by tantivy.
#[derive(Clone, Debug, PartialEq, Eq, Serialize, Deserialize, Default)]
pub struct IpAddrOptions {
    // Whether the value is a fast field.
    fast: bool,
    // Whether the ip address should be stored in the doc store.
    stored: bool,
    // Whether the value is indexed and therefore searchable.
    indexed: bool,
    // Whether the value is normed.
    fieldnorms: bool,
}

impl IpAddrOptions {
    /// Whether the ip address is a fast field.
    #[inline]
    pub fn is_fast(&self) -> bool {
        self.fast
    }

    /// Whether the ip address is kept in the doc store.
    #[inline]
    pub fn is_stored(&self) -> bool {
        self.stored
    }

    /// Whether the ip address is indexed, and therefore searchable.
    #[inline]
    pub fn is_indexed(&self) -> bool {
        self.indexed
    }

    /// Whether the ip address is normed.
    #[inline]
    pub fn fieldnorms(&self) -> bool {
        self.fieldnorms
    }

    /// Marks the field as normed.
    ///
    /// Setting an ip address field as normed will generate
    /// the fieldnorm data for it.
    #[must_use]
    pub fn set_fieldnorms(self) -> Self {
        Self {
            fieldnorms: true,
            ..self
        }
    }

    /// Marks the field as stored.
    #[must_use]
    pub fn set_stored(self) -> Self {
        Self {
            stored: true,
            ..self
        }
    }

    /// Marks the field as indexed.
    ///
    /// An indexed ip address field gets a posting list for each value
    /// taken by the ip address. Ips are normalized to IpV6.
    ///
    /// This is required for the field to be searchable.
    #[must_use]
    pub fn set_indexed(self) -> Self {
        Self {
            indexed: true,
            ..self
        }
    }

    /// Marks the field as a fast field.
    ///
    /// Fast fields are designed for random access.
    #[must_use]
    pub fn set_fast(self) -> Self {
        Self { fast: true, ..self }
    }
}

impl From<()> for IpAddrOptions {
    fn from(_: ()) -> IpAddrOptions {
        IpAddrOptions::default()
    }
}

impl From<FastFlag> for IpAddrOptions {
    fn from(_: FastFlag) -> Self {
        IpAddrOptions {
            fieldnorms: false,
            indexed: false,
            stored: false,
            fast: true,
        }
    }
}

impl From<StoredFlag> for IpAddrOptions {
    fn from(_: StoredFlag) -> Self {
        IpAddrOptions {
            fieldnorms: false,
            indexed: false,
            stored: true,
            fast: false,
        }
    }
}

impl From<IndexedFlag> for IpAddrOptions {
    fn from(_: IndexedFlag) -> Self {
        IpAddrOptions {
            fieldnorms: true,
            indexed: true,
            stored: false,
            fast: false,
        }
    }
}

impl<T: Into<IpAddrOptions>> BitOr<T> for IpAddrOptions {
    type Output = IpAddrOptions;

    fn bitor(self, other: T) -> IpAddrOptions {
        let other = other.into();
        IpAddrOptions {
            fieldnorms: self.fieldnorms | other.fieldnorms,
            indexed: self.indexed | other.indexed,
            stored: self.stored | other.stored,
            fast: self.fast | other.fast,
        }
    }
}

impl<Head, Tail> From<SchemaFlagList<Head, Tail>> for IpAddrOptions
where
    Head: Clone,
    Tail: Clone,
    Self: BitOr<Output = Self> + From<Head> + From<Tail>,
{
    fn from(head_tail: SchemaFlagList<Head, Tail>) -> Self {
        Self::from(head_tail.head) | Self::from(head_tail.tail)
    }
}


================================================
FILE: src/schema/json_object_options.rs
================================================
use std::ops::BitOr;

use serde::{Deserialize, Serialize};

use super::text_options::{FastFieldTextOptions, TokenizerName};
use crate::schema::flags::{FastFlag, SchemaFlagList, StoredFlag};
use crate::schema::{TextFieldIndexing, TextOptions};

/// The `JsonObjectOptions` make it possible to
/// configure how a json object field should be indexed and stored.
#[derive(Clone, Debug, Default, PartialEq, Serialize, Deserialize)]
pub struct JsonObjectOptions {
    // Whether the json object should be stored.
    stored: bool,
    // If set to some, int, date, f64 and text will be indexed.
    // Text will use the TextFieldIndexing setting for indexing.
    indexing: Option<TextFieldIndexing>,
    // Store all fields as fast fields with an optional tokenizer for text.
    fast: FastFieldTextOptions,
    /// tantivy will generate paths to the different nodes of the json object
    /// both in:
    /// - the inverted index (for the terms)
    /// - fast fields (for the column names).
    ///
    /// These json paths are encoded by concatenating the list of object keys that
    /// are visited from the root to the leaf.
    ///
    /// By default, if an object key contains a `.`, we keep it as is.
    /// On the search side, users will then have to escape this `.` in the query parser
    /// or when referring to a column name.
    ///
    /// For instance:
    /// `{"root": {"child.with.dot": "hello"}}`
    ///
    /// Can be searched using the following query
    /// `root.child\.with\.dot:hello`
    ///
    /// If `expand_dots_enabled` is set to true, we will treat this `.` in object keys
    /// as json separators. In other words, if set to true, our object will be
    /// processed as if it was
    /// `{"root": {"child": {"with": {"dot": "hello"}}}}`
    /// and it can be searched using the following query:
    /// `root.child.with.dot:hello`
    #[serde(default)]
    expand_dots_enabled: bool,
}

impl JsonObjectOptions {
    /// Returns `true` if the json object should be stored.
    #[inline]
    pub fn is_stored(&self) -> bool {
        self.stored
    }

    /// Returns `true` iff the json object should be indexed.
    #[inline]
    pub fn is_indexed(&self) -> bool {
        self.indexing.is_some()
    }

    /// Returns true if and only if the json object fields are
    /// to be treated as fast fields.
    ///
    /// This is the case when fast fields are explicitly enabled, or when a fast field
    /// tokenizer has been configured.
    #[inline]
    pub fn is_fast(&self) -> bool {
        match &self.fast {
            FastFieldTextOptions::IsEnabled(enabled) => *enabled,
            FastFieldTextOptions::EnabledWithTokenizer { .. } => true,
        }
    }

    /// Returns the name of the tokenizer configured for the fast field, if any.
    ///
    /// `None` is returned when no tokenizer was configured, regardless of whether
    /// the field is a fast field or not.
    #[inline]
    pub fn get_fast_field_tokenizer_name(&self) -> Option<&str> {
        match &self.fast {
            FastFieldTextOptions::IsEnabled(_) => None,
            FastFieldTextOptions::EnabledWithTokenizer { with_tokenizer } => {
                Some(with_tokenizer.name())
            }
        }
    }

    /// Returns `true` iff dots in json keys should be expanded.
    ///
    /// When expand_dots is enabled, json object like
    /// `{"k8s.node.id": 5}` is processed as if it was
    /// `{"k8s": {"node": {"id": 5}}}`.
    /// This option has the merit of allowing users to
    /// write queries like `k8s.node.id:5`.
    /// On the other hand, enabling that feature can lead to
    /// ambiguity.
    ///
    /// If disabled, the "." needs to be escaped:
    /// `k8s\.node\.id:5`.
    #[inline]
    pub fn is_expand_dots_enabled(&self) -> bool {
        self.expand_dots_enabled
    }

    /// Sets `expand_dots_enabled` to true.
    /// See `is_expand_dots_enabled` for more information.
    // Like the other builder-style setters, this consumes `self`: dropping the
    // returned value silently discards the change, hence `#[must_use]`.
    #[must_use]
    pub fn set_expand_dots_enabled(mut self) -> Self {
        self.expand_dots_enabled = true;
        self
    }

    /// Returns the text indexing options.
    ///
    /// If set to `Some` then both int and str values will be indexed.
    /// The inner `TextFieldIndexing` will however, only apply to the str values
    /// in the json object.
    #[inline]
    pub fn get_text_indexing_options(&self) -> Option<&TextFieldIndexing> {
        self.indexing.as_ref()
    }

    /// Sets the field as stored
    #[must_use]
    pub fn set_stored(mut self) -> Self {
        self.stored = true;
        self
    }

    /// Set the field as a fast field.
    ///
    /// Fast fields are designed for random access.
    /// Access time are similar to a random lookup in an array.
    /// Text fast fields will have the term ids stored in the fast field.
    ///
    /// The effective cardinality depends on the tokenizer. Without a tokenizer, the text will be
    /// stored as is, which equals to the "raw" tokenizer. The tokenizer can be used to apply
    /// normalization like lower case.
    /// The passed tokenizer_name must be available on the fast field tokenizer manager.
    /// `Index::fast_field_tokenizer`.
    ///
    /// The original text can be retrieved via
    /// [`TermDictionary::ord_to_term()`](crate::termdict::TermDictionary::ord_to_term)
    /// from the dictionary.
    #[must_use]
    pub fn set_fast(mut self, tokenizer_name: Option<&str>) -> Self {
        self.fast = match tokenizer_name {
            Some(name) => FastFieldTextOptions::EnabledWithTokenizer {
                with_tokenizer: TokenizerName::from_name(name),
            },
            None => FastFieldTextOptions::IsEnabled(true),
        };
        self
    }

    /// Sets the field as indexed, with the specific indexing options.
    #[must_use]
    pub fn set_indexing_options(mut self, indexing: TextFieldIndexing) -> Self {
        self.indexing = Some(indexing);
        self
    }
}

impl From<StoredFlag> for JsonObjectOptions {
    fn from(_stored_flag: StoredFlag) -> Self {
        JsonObjectOptions {
            stored: true,
            indexing: None,
            fast: FastFieldTextOptions::default(),
            expand_dots_enabled: false,
        }
    }
}

impl From<FastFlag> for JsonObjectOptions {
    fn from(_fast_flag: FastFlag) -> Self {
        JsonObjectOptions {
            stored: false,
            indexing: None,
            fast: FastFieldTextOptions::IsEnabled(true),
            expand_dots_enabled: false,
        }
    }
}

impl From<()> for JsonObjectOptions {
    fn from(_: ()) -> Self {
        Self::default()
    }
}

/// Merges two sets of json options.
///
/// Boolean settings are enabled if either side enables them, the fast field settings
/// are combined with their own `|`, and the indexing options of the left-hand side win
/// when both sides define some.
impl<T: Into<JsonObjectOptions>> BitOr<T> for JsonObjectOptions {
    type Output = JsonObjectOptions;

    fn bitor(self, other: T) -> Self {
        let rhs: JsonObjectOptions = other.into();
        let JsonObjectOptions {
            stored,
            indexing,
            fast,
            expand_dots_enabled,
        } = self;
        JsonObjectOptions {
            indexing: indexing.or(rhs.indexing),
            stored: stored | rhs.stored,
            fast: fast | rhs.fast,
            expand_dots_enabled: expand_dots_enabled | rhs.expand_dots_enabled,
        }
    }
}

impl<Head, Tail> From<SchemaFlagList<Head, Tail>> for JsonObjectOptions
where
    Head: Clone,
    Tail: Clone,
    Self: BitOr<Output = Self> + From<Head> + From<Tail>,
{
    fn from(head_tail: SchemaFlagList<Head, Tail>) -> Self {
        Self::from(head_tail.head) | Self::from(head_tail.tail)
    }
}

/// Reuses the stored, indexing and fast settings of text options for a json field.
/// Dot expansion has no text counterpart and is left disabled.
impl From<TextOptions> for JsonObjectOptions {
    fn from(text_options: TextOptions) -> Self {
        let stored = text_options.is_stored();
        let indexing = text_options.get_indexing_options().cloned();
        JsonObjectOptions {
            stored,
            indexing,
            fast: text_options.fast,
            expand_dots_enabled: false,
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::schema::{FAST, STORED, TEXT};

    /// Summarizes the options as `(stored, indexed, fast)`.
    fn summary(options: JsonObjectOptions) -> (bool, bool, bool) {
        (
            options.is_stored(),
            options.is_indexed(),
            options.is_fast(),
        )
    }

    #[test]
    fn test_json_options() {
        // Each expectation reads as (stored, indexed, fast).
        assert_eq!(summary((STORED | TEXT).into()), (true, true, false));
        assert_eq!(summary(TEXT.into()), (false, true, false));
        assert_eq!(summary(STORED.into()), (true, false, false));
        assert_eq!(summary(FAST.into()), (false, false, true));
        assert_eq!(summary((FAST | STORED).into()), (true, false, true));
    }
}


================================================
FILE: src/schema/mod.rs
================================================
//! Schema definition for tantivy's indices.
//!
//! # Setting your schema in Tantivy
//!
//! Tantivy has a very strict schema.
//! The schema defines information about the fields your index contains, that is, for each field:
//!
//! - the field name (may contain any character, can't start with a `-` and can't be empty. Some
//!   characters may require escaping when using the query parser).
//! - the type of the field (currently `text`, `u64`, `i64`, `f64`, `bool`, `date`, `IpAddr`,
//!   facets, bytes and json are supported)
//! - how the field should be indexed / stored.
//!
//! This very last point is critical as it will enable / disable some of the functionality
//! for your index.
//!
//! Tantivy's schema is stored within the `meta.json` file at the root of your
//! directory.
//!
//!
//!
//! # Building a schema "programmatically"
//!
//!
//! ## Setting a text field
//!
//! ### Example
//!
//! ```
//! use tantivy::schema::*;
//! let mut schema_builder = Schema::builder();
//! let title_options = TextOptions::default()
//!     .set_stored()
//!     .set_indexing_options(TextFieldIndexing::default()
//!     .set_tokenizer("default")
//!     .set_index_option(IndexRecordOption::WithFreqsAndPositions));
//! schema_builder.add_text_field("title", title_options);
//! let schema = schema_builder.build();
//! ```
//!
//! We can split the problem of generating a search result page into two phases:
//!
//! - identifying the list of 10 or so documents to be displayed (Conceptually `query -> doc_ids[]`)
//! - for each of these documents, retrieving the information required to generate the search
//!   results page. (`doc_ids[] -> Document[]`)
//!
//! In the first phase, the ability to search for documents by the given field is determined by the
//! [`IndexRecordOption`] of our [`TextOptions`].
//!
//! The effect of each possible setting is described more in detail in [`TextOptions`].
//!
//! On the other hand setting the field as stored or not determines whether the field should be
//! returned when [`Searcher::doc()`](crate::Searcher::doc) is called.
//!
//!
//! ## Setting a u64, a i64 or a f64 field
//!
//! ### Example
//!
//! ```
//! use tantivy::schema::*;
//! let mut schema_builder = Schema::builder();
//! let num_stars_options = NumericOptions::default()
//!     .set_stored()
//!     .set_indexed();
//! schema_builder.add_u64_field("num_stars", num_stars_options);
//! let schema = schema_builder.build();
//! ```
//!
//! Just like for Text fields (see above),
//! setting the field as stored defines whether the field will be
//! returned when [`Searcher::doc()`](crate::Searcher::doc) is called,
//! and setting the field as indexed means that we will be able to perform queries such as
//! `num_stars:10`. Note that unlike text fields, numeric fields can only be indexed in one way for
//! the moment.
//!
//! ### Shortcuts
//!
//!
//! For convenience, it is possible to define your field indexing options by combining different
//! flags using the `|` operator.
//!
//! For instance, a schema containing the two fields defined in the example above could be
//! rewritten:
//!
//! ```
//! use tantivy::schema::*;
//! let mut schema_builder = Schema::builder();
//! schema_builder.add_u64_field("num_stars", INDEXED | STORED);
//! schema_builder.add_text_field("title", TEXT | STORED);
//! let schema = schema_builder.build();
//! ```
//!
//! ### Fast fields
//! This functionality is somewhat similar to Lucene's `DocValues`.
//!
//! Fields that are indexed as [`FAST`] will be stored in a special data structure that will
//! make it possible to access the value given the doc id rapidly. This is useful if the value
//! of the field is required during scoring or collection for instance.
//!
//! Some queries may leverage Fast fields when run on a field that is not indexed. This can be
//! handy if that kind of request is infrequent, however note that searching on a Fast field is
//! generally much slower than searching in an index.
//!
//! ```
//! use tantivy::schema::*;
//! let mut schema_builder = Schema::builder();
//! schema_builder.add_u64_field("population", STORED | FAST);
//! schema_builder.add_text_field("zip_code", STRING | FAST);
//! let schema = schema_builder.build();
//! ```

pub mod document;
mod facet;
mod facet_options;
mod schema;
pub(crate) mod term;

mod field_entry;
mod field_type;

mod bytes_options;
mod date_time_options;
mod field;
mod flags;
mod index_record_option;
mod ip_options;
mod json_object_options;
mod named_field_document;
mod numeric_options;
mod text_options;

use columnar::ColumnType;

pub use self::bytes_options::BytesOptions;
pub use self::date_time_options::{DateOptions, DateTimePrecision, DATE_TIME_PRECISION_INDEXED};
pub use self::document::{DocParsingError, Document, OwnedValue, TantivyDocument, Value};
pub(crate) use self::facet::FACET_SEP_BYTE;
pub use self::facet::{Facet, FacetParseError};
pub use self::facet_options::FacetOptions;
pub use self::field::Field;
pub use self::field_entry::FieldEntry;
pub use self::field_type::{FieldType, Type};
pub use self::flags::{COERCE, FAST, INDEXED, STORED};
pub use self::index_record_option::IndexRecordOption;
pub use self::ip_options::{IntoIpv6Addr, IpAddrOptions};
pub use self::json_object_options::JsonObjectOptions;
pub use self::named_field_document::NamedFieldDocument;
pub use self::numeric_options::NumericOptions;
pub use self::schema::{Schema, SchemaBuilder};
pub use self::term::{Term, ValueBytes};
pub use self::text_options::{TextFieldIndexing, TextOptions, STRING, TEXT};

/// Checks whether `field_name` is acceptable as the name of a field.
///
/// Any character is allowed, but the name must contain at least one character
/// and must not start with a `-`.
pub fn is_valid_field_name(field_name: &str) -> bool {
    match field_name.chars().next() {
        // Empty names and names with a leading dash are rejected.
        None | Some('-') => false,
        Some(_) => true,
    }
}

/// Maps a schema value type to the columnar type used for it, if there is one.
pub(crate) fn value_type_to_column_type(typ: Type) -> Option<ColumnType> {
    let column_type = match typ {
        // Json is the only type without a column type here.
        Type::Json => return None,
        // Facets share the string column type.
        Type::Str | Type::Facet => ColumnType::Str,
        Type::U64 => ColumnType::U64,
        Type::I64 => ColumnType::I64,
        Type::F64 => ColumnType::F64,
        Type::Bool => ColumnType::Bool,
        Type::Date => ColumnType::DateTime,
        Type::Bytes => ColumnType::Bytes,
        Type::IpAddr => ColumnType::IpAddr,
    };
    Some(column_type)
}

#[cfg(test)]
mod tests {

    use super::is_valid_field_name;

    #[test]
    fn test_is_valid_name() {
        // (candidate name, whether it must be accepted)
        let cases = [("シャボン玉", true), ("-fieldname", false), ("", false)];
        for (name, expected) in cases {
            assert_eq!(is_valid_field_name(name), expected, "field name: {:?}", name);
        }
    }
}


================================================
FILE: src/schema/named_field_document.rs
================================================
use std::collections::BTreeMap;

use serde::{Deserialize, Serialize};

use crate::schema::OwnedValue;

/// Internal representation of a document used for JSON
/// serialization.
///
/// A `NamedFieldDocument` is a simple representation of a document
/// as a `BTreeMap<String, Vec<OwnedValue>>`.
#[derive(Debug, Deserialize, Serialize)]
pub struct NamedFieldDocument(pub BTreeMap<String, Vec<OwnedValue>>);


================================================
FILE: src/schema/numeric_options.rs
================================================
use std::ops::BitOr;

use serde::{Deserialize, Serialize};

use super::flags::CoerceFlag;
use crate::schema::flags::{FastFlag, IndexedFlag, SchemaFlagList, StoredFlag};

/// Define how an `u64`, `i64`, or `f64` field should be handled by tantivy.
///
/// Deserialization goes through `NumericOptionsDeser`, so that a missing `fieldnorms`
/// attribute can be given a value that depends on `indexed`.
#[derive(Clone, Debug, PartialEq, Eq, Serialize, Deserialize, Default)]
#[serde(from = "NumericOptionsDeser")]
pub struct NumericOptions {
    // Whether the value is indexed and therefore searchable.
    indexed: bool,
    // Whether the field has fieldnorms.
    // This boolean has no effect if the field is not marked as indexed too.
    fieldnorms: bool,
    // Whether the value is a fast field.
    fast: bool,
    // Whether the value is stored in the doc store.
    stored: bool,
    // Whether values should be coerced to numbers. Left out of the serialized form when false.
    #[serde(skip_serializing_if = "is_false")]
    coerce: bool,
}

/// Serde `skip_serializing_if` predicate: true exactly when the flag is unset.
fn is_false(val: &bool) -> bool {
    !*val
}

/// For backward compatibility we add an intermediary to interpret the
/// lack of fieldnorms attribute as "true" if and only if indexed.
///
/// (Downstream, for the moment, this attribute is not used anyway if not indexed...)
/// Note that: newly serialized `NumericOptions` will include the new attribute.
#[derive(Deserialize)]
struct NumericOptionsDeser {
    // Mandatory in the serialized form.
    indexed: bool,
    // `None` when the attribute is absent; it is then resolved from `indexed`.
    #[serde(default)]
    fieldnorms: Option<bool>, // This attribute only has an effect if indexed is true.
    // Optional, defaults to false.
    #[serde(default)]
    fast: bool,
    // Mandatory in the serialized form.
    stored: bool,
    // Optional, defaults to false.
    #[serde(default)]
    coerce: bool,
}

impl From<NumericOptionsDeser> for NumericOptions {
    fn from(deser: NumericOptionsDeser) -> Self {
        NumericOptions {
            indexed: deser.indexed,
            fieldnorms: deser.fieldnorms.unwrap_or(deser.indexed),
            fast: deser.fast,
            stored: deser.stored,
            coerce: deser.coerce,
        }
    }
}

impl NumericOptions {
    /// Returns true iff the value is stored in the doc store.
    #[inline]
    pub fn is_stored(&self) -> bool {
        self.stored
    }

    /// Returns true iff the value is indexed and therefore searchable.
    #[inline]
    pub fn is_indexed(&self) -> bool {
        self.indexed
    }

    /// Returns true iff the field has fieldnorm.
    #[inline]
    pub fn fieldnorms(&self) -> bool {
        self.fieldnorms && self.indexed
    }

    /// Returns true iff the value is a fast field.
    #[inline]
    pub fn is_fast(&self) -> bool {
        self.fast
    }

    /// Returns true if values should be coerced to numbers.
    #[inline]
    pub fn should_coerce(&self) -> bool {
        self.coerce
    }

    /// Try to coerce values if they are not a number. Defaults to false.
    #[must_use]
    pub fn set_coerce(mut self) -> Self {
        self.coerce = true;
        self
    }

    /// Set the field as stored.
    ///
    /// Only the fields that are set as *stored* are
    /// persisted into the Tantivy's store.
    #[must_use]
    pub fn set_stored(mut self) -> NumericOptions {
        self.stored = true;
        self
    }

    /// Set the field as indexed.
    ///
    /// Setting an integer as indexed will generate
    /// a posting list for each value taken by the integer.
    ///
    /// This is required for the field to be searchable.
    #[must_use]
    pub fn set_indexed(mut self) -> NumericOptions {
        self.indexed = true;
        self
    }

    /// Set the field with fieldnorm.
    ///
    /// Setting an integer as fieldnorm will generate
    /// the fieldnorm data for it.
    #[must_use]
    pub fn set_fieldnorm(mut self) -> NumericOptions {
        self.fieldnorms = true;
        self
    }

    /// Set the field as a fast field.
    ///
    /// Fast fields are designed for random access.
    #[must_use]
    pub fn set_fast(mut self) -> NumericOptions {
        self.fast = true;
        self
    }
}

impl From<()> for NumericOptions {
    fn from(_: ()) -> NumericOptions {
        NumericOptions::default()
    }
}

impl From<CoerceFlag> for NumericOptions {
    fn from(_: CoerceFlag) -> NumericOptions {
        NumericOptions {
            indexed: false,
            fieldnorms: false,
            stored: false,
            fast: false,
            coerce: true,
        }
    }
}

impl From<FastFlag> for NumericOptions {
    fn from(_: FastFlag) -> Self {
        NumericOptions {
            indexed: false,
            fieldnorms: false,
            stored: false,
            fast: true,
            coerce: false,
        }
    }
}

impl From<StoredFlag> for NumericOptions {
    fn from(_: StoredFlag) -> Self {
        NumericOptions {
            indexed: false,
            fieldnorms: false,
            stored: true,
            fast: false,
            coerce: false,
        }
    }
}

impl From<IndexedFlag> for NumericOptions {
    fn from(_: IndexedFlag) -> Self {
        NumericOptions {
            indexed: true,
            fieldnorms: true,
            stored: false,
            fast: false,
            coerce: false,
        }
    }
}

impl<T: Into<NumericOptions>> BitOr<T> for NumericOptions {
    type Output = NumericOptions;

    fn bitor(self, other: T) -> NumericOptions {
        let other = other.into();
        NumericOptions {
            indexed: self.indexed | other.indexed,
            fieldnorms: self.fieldnorms | other.fieldnorms,
            stored: self.stored | other.stored,
            fast: self.fast | other.fast,
            coerce: self.coerce | other.coerce,
        }
    }
}

impl<Head, Tail> From<SchemaFlagList<Head, Tail>> for NumericOptions
where
    Head: Clone,
    Tail: Clone,
    Self: BitOr<Output = Self> + From<Head> + From<Tail>,
{
    fn from(head_tail: SchemaFlagList<Head, Tail>) -> Self {
        Self::from(head_tail.head) | Self::from(head_tail.tail)
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Deserializes `json` and checks that it yields exactly `expected`.
    fn assert_deser(json: &str, expected: NumericOptions) {
        let int_options: NumericOptions = serde_json::from_str(json).unwrap();
        assert_eq!(&int_options, &expected);
    }

    #[test]
    fn test_int_options_deser_if_fieldnorm_missing_indexed_true() {
        // Missing fieldnorms follows `indexed`, which is true here.
        let json = r#"{
            "indexed": true,
            "stored": false
        }"#;
        assert_deser(
            json,
            NumericOptions {
                indexed: true,
                fieldnorms: true,
                ..NumericOptions::default()
            },
        );
    }

    #[test]
    fn test_int_options_deser_if_fieldnorm_missing_indexed_false() {
        // Missing fieldnorms follows `indexed`, which is false here.
        let json = r#"{
            "indexed": false,
            "stored": false
        }"#;
        assert_deser(json, NumericOptions::default());
    }

    #[test]
    fn test_int_options_deser_if_fieldnorm_false_indexed_true() {
        // An explicit fieldnorms value wins over the `indexed` fallback.
        let json = r#"{
            "indexed": true,
            "fieldnorms": false,
            "stored": false
        }"#;
        assert_deser(
            json,
            NumericOptions {
                indexed: true,
                ..NumericOptions::default()
            },
        );
    }

    #[test]
    fn test_int_options_deser_if_fieldnorm_true_indexed_false() {
        // this one is kind of useless, at least at the moment
        let json = r#"{
            "indexed": false,
            "fieldnorms": true,
            "stored": false
        }"#;
        assert_deser(
            json,
            NumericOptions {
                fieldnorms: true,
                ..NumericOptions::default()
            },
        );
    }

    #[test]
    fn test_int_options_deser_if_coerce_true() {
        // The optional coerce attribute is read when present.
        let json = r#"{
            "indexed": false,
            "fieldnorms": true,
            "stored": false,
            "coerce": true
        }"#;
        assert_deser(
            json,
            NumericOptions {
                fieldnorms: true,
                coerce: true,
                ..NumericOptions::default()
            },
        );
    }
}


================================================
FILE: src/schema/schema.rs
================================================
use std::collections::HashMap;
use std::fmt;
use std::sync::Arc;

use serde::de::{SeqAccess, Visitor};
use serde::ser::SerializeSeq;
use serde::{Deserialize, Deserializer, Serialize, Serializer};

use super::*;
use crate::json_utils::split_json_path;
use crate::TantivyError;

/// Builder used to assemble a [`Schema`] field by field.
///
/// Tantivy has a very strict schema.
/// You need to specify in advance whether a field is indexed or not,
/// stored or not, and RAM-based or not.
///
/// This is done by creating a schema object, and
/// setting up the fields one by one.
/// It is for the moment impossible to remove fields.
///
/// # Examples
///
/// ```
/// use tantivy::schema::*;
///
/// let mut schema_builder = Schema::builder();
/// let id_field = schema_builder.add_text_field("id", STRING);
/// let title_field = schema_builder.add_text_field("title", TEXT);
/// let body_field = schema_builder.add_text_field("body", TEXT);
/// let schema = schema_builder.build();
/// ```
#[derive(Debug, Default)]
pub struct SchemaBuilder {
    // Field entries in insertion order. The id of a field is its position in this vector.
    fields: Vec<FieldEntry>,
    // Field name -> field handle. Also used to detect fields registered twice.
    fields_map: HashMap<String, Field>,
}

impl SchemaBuilder {
    /// Create a new `SchemaBuilder`
    pub fn new() -> SchemaBuilder {
        SchemaBuilder::default()
    }

    /// Adds a new u64 field.
    /// Returns the associated field handle
    ///
    /// # Panics
    ///
    /// Panics when field already exists.
    pub fn add_u64_field<T: Into<NumericOptions>>(
        &mut self,
        field_name_str: &str,
        field_options: T,
    ) -> Field {
        let field_name = String::from(field_name_str);
        let field_entry = FieldEntry::new_u64(field_name, field_options.into());
        self.add_field(field_entry)
    }

    /// Adds a new i64 field.
    /// Returns the associated field handle
    ///
    /// # Panics
    ///
    /// Panics when field already exists.
    pub fn add_i64_field<T: Into<NumericOptions>>(
        &mut self,
        field_name_str: &str,
        field_options: T,
    ) -> Field {
        let field_name = String::from(field_name_str);
        let field_entry = FieldEntry::new_i64(field_name, field_options.into());
        self.add_field(field_entry)
    }

    /// Adds a new f64 field.
    /// Returns the associated field handle
    ///
    /// # Panics
    ///
    /// Panics when field already exists.
    pub fn add_f64_field<T: Into<NumericOptions>>(
        &mut self,
        field_name_str: &str,
        field_options: T,
    ) -> Field {
        let field_name = String::from(field_name_str);
        let field_entry = FieldEntry::new_f64(field_name, field_options.into());
        self.add_field(field_entry)
    }

    /// Adds a new bool field.
    /// Returns the associated field handle
    ///
    /// # Panics
    ///
    /// Panics when field already exists.
    pub fn add_bool_field<T: Into<NumericOptions>>(
        &mut self,
        field_name_str: &str,
        field_options: T,
    ) -> Field {
        let field_name = String::from(field_name_str);
        let field_entry = FieldEntry::new_bool(field_name, field_options.into());
        self.add_field(field_entry)
    }

    /// Adds a new date field.
    /// Returns the associated field handle
    /// Internally, Tantivy simply stores dates as i64 UTC timestamps,
    /// while the user supplies DateTime values for convenience.
    ///
    /// # Panics
    ///
    /// Panics when field already exists.
    pub fn add_date_field<T: Into<DateOptions>>(
        &mut self,
        field_name_str: &str,
        field_options: T,
    ) -> Field {
        let field_name = String::from(field_name_str);
        let field_entry = FieldEntry::new_date(field_name, field_options.into());
        self.add_field(field_entry)
    }

    /// Adds a ip field.
    /// Returns the associated field handle.
    ///
    /// # Panics
    ///
    /// Panics when field already exists.
    pub fn add_ip_addr_field<T: Into<IpAddrOptions>>(
        &mut self,
        field_name_str: &str,
        field_options: T,
    ) -> Field {
        let field_name = String::from(field_name_str);
        let field_entry = FieldEntry::new_ip_addr(field_name, field_options.into());
        self.add_field(field_entry)
    }

    /// Adds a new text field.
    /// Returns the associated field handle
    ///
    /// # Panics
    ///
    /// Panics when field already exists.
    pub fn add_text_field<T: Into<TextOptions>>(
        &mut self,
        field_name_str: &str,
        field_options: T,
    ) -> Field {
        let field_name = String::from(field_name_str);
        let field_entry = FieldEntry::new_text(field_name, field_options.into());
        self.add_field(field_entry)
    }

    /// Adds a facet field to the schema.
    pub fn add_facet_field(
        &mut self,
        field_name: &str,
        facet_options: impl Into<FacetOptions>,
    ) -> Field {
        let field_entry = FieldEntry::new_facet(field_name.to_string(), facet_options.into());
        self.add_field(field_entry)
    }

    /// Adds a fast bytes field to the schema.
    ///
    /// Bytes field are not searchable and are only used
    /// as fast field, to associate any kind of payload
    /// to a document.
    ///
    /// For instance, learning-to-rank often requires to access
    /// some document features at scoring time.
    /// These can be serializing and stored as a bytes field to
    /// get access rapidly when scoring each document.
    pub fn add_bytes_field<T: Into<BytesOptions>>(
        &mut self,
        field_name: &str,
        field_options: T,
    ) -> Field {
        let field_entry = FieldEntry::new_bytes(field_name.to_string(), field_options.into());
        self.add_field(field_entry)
    }

    /// Adds a json object field to the schema.
    pub fn add_json_field<T: Into<JsonObjectOptions>>(
        &mut self,
        field_name: &str,
        field_options: T,
    ) -> Field {
        let field_entry = FieldEntry::new_json(field_name.to_string(), field_options.into());
        self.add_field(field_entry)
    }

    /// Adds a field entry to the schema in build.
    pub fn add_field(&mut self, field_entry: FieldEntry) -> Field {
        let field = Field::from_field_id(self.fields.len() as u32);
        let field_name = field_entry.name().to_string();
        if let Some(_previous_value) = self.fields_map.insert(field_name, field) {
            panic!("Field already exists in schema {}", field_entry.name());
        };
        self.fields.push(field_entry);
        field
    }

    /// Finalize the creation of a `Schema`
    /// This will consume your `SchemaBuilder`
    pub fn build(self) -> Schema {
        Schema(Arc::new(InnerSchema {
            fields: self.fields,
            fields_map: self.fields_map,
        }))
    }
}
// Shared payload of a `Schema`.
#[derive(Debug)]
struct InnerSchema {
    // Field entries, indexed by field id.
    fields: Vec<FieldEntry>,
    // Field name -> field handle lookup table.
    // Transient: it is neither compared nor serialized, and is rebuilt from `fields`
    // when a schema is deserialized.
    fields_map: HashMap<String, Field>, // transient
}

impl PartialEq for InnerSchema {
    fn eq(&self, other: &InnerSchema) -> bool {
        self.fields == other.fields
    }
}

// Marker impl: equality on `InnerSchema` is declared to be a full equivalence relation.
impl Eq for InnerSchema {}

/// The schema of an index: the ordered list of its fields.
///
/// Tantivy has a very strict schema.
/// You need to specify in advance, whether a field is indexed or not,
/// stored or not, and RAM-based or not.
///
/// This is done by creating a schema object, and
/// setting up the fields one by one.
/// It is for the moment impossible to remove fields.
///
/// The content of a `Schema` is held behind an `Arc`, so cloning a `Schema`
/// does not copy its field entries.
///
/// # Examples
///
/// ```
/// use tantivy::schema::*;
///
/// let mut schema_builder = Schema::builder();
/// let id_field = schema_builder.add_text_field("id", STRING);
/// let title_field = schema_builder.add_text_field("title", TEXT);
/// let body_field = schema_builder.add_text_field("body", TEXT);
/// let schema = schema_builder.build();
/// ```
#[derive(Clone, Eq, PartialEq, Debug)]
pub struct Schema(Arc<InnerSchema>);

/// Returns the byte offsets of every unescaped `'.'` in `field_path`, in increasing order.
///
/// A backslash escapes the byte that follows it, whatever that byte is: an escaped
/// `'.'` is not reported, and an escaped backslash does not escape anything itself.
///
/// This function operates directly on bytes (as opposed to codepoints). This is correct
/// because in UTF-8 the bytes of `'.'` and `'\\'` never appear inside a multi-byte
/// sequence.
fn locate_splitting_dots(field_path: &str) -> Vec<usize> {
    let mut dot_offsets = Vec::new();
    let mut bytes = field_path.bytes().enumerate();
    while let Some((offset, byte)) = bytes.next() {
        match byte {
            b'\\' => {
                // Consume the escaped byte (if any) so that it is never inspected.
                bytes.next();
            }
            b'.' => dot_offsets.push(offset),
            _ => {}
        }
    }
    dot_offsets
}

impl Schema {
    /// Returns the `FieldEntry` associated with a `Field`.
    ///
    /// # Panics
    ///
    /// Panics if the id of `field` is not a valid position in this schema.
    #[inline]
    pub fn get_field_entry(&self, field: Field) -> &FieldEntry {
        let field_idx = field.field_id() as usize;
        &self.0.fields[field_idx]
    }

    /// Returns the field name for a given `Field`.
    pub fn get_field_name(&self, field: Field) -> &str {
        let field_entry = self.get_field_entry(field);
        field_entry.name()
    }

    /// Returns the number of fields in the schema.
    pub fn num_fields(&self) -> usize {
        let field_entries = &self.0.fields;
        field_entries.len()
    }

    /// Iterates over all the fields of the schema, in field id order,
    /// yielding each field handle together with its entry.
    pub fn fields(&self) -> impl Iterator<Item = (Field, &FieldEntry)> {
        let field_entries = self.0.fields.iter();
        field_entries.enumerate().map(|(position, field_entry)| {
            let field = Field::from_field_id(position as u32);
            (field, field_entry)
        })
    }

    /// Creates a new builder.
    pub fn builder() -> SchemaBuilder {
        SchemaBuilder::new()
    }

    /// Returns the field handle registered under `field_name`.
    ///
    /// # Errors
    ///
    /// Returns `TantivyError::FieldNotFound` if no field has exactly this name.
    pub fn get_field(&self, field_name: &str) -> crate::Result<Field> {
        match self.0.fields_map.get(field_name) {
            Some(&field) => Ok(field),
            None => Err(TantivyError::FieldNotFound(field_name.to_string())),
        }
    }

    /// Searches for a full_path in the schema, returning the field handle and a JSON path.
    ///
    /// This function first checks whether a field is named exactly `full_path`, in which
    /// case the returned JSON path is empty.
    /// Otherwise, it splits `full_path` at its non-escaped '.' chars, starting from the
    /// last one, and tries to match the prefix with the field names. Longer field names
    /// are therefore favored. Each prefix is tried as-is first, and then rebuilt from the
    /// segments returned by `split_json_path`.
    ///
    /// This does not check if the field is a JSON field. It is possible for this function
    /// to return a non-empty JSON path with a non-JSON field.
    pub fn find_field<'a>(&self, full_path: &'a str) -> Option<(Field, &'a str)> {
        let fields_map = &self.0.fields_map;
        if let Some(&exact_field) = fields_map.get(full_path) {
            return Some((exact_field, ""));
        }

        // Walk the candidate split points from right to left: longest prefix first.
        locate_splitting_dots(full_path)
            .into_iter()
            .rev()
            .find_map(|dot_pos| {
                let raw_prefix = &full_path[..dot_pos];
                // The '.' itself belongs neither to the field name nor to the JSON path.
                let json_path = &full_path[dot_pos + 1..];
                let field = fields_map.get(raw_prefix).or_else(|| {
                    // JSON path may contain a dot, for now we try both variants to find
                    // the field.
                    let rebuilt_prefix = split_json_path(raw_prefix).join(".");
                    fields_map.get(&rebuilt_prefix)
                })?;
                Some((*field, json_path))
            })
    }

    /// Transforms a user-supplied fast field name into a column name.
    ///
    /// This is similar to `.find_field` except it includes some fallback logic to
    /// a default json field. This functionality is used in Quickwit.
    ///
    /// When `find_field` does not resolve `full_path`, the default field (if any) is
    /// used, with the whole `full_path` as JSON path.
    ///
    /// If the remaining path is non-empty and the resolved field is not a JSON field,
    /// we return None. An empty remaining path is accepted for any field type.
    #[doc(hidden)]
    pub fn find_field_with_default<'a>(
        &self,
        full_path: &'a str,
        default_field_opt: Option<Field>,
    ) -> Option<(Field, &'a str)> {
        let resolved = self
            .find_field(full_path)
            .or_else(|| default_field_opt.map(|default_field| (default_field, full_path)));
        let (field, json_path) = resolved?;
        let value_type = self.get_field_entry(field).field_type().value_type();
        let is_json = value_type == Type::Json;
        if is_json || json_path.is_empty() {
            Some((field, json_path))
        } else {
            None
        }
    }
}

impl Serialize for Schema {
    /// Serializes the schema as the sequence of its field entries, in field id order.
    ///
    /// The name lookup table is not part of the serialized form.
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: Serializer {
        let field_entries = &self.0.fields;
        let mut seq_serializer = serializer.serialize_seq(Some(field_entries.len()))?;
        field_entries
            .iter()
            .try_for_each(|field_entry| seq_serializer.serialize_element(field_entry))?;
        seq_serializer.end()
    }
}

impl<'de> Deserialize<'de> for Schema {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: Deserializer<'de> {
        struct SchemaVisitor;

        impl<'de> Visitor<'de> for SchemaVisitor {
            type Value = Schema;

            fn expecting(&self, formatter: &mut fmt::Formatter<'_>) -> fmt::Result {
                formatter.write_str("struct Schema")
            }

            fn visit_seq<A>(self, mut seq: A) -> Result<Self::Value, A::Error>
            where A: SeqAccess<'de> {
                let mut schema = SchemaBuilder {
                    fields: Vec::with_capacity(seq.size_hint().unwrap_or(0)),
                    fields_map: HashMap::with_capacity(seq.size_hint().unwrap_or(0)),
                };

                while let Some(value) = seq.next_element()? {
                    schema.add_field(value);
                }

                Ok(schema.build())
            }
        }

        deserializer.deserialize_seq(SchemaVisitor)
    }
}

#[cfg(test)]
mod tests {

    use std::collections::BTreeMap;

    use matches::{assert_matches, matches};
    use pretty_assertions::assert_eq;

    use crate::schema::field_type::ValueParsingError;
    use crate::schema::schema::DocParsingError::InvalidJson;
    use crate::schema::*;

    /// Only the dots that are not preceded by an escaping backslash are reported.
    #[test]
    fn test_locate_splitting_dots() {
        // (field path, expected byte offsets of the splitting dots)
        let cases: [(&str, &[usize]); 3] = [
            ("a.b.c", &[1, 3][..]),
            (r"a\.b.c", &[4][..]),
            (r"a\..b.c", &[3, 5][..]),
        ];
        for &(field_path, expected_offsets) in cases.iter() {
            let offsets = super::locate_splitting_dots(field_path);
            assert_eq!(offsets.as_slice(), expected_offsets);
        }
    }

    /// A text field declared with `STRING` must be reported as indexed by its entry.
    #[test]
    pub fn is_indexed_test() {
        let mut builder = Schema::builder();
        let string_field = builder.add_text_field("field_str", STRING);
        let schema = builder.build();
        let string_entry = schema.get_field_entry(string_field);
        assert!(string_entry.is_indexed());
    }

    /// Checks the pretty-printed JSON form of a schema, then reads that JSON back and
    /// verifies that names and field ids come out in declaration order.
    #[test]
    pub fn test_schema_serialization() {
        let mut builder = Schema::builder();
        builder.add_text_field("title", TEXT);
        let raw_without_fieldnorms = TextFieldIndexing::default()
            .set_tokenizer("raw")
            .set_fieldnorms(false);
        builder.add_text_field(
            "author",
            TextOptions::default().set_indexing_options(raw_without_fieldnorms),
        );
        builder.add_u64_field("count", NumericOptions::default().set_stored().set_fast());
        builder.add_i64_field(
            "popularity",
            NumericOptions::default().set_stored().set_fast(),
        );
        builder.add_f64_field(
            "score",
            NumericOptions::default()
                .set_indexed()
                .set_fieldnorm()
                .set_fast(),
        );
        builder.add_bool_field("is_read", NumericOptions::default().set_stored().set_fast());
        let built_schema = builder.build();

        let expected = r#"[
  {
    "name": "title",
    "type": "text",
    "options": {
      "indexing": {
        "record": "position",
        "fieldnorms": true,
        "tokenizer": "default"
      },
      "stored": false,
      "fast": false
    }
  },
  {
    "name": "author",
    "type": "text",
    "options": {
      "indexing": {
        "record": "basic",
        "fieldnorms": false,
        "tokenizer": "raw"
      },
      "stored": false,
      "fast": false
    }
  },
  {
    "name": "count",
    "type": "u64",
    "options": {
      "indexed": false,
      "fieldnorms": false,
      "fast": true,
      "stored": true
    }
  },
  {
    "name": "popularity",
    "type": "i64",
    "options": {
      "indexed": false,
      "fieldnorms": false,
      "fast": true,
      "stored": true
    }
  },
  {
    "name": "score",
    "type": "f64",
    "options": {
      "indexed": true,
      "fieldnorms": true,
      "fast": true,
      "stored": false
    }
  },
  {
    "name": "is_read",
    "type": "bool",
    "options": {
      "indexed": false,
      "fieldnorms": false,
      "fast": true,
      "stored": true
    }
  }
]"#;
        let schema_json = serde_json::to_string_pretty(&built_schema).unwrap();
        assert_eq!(schema_json, expected);

        // Reading the JSON back must yield the same fields, with ids following the order
        // of the entries.
        let reloaded_schema: Schema = serde_json::from_str(expected).unwrap();
        let expected_names = [
            "title",
            "author",
            "count",
            "popularity",
            "score",
            "is_read",
        ];
        let mut reloaded_fields = reloaded_schema.fields();
        for (expected_id, expected_name) in expected_names.iter().enumerate() {
            let (field, field_entry) = reloaded_fields.next().unwrap();
            assert_eq!(*expected_name, field_entry.name());
            assert_eq!(expected_id as u32, field.field_id());
        }
        assert!(reloaded_fields.next().is_none());
    }

    /// A document serialized with `to_json` and parsed again must equal the original.
    #[test]
    pub fn test_document_to_json() {
        let mut builder = Schema::builder();
        builder.add_text_field("title", TEXT);
        builder.add_text_field("author", STRING);
        builder.add_u64_field("count", NumericOptions::default().set_stored().set_fast());
        builder.add_ip_addr_field("ip", FAST | STORED);
        builder.add_bool_field("is_read", NumericOptions::default().set_stored().set_fast());
        let schema = builder.build();

        let source_json = r#"{
                "title": "my title",
                "author": "fulmicoton",
                "count": 4,
                "ip": "127.0.0.1",
                "is_read": true
        }"#;
        let original_doc = TantivyDocument::parse_json(&schema, source_json).unwrap();

        let roundtrip_json = original_doc.to_json(&schema);
        let roundtrip_doc = TantivyDocument::parse_json(&schema, &roundtrip_json).unwrap();
        assert_eq!(original_doc, roundtrip_doc);
    }

    /// IP addresses must be written back to JSON in the textual form they were given in.
    #[test]
    pub fn test_document_to_ipv4_json() {
        let mut builder = Schema::builder();
        builder.add_ip_addr_field("ip", FAST | STORED);
        let schema = builder.build();

        // (document to parse, textual form expected for the first "ip" value)
        let cases = [
            // IpV4 loopback
            (
                r#"{
                "ip": "127.0.0.1"
        }"#,
                "127.0.0.1",
            ),
            // Special case IpV6 loopback. We don't want to map that to IPv4
            (
                r#"{
                "ip": "::1"
        }"#,
                "::1",
            ),
            // testing ip address of every router in the world
            (
                r#"{
                "ip": "192.168.0.1"
        }"#,
                "192.168.0.1",
            ),
        ];

        for &(doc_json, expected_ip) in cases.iter() {
            let doc = TantivyDocument::parse_json(&schema, doc_json).unwrap();
            let serialized_doc = doc.to_json(&schema);
            let value: serde_json::Value = serde_json::from_str(&serialized_doc).unwrap();
            assert_eq!(value["ip"][0], expected_ip);
        }
    }

    /// Converting a named document keeps every value of every field, in order.
    #[test]
    pub fn test_document_from_nameddoc() {
        let mut builder = Schema::builder();
        let title = builder.add_text_field("title", TEXT);
        let val = builder.add_i64_field("val", INDEXED);
        let schema = builder.build();

        let named_values: BTreeMap<_, _> = vec![
            (
                "title".to_string(),
                vec![OwnedValue::from("title1"), OwnedValue::from("title2")],
            ),
            (
                "val".to_string(),
                vec![OwnedValue::from(14u64), OwnedValue::from(-1i64)],
            ),
        ]
        .into_iter()
        .collect();
        let doc =
            TantivyDocument::convert_named_doc(&schema, NamedFieldDocument(named_values)).unwrap();

        let titles: Vec<_> = doc.get_all(title).map(OwnedValue::from).collect();
        assert_eq!(
            titles,
            vec![
                OwnedValue::from("title1".to_string()),
                OwnedValue::from("title2".to_string())
            ]
        );

        let vals: Vec<_> = doc.get_all(val).map(OwnedValue::from).collect();
        assert_eq!(
            vals,
            vec![OwnedValue::from(14u64), OwnedValue::from(-1i64)]
        );
    }

    /// A named document mentioning a field unknown to the schema converts without error.
    #[test]
    pub fn test_document_missing_field_no_error() {
        let empty_schema = Schema::builder().build();
        let title_values = vec![OwnedValue::from("title1"), OwnedValue::from("title2")];
        let mut named_values = BTreeMap::default();
        named_values.insert("title".to_string(), title_values);
        let named_doc = NamedFieldDocument(named_values);
        TantivyDocument::convert_named_doc(&empty_schema, named_doc).unwrap();
    }

    /// Exercises `TantivyDocument::parse_json` on valid documents, documents with unknown
    /// fields, values of the wrong type, out-of-range integers and malformed JSON.
    #[test]
    pub fn test_parse_document() {
        let mut builder = Schema::builder();
        let title_field = builder.add_text_field("title", TEXT);
        let author_field = builder.add_text_field("author", STRING);
        let count_field =
            builder.add_u64_field("count", NumericOptions::default().set_stored().set_fast());
        let popularity_field = builder.add_i64_field(
            "popularity",
            NumericOptions::default().set_stored().set_fast(),
        );
        let score_field =
            builder.add_f64_field("score", NumericOptions::default().set_indexed().set_fast());
        let schema = builder.build();
        let parse = |doc_json: &str| TantivyDocument::parse_json(&schema, doc_json);

        // An empty object yields a document without any value.
        let empty_doc = parse("{}").unwrap();
        assert!(empty_doc.field_values().next().is_none());

        // Every value of a well-formed document is readable with its declared type.
        let full_doc = parse(
            r#"{
                "title": "my title",
                "author": "fulmicoton",
                "count": 4,
                "popularity": 10,
                "score": 80.5
            }"#,
        )
        .unwrap();
        assert_eq!(
            full_doc.get_first(title_field).unwrap().as_str(),
            Some("my title")
        );
        assert_eq!(
            full_doc.get_first(author_field).unwrap().as_str(),
            Some("fulmicoton")
        );
        assert_eq!(full_doc.get_first(count_field).unwrap().as_u64(), Some(4));
        assert_eq!(
            full_doc.get_first(popularity_field).unwrap().as_i64(),
            Some(10)
        );
        assert_eq!(
            full_doc.get_first(score_field).unwrap().as_f64(),
            Some(80.5f64)
        );

        // Keys that are not declared in the schema are not an error.
        let with_unknown_fields = parse(
            r#"{
                "thisfieldisnotdefinedintheschema": "my title",
                "title": "my title",
                "author": "fulmicoton",
                "count": 4,
                "popularity": 10,
                "score": 80.5,
                "jambon": "bayonne"
            }"#,
        );
        assert!(with_unknown_fields.is_ok());

        // Strings given for numeric fields are a type error.
        let numbers_as_strings = parse(
            r#"{
                "title": "my title",
                "author": "fulmicoton",
                "count": "5",
                "popularity": "10",
                "score": "80.5",
                "jambon": "bayonne"
            }"#,
        );
        assert_matches!(
            numbers_as_strings,
            Err(DocParsingError::ValueError(
                _,
                ValueParsingError::TypeError { .. }
            ))
        );

        // A negative value does not fit a u64 field.
        let negative_count = parse(
            r#"{
                "title": "my title",
                "author": "fulmicoton",
                "count": -5,
                "popularity": 10,
                "score": 80.5
            }"#,
        );
        assert_matches!(
            negative_count,
            Err(DocParsingError::ValueError(
                _,
                ValueParsingError::OverflowError { .. }
            ))
        );

        // A value just above i64::MAX must not be reported as an overflow for a u64 field.
        let large_count = parse(
            r#"{
                "title": "my title",
                "author": "fulmicoton",
                "count": 9223372036854775808,
                "popularity": 10,
                "score": 80.5
            }"#,
        );
        assert!(!matches!(
            large_count,
            Err(DocParsingError::ValueError(
                _,
                ValueParsingError::OverflowError { .. }
            ))
        ));

        // The same value overflows an i64 field.
        let large_popularity = parse(
            r#"{
                "title": "my title",
                "author": "fulmicoton",
                "count": 50,
                "popularity": 9223372036854775808,
                "score": 80.5
            }"#,
        );
        assert_matches!(
            large_popularity,
            Err(DocParsingError::ValueError(
                _,
                ValueParsingError::OverflowError { .. }
            ))
        );

        // Short JSON, under the 20 char take.
        let short_invalid = parse(r#"{"count": 50,}"#);
        assert_matches!(short_invalid, Err(InvalidJson(_)));

        // Longer invalid JSON: trailing comma after the last key.
        let long_invalid = parse(
            r#"{
                "title": "my title",
                "author": "fulmicoton",
                "count": 50,
            }"#,
        );
        assert_matches!(long_invalid, Err(InvalidJson(_)));
    }

    /// Entries copied from a deserialized schema can be appended to a builder that
    /// already holds fields; they are serialized after the pre-existing ones.
    #[test]
    pub fn test_schema_add_field() {
        let mut builder = SchemaBuilder::default();
        let raw_basic_indexing = TextFieldIndexing::default()
            .set_tokenizer("raw")
            .set_index_option(IndexRecordOption::Basic);
        builder.add_text_field(
            "_id",
            TextOptions::default()
                .set_stored()
                .set_indexing_options(raw_basic_indexing),
        );
        builder.add_date_field(
            "_timestamp",
            DateOptions::default()
                .set_stored()
                .set_indexed()
                .set_fieldnorm()
                .set_fast(),
        );

        let schema_content = r#"[
  {
    "name": "text",
    "type": "text",
    "options": {
      "indexing": {
        "record": "position",
        "fieldnorms": true,
        "tokenizer": "default"
      },
      "stored": false,
      "fast": false
    }
  },
  {
    "name": "popularity",
    "type": "i64",
    "options": {
      "indexed": false,
      "fieldnorms": false,
      "fast": true,
      "stored": true
    }
  }
]"#;
        let extra_fields_schema: Schema =
            serde_json::from_str(schema_content).expect("error while reading json");
        extra_fields_schema.fields().for_each(|(_, field_entry)| {
            builder.add_field(field_entry.clone());
        });

        let expected = r#"[
  {
    "name": "_id",
    "type": "text",
    "options": {
      "indexing": {
        "record": "basic",
        "fieldnorms": true,
        "tokenizer": "raw"
      },
      "stored": true,
      "fast": false
    }
  },
  {
    "name": "_timestamp",
    "type": "date",
    "options": {
      "indexed": true,
      "fieldnorms": true,
      "fast": true,
      "stored": true,
      "precision": "seconds"
    }
  },
  {
    "name": "text",
    "type": "text",
    "options": {
      "indexing": {
        "record": "position",
        "fieldnorms": true,
        "tokenizer": "default"
      },
      "stored": false,
      "fast": false
    }
  },
  {
    "name": "popularity",
    "type": "i64",
    "options": {
      "indexed": false,
      "fieldnorms": false,
      "fast": true,
      "stored": true
    }
  }
]"#;
        let merged_schema = builder.build();
        let schema_json = serde_json::to_string_pretty(&merged_schema).unwrap();
        assert_eq!(schema_json, expected);
    }

    /// `find_field` must prefer an exact match, then the longest field name that is a
    /// dot-delimited prefix of the path, and return `None` when nothing matches.
    #[test]
    fn test_find_field() {
        let mut builder = Schema::builder();
        builder.add_json_field("foo", STRING);

        builder.add_text_field("bar", STRING);
        builder.add_text_field("foo.bar", STRING);
        builder.add_text_field("foo.bar.baz", STRING);
        builder.add_text_field("bar.a.b.c", STRING);
        let schema = builder.build();

        // (searched path, name of the field expected to match, expected remaining path)
        let resolved_cases = [
            ("foo.bar", "foo.bar", ""),
            ("foo.bar.bar", "foo.bar", "bar"),
            ("foo.bar.baz", "foo.bar.baz", ""),
            ("foo.toto", "foo", "toto"),
            ("foo.bar", "foo.bar", ""),
            ("bar.toto.titi", "bar", "toto.titi"),
        ];
        for &(full_path, matched_name, remaining_path) in resolved_cases.iter() {
            assert_eq!(
                schema.find_field(full_path),
                Some((schema.get_field(matched_name).unwrap(), remaining_path))
            );
        }

        let unresolved_paths = [
            "hello",
            "",
            "thiswouldbeareallylongfieldname",
            "baz.bar.foo",
        ];
        for &full_path in unresolved_paths.iter() {
            assert_eq!(schema.find_field(full_path), None);
        }
    }

    /// `find_field_with_default` resolves paths like `find_field`, rejects a non-empty
    /// remaining path on a non-JSON field, and only falls back to the default field when
    /// the path resolves to no field at all.
    #[test]
    fn test_find_field_with_default() {
        let mut builder = Schema::builder();
        let default = builder.add_json_field("_default", JsonObjectOptions::default());
        let foo = builder.add_json_field("foo", STRING);
        let foo_bar = builder.add_text_field("foo.bar", STRING);
        let bar = builder.add_text_field("bar", STRING);
        let baz = builder.add_json_field("baz", JsonObjectOptions::default());
        let schema = builder.build();

        // Without a default field.
        let cases_without_default = [
            ("foo", Some((foo, ""))),
            ("foo.bar", Some((foo_bar, ""))),
            ("bar", Some((bar, ""))),
            ("bar.baz", None),
            ("baz", Some((baz, ""))),
            ("baz.foobar", Some((baz, "foobar"))),
            ("foobar", None),
        ];
        for &(full_path, expected) in cases_without_default.iter() {
            assert_eq!(schema.find_field_with_default(full_path, None), expected);
        }

        // With a default field.
        let cases_with_default = [
            ("foo", Some((foo, ""))),
            ("foo.bar", Some((foo_bar, ""))),
            ("bar", Some((bar, ""))),
            // still None, we are under an existing field
            ("bar.baz", None),
            ("baz", Some((baz, ""))),
            ("baz.foobar", Some((baz, "foobar"))),
            ("foobar", Some((default, "foobar"))),
        ];
        for &(full_path, expected) in cases_with_default.iter() {
            assert_eq!(
                schema.find_field_with_default(full_path, Some(default)),
                expected
            );
        }
    }
}


================================================
FILE: src/schema/term.rs
================================================
use std::hash::Hash;
use std::net::Ipv6Addr;
use std::{fmt, str};

use columnar::MonotonicallyMappableToU128;
use common::json_path_writer::{JSON_END_OF_PATH, JSON_PATH_SEGMENT_SEP_STR};
use common::JsonPathWriter;
use serde::{Deserialize, Serialize};

use super::date_time_options::DATE_TIME_PRECISION_INDEXED;
use super::{Field, Schema};
use crate::fastfield::FastValue;
use crate::json_utils::split_json_path;
use crate::schema::{Facet, Type};
use crate::DateTime;

/// Term represents the value that the token can take.
/// It's a serialized representation over different types.
///
/// A term is composed of a [`Field`] and the serialized value bytes.
/// The serialized value bytes themselves start with a one byte type tag followed by the payload.
#[derive(Clone, Eq, PartialEq, Ord, PartialOrd, Hash, Serialize, Deserialize)]
pub struct Term {
    // Field this term belongs to.
    field: Field,
    // Type tag (`TERM_TYPE_TAG_LEN` bytes) followed by the value payload.
    serialized_value_bytes: Vec<u8>,
}

/// The number of bytes used as metadata when serializing a term.
///
/// This is the length of the type tag stored in front of the value payload.
const TERM_TYPE_TAG_LEN: usize = 1;

impl Term {
    /// Rebuilds a `Term` from its serialized representation.
    ///
    /// The first 4 bytes hold the field id (big endian); everything after them is copied as the
    /// serialized value bytes (type tag + payload).
    ///
    /// # Panics
    ///
    /// Panics if `serialized` is shorter than 4 bytes.
    #[deprecated(
        note = "we want to avoid working on the serialized representation directly, replace with \
                typed API calls (add more if needed) or use serde to serialize/deserialize"
    )]
    pub fn wrap(serialized: &[u8]) -> Term {
        let (field_id_bytes, value_bytes) = serialized.split_at(4);
        // The left half is exactly 4 bytes long, so the conversion cannot fail.
        let field_id = u32::from_be_bytes(field_id_bytes.try_into().unwrap());
        Term {
            field: Field::from_field_id(field_id),
            serialized_value_bytes: value_bytes.to_vec(),
        }
    }

    /// Serializes the term into a freshly allocated buffer.
    ///
    /// The output starts with the field id in big endian, followed by the serialized value
    /// bytes (type tag + payload).
    #[deprecated(
        note = "we want to avoid working on the serialized representation directly, replace with \
                typed API calls (add more if needed) or use serde to serialize/deserialize"
    )]
    pub fn serialized_term(&self) -> Vec<u8> {
        let field_id_bytes = self.field.field_id().to_be_bytes();
        let mut buffer = Vec::with_capacity(4 + self.serialized_value_bytes.len());
        buffer.extend_from_slice(&field_id_bytes);
        buffer.extend_from_slice(&self.serialized_value_bytes);
        buffer
    }

    /// Creates an empty `Term` whose buffer can hold `capacity` value bytes without
    /// reallocating.
    ///
    /// The term is attached to the field with id 0 and its type tag is zeroed; both are meant to
    /// be overwritten afterwards.
    pub fn with_capacity(capacity: usize) -> Term {
        let mut serialized_value_bytes = Vec::with_capacity(TERM_TYPE_TAG_LEN + capacity);
        // Reserve the slot of the type tag.
        serialized_value_bytes.extend_from_slice(&[0u8; TERM_TYPE_TAG_LEN]);
        Term {
            field: Field::from_field_id(0u32),
            serialized_value_bytes,
        }
    }

    /// Creates a JSON term that only carries a json path (no value is appended).
    ///
    /// The json path can address a nested value in a JSON object.
    /// e.g. `{"k8s": {"node": {"id": 5}}}` can be addressed via `k8s.node.id`.
    ///
    /// If a key itself contains dots and `expand_dots_enabled` is not set, the dots need to be
    /// escaped with a backslash.
    /// e.g. `{"k8s.node": {"id": 5}}` can be addressed via `k8s\.node.id`.
    pub fn from_field_json_path(field: Field, json_path: &str, expand_dots_enabled: bool) -> Term {
        let mut path_writer = JsonPathWriter::with_expand_dots(expand_dots_enabled);
        for segment in split_json_path(json_path) {
            path_writer.push(&segment);
        }
        path_writer.set_end();

        let mut term = Term::with_type_and_field(Type::Json, field);
        term.append_bytes(path_writer.as_str().as_bytes());
        term
    }

    /// Returns the field name, followed by `.` and the json path when the term is a JSON term.
    pub fn get_full_path(&self, schema: &Schema) -> String {
        let mut full_path = schema.get_field_name(self.field()).to_string();
        match self.get_json_path() {
            Some(json_path) => {
                full_path.push('.');
                full_path.push_str(&json_path);
            }
            None => {}
        }
        full_path
    }

    /// Gets the json path if the type is JSON.
    ///
    /// The returned path does not include the trailing `JSON_END_OF_PATH` marker.
    /// Returns `None` if the term is not a JSON term or if it holds no end-of-path marker.
    ///
    /// The term bytes can be filled with arbitrary data through safe APIs (`wrap`,
    /// `append_bytes`, deserialization), so the path is decoded with a checked conversion:
    /// invalid UTF-8 sequences are replaced by `U+FFFD` instead of being trusted blindly.
    pub fn get_json_path(&self) -> Option<String> {
        let value = self.value();
        let (json_path, _) = value.as_json()?;
        // `as_json` always includes the end-of-path byte, so the slice is never empty.
        let path_without_end_marker = &json_path[..json_path.len() - 1];
        Some(String::from_utf8_lossy(path_without_end_marker).into_owned())
    }

    pub(crate) fn with_type_and_field(typ: Type, field: Field) -> Term {
        let mut term = Self::with_capacity(8);
        term.set_field_and_type(field, typ);
        term
    }

    fn with_bytes_and_field_and_payload(typ: Type, field: Field, bytes: &[u8]) -> Term {
        let mut term = Self::with_capacity(bytes.len());
        term.set_field_and_type(field, typ);
        term.serialized_value_bytes.extend_from_slice(bytes);
        term
    }

    pub(crate) fn from_fast_value<T: FastValue>(field: Field, val: &T) -> Term {
        let mut term = Self::with_type_and_field(T::to_type(), field);
        term.set_bytes(val.to_u64().to_be_bytes().as_ref());
        term
    }

    /// Sets the field and the type of an empty term.
    ///
    /// # Panics
    ///
    /// Panics when the term is not empty, i.e. when some value bytes are already set.
    /// Use `clear_with_field_and_type` in that case.
    pub(crate) fn set_field_and_type(&mut self, field: Field, typ: Type) {
        assert!(self.is_empty());
        let type_code = typ.to_code();
        self.serialized_value_bytes[0] = type_code;
        self.field = field;
    }

    /// Returns true if the term holds nothing but its type tag, i.e. no value bytes.
    pub fn is_empty(&self) -> bool {
        let stored_len = self.serialized_value_bytes.len();
        stored_len == TERM_TYPE_TAG_LEN
    }

    /// Builds a term given a field, and an `Ipv6Addr` value.
    ///
    /// The payload is the big endian encoding of the address mapped to a `u128`.
    pub fn from_field_ip_addr(field: Field, ip_addr: Ipv6Addr) -> Term {
        let encoded: [u8; 16] = ip_addr.to_u128().to_be_bytes();
        let mut term = Self::with_type_and_field(Type::IpAddr, field);
        term.set_bytes(&encoded);
        term
    }

    /// Builds a term given a field, and a `u64`-value
    pub fn from_field_u64(field: Field, val: u64) -> Term {
        Term::from_fast_value(field, &val)
    }

    /// Builds a term given a field, and a `i64`-value
    pub fn from_field_i64(field: Field, val: i64) -> Term {
        Term::from_fast_value(field, &val)
    }

    /// Builds a term given a field, and a `f64`-value
    pub fn from_field_f64(field: Field, val: f64) -> Term {
        Term::from_fast_value(field, &val)
    }

    /// Builds a term given a field, and a `bool`-value
    pub fn from_field_bool(field: Field, val: bool) -> Term {
        Term::from_fast_value(field, &val)
    }

    /// Builds a term given a field, and a `DateTime` value.
    ///
    /// The contained value may not match the value, due do the truncation used
    /// for indexed data [super::DATE_TIME_PRECISION_INDEXED].
    /// To create a term used for search use `from_field_date_for_search`.
    pub fn from_field_date(field: Field, val: DateTime) -> Term {
        Term::from_fast_value(field, &val)
    }

    /// Builds a term given a field, and a `DateTime` value, to be used when searching the
    /// inverted index.
    ///
    /// The `DateTime` is first truncated to the precision used in the index
    /// ([super::DATE_TIME_PRECISION_INDEXED]).
    pub fn from_field_date_for_search(field: Field, val: DateTime) -> Term {
        let truncated = val.truncate(DATE_TIME_PRECISION_INDEXED);
        Term::from_fast_value(field, &truncated)
    }

    /// Creates a `Term` given a facet.
    pub fn from_facet(field: Field, facet: &Facet) -> Term {
        let facet_encoded_str = facet.encoded_str();
        Term::with_bytes_and_field_and_payload(Type::Facet, field, facet_encoded_str.as_bytes())
    }

    /// Builds a term given a field, and a string value
    pub fn from_field_text(field: Field, text: &str) -> Term {
        Term::with_bytes_and_field_and_payload(Type::Str, field, text.as_bytes())
    }

    /// Builds a term bytes.
    pub fn from_field_bytes(field: Field, bytes: &[u8]) -> Term {
        Term::with_bytes_and_field_and_payload(Type::Bytes, field, bytes)
    }

    /// Removes the value_bytes and set the type code.
    pub fn clear_with_type(&mut self, typ: Type) {
        self.truncate_value_bytes(0);
        self.serialized_value_bytes[0] = typ.to_code();
    }

    /// Appends a type marker followed by the big endian `u64` encoding of a fast value.
    /// This is used in JSON type to append a fast value after the path.
    ///
    /// Existing bytes are kept as they are.
    pub fn append_type_and_fast_value<T: FastValue>(&mut self, val: T) {
        let type_code = T::to_type().to_code();
        let encoded: [u8; 8] = val.to_u64().to_be_bytes();
        self.serialized_value_bytes.push(type_code);
        self.serialized_value_bytes.extend_from_slice(&encoded);
    }

    /// Appends the string type marker followed by the UTF-8 bytes of `val`.
    /// This is used in JSON type to append a str after the path.
    ///
    /// Existing bytes are kept as they are.
    pub fn append_type_and_str(&mut self, val: &str) {
        let buffer = &mut self.serialized_value_bytes;
        buffer.push(Type::Str.to_code());
        buffer.extend_from_slice(val.as_bytes());
    }

    /// Sets the value of a `Bytes` field.
    pub fn set_bytes(&mut self, bytes: &[u8]) {
        self.truncate_value_bytes(0);
        self.serialized_value_bytes.extend(bytes);
    }

    /// Shortens the value bytes of the term to at most `len` bytes.
    /// The field and the type tag stay the same.
    pub fn truncate_value_bytes(&mut self, len: usize) {
        // The type tag sits in front of the value bytes and must be preserved.
        let new_len = len + TERM_TYPE_TAG_LEN;
        self.serialized_value_bytes.truncate(new_len);
    }

    /// The number of value bytes, not counting the type tag.
    pub fn len_bytes(&self) -> usize {
        let total_len = self.serialized_value_bytes.len();
        total_len - TERM_TYPE_TAG_LEN
    }

    /// Appends value bytes at the end of the term.
    ///
    /// Returns a mutable view over the bytes that have just been added.
    #[inline]
    pub fn append_bytes(&mut self, bytes: &[u8]) -> &mut [u8] {
        let appended_from = self.serialized_value_bytes.len();
        self.serialized_value_bytes.extend_from_slice(bytes);
        let (_, appended) = self.serialized_value_bytes.split_at_mut(appended_from);
        appended
    }

    /// Returns the type of the term, decoded from its type tag.
    pub fn typ(&self) -> Type {
        let value_bytes = self.value();
        value_bytes.typ()
    }

    /// Returns the field the term belongs to.
    pub fn field(&self) -> Field {
        self.field
    }

    /// Returns the serialized representation of the value.
    /// (This includes neither the field id nor the value type.)
    ///
    /// If the term is a string, its value is utf-8 encoded.
    /// If the term is a u64, its value is encoded in big endian.
    pub fn serialized_value_bytes(&self) -> &[u8] {
        let with_type_tag = self.serialized_value_bytes.as_slice();
        &with_type_tag[TERM_TYPE_TAG_LEN..]
    }

    /// Returns the value of the term as [`ValueBytes`]: the type tag followed by the payload
    /// (for JSON terms, the JSON path + value). This does not include the field.
    pub fn value(&self) -> ValueBytes<&[u8]> {
        ValueBytes::wrap(self.serialized_value_bytes.as_slice())
    }
}

/// ValueBytes represents a serialized value.
///
/// The value can be of any type of [`Type`] (e.g. string, u64, f64, bool, date, JSON).
/// The serialized representation matches the lexicographical order of the type.
///
/// The `ValueBytes` format is as follows:
/// `[type code: u8][serialized value]`
///
/// For JSON, `ValueBytes` is equal to:
/// `[type code=JSON][JSON path][JSON_END_OF_PATH][ValueBytes]`
///
/// The nested ValueBytes in JSON is never of type JSON. (There is no recursion.)
#[derive(Clone)]
pub struct ValueBytes<B>(B)
where B: AsRef<[u8]>;

impl<B> ValueBytes<B>
where B: AsRef<[u8]>
{
    /// Wraps a object holding bytes
    pub fn wrap(data: B) -> ValueBytes<B> {
        ValueBytes(data)
    }

    /// Wraps a object holding Vec<u8>
    pub fn to_owned(&self) -> ValueBytes<Vec<u8>> {
        ValueBytes(self.0.as_ref().to_vec())
    }

    /// Returns the raw type code, i.e. the first byte.
    ///
    /// Panics if there are no bytes at all.
    fn typ_code(&self) -> u8 {
        let bytes: &[u8] = self.0.as_ref();
        bytes[0]
    }

    /// Returns the type of the value.
    ///
    /// # Panics
    ///
    /// Panics if the type code is not a valid one.
    pub fn typ(&self) -> Type {
        let code = self.typ_code();
        Type::from_code(code).expect("The term has an invalid type code")
    }

    /// Returns the `u64` value stored in a term.
    ///
    /// Returns `None` if the term is not of the u64 type, or if the term byte representation
    /// is invalid.
    pub fn as_u64(&self) -> Option<u64> {
        let decoded: Option<u64> = self.get_fast_type();
        decoded
    }

    /// Decodes the payload as a fast value of type `T`.
    ///
    /// Returns `None` if the type tag is not the one of `T`, or if the payload is not exactly
    /// 8 bytes long.
    fn get_fast_type<T: FastValue>(&self) -> Option<T> {
        if self.typ() == T::to_type() {
            let encoded: [u8; 8] = self.raw_value_bytes_payload().try_into().ok()?;
            Some(T::from_u64(u64::from_be_bytes(encoded)))
        } else {
            None
        }
    }

    /// Returns the `i64` value stored in a term.
    ///
    /// Returns `None` if the term is not of the i64 type, or if the term byte representation
    /// is invalid.
    pub fn as_i64(&self) -> Option<i64> {
        let decoded: Option<i64> = self.get_fast_type();
        decoded
    }

    /// Returns the `f64` value stored in a term.
    ///
    /// Returns `None` if the term is not of the f64 type, or if the term byte representation
    /// is invalid.
    pub fn as_f64(&self) -> Option<f64> {
        let decoded: Option<f64> = self.get_fast_type();
        decoded
    }

    /// Returns the `bool` value stored in a term.
    ///
    /// Returns `None` if the term is not of the bool type, or if the term byte representation
    /// is invalid.
    pub fn as_bool(&self) -> Option<bool> {
        let decoded: Option<bool> = self.get_fast_type();
        decoded
    }

    /// Returns the `Date` value stored in a term.
    ///
    /// Returns `None` if the term is not of the Date type, or if the term byte representation
    /// is invalid.
    pub fn as_date(&self) -> Option<DateTime> {
        let decoded: Option<DateTime> = self.get_fast_type();
        decoded
    }

    /// Returns the text associated with the term.
    ///
    /// Returns `None` if the value is not of string type
    /// or if the bytes are not valid utf-8.
    pub fn as_str(&self) -> Option<&str> {
        match self.typ() {
            Type::Str => str::from_utf8(self.raw_value_bytes_payload()).ok(),
            _ => None,
        }
    }

    /// Returns the facet associated with the term.
    ///
    /// Returns `None` if the value is not of facet type
    /// or if the bytes are not valid utf-8.
    pub fn as_facet(&self) -> Option<Facet> {
        if self.typ() != Type::Facet {
            return None;
        }
        str::from_utf8(self.raw_value_bytes_payload())
            .ok()
            .map(|encoded| Facet::from_encoded_string(encoded.to_string()))
    }

    /// Returns the bytes associated with the term.
    ///
    /// Returns `None` if the value is not of bytes type.
    pub fn as_bytes(&self) -> Option<&[u8]> {
        let is_bytes = self.typ() == Type::Bytes;
        is_bytes.then(|| self.raw_value_bytes_payload())
    }

    /// Returns the `Ipv6Addr` value stored in the term.
    ///
    /// Returns `None` if the value is not of the IpAddr type, or if the payload is not exactly
    /// 16 bytes long.
    pub fn as_ip_addr(&self) -> Option<Ipv6Addr> {
        if self.typ() != Type::IpAddr {
            return None;
        }
        let encoded: [u8; 16] = self.raw_value_bytes_payload().try_into().ok()?;
        Some(Ipv6Addr::from_u128(u128::from_be_bytes(encoded)))
    }

    /// Returns the type of the value stored after the json path.
    ///
    /// Returns `None` if the value is not JSON, if the end-of-path marker is missing, or if no
    /// value follows the json path (the term only addresses a path).
    ///
    /// # Panics
    ///
    /// Panics if the nested value starts with an invalid type code.
    pub fn json_path_type(&self) -> Option<Type> {
        let json_value_bytes = self.as_json_value_bytes()?;
        // Without this check, `typ()` would read the type code of an empty buffer and panic
        // on an out of bounds access.
        if json_value_bytes.as_serialized().is_empty() {
            return None;
        }
        Some(json_value_bytes.typ())
    }

    /// Splits a JSON value into its json path bytes (including the JSON_END_OF_PATH byte),
    /// and the encoded ValueBytes found after the json path.
    ///
    /// Returns `None` if the value is not JSON, or if it holds no JSON_END_OF_PATH byte.
    pub(crate) fn as_json(&self) -> Option<(&[u8], ValueBytes<&[u8]>)> {
        if self.typ() != Type::Json {
            return None;
        }
        let payload = self.raw_value_bytes_payload();
        let end_of_path = payload
            .iter()
            .position(|&byte| byte == JSON_END_OF_PATH)?;
        // The marker itself stays on the path side of the split.
        let (json_path_bytes, nested_value) = payload.split_at(end_of_path + 1);
        Some((json_path_bytes, ValueBytes::wrap(nested_value)))
    }

    /// Returns the encoded ValueBytes after the json path.
    ///
    /// Returns `None` if the value is not JSON.
    pub(crate) fn as_json_value_bytes(&self) -> Option<ValueBytes<&[u8]>> {
        if self.typ() != Type::Json {
            return None;
        }
        let bytes = self.raw_value_bytes_payload();
        let pos = bytes.iter().cloned().position(|b| b == JSON_END_OF_PATH)?;
        Some(ValueBytes::wrap(&bytes[pos + 1..]))
    }

    /// Returns everything after the type tag, as is.
    ///
    /// For JSON values, this still includes the json path.
    pub(crate) fn raw_value_bytes_payload(&self) -> &[u8] {
        let bytes: &[u8] = self.0.as_ref();
        &bytes[1..]
    }

    /// Returns a copy of the value payload, without the type tag.
    ///
    /// For JSON values, this is the payload of the value nested after the json path.
    pub(crate) fn value_bytes_payload(&self) -> Vec<u8> {
        match self.as_json_value_bytes() {
            Some(nested_value) => nested_value.raw_value_bytes_payload().to_vec(),
            None => self.raw_value_bytes_payload().to_vec(),
        }
    }

    /// Returns the serialized representation of the value bytes including the type tag.
    pub fn as_serialized(&self) -> &[u8] {
        self.0.as_ref()
    }

    /// Writes a human readable rendering of the value into `f`.
    ///
    /// The output starts with `type=<type>, `, followed by the decoded value. Nothing is
    /// written after the type when the payload cannot be decoded as the declared type.
    /// JSON values are rendered as `path=<path>, ` (path segments joined with `.`), followed by
    /// the rendering of the nested value, if there is one.
    ///
    /// Returns an error if a json path is not valid utf-8.
    fn debug_value_bytes(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let typ = self.typ();
        write!(f, "type={typ:?}, ")?;
        match typ {
            Type::Str => write_opt(f, self.as_str())?,
            Type::U64 => write_opt(f, self.as_u64())?,
            Type::I64 => write_opt(f, self.as_i64())?,
            Type::F64 => write_opt(f, self.as_f64())?,
            Type::Bool => write_opt(f, self.as_bool())?,
            // TODO pretty print these types too.
            Type::Date => write_opt(f, self.as_date())?,
            Type::Facet => write_opt(f, self.as_facet())?,
            Type::Bytes => write_opt(f, self.as_bytes())?,
            Type::Json => {
                if let Some((path_bytes, sub_value_bytes)) = self.as_json() {
                    // Remove the JSON_END_OF_PATH byte & convert to utf8.
                    let path = str::from_utf8(&path_bytes[..path_bytes.len() - 1])
                        .map_err(|_| std::fmt::Error)?;
                    let path_pretty = path.replace(JSON_PATH_SEGMENT_SEP_STR, ".");
                    write!(f, "path={path_pretty}, ")?;
                    // A term that only carries a json path has no nested value. Recursing
                    // would then read the type code of an empty buffer and panic.
                    if !sub_value_bytes.as_serialized().is_empty() {
                        sub_value_bytes.debug_value_bytes(f)?;
                    }
                }
            }
            Type::IpAddr => write_opt(f, self.as_ip_addr())?,
        }
        Ok(())
    }
}

/// Writes the `Debug` rendering of the value if there is one, and nothing otherwise.
fn write_opt<T: std::fmt::Debug>(f: &mut fmt::Formatter, val_opt: Option<T>) -> fmt::Result {
    match val_opt {
        Some(val) => write!(f, "{val:?}"),
        None => Ok(()),
    }
}

impl fmt::Debug for Term {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let field_id = self.field.field_id();
        write!(f, "Term(field={field_id}, ")?;
        let value_bytes = ValueBytes::wrap(&self.serialized_value_bytes);
        value_bytes.debug_value_bytes(f)?;
        write!(f, ")",)?;
        Ok(())
    }
}

#[cfg(test)]
mod tests {

    use crate::schema::*;

    /// A text term exposes its field, its type and its text.
    #[test]
    pub fn test_term_str() {
        let mut builder = Schema::builder();
        builder.add_text_field("text", STRING);
        let title = builder.add_text_field("title", STRING);

        let title_term = Term::from_field_text(title, "test");

        assert_eq!(title_term.field(), title);
        assert_eq!(title_term.typ(), Type::Str);
        assert_eq!(title_term.value().as_str(), Some("test"));
    }

    /// A u64 term is encoded on 8 bytes and can be decoded back.
    #[test]
    pub fn test_term_u64() {
        let mut builder = Schema::builder();
        let count = builder.add_u64_field("count", INDEXED);

        let count_term = Term::from_field_u64(count, 983u64);

        assert_eq!(count_term.field(), count);
        assert_eq!(count_term.typ(), Type::U64);
        assert_eq!(count_term.serialized_value_bytes().len(), 8);
        assert_eq!(count_term.value().as_u64(), Some(983u64));
    }

    /// A bool term is encoded on 8 bytes and can be decoded back.
    #[test]
    pub fn test_term_bool() {
        let mut builder = Schema::builder();
        let flag = builder.add_bool_field("bool", INDEXED);

        let flag_term = Term::from_field_bool(flag, true);

        assert_eq!(flag_term.field(), flag);
        assert_eq!(flag_term.typ(), Type::Bool);
        assert_eq!(flag_term.serialized_value_bytes().len(), 8);
        assert_eq!(flag_term.value().as_bool(), Some(true));
    }
}


================================================
FILE: src/schema/text_options.rs
================================================
use std::borrow::Cow;
use std::ops::BitOr;

use serde::{Deserialize, Serialize};

use super::flags::{CoerceFlag, FastFlag};
use crate::schema::flags::{SchemaFlagList, StoredFlag};
use crate::schema::IndexRecordOption;

/// Defines how a text field should be handled by tantivy.
///
/// When deserializing, every missing attribute falls back to its default value.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize, Default)]
pub struct TextOptions {
    // Indexing options, if any. Not serialized when `None`.
    #[serde(default)]
    #[serde(skip_serializing_if = "Option::is_none")]
    indexing: Option<TextFieldIndexing>,
    // Whether the text is to be stored.
    #[serde(default)]
    stored: bool,
    // Fast field setting: disabled, enabled, or enabled with a tokenizer.
    #[serde(default)]
    pub(crate) fast: FastFieldTextOptions,
    #[serde(default)]
    #[serde(skip_serializing_if = "is_false")]
    /// Coerce values into strings if they are not of type string. Not serialized when `false`.
    coerce: bool,
}

#[derive(Clone, Debug, PartialEq, Serialize, Deserialize)]
#[serde(untagged)]
/// Enum controlling the fast field setting of a text field.
///
/// It is serialized untagged: either as a plain boolean, or as an object holding the
/// `with_tokenizer` attribute.
pub(crate) enum FastFieldTextOptions {
    /// Flag to enable/disable the fast field.
    IsEnabled(bool),
    /// Enable with tokenizer. The tokenizer must be available on the fast field tokenizer manager.
    /// `Index::fast_field_tokenizer`.
    EnabledWithTokenizer { with_tokenizer: TokenizerName },
}

impl Default for FastFieldTextOptions {
    fn default() -> Self {
        FastFieldTextOptions::IsEnabled(false)
    }
}

impl BitOr<FastFieldTextOptions> for FastFieldTextOptions {
    type Output = FastFieldTextOptions;

    fn bitor(self, other: FastFieldTextOptions) -> FastFieldTextOptions {
        match (self, other) {
            (
                FastFieldTextOptions::EnabledWithTokenizer {
                    with_tokenizer: tokenizer,
                },
                _,
            )
            | (
                _,
                FastFieldTextOptions::EnabledWithTokenizer {
                    with_tokenizer: tokenizer,
                },
            ) => FastFieldTextOptions::EnabledWithTokenizer {
                with_tokenizer: tokenizer,
            },
            (FastFieldTextOptions::IsEnabled(true), _)
            | (_, FastFieldTextOptions::IsEnabled(true)) => FastFieldTextOptions::IsEnabled(true),
            (_, FastFieldTextOptions::IsEnabled(false)) => FastFieldTextOptions::IsEnabled(false),
        }
    }
}

/// Returns true if the flag is unset. Used as a serde `skip_serializing_if` predicate.
fn is_false(val: &bool) -> bool {
    let flag = *val;
    !flag
}

impl TextOptions {
    /// Returns the indexing options, or `None` if no indexing options are set.
    #[inline]
    pub fn get_indexing_options(&self) -> Option<&TextFieldIndexing> {
        self.indexing.as_ref()
    }

    /// Returns true if the text is to be stored.
    #[inline]
    pub fn is_stored(&self) -> bool {
        self.stored
    }

    /// Returns true if and only if the value is a fast field, with or without a tokenizer.
    #[inline]
    pub fn is_fast(&self) -> bool {
        match &self.fast {
            FastFieldTextOptions::IsEnabled(enabled) => *enabled,
            FastFieldTextOptions::EnabledWithTokenizer { .. } => true,
        }
    }

    /// Returns the name of the tokenizer configured for the fast field.
    ///
    /// Returns `None` if the fast field is disabled, or if it is enabled without a tokenizer.
    #[inline]
    pub fn get_fast_field_tokenizer_name(&self) -> Option<&str> {
        match &self.fast {
            FastFieldTextOptions::IsEnabled(_) => None,
            FastFieldTextOptions::EnabledWithTokenizer { with_tokenizer } => {
                Some(with_tokenizer.name())
            }
        }
    }

    /// Returns true if values that are not strings (numbers, null) should be coerced to strings.
    #[inline]
    pub fn should_coerce(&self) -> bool {
        self.coerce
    }

    /// Sets the field as a fast field.
    ///
    /// Fast fields are designed for random access.
    /// Access times are similar to a random lookup in an array.
    /// Text fast fields will have the term ids stored in the fast field.
    ///
    /// The effective cardinality depends on the tokenizer. Without a tokenizer, the text will be
    /// stored as is, which is equivalent to the "raw" tokenizer. The tokenizer can be used to
    /// apply normalization like lower case.
    /// The passed tokenizer_name must be available on the fast field tokenizer manager.
    /// `Index::fast_field_tokenizer`.
    ///
    /// The original text can be retrieved via
    /// [`TermDictionary::ord_to_term()`](crate::termdict::TermDictionary::ord_to_term)
    /// from the dictionary.
    #[must_use]
    pub fn set_fast(mut self, tokenizer_name: Option<&str>) -> TextOptions {
        self.fast = match tokenizer_name {
            Some(name) => FastFieldTextOptions::EnabledWithTokenizer {
                with_tokenizer: TokenizerName::from_name(name),
            },
            None => FastFieldTextOptions::IsEnabled(true),
        };
        self
    }

    /// Coerce values if they are not of type string. Defaults to false.
    #[must_use]
    pub fn set_coerce(mut self) -> TextOptions {
        self.coerce = true;
        self
    }

    /// Sets the field as stored.
    #[must_use]
    pub fn set_stored(mut self) -> TextOptions {
        self.stored = true;
        self
    }

    /// Sets the field as indexed, with the specific indexing options.
    #[must_use]
    pub fn set_indexing_options(mut self, indexing: TextFieldIndexing) -> TextOptions {
        self.indexing = Some(indexing);
        self
    }
}

/// Name of a tokenizer, held either as a static string or as an owned one.
#[derive(Clone, PartialEq, Debug, Eq, Serialize, Deserialize)]
pub(crate) struct TokenizerName(Cow<'static, str>);

/// Tokenizer name used by `TokenizerName::default()` and by the `TEXT` options.
const DEFAULT_TOKENIZER_NAME: &str = "default";

/// Tokenizer name used by the `STRING` options, i.e. for untokenized text.
const NO_TOKENIZER_NAME: &str = "raw";

/// The default tokenizer name is `DEFAULT_TOKENIZER_NAME`.
impl Default for TokenizerName {
    fn default() -> Self {
        Self::from_static(DEFAULT_TOKENIZER_NAME)
    }
}

impl TokenizerName {
    pub const fn from_static(name: &'static str) -> Self {
        TokenizerName(Cow::Borrowed(name))
    }
    pub(crate) fn from_name(name: &str) -> Self {
        TokenizerName(Cow::Owned(name.to_string()))
    }
    pub(crate) fn name(&self) -> &str {
        &self.0
    }
}

/// Configuration defining indexing for a text field.
///
/// It defines
/// - The amount of information that should be stored about the presence of a term in a document.
///   Essentially, should we store the term frequency and/or the positions (See
///   [`IndexRecordOption`]).
/// - The name of the `Tokenizer` that should be used to process the field.
/// - Flag indicating, if fieldnorms should be stored (See [fieldnorm](crate::fieldnorm)). Defaults
///   to `true`.
///
/// When deserializing, every missing attribute falls back to its default value.
#[derive(Clone, PartialEq, Debug, Eq, Serialize, Deserialize)]
pub struct TextFieldIndexing {
    // Which information is indexed with the tokens.
    #[serde(default)]
    record: IndexRecordOption,
    // Whether fieldnorms are stored; a missing attribute deserializes to `true`.
    #[serde(default = "default_fieldnorms")]
    fieldnorms: bool,
    // Name of the tokenizer used for the field.
    #[serde(default)]
    tokenizer: TokenizerName,
}

/// Default value of the `fieldnorms` flag: fieldnorms are stored unless stated otherwise.
///
/// Also used by serde when the attribute is missing from the serialized `TextFieldIndexing`.
pub(crate) fn default_fieldnorms() -> bool {
    true
}

/// Default indexing: default record option, default tokenizer name, and the fieldnorms flag
/// returned by `default_fieldnorms`.
impl Default for TextFieldIndexing {
    fn default() -> TextFieldIndexing {
        let record = IndexRecordOption::default();
        let fieldnorms = default_fieldnorms();
        let tokenizer = TokenizerName::default();
        Self {
            record,
            fieldnorms,
            tokenizer,
        }
    }
}

impl TextFieldIndexing {
    /// Sets the tokenizer to be used for a given field.
    #[must_use]
    pub fn set_tokenizer(mut self, tokenizer_name: &str) -> TextFieldIndexing {
        self.tokenizer = TokenizerName::from_name(tokenizer_name);
        self
    }

    /// Returns the tokenizer that will be used for this field.
    pub fn tokenizer(&self) -> &str {
        self.tokenizer.name()
    }

    /// Sets fieldnorms
    #[must_use]
    pub fn set_fieldnorms(mut self, fieldnorms: bool) -> TextFieldIndexing {
        self.fieldnorms = fieldnorms;
        self
    }

    /// Returns true if and only if [fieldnorms](crate::fieldnorm) are stored.
    pub fn fieldnorms(&self) -> bool {
        self.fieldnorms
    }

    /// Sets which information should be indexed with the tokens.
    ///
    /// See [`IndexRecordOption`] for more detail.
    #[must_use]
    pub fn set_index_option(mut self, index_option: IndexRecordOption) -> TextFieldIndexing {
        self.record = index_option;
        self
    }

    /// Returns the indexing options associated with this field.
    ///
    /// See [`IndexRecordOption`] for more detail.
    pub fn index_option(&self) -> IndexRecordOption {
        self.record
    }
}

/// The field will be untokenized and indexed.
///
/// It uses the "raw" tokenizer with the basic record option and fieldnorms. The field is
/// neither stored, nor a fast field, nor coerced.
pub const STRING: TextOptions = TextOptions {
    indexing: Some(TextFieldIndexing {
        record: IndexRecordOption::Basic,
        fieldnorms: true,
        tokenizer: TokenizerName::from_static(NO_TOKENIZER_NAME),
    }),
    stored: false,
    fast: FastFieldTextOptions::IsEnabled(false),
    coerce: false,
};

/// The field will be tokenized and indexed.
///
/// It uses the "default" tokenizer, records frequencies and positions, and stores fieldnorms.
/// The field is neither stored, nor a fast field, nor coerced.
pub const TEXT: TextOptions = TextOptions {
    indexing: Some(TextFieldIndexing {
        record: IndexRecordOption::WithFreqsAndPositions,
        fieldnorms: true,
        tokenizer: TokenizerName::from_static(DEFAULT_TOKENIZER_NAME),
    }),
    stored: false,
    fast: FastFieldTextOptions::IsEnabled(false),
    coerce: false,
};

/// Combines text options with anything convertible into text options.
///
/// The indexing options of the left operand are kept if it has some, otherwise the ones of the
/// right operand are used. Flags are OR-ed, and fast field settings are combined with their own
/// `|` operator.
impl<T: Into<TextOptions>> BitOr<T> for TextOptions {
    type Output = TextOptions;

    fn bitor(self, other: T) -> TextOptions {
        let rhs: TextOptions = other.into();
        let TextOptions {
            indexing,
            stored,
            fast,
            coerce,
        } = self;
        TextOptions {
            indexing: indexing.or(rhs.indexing),
            stored: stored || rhs.stored,
            fast: fast | rhs.fast,
            coerce: coerce || rhs.coerce,
        }
    }
}

impl From<()> for TextOptions {
    fn from(_: ()) -> TextOptions {
        TextOptions::default()
    }
}

impl From<StoredFlag> for TextOptions {
    fn from(_: StoredFlag) -> TextOptions {
        TextOptions {
            indexing: None,
            stored: true,
            fast: FastFieldTextOptions::default(),
            coerce: false,
        }
    }
}

impl From<CoerceFlag> for TextOptions {
    fn from(_: CoerceFlag) -> TextOptions {
        TextOptions {
            indexing: None,
            stored: false,
            fast: FastFieldTextOptions::default(),
            coerce: true,
        }
    }
}

/// A `FastFlag` converts into options where only the fast field is enabled.
impl From<FastFlag> for TextOptions {
    fn from(_: FastFlag) -> Self {
        Self {
            fast: FastFieldTextOptions::IsEnabled(true),
            indexing: None,
            stored: false,
            coerce: false,
        }
    }
}

/// A flag list converts into the `|` combination of the options obtained from
/// its head and from its tail.
impl<Head, Tail> From<SchemaFlagList<Head, Tail>> for TextOptions
where
    Head: Clone,
    Tail: Clone,
    Self: BitOr<Output = Self> + From<Head> + From<Tail>,
{
    fn from(head_tail: SchemaFlagList<Head, Tail>) -> Self {
        let head_options = Self::from(head_tail.head);
        let tail_options = Self::from(head_tail.tail);
        head_options | tail_options
    }
}

#[cfg(test)]
mod tests {
    use crate::schema::text_options::{FastFieldTextOptions, TokenizerName};
    use crate::schema::*;

    // `STORED | TEXT` is both stored and indexed, and a field declared with `TEXT`
    // reports the "default" tokenizer.
    #[test]
    fn test_field_options() {
        let field_options = STORED | TEXT;
        assert!(field_options.is_stored());
        assert!(field_options.get_indexing_options().is_some());
        let mut schema_builder = Schema::builder();
        schema_builder.add_text_field("body", TEXT);
        let schema = schema_builder.build();
        let field = schema.get_field("body").unwrap();
        let field_entry = schema.get_field_entry(field);
        assert!(matches!(field_entry.field_type(),
                FieldType::Str(text_options)
                if text_options.get_indexing_options().unwrap().tokenizer() == "default"));
    }

    // `IndexRecordOption` variants are ordered by the amount of information recorded.
    #[test]
    fn test_cmp_index_record_option() {
        assert!(IndexRecordOption::WithFreqsAndPositions > IndexRecordOption::WithFreqs);
        assert!(IndexRecordOption::WithFreqs > IndexRecordOption::Basic);
    }

    // Omitted JSON keys fall back to defaults: an empty `indexing` object equals the
    // fully spelled-out one below, and an empty document has no indexing at all.
    #[test]
    fn serde_default_test() {
        let json = r#"
        {
            "indexing": {
                "record": "basic",
                "fieldnorms": true,
                "tokenizer": "default"
            },
            "stored": false
        }
        "#;
        let options: TextOptions = serde_json::from_str(json).unwrap();
        let options2: TextOptions = serde_json::from_str("{\"indexing\": {}}").unwrap();
        assert_eq!(options, options2);
        assert_eq!(options.indexing.unwrap().record, IndexRecordOption::Basic);
        let options3: TextOptions = serde_json::from_str("{}").unwrap();
        assert_eq!(options3.indexing, None);
    }

    // The `fast` key accepts either `{ "with_tokenizer": ... }` or a plain boolean,
    // and each form survives a serialize/deserialize round trip.
    #[test]
    fn serde_fast_field_tokenizer() {
        let json = r#" {
            "fast": { "with_tokenizer": "default" }
        } "#;
        let options: TextOptions = serde_json::from_str(json).unwrap();
        assert_eq!(
            options.fast,
            FastFieldTextOptions::EnabledWithTokenizer {
                with_tokenizer: TokenizerName::from_static("default")
            }
        );
        // Round trip of the tokenizer form.
        let options: TextOptions =
            serde_json::from_str(&serde_json::to_string(&options).unwrap()).unwrap();
        assert_eq!(
            options.fast,
            FastFieldTextOptions::EnabledWithTokenizer {
                with_tokenizer: TokenizerName::from_static("default")
            }
        );

        let json = r#" {
            "fast": true
        } "#;
        let options: TextOptions = serde_json::from_str(json).unwrap();
        assert_eq!(options.fast, FastFieldTextOptions::IsEnabled(true));
        // Round trip of `true`.
        let options: TextOptions =
            serde_json::from_str(&serde_json::to_string(&options).unwrap()).unwrap();
        assert_eq!(options.fast, FastFieldTextOptions::IsEnabled(true));

        let json = r#" {
            "fast": false
        } "#;
        let options: TextOptions = serde_json::from_str(json).unwrap();
        assert_eq!(options.fast, FastFieldTextOptions::IsEnabled(false));
        // Round trip of `false`.
        let options: TextOptions =
            serde_json::from_str(&serde_json::to_string(&options).unwrap()).unwrap();
        assert_eq!(options.fast, FastFieldTextOptions::IsEnabled(false));
    }
}


================================================
FILE: src/snippet/mod.rs
================================================
//! [`SnippetGenerator`]
//! Generates a text snippet for a given document, and some highlighted parts inside it.
//!
//! Imagine you are doing a text search in a document
//! and want to show a preview of where in the document the search terms occur,
//! along with some surrounding text to give context, and the search terms highlighted.
//!
//! [`SnippetGenerator`] serves this purpose.
//! It scans a document and constructs a snippet, which consists of sections where the search terms
//! have been found, stitched together with "..." in between sections if necessary.
//!
//! ## Example
//!
//! ```rust
//! # use tantivy::query::QueryParser;
//! # use tantivy::schema::{Schema, TEXT};
//! # use tantivy::{doc, Index};
//! use tantivy::snippet::SnippetGenerator;
//!
//! # fn main() -> tantivy::Result<()> {
//! #    let mut schema_builder = Schema::builder();
//! #    let text_field = schema_builder.add_text_field("text", TEXT);
//! #    let schema = schema_builder.build();
//! #    let index = Index::create_in_ram(schema);
//! #    let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
//! #    let doc = doc!(text_field => r#"Comme je descendais des Fleuves impassibles,
//! #   Je ne me sentis plus guidé par les haleurs :
//! #  Des Peaux-Rouges criards les avaient pris pour cibles,
//! #  Les ayant cloués nus aux poteaux de couleurs.
//! #
//! #  J'étais insoucieux de tous les équipages,
//! #  Porteur de blés flamands ou de cotons anglais.
//! #  Quand avec mes haleurs ont fini ces tapages,
//! #  Les Fleuves m'ont laissé descendre où je voulais.
//! #  "#);
//! #    index_writer.add_document(doc.clone())?;
//! #    index_writer.commit()?;
//! #    let query_parser = QueryParser::for_index(&index, vec![text_field]);
//! // ...
//! let query = query_parser.parse_query("haleurs flamands").unwrap();
//! # let reader = index.reader()?;
//! # let searcher = reader.searcher();
//! let mut snippet_generator = SnippetGenerator::create(&searcher, &*query, text_field)?;
//! snippet_generator.set_max_num_chars(100);
//! let snippet = snippet_generator.snippet_from_doc(&doc);
//! let snippet_html: String = snippet.to_html();
//! assert_eq!(snippet_html, "Comme je descendais des Fleuves impassibles,\n  Je ne me sentis plus guidé par les <b>haleurs</b> :\n Des");
//! #    Ok(())
//! # }
//! ```
//!
//! You can also specify the maximum number of characters for the snippets generated with the
//! `set_max_num_chars` method. By default, this limit is set to 150.
//!
//! SnippetGenerator needs to be created from the `Searcher` and the query, and the field on which
//! the `SnippetGenerator` should generate the snippets.

use std::cmp::Ordering;
use std::collections::{BTreeMap, BTreeSet};
use std::ops::Range;

use htmlescape::encode_minimal;

use crate::query::Query;
use crate::schema::document::{Document, Value};
use crate::schema::Field;
use crate::tokenizer::{TextAnalyzer, Token};
use crate::{Score, Searcher, Term};

/// Snippet length limit used by `SnippetGenerator::create`.
const DEFAULT_MAX_NUM_CHARS: usize = 150;

/// Markup that `Snippet::new` installs as the text emitted before each highlighted range.
const DEFAULT_SNIPPET_PREFIX: &str = "<b>";
/// Markup that `Snippet::new` installs as the text emitted after each highlighted range.
const DEFAULT_SNIPPET_POSTFIX: &str = "</b>";

/// A piece of the searched text that may be turned into a [`Snippet`].
///
/// All offsets are token offsets into the full text; they are later used to
/// slice that text, so they are byte offsets.
#[derive(Debug)]
pub(crate) struct FragmentCandidate {
    /// Sum of the scores of the target terms matched inside the fragment.
    score: Score,
    /// Offset at which the fragment starts.
    start_offset: usize,
    /// End offset of the last token added to the fragment.
    stop_offset: usize,
    /// Offsets (relative to the full text) of the tokens that matched a target term.
    highlighted: Vec<Range<usize>>,
}

impl FragmentCandidate {
    /// Create a basic `FragmentCandidate`
    ///
    /// `score`, `num_chars` are set to 0
    /// and `highlighted` is set to empty vec
    /// stop_offset is set to start_offset, which is taken as a param.
    fn new(start_offset: usize) -> FragmentCandidate {
        FragmentCandidate {
            score: 0.0,
            start_offset,
            stop_offset: start_offset,
            highlighted: vec![],
        }
    }

    /// Updates `score` and `highlighted` fields of the objects.
    ///
    /// taking the token and terms, the token is added to the fragment.
    /// if the token is one of the terms, the score
    /// and highlighted fields are updated in the fragment.
    fn try_add_token(&mut self, token: &Token, terms: &BTreeMap<String, Score>) {
        self.stop_offset = token.offset_to;

        if let Some(&score) = terms.get(&token.text.to_lowercase()) {
            self.score += score;
            self.highlighted.push(token.offset_from..token.offset_to);
        }
    }
}

/// `Snippet`
/// Contains a fragment of a document, and some highlighted parts inside it.
#[derive(Debug)]
pub struct Snippet {
    /// Text of the fragment.
    fragment: String,
    /// Ranges to highlight, used by `to_html` to slice `fragment`.
    highlighted: Vec<Range<usize>>,
    /// Text emitted by `to_html` right before each highlighted range.
    snippet_prefix: String,
    /// Text emitted by `to_html` right after each highlighted range.
    snippet_postfix: String,
}

impl Snippet {
    /// Create a new `Snippet`.
    ///
    /// `highlighted` holds ranges relative to `fragment`. The highlight markers
    /// are initialised to the defaults (`<b>` and `</b>`).
    fn new(fragment: &str, highlighted: Vec<Range<usize>>) -> Self {
        Self {
            fragment: fragment.to_string(),
            highlighted,
            snippet_prefix: DEFAULT_SNIPPET_PREFIX.to_string(),
            snippet_postfix: DEFAULT_SNIPPET_POSTFIX.to_string(),
        }
    }

    /// Create a new, empty, `Snippet`.
    ///
    /// The fragment, the highlighted ranges and both highlight markers are empty.
    pub fn empty() -> Snippet {
        Snippet {
            fragment: String::new(),
            highlighted: Vec::new(),
            snippet_prefix: String::new(),
            snippet_postfix: String::new(),
        }
    }

    /// Returns `true` if the snippet is empty, i.e. it has no highlighted range.
    pub fn is_empty(&self) -> bool {
        self.highlighted.is_empty()
    }

    /// Returns a highlighted html from the `Snippet`.
    ///
    /// The highlighted ranges are first collapsed with `collapse_overlapped_ranges`.
    /// Text inside and outside of the ranges goes through `encode_minimal`; the
    /// prefix and postfix markers are inserted as-is around each range.
    ///
    /// # Panics
    ///
    /// Slicing panics if a highlighted range does not fit inside the fragment or
    /// does not fall on UTF-8 character boundaries.
    pub fn to_html(&self) -> String {
        let mut html = String::new();
        let mut start_from: usize = 0;

        for Range { start, end } in collapse_overlapped_ranges(&self.highlighted) {
            // Plain text between the previous highlight and this one.
            html.push_str(&encode_minimal(&self.fragment[start_from..start]));
            html.push_str(&self.snippet_prefix);
            html.push_str(&encode_minimal(&self.fragment[start..end]));
            html.push_str(&self.snippet_postfix);
            start_from = end;
        }
        // Whatever follows the last highlight.
        html.push_str(&encode_minimal(&self.fragment[start_from..]));
        html
    }

    /// Returns the fragment of text used in the snippet.
    pub fn fragment(&self) -> &str {
        &self.fragment
    }

    /// Returns a list of highlighted positions from the `Snippet`.
    ///
    /// The ranges are returned as stored, i.e. not collapsed.
    pub fn highlighted(&self) -> &[Range<usize>] {
        &self.highlighted
    }

    /// Sets highlighted prefix and postfix.
    ///
    /// These replace the markers that `to_html` puts around each highlighted range.
    pub fn set_snippet_prefix_postfix(&mut self, prefix: &str, postfix: &str) {
        self.snippet_prefix = prefix.to_string();
        self.snippet_postfix = postfix.to_string();
    }
}

/// Returns the list of "good" fragments of `text`, i.e. those containing at
/// least one target term.
///
/// Only fragments whose score is strictly positive are kept, so the returned
/// `Vec` is empty when no target term is found within the text.
///
/// `text` is tokenized with `tokenizer` and consecutive tokens are grouped
/// greedily: a token is appended to the current fragment unless the fragment
/// would then span more than `max_num_chars`, in which case the current
/// fragment is closed and a new one starts at that token.
///
/// The span is measured with token offsets, i.e. in bytes of `text` and not in
/// Unicode characters. A token that is longer than `max_num_chars` on its own
/// still ends up in a fragment, which then exceeds the limit.
///
/// Fragments are returned in the order in which they were closed. Their number
/// is not capped here; picking the best one is left to the fragment selector
/// upstream.
///
/// Fragment boundaries are token boundaries, so
/// `&text[fragment.start_offset..fragment.stop_offset]` is a valid string slice
/// provided the tokenizer reports offsets on character boundaries.
fn search_fragments(
    tokenizer: &mut TextAnalyzer,
    text: &str,
    terms: &BTreeMap<String, Score>,
    max_num_chars: usize,
) -> Vec<FragmentCandidate> {
    let mut token_stream = tokenizer.token_stream(text);
    let mut fragments: Vec<FragmentCandidate> = Vec::new();
    let mut current = FragmentCandidate::new(0);
    while let Some(token) = token_stream.next() {
        let exceeds_limit = (token.offset_to - current.start_offset) > max_num_chars;
        if exceeds_limit {
            // Close the current fragment and start a fresh one at this token.
            let finished =
                std::mem::replace(&mut current, FragmentCandidate::new(token.offset_from));
            if finished.score > 0.0 {
                fragments.push(finished);
            }
        }
        current.try_add_token(token, terms);
    }
    // The fragment still being built when the tokens run out.
    if current.score > 0.0 {
        fragments.push(current);
    }

    fragments
}

/// Builds a [`Snippet`] out of the best candidate in `fragments`.
///
/// The best candidate is the one with the highest score; among candidates with
/// equal (or incomparable) scores, the one with the smallest
/// `(start_offset, stop_offset)` wins. The snippet text is the matching slice of
/// `text`, and the highlighted ranges are shifted so that they are relative to
/// the start of that slice.
///
/// When `fragments` is empty, an empty snippet is returned.
fn select_best_fragment_combination(fragments: &[FragmentCandidate], text: &str) -> Snippet {
    let best = fragments.iter().max_by(|left, right| {
        left.score
            .partial_cmp(&right.score)
            .unwrap_or(Ordering::Equal)
            // Reversed operands: on a tie, the earlier fragment compares as greater.
            .then_with(|| {
                (right.start_offset, right.stop_offset).cmp(&(left.start_offset, left.stop_offset))
            })
    });
    match best {
        // No fragment to choose from: for now create an empty snippet.
        None => Snippet::empty(),
        Some(best) => {
            let base = best.start_offset;
            let highlighted = best
                .highlighted
                .iter()
                .map(|range| (range.start - base)..(range.end - base))
                .collect();
            Snippet::new(&text[base..best.stop_offset], highlighted)
        }
    }
}

/// Sorts and removes duplicate ranges from the input.
///
/// The ranges are sorted by their start position, then by their end position,
/// and exact duplicates are removed. Ranges that merely overlap are kept.
///
/// ## Examples
/// - [0..3, 3..6, 0..3, 3..6] -> [0..3, 3..6]
/// - [2..4, 1..3, 2..4, 0..2] -> [0..2, 1..3, 2..4]
fn sort_and_deduplicate_ranges(ranges: &[Range<usize>]) -> Vec<Range<usize>> {
    let mut sorted_ranges = ranges.to_vec();
    // Elements with equal keys are equal ranges, so an unstable sort gives the
    // same result as a stable one.
    sorted_ranges.sort_unstable_by_key(|range| (range.start, range.end));
    sorted_ranges.dedup();
    sorted_ranges
}

/// Merges overlapping ranges into non-overlapping ranges.
///
/// Two ranges are merged only when they truly overlap, i.e. when the next range
/// starts strictly before the previous one ends. Ranges that are merely
/// adjacent (`a.end == b.start`) are kept separate.
///
/// This function assumes that the input ranges are already sorted by start
/// position (checked with a `debug_assert!`). Use `sort_and_deduplicate_ranges`
/// before calling this function if the input might be unsorted.
///
/// ## Examples
/// - [0..1, 2..3] -> [0..1, 2..3]  # no overlap
/// - [0..1, 1..2] -> [0..1, 1..2]  # adjacent, kept separate
/// - [0..2, 1..3] -> [0..3]  # overlapping, merged
/// - [0..3, 1..2] -> [0..3]  # second range is completely within the first
fn merge_overlapping_ranges(ranges: &[Range<usize>]) -> Vec<Range<usize>> {
    debug_assert!(is_sorted(ranges.iter().map(|range| range.start)));
    let mut result: Vec<Range<usize>> = Vec::with_capacity(ranges.len());
    for range in ranges {
        match result.last_mut() {
            // True overlap: extend the previous range if needed.
            Some(last) if last.end > range.start => {
                last.end = last.end.max(range.end);
            }
            // First range, disjoint range or adjacent range: start a new entry.
            _ => result.push(range.clone()),
        }
    }
    result
}

/// Collapses ranges into non-overlapped ranges.
///
/// This function first sorts and deduplicates the input ranges, then merges
/// the ranges that overlap. Adjacent ranges are not merged.
///
/// ## Examples
/// - [0..1, 2..3] -> [0..1, 2..3]  # no overlap
/// - [0..1, 1..2] -> [0..1, 1..2]  # adjacent, kept separate
/// - [0..2, 1..3] -> [0..3]  # overlapping, merged
/// - [0..3, 1..2] -> [0..3]  # second range is completely within the first
/// - [0..3, 3..6, 0..3, 3..6] -> [0..3, 3..6]  # duplicates removed, adjacent kept
pub fn collapse_overlapped_ranges(ranges: &[Range<usize>]) -> Vec<Range<usize>> {
    let prepared = sort_and_deduplicate_ranges(ranges);
    merge_overlapping_ranges(&prepared)
}

/// Returns `true` if the items are in non-decreasing order.
///
/// An empty or single-item iterator is considered sorted.
fn is_sorted(mut it: impl Iterator<Item = usize>) -> bool {
    let mut prev = match it.next() {
        Some(first) => first,
        None => return true,
    };
    it.all(|item| {
        let in_order = prev <= item;
        prev = item;
        in_order
    })
}

/// `SnippetGenerator`
///
/// # Example
///
/// ```rust
/// # use tantivy::query::QueryParser;
/// # use tantivy::schema::{Schema, TEXT};
/// # use tantivy::{doc, Index};
/// use tantivy::snippet::SnippetGenerator;
///
/// # fn main() -> tantivy::Result<()> {
/// #    let mut schema_builder = Schema::builder();
/// #    let text_field = schema_builder.add_text_field("text", TEXT);
/// #    let schema = schema_builder.build();
/// #    let index = Index::create_in_ram(schema);
/// #    let mut index_writer = index.writer_with_num_threads(1, 20_000_000)?;
/// #    let doc = doc!(text_field => r#"Comme je descendais des Fleuves impassibles,
/// #   Je ne me sentis plus guidé par les haleurs :
/// #  Des Peaux-Rouges criards les avaient pris pour cibles,
/// #  Les ayant cloués nus aux poteaux de couleurs.
/// #
/// #  J'étais insoucieux de tous les équipages,
/// #  Porteur de blés flamands ou de cotons anglais.
/// #  Quand avec mes haleurs ont fini ces tapages,
/// #  Les Fleuves m'ont laissé descendre où je voulais.
/// #  "#);
/// #    index_writer.add_document(doc.clone())?;
/// #    index_writer.commit()?;
/// #    let query_parser = QueryParser::for_index(&index, vec![text_field]);
/// // ...
/// let query = query_parser.parse_query("haleurs flamands").unwrap();
/// # let reader = index.reader()?;
/// # let searcher = reader.searcher();
/// let mut snippet_generator = SnippetGenerator::create(&searcher, &*query, text_field)?;
/// snippet_generator.set_max_num_chars(100);
/// let snippet = snippet_generator.snippet_from_doc(&doc);
/// let snippet_html: String = snippet.to_html();
/// assert_eq!(snippet_html, "Comme je descendais des Fleuves impassibles,\n  Je ne me sentis plus guidé par les <b>haleurs</b> :\n Des");
/// #    Ok(())
/// # }
/// ```
pub struct SnippetGenerator {
    // Terms to highlight, mapped to the score a match contributes to a fragment.
    terms_text: BTreeMap<String, Score>,
    // Tokenizer used to split the text; cloned for each call to `snippet`.
    tokenizer: TextAnalyzer,
    // Field whose values are read by `snippet_from_doc`.
    field: Field,
    // Length limit handed to `search_fragments` when building fragments.
    max_num_chars: usize,
}

impl SnippetGenerator {
    /// Creates a new snippet generator from its individual parts.
    ///
    /// `terms_text` maps each term to highlight to its score, `tokenizer` is
    /// used to split the text, `field` is the field read by
    /// [`snippet_from_doc`](Self::snippet_from_doc) and `max_num_chars` limits
    /// the size of the generated fragments.
    pub fn new(
        terms_text: BTreeMap<String, Score>,
        tokenizer: TextAnalyzer,
        field: Field,
        max_num_chars: usize,
    ) -> Self {
        Self {
            terms_text,
            tokenizer,
            field,
            max_num_chars,
        }
    }

    /// Creates a new snippet generator for `field` from the terms of `query`.
    ///
    /// Only the query terms that target `field` and have a string value are
    /// considered. Terms with a document frequency of zero are dropped; the
    /// others get the score `1 / (1 + doc_freq)`. The tokenizer is the one
    /// returned by the index for `field`, and the length limit is the default.
    ///
    /// # Errors
    ///
    /// Returns the error reported when fetching a document frequency or the
    /// tokenizer of the field.
    pub fn create(
        searcher: &Searcher,
        query: &dyn Query,
        field: Field,
    ) -> crate::Result<SnippetGenerator> {
        let mut terms: BTreeSet<&Term> = BTreeSet::new();
        query.query_terms(&mut |term, _| {
            if term.field() == field {
                terms.insert(term);
            }
        });
        let mut terms_text: BTreeMap<String, Score> = BTreeMap::new();
        for term in terms {
            let term_value = term.value();
            let term_str = match term_value.as_str() {
                Some(term_str) => term_str,
                // Not a string term: nothing to highlight.
                None => continue,
            };
            let doc_freq = searcher.doc_freq(term)?;
            if doc_freq > 0 {
                let score = 1.0 / (1.0 + doc_freq as Score);
                terms_text.insert(term_str.to_string(), score);
            }
        }
        let tokenizer = searcher.index().tokenizer_for_field(field)?;
        Ok(Self::new(
            terms_text,
            tokenizer,
            field,
            DEFAULT_MAX_NUM_CHARS,
        ))
    }

    /// Sets a maximum number of chars. Default is 150.
    pub fn set_max_num_chars(&mut self, max_num_chars: usize) {
        self.max_num_chars = max_num_chars;
    }

    #[cfg(test)]
    pub(crate) fn terms_text(&self) -> &BTreeMap<String, Score> {
        &self.terms_text
    }

    /// Generates a snippet for the given `Document`.
    ///
    /// The string values of the generator's field are concatenated, separated
    /// by a single space, and the trimmed result is passed to
    /// [`snippet`](Self::snippet).
    pub fn snippet_from_doc<D: Document>(&self, doc: &D) -> Snippet {
        let mut text = String::new();
        for (field, value) in doc.iter_fields_and_values() {
            let value = value as D::Value<'_>;
            if field == self.field {
                if let Some(val) = value.as_str() {
                    text.push(' ');
                    text.push_str(val);
                }
            }
        }

        self.snippet(text.trim())
    }

    /// Generates a snippet for the given text.
    ///
    /// Candidate fragments are searched with a clone of the tokenizer, and the
    /// best one is turned into the returned snippet.
    pub fn snippet(&self, text: &str) -> Snippet {
        let mut tokenizer = self.tokenizer.clone();
        let fragment_candidates =
            search_fragments(&mut tokenizer, text, &self.terms_text, self.max_num_chars);
        select_best_fragment_combination(&fragment_candidates, text)
    }
}

#[cfg(test)]
mod tests {
    use std::collections::BTreeMap;
    use std::ops::Range;

    use maplit::btreemap;

    use super::{collapse_overlapped_ranges, search_fragments, select_best_fragment_combination};
    use crate::query::QueryParser;
    use crate::schema::{Schema, TEXT};
    use crate::snippet::SnippetGenerator;
    use crate::tokenizer::{NgramTokenizer, SimpleTokenizer};
    use crate::Index;

    // Multi-paragraph sample text shared by the snippet tests below.
    const TEST_TEXT: &str = r#"Rust is a systems programming language sponsored by
Mozilla which describes it as a "safe, concurrent, practical language", supporting functional and
imperative-procedural paradigms. Rust is syntactically similar to C++[according to whom?],
but its designers intend it to provide better memory safety while still maintaining
performance.

Rust is free and open-source software, released under an MIT License, or Apache License
2.0. Its designers have refined the language through the experiences of writing the Servo
web browser layout engine[14] and the Rust compiler. A large proportion of current commits
to the project are from community members.[15]

Rust won first place for "most loved programming language" in the Stack Overflow Developer
Survey in 2016, 2017, and 2018."#;

    // With a limit of 100, the first fragment matches both terms and is selected;
    // `to_html` wraps the matches in `<b>` and escapes the double quote.
    #[test]
    fn test_snippet() {
        let terms = btreemap! {
            String::from("rust") => 1.0,
            String::from("language") => 0.9
        };
        let fragments = search_fragments(
            &mut From::from(SimpleTokenizer::default()),
            TEST_TEXT,
            &terms,
            100,
        );
        assert_eq!(fragments.len(), 7);
        {
            let first = &fragments[0];
            assert_eq!(first.score, 1.9);
            assert_eq!(first.stop_offset, 89);
        }
        let snippet = select_best_fragment_combination(&fragments[..], TEST_TEXT);
        assert_eq!(
            snippet.fragment,
            "Rust is a systems programming language sponsored by\nMozilla which describes it as a \
             \"safe"
        );
        assert_eq!(
            snippet.to_html(),
            "<b>Rust</b> is a systems programming <b>language</b> sponsored by\nMozilla which \
             describes it as a &quot;safe"
        )
    }

    // With a limit of 20 each fragment holds a single term, so the selected
    // snippet follows whichever term carries the higher score.
    #[test]
    fn test_snippet_scored_fragment() {
        {
            // "rust" scores higher: the first fragment wins.
            let terms = btreemap! {
                String::from("rust") =>1.0,
                String::from("language") => 0.9
            };
            let fragments = search_fragments(
                &mut From::from(SimpleTokenizer::default()),
                TEST_TEXT,
                &terms,
                20,
            );
            {
                let first = &fragments[0];
                assert_eq!(first.score, 1.0);
                assert_eq!(first.stop_offset, 17);
            }
            let snippet = select_best_fragment_combination(&fragments[..], TEST_TEXT);
            assert_eq!(snippet.to_html(), "<b>Rust</b> is a systems")
        }
        {
            // "language" scores higher: a later fragment wins.
            let terms = btreemap! {
                String::from("rust") =>0.9,
                String::from("language") => 1.0
            };
            let fragments = search_fragments(
                &mut From::from(SimpleTokenizer::default()),
                TEST_TEXT,
                &terms,
                20,
            );
            // assert_eq!(fragments.len(), 7);
            {
                let first = &fragments[0];
                assert_eq!(first.score, 0.9);
                assert_eq!(first.stop_offset, 17);
            }
            let snippet = select_best_fragment_combination(&fragments[..], TEST_TEXT);
            assert_eq!(snippet.to_html(), "programming <b>language</b>")
        }
    }

    // The only matching term sits in the second fragment; the first fragment has
    // a zero score and is not returned.
    #[test]
    fn test_snippet_in_second_fragment() {
        let text = "a b c d e f g";

        let mut terms = BTreeMap::new();
        terms.insert(String::from("c"), 1.0);

        let fragments =
            search_fragments(&mut From::from(SimpleTokenizer::default()), text, &terms, 3);

        assert_eq!(fragments.len(), 1);
        {
            let first = &fragments[0];
            assert_eq!(first.score, 1.0);
            assert_eq!(first.start_offset, 4);
            assert_eq!(first.stop_offset, 7);
        }

        let snippet = select_best_fragment_combination(&fragments[..], text);
        assert_eq!(snippet.fragment, "c d");
        assert_eq!(snippet.to_html(), "<b>c</b> d");
    }

    // Two fragments tie on score; the one that starts first is selected, with
    // the matching term at its very end.
    #[test]
    fn test_snippet_with_term_at_the_end_of_fragment() {
        let text = "a b c d e f f g";

        let mut terms = BTreeMap::new();
        terms.insert(String::from("f"), 1.0);

        let fragments =
            search_fragments(&mut From::from(SimpleTokenizer::default()), text, &terms, 3);

        assert_eq!(fragments.len(), 2);
        {
            let first = &fragments[0];
            assert_eq!(first.score, 1.0);
            assert_eq!(first.stop_offset, 11);
            assert_eq!(first.start_offset, 8);
        }

        let snippet = select_best_fragment_combination(&fragments[..], text);
        assert_eq!(snippet.fragment, "e f");
        assert_eq!(snippet.to_html(), "e <b>f</b>");
    }

    // The second fragment has the higher score and is selected over the first one.
    #[test]
    fn test_snippet_with_second_fragment_has_the_highest_score() {
        let text = "a b c d e f g";

        let mut terms = BTreeMap::new();
        terms.insert(String::from("f"), 1.0);
        terms.insert(String::from("a"), 0.9);

        let fragments =
            search_fragments(&mut From::from(SimpleTokenizer::default()), text, &terms, 7);

        assert_eq!(fragments.len(), 2);
        {
            let first = &fragments[0];
            assert_eq!(first.score, 0.9);
            assert_eq!(first.stop_offset, 7);
            assert_eq!(first.start_offset, 0);
        }

        let snippet = select_best_fragment_combination(&fragments[..], text);
        assert_eq!(snippet.fragment, "e f g");
        assert_eq!(snippet.to_html(), "e <b>f</b> g");
    }

    // A term that never occurs in the text yields no fragment and an empty snippet.
    #[test]
    fn test_snippet_with_term_not_in_text() {
        let text = "a b c d";

        let mut terms = BTreeMap::new();
        terms.insert(String::from("z"), 1.0);

        let fragments =
            search_fragments(&mut From::from(SimpleTokenizer::default()), text, &terms, 3);

        assert_eq!(fragments.len(), 0);

        let snippet = select_best_fragment_combination(&fragments[..], text);
        assert_eq!(snippet.fragment, "");
        assert_eq!(snippet.to_html(), "");
        assert!(snippet.is_empty());
    }

    // An empty term map yields no fragment and an empty snippet.
    #[test]
    fn test_snippet_with_no_terms() {
        let text = "a b c d";

        let terms = BTreeMap::new();
        let fragments =
            search_fragments(&mut From::from(SimpleTokenizer::default()), text, &terms, 3);
        assert_eq!(fragments.len(), 0);

        let snippet = select_best_fragment_combination(&fragments[..], text);
        assert_eq!(snippet.fragment, "");
        assert_eq!(snippet.to_html(), "");
        assert!(snippet.is_empty());
    }

    // `SnippetGenerator::create` scores each query term as 1 / (1 + doc_freq) and
    // drops the terms that do not occur in the index.
    #[test]
    fn test_snippet_generator_term_score() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let text_field = schema_builder.add_text_field("text", TEXT);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        {
            // writing the segment
            let mut index_writer = index.writer_for_tests()?;
            index_writer.add_document(doc!(text_field => "a"))?;
            index_writer.add_document(doc!(text_field => "a"))?;
            index_writer.add_document(doc!(text_field => "a b"))?;
            index_writer.commit()?;
        }
        let searcher = index.reader()?.searcher();
        let query_parser = QueryParser::for_index(&index, vec![text_field]);
        {
            // "e" is not in the index.
            let query = query_parser.parse_query("e")?;
            let snippet_generator = SnippetGenerator::create(&searcher, &*query, text_field)?;
            assert!(snippet_generator.terms_text().is_empty());
        }
        {
            // "a" occurs in three documents.
            let query = query_parser.parse_query("a")?;
            let snippet_generator = SnippetGenerator::create(&searcher, &*query, text_field)?;
            assert_eq!(
                &btreemap!("a".to_string() => 0.25),
                snippet_generator.terms_text()
            );
        }
        {
            // "b" occurs in one document.
            let query = query_parser.parse_query("a b")?;
            let snippet_generator = SnippetGenerator::create(&searcher, &*query, text_field)?;
            assert_eq!(
                &btreemap!("a".to_string() => 0.25, "b".to_string() => 0.5),
                snippet_generator.terms_text()
            );
        }
        {
            // "c" is not in the index and is left out.
            let query = query_parser.parse_query("a b c")?;
            let snippet_generator = SnippetGenerator::create(&searcher, &*query, text_field)?;
            assert_eq!(
                &btreemap!("a".to_string() => 0.25, "b".to_string() => 0.5),
                snippet_generator.terms_text()
            );
        }
        Ok(())
    }

    // End-to-end check with the "en_stem" tokenizer: the query term "design" ends
    // up highlighting "designers", with the default limit and with a limit of 90.
    #[cfg(feature = "stemmer")]
    #[test]
    fn test_snippet_generator() -> crate::Result<()> {
        use crate::schema::{IndexRecordOption, TextFieldIndexing, TextOptions};
        let mut schema_builder = Schema::builder();
        let text_options = TextOptions::default().set_indexing_options(
            TextFieldIndexing::default()
                .set_tokenizer("en_stem")
                .set_index_option(IndexRecordOption::Basic),
        );
        let text_field = schema_builder.add_text_field("text", text_options);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        {
            // writing the segment
            let mut index_writer = index.writer_for_tests()?;
            let doc = doc!(text_field => TEST_TEXT);
            index_writer.add_document(doc)?;
            index_writer.commit()?;
        }
        let searcher = index.reader().unwrap().searcher();
        let query_parser = QueryParser::for_index(&index, vec![text_field]);
        let query = query_parser.parse_query("rust design").unwrap();
        let mut snippet_generator =
            SnippetGenerator::create(&searcher, &*query, text_field).unwrap();
        {
            // Default limit.
            let snippet = snippet_generator.snippet(TEST_TEXT);
            assert_eq!(
                snippet.to_html(),
                "imperative-procedural paradigms. <b>Rust</b> is syntactically similar to \
                 C++[according to whom?],\nbut its <b>designers</b> intend it to provide better \
                 memory safety"
            );
        }
        {
            // Tighter limit.
            snippet_generator.set_max_num_chars(90);
            let snippet = snippet_generator.snippet(TEST_TEXT);
            assert_eq!(
                snippet.to_html(),
                "<b>Rust</b> is syntactically similar to C++[according to whom?],\nbut its \
                 <b>designers</b> intend it to"
            );
        }
        Ok(())
    }

    // Overlapping matches produced by an ngram tokenizer are rendered as a single
    // highlighted span.
    #[test]
    fn test_snippet_with_overlapped_highlighted_ranges() {
        let text = "abc";

        let mut terms = BTreeMap::new();
        terms.insert(String::from("ab"), 0.9);
        terms.insert(String::from("bc"), 1.0);

        let fragments = search_fragments(
            &mut From::from(NgramTokenizer::all_ngrams(2, 2).unwrap()),
            text,
            &terms,
            3,
        );

        assert_eq!(fragments.len(), 1);
        {
            let first = &fragments[0];
            assert_eq!(first.score, 1.9);
            assert_eq!(first.start_offset, 0);
            assert_eq!(first.stop_offset, 3);
        }

        let snippet = select_best_fragment_combination(&fragments[..], text);
        assert_eq!(snippet.fragment, "abc");
        assert_eq!(snippet.to_html(), "<b>abc</b>");
    }

    #[test]
    fn test_snippet_generator_custom_highlighted_elements() {
        let term_scores =
            btreemap! { String::from("rust") => 1.0, String::from("language") => 0.9 };
        let candidates = search_fragments(
            &mut From::from(SimpleTokenizer::default()),
            TEST_TEXT,
            &term_scores,
            100,
        );
        let mut best = select_best_fragment_combination(&candidates, TEST_TEXT);

        // Default rendering wraps matches in <b>...</b>.
        let default_html = best.to_html();
        assert_eq!(
            default_html,
            "<b>Rust</b> is a systems programming <b>language</b> sponsored by\nMozilla which \
             describes it as a &quot;safe"
        );

        // After overriding the prefix/postfix, the same matches use the custom element.
        best.set_snippet_prefix_postfix("<q class=\"super\">", "</q>");
        let custom_html = best.to_html();
        assert_eq!(
            custom_html,
            "<q class=\"super\">Rust</q> is a systems programming <q class=\"super\">language</q> \
             sponsored by\nMozilla which describes it as a &quot;safe"
        );
    }

    #[test]
    fn test_collapse_overlapped_ranges() {
        #![allow(clippy::single_range_in_vec_init)]
        // (input, expected) pairs: ranges that merely touch stay separate,
        // ranges that truly overlap or nest are merged.
        let cases: [(&[Range<usize>], &[Range<usize>]); 5] = [
            (&[0..1, 2..3], &[0..1, 2..3]),
            (&[0..1, 1..2], &[0..1, 1..2]),
            (&[0..2, 1..2], &[0..2]),
            (&[0..2, 1..3], &[0..3]),
            (&[0..3, 1..2], &[0..3]),
        ];
        for (input, expected) in cases {
            assert_eq!(collapse_overlapped_ranges(input), expected);
        }
    }

    #[test]
    fn test_no_overlap() {
        // Disjoint ranges separated by gaps come back unchanged.
        let disjoint = vec![0..1, 2..3, 4..5];
        assert_eq!(
            collapse_overlapped_ranges(&disjoint),
            vec![0..1, 2..3, 4..5]
        );
    }

    #[test]
    fn test_adjacent_ranges() {
        // Ranges that only touch at their boundaries are not merged.
        let touching = vec![0..1, 1..2, 2..3];
        assert_eq!(
            collapse_overlapped_ranges(&touching),
            vec![0..1, 1..2, 2..3]
        );
    }

    #[test]
    fn test_overlapping_ranges() {
        // A chain of pairwise-overlapping ranges collapses into one.
        let chained = vec![0..2, 1..3, 2..4];
        assert_eq!(collapse_overlapped_ranges(&chained), vec![0..4]);
    }

    #[test]
    fn test_contained_ranges() {
        // Ranges fully nested inside a larger one are absorbed by it.
        let nested = vec![0..5, 1..2, 3..4];
        assert_eq!(collapse_overlapped_ranges(&nested), vec![0..5]);
    }

    #[test]
    fn test_duplicate_ranges() {
        // Repeated ranges are reported once; the touching pair stays split.
        let with_repeats = vec![0..2, 2..4, 0..2, 2..4];
        assert_eq!(
            collapse_overlapped_ranges(&with_repeats),
            vec![0..2, 2..4]
        );
    }

    #[test]
    fn test_unsorted_ranges() {
        // Input order does not matter: the result is the merged span.
        let shuffled = vec![2..4, 0..2, 1..3];
        assert_eq!(collapse_overlapped_ranges(&shuffled), vec![0..4]);
    }

    #[test]
    fn test_complex_scenario() {
        // Unsorted mix of overlapping, nested and touching ranges.
        let mixed = vec![0..2, 5..7, 1..3, 8..9, 2..4, 3..6, 8..10];
        assert_eq!(collapse_overlapped_ranges(&mixed), vec![0..7, 8..10]);
    }

    #[test]
    fn test_empty_input() {
        // No ranges in, no ranges out.
        let nothing: Vec<Range<usize>> = Vec::new();
        assert_eq!(collapse_overlapped_ranges(&nothing), nothing);
    }

    #[test]
    fn test_single_range() {
        #![allow(clippy::single_range_in_vec_init)]
        // A lone range is returned as is.
        let lone = vec![0..5];
        assert_eq!(collapse_overlapped_ranges(&lone), vec![0..5]);
    }

    #[test]
    fn test_zero_length_ranges() {
        // Empty ranges 0..0, 1..1, 2..2, 3..3 are all preserved individually.
        let empties: Vec<Range<usize>> = (0..4).map(|at| at..at).collect();
        assert_eq!(collapse_overlapped_ranges(&empties), empties);
    }
}


================================================
FILE: src/space_usage/mod.rs
================================================
//! Representations for the space usage of various parts of a Tantivy index.
//!
//! This can be used programmatically, and will also be exposed in a human readable fashion in
//! tantivy-cli.
//!
//! One important caveat for all of this functionality is that none of it currently takes
//! storage-level details into consideration. For example, if your file system block size is 4096
//! bytes, we can under-count actual resultant space usage by up to 4095 bytes per file.

use std::collections::btree_map::Entry;
use std::collections::BTreeMap;

use columnar::ColumnSpaceUsage;
use common::ByteCount;
use serde::{Deserialize, Serialize};

use crate::index::SegmentComponent;

/// Enum containing any of the possible space usage results for segment components.
///
/// Returned by [`SegmentSpaceUsage::component`], which picks the variant
/// matching the requested `SegmentComponent`.
#[derive(Clone, Debug)]
pub enum ComponentSpaceUsage {
    /// Data is stored per field in a uniform way
    PerField(PerFieldSpaceUsage),
    /// Data is stored in separate pieces in the store
    Store(StoreSpaceUsage),
    /// Some sort of raw byte count
    Basic(ByteCount),
}

/// Represents combined space usage of an entire searcher and its component segments.
///
/// The stored total is maintained incrementally: every call to `add_segment`
/// adds that segment's total to it.
#[derive(Clone, Debug, Serialize, Deserialize)]
pub struct SearcherSpaceUsage {
    /// Per-segment usage, in the order the segments were added.
    segments: Vec<SegmentSpaceUsage>,
    /// Running sum of the totals of all entries in `segments`.
    total: ByteCount,
}

impl SearcherSpaceUsage {
    pub(crate) fn new() -> SearcherSpaceUsage {
        SearcherSpaceUsage {
            segments: Vec::new(),
            total: Default::default(),
        }
    }

    /// Add a segment, to `self`.
    /// Performs no deduplication or other intelligence.
    pub(crate) fn add_segment(&mut self, segment: SegmentSpaceUsage) {
        self.total += segment.total();
        self.segments.push(segment);
    }

    /// Per segment space usage
    pub fn segments(&self) -> &[SegmentSpaceUsage] {
        &self.segments[..]
    }

    /// Returns total byte usage of this searcher, including all large subcomponents.
    /// Does not account for smaller things like `meta.json`.
    pub fn total(&self) -> ByteCount {
        self.total
    }
}

/// Represents combined space usage for all of the large components comprising a segment.
///
/// `total` is computed once at construction time as the sum of every
/// component below (including `store` and `deletes`).
#[derive(Clone, Debug, Serialize, Deserialize)]
pub struct SegmentSpaceUsage {
    /// Number of documents in the segment, as passed to the constructor.
    num_docs: u32,

    /// Per-field usage of the term dictionary.
    termdict: PerFieldSpaceUsage,
    /// Per-field usage of the postings lists.
    postings: PerFieldSpaceUsage,
    /// Per-field usage of the positions.
    positions: PerFieldSpaceUsage,
    /// Per-field usage of the fast fields.
    fast_fields: PerFieldSpaceUsage,
    /// Per-field usage of the field norms.
    fieldnorms: PerFieldSpaceUsage,

    /// Usage of the document store.
    store: StoreSpaceUsage,

    /// Bytes used to record document deletions.
    deletes: ByteCount,

    /// Sum of all of the above, cached at construction.
    total: ByteCount,
}

impl SegmentSpaceUsage {
    #[expect(clippy::too_many_arguments)]
    pub(crate) fn new(
        num_docs: u32,
        termdict: PerFieldSpaceUsage,
        postings: PerFieldSpaceUsage,
        positions: PerFieldSpaceUsage,
        fast_fields: PerFieldSpaceUsage,
        fieldnorms: PerFieldSpaceUsage,
        store: StoreSpaceUsage,
        deletes: ByteCount,
    ) -> SegmentSpaceUsage {
        let total = termdict.total()
            + postings.total()
            + positions.total()
            + fast_fields.total()
            + fieldnorms.total()
            + store.total()
            + deletes;
        SegmentSpaceUsage {
            num_docs,
            termdict,
            postings,
            positions,
            fast_fields,
            fieldnorms,
            store,
            deletes,
            total,
        }
    }

    /// Space usage for the given component
    ///
    /// Clones the underlying data.
    /// Use the components directly if this is somehow in performance critical code.
    pub fn component(&self, component: SegmentComponent) -> ComponentSpaceUsage {
        use self::ComponentSpaceUsage::*;
        use crate::index::SegmentComponent::*;
        match component {
            Postings => PerField(self.postings().clone()),
            Positions => PerField(self.positions().clone()),
            FastFields => PerField(self.fast_fields().clone()),
            FieldNorms => PerField(self.fieldnorms().clone()),
            Terms => PerField(self.termdict().clone()),
            SegmentComponent::Store => ComponentSpaceUsage::Store(self.store().clone()),
            Delete => Basic(self.deletes()),
        }
    }

    /// Num docs in segment
    pub fn num_docs(&self) -> u32 {
        self.num_docs
    }

    /// Space usage for term dictionary
    pub fn termdict(&self) -> &PerFieldSpaceUsage {
        &self.termdict
    }

    /// Space usage for postings list
    pub fn postings(&self) -> &PerFieldSpaceUsage {
        &self.postings
    }

    /// Space usage for positions
    pub fn positions(&self) -> &PerFieldSpaceUsage {
        &self.positions
    }

    /// Space usage for fast fields
    pub fn fast_fields(&self) -> &PerFieldSpaceUsage {
        &self.fast_fields
    }

    /// Space usage for field norms
    pub fn fieldnorms(&self) -> &PerFieldSpaceUsage {
        &self.fieldnorms
    }

    /// Space usage for stored documents
    pub fn store(&self) -> &StoreSpaceUsage {
        &self.store
    }

    /// Space usage for document deletions
    pub fn deletes(&self) -> ByteCount {
        self.deletes
    }

    /// Total space usage in bytes for this segment.
    pub fn total(&self) -> ByteCount {
        self.total
    }
}

/// Represents space usage for the Store for this segment.
///
/// This is composed of two parts.
/// `data` represents the compressed data itself.
/// `offsets` represents a lookup to find the start of a block
#[derive(Clone, Debug, Serialize, Deserialize)]
pub struct StoreSpaceUsage {
    /// Bytes used by the data part of the store.
    data: ByteCount,
    /// Bytes used by the offsets part of the store.
    offsets: ByteCount,
}

impl StoreSpaceUsage {
    pub(crate) fn new(data: ByteCount, offsets: ByteCount) -> StoreSpaceUsage {
        StoreSpaceUsage { data, offsets }
    }

    /// Space usage for the data part of the store
    pub fn data_usage(&self) -> ByteCount {
        self.data
    }

    /// Space usage for the offsets part of the store (doc ID -> offset)
    pub fn offsets_usage(&self) -> ByteCount {
        self.offsets
    }

    /// Total space usage in bytes for this Store
    pub fn total(&self) -> ByteCount {
        self.data + self.offsets
    }
}

/// Represents space usage for all of the (field, index) pairs that appear in a `CompositeFile`.
///
/// A field can appear with a single index (typically 0) or with multiple indexes.
/// Multiple indexes are used to handle variable length things.
#[derive(Clone, Debug, Serialize, Deserialize)]
pub struct PerFieldSpaceUsage {
    /// Usage of each field, keyed by field name.
    fields: BTreeMap<String, FieldUsage>,
    /// Sum of the totals of every `FieldUsage` passed to the constructor.
    total: ByteCount,
}

impl PerFieldSpaceUsage {
    /// Groups `fields` by field name and sums up their sizes.
    ///
    /// Entries sharing a field name are merged into one `FieldUsage`.
    pub(crate) fn new(fields: Vec<FieldUsage>) -> Self {
        let mut by_name: BTreeMap<String, FieldUsage> = BTreeMap::new();
        let mut total = ByteCount::default();
        for usage in fields {
            total += usage.total();
            match by_name.entry(usage.field_name().to_string()) {
                Entry::Occupied(mut slot) => slot.get_mut().merge(usage),
                Entry::Vacant(slot) => {
                    slot.insert(usage);
                }
            }
        }
        Self {
            fields: by_name,
            total,
        }
    }

    /// Per field space usage
    pub fn fields(&self) -> impl Iterator<Item = &FieldUsage> {
        self.fields.values()
    }

    /// Bytes used by the represented file
    pub fn total(&self) -> ByteCount {
        self.total
    }
}

/// Represents space usage of a given field, breaking it down into the (field, index) pairs that
/// comprise it.
///
/// See documentation for [`PerFieldSpaceUsage`] for slightly more information.
#[derive(Clone, Debug, Serialize, Deserialize)]
pub struct FieldUsage {
    /// Name of the field this usage belongs to.
    field_name: String,
    /// Total bytes attributed to the field: grows with every sub-index added,
    /// with the column usage when one is set, and when another usage is merged in.
    num_bytes: ByteCount,
    /// A field can be composed of more than one piece.
    /// These pieces are indexed by arbitrary numbers starting at zero.
    /// `self.num_bytes` includes all of `self.sub_num_bytes`.
    /// Indexes that were never recorded hold `None`.
    sub_num_bytes: Vec<Option<ByteCount>>,
    /// Space usage of the column for fast fields, if relevant.
    column_space_usage: Option<ColumnSpaceUsage>,
}

impl FieldUsage {
    pub(crate) fn empty(field_name: impl Into<String>) -> FieldUsage {
        FieldUsage {
            field_name: field_name.into(),
            num_bytes: Default::default(),
            sub_num_bytes: Vec::new(),
            column_space_usage: None,
        }
    }

    pub(crate) fn add_field_idx(&mut self, idx: usize, size: ByteCount) {
        if self.sub_num_bytes.len() < idx + 1 {
            self.sub_num_bytes.resize(idx + 1, None);
        }
        assert!(self.sub_num_bytes[idx].is_none());
        self.sub_num_bytes[idx] = Some(size);
        self.num_bytes += size
    }

    pub(crate) fn set_column_usage(&mut self, column_space_usage: ColumnSpaceUsage) {
        self.num_bytes += column_space_usage.total_num_bytes();
        self.column_space_usage = Some(column_space_usage);
    }

    /// Field
    pub fn field_name(&self) -> &str {
        &self.field_name
    }

    /// Space usage for each index
    pub fn sub_num_bytes(&self) -> &[Option<ByteCount>] {
        &self.sub_num_bytes[..]
    }

    /// Returns the number of bytes used by the column payload, if the field is columnar.
    pub fn column_num_bytes(&self) -> Option<ByteCount> {
        self.column_space_usage
            .as_ref()
            .map(ColumnSpaceUsage::column_num_bytes)
    }

    /// Returns the number of bytes used by the dictionary for dictionary-encoded columns.
    pub fn dictionary_num_bytes(&self) -> Option<ByteCount> {
        self.column_space_usage
            .as_ref()
            .and_then(ColumnSpaceUsage::dictionary_num_bytes)
    }

    /// Returns the space usage of the column, if any.
    pub fn column_space_usage(&self) -> Option<&ColumnSpaceUsage> {
        self.column_space_usage.as_ref()
    }

    /// Total bytes used for this field in this context
    pub fn total(&self) -> ByteCount {
        self.num_bytes
    }

    fn merge(&mut self, other: FieldUsage) {
        assert_eq!(self.field_name, other.field_name);
        self.num_bytes += other.num_bytes;
        if other.sub_num_bytes.len() > self.sub_num_bytes.len() {
            self.sub_num_bytes.resize(other.sub_num_bytes.len(), None);
        }
        for (idx, num_bytes_opt) in other.sub_num_bytes.into_iter().enumerate() {
            if let Some(num_bytes) = num_bytes_opt {
                match self.sub_num_bytes[idx] {
                    Some(existing) => self.sub_num_bytes[idx] = Some(existing + num_bytes),
                    None => self.sub_num_bytes[idx] = Some(num_bytes),
                }
            }
        }
        self.column_space_usage =
            merge_column_space_usage(self.column_space_usage.take(), other.column_space_usage);
    }
}

/// Combines two optional column usages.
///
/// When both sides are present they are merged; when only one is present it
/// is returned unchanged; `None` is returned only if both are absent.
fn merge_column_space_usage(
    left: Option<ColumnSpaceUsage>,
    right: Option<ColumnSpaceUsage>,
) -> Option<ColumnSpaceUsage> {
    let Some(lhs) = left else {
        return right;
    };
    Some(match right {
        Some(rhs) => lhs.merge(&rhs),
        None => lhs,
    })
}

#[cfg(test)]
mod test {
    use crate::index::Index;
    use crate::schema::{Schema, FAST, INDEXED, STORED, TEXT};
    use crate::space_usage::PerFieldSpaceUsage;
    use crate::{IndexWriter, Term};

    /// Documents indexed by the text-based tests.
    const SAMPLE_TEXTS: [&str; 4] = [
        "hi",
        "this is a test",
        "some more documents with some word overlap with the other test",
        "hello hi goodbye",
    ];

    #[test]
    fn test_empty() {
        // An index without any segment reports zero bytes.
        let index = Index::create_in_ram(Schema::builder().build());
        let reader = index.reader().unwrap();
        let usage = reader.searcher().space_usage().unwrap();
        assert_eq!(usage.total(), 0u64);
    }

    /// Asserts that `field_space` holds exactly one field named `field`, that this
    /// field accounts for the whole total, and that the total lies within
    /// `min_size..=max_size`.
    fn expect_single_field(
        field_space: &PerFieldSpaceUsage,
        field: &str,
        min_size: u64,
        max_size: u64,
    ) {
        let total = field_space.total();
        assert!(total >= min_size);
        assert!(total <= max_size);

        let reported: Vec<_> = field_space
            .fields()
            .map(|usage| (usage.field_name().to_string(), usage.total()))
            .collect();
        assert_eq!(vec![(field.to_string(), total)], reported);
    }

    #[test]
    fn test_fast_indexed() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let name = schema_builder.add_u64_field("name", FAST | INDEXED);
        let schema = schema_builder.build();
        let field_name = schema.get_field_name(name).to_string();
        let index = Index::create_in_ram(schema);

        {
            let mut writer = index.writer_for_tests()?;
            for value in [1u64, 2u64, 10u64, 20u64] {
                writer.add_document(doc!(name => value))?;
            }
            writer.commit()?;
        }

        let reader = index.reader()?;
        let usage = reader.searcher().space_usage()?;
        assert!(usage.total() > 0);
        assert_eq!(1, usage.segments().len());

        let segment = &usage.segments()[0];
        assert!(segment.total() > 0);

        assert_eq!(4, segment.num_docs());

        // Indexed + fast u64: everything but positions is populated.
        expect_single_field(segment.termdict(), &field_name, 1, 512);
        expect_single_field(segment.postings(), &field_name, 1, 512);
        assert_eq!(segment.positions().total(), 0);
        expect_single_field(segment.fast_fields(), &field_name, 1, 512);
        expect_single_field(segment.fieldnorms(), &field_name, 1, 512);
        // TODO: understand why the following fails
        //        assert_eq!(0, segment.store().total());
        assert_eq!(segment.deletes(), 0);
        Ok(())
    }

    #[test]
    fn test_text() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let name = schema_builder.add_text_field("name", TEXT);
        let schema = schema_builder.build();
        let field_name = schema.get_field_name(name).to_string();
        let index = Index::create_in_ram(schema);

        {
            let mut writer = index.writer_for_tests()?;
            for text in SAMPLE_TEXTS {
                writer.add_document(doc!(name => text))?;
            }
            writer.commit()?;
        }

        let reader = index.reader()?;
        let usage = reader.searcher().space_usage()?;
        assert!(usage.total() > 0);
        assert_eq!(1, usage.segments().len());

        let segment = &usage.segments()[0];
        assert!(segment.total() > 0);

        assert_eq!(4, segment.num_docs());

        // Indexed text: positions are populated, fast fields are not.
        expect_single_field(segment.termdict(), &field_name, 1, 512);
        expect_single_field(segment.postings(), &field_name, 1, 512);
        expect_single_field(segment.positions(), &field_name, 1, 512);
        assert_eq!(segment.fast_fields().total(), 0);
        expect_single_field(segment.fieldnorms(), &field_name, 1, 512);
        // TODO: understand why the following fails
        //        assert_eq!(0, segment.store().total());
        assert_eq!(segment.deletes(), 0);
        Ok(())
    }

    #[test]
    fn test_store() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let name = schema_builder.add_text_field("name", STORED);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);

        {
            let mut writer = index.writer_for_tests()?;
            for text in SAMPLE_TEXTS {
                writer.add_document(doc!(name => text))?;
            }
            writer.commit()?;
        }
        let reader = index.reader()?;
        let usage = reader.searcher().space_usage()?;
        assert!(usage.total() > 0);
        assert_eq!(1, usage.segments().len());

        let segment = &usage.segments()[0];
        assert!(segment.total() > 0);

        assert_eq!(4, segment.num_docs());

        // A stored-only field leaves every per-field component empty...
        let per_field_components = [
            segment.termdict(),
            segment.postings(),
            segment.positions(),
            segment.fast_fields(),
            segment.fieldnorms(),
        ];
        for per_field in per_field_components {
            assert_eq!(per_field.total(), 0);
            assert!(per_field.fields().next().is_none());
        }
        // ...and only the doc store takes up space.
        let store_total = segment.store().total();
        assert!(store_total > 0);
        assert!(store_total < 512);
        assert_eq!(segment.deletes(), 0);
        Ok(())
    }

    #[test]
    fn test_deletes() -> crate::Result<()> {
        let mut schema_builder = Schema::builder();
        let name = schema_builder.add_u64_field("name", INDEXED);
        let schema = schema_builder.build();
        let field_name = schema.get_field_name(name).to_string();
        let index = Index::create_in_ram(schema);

        {
            let mut writer: IndexWriter = index.writer_for_tests()?;
            for value in 1u64..=4u64 {
                writer.add_document(doc!(name => value))?;
            }
            writer.commit()?;
        }

        {
            let mut deleting_writer: IndexWriter = index.writer(50_000_000)?;
            for value in [2u64, 3u64] {
                deleting_writer.delete_term(Term::from_field_u64(name, value));
            }
            // ok, now we should have a deleted doc
            deleting_writer.commit()?;
        }

        let reader = index.reader()?;
        let usage = reader.searcher().space_usage()?;
        assert!(usage.total() > 0);
        assert_eq!(1, usage.segments().len());

        let segment = &usage.segments()[0];
        assert!(segment.total() > 0);

        // Two of the four documents were deleted.
        assert_eq!(2, segment.num_docs());

        expect_single_field(segment.termdict(), &field_name, 1, 512);
        expect_single_field(segment.postings(), &field_name, 1, 512);
        assert_eq!(segment.positions().total(), 0u64);
        assert_eq!(segment.fast_fields().total(), 0u64);
        expect_single_field(segment.fieldnorms(), &field_name, 1, 512);
        assert!(segment.deletes() > 0);
        Ok(())
    }
}


================================================
FILE: src/store/compression_lz4_block.rs
================================================
use std::io::{self};
use std::mem;

use lz4_flex::{compress_into, decompress_into};

#[inline]
#[expect(clippy::uninit_vec)]
pub fn compress(uncompressed: &[u8], compressed: &mut Vec<u8>) -> io::Result<()> {
    compressed.clear();
    let maximum_output_size =
        mem::size_of::<u32>() + lz4_flex::block::get_maximum_output_size(uncompressed.len());
    compressed.reserve(maximum_output_size);
    unsafe {
        compressed.set_len(maximum_output_size);
    }
    let bytes_written = compress_into(uncompressed, &mut compressed[4..])
        .map_err(|err| io::Error::new(io::ErrorKind::InvalidData, err.to_string()))?;
    let num_bytes = uncompressed.len() as u32;
    compressed[0..4].copy_from_slice(&num_bytes.to_le_bytes());
    unsafe {
        compressed.set_len(bytes_written + mem::size_of::<u32>());
    }
    Ok(())
}

/// Decompresses a block produced by [`compress`] into `decompressed`.
///
/// `compressed` must start with the 4-byte little-endian uncompressed length,
/// followed by the lz4 block payload. Any previous content of `decompressed`
/// is discarded.
///
/// # Errors
///
/// Returns `InvalidData` if the header is missing, if lz4 fails to decode the
/// payload, or if the decoded size does not match the header. On error
/// `decompressed` is left empty.
#[inline]
#[expect(clippy::uninit_vec)]
pub fn decompress(compressed: &[u8], decompressed: &mut Vec<u8>) -> io::Result<()> {
    decompressed.clear();
    let uncompressed_size_bytes: &[u8; 4] = compressed
        .get(..4)
        .ok_or(io::ErrorKind::InvalidData)?
        .try_into()
        .unwrap();
    let uncompressed_size = u32::from_le_bytes(*uncompressed_size_bytes) as usize;
    decompressed.reserve(uncompressed_size);
    // SAFETY: the vec is empty and `reserve` guarantees a capacity of at
    // least `uncompressed_size`. The exposed bytes are uninitialized; every
    // path below either confirms that all of them were written or resets the
    // length to zero before returning.
    unsafe {
        decompressed.set_len(uncompressed_size);
    }
    match decompress_into(&compressed[4..], decompressed) {
        Ok(bytes_written) if bytes_written == uncompressed_size => Ok(()),
        Ok(_) => {
            // Part of the buffer was never written: do not expose it.
            decompressed.clear();
            Err(io::Error::new(
                io::ErrorKind::InvalidData,
                "doc store block not completely decompressed, data corruption".to_string(),
            ))
        }
        Err(err) => {
            decompressed.clear();
            Err(io::Error::new(io::ErrorKind::InvalidData, err.to_string()))
        }
    }
}


================================================
FILE: src/store/compression_zstd_block.rs
================================================
use std::io;

use zstd::bulk::{compress_to_buffer, decompress_to_buffer};
use zstd::DEFAULT_COMPRESSION_LEVEL;

#[inline]
pub fn compress(
    uncompressed: &[u8],
    compressed: &mut Vec<u8>,
    compression_level: Option<i32>,
) -> io::Result<()> {
    let count_size = std::mem::size_of::<u32>();
    let max_size = zstd::zstd_safe::compress_bound(uncompressed.len()) + count_size;

    compressed.clear();
    compressed.resize(max_size, 0);

    let compressed_size = compress_to_buffer(
        uncompressed,
        &mut compressed[count_size..],
        compression_level.unwrap_or(DEFAULT_COMPRESSION_LEVEL),
    )?;

    compressed[0..count_size].copy_from_slice(&(uncompressed.len() as u32).to_le_bytes());
    compressed.resize(compressed_size + count_size, 0);

    Ok(())
}

/// Decompresses a block produced by [`compress`] into `decompressed`.
///
/// `compressed` must start with the 4-byte little-endian uncompressed length,
/// followed by the zstd payload.
///
/// # Errors
///
/// Returns `InvalidData` if the header is missing or if the decoded size does
/// not match the header, and forwards any error reported by zstd.
#[inline]
pub fn decompress(compressed: &[u8], decompressed: &mut Vec<u8>) -> io::Result<()> {
    let count_size = std::mem::size_of::<u32>();

    // Read the length prefix before touching the output buffer.
    let header: [u8; 4] = compressed
        .get(..count_size)
        .ok_or(io::ErrorKind::InvalidData)?
        .try_into()
        .unwrap();
    let expected_len = u32::from_le_bytes(header) as usize;

    decompressed.clear();
    decompressed.resize(expected_len, 0);

    let actual_len = decompress_to_buffer(&compressed[count_size..], decompressed)?;
    if actual_len == expected_len {
        return Ok(());
    }
    Err(io::Error::new(
        io::ErrorKind::InvalidData,
        "doc store block not completely decompressed, data corruption".to_string(),
    ))
}


================================================
FILE: src/store/compressors.rs
================================================
use std::io;

use serde::{Deserialize, Deserializer, Serialize};

/// Compressor can be used on `IndexSettings` to choose
/// the compressor used to compress the doc store.
///
/// The default is Lz4Block, but also depends on the enabled feature flags.
///
/// The `Lz4` and `Zstd` variants only exist when the `lz4-compression` and
/// `zstd-compression` features, respectively, are enabled.
#[derive(Clone, Debug, Copy, PartialEq, Eq)]
pub enum Compressor {
    /// No compression
    None,
    /// Use the lz4 compressor (block format)
    #[cfg(feature = "lz4-compression")]
    Lz4,
    /// Use the zstd compressor
    #[cfg(feature = "zstd-compression")]
    Zstd(ZstdCompressor),
}

/// Serializes the compressor as a plain string: `"none"`, `"lz4"`, or the
/// zstd textual form produced by `ZstdCompressor::ser_to_string`.
impl Serialize for Compressor {
    fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
    where S: serde::Serializer {
        match self {
            Self::None => serializer.serialize_str("none"),
            #[cfg(feature = "lz4-compression")]
            Self::Lz4 => serializer.serialize_str("lz4"),
            #[cfg(feature = "zstd-compression")]
            Self::Zstd(zstd) => {
                let encoded = zstd.ser_to_string();
                serializer.serialize_str(&encoded)
            }
        }
    }
}

impl<'de> Deserialize<'de> for Compressor {
    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
    where D: Deserializer<'de> {
        let buf = String::deserialize(deserializer)?;
        let compressor = match buf.as_str() {
            "none" => Compressor::None,
            #[cfg(feature = "lz4-compression")]
            "lz4" => Compressor::Lz4,
            #[cfg(not(feature = "lz4-compression"))]
            "lz4" => {
                return Err(serde::de::Error::custom(
                    "unsupported variant `lz4`, please enable Tantivy's `lz4-compression` feature",
                ))
            }
            #[cfg(feature = "zstd-compression")]
            _ if buf.starts_with("zstd") => Compressor::Zstd(
                ZstdCompressor::deser_from_str(&buf).map_err(serde::de::Error::custom)?,
            ),
            #[cfg(not(feature = "zstd-compression"))]
            _ if buf.starts_with("zstd") => {
                return Err(serde::de::Error::custom(
                    "unsupported variant `zstd`, please enable Tantivy's `zstd-compression` \
                     feature",
                ))
            }
            _ => {
                return Err(serde::de::Error::unknown_variant(
                    &buf,
                    &[
                        "none",
                        #[cfg(feature = "lz4-compression")]
                        "lz4",
                        #[cfg(feature = "zstd-compression")]
                        "zstd",
                        #[cfg(feature = "zstd-compression")]
                        "zstd(compression_level=5)",
                    ],
                ));
            }
        };

        Ok(compressor)
    }
}

#[derive(Clone, Default, Debug, Copy, PartialEq, Eq, Serialize, Deserialize)]
/// The Zstd compressor, with optional compression level.
///
/// The default value leaves the compression level unset.
pub struct ZstdCompressor {
    /// The compression level, if unset defaults to zstd::DEFAULT_COMPRESSION_LEVEL = 3
    pub compression_level: Option<i32>,
}

#[cfg(feature = "zstd-compression")]
impl ZstdCompressor {
    /// Parses the textual form of a zstd compressor.
    ///
    /// Accepted inputs are the bare name `zstd` (all defaults) and
    /// `zstd(name=value,...)`, where the only known option is
    /// `compression_level` with an `i32` value.
    ///
    /// # Errors
    ///
    /// Returns a human readable message if the input does not start with
    /// `zstd`, if the option list cannot be extracted, if an option has no
    /// `=`, if its name is unknown, or if its value is not a valid `i32`.
    fn deser_from_str(val: &str) -> Result<ZstdCompressor, String> {
        if !val.starts_with("zstd") {
            return Err(format!("needs to start with zstd, but got {val}"));
        }
        if val == "zstd" {
            return Ok(ZstdCompressor::default());
        }
        // Drop the `zstd` prefix plus one delimiter on each side. `get` is
        // used instead of indexing so that inputs that are too short (e.g.
        // `zstdx`) or that do not fall on a character boundary yield an error
        // rather than a panic.
        let options = val
            .get("zstd".len() + 1..val.len() - 1)
            .ok_or_else(|| format!("malformed zstd options in {val:?}"))?;

        let mut compressor = ZstdCompressor::default();
        for option in options.split(',') {
            // Split the current option, not the whole option list.
            let (opt_name, value) = option
                .split_once('=')
                .ok_or_else(|| format!("no '=' found in option {option:?}"))?;

            match opt_name {
                "compression_level" => {
                    let value = value.parse::<i32>().map_err(|err| {
                        format!("Could not parse value {value} of option {opt_name}, e: {err}")
                    })?;
                    if value >= 15 {
                        warn!(
                            "High zstd compression level detected: {:?}. High compression levels \
                             (>=15) are slow and will limit indexing speed.",
                            value
                        )
                    }
                    compressor.compression_level = Some(value);
                }
                _ => {
                    return Err(format!("unknown zstd option {opt_name:?}"));
                }
            }
        }
        Ok(compressor)
    }

    /// Renders the compressor in the form accepted by `deser_from_str`:
    /// `zstd(compression_level=N)` when a level is set, `zstd` otherwise.
    fn ser_to_string(&self) -> String {
        match self.compression_level {
            Some(compression_level) => format!("zstd(compression_level={compression_level})"),
            None => "zstd".to_string(),
        }
    }
}

/// Picks the default compressor from the enabled features: lz4 if available,
/// otherwise zstd with default settings, otherwise no compression.
impl Default for Compressor {
    // With more than one compression feature enabled, the statements after
    // the first `return` are unreachable by design.
    #[allow(unreachable_code)]
    fn default() -> Self {
        // First choice: lz4.
        #[cfg(feature = "lz4-compression")]
        return Compressor::Lz4;

        // Second choice: zstd with its default settings.
        #[cfg(feature = "zstd-compression")]
        return Compressor::Zstd(ZstdCompressor::default());

        // Fallback when no compression feature is compiled in.
        Compressor::None
    }
}

impl Compressor {
    #[inline]
    pub(crate) fn compress_into(
        &self,
        uncompressed: &[u8],
        compressed: &mut Vec<u8>,
    ) -> io::Result<()> {
        match self {
            Self::None => {
                compressed.clear();
                compressed.extend_from_slice(uncompressed);
                Ok(())
            }
            #[cfg(feature = "lz4-compression")]
            Self::Lz4 => super::compression_lz4_block::compress(uncompressed, compressed),
            #[cfg(feature = "zstd-compression")]
            Self::Zstd(_zstd_compressor) => super::compression_zstd_block::compress(
                uncompressed,
                compressed,
                _zstd_compressor.compression_level,
            ),
        }
    }
}

// Tests for the textual (de)serialization of `ZstdCompressor`; only built when
// the `zstd-compression` feature is enabled.
#[cfg(all(feature = "zstd-compression", test))]
mod tests {
    use super::*;

    /// Serializing and then deserializing yields the original settings, both
    /// with an explicit compression level and with the defaults.
    #[test]
    fn zstd_serde_roundtrip() {
        let compressor = ZstdCompressor {
            compression_level: Some(15),
        };

        assert_eq!(
            ZstdCompressor::deser_from_str(&compressor.ser_to_string()).unwrap(),
            compressor
        );

        assert_eq!(
            ZstdCompressor::deser_from_str(&ZstdCompressor::default().ser_to_string()).unwrap(),
            ZstdCompressor::default()
        );
    }

    /// Checks accepted inputs as well as the exact error message of each
    /// rejection path of `deser_from_str`.
    #[test]
    fn deser_zstd_test() {
        // Bare name: default settings.
        assert_eq!(
            ZstdCompressor::deser_from_str("zstd").unwrap(),
            ZstdCompressor::default()
        );

        // Wrong prefix.
        assert!(ZstdCompressor::deser_from_str("zzstd").is_err());
        assert!(ZstdCompressor::deser_from_str("zzstd()").is_err());
        // Well-formed option.
        assert_eq!(
            ZstdCompressor::deser_from_str("zstd(compression_level=15)").unwrap(),
            ZstdCompressor {
                compression_level: Some(15)
            }
        );
        // Misspelled option name.
        assert_eq!(
            ZstdCompressor::deser_from_str("zstd(compresion_level=15)").unwrap_err(),
            "unknown zstd option \"compresion_level\""
        );
        // Missing '=' separator.
        assert_eq!(
            ZstdCompressor::deser_from_str("zstd(compression_level->2)").unwrap_err(),
            "no '=' found in option \"compression_level->2\""
        );
        // Value that is not an integer.
        assert_eq!(
            ZstdCompressor::deser_from_str("zstd(compression_level=over9000)").unwrap_err(),
            "Could not parse value over9000 of option compression_level, e: invalid digit found \
             in string"
        );
    }
}


================================================
FILE: src/store/decompressors.rs
================================================
use std::io;

use serde::{Deserialize, Serialize};

use super::Compressor;

/// Decompressor is deserialized from the doc store footer, when opening an index.
///
/// Each variant mirrors a `Compressor` variant (see the `From<Compressor>`
/// conversion) and is stored in the footer as a one-byte id: `0` for `None`,
/// `1` for `Lz4` and `4` for `Zstd`. The `Lz4` and `Zstd` variants only exist
/// when the matching cargo feature is enabled.
#[derive(Clone, Debug, Copy, PartialEq, Eq, Serialize, Deserialize)]
pub enum Decompressor {
    /// No compression
    None,
    /// Use the lz4 decompressor (block format)
    #[cfg(feature = "lz4-compression")]
    Lz4,
    /// Use the zstd decompressor
    #[cfg(feature = "zstd-compression")]
    Zstd,
}

/// Maps a compressor to the decompressor able to read back its output.
///
/// Compressor-side settings (such as the zstd options) are dropped: they are
/// not part of the decompressor.
impl From<Compressor> for Decompressor {
    fn from(compressor: Compressor) -> Self {
        match compressor {
            Compressor::None => Self::None,
            #[cfg(feature = "lz4-compression")]
            Compressor::Lz4 => Self::Lz4,
            #[cfg(feature = "zstd-compression")]
            Compressor::Zstd(_) => Self::Zstd,
        }
    }
}

impl Decompressor {
    /// Returns the decompressor registered under the one-byte `id`.
    ///
    /// # Panics
    ///
    /// Panics when `id` does not match any decompressor compiled into this
    /// build (unknown id, or the corresponding cargo feature is disabled).
    pub(crate) fn from_id(id: u8) -> Decompressor {
        match id {
            0 => Self::None,
            #[cfg(feature = "lz4-compression")]
            1 => Self::Lz4,
            #[cfg(feature = "zstd-compression")]
            4 => Self::Zstd,
            _ => panic!("unknown compressor id {id:?}"),
        }
    }

    /// Returns the one-byte id of this decompressor; inverse of
    /// [`Decompressor::from_id`].
    pub(crate) fn get_id(&self) -> u8 {
        match *self {
            Decompressor::None => 0,
            #[cfg(feature = "lz4-compression")]
            Decompressor::Lz4 => 1,
            #[cfg(feature = "zstd-compression")]
            Decompressor::Zstd => 4,
        }
    }

    /// Decompresses `compressed_block` into a freshly allocated buffer.
    pub(crate) fn decompress(&self, compressed_block: &[u8]) -> io::Result<Vec<u8>> {
        let mut output = Vec::new();
        let outcome = self.decompress_into(compressed_block, &mut output);
        outcome.map(|()| output)
    }

    /// Decompresses `compressed` into the caller-provided `decompressed` buffer.
    ///
    /// For [`Decompressor::None`] the buffer is emptied and then filled with a
    /// verbatim copy of the input. The other variants delegate to the
    /// feature-gated lz4 / zstd block modules.
    #[inline]
    pub(crate) fn decompress_into(
        &self,
        compressed: &[u8],
        decompressed: &mut Vec<u8>,
    ) -> io::Result<()> {
        match self {
            Decompressor::None => {
                // Stored uncompressed: replace any previous content with a copy.
                decompressed.clear();
                decompressed.extend_from_slice(compressed);
                Ok(())
            }
            #[cfg(feature = "lz4-compression")]
            Decompressor::Lz4 => super::compression_lz4_block::decompress(compressed, decompressed),
            #[cfg(feature = "zstd-compression")]
            Decompressor::Zstd => {
                super::compression_zstd_block::decompress(compressed, decompressed)
            }
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Every compressor variant available in this build converts to the
    /// decompressor variant of the same name.
    #[test]
    fn compressor_decompressor_id_test() {
        assert_eq!(Decompressor::from(Compressor::None), Decompressor::None);
        #[cfg(feature = "lz4-compression")]
        assert_eq!(Decompressor::from(Compressor::Lz4), Decompressor::Lz4);
        #[cfg(feature = "zstd-compression")]
        assert_eq!(
            Decompressor::from(Compressor::Zstd(Default::default())),
            Decompressor::Zstd
        );
    }
}


================================================
FILE: src/store/footer.rs
================================================
use std::io;

use common::{BinarySerializable, FixedSize, HasLen};

use super::{Decompressor, DocStoreVersion, DOC_STORE_VERSION};
use crate::directory::FileSlice;

/// Fixed-size trailer of a doc store file.
///
/// It is read from the last `SIZE_IN_BYTES` bytes of the file by
/// `DocStoreFooter::extract_footer`.
#[derive(Debug, Clone, PartialEq)]
pub struct DocStoreFooter {
    /// Offset stored in the footer.
    // NOTE(review): presumably the position of the skip index within the
    // file; its consumer is not visible here, confirm against the reader.
    pub offset: u64,
    /// Format version read from the footer.
    pub doc_store_version: DocStoreVersion,
    /// Decompressor to use for the blocks of this store.
    pub decompressor: Decompressor,
}

/// Serialises the footer to a byte-array, in this order:
/// - doc store version (encoded by `DocStoreVersion`'s own serialization)
/// - offset: 8 bytes
/// - compressor id: 1 byte
/// - reserved for future use: 15 bytes
impl BinarySerializable for DocStoreFooter {
    /// Writes the footer.
    ///
    /// The version written is always the current `DOC_STORE_VERSION`, not the
    /// `doc_store_version` field of `self`.
    fn serialize<W: io::Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        BinarySerializable::serialize(&DOC_STORE_VERSION, writer)?;
        BinarySerializable::serialize(&self.offset, writer)?;
        BinarySerializable::serialize(&self.decompressor.get_id(), writer)?;
        // Reserved bytes, always zero on write.
        writer.write_all(&[0; 15])?;
        Ok(())
    }

    /// Reads a footer previously written by `serialize`.
    ///
    /// # Errors
    ///
    /// Returns an `InvalidData` error when the stored version is newer than
    /// the `DOC_STORE_VERSION` supported by this build, and forwards any I/O
    /// error of the underlying reader.
    ///
    /// # Panics
    ///
    /// Panics when the compressor id is unknown to this build (see
    /// `Decompressor::from_id`).
    fn deserialize<R: io::Read>(reader: &mut R) -> io::Result<Self> {
        let doc_store_version = DocStoreVersion::deserialize(reader)?;
        if doc_store_version > DOC_STORE_VERSION {
            // The footer comes from disk: an unsupported version is a data
            // problem to report to the caller, not a broken invariant.
            return Err(io::Error::new(
                io::ErrorKind::InvalidData,
                format!(
                    "actual doc store version: {doc_store_version}, max_supported: \
                     {DOC_STORE_VERSION}"
                ),
            ));
        }
        let offset = u64::deserialize(reader)?;
        let compressor_id = u8::deserialize(reader)?;
        // Consume the reserved bytes; their content is ignored.
        let mut skip_buf = [0; 15];
        reader.read_exact(&mut skip_buf)?;
        Ok(DocStoreFooter {
            offset,
            doc_store_version,
            decompressor: Decompressor::from_id(compressor_id),
        })
    }
}

/// Size of the serialized footer.
impl FixedSize for DocStoreFooter {
    // The 8-byte offset, 1-byte compressor id and 15 reserved bytes account
    // for 24 bytes; the remaining 4 are presumably the serialized
    // `DocStoreVersion` — TODO confirm against its `BinarySerializable` impl.
    const SIZE_IN_BYTES: usize = 28;
}

impl DocStoreFooter {
    /// Builds a footer from its three components.
    pub fn new(
        offset: u64,
        decompressor: Decompressor,
        doc_store_version: DocStoreVersion,
    ) -> Self {
        Self {
            offset,
            doc_store_version,
            decompressor,
        }
    }

    /// Splits `file` into its parsed footer and the remaining body.
    ///
    /// The footer is decoded from the last `SIZE_IN_BYTES` bytes of the file;
    /// everything before it is returned as the second tuple element.
    ///
    /// # Errors
    ///
    /// Returns an `UnexpectedEof` error when the file is too short to contain
    /// a footer, and forwards any error raised while reading or decoding it.
    pub fn extract_footer(file: FileSlice) -> io::Result<(DocStoreFooter, FileSlice)> {
        let file_len = file.len();
        if file_len < Self::SIZE_IN_BYTES {
            let message = format!(
                "File corrupted. The file is smaller than Footer::SIZE_IN_BYTES (len={}).",
                file_len
            );
            return Err(io::Error::new(io::ErrorKind::UnexpectedEof, message));
        }
        let (body, footer_slice) = file.split_from_end(Self::SIZE_IN_BYTES);
        let mut footer_bytes = footer_slice.read_bytes()?;
        DocStoreFooter::deserialize(&mut footer_bytes).map(|footer| (footer, body))
    }
}

/// Pins the in-memory size of `DocStoreFooter` so that adding or changing a
/// field does not go unnoticed.
#[test]
fn doc_store_footer_test() {
    // This test is just a safeguard against changes to the footer.
    // When the doc store footer is updated, make sure to also update the
    // serialize/deserialize methods.
    assert_eq!(core::mem::size_of::<DocStoreFooter>(), 16);
}


================================================
FILE: src/store/index/block.rs
================================================
use std::io;
use std::ops::Range;

use common::{read_u32_vint, VInt};

use crate::store::index::{Checkpoint, CHECKPOINT_PERIOD};
use crate::DocId;

/// A run of consecutive checkpoints that is (de)serialized as one unit.
///
/// The doc store index groups its checkpoints into blocks, both for code
/// readability and so that they can be delta-encoded compactly.
///
/// A block may hold any number of checkpoints.
pub struct CheckpointBlock {
    pub checkpoints: Vec<Checkpoint>,
}

impl Default for CheckpointBlock {
    /// Creates an empty block with room for `2 * CHECKPOINT_PERIOD` checkpoints.
    fn default() -> CheckpointBlock {
        let checkpoints = Vec::with_capacity(2 * CHECKPOINT_PERIOD);
        CheckpointBlock { checkpoints }
    }
}

impl CheckpointBlock {
    /// Returns the semi-open doc interval `[start_doc, end_doc)` covered by the
    /// whole block, or `None` when the block is empty.
    pub fn doc_interval(&self) -> Option<Range<DocId>> {
        let first = self.checkpoints.first()?;
        let last = self.checkpoints.last()?;
        Some(first.doc_range.start..last.doc_range.end)
    }

    /// Appends a checkpoint to the block.
    ///
    /// # Panics
    ///
    /// Panics if the block is non-empty and `checkpoint` does not directly
    /// follow the last checkpoint already stored.
    pub fn push(&mut self, checkpoint: Checkpoint) {
        if let Some(prev_checkpoint) = self.checkpoints.last() {
            assert!(checkpoint.follows(prev_checkpoint));
        }
        self.checkpoints.push(checkpoint);
    }

    /// Number of checkpoints currently held by the block.
    pub fn len(&self) -> usize {
        self.checkpoints.len()
    }

    /// Returns a copy of the checkpoint at position `idx`.
    ///
    /// # Panics
    ///
    /// Panics if `idx` is out of bounds.
    pub fn get(&self, idx: usize) -> Checkpoint {
        self.checkpoints[idx].clone()
    }

    /// Removes every checkpoint from the block.
    pub fn clear(&mut self) {
        self.checkpoints.clear();
    }

    /// Appends the encoded block to `buffer`.
    ///
    /// Layout, all values being vints: the number of checkpoints, then (only
    /// for a non-empty block) the first doc id and first byte offset, followed
    /// by one `(number of docs, number of bytes)` pair per checkpoint.
    pub fn serialize(&mut self, buffer: &mut Vec<u8>) {
        VInt(self.checkpoints.len() as u64).serialize_into_vec(buffer);
        if let Some(first) = self.checkpoints.first() {
            // Absolute starting point; everything after it is stored as lengths.
            VInt(first.doc_range.start as u64).serialize_into_vec(buffer);
            VInt(first.byte_range.start as u64).serialize_into_vec(buffer);
            for checkpoint in self.checkpoints.iter() {
                let num_docs = checkpoint.doc_range.end - checkpoint.doc_range.start;
                VInt(num_docs as u64).serialize_into_vec(buffer);
                let num_bytes = checkpoint.byte_range.end - checkpoint.byte_range.start;
                VInt(num_bytes as u64).serialize_into_vec(buffer);
            }
        }
    }

    /// Replaces the content of the block with the block decoded from the front
    /// of `data`, advancing `data` past the bytes consumed.
    ///
    /// # Errors
    ///
    /// Returns an `UnexpectedEof` error when `data` is empty, and forwards the
    /// error of the vint decoder for the starting byte offset.
    pub fn deserialize(&mut self, data: &mut &[u8]) -> io::Result<()> {
        if data.is_empty() {
            return Err(io::Error::new(io::ErrorKind::UnexpectedEof, ""));
        }
        self.checkpoints.clear();
        let num_checkpoints = read_u32_vint(data);
        if num_checkpoints == 0 {
            // An empty block carries no starting doc / offset.
            return Ok(());
        }
        let mut doc_start = read_u32_vint(data);
        let mut byte_start = VInt::deserialize_u64(data)? as usize;
        for _ in 0..num_checkpoints {
            let num_docs = read_u32_vint(data);
            let block_num_bytes = read_u32_vint(data) as usize;
            // Rebuild the absolute ranges from the running totals.
            let doc_end = doc_start + num_docs;
            let byte_end = byte_start + block_num_bytes;
            self.checkpoints.push(Checkpoint {
                doc_range: doc_start..doc_end,
                byte_range: byte_start..byte_end,
            });
            doc_start = doc_end;
            byte_start = byte_end;
        }
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use std::io;

    use crate::store::index::block::CheckpointBlock;
    use crate::store::index::Checkpoint;
    use crate::DocId;

    /// Serializes `checkpoints` as one block, deserializes it into a block
    /// that already holds a stale checkpoint, and checks that the input was
    /// fully consumed and the original checkpoints are recovered.
    fn test_aux_ser_deser(checkpoints: &[Checkpoint]) -> io::Result<()> {
        let mut block = CheckpointBlock::default();
        for checkpoint in checkpoints {
            block.push(checkpoint.clone());
        }
        let mut buffer = Vec::new();
        block.serialize(&mut buffer);
        let mut block_deser = CheckpointBlock::default();
        let checkpoint = Checkpoint {
            doc_range: 0..1,
            byte_range: 2..3,
        };
        block_deser.push(checkpoint); // < check that value is erased before deser
        let mut data = &buffer[..];
        block_deser.deserialize(&mut data)?;
        assert!(data.is_empty());
        assert_eq!(checkpoints, &block_deser.checkpoints[..]);
        Ok(())
    }

    /// An empty block round-trips.
    #[test]
    fn test_block_serialize_empty() -> io::Result<()> {
        test_aux_ser_deser(&[])
    }

    /// A single checkpoint round-trips.
    #[test]
    fn test_block_serialize_simple() -> io::Result<()> {
        let checkpoints = vec![Checkpoint {
            doc_range: 10..12,
            byte_range: 100..120,
        }];
        test_aux_ser_deser(&checkpoints)
    }

    /// Byte offsets that do not fit in 32 bits round-trip.
    #[test]
    fn test_block_serialize_large_byte_range() -> io::Result<()> {
        let checkpoints = vec![Checkpoint {
            doc_range: 10..12,
            byte_range: 8_000_000_000..9_000_000_000,
        }];
        test_aux_ser_deser(&checkpoints)
    }

    /// Ten contiguous checkpoints of varying sizes round-trip.
    #[test]
    fn test_block_serialize() -> io::Result<()> {
        // Cubes as byte offsets, squares as doc boundaries: both increasing,
        // with a different length for every checkpoint.
        let offsets: Vec<usize> = (0..11).map(|i| i * i * i).collect();
        let mut checkpoints = vec![];
        let mut start_doc = 0;
        for i in 0..10 {
            let end_doc = (i * i) as DocId;
            checkpoints.push(Checkpoint {
                doc_range: start_doc..end_doc,
                byte_range: offsets[i]..offsets[i + 1],
            });
            start_doc = end_doc;
        }
        test_aux_ser_deser(&checkpoints)
    }
}


================================================
FILE: src/store/index/mod.rs
================================================
/// Number of checkpoints a skip index layer accumulates in its current block
/// before the block is flushed and summarized in the layer above.
const CHECKPOINT_PERIOD: usize = 8;

use std::fmt;
use std::ops::Range;
mod block;
mod skip_index;
mod skip_index_builder;

pub use self::skip_index::SkipIndex;
pub use self::skip_index_builder::SkipIndexBuilder;
use crate::DocId;

/// Meta-information about a block: either a block of documents, or another
/// block of checkpoints.
///
/// Both intervals are semi-open. A checkpoint states that the block stored
/// within `byte_range` spans the documents of `doc_range`.
#[derive(Clone, Eq, PartialEq, Default)]
pub struct Checkpoint {
    pub doc_range: Range<DocId>,
    pub byte_range: Range<usize>,
}

impl Checkpoint {
    /// Returns true if `self` starts exactly where `other` ends, for both the
    /// doc range and the byte range.
    pub(crate) fn follows(&self, other: &Checkpoint) -> bool {
        let docs_are_contiguous = other.doc_range.end == self.doc_range.start;
        let bytes_are_contiguous = other.byte_range.end == self.byte_range.start;
        docs_are_contiguous && bytes_are_contiguous
    }
}

/// Compact rendering of the form `(doc=<doc_range>, bytes=<byte_range>)`.
impl fmt::Debug for Checkpoint {
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        f.write_fmt(format_args!(
            "(doc={:?}, bytes={:?})",
            self.doc_range, self.byte_range
        ))
    }
}

#[cfg(test)]
mod tests {

    use std::io;

    use proptest::prelude::*;

    use super::{SkipIndex, SkipIndexBuilder};
    use crate::directory::OwnedBytes;
    use crate::indexer::NoMergePolicy;
    use crate::schema::{SchemaBuilder, STORED, TEXT};
    use crate::store::index::Checkpoint;
    use crate::{DocAddress, DocId, Index, IndexWriter, TantivyDocument, Term};

    /// A skip index built without any checkpoint yields no checkpoint.
    #[test]
    fn test_skip_index_empty() -> io::Result<()> {
        let mut output: Vec<u8> = Vec::new();
        let skip_index_builder: SkipIndexBuilder = SkipIndexBuilder::new();
        skip_index_builder.serialize_into(&mut output)?;
        let skip_index: SkipIndex = SkipIndex::open(OwnedBytes::new(output));
        let mut skip_cursor = skip_index.checkpoints();
        assert!(skip_cursor.next().is_none());
        Ok(())
    }

    /// A single checkpoint survives the build / open round-trip.
    #[test]
    fn test_skip_index_single_el() -> io::Result<()> {
        let mut output: Vec<u8> = Vec::new();
        let mut skip_index_builder: SkipIndexBuilder = SkipIndexBuilder::new();
        let checkpoint = Checkpoint {
            doc_range: 0..2,
            byte_range: 0..3,
        };
        skip_index_builder.insert(checkpoint.clone());
        skip_index_builder.serialize_into(&mut output)?;
        let skip_index: SkipIndex = SkipIndex::open(OwnedBytes::new(output));
        let mut skip_cursor = skip_index.checkpoints();
        assert_eq!(skip_cursor.next(), Some(checkpoint));
        assert_eq!(skip_cursor.next(), None);
        Ok(())
    }

    /// A handful of checkpoints (fewer than one full block) round-trips in order.
    #[test]
    fn test_skip_index() -> io::Result<()> {
        let mut output: Vec<u8> = Vec::new();
        let checkpoints = vec![
            Checkpoint {
                doc_range: 0..3,
                byte_range: 0..9,
            },
            Checkpoint {
                doc_range: 3..4,
                byte_range: 9..25,
            },
            Checkpoint {
                doc_range: 4..6,
                byte_range: 25..49,
            },
            Checkpoint {
                doc_range: 6..8,
                byte_range: 49..81,
            },
            Checkpoint {
                doc_range: 8..10,
                byte_range: 81..100,
            },
        ];

        let mut skip_index_builder: SkipIndexBuilder = SkipIndexBuilder::new();
        for checkpoint in &checkpoints {
            skip_index_builder.insert(checkpoint.clone());
        }
        skip_index_builder.serialize_into(&mut output)?;

        let skip_index: SkipIndex = SkipIndex::open(OwnedBytes::new(output));
        assert_eq!(
            &skip_index.checkpoints().collect::<Vec<_>>()[..],
            &checkpoints[..]
        );
        Ok(())
    }

    /// Synthetic byte offset for `doc`: grows quadratically, so consecutive
    /// checkpoints have different byte lengths.
    fn offset_test(doc: DocId) -> usize {
        (doc as usize) * (doc as usize)
    }

    /// Regression test (issue 969, per the test name): after merging two
    /// segments, one of which has a deleted document, every remaining document
    /// can still be fetched from the store.
    #[test]
    fn test_merge_store_with_stacking_reproducing_issue969() -> crate::Result<()> {
        let mut schema_builder = SchemaBuilder::default();
        let text = schema_builder.add_text_field("text", STORED | TEXT);
        let body = schema_builder.add_text_field("body", STORED);
        let schema = schema_builder.build();
        let index = Index::create_in_ram(schema);
        let mut index_writer: IndexWriter = index.writer_for_tests()?;
        index_writer.set_merge_policy(Box::new(NoMergePolicy));
        let long_text: String = "abcdefghijklmnopqrstuvwxyz".repeat(1_000);
        // First commit: 20 large documents.
        for _ in 0..20 {
            index_writer.add_document(doc!(body=>long_text.clone()))?;
        }
        index_writer.commit()?;
        // Second commit: one small document (deleted below) and 10 large ones.
        index_writer.add_document(doc!(text=>"testb"))?;
        for _ in 0..10 {
            index_writer.add_document(doc!(text=>"testd", body=>long_text.clone()))?;
        }
        index_writer.commit()?;
        index_writer.delete_term(Term::from_field_text(text, "testb"));
        index_writer.commit()?;
        let segment_ids = index.searchable_segment_ids()?;
        index_writer.merge(&segment_ids).wait().unwrap();
        let reader = index.reader()?;
        let searcher = reader.searcher();
        assert_eq!(searcher.num_docs(), 30);
        // Fetching each document must succeed.
        for i in 0..searcher.num_docs() as u32 {
            let _doc = searcher.doc::<TantivyDocument>(DocAddress::new(0u32, i))?;
        }
        Ok(())
    }

    /// 1000 checkpoints (enough to need several layers) round-trip, and the
    /// serialized size stays at its pinned value.
    #[test]
    fn test_skip_index_long() -> io::Result<()> {
        let mut output: Vec<u8> = Vec::new();
        let checkpoints: Vec<Checkpoint> = (0..1000)
            .map(|i| Checkpoint {
                doc_range: i..(i + 1),
                byte_range: offset_test(i)..offset_test(i + 1),
            })
            .collect();
        let mut skip_index_builder = SkipIndexBuilder::new();
        for checkpoint in &checkpoints {
            skip_index_builder.insert(checkpoint.clone());
        }
        skip_index_builder.serialize_into(&mut output)?;
        // Guards against accidental changes of the serialized format.
        assert_eq!(output.len(), 4035);
        let resulting_checkpoints: Vec<Checkpoint> = SkipIndex::open(OwnedBytes::new(output))
            .checkpoints()
            .collect();
        assert_eq!(&resulting_checkpoints, &checkpoints);
        Ok(())
    }

    /// Turns a list of deltas into the running sums, starting at 0. The
    /// output has one more element than the input.
    fn integrate_delta(vals: Vec<usize>) -> Vec<usize> {
        let mut output = Vec::with_capacity(vals.len() + 1);
        output.push(0);
        let mut prev = 0;
        for val in vals {
            let new_val = val + prev;
            prev = new_val;
            output.push(new_val);
        }
        output
    }

    // Generates a sequence of n valid checkpoints, with n < max_len.
    fn monotonic_checkpoints(max_len: usize) -> BoxedStrategy<Vec<Checkpoint>> {
        (0..max_len)
            .prop_flat_map(move |len: usize| {
                (
                    // Strictly positive deltas, so every range is non-empty.
                    proptest::collection::vec(1usize..20, len).prop_map(integrate_delta),
                    proptest::collection::vec(1usize..26, len).prop_map(integrate_delta),
                )
                    .prop_map(|(docs, offsets)| {
                        // Consecutive boundaries become contiguous checkpoints.
                        (0..docs.len() - 1)
                            .map(move |i| Checkpoint {
                                doc_range: docs[i] as DocId..docs[i + 1] as DocId,
                                byte_range: offsets[i]..offsets[i + 1],
                            })
                            .collect::<Vec<Checkpoint>>()
                    })
            })
            .boxed()
    }

    /// Reference implementation of `seek`: linear scan for the first
    /// checkpoint whose doc range ends after `target`.
    fn seek_manual<I: Iterator<Item = Checkpoint>>(
        checkpoints: I,
        target: DocId,
    ) -> Option<Checkpoint> {
        checkpoints
            .into_iter()
            .find(|checkpoint| checkpoint.doc_range.end > target)
    }

    /// Checks `SkipIndex::seek` against `seek_manual` for every doc covered by
    /// `checkpoints`, and that seeking past the last doc returns `None`.
    fn test_skip_index_aux(skip_index: SkipIndex, checkpoints: &[Checkpoint]) {
        if let Some(last_checkpoint) = checkpoints.last() {
            for doc in 0u32..last_checkpoint.doc_range.end {
                let expected = seek_manual(skip_index.checkpoints(), doc);
                assert_eq!(expected, skip_index.seek(doc), "Doc {doc}");
            }
            assert!(skip_index.seek(last_checkpoint.doc_range.end).is_none());
        }
    }

    proptest! {
        #![proptest_config(ProptestConfig::with_cases(20))]
        // Random contiguous checkpoints must round-trip through the skip
        // index, and `seek` must agree with the linear reference scan.
        #[test]
        fn test_proptest_skip(checkpoints in monotonic_checkpoints(100)) {
             let mut skip_index_builder = SkipIndexBuilder::new();
             for checkpoint in checkpoints.iter().cloned() {
                 skip_index_builder.insert(checkpoint);
             }
             let mut buffer = Vec::new();
             skip_index_builder.serialize_into(&mut buffer).unwrap();
             let skip_index = SkipIndex::open(OwnedBytes::new(buffer));
             let iter_checkpoints: Vec<Checkpoint> = skip_index.checkpoints().collect();
             assert_eq!(&checkpoints[..], &iter_checkpoints[..]);
             test_skip_index_aux(skip_index, &checkpoints[..]);
         }
    }
}


================================================
FILE: src/store/index/skip_index.rs
================================================
use common::{BinarySerializable, VInt};

use crate::directory::OwnedBytes;
use crate::store::index::block::CheckpointBlock;
use crate::store::index::Checkpoint;
use crate::DocId;

/// Iterator over the checkpoints of one layer, decoding one block at a time.
pub struct LayerCursor<'a> {
    /// Serialized blocks that have not been decoded yet.
    remaining: &'a [u8],
    /// The block currently being iterated.
    block: CheckpointBlock,
    /// Position of the next checkpoint to return within `block`.
    cursor: usize,
}

impl Iterator for LayerCursor<'_> {
    type Item = Checkpoint;

    /// Returns the next checkpoint of the layer.
    ///
    /// Iteration stops once all bytes have been consumed, or as soon as a
    /// block fails to deserialize.
    fn next(&mut self) -> Option<Checkpoint> {
        let block_exhausted = self.cursor == self.block.len();
        if block_exhausted {
            if self.remaining.is_empty() {
                return None;
            }
            // Decode the following block in place; a decoding error ends the
            // iteration.
            self.block.deserialize(&mut self.remaining).ok()?;
            self.cursor = 0;
        }
        let checkpoint = self.block.get(self.cursor);
        self.cursor += 1;
        Some(checkpoint)
    }
}

/// One layer of the skip index: a sequence of serialized checkpoint blocks.
struct Layer {
    data: OwnedBytes,
}

impl Layer {
    /// Iterates over all the checkpoints of the layer.
    fn cursor(&self) -> impl Iterator<Item = Checkpoint> + '_ {
        self.cursor_at_offset(0)
    }

    /// Iterates over the checkpoints of the layer, starting with the block
    /// located at byte `start_offset`.
    ///
    /// # Panics
    ///
    /// Panics if `start_offset` is past the end of the layer.
    fn cursor_at_offset(&self, start_offset: usize) -> impl Iterator<Item = Checkpoint> + '_ {
        let layer_bytes: &[u8] = self.data.as_slice();
        LayerCursor {
            remaining: &layer_bytes[start_offset..],
            block: CheckpointBlock::default(),
            cursor: 0,
        }
    }

    /// Scans forward from byte `offset` and returns the first checkpoint whose
    /// doc range ends after `target`, if any.
    fn seek_start_at_offset(&self, target: DocId, offset: usize) -> Option<Checkpoint> {
        let mut checkpoints = self.cursor_at_offset(offset);
        checkpoints.find(|checkpoint| target < checkpoint.doc_range.end)
    }
}

pub struct SkipIndex {
    layers: Vec<Layer>,
}

impl SkipIndex {
    pub fn open(mut data: OwnedBytes) -> SkipIndex {
        let offsets: Vec<u64> = Vec::<VInt>::deserialize(&mut data)
            .unwrap()
            .into_iter()
            .map(|el| el.0)
            .collect();
        let mut start_offset = 0;
        let mut layers = Vec::new();
        for end_offset in offsets {
            let layer = Layer {
                data: data.slice(start_offset as usize..end_offset as usize),
            };
            layers.push(layer);
            start_offset = end_offset;
        }
        SkipIndex { layers }
    }

    pub(crate) fn checkpoints(&self) -> impl Iterator<Item = Checkpoint> + '_ {
        self.layers
            .last()
            .into_iter()
            .flat_map(|layer| layer.cursor())
    }

    pub fn seek(&self, target: DocId) -> Option<Checkpoint> {
        let first_layer_len = self
            .layers
            .first()
            .map(|layer| layer.data.len())
            .unwrap_or(0);
        let mut cur_checkpoint = Checkpoint {
            doc_range: 0u32..1u32,
            byte_range: 0..first_layer_len,
        };
        for layer in &self.layers {
            if let Some(checkpoint) =
                layer.seek_start_at_offset(target, cur_checkpoint.byte_range.start)
            {
                cur_checkpoint = checkpoint;
            } else {
                return None;
            }
        }
        Some(cur_checkpoint)
    }
}


================================================
FILE: src/store/index/skip_index_builder.rs
================================================
use std::io;
use std::io::Write;

use common::{BinarySerializable, VInt};

use crate::store::index::block::CheckpointBlock;
use crate::store::index::{Checkpoint, CHECKPOINT_PERIOD};

// Each skip contains iterator over pairs (last doc in block, offset to start of block).

/// Accumulates the checkpoints of one skip index layer.
struct LayerBuilder {
    /// Blocks already serialized for this layer.
    buffer: Vec<u8>,
    /// Block currently being filled.
    pub block: CheckpointBlock,
}

impl LayerBuilder {
    /// Consumes the builder and returns the bytes serialized so far.
    fn finish(self) -> Vec<u8> {
        self.buffer
    }

    /// Creates a builder with nothing serialized and an empty current block.
    fn new() -> LayerBuilder {
        LayerBuilder {
            buffer: Vec::new(),
            block: CheckpointBlock::default(),
        }
    }

    /// Serializes the current block and returns a checkpoint describing it:
    /// the docs it covers and the bytes it occupies in this layer's buffer.
    ///
    /// Returns `None`, and writes nothing, if the block is empty.
    fn flush_block(&mut self) -> Option<Checkpoint> {
        let doc_range = self.block.doc_interval()?;
        let start_offset = self.buffer.len();
        self.block.serialize(&mut self.buffer);
        let end_offset = self.buffer.len();
        self.block.clear();
        Some(Checkpoint {
            doc_range,
            byte_range: start_offset..end_offset,
        })
    }

    /// Appends a checkpoint to the current block without flushing it.
    fn push(&mut self, checkpoint: Checkpoint) {
        self.block.push(checkpoint);
    }

    /// Appends a checkpoint and flushes the current block once it holds
    /// `CHECKPOINT_PERIOD` checkpoints.
    ///
    /// Returns the checkpoint describing the flushed block, if a flush happened.
    fn insert(&mut self, checkpoint: Checkpoint) -> Option<Checkpoint> {
        self.push(checkpoint);
        if self.block.len() < CHECKPOINT_PERIOD {
            return None;
        }
        self.flush_block()
    }
}

pub struct SkipIndexBuilder {
    layers: Vec<LayerBuilder>,
}

impl SkipIndexBuilder {
    pub fn new() -> SkipIndexBuilder {
        SkipIndexBuilder { layers: Vec::new() }
    }

    fn get_layer(&mut self, layer_id: usize) -> &mut LayerBuilder {
        if layer_id == self.layers.len() {
            let layer_builder = LayerBuilder::new();
            self.layers.push(layer_builder);
        }
        &mut self.layers[layer_id]
    }

    pub fn insert(&mut self, checkpoint: Checkpoint) {
        let mut skip_pointer = Some(checkpoint);
        for layer_id in 0.. {
            if let Some(checkpoint) = skip_pointer {
                skip_pointer = self.get_layer(layer_id).insert(checkpoint);
            } else {
                break;
            }
        }
    }

    pub fn serialize_into<W: Write>(mut self, output: &mut W) -> io::Result<()> {
        let mut last_pointer = None;
        for skip_layer in self.layers.iter_mut() {
            if let Some(checkpoint) = last_pointer {
                skip_layer.push(checkpoint);
            }
            last_pointer = skip_layer.flush_block();
        }
        let layer_buffers: Vec<Vec<u8>> = self
            .layers
            .into_iter()
            .rev()
            .map(|layer| layer.finish())
            .collect();

        let mut layer_offset = 0;
        let mut layer_sizes = Vec::new();
        for layer_buffer in &layer_buffers {
            layer_offset += layer_buffer.len() as u64;
            layer_sizes.push(VInt(layer_offset));
        }
        layer_sizes.serialize(output)?;
        for layer_buffer in layer_buffers {
            output.write_all(&layer_buffer[..])?;
        }
        Ok(())
    }
}


================================================
FILE: src/store/mod.rs
================================================
//! Compressed/slow/row-oriented storage for documents.
//!
//! A field needs to be marked as stored in the schema in
//! order to be handled in the `Store`.
//!
//! Internally, documents (or rather their stored fields) are serialized to a buffer.
//! When the buffer exceeds `block_size` (defaults to 16K), the buffer is compressed
//! using LZ4 or Zstd and the resulting block is written to disk.
//!
//! One can then request a specific `DocId`.
//! A skip list helps navigate to the right block, which is then
//! decompressed entirely to return the document within it.
//!
//! If the last document requested was in the same block,
//! the reader is smart enough to avoid decompressing
//! the block a second time, but there is no real
//! uncompressed block* cache.
//!
//! A typical use case for the store is, once
//! the search result page has been computed, returning
//! the actual content of the 10 best documents.
//!
//! # Usage
//!
//! Most users should not access the `StoreReader` directly
//! and should rely on either
//!
//! - at the segment level, the [`SegmentReader`'s `doc`
//!   method](../struct.SegmentReader.html#method.doc)
//! - at the index level, the [`Searcher::doc()`](crate::Searcher::doc) method

mod compressors;
mod decompressors;
mod footer;
mod index;
mod reader;
mod writer;

pub use self::compressors::{Compressor, ZstdCompressor};
pub use self::decompressors::Decompressor;
pub use self::reader::{CacheStats, StoreReader};
pub(crate) use self::reader::{DocStoreVersion, DOCSTORE_CACHE_CAPACITY};
pub use self::writer::StoreWriter;
mod store_compressor;

/// Doc store version in footer to handle format changes.
pub(crate) const DOC_STORE_VERSION: DocStoreVersion = DocStoreVersion::V2;

#[cfg(feature = "lz4-compression")]
mod compression_lz4_block;

#[cfg(feature = "zstd-compression")]
mod compression_zstd_block;

#[cfg(test)]
pub(crate) mod tests {

    use std::path::Path;

    use super::*;
    use crate::directory::{Directory, RamDirectory, WritePtr};
    use crate::fastfield::AliveBitSet;
    use crate::schema::{
        self, Schema, TantivyDocument, TextFieldIndexing, TextOptions, Value, STORED, TEXT,
    };
    use crate::{Index, IndexWriter, Term};

    const LOREM: &str = "Doc Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do \
                         eiusmod tempor incididunt ut labore et dolore magna aliqua. Ut enim ad \
                         minim veniam, quis nostrud exercitation ullamco laboris nisi ut aliquip \
                         ex ea commodo consequat. Duis aute irure dolor in reprehenderit in \
                         voluptate velit esse cillum dolore eu fugiat nulla pariatur. Excepteur \
                         sint occaecat cupidatat non proident, sunt in culpa qui officia deserunt \
                         mollit anim id est laborum.";

    const BLOCK_SIZE: usize = 16_384;

    /// Writes `num_docs` documents into a new doc store and returns the schema that was used.
    ///
    /// Each document stores the `LOREM` text in its `body` field and `"Doc {i}"` in its `title`
    /// field, where `i` is the zero-based insertion rank. Any write failure panics, which is
    /// what we want from a test helper.
    pub fn write_lorem_ipsum_store(
        writer: WritePtr,
        num_docs: usize,
        compressor: Compressor,
        blocksize: usize,
        separate_thread: bool,
    ) -> Schema {
        let stored_text = || TextOptions::default().set_stored();

        let mut builder = Schema::builder();
        let body = builder.add_text_field("body", stored_text());
        let title = builder.add_text_field("title", stored_text());
        let schema = builder.build();

        let mut store_writer =
            StoreWriter::new(writer, compressor, blocksize, separate_thread).unwrap();
        for doc_rank in 0..num_docs {
            let mut document = TantivyDocument::default();
            document.add_text(body, LOREM);
            document.add_text(title, format!("Doc {doc_rank}"));
            store_writer.store(&document, &schema).unwrap();
        }
        store_writer.close().unwrap();

        schema
    }

    const NUM_DOCS: usize = 1_000;

    /// Regression test (named after bug 1077): iterating the store with an alive bitset must
    /// never yield a deleted document, even when the deleted range starts a checkpoint.
    #[test]
    fn test_doc_store_iter_with_delete_bug_1077() -> crate::Result<()> {
        // this will cover deletion of the first element in a checkpoint
        let deleted_doc_ids: Vec<_> = (200..300).collect();
        let alive_bitset =
            AliveBitSet::for_test_from_deleted_docs(&deleted_doc_ids, NUM_DOCS as u32);

        let store_path = Path::new("store");
        let ram_directory = RamDirectory::create();
        let schema = write_lorem_ipsum_store(
            ram_directory.open_write(store_path)?,
            NUM_DOCS,
            Compressor::default(),
            BLOCK_SIZE,
            true,
        );
        let field_title = schema.get_field("title").unwrap();
        let store = StoreReader::open(ram_directory.open_read(store_path)?, 10)?;

        // Extracts the stored title of a document as an owned string.
        let title_of = |doc: &TantivyDocument| -> String {
            doc.get_first(field_title)
                .unwrap()
                .as_value()
                .as_str()
                .unwrap()
                .to_string()
        };

        // Random access: every document is reachable by its doc id.
        for doc_id in 0..NUM_DOCS as u32 {
            let doc = store.get::<TantivyDocument>(doc_id)?;
            assert_eq!(title_of(&doc), format!("Doc {doc_id}"));
        }

        // Sequential access: only alive documents may be returned.
        for doc_res in store.iter::<TantivyDocument>(Some(&alive_bitset)) {
            let title_content = title_of(&doc_res?);
            let id = match title_content.strip_prefix("Doc ") {
                Some(id_text) => id_text.parse::<u32>().unwrap(),
                None => panic!("unexpected title_content {title_content}"),
            };
            assert!(
                !alive_bitset.is_deleted(id),
                "unexpected deleted document {id}"
            );
        }

        Ok(())
    }

    /// Writes `NUM_DOCS` documents with the given settings and checks that they can be read
    /// back both by doc id and through the sequential iterator.
    fn test_store(
        compressor: Compressor,
        blocksize: usize,
        separate_thread: bool,
    ) -> crate::Result<()> {
        let store_path = Path::new("store");
        let ram_directory = RamDirectory::create();
        let schema = write_lorem_ipsum_store(
            ram_directory.open_write(store_path)?,
            NUM_DOCS,
            compressor,
            blocksize,
            separate_thread,
        );
        let title_field = schema.get_field("title").unwrap();
        let store = StoreReader::open(ram_directory.open_read(store_path)?, 10)?;

        // Random access by doc id.
        for doc_id in 0..NUM_DOCS as u32 {
            let doc = store.get::<TantivyDocument>(doc_id)?;
            let title = doc.get_first(title_field).unwrap().as_str().unwrap();
            assert_eq!(title, format!("Doc {doc_id}"));
        }

        // Sequential access, in storage order.
        for (rank, doc_res) in store.iter::<TantivyDocument>(None).enumerate() {
            let doc = doc_res?;
            let title = doc.get_first(title_field).unwrap().as_str().unwrap();
            assert_eq!(title, format!("Doc {rank}"));
        }
        Ok(())
    }

    /// Round-trips the store without compression and with `separate_thread` disabled.
    #[test]
    fn test_store_no_compression_same_thread() -> crate::Result<()> {
        let separate_thread = false;
        test_store(Compressor::None, BLOCK_SIZE, separate_thread)
    }

    /// Round-trips the store without compression and with `separate_thread` enabled.
    #[test]
    fn test_store_no_compression() -> crate::Result<()> {
        let separate_thread = true;
        test_store(Compressor::None, BLOCK_SIZE, separate_thread)
    }

    /// Round-trips the store with LZ4 block compression and `separate_thread` enabled.
    #[cfg(feature = "lz4-compression")]
    #[test]
    fn test_store_lz4_block() -> crate::Result<()> {
        let separate_thread = true;
        test_store(Compressor::Lz4, BLOCK_SIZE, separate_thread)
    }

    /// Round-trips the store with the default Zstd compressor and `separate_thread` enabled.
    #[cfg(feature = "zstd-compression")]
    #[test]
    fn test_store_zstd() -> crate::Result<()> {
        let zstd = Compressor::Zstd(ZstdCompressor::default());
        let separate_thread = true;
        test_store(zstd, BLOCK_SIZE, separate_thread)
    }

    /// Checks that iterating a segment's store with its alive bitset only yields the documents
    /// that survived a `delete_term`.
    #[test]
    fn test_store_with_delete() -> crate::Result<()> {
        let indexing = TextFieldIndexing::default()
            .set_index_option(schema::IndexRecordOption::WithFreqsAndPositions);
        let text_field_options = TextOptions::default()
            .set_indexing_options(indexing)
            .set_stored();

        let mut schema_builder = schema::Schema::builder();
        let text_field = schema_builder.add_text_field("text_field", text_field_options);
        let index = Index::builder()
            .schema(schema_builder.build())
            .create_in_ram()?;

        {
            let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
            let texts = [
                "deleteme",
                "deletemenot",
                "deleteme",
                "deletemenot",
                "deleteme",
            ];
            for text in texts {
                index_writer.add_document(doc!(text_field=> text))?;
            }

            index_writer.delete_term(Term::from_field_text(text_field, "deleteme"));
            index_writer.commit()?;
        }

        let searcher = index.reader()?.searcher();
        let segment_reader = searcher.segment_reader(0);
        let store = segment_reader.get_store_reader(10)?;
        for doc_res in store.iter::<TantivyDocument>(segment_reader.alive_bitset()) {
            let doc = doc_res?;
            let text = doc.get_first(text_field).unwrap().as_str().unwrap();
            assert_eq!(text, "deletemenot");
        }
        Ok(())
    }

    /// Checks that merging segments after switching the doc store compressor rewrites the
    /// store with the new compressor and keeps the documents readable.
    #[cfg(all(feature = "lz4-compression", feature = "zstd-compression"))]
    #[test]
    fn test_merge_with_changed_compressor() -> crate::Result<()> {
        let mut schema_builder = schema::Schema::builder();
        let text_field = schema_builder.add_text_field("text_field", TEXT | STORED);
        let mut index = Index::builder()
            .schema(schema_builder.build())
            .create_in_ram()
            .unwrap();
        index.settings_mut().docstore_compression = Compressor::Lz4;

        {
            let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
            // Two commits, each with enough data to create enough blocks in the doc store to be
            // considered for stacking.
            for _commit in 0..2 {
                for _ in 0..200 {
                    index_writer.add_document(doc!(text_field=> LOREM))?;
                }
                assert!(index_writer.commit().is_ok());
            }
        }

        let initial_decompressor = index.reader().unwrap().searcher().segment_readers()[0]
            .get_store_reader(10)
            .unwrap()
            .decompressor();
        assert_eq!(initial_decompressor, Decompressor::Lz4);

        // Change compressor, this disables stacking on merging
        index.settings_mut().docstore_compression = Compressor::Zstd(Default::default());

        // Merging the segments
        {
            let segment_ids = index
                .searchable_segment_ids()
                .expect("Searchable segments failed.");
            let mut index_writer: IndexWriter = index.writer_for_tests().unwrap();
            assert!(index_writer.merge(&segment_ids).wait().is_ok());
            assert!(index_writer.wait_merging_threads().is_ok());
        }

        let searcher = index.reader().unwrap().searcher();
        assert_eq!(searcher.segment_readers().len(), 1);
        let merged_reader = searcher.segment_readers().last().unwrap();
        let store = merged_reader.get_store_reader(10).unwrap();

        let first_docs = store
            .iter::<TantivyDocument>(merged_reader.alive_bitset())
            .take(50);
        for doc_res in first_docs {
            let doc = doc_res?;
            let text = doc
                .get_first(text_field)
                .and_then(|value| value.as_str())
                .unwrap();
            assert_eq!(text, LOREM);
        }
        assert_eq!(store.decompressor(), Decompressor::Zstd);

        Ok(())
    }

    /// Checks that merging several single-document segments produces a doc store made of a
    /// single block.
    #[test]
    fn test_merge_of_small_segments() -> crate::Result<()> {
        let mut schema_builder = schema::Schema::builder();
        let text_field = schema_builder.add_text_field("text_field", TEXT | STORED);
        let index = Index::builder()
            .schema(schema_builder.build())
            .create_in_ram()
            .unwrap();

        // One commit per document, hence one tiny segment per document.
        {
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            for text in ["1", "2", "3", "4", "5"] {
                index_writer.add_document(doc!(text_field=> text))?;
                index_writer.commit()?;
            }
        }

        // Merging the segments
        {
            let segment_ids = index.searchable_segment_ids()?;
            let mut index_writer: IndexWriter = index.writer_for_tests()?;
            index_writer.merge(&segment_ids).wait()?;
            index_writer.wait_merging_threads()?;
        }

        let searcher = index.reader()?.searcher();
        assert_eq!(searcher.segment_readers().len(), 1);
        let merged_reader = searcher.segment_readers().last().unwrap();
        let store = merged_reader.get_store_reader(10)?;
        let num_blocks = store.block_checkpoints().count();
        assert_eq!(num_blocks, 1);
        Ok(())
    }
}

#[cfg(all(test, feature = "unstable"))]
mod bench {

    use std::path::Path;

    use test::Bencher;

    use super::tests::write_lorem_ipsum_store;
    use crate::directory::{Directory, RamDirectory};
    use crate::store::{Compressor, StoreReader};
    use crate::TantivyDocument;

    /// Measures writing 1,000 lorem-ipsum documents with the default compressor.
    #[bench]
    #[cfg(feature = "mmap")]
    fn bench_store_encode(b: &mut Bencher) {
        let store_path = Path::new("store");
        let ram_directory = RamDirectory::create();
        b.iter(|| {
            let writer = ram_directory.open_write(store_path).unwrap();
            write_lorem_ipsum_store(writer, 1_000, Compressor::default(), 16_384, true);
            // Remove the file so that the next iteration can create it again.
            ram_directory.delete(store_path).unwrap();
        });
    }

    /// Measures iterating over (and deserializing) every document of a 1,000 document store.
    #[bench]
    fn bench_store_decode(b: &mut Bencher) {
        let store_path = Path::new("store");
        let ram_directory = RamDirectory::create();
        let writer = ram_directory.open_write(store_path).unwrap();
        write_lorem_ipsum_store(writer, 1_000, Compressor::default(), 16_384, true);

        let store_file = ram_directory.open_read(store_path).unwrap();
        let store = StoreReader::open(store_file, 10).unwrap();
        b.iter(|| {
            let all_docs: Vec<_> = store.iter::<TantivyDocument>(None).collect();
            all_docs
        });
    }
}


================================================
FILE: src/store/reader.rs
================================================
use std::fmt::Display;
use std::io;
use std::iter::Sum;
use std::num::NonZeroUsize;
use std::ops::{AddAssign, Range};
use std::sync::atomic::{AtomicUsize, Ordering};
use std::sync::{Arc, Mutex};

use common::{BinarySerializable, OwnedBytes};
use lru::LruCache;

use super::footer::DocStoreFooter;
use super::index::SkipIndex;
use super::Decompressor;
use crate::directory::FileSlice;
use crate::error::DataCorruption;
use crate::fastfield::AliveBitSet;
use crate::schema::document::{BinaryDocumentDeserializer, DocumentDeserialize};
use crate::space_usage::StoreSpaceUsage;
use crate::store::index::Checkpoint;
use crate::DocId;
#[cfg(feature = "quickwit")]
use crate::Executor;

pub(crate) const DOCSTORE_CACHE_CAPACITY: usize = 100;

type Block = OwnedBytes;

/// The format version of the document store.
///
/// The discriminant of each variant is the value that is written to and read from the
/// serialized form as a `u32`. The derived `PartialOrd` makes versions comparable
/// (`V1 < V2`).
#[derive(Clone, Copy, Debug, PartialEq, PartialOrd)]
pub(crate) enum DocStoreVersion {
    /// Version serialized as `1`.
    V1 = 1,
    /// Version serialized as `2`.
    V2 = 2,
}
impl Display for DocStoreVersion {
    /// Formats the version as its variant name (`V1` or `V2`).
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let label = match self {
            DocStoreVersion::V1 => "V1",
            DocStoreVersion::V2 => "V2",
        };
        f.write_str(label)
    }
}
impl BinarySerializable for DocStoreVersion {
    /// Writes the version as the `u32` value of its discriminant.
    fn serialize<W: io::Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        let raw_version = *self as u32;
        raw_version.serialize(writer)
    }

    /// Reads a `u32` and maps it back to a version.
    ///
    /// Returns an `InvalidData` error if the value does not match a known version.
    fn deserialize<R: io::Read>(reader: &mut R) -> io::Result<Self> {
        let raw_version = u32::deserialize(reader)?;
        match raw_version {
            1 => Ok(DocStoreVersion::V1),
            2 => Ok(DocStoreVersion::V2),
            unknown => Err(io::Error::new(
                io::ErrorKind::InvalidData,
                format!("Invalid doc store version {unknown}"),
            )),
        }
    }
}

/// Reads document off tantivy's [`Store`](./index.html)
pub struct StoreReader {
    /// Decompressor announced by the store footer, applied to every block that is read.
    decompressor: Decompressor,
    /// Format version announced by the store footer, forwarded to the document deserializer.
    doc_store_version: DocStoreVersion,
    /// The part of the store file that holds the compressed blocks.
    data: FileSlice,
    /// Index used to find the checkpoint (block) that contains a given doc id.
    skip_index: Arc<SkipIndex>,
    /// Number of bytes taken by the block data and by the skip index.
    space_usage: StoreSpaceUsage,
    /// Cache of decompressed blocks, together with its hit/miss counters.
    cache: BlockCache,
}

/// The cache for decompressed blocks.
struct BlockCache {
    /// LRU of decompressed blocks keyed by the start offset of the block in the data file.
    /// `None` when the reader was opened with a cache capacity of 0.
    cache: Option<Mutex<LruCache<usize, Block>>>,
    /// Number of lookups that found their block in the cache.
    cache_hits: AtomicUsize,
    /// Number of lookups that did not find their block in the cache.
    cache_misses: AtomicUsize,
}

impl BlockCache {
    /// Looks up the decompressed block stored under `pos`.
    ///
    /// Every call increments either the hit or the miss counter. When the cache is disabled,
    /// every lookup counts as a miss.
    fn get_from_cache(&self, pos: usize) -> Option<Block> {
        let cached_block = self
            .cache
            .as_ref()
            .and_then(|lru| lru.lock().unwrap().get(&pos).cloned());
        let counter = if cached_block.is_some() {
            &self.cache_hits
        } else {
            &self.cache_misses
        };
        counter.fetch_add(1, Ordering::SeqCst);
        cached_block
    }

    /// Stores `data` under `pos`. Does nothing when the cache is disabled.
    fn put_into_cache(&self, pos: usize, data: Block) {
        match &self.cache {
            Some(lru) => {
                lru.lock().unwrap().put(pos, data);
            }
            None => {}
        }
    }

    /// Returns a snapshot of the counters and of the number of cached blocks.
    fn stats(&self) -> CacheStats {
        let cache_hits = self.cache_hits.load(Ordering::Relaxed);
        let cache_misses = self.cache_misses.load(Ordering::Relaxed);
        let num_entries = self.len();
        CacheStats {
            num_entries,
            cache_hits,
            cache_misses,
        }
    }

    /// Number of blocks currently held by the cache (0 when the cache is disabled).
    fn len(&self) -> usize {
        match &self.cache {
            Some(lru) => lru.lock().unwrap().len(),
            None => 0,
        }
    }

    /// Key of the least recently used entry, if any, without touching the LRU order.
    #[cfg(test)]
    fn peek_lru(&self) -> Option<usize> {
        let lru = self.cache.as_ref()?;
        let least_recent_key = lru.lock().unwrap().peek_lru().map(|(&key, _)| key);
        least_recent_key
    }
}

#[derive(Debug, Default)]
/// CacheStats for the `StoreReader`.
///
/// Stats can be accumulated with `+=` and summed over an iterator; every field is added
/// independently.
pub struct CacheStats {
    /// The number of entries in the cache
    pub num_entries: usize,
    /// The number of cache hits.
    pub cache_hits: usize,
    /// The number of cache misses.
    pub cache_misses: usize,
}

impl AddAssign for CacheStats {
    /// Adds every counter of `other` to the matching counter of `self`.
    fn add_assign(&mut self, other: Self) {
        let Self {
            num_entries,
            cache_hits,
            cache_misses,
        } = other;
        self.num_entries += num_entries;
        self.cache_hits += cache_hits;
        self.cache_misses += cache_misses;
    }
}

impl Sum for CacheStats {
    fn sum<I: Iterator<Item = Self>>(mut iter: I) -> Self {
        let mut first = iter.next().unwrap_or_default();
        for el in iter {
            first += el;
        }
        first
    }
}

impl StoreReader {
    /// Opens a store reader
    ///
    /// `cache_num_blocks` sets the number of decompressed blocks to be cached in an LRU.
    /// Passing `0` disables the cache. The size of blocks is configurable, so the same
    /// `cache_num_blocks` can hold more or less decompressed data depending on the block size
    /// the store was written with.
    ///
    /// # Errors
    ///
    /// Returns an error if the footer cannot be extracted or if the skip index bytes cannot be
    /// read.
    pub fn open(store_file: FileSlice, cache_num_blocks: usize) -> io::Result<StoreReader> {
        let (footer, body) = DocStoreFooter::extract_footer(store_file)?;

        // The footer offset marks where the block data ends and the skip index starts.
        let (block_data, skip_index_file) = body.split(footer.offset as usize);
        let skip_index_bytes = skip_index_file.read_bytes()?;
        let space_usage =
            StoreSpaceUsage::new(block_data.num_bytes(), skip_index_file.num_bytes());
        let skip_index = Arc::new(SkipIndex::open(skip_index_bytes));

        // A capacity of 0 is not a valid LRU capacity: it means "no cache".
        let lru = NonZeroUsize::new(cache_num_blocks)
            .map(|capacity| Mutex::new(LruCache::new(capacity)));
        let cache = BlockCache {
            cache: lru,
            cache_hits: Default::default(),
            cache_misses: Default::default(),
        };

        Ok(StoreReader {
            decompressor: footer.decompressor,
            doc_store_version: footer.doc_store_version,
            data: block_data,
            skip_index,
            space_usage,
            cache,
        })
    }

    /// Iterates over the checkpoints of the skip index, i.e. one entry per block of the store.
    pub(crate) fn block_checkpoints(&self) -> impl Iterator<Item = Checkpoint> + '_ {
        self.skip_index.checkpoints()
    }

    /// Returns the decompressor that was declared in the footer of the store.
    pub(crate) fn decompressor(&self) -> Decompressor {
        self.decompressor
    }

    /// Returns the cache hit and miss statistics of the store reader, along with the number of
    /// blocks currently held by the cache.
    pub(crate) fn cache_stats(&self) -> CacheStats {
        self.cache.stats()
    }

    /// Looks up the checkpoint of the block that contains `doc_id`. The checkpoint can then be
    /// used to load that block.
    ///
    /// Returns an `InvalidArgument` error if the skip index has no checkpoint for `doc_id`.
    ///
    /// Advanced API. In most cases use [`get`](Self::get).
    fn block_checkpoint(&self, doc_id: DocId) -> crate::Result<Checkpoint> {
        match self.skip_index.seek(doc_id) {
            Some(checkpoint) => Ok(checkpoint),
            None => Err(crate::TantivyError::InvalidArgument(format!(
                "Failed to lookup Doc #{doc_id}."
            ))),
        }
    }

    /// Reads the bytes of the whole data section of the store (all blocks, still compressed).
    pub(crate) fn block_data(&self) -> io::Result<OwnedBytes> {
        self.data.read_bytes()
    }

    /// Reads the still-compressed bytes of the block described by `checkpoint`.
    fn get_compressed_block(&self, checkpoint: &Checkpoint) -> io::Result<OwnedBytes> {
        let block_byte_range = checkpoint.byte_range.clone();
        let compressed_slice = self.data.slice(block_byte_range);
        compressed_slice.read_bytes()
    }

    /// Returns the decompressed block described by `checkpoint`.
    ///
    /// The block is served from the cache when possible. Otherwise it is read, decompressed
    /// and inserted into the cache under the start offset of the block.
    ///
    /// Advanced API. In most cases use [`get`](Self::get).
    fn read_block(&self, checkpoint: &Checkpoint) -> io::Result<Block> {
        let block_start = checkpoint.byte_range.start;
        match self.cache.get_from_cache(block_start) {
            Some(cached_block) => Ok(cached_block),
            None => {
                let compressed = self.get_compressed_block(checkpoint)?;
                let decompressed_bytes = self.decompressor.decompress(compressed.as_ref())?;
                let block = OwnedBytes::new(decompressed_bytes);
                self.cache.put_into_cache(block_start, block.clone());
                Ok(block)
            }
        }
    }

    /// Reads and deserializes the document identified by `doc_id`.
    ///
    /// Calling `.get(doc)` is relatively costly as it may require decompressing a whole
    /// block. Decompressed blocks are kept in an LRU cache, so reading documents that live in
    /// the same block should be faster. For that reason a store reader should be kept and
    /// reused.
    ///
    /// It should not be called to score documents
    /// for instance.
    pub fn get<D: DocumentDeserialize>(&self, doc_id: DocId) -> crate::Result<D> {
        let mut raw_doc = self.get_document_bytes(doc_id)?;
        let deserializer =
            BinaryDocumentDeserializer::from_reader(&mut raw_doc, self.doc_store_version)?;
        let document = D::deserialize(deserializer)?;
        Ok(document)
    }

    /// Returns the raw (serialized) bytes of the document identified by `doc_id`.
    ///
    /// This is relatively costly as it may require decompressing a whole block. Decompressed
    /// blocks are kept in an LRU cache, so reading documents that live in the same block
    /// should be faster. For that reason a store reader should be kept and reused.
    pub fn get_document_bytes(&self, doc_id: DocId) -> crate::Result<OwnedBytes> {
        let checkpoint = self.block_checkpoint(doc_id)?;
        let decompressed_block = self.read_block(&checkpoint)?;
        Self::get_document_bytes_from_block(decompressed_block, doc_id, &checkpoint)
    }

    /// Extracts the bytes of `doc_id` from the decompressed `block` described by `checkpoint`.
    ///
    /// Advanced API.
    ///
    /// In most cases use [`get_document_bytes`](Self::get_document_bytes).
    fn get_document_bytes_from_block(
        block: OwnedBytes,
        doc_id: DocId,
        checkpoint: &Checkpoint,
    ) -> crate::Result<OwnedBytes> {
        // Documents are addressed by their rank inside the block.
        let position_in_block = doc_id - checkpoint.doc_range.start;
        block_read_index(&block, position_in_block).map(|doc_byte_range| block.slice(doc_byte_range))
    }

    /// Iterates over all the documents, in the order in which they are stored in the doc
    /// store, deserializing each of them.
    /// Use this, if you want to extract all Documents from the doc store.
    /// The `alive_bitset` has to be forwarded from the `SegmentReader` or the results may be wrong.
    pub fn iter<'a: 'b, 'b, D: DocumentDeserialize>(
        &'b self,
        alive_bitset: Option<&'a AliveBitSet>,
    ) -> impl Iterator<Item = crate::Result<D>> + 'b {
        let doc_store_version = self.doc_store_version;
        self.iter_raw(alive_bitset)
            .map(move |raw_doc_res| -> crate::Result<D> {
                let mut raw_doc = raw_doc_res?;
                let deserializer =
                    BinaryDocumentDeserializer::from_reader(&mut raw_doc, doc_store_version)?;
                let document = D::deserialize(deserializer)?;
                Ok(document)
            })
    }

    /// Iterator over all raw Documents in their order as they are stored in the doc store.
    /// Use this, if you want to extract all Documents from the doc store.
    /// The `alive_bitset` has to be forwarded from the `SegmentReader` or the results may be wrong.
    ///
    /// Doc ids from 0 up to the end of the last checkpoint are visited in order. Documents
    /// that are not alive according to `alive_bitset` are skipped; with `None` every document
    /// is returned. The first block is read when this method is called, the following ones
    /// when the iteration reaches them.
    pub(crate) fn iter_raw<'a: 'b, 'b>(
        &'b self,
        alive_bitset: Option<&'a AliveBitSet>,
    ) -> impl Iterator<Item = crate::Result<OwnedBytes>> + 'b {
        // One past the last doc id of the store, or 0 when the store has no checkpoint.
        let last_doc_id = self
            .block_checkpoints()
            .last()
            .map(|checkpoint| checkpoint.doc_range.end)
            .unwrap_or(0);
        let mut checkpoint_block_iter = self.block_checkpoints();
        let mut curr_checkpoint = checkpoint_block_iter.next();
        let mut curr_block = curr_checkpoint
            .as_ref()
            .map(|checkpoint| self.read_block(checkpoint).map_err(|e| e.kind())); // map error in order to enable cloning
        // Position of the current document inside the current block.
        let mut doc_pos = 0;
        (0..last_doc_id)
            .filter_map(move |doc_id| {
                // filter_map is only used to resolve lifetime issues between the two closures on
                // the outer variables

                // check move to next checkpoint
                // NOTE(review): the `unwrap` below panics if the checkpoints run out before
                // `last_doc_id`; this presumably cannot happen with a well-formed skip index.
                if doc_id >= curr_checkpoint.as_ref().unwrap().doc_range.end {
                    curr_checkpoint = checkpoint_block_iter.next();
                    // The block is read even if all of its documents end up being skipped.
                    curr_block = curr_checkpoint
                        .as_ref()
                        .map(|checkpoint| self.read_block(checkpoint).map_err(|e| e.kind()));
                    doc_pos = 0;
                }

                let alive = alive_bitset
                    .map(|bitset| bitset.is_alive(doc_id))
                    .unwrap_or(true);
                let res = if alive {
                    Some((curr_block.clone(), doc_pos))
                } else {
                    None
                };
                // Deleted documents still occupy a position in the block.
                doc_pos += 1;
                res
            })
            .map(move |(block, doc_pos)| {
                // Rebuild an `io::Error` from the error kind kept above.
                let block = block
                    .ok_or_else(|| {
                        DataCorruption::comment_only(
                            "the current checkpoint in the doc store iterator is none, this \
                             should never happen",
                        )
                    })?
                    .map_err(|error_kind| {
                        std::io::Error::new(error_kind, "error when reading block in doc store")
                    })?;

                let range = block_read_index(&block, doc_pos)?;
                Ok(block.slice(range))
            })
    }

    /// Summarize total space usage of this store reader.
    ///
    /// The returned value is a copy of the usage computed when the reader was opened.
    pub fn space_usage(&self) -> StoreSpaceUsage {
        self.space_usage.clone()
    }
}

fn block_read_index(block: &[u8], doc_pos: u32) -> crate::Result<Range<usize>> {
    let doc_pos = doc_pos as usize;
    let size_of_u32 = std::mem::size_of::<u32>();

    let index_len_pos = block.len() - size_of_u32;
    let index_len = u32::deserialize(&mut &block[index_len_pos..])? as usize;

    if doc_pos > index_len {
        return Err(crate::TantivyError::InternalError(
            "Attempted to read doc from wrong block".to_owned(),
        ));
    }

    let index_start = block.len() - (index_len + 1) * size_of_u32;
    let index = &block[index_start..index_start + index_len * size_of_u32];

    let start_offset = u32::deserialize(&mut &index[doc_pos * size_of_u32..])? as usize;
    let end_offset = u32::deserialize(&mut &index[(doc_pos + 1) * size_of_u32..])
        .unwrap_or(index_start as u32) as usize;
    Ok(start_offset..end_offset)
}

#[cfg(feature = "quickwit")]
impl StoreReader {
    /// Advanced API.
    ///
    /// In most cases use [`get_async`](Self::get_async)
    ///
    /// Loads and decompresses a block asynchronously. The block is served from the cache when
    /// possible; otherwise it is read asynchronously, decompressed on `executor` and inserted
    /// into the cache.
    async fn read_block_async(
        &self,
        checkpoint: &Checkpoint,
        executor: &Executor,
    ) -> io::Result<Block> {
        let cache_key = checkpoint.byte_range.start;
        if let Some(cached_block) = self.cache.get_from_cache(cache_key) {
            return Ok(cached_block);
        }

        let compressed_slice = self.data.slice(checkpoint.byte_range.clone());
        let compressed_block = compressed_slice.read_bytes_async().await?;

        // Decompression is CPU bound: run it as a blocking task of the executor.
        let decompressor = self.decompressor;
        let decompression_result = executor
            .spawn_blocking(move || decompressor.decompress(compressed_block.as_ref()))
            .await
            .expect("decompression panicked");
        let block = OwnedBytes::new(decompression_result?);

        self.cache.put_into_cache(cache_key, block.clone());

        Ok(block)
    }

    /// Reads raw bytes of a given document asynchronously.
    pub async fn get_document_bytes_async(
        &self,
        doc_id: DocId,
        executor: &Executor,
    ) -> crate::Result<OwnedBytes> {
        let checkpoint = self.block_checkpoint(doc_id)?;
        let decompressed_block = self.read_block_async(&checkpoint, executor).await?;
        Self::get_document_bytes_from_block(decompressed_block, doc_id, &checkpoint)
    }

    /// Fetches a document asynchronously. Async version of [`get`](Self::get).
    pub async fn get_async<D: DocumentDeserialize>(
        &self,
        doc_id: DocId,
        executor: &Executor,
    ) -> crate::Result<D> {
        let mut raw_doc = self.get_document_bytes_async(doc_id, executor).await?;
        let deserializer =
            BinaryDocumentDeserializer::from_reader(&mut raw_doc, self.doc_store_version)?;
        let document = D::deserialize(deserializer)?;
        Ok(document)
    }
}

#[cfg(test)]
mod tests {
    use std::path::Path;

    use super::*;
    use crate::directory::RamDirectory;
    use crate::schema::{Field, TantivyDocument, Value};
    use crate::store::tests::write_lorem_ipsum_store;
    use crate::store::Compressor;
    use crate::Directory;

    const BLOCK_SIZE: usize = 16_384;

    /// Returns the first value of `field` in `doc` as a string, if there is one.
    fn get_text_field<'a>(doc: &'a TantivyDocument, field: &'a Field) -> Option<&'a str> {
        let first_value = doc.get_first(*field)?;
        first_value.as_value().as_str()
    }

    /// Asserts the number of cached blocks and the hit/miss counters of `store`.
    fn assert_cache_state(store: &StoreReader, num_entries: usize, hits: usize, misses: usize) {
        assert_eq!(store.cache.len(), num_entries);
        let stats = store.cache_stats();
        assert_eq!(stats.cache_hits, hits);
        assert_eq!(stats.cache_misses, misses);
    }

    #[test]
    fn test_doc_store_version_ord() {
        assert!(DocStoreVersion::V1 < DocStoreVersion::V2);
    }

    /// Follows the content of the block cache while reading documents of two different blocks.
    #[test]
    fn test_store_lru_cache() -> crate::Result<()> {
        let store_path = Path::new("store");
        let ram_directory = RamDirectory::create();
        let schema = write_lorem_ipsum_store(
            ram_directory.open_write(store_path)?,
            500,
            Compressor::None,
            BLOCK_SIZE,
            true,
        );
        let title = schema.get_field("title").unwrap();
        let store =
            StoreReader::open(ram_directory.open_read(store_path)?, DOCSTORE_CACHE_CAPACITY)?;

        // Nothing has been read yet.
        assert_cache_state(&store, 0, 0, 0);

        // First read: the first block gets loaded.
        let first_doc = store.get::<TantivyDocument>(0)?;
        assert_eq!(get_text_field(&first_doc, &title), Some("Doc 0"));
        assert_cache_state(&store, 1, 0, 1);
        assert_eq!(store.cache.peek_lru(), Some(0));

        // Read from another block: a second miss, the first block is now the oldest entry.
        let last_doc = store.get::<TantivyDocument>(499)?;
        assert_eq!(get_text_field(&last_doc, &title), Some("Doc 499"));
        assert_cache_state(&store, 2, 0, 2);
        assert_eq!(store.cache.peek_lru(), Some(0));

        // Read the first block again: a hit, which makes the other block the oldest entry.
        let first_doc_again = store.get::<TantivyDocument>(0)?;
        assert_eq!(get_text_field(&first_doc_again, &title), Some("Doc 0"));
        assert_cache_state(&store, 2, 1, 2);
        assert_eq!(store.cache.peek_lru(), Some(232206));

        Ok(())
    }
}


================================================
FILE: src/store/store_compressor.rs
================================================
use std::io::Write;
use std::sync::mpsc::{sync_channel, Receiver, SyncSender};
use std::thread::JoinHandle;
use std::{io, thread};

use common::{BinarySerializable, CountingWriter, TerminatingWrite};

use super::DOC_STORE_VERSION;
use crate::directory::WritePtr;
use crate::store::footer::DocStoreFooter;
use crate::store::index::{Checkpoint, SkipIndexBuilder};
use crate::store::{Compressor, Decompressor, StoreReader};
use crate::DocId;

/// Compresses blocks of documents and writes them out, either on the calling thread or on a
/// dedicated thread depending on how it was created.
pub struct BlockCompressor(BlockCompressorVariants);

// The struct wrapping an enum is just here to keep the
// impls private.
enum BlockCompressorVariants {
    // Blocks are handled directly by the calls made on `BlockCompressor`.
    SameThread(BlockCompressorImpl),
    // Blocks are handed over to `DedicatedThreadBlockCompressorImpl`.
    DedicatedThread(DedicatedThreadBlockCompressorImpl),
}

impl BlockCompressor {
    /// Builds a block compressor writing into `wrt`.
    ///
    /// When `dedicated_thread` is `true`, a compressor thread is spawned and all
    /// of the work is forwarded to it. Otherwise everything happens on the
    /// calling thread.
    ///
    /// # Errors
    ///
    /// Returns an error if the dedicated thread could not be spawned.
    pub fn new(compressor: Compressor, wrt: WritePtr, dedicated_thread: bool) -> io::Result<Self> {
        let same_thread_impl = BlockCompressorImpl::new(compressor, wrt);
        let variant = if dedicated_thread {
            BlockCompressorVariants::DedicatedThread(DedicatedThreadBlockCompressorImpl::new(
                same_thread_impl,
            )?)
        } else {
            BlockCompressorVariants::SameThread(same_thread_impl)
        };
        Ok(BlockCompressor(variant))
    }

    /// Compresses `bytes` as one block holding `num_docs_in_block` documents
    /// and appends it to the store.
    pub fn compress_block_and_write(
        &mut self,
        bytes: &[u8],
        num_docs_in_block: u32,
    ) -> io::Result<()> {
        match &mut self.0 {
            BlockCompressorVariants::SameThread(inner) => {
                inner.compress_block_and_write(bytes, num_docs_in_block)
            }
            BlockCompressorVariants::DedicatedThread(inner) => {
                inner.compress_block_and_write(bytes, num_docs_in_block)
            }
        }
    }

    /// Appends all of the blocks of `store_reader` after the blocks written so far.
    pub fn stack_reader(&mut self, store_reader: StoreReader) -> io::Result<()> {
        match &mut self.0 {
            BlockCompressorVariants::SameThread(inner) => inner.stack(store_reader),
            BlockCompressorVariants::DedicatedThread(inner) => inner.stack_reader(store_reader),
        }
    }

    /// Finalizes the store, consuming the compressor.
    pub fn close(self) -> io::Result<()> {
        match self.0 {
            BlockCompressorVariants::SameThread(inner) => inner.close(),
            BlockCompressorVariants::DedicatedThread(inner) => inner.close(),
        }
    }
}

/// Same-thread implementation of the block compressor: compresses blocks,
/// writes them, and records one checkpoint per block.
struct BlockCompressorImpl {
    // Compression algorithm applied to every block.
    compressor: Compressor,
    // Doc id of the first document of the next block to be registered.
    first_doc_in_block: DocId,
    // Collects one checkpoint per block; serialized when the store is closed.
    offset_index_writer: SkipIndexBuilder,
    // Scratch buffer receiving the compressed bytes, reused across blocks.
    intermediary_buffer: Vec<u8>,
    // Output writer; its byte count gives the offsets stored in checkpoints.
    writer: CountingWriter<WritePtr>,
}

impl BlockCompressorImpl {
    /// Creates a compressor writing to `writer`, starting at doc id 0 with an
    /// empty skip index.
    fn new(compressor: Compressor, writer: WritePtr) -> Self {
        Self {
            compressor,
            first_doc_in_block: 0,
            offset_index_writer: SkipIndexBuilder::new(),
            intermediary_buffer: Vec::new(),
            writer: CountingWriter::wrap(writer),
        }
    }

    /// Compresses `data`, writes the compressed bytes and registers a
    /// checkpoint covering `num_docs_in_block` documents.
    ///
    /// # Panics
    ///
    /// Panics if `num_docs_in_block` is 0.
    fn compress_block_and_write(&mut self, data: &[u8], num_docs_in_block: u32) -> io::Result<()> {
        assert!(num_docs_in_block > 0);
        self.intermediary_buffer.clear();
        self.compressor
            .compress_into(data, &mut self.intermediary_buffer)?;

        // The byte range of the block is measured around the write itself.
        let start_offset = self.writer.written_bytes() as usize;
        self.writer.write_all(&self.intermediary_buffer)?;
        let end_offset = self.writer.written_bytes() as usize;

        self.register_checkpoint(Checkpoint {
            doc_range: self.first_doc_in_block..self.first_doc_in_block + num_docs_in_block,
            byte_range: start_offset..end_offset,
        });
        Ok(())
    }

    /// Records `checkpoint` in the skip index and moves the next block's first
    /// doc id to the end of the checkpoint's doc range.
    fn register_checkpoint(&mut self, checkpoint: Checkpoint) {
        // Read the end of the doc range before handing the checkpoint over,
        // so that the checkpoint can be moved instead of cloned.
        let next_first_doc = checkpoint.doc_range.end;
        self.offset_index_writer.insert(checkpoint);
        self.first_doc_in_block = next_first_doc;
    }

    /// Stacks a store reader on top of the documents written so far.
    /// This method is an optimization compared to iterating over the documents
    /// in the store and adding them one by one, as the store's data will
    /// not be decompressed and then recompressed.
    fn stack(&mut self, store_reader: StoreReader) -> io::Result<()> {
        let doc_shift = self.first_doc_in_block;
        let start_shift = self.writer.written_bytes() as usize;

        // just bulk write all of the block of the given reader.
        self.writer
            .write_all(store_reader.block_data()?.as_slice())?;

        // concatenate the index of the `store_reader`, after translating
        // its start doc id and its start file offset.
        for mut checkpoint in store_reader.block_checkpoints() {
            checkpoint.doc_range.start += doc_shift;
            checkpoint.doc_range.end += doc_shift;
            checkpoint.byte_range.start += start_shift;
            checkpoint.byte_range.end += start_shift;
            self.register_checkpoint(checkpoint);
        }
        Ok(())
    }

    /// Writes the skip index followed by the footer, then terminates the writer.
    fn close(mut self) -> io::Result<()> {
        // Offset at which the block data ends, i.e. where the skip index starts.
        let header_offset: u64 = self.writer.written_bytes();
        let docstore_footer = DocStoreFooter::new(
            header_offset,
            Decompressor::from(self.compressor),
            DOC_STORE_VERSION,
        );
        self.offset_index_writer.serialize_into(&mut self.writer)?;
        docstore_footer.serialize(&mut self.writer)?;
        self.writer.terminate()
    }
}

// ---------------------------------
/// Messages sent from the writer thread to the dedicated compressor thread.
enum BlockCompressorMessage {
    /// Compress and write one block.
    CompressBlockAndWrite {
        // Uncompressed bytes of the block.
        block_data: Vec<u8>,
        // Number of documents in the block.
        num_docs_in_block: u32,
    },
    /// Stack the blocks of an existing store reader.
    Stack(StoreReader),
}

/// Block compressor implementation that forwards all of the work to a
/// dedicated thread through a bounded channel.
struct DedicatedThreadBlockCompressorImpl {
    // Handle of the compressor thread; `None` once its result has been harvested.
    join_handle: Option<JoinHandle<io::Result<()>>>,
    // Sending end of the channel feeding the compressor thread.
    tx: SyncSender<BlockCompressorMessage>,
}

impl DedicatedThreadBlockCompressorImpl {
    fn new(mut block_compressor: BlockCompressorImpl) -> io::Result<Self> {
        let (tx, rx): (
            SyncSender<BlockCompressorMessage>,
            Receiver<BlockCompressorMessage>,
        ) = sync_channel(3);
        let join_handle = thread::Builder::new()
            .name("docstore-compressor-thread".to_string())
            .spawn(move || {
                while let Ok(packet) = rx.recv() {
                    match packet {
                        BlockCompressorMessage::CompressBlockAndWrite {
                            block_data,
                            num_docs_in_block,
                        } => {
                            block_compressor
                                .compress_block_and_write(&block_data[..], num_docs_in_block)?;
                        }
                        BlockCompressorMessage::Stack(store_reader) => {
                            block_compressor.stack(store_reader)?;
                        }
                    }
                }
                block_compressor.close()?;
                Ok(())
            })?;
        Ok(DedicatedThreadBlockCompressorImpl {
            join_handle: Some(join_handle),
            tx,
        })
    }

    fn compress_block_and_write(&mut self, bytes: &[u8], num_docs_in_block: u32) -> io::Result<()> {
        self.send(BlockCompressorMessage::CompressBlockAndWrite {
            block_data: bytes.to_vec(),
            num_docs_in_block,
        })
    }

    fn stack_reader(&mut self, store_reader: StoreReader) -> io::Result<()> {
        self.send(BlockCompressorMessage::Stack(store_reader))
    }

    fn send(&mut self, msg: BlockCompressorMessage) -> io::Result<()> {
        if self.tx.send(msg).is_err() {
            harvest_thread_result(self.join_handle.take())?;
            return Err(io::Error::other("Unidentified error."));
        }
        Ok(())
    }

    fn close(self) -> io::Result<()> {
        drop(self.tx);
        harvest_thread_result(self.join_handle)
    }
}

/// Waits for the thread to terminate and returns its result.
///
/// An explicit error is returned if the thread panicked, or if there is no
/// handle left because the result has already been harvested.
fn harvest_thread_result(join_handle_opt: Option<JoinHandle<io::Result<()>>>) -> io::Result<()> {
    let Some(join_handle) = join_handle_opt else {
        return Err(io::Error::other("Thread already joined."));
    };
    match join_handle.join() {
        Ok(thread_result) => thread_result,
        Err(_panic_payload) => Err(io::Error::other("Compressing thread panicked.")),
    }
}

#[cfg(test)]
mod tests {
    use std::io;
    use std::path::Path;

    use crate::directory::RamDirectory;
    use crate::store::store_compressor::BlockCompressor;
    use crate::store::Compressor;
    use crate::Directory;

    /// Writes two single-document blocks, then finalizes the compressor.
    fn populate_block_compressor(mut block_compressor: BlockCompressor) -> io::Result<()> {
        for block in [&b"hello"[..], &b"happy"[..]] {
            block_compressor.compress_block_and_write(block, 1)?;
        }
        block_compressor.close()
    }

    /// The dedicated-thread and same-thread implementations must produce
    /// byte-identical files.
    #[test]
    fn test_block_store_compressor_impls_yield_the_same_result() {
        let ram_directory = RamDirectory::default();
        let write_and_read_back = |file_name: &str, dedicated_thread: bool| {
            let path = Path::new(file_name);
            let wrt = ram_directory.open_write(path).unwrap();
            let block_compressor =
                BlockCompressor::new(Compressor::None, wrt, dedicated_thread).unwrap();
            populate_block_compressor(block_compressor).unwrap();
            ram_directory.open_read(path).unwrap().read_bytes().unwrap()
        };
        let dedicated_thread_bytes = write_and_read_back("path1", true);
        let same_thread_bytes = write_and_read_back("path2", false);
        assert_eq!(dedicated_thread_bytes, same_thread_bytes);
    }
}


================================================
FILE: src/store/writer.rs
================================================
use std::io;

use common::BinarySerializable;

use super::compressors::Compressor;
use super::StoreReader;
use crate::directory::WritePtr;
use crate::schema::document::{BinaryDocumentSerializer, Document};
use crate::schema::Schema;
use crate::store::store_compressor::BlockCompressor;
use crate::DocId;

/// Write tantivy's [`Store`](./index.html)
///
/// Contrary to the other components of `tantivy`,
/// the store is written to disk as documents are being added,
/// as opposed to when the segment is getting finalized.
///
/// The skip list index on the other hand, is built in memory.
pub struct StoreWriter {
    // Compression algorithm, kept so that it can be reported by `compressor()`.
    compressor: Compressor,
    // Size threshold (in bytes) above which the current block is flushed.
    block_size: usize,
    // Number of documents accumulated in the current (unflushed) block.
    num_docs_in_current_block: DocId,
    // Serialized documents of the current block, not yet compressed.
    current_block: Vec<u8>,
    // Start offset of each document within `current_block`.
    doc_pos: Vec<u32>,
    // Compresses the flushed blocks and writes them out.
    block_compressor: BlockCompressor,
}

impl StoreWriter {
    /// Creates a store writer.
    ///
    /// Blocks are compressed and written to `writer` as documents are added.
    /// If `dedicated_thread` is set, compression happens on a separate thread.
    pub fn new(
        writer: WritePtr,
        compressor: Compressor,
        block_size: usize,
        dedicated_thread: bool,
    ) -> io::Result<StoreWriter> {
        BlockCompressor::new(compressor, writer, dedicated_thread).map(|block_compressor| {
            StoreWriter {
                compressor,
                block_size,
                num_docs_in_current_block: 0,
                current_block: Vec::new(),
                doc_pos: Vec::new(),
                block_compressor,
            }
        })
    }

    /// Returns the compressor this writer was created with.
    pub(crate) fn compressor(&self) -> Compressor {
        self.compressor
    }

    /// The memory used (inclusive children): the capacity of the pending block
    /// plus the capacity of the document position index.
    pub fn mem_usage(&self) -> usize {
        let doc_pos_bytes = std::mem::size_of::<u32>() * self.doc_pos.capacity();
        self.current_block.capacity() + doc_pos_bytes
    }

    /// Flushes the current block to the compressor once its estimated size
    /// exceeds the block size.
    fn check_flush_block(&mut self) -> io::Result<()> {
        // The estimate ignores the trailing length entry of the index, which is
        // negligible in front of everything else.
        let estimated_index_len = std::mem::size_of::<usize>() * self.doc_pos.len();
        let estimated_block_len = self.current_block.len() + estimated_index_len;
        if estimated_block_len <= self.block_size {
            return Ok(());
        }
        self.send_current_block_to_compressor()
    }

    /// Appends the document position index to the current uncompressed block
    /// and hands the block to the compressor. Does nothing on an empty block.
    fn send_current_block_to_compressor(&mut self) -> io::Result<()> {
        if self.current_block.is_empty() {
            return Ok(());
        }

        // Block trailer: one u32 per document position, followed by their count.
        let trailer_len = (self.doc_pos.len() + 1) * std::mem::size_of::<u32>();
        self.current_block.reserve(trailer_len);
        for doc_start in &self.doc_pos {
            doc_start.serialize(&mut self.current_block)?;
        }
        let num_positions = self.doc_pos.len() as u32;
        num_positions.serialize(&mut self.current_block)?;

        self.block_compressor
            .compress_block_and_write(&self.current_block, self.num_docs_in_current_block)?;

        // Reset the state for the next block.
        self.num_docs_in_current_block = 0;
        self.current_block.clear();
        self.doc_pos.clear();
        Ok(())
    }

    /// Stores a new document.
    ///
    /// The document id is implicitly the current number
    /// of documents.
    pub fn store<D: Document>(&mut self, document: &D, schema: &Schema) -> io::Result<()> {
        let doc_start = self.current_block.len() as u32;
        self.doc_pos.push(doc_start);

        let mut doc_serializer = BinaryDocumentSerializer::new(&mut self.current_block, schema);
        doc_serializer.serialize_doc(document)?;

        self.num_docs_in_current_block += 1;
        self.check_flush_block()
    }

    /// Stores the bytes of an already serialized document.
    ///
    /// The document id is implicitly the current number
    /// of documents.
    pub fn store_bytes(&mut self, serialized_document: &[u8]) -> io::Result<()> {
        let doc_start = self.current_block.len() as u32;
        self.doc_pos.push(doc_start);
        self.current_block.extend_from_slice(serialized_document);
        self.num_docs_in_current_block += 1;
        self.check_flush_block()
    }

    /// Stacks a store reader on top of the documents written so far.
    /// This method is an optimization compared to iterating over the documents
    /// in the store and adding them one by one, as the store's data will
    /// not be decompressed and then recompressed.
    pub fn stack(&mut self, store_reader: StoreReader) -> io::Result<()> {
        // The pending block has to go out first so that document order is kept.
        self.send_current_block_to_compressor()?;
        self.block_compressor.stack_reader(store_reader)
    }

    /// Finalizes the store writer.
    ///
    /// Sends the last unfinished block, if any, to the compressor
    /// and closes the block compressor.
    pub fn close(mut self) -> io::Result<()> {
        self.send_current_block_to_compressor()?;
        self.block_compressor.close()
    }
}


================================================
FILE: src/termdict/fst_termdict/merger.rs
================================================
use tantivy_fst::map::{OpBuilder, Union};
use tantivy_fst::raw::IndexedValue;
use tantivy_fst::Streamer;

use super::termdict::TermDictionary;
use crate::postings::TermInfo;
use crate::termdict::{TermOrdinal, TermStreamer};

/// Given a list of sorted term streams,
/// returns an iterator over sorted unique terms.
///
/// The item yielded is actually a pair with
/// - the term
/// - a slice with the ordinal of the segments containing the term.
pub struct TermMerger<'a> {
    // Dictionary behind each input stream, indexed by segment ordinal.
    dictionaries: Vec<&'a TermDictionary>,
    // Union of the input streams.
    union: Union<'a>,
    // Copy of the term the merger is currently positioned on.
    current_key: Vec<u8>,
    // (segment ordinal, term ordinal) pairs for the current term,
    // sorted by segment ordinal.
    current_segment_and_term_ordinals: Vec<IndexedValue>,
}

impl<'a> TermMerger<'a> {
    /// Stream of merged term dictionary
    pub fn new(streams: Vec<TermStreamer<'a>>) -> TermMerger<'a> {
        let mut op_builder = OpBuilder::new();
        let mut dictionaries = vec![];
        for streamer in streams {
            op_builder.push(streamer.stream);
            dictionaries.push(streamer.fst_map);
        }
        TermMerger {
            dictionaries,
            union: op_builder.union(),
            current_key: vec![],
            current_segment_and_term_ordinals: vec![],
        }
    }

    /// Iterator over `(segment ordinal, TermOrdinal)` pairs sorted by segment ordinal
    ///
    /// This method may be called
    /// if [`Self::advance`] has been called before
    /// and `true` was returned.
    pub fn matching_segments<'b: 'a>(&'b self) -> impl 'b + Iterator<Item = (usize, TermOrdinal)> {
        self.current_segment_and_term_ordinals
            .iter()
            .map(|iv| (iv.index, iv.value))
    }

    /// Advance the term iterator to the next term.
    /// Returns `true` if there is indeed another term
    /// `false` if there is none.
    pub fn advance(&mut self) -> bool {
        let (key, values) = if let Some((key, values)) = self.union.next() {
            (key, values)
        } else {
            return false;
        };
        self.current_key.clear();
        self.current_key.extend_from_slice(key);
        self.current_segment_and_term_ordinals.clear();
        self.current_segment_and_term_ordinals
            .extend_from_slice(values);
        self.current_segment_and_term_ordinals
            .sort_by_key(|iv| iv.index);
        true
    }

    /// Returns the current term.
    ///
    /// This method may be called if [`Self::advance`] has been called before
    /// and `true` was returned.
    pub fn key(&self) -> &[u8] {
        &self.current_key
    }

    /// Iterator over `(segment ordinal, TermInfo)` pairs sorted by the ordinal.
    ///
    /// This method may be called if [`Self::advance`] has been called before
    /// and `true` was returned.
    pub fn current_segment_ords_and_term_infos<'b: 'a>(
        &'b self,
    ) -> impl 'b + Iterator<Item = (usize, TermInfo)> {
        self.current_segment_and_term_ordinals
            .iter()
            .map(move |iv| {
                (
                    iv.index,
                    self.dictionaries[iv.index].term_info_from_ord(iv.value),
                )
            })
    }
}

#[cfg(all(test, feature = "unstable"))]
mod bench {
    // `rng()` and `random_range` are the rand 0.9 API, in which the
    // `distributions` module is named `distr`.
    use rand::distr::Alphanumeric;
    use rand::{rng, Rng};
    use test::{self, Bencher};

    use super::TermMerger;
    use crate::directory::FileSlice;
    use crate::postings::TermInfo;
    use crate::termdict::{TermDictionary, TermDictionaryBuilder};

    /// Builds a deterministic `TermInfo` for the given term ordinal.
    fn make_term_info(term_ord: u64) -> TermInfo {
        let offset = |term_ord: u64| (term_ord * 100 + term_ord * term_ord) as usize;
        TermInfo {
            doc_freq: term_ord as u32,
            postings_range: offset(term_ord)..offset(term_ord + 1),
            positions_range: offset(term_ord)..offset(term_ord + 1),
        }
    }

    /// Create a dictionary of random strings.
    fn rand_dict(num_terms: usize) -> std::io::Result<TermDictionary> {
        let buffer: Vec<u8> = {
            let mut terms = vec![];
            for _i in 0..num_terms {
                let rand_string: String = rng()
                    .sample_iter(&Alphanumeric)
                    .take(rng().random_range(30..42))
                    .map(char::from)
                    .collect();
                terms.push(rand_string);
            }
            // The dictionary builder is fed the terms in sorted order.
            terms.sort();

            let mut term_dictionary_builder = TermDictionaryBuilder::create(Vec::new())?;
            for (term_ord, term) in terms.iter().enumerate() {
                term_dictionary_builder
                    .insert(term.as_bytes(), &make_term_info(term_ord as u64))?;
            }
            term_dictionary_builder.finish()?
        };
        let file = FileSlice::from(buffer);
        TermDictionary::open(file)
    }

    /// Measures a full merge of two dictionaries of 100k random terms each.
    #[bench]
    fn bench_termmerger(b: &mut Bencher) -> crate::Result<()> {
        let dict1 = rand_dict(100_000)?;
        let dict2 = rand_dict(100_000)?;
        b.iter(|| -> crate::Result<u32> {
            let stream1 = dict1.stream()?;
            let stream2 = dict2.stream()?;
            let mut merger = TermMerger::new(vec![stream1, stream2]);
            let mut count = 0;
            while merger.advance() {
                count += 1;
            }
            Ok(count)
        });
        Ok(())
    }
}


================================================
FILE: src/termdict/fst_termdict/mod.rs
================================================
//! The term dictionary's main role is to associate the sorted [`Term`](crate::Term)s with
//! a [`TermInfo`](crate::postings::TermInfo) struct that contains some meta-information
//! about the term.
//!
//! Internally, the term dictionary relies on the `fst` crate to store
//! a sorted mapping that associates each term to its rank in the lexicographical order.
//! For instance, in a dictionary containing the sorted terms "abba", "bjork", "blur" and "donovan",
//! the `TermOrdinal` are respectively `0`, `1`, `2`, and `3`.
//!
//! For `u64`-terms, tantivy explicitly uses a `BigEndian` representation to ensure that the
//! lexicographical order matches the natural order of integers.
//!
//! `i64`-terms are transformed to `u64` using a continuous mapping `val ⟶ val - i64::MIN`
//! and then treated as a `u64`.
//!
//! `f64`-terms are transformed to `u64` using a mapping that preserves order, and are then treated
//! as `u64`.
//!
//! A second data structure makes it possible to access a
//! [`TermInfo`](crate::postings::TermInfo).
mod merger;
mod streamer;
mod term_info_store;
mod termdict;

pub use self::merger::TermMerger;
pub use self::streamer::{TermStreamer, TermStreamerBuilder};
pub use self::termdict::{TermDictionary, TermDictionaryBuilder};


================================================
FILE: src/termdict/fst_termdict/streamer.rs
================================================
use std::io;

use tantivy_fst::automaton::AlwaysMatch;
use tantivy_fst::map::{Stream, StreamBuilder};
use tantivy_fst::{Automaton, IntoStreamer, Streamer};

use super::TermDictionary;
use crate::postings::TermInfo;
use crate::termdict::TermOrdinal;

/// `TermStreamerBuilder` is a helper object used to define
/// a range of terms that should be streamed.
pub struct TermStreamerBuilder<'a, A = AlwaysMatch>
where A: Automaton
{
    // Term dictionary the stream is built on; handed over to the `TermStreamer`.
    fst_map: &'a TermDictionary,
    // Underlying fst stream builder, on which the bounds are applied.
    stream_builder: StreamBuilder<'a, A>,
}

impl<'a, A> TermStreamerBuilder<'a, A>
where A: Automaton
{
    /// Wraps an fst stream builder together with the dictionary it streams over.
    pub(crate) fn new(fst_map: &'a TermDictionary, stream_builder: StreamBuilder<'a, A>) -> Self {
        Self {
            fst_map,
            stream_builder,
        }
    }

    /// Rebuilds `self` with its stream builder replaced by `transform(stream_builder)`.
    fn map_stream_builder(
        self,
        transform: impl FnOnce(StreamBuilder<'a, A>) -> StreamBuilder<'a, A>,
    ) -> Self {
        let Self {
            fst_map,
            stream_builder,
        } = self;
        Self {
            fst_map,
            stream_builder: transform(stream_builder),
        }
    }

    /// Limit the range to terms greater or equal to the bound
    pub fn ge<T: AsRef<[u8]>>(self, bound: T) -> Self {
        self.map_stream_builder(|builder| builder.ge(bound))
    }

    /// Limit the range to terms strictly greater than the bound
    pub fn gt<T: AsRef<[u8]>>(self, bound: T) -> Self {
        self.map_stream_builder(|builder| builder.gt(bound))
    }

    /// Limit the range to terms lesser or equal to the bound
    pub fn le<T: AsRef<[u8]>>(self, bound: T) -> Self {
        self.map_stream_builder(|builder| builder.le(bound))
    }

    /// Limit the range to terms strictly lesser than the bound
    pub fn lt<T: AsRef<[u8]>>(self, bound: T) -> Self {
        self.map_stream_builder(|builder| builder.lt(bound))
    }

    /// Iterate over the range backwards.
    pub fn backward(self) -> Self {
        self.map_stream_builder(|builder| builder.backward())
    }

    /// Creates the stream corresponding to the range
    /// of terms defined using the `TermStreamerBuilder`.
    ///
    /// The returned streamer is not positioned on any term until
    /// `.advance()` is called.
    pub fn into_stream(self) -> io::Result<TermStreamer<'a, A>> {
        let Self {
            fst_map,
            stream_builder,
        } = self;
        Ok(TermStreamer {
            fst_map,
            stream: stream_builder.into_stream(),
            term_ord: 0u64,
            current_key: Vec::with_capacity(100),
            current_value: TermInfo::default(),
        })
    }
}

/// `TermStreamer` acts as a cursor over a range of terms of a segment.
/// Terms are guaranteed to be sorted.
pub struct TermStreamer<'a, A = AlwaysMatch>
where A: Automaton
{
    // Term dictionary used to resolve a term ordinal into its `TermInfo`.
    pub(crate) fst_map: &'a TermDictionary,
    // Underlying fst stream yielding (term, term ordinal) pairs.
    pub(crate) stream: Stream<'a, A>,
    // Ordinal of the current term.
    term_ord: TermOrdinal,
    // Copy of the current term bytes.
    current_key: Vec<u8>,
    // `TermInfo` of the current term.
    current_value: TermInfo,
}

impl<A> TermStreamer<'_, A>
where A: Automaton
{
    /// Moves the stream to the next term.
    ///
    /// Returns `true` if the stream is now positioned on a term, and `false`
    /// if the end of the stream was reached, in which case the current key,
    /// ordinal and value are left untouched.
    ///
    /// Before the first call to `.advance()`, the stream is not positioned
    /// on any term.
    pub fn advance(&mut self) -> bool {
        let Some((term, term_ord)) = self.stream.next() else {
            return false;
        };
        self.current_key.clear();
        self.current_key.extend_from_slice(term);
        self.term_ord = term_ord;
        self.current_value = self.fst_map.term_info_from_ord(term_ord);
        true
    }

    /// Returns the `TermOrdinal` of the current term.
    ///
    /// The value is only meaningful once `.advance()` has returned `true`;
    /// before that, it is `0`.
    pub fn term_ord(&self) -> TermOrdinal {
        self.term_ord
    }

    /// Accesses the current key.
    ///
    /// `.key()` returns the key the stream was positioned on by the last
    /// successful call to `.advance()` (or `.next()`).
    ///
    /// Once the end of the stream has been reached, `.key()` remains
    /// the last key encountered.
    ///
    /// Before the stream has been advanced, `.key()` returns an empty slice.
    pub fn key(&self) -> &[u8] {
        self.current_key.as_slice()
    }

    /// Accesses the current value.
    ///
    /// Calling `.value()` after the end of the stream will return the
    /// last `.value()` encountered.
    ///
    /// Calling `.value()` before the first call to `.advance()` returns
    /// `TermInfo::default()`.
    pub fn value(&self) -> &TermInfo {
        &self.current_value
    }

    /// Return the next `(key, value)` pair.
    #[expect(clippy::should_implement_trait)]
    pub fn next(&mut self) -> Option<(&[u8], &TermInfo)> {
        if !self.advance() {
            return None;
        }
        Some((self.key(), self.value()))
    }
}


================================================
FILE: src/termdict/fst_termdict/term_info_store.rs
================================================
use std::cmp;
use std::io::{self, Read, Write};

use byteorder::{ByteOrder, LittleEndian};
use common::{BinarySerializable, FixedSize};
use tantivy_bitpacker::{compute_num_bits, BitPacker};

use crate::directory::{FileSlice, OwnedBytes};
use crate::postings::TermInfo;
use crate::termdict::TermOrdinal;

/// Number of term infos per block: the block of a term is `term_ord / BLOCK_LEN`.
const BLOCK_LEN: usize = 256;

/// Metadata of one block of term infos.
///
/// The first term info of the block is stored as is (`ref_term_info`); the
/// other ones are bitpacked, using the bit widths recorded here.
#[derive(Debug, Eq, PartialEq, Default)]
struct TermInfoBlockMeta {
    // Byte offset of the block's bitpacked data within the term info bytes.
    offset: u64,
    // First term info of the block; its range starts are the base of the
    // offsets bitpacked for the rest of the block.
    ref_term_info: TermInfo,
    // Bit width of the bitpacked doc frequencies.
    doc_freq_nbits: u8,
    // Bit width of the bitpacked postings offsets.
    postings_offset_nbits: u8,
    // Bit width of the bitpacked positions offsets.
    positions_offset_nbits: u8,
}

impl BinarySerializable for TermInfoBlockMeta {
    /// Writes the offset, the reference term info, then the three bit widths
    /// (doc freq, postings offset, positions offset) as one byte each.
    fn serialize<W: Write + ?Sized>(&self, write: &mut W) -> io::Result<()> {
        self.offset.serialize(write)?;
        self.ref_term_info.serialize(write)?;
        let nbits = [
            self.doc_freq_nbits,
            self.postings_offset_nbits,
            self.positions_offset_nbits,
        ];
        write.write_all(&nbits)
    }

    /// Reads back what `serialize` wrote, in the same order.
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        let offset = u64::deserialize(reader)?;
        let ref_term_info = TermInfo::deserialize(reader)?;
        let mut nbits = [0u8; 3];
        reader.read_exact(&mut nbits)?;
        let [doc_freq_nbits, postings_offset_nbits, positions_offset_nbits] = nbits;
        Ok(TermInfoBlockMeta {
            offset,
            ref_term_info,
            doc_freq_nbits,
            postings_offset_nbits,
            positions_offset_nbits,
        })
    }
}

impl FixedSize for TermInfoBlockMeta {
    // The `u64` offset, the reference term info, and one byte for each of
    // the three bit widths.
    const SIZE_IN_BYTES: usize = u64::SIZE_IN_BYTES + TermInfo::SIZE_IN_BYTES + 3;
}

impl TermInfoBlockMeta {
    /// Number of bits taken by one bitpacked term info.
    fn num_bits(&self) -> u8 {
        self.doc_freq_nbits + self.postings_offset_nbits + self.positions_offset_nbits
    }

    /// Decodes one bitpacked term info of the block.
    ///
    /// `inner_offset` is the offset within the block, WITHOUT the first term info:
    /// term info #1, #2, #3 get `inner_offset` 0, 1, 2..., while term info #0
    /// is encoded without bitpacking.
    ///
    /// Each record is laid out as postings start, positions start, doc freq.
    /// The end of a range is read from the start stored in the following record.
    ///
    /// # Panics
    ///
    /// Panics if `inner_offset >= BLOCK_LEN - 1`.
    fn deserialize_term_info(&self, data: &[u8], inner_offset: usize) -> TermInfo {
        assert!(inner_offset < BLOCK_LEN - 1);
        let record_nbits = self.num_bits() as usize;
        let postings_nbits = self.postings_offset_nbits;
        let positions_nbits = self.positions_offset_nbits;

        // Bit addresses of the fields of this record...
        let postings_start_addr = record_nbits * inner_offset;
        let positions_start_addr = postings_start_addr + postings_nbits as usize;
        let doc_freq_addr = positions_start_addr + positions_nbits as usize;
        // ... and of the starts of the next record, which are the ends of this one.
        let postings_end_addr = postings_start_addr + record_nbits;
        let positions_end_addr = positions_start_addr + record_nbits;

        // Stored offsets are relative to the range starts of the reference term info.
        let postings_base = self.ref_term_info.postings_range.start;
        let positions_base = self.ref_term_info.positions_range.start;

        let postings_start =
            postings_base + extract_bits(data, postings_start_addr, postings_nbits) as usize;
        let postings_end =
            postings_base + extract_bits(data, postings_end_addr, postings_nbits) as usize;
        let positions_start =
            positions_base + extract_bits(data, positions_start_addr, positions_nbits) as usize;
        let positions_end =
            positions_base + extract_bits(data, positions_end_addr, positions_nbits) as usize;
        let doc_freq = extract_bits(data, doc_freq_addr, self.doc_freq_nbits) as u32;

        TermInfo {
            doc_freq,
            postings_range: postings_start..postings_end,
            positions_range: positions_start..positions_end,
        }
    }
}

/// Read-only store giving access to the `TermInfo` of a term from its ordinal.
#[derive(Clone)]
pub struct TermInfoStore {
    // Number of terms, as read from the header of the file.
    num_terms: usize,
    // Serialized `TermInfoBlockMeta`s, one fixed-size entry per block.
    block_meta_bytes: OwnedBytes,
    // Bitpacked term infos of all of the blocks.
    term_info_bytes: OwnedBytes,
}

/// Reads the `num_bits`-wide little-endian value starting at bit `addr_bits` of `data`.
///
/// Bytes past the end of `data` are treated as zeros.
///
/// # Panics
///
/// Panics if `num_bits > 56`, or if the byte containing `addr_bits` lies
/// beyond the end of `data`.
fn extract_bits(data: &[u8], addr_bits: usize, num_bits: u8) -> u64 {
    // With at most 7 bits of shift, 56 bits always fit in a single 8-byte word.
    assert!(num_bits <= 56);
    let first_byte = addr_bits / 8;
    let shift_in_byte = (addr_bits % 8) as u64;
    let tail = &data[first_byte..];
    let word = match tail.get(..8) {
        Some(eight_bytes) => LittleEndian::read_u64(eight_bytes),
        None => {
            // Fewer than 8 bytes are left: copy them into a zero-padded buffer.
            let mut padded = [0u8; 8];
            padded[..tail.len()].copy_from_slice(tail);
            LittleEndian::read_u64(&padded)
        }
    };
    let mask = (1u64 << u64::from(num_bits)) - 1;
    (word >> shift_in_byte) & mask
}

impl TermInfoStore {
    /// Opens a term info store.
    ///
    /// The file starts with a 16-byte header made of two `u64`: the length in
    /// bytes of the block metadata section, and the number of terms. The block
    /// metadata follows, and the bitpacked term infos come last.
    pub fn open(term_info_store_file: FileSlice) -> io::Result<TermInfoStore> {
        let (header_slice, body_slice) = term_info_store_file.split(16);
        let mut header_bytes = header_slice.read_bytes()?;
        let block_meta_len = u64::deserialize(&mut header_bytes)? as usize;
        let num_terms = u64::deserialize(&mut header_bytes)? as usize;

        let (block_meta_slice, term_info_slice) = body_slice.split(block_meta_len);
        let term_info_bytes = term_info_slice.read_bytes()?;
        let block_meta_bytes = block_meta_slice.read_bytes()?;
        Ok(TermInfoStore {
            num_terms,
            block_meta_bytes,
            term_info_bytes,
        })
    }

    /// Returns the `TermInfo` associated with the term ordinal `term_ord`.
    ///
    /// # Panics
    ///
    /// Panics if the metadata of the block cannot be deserialized.
    pub fn get(&self, term_ord: TermOrdinal) -> TermInfo {
        let term_ord = term_ord as usize;
        let (block_id, inner_offset) = (term_ord / BLOCK_LEN, term_ord % BLOCK_LEN);

        let meta_start = block_id * TermInfoBlockMeta::SIZE_IN_BYTES;
        let mut meta_cursor: &[u8] = &self.block_meta_bytes.as_slice()[meta_start..];
        let block_meta = TermInfoBlockMeta::deserialize(&mut meta_cursor)
            .expect("Failed to deserialize terminfoblockmeta");

        match inner_offset.checked_sub(1) {
            // The first term info of a block is stored as is in the block metadata.
            None => block_meta.ref_term_info,
            // The other ones are bitpacked, starting at the offset of the block.
            Some(packed_offset) => {
                let packed_data = &self.term_info_bytes.as_slice()[block_meta.offset as usize..];
                block_meta.deserialize_term_info(packed_data, packed_offset)
            }
        }
    }

    /// Returns the number of terms in the store.
    pub fn num_terms(&self) -> usize {
        self.num_terms
    }
}

/// Builds the serialized form of a term info store, block by block.
pub struct TermInfoStoreWriter {
    // Serialized block metadata — presumably one entry appended per flushed
    // block; confirm against the flush logic.
    buffer_block_metas: Vec<u8>,
    // Serialized bitpacked term infos.
    buffer_term_infos: Vec<u8>,
    // Term infos of the block being built (capacity of `BLOCK_LEN`).
    term_infos: Vec<TermInfo>,
    // Term counter, starting at 0.
    num_terms: u64,
}

/// Bit-packs one `TermInfo` of a block into `write`.
///
/// Three values are emitted, in this order: the postings start offset, the
/// positions start offset and the doc frequency. Each one uses the bit width
/// recorded for it in `term_info_block_meta`.
fn bitpack_serialize<W: Write>(
    write: &mut W,
    bit_packer: &mut BitPacker,
    term_info_block_meta: &TermInfoBlockMeta,
    term_info: &TermInfo,
) -> io::Result<()> {
    let fields = [
        (
            term_info.postings_range.start as u64,
            term_info_block_meta.postings_offset_nbits,
        ),
        (
            term_info.positions_range.start as u64,
            term_info_block_meta.positions_offset_nbits,
        ),
        (
            u64::from(term_info.doc_freq),
            term_info_block_meta.doc_freq_nbits,
        ),
    ];
    for (value, num_bits) in fields {
        bit_packer.write(value, num_bits, write)?;
    }
    Ok(())
}

impl TermInfoStoreWriter {
    /// Creates an empty writer.
    pub fn new() -> TermInfoStoreWriter {
        TermInfoStoreWriter {
            buffer_block_metas: Vec::new(),
            buffer_term_infos: Vec::new(),
            term_infos: Vec::with_capacity(BLOCK_LEN),
            num_terms: 0u64,
        }
    }

    /// Encodes the pending term infos as one block and clears the pending list.
    ///
    /// The first term info of the block is stored verbatim in the block metadata.
    /// The following ones are bit-packed, with their start offsets expressed
    /// relative to the first one. Does nothing if no term info is pending.
    fn flush_block(&mut self) -> io::Result<()> {
        // Check for emptiness *before* touching any element: indexing
        // `self.term_infos[0]` first would panic on an empty buffer and make
        // the early return unreachable.
        let (ref_term_info, last_term_info) =
            match (self.term_infos.first(), self.term_infos.last()) {
                (Some(first), Some(last)) => (first.clone(), last.clone()),
                _ => return Ok(()),
            };
        let mut bit_packer = BitPacker::new();

        let postings_end_offset =
            last_term_info.postings_range.end - ref_term_info.postings_range.start;
        let positions_end_offset =
            last_term_info.positions_range.end - ref_term_info.positions_range.start;
        // Rebase the start offsets on the reference term info so that they fit
        // in fewer bits.
        for term_info in &mut self.term_infos[1..] {
            term_info.postings_range.start -= ref_term_info.postings_range.start;
            term_info.positions_range.start -= ref_term_info.positions_range.start;
        }

        // The reference term info is not bit-packed, so it does not take part
        // in the doc freq bit width computation.
        let max_doc_freq: u32 = self.term_infos[1..]
            .iter()
            .fold(0u32, |acc, term_info| cmp::max(acc, term_info.doc_freq));

        // The end offsets are the largest offsets of the block, so their bit
        // widths are sufficient for every start offset too.
        let max_doc_freq_nbits: u8 = compute_num_bits(u64::from(max_doc_freq));
        let max_postings_offset_nbits = compute_num_bits(postings_end_offset as u64);
        let max_positions_offset_nbits = compute_num_bits(positions_end_offset as u64);

        let term_info_block_meta = TermInfoBlockMeta {
            offset: self.buffer_term_infos.len() as u64,
            ref_term_info,
            doc_freq_nbits: max_doc_freq_nbits,
            postings_offset_nbits: max_postings_offset_nbits,
            positions_offset_nbits: max_positions_offset_nbits,
        };

        term_info_block_meta.serialize(&mut self.buffer_block_metas)?;
        for term_info in &self.term_infos[1..] {
            bitpack_serialize(
                &mut self.buffer_term_infos,
                &mut bit_packer,
                &term_info_block_meta,
                term_info,
            )?;
        }

        // We still need to serialize the end offset for postings & positions.
        bit_packer.write(
            postings_end_offset as u64,
            term_info_block_meta.postings_offset_nbits,
            &mut self.buffer_term_infos,
        )?;
        bit_packer.write(
            positions_end_offset as u64,
            term_info_block_meta.positions_offset_nbits,
            &mut self.buffer_term_infos,
        )?;

        // A block needs to end on a byte boundary.
        bit_packer.flush(&mut self.buffer_term_infos)?;
        self.term_infos.clear();

        Ok(())
    }

    /// Appends a term info, flushing a block once `BLOCK_LEN` term infos are pending.
    pub fn write_term_info(&mut self, term_info: &TermInfo) -> io::Result<()> {
        self.num_terms += 1u64;
        self.term_infos.push(term_info.clone());
        if self.term_infos.len() >= BLOCK_LEN {
            self.flush_block()?;
        }
        Ok(())
    }

    /// Flushes the pending block (if any) and writes the whole store to `write`.
    ///
    /// The output is, in order: the byte length of the block-meta section (`u64`),
    /// the number of terms (`u64`), the block metadata, and the bit-packed term
    /// infos.
    pub fn serialize<W: io::Write + ?Sized>(&mut self, write: &mut W) -> io::Result<()> {
        if !self.term_infos.is_empty() {
            self.flush_block()?;
        }
        let len = self.buffer_block_metas.len() as u64;
        len.serialize(write)?;
        self.num_terms.serialize(write)?;
        write.write_all(&self.buffer_block_metas)?;
        write.write_all(&self.buffer_term_infos)?;
        Ok(())
    }
}

#[cfg(test)]
mod tests {

    use common::BinarySerializable;
    use tantivy_bitpacker::{compute_num_bits, BitPacker};

    use super::{extract_bits, TermInfoBlockMeta, TermInfoStore, TermInfoStoreWriter};
    use crate::directory::FileSlice;
    use crate::postings::TermInfo;

    /// Runs the crate's shared fixed-size check on `TermInfoBlockMeta`.
    #[test]
    fn test_term_info_block() {
        crate::tests::fixed_size_test::<TermInfoBlockMeta>();
    }

    /// Values written with `BitPacker` must be readable with `extract_bits`
    /// at the matching bit addresses.
    #[test]
    fn test_bitpacked() {
        let mut buffer = Vec::new();
        let mut bitpack = BitPacker::new();
        bitpack.write(321u64, 9, &mut buffer).unwrap();
        assert_eq!(compute_num_bits(321u64), 9);
        bitpack.write(2u64, 2, &mut buffer).unwrap();
        assert_eq!(compute_num_bits(2u64), 2);
        bitpack.write(51, 6, &mut buffer).unwrap();
        assert_eq!(compute_num_bits(51), 6);
        bitpack.close(&mut buffer).unwrap();
        // 9 + 2 + 6 = 17 bits, which rounds up to 3 bytes.
        assert_eq!(buffer.len(), 3);
        assert_eq!(extract_bits(&buffer[..], 0, 9), 321u64);
        assert_eq!(extract_bits(&buffer[..], 9, 2), 2u64);
        assert_eq!(extract_bits(&buffer[..], 11, 6), 51u64);
    }

    /// `TermInfoBlockMeta` must survive a serialize / deserialize round trip.
    #[test]
    fn test_term_info_block_meta_serialization() {
        let term_info_block_meta = TermInfoBlockMeta {
            offset: 2009u64,
            ref_term_info: TermInfo {
                doc_freq: 512,
                postings_range: 51..57,
                positions_range: 110..134,
            },
            doc_freq_nbits: 10,
            postings_offset_nbits: 5,
            positions_offset_nbits: 8,
        };
        let mut buffer: Vec<u8> = Vec::new();
        term_info_block_meta.serialize(&mut buffer).unwrap();
        let mut cursor: &[u8] = &buffer[..];
        let term_info_block_meta_serde = TermInfoBlockMeta::deserialize(&mut cursor).unwrap();
        assert_eq!(term_info_block_meta_serde, term_info_block_meta);
    }

    /// Writes 1000 term infos with contiguous ranges, then checks that every
    /// one of them is read back unchanged from the store.
    #[test]
    fn test_pack() -> crate::Result<()> {
        let mut store_writer = TermInfoStoreWriter::new();
        let mut term_infos = vec![];
        // Strictly increasing offsets, so that consecutive ranges are contiguous.
        let offset = |i| i * 13 + i * i;
        for i in 0usize..1000usize {
            let term_info = TermInfo {
                doc_freq: i as u32,
                postings_range: offset(i)..offset(i + 1),
                positions_range: offset(i) * 3..offset(i + 1) * 3,
            };
            store_writer.write_term_info(&term_info)?;
            term_infos.push(term_info);
        }
        let mut buffer = Vec::new();
        store_writer.serialize(&mut buffer)?;
        let term_info_store = TermInfoStore::open(FileSlice::from(buffer))?;
        for i in 0..1000 {
            assert_eq!(
                term_info_store.get(i as u64),
                term_infos[i],
                "term info {i}"
            );
        }
        Ok(())
    }
}


================================================
FILE: src/termdict/fst_termdict/termdict.rs
================================================
use std::io::{self, Write};
use std::sync::Arc;

use common::{BinarySerializable, CountingWriter};
use once_cell::sync::Lazy;
use tantivy_fst::raw::Fst;
use tantivy_fst::Automaton;

use super::term_info_store::{TermInfoStore, TermInfoStoreWriter};
use super::{TermStreamer, TermStreamerBuilder};
use crate::directory::{FileSlice, OwnedBytes};
use crate::postings::TermInfo;
use crate::termdict::TermOrdinal;

/// Wraps a `tantivy_fst::Error` into an `io::Error` (via `io::Error::other`),
/// so that it can be propagated with `?` from functions returning `io::Result`.
fn convert_fst_error(e: tantivy_fst::Error) -> io::Error {
    io::Error::other(e)
}

/// Format version of the FST term dictionary.
///
/// It is written as the last `u32` by `TermDictionaryBuilder::finish` and
/// checked by `TermDictionary::open`.
const FST_VERSION: u32 = 1;

/// Builder for the new term dictionary.
///
/// Inserting must be done in the order of the `keys`.
pub struct TermDictionaryBuilder<W> {
    /// FST builder mapping each key to its term ordinal.
    fst_builder: tantivy_fst::MapBuilder<W>,
    /// Accumulates the `TermInfo` of each inserted term, in insertion order.
    term_info_store_writer: TermInfoStoreWriter,
    /// Ordinal that will be assigned to the next inserted key.
    term_ord: u64,
}

impl<W> TermDictionaryBuilder<W>
where W: Write
{
    /// Creates a new `TermDictionaryBuilder` writing into `w`.
    pub fn create(w: W) -> io::Result<Self> {
        tantivy_fst::MapBuilder::new(w)
            .map(|fst_builder| TermDictionaryBuilder {
                fst_builder,
                term_info_store_writer: TermInfoStoreWriter::new(),
                term_ord: 0,
            })
            .map_err(convert_fst_error)
    }

    /// Inserts a `(key, value)` pair in the term dictionary.
    ///
    /// *Keys have to be inserted in order.*
    pub fn insert<K: AsRef<[u8]>>(&mut self, key_ref: K, value: &TermInfo) -> io::Result<()> {
        self.insert_key(key_ref.as_ref())?;
        self.insert_value(value)
    }

    /// # Warning
    /// Horribly dangerous internal API
    ///
    /// If used, it must be used by systematically alternating calls
    /// to insert_key and insert_value.
    ///
    /// Prefer using `.insert(key, value)`
    pub fn insert_key(&mut self, key: &[u8]) -> io::Result<()> {
        let ord = self.term_ord;
        self.fst_builder
            .insert(key, ord)
            .map_err(convert_fst_error)?;
        // The ordinal only advances once the key has been accepted by the FST.
        self.term_ord = ord + 1;
        Ok(())
    }

    /// # Warning
    ///
    /// Horribly dangerous internal API. See `.insert_key(...)`.
    pub fn insert_value(&mut self, term_info: &TermInfo) -> io::Result<()> {
        self.term_info_store_writer.write_term_info(term_info)
    }

    /// Finalize writing the builder, and returns the underlying
    /// `Write` object.
    ///
    /// After the FST, the output receives the term info store, then the
    /// number of bytes the term info store occupies (`u64`), then
    /// `FST_VERSION` (`u32`).
    pub fn finish(mut self) -> io::Result<W> {
        let mut output = self.fst_builder.into_inner().map_err(convert_fst_error)?;
        {
            // Counts the bytes of the term info store, which is what the
            // footer size records.
            let mut footer_writer = CountingWriter::wrap(&mut output);
            self.term_info_store_writer.serialize(&mut footer_writer)?;
            let term_info_store_len = footer_writer.written_bytes();
            term_info_store_len.serialize(&mut footer_writer)?;
            FST_VERSION.serialize(&mut footer_writer)?;
        }
        Ok(output)
    }
}

/// Reads `fst_file` entirely and interprets its content as an FST map.
///
/// Returns an `InvalidData` error if the bytes are not a valid FST.
fn open_fst_index(fst_file: FileSlice) -> io::Result<tantivy_fst::Map<OwnedBytes>> {
    let fst_bytes = fst_file.read_bytes()?;
    match Fst::new(fst_bytes) {
        Ok(fst) => Ok(tantivy_fst::Map::from(fst)),
        Err(err) => Err(io::Error::new(
            io::ErrorKind::InvalidData,
            format!("Fst data is corrupted: {err:?}"),
        )),
    }
}

/// Serialized form of a term dictionary containing no terms, built lazily on first use.
///
/// It is produced by finishing a `TermDictionaryBuilder` over an in-memory `Vec<u8>`
/// without inserting any key. `TermDictionary::empty()` opens a clone of this slice.
static EMPTY_TERM_DICT_FILE: Lazy<FileSlice> = Lazy::new(|| {
    let term_dictionary_data: Vec<u8> = TermDictionaryBuilder::create(Vec::<u8>::new())
        .expect("Creating a TermDictionaryBuilder in a Vec<u8> should never fail")
        .finish()
        .expect("Writing in a Vec<u8> should never fail");
    FileSlice::from(term_dictionary_data)
});

/// The term dictionary contains all of the terms in
/// `tantivy index` in a sorted manner.
///
/// The `Fst` crate is used to associate terms to their
/// respective `TermOrdinal`. The `TermInfoStore` then makes it
/// possible to fetch the associated `TermInfo`.
#[derive(Clone)]
pub struct TermDictionary {
    /// FST mapping each term to its `TermOrdinal`; behind an `Arc` so that clones share it.
    fst_index: Arc<tantivy_fst::Map<OwnedBytes>>,
    /// Maps a `TermOrdinal` to its `TermInfo`.
    term_info_store: TermInfoStore,
}

impl TermDictionary {
    /// Opens a `TermDictionary`.
    pub fn open(file: FileSlice) -> io::Result<Self> {
        let (main_slice, footer_len_slice) = file.split_from_end(12);
        let mut footer_len_bytes = footer_len_slice.read_bytes()?;
        let footer_size = u64::deserialize(&mut footer_len_bytes)?;
        let version = u32::deserialize(&mut footer_len_bytes)?;
        if version != FST_VERSION {
            return Err(io::Error::other(format!(
                "Unsupported fst version, expected {version}, found {FST_VERSION}",
            )));
        }

        let (fst_file_slice, values_file_slice) = main_slice.split_from_end(footer_size as usize);
        let fst_index = open_fst_index(fst_file_slice)?;
        let term_info_store = TermInfoStore::open(values_file_slice)?;
        Ok(TermDictionary {
            fst_index: Arc::new(fst_index),
            term_info_store,
        })
    }

    /// Creates an empty term dictionary which contains no terms.
    pub fn empty() -> Self {
        TermDictionary::open(EMPTY_TERM_DICT_FILE.clone()).unwrap()
    }

    /// Returns the number of terms in the dictionary.
    /// Term ordinals range from 0 to `num_terms() - 1`.
    pub fn num_terms(&self) -> usize {
        self.term_info_store.num_terms()
    }

    /// Returns the ordinal associated with a given term.
    pub fn term_ord<K: AsRef<[u8]>>(&self, key: K) -> io::Result<Option<TermOrdinal>> {
        Ok(self.fst_index.get(key))
    }

    /// Stores the term associated with a given term ordinal in
    /// a `bytes` buffer.
    ///
    /// Term ordinals are defined as the position of the term in
    /// the sorted list of terms.
    ///
    /// Returns true if and only if the term has been found.
    ///
    /// Regardless of whether the term is found or not,
    /// the buffer may be modified.
    pub fn ord_to_term(&self, mut ord: TermOrdinal, bytes: &mut Vec<u8>) -> io::Result<bool> {
        bytes.clear();
        let fst = self.fst_index.as_fst();
        let mut node = fst.root();
        while ord != 0 || !node.is_final() {
            if let Some(transition) = node
                .transitions()
                .take_while(|transition| transition.out.value() <= ord)
                .last()
            {
                ord -= transition.out.value();
                bytes.push(transition.inp);
                let new_node_addr = transition.addr;
                node = fst.node(new_node_addr);
            } else {
                return Ok(false);
            }
        }
        Ok(true)
    }

    /// Returns the number of terms in the dictionary.
    pub fn term_info_from_ord(&self, term_ord: TermOrdinal) -> TermInfo {
        self.term_info_store.get(term_ord)
    }

    /// Lookups the value corresponding to the key.
    pub fn get<K: AsRef<[u8]>>(&self, key: K) -> io::Result<Option<TermInfo>> {
        Ok(self
            .term_ord(key)?
            .map(|term_ord| self.term_info_from_ord(term_ord)))
    }

    /// Returns a range builder, to stream all of the terms
    /// within an interval.
    pub fn range(&self) -> TermStreamerBuilder<'_> {
        TermStreamerBuilder::new(self, self.fst_index.range())
    }

    /// A stream of all the sorted terms.
    pub fn stream(&self) -> io::Result<TermStreamer<'_>> {
        self.range().into_stream()
    }

    /// Returns a search builder, to stream all of the terms
    /// within the Automaton
    pub fn search<'a, A: Automaton + 'a>(&'a self, automaton: A) -> TermStreamerBuilder<'a, A> {
        let stream_builder = self.fst_index.search(automaton);
        TermStreamerBuilder::<A>::new(self, stream_builder)
    }
}


================================================
FILE: src/termdict/mod.rs
================================================
//! The term dictionary's main role is to associate the sorted [`Term`s](crate::Term) with
//! a [`TermInfo`] struct that contains some meta-information
//! about the term.
//!
//! Internally, the term dictionary relies on the `fst` crate to store
//! a sorted mapping that associates each term with its rank in the lexicographical order.
//! For instance, in a dictionary containing the sorted terms "abba", "bjork", "blur" and "donovan",
//! the [`TermOrdinal`]s are respectively `0`, `1`, `2`, and `3`.
//!
//! For `u64`-terms, tantivy explicitly uses a `BigEndian` representation to ensure that the
//! lexicographical order matches the natural order of integers.
//!
//! `i64`-terms are transformed to `u64` using a continuous mapping `val ⟶ val - i64::MIN`
//! and then treated as a `u64`.
//!
//! `f64`-terms are transformed to `u64` using a mapping that preserves order, and are then
//! treated as `u64`.
//!
//! A second datastructure makes it possible to access a [`TermInfo`].

#[cfg(not(feature = "quickwit"))]
mod fst_termdict;
#[cfg(not(feature = "quickwit"))]
use fst_termdict as termdict;

#[cfg(feature = "quickwit")]
mod sstable_termdict;
#[cfg(feature = "quickwit")]
use sstable_termdict as termdict;

#[cfg(test)]
mod tests;

/// Position of the term in the sorted list of terms.
///
/// Ordinals start at `0`: they range from `0` to `num_terms() - 1`.
pub type TermOrdinal = u64;

use std::io;

use common::file_slice::FileSlice;
use common::BinarySerializable;
use tantivy_fst::Automaton;

use self::termdict::{
    TermDictionary as InnerTermDict, TermDictionaryBuilder as InnerTermDictBuilder,
    TermStreamerBuilder,
};
pub use self::termdict::{TermMerger, TermStreamer};
use crate::postings::TermInfo;

/// Kind of term dictionary stored in a file.
///
/// The `u32` discriminant is the code written at the very end of the file by
/// `TermDictionaryBuilder::finish` and read back by `TermDictionary::open`.
#[derive(Debug, Eq, PartialEq)]
#[repr(u32)]
enum DictionaryType {
    /// FST-based dictionary.
    Fst = 1,
    /// SSTable-based dictionary.
    SSTable = 2,
}

/// Decodes the `u32` code stored in a dictionary file.
impl TryFrom<u32> for DictionaryType {
    type Error = &'static str;

    fn try_from(value: u32) -> Result<Self, Self::Error> {
        // The codes are derived from the enum discriminants rather than
        // being spelled out a second time.
        const FST_CODE: u32 = DictionaryType::Fst as u32;
        const SSTABLE_CODE: u32 = DictionaryType::SSTable as u32;
        match value {
            FST_CODE => Ok(DictionaryType::Fst),
            SSTABLE_CODE => Ok(DictionaryType::SSTable),
            _ => Err("Invalid value for DictionaryType"),
        }
    }
}

/// Dictionary type this build reads and writes: FST unless the `quickwit` feature is enabled.
#[cfg(not(feature = "quickwit"))]
const CURRENT_TYPE: DictionaryType = DictionaryType::Fst;

/// Dictionary type this build reads and writes: SSTable when the `quickwit` feature is enabled.
#[cfg(feature = "quickwit")]
const CURRENT_TYPE: DictionaryType = DictionaryType::SSTable;

// TODO in the future this should become an enum of supported dictionaries
/// A TermDictionary wrapping either an FST based dictionary or a SSTable based one.
///
/// Which of the two is wrapped is decided at compile time by the `quickwit` feature.
#[derive(Clone)]
pub struct TermDictionary(InnerTermDict);

impl TermDictionary {
    /// Opens a `TermDictionary`.
    ///
    /// The last 4 bytes of `file` hold the dictionary type code. An error is
    /// returned if the code is unknown, or if it does not match the dictionary
    /// type this build was compiled with. The rest of the file is handed to the
    /// inner dictionary.
    pub fn open(file: FileSlice) -> io::Result<Self> {
        let (main_slice, dict_type) = file.split_from_end(4);
        let mut dict_type = dict_type.read_bytes()?;
        let dict_type = u32::deserialize(&mut dict_type)?;
        let dict_type = DictionaryType::try_from(dict_type).map_err(|_| {
            io::Error::other(format!("Unsupported dictionary type, found {dict_type}"))
        })?;

        if dict_type != CURRENT_TYPE {
            return Err(io::Error::other(format!(
                "Unsupported dictionary type, compiled tantivy with {CURRENT_TYPE:?}, but got \
                 {dict_type:?}",
            )));
        }

        InnerTermDict::open(main_slice).map(TermDictionary)
    }

    /// Creates an empty term dictionary which contains no terms.
    pub fn empty() -> Self {
        TermDictionary(InnerTermDict::empty())
    }

    /// Returns the number of terms in the dictionary.
    /// Term ordinals range from 0 to `num_terms() - 1`.
    pub fn num_terms(&self) -> usize {
        self.0.num_terms()
    }

    /// Returns the ordinal associated with a given term.
    pub fn term_ord<K: AsRef<[u8]>>(&self, key: K) -> io::Result<Option<TermOrdinal>> {
        self.0.term_ord(key)
    }

    /// Stores the term associated with a given term ordinal in
    /// a `bytes` buffer.
    ///
    /// Term ordinals are defined as the position of the term in
    /// the sorted list of terms.
    ///
    /// Returns true if and only if the term has been found.
    ///
    /// Regardless of whether the term is found or not,
    /// the buffer may be modified.
    pub fn ord_to_term(&self, ord: TermOrdinal, bytes: &mut Vec<u8>) -> io::Result<bool> {
        self.0.ord_to_term(ord, bytes)
    }

    // `term_info_from_ord` is deliberately not exposed here: it isn't used, and
    // it has a different prototype in the Fst and SSTable dictionaries.
    // pub fn term_info_from_ord(&self, term_ord: TermOrdinal) -> TermInfo {
    // self.0.term_info_from_ord(term_ord)
    // }

    /// Lookups the value corresponding to the key.
    pub fn get<K: AsRef<[u8]>>(&self, key: K) -> io::Result<Option<TermInfo>> {
        self.0.get(key)
    }

    /// Returns a range builder, to stream all of the terms
    /// within an interval.
    pub fn range(&self) -> TermStreamerBuilder<'_> {
        self.0.range()
    }

    /// A stream of all the sorted terms.
    pub fn stream(&self) -> io::Result<TermStreamer<'_>> {
        self.0.stream()
    }

    /// Returns a search builder, to stream all of the terms
    /// within the Automaton
    pub fn search<'a, A: Automaton + 'a>(&'a self, automaton: A) -> TermStreamerBuilder<'a, A>
    where A::State: Clone {
        self.0.search(automaton)
    }

    #[cfg(feature = "quickwit")]
    /// Lookups the value corresponding to the key (asynchronous variant of `get`).
    pub async fn get_async<K: AsRef<[u8]>>(&self, key: K) -> io::Result<Option<TermInfo>> {
        self.0.get_async(key).await
    }

    #[cfg(feature = "quickwit")]
    #[doc(hidden)]
    pub async fn warm_up_dictionary(&self) -> io::Result<()> {
        self.0.warm_up_dictionary().await
    }

    #[cfg(feature = "quickwit")]
    /// Returns a file slice covering a set of sstable blocks
    /// that includes the key range passed in arguments.
    pub fn file_slice_for_range(
        &self,
        key_range: impl std::ops::RangeBounds<[u8]>,
        limit: Option<u64>,
    ) -> FileSlice {
        self.0.file_slice_for_range(key_range, limit)
    }
}

/// A TermDictionaryBuilder wrapping either an FST or a SSTable dictionary builder.
///
/// On top of what the inner builder writes, `finish` appends the dictionary type code.
pub struct TermDictionaryBuilder<W: io::Write>(InnerTermDictBuilder<W>);

impl<W: io::Write> TermDictionaryBuilder<W> {
    /// Creates a new `TermDictionaryBuilder`
    pub fn create(w: W) -> io::Result<Self> {
        InnerTermDictBuilder::create(w).map(TermDictionaryBuilder)
    }

    /// Inserts a `(key, value)` pair in the term dictionary.
    ///
    /// *Keys have to be inserted in order.*
    pub fn insert<K: AsRef<[u8]>>(&mut self, key_ref: K, value: &TermInfo) -> io::Result<()> {
        self.0.insert(key_ref, value)
    }

    /// # Warning
    /// Horribly dangerous internal API
    ///
    /// If used, it must be used by systematically alternating calls
    /// to insert_key and insert_value.
    ///
    /// Prefer using `.insert(key, value)`
    pub fn insert_key(&mut self, key: &[u8]) -> io::Result<()> {
        self.0.insert_key(key)
    }

    /// # Warning
    ///
    /// Horribly dangerous internal API. See `.insert_key(...)`.
    pub fn insert_value(&mut self, term_info: &TermInfo) -> io::Result<()> {
        self.0.insert_value(term_info)
    }

    /// Finalize writing the builder, and returns the underlying
    /// `Write` object.
    ///
    /// The dictionary type code (`CURRENT_TYPE` as a `u32`) is appended after
    /// the data written by the inner builder.
    pub fn finish(self) -> io::Result<W> {
        let mut writer = self.0.finish()?;
        (CURRENT_TYPE as u32).serialize(&mut writer)?;
        Ok(writer)
    }
}


================================================
FILE: src/termdict/sstable_termdict/merger.rs
================================================
use std::cmp::Ordering;
use std::collections::BinaryHeap;

use crate::postings::TermInfo;
use crate::termdict::TermStreamer;

/// A term stream together with the ordinal of the segment it comes from.
///
/// This is the element type of the `TermMerger` heap.
pub struct HeapItem<'a> {
    /// Stream of the terms of one segment.
    pub streamer: TermStreamer<'a>,
    /// Position of the stream in the list given to `TermMerger::new`.
    pub segment_ord: usize,
}

/// Two items are equal when they come from the same segment.
///
/// NOTE(review): equality only looks at `segment_ord`, while `Ord::cmp` compares
/// `(key, segment_ord)`. The two agree as long as at most one item exists per
/// segment ordinal, which is how `TermMerger::new` builds them.
impl<'a> PartialEq for HeapItem<'a> {
    fn eq(&self, other: &Self) -> bool {
        self.segment_ord == other.segment_ord
    }
}

/// Marker impl, required for `HeapItem` to implement `Ord`.
impl<'a> Eq for HeapItem<'a> {}

/// Delegates to the total order defined by `Ord`.
impl<'a> PartialOrd for HeapItem<'a> {
    fn partial_cmp(&self, other: &HeapItem<'a>) -> Option<Ordering> {
        Some(self.cmp(other))
    }
}

/// Orders items by *descending* `(key, segment_ord)`.
///
/// `BinaryHeap` is a max-heap: reversing the comparison makes it pop the
/// smallest key first, and the smallest segment ordinal first among equal keys.
impl<'a> Ord for HeapItem<'a> {
    fn cmp(&self, other: &HeapItem<'a>) -> Ordering {
        other
            .streamer
            .key()
            .cmp(self.streamer.key())
            .then_with(|| other.segment_ord.cmp(&self.segment_ord))
    }
}

/// Given a list of sorted term streams,
/// returns an iterator over sorted unique terms.
///
/// The item yield is actually a pair with
/// - the term
/// - a slice with the ordinal of the segments containing the terms.
pub struct TermMerger<'a> {
    /// Streams positioned on a term greater than the current one.
    heap: BinaryHeap<HeapItem<'a>>,
    /// Streams positioned on the current term. They are advanced and pushed
    /// back into the heap at the beginning of the next call to `advance`.
    current_streamers: Vec<HeapItem<'a>>,
}

impl<'a> TermMerger<'a> {
    /// Stream of merged term dictionary
    ///
    /// The position of each stream in `streams` becomes its segment ordinal.
    pub fn new(streams: Vec<TermStreamer<'a>>) -> TermMerger<'a> {
        let mut current_streamers = Vec::with_capacity(streams.len());
        for (segment_ord, streamer) in streams.into_iter().enumerate() {
            current_streamers.push(HeapItem {
                streamer,
                segment_ord,
            });
        }
        TermMerger {
            heap: BinaryHeap::new(),
            current_streamers,
        }
    }

    /// Advances every stream positioned on the current term, and moves the
    /// ones that are not exhausted back into the heap.
    fn advance_segments(&mut self) {
        for mut item in self.current_streamers.drain(..) {
            if item.streamer.advance() {
                self.heap.push(item);
            }
        }
    }

    /// Advance the term iterator to the next term.
    /// Returns true if there is indeed another term
    /// False if there is none.
    pub fn advance(&mut self) -> bool {
        self.advance_segments();
        match self.heap.pop() {
            Some(head) => self.current_streamers.push(head),
            None => return false,
        }
        // Gather all of the other streams positioned on the same term.
        loop {
            let same_key = self.heap.peek().is_some_and(|next| {
                next.streamer.key() == self.current_streamers[0].streamer.key()
            });
            if !same_key {
                break;
            }
            if let Some(item) = self.heap.pop() {
                self.current_streamers.push(item);
            }
        }
        true
    }

    /// Returns the current term.
    ///
    /// This method may be called
    /// if and only if advance() has been called before
    /// and "true" was returned.
    pub fn key(&self) -> &[u8] {
        let head = &self.current_streamers[0];
        head.streamer.key()
    }

    /// Returns the sorted list of segment ordinals
    /// that include the current term.
    ///
    /// This method may be called
    /// if and only if advance() has been called before
    /// and "true" was returned.
    pub fn current_segment_ords_and_term_infos<'b: 'a>(
        &'b self,
    ) -> impl 'b + Iterator<Item = (usize, TermInfo)> {
        self.current_streamers.iter().map(|item| {
            let term_info = item.streamer.value().clone();
            (item.segment_ord, term_info)
        })
    }
}


================================================
FILE: src/termdict/sstable_termdict/mod.rs
================================================
use std::io;

mod merger;

use std::iter::ExactSizeIterator;

use common::VInt;
use sstable::value::{ValueReader, ValueWriter};
use sstable::SSTable;
use tantivy_fst::automaton::AlwaysMatch;

pub use self::merger::TermMerger;
use crate::postings::TermInfo;

/// The term dictionary contains all of the terms in
/// `tantivy index` in a sorted manner.
///
/// This variant is an `sstable::Dictionary` specialized with [`TermSSTable`],
/// whose values are `TermInfo`s.
pub type TermDictionary = sstable::Dictionary<TermSSTable>;

/// Builder for the new term dictionary.
///
/// It is an `sstable::Writer` whose values are encoded by [`TermInfoValueWriter`].
pub type TermDictionaryBuilder<W> = sstable::Writer<W, TermInfoValueWriter>;

/// `TermStreamer` acts as a cursor over a range of terms of a segment.
/// Terms are guaranteed to be sorted.
pub type TermStreamer<'a, A = AlwaysMatch> = sstable::Streamer<'a, TermSSTable, A>;

/// SSTable used to store TermInfo objects.
#[derive(Clone)]
pub struct TermSSTable;

/// Builder of [`TermStreamer`]s. The automaton `A` defaults to `AlwaysMatch`.
pub type TermStreamerBuilder<'a, A = AlwaysMatch> = sstable::StreamerBuilder<'a, TermSSTable, A>;

/// Declares `TermInfo` as the value type of the SSTable, along with the
/// reader and writer in charge of decoding and encoding blocks of values.
impl SSTable for TermSSTable {
    type Value = TermInfo;
    type ValueReader = TermInfoValueReader;
    type ValueWriter = TermInfoValueWriter;
}

/// Decodes blocks of `TermInfo`s written by `TermInfoValueWriter`.
#[derive(Default)]
pub struct TermInfoValueReader {
    /// Term infos of the last block passed to `load`.
    term_infos: Vec<TermInfo>,
}

impl ValueReader for TermInfoValueReader {
    type Value = TermInfo;

    /// Returns the `idx`-th term info of the last loaded block.
    ///
    /// # Panics
    ///
    /// Panics if `idx` is out of bounds.
    #[inline(always)]
    fn value(&self, idx: usize) -> &TermInfo {
        &self.term_infos[idx]
    }

    /// Decodes one block of term infos from the beginning of `data`, replacing
    /// the previously loaded block, and returns the number of bytes consumed.
    ///
    /// A block is made of VInts: the number of elements, the postings and
    /// positions start offsets of the first element, and then for each element
    /// its doc freq, postings length and positions length. The ranges of
    /// consecutive elements are contiguous, which is why only the first start
    /// offsets are stored.
    fn load(&mut self, mut data: &[u8]) -> io::Result<usize> {
        let len_before = data.len();
        self.term_infos.clear();
        let num_els = VInt::deserialize_u64(&mut data)?;
        if num_els == 0 {
            // An empty block consists of its element count only: the writer
            // does not emit the start offsets, so they must not be read here.
            return Ok(len_before - data.len());
        }
        let mut postings_start = VInt::deserialize_u64(&mut data)? as usize;
        let mut positions_start = VInt::deserialize_u64(&mut data)? as usize;
        for _ in 0..num_els {
            let doc_freq = VInt::deserialize_u64(&mut data)? as u32;
            let postings_num_bytes = VInt::deserialize_u64(&mut data)?;
            let positions_num_bytes = VInt::deserialize_u64(&mut data)?;
            let postings_end = postings_start + postings_num_bytes as usize;
            let positions_end = positions_start + positions_num_bytes as usize;
            let term_info = TermInfo {
                doc_freq,
                postings_range: postings_start..postings_end,
                positions_range: positions_start..positions_end,
            };
            self.term_infos.push(term_info);
            // The next element starts where this one ends.
            postings_start = postings_end;
            positions_start = positions_end;
        }
        let consumed_len = len_before - data.len();
        Ok(consumed_len)
    }
}

/// Buffers the `TermInfo`s of a block and encodes them as a sequence of VInts.
#[derive(Default)]
pub struct TermInfoValueWriter {
    /// Term infos written since the last call to `clear`.
    term_infos: Vec<TermInfo>,
}

impl ValueWriter for TermInfoValueWriter {
    type Value = TermInfo;

    /// Buffers a copy of `term_info` for the current block.
    fn write(&mut self, term_info: &TermInfo) {
        self.term_infos.push(term_info.clone());
    }

    /// Appends the encoded block to `buffer`.
    ///
    /// The block starts with the number of term infos. If there is at least
    /// one, it is followed by the postings and positions start offsets of the
    /// first one, and then by the doc freq, postings length and positions
    /// length of each of them. Every value is a VInt.
    fn serialize_block(&self, buffer: &mut Vec<u8>) {
        let num_els = self.term_infos.len() as u64;
        VInt(num_els).serialize_into_vec(buffer);
        let Some(first) = self.term_infos.first() else {
            return;
        };
        let block_starts = [
            first.postings_range.start as u64,
            first.positions_range.start as u64,
        ];
        for start in block_starts {
            VInt(start).serialize_into_vec(buffer);
        }
        for term_info in self.term_infos.iter() {
            let fields = [
                term_info.doc_freq as u64,
                term_info.postings_range.len() as u64,
                term_info.positions_range.len() as u64,
            ];
            for field in fields {
                VInt(field).serialize_into_vec(buffer);
            }
        }
    }

    /// Drops the buffered term infos, getting ready for the next block.
    fn clear(&mut self) {
        self.term_infos.clear();
    }
}

#[cfg(test)]
mod tests {
    use sstable::value::{ValueReader, ValueWriter};

    use crate::postings::TermInfo;
    use crate::termdict::sstable_termdict::TermInfoValueReader;

    /// A block of term infos with contiguous ranges must survive a
    /// serialize / load round trip, and `load` must consume the whole block.
    #[test]
    fn test_block_terminfos() {
        let term_infos = [
            TermInfo {
                doc_freq: 120u32,
                postings_range: 17..45,
                positions_range: 10..122,
            },
            TermInfo {
                doc_freq: 10u32,
                postings_range: 45..450,
                positions_range: 122..1100,
            },
            TermInfo {
                doc_freq: 17u32,
                postings_range: 450..462,
                positions_range: 1100..1302,
            },
        ];
        let mut term_info_writer = super::TermInfoValueWriter::default();
        for term_info in &term_infos {
            term_info_writer.write(term_info);
        }
        let mut buffer = Vec::new();
        term_info_writer.serialize_block(&mut buffer);
        let mut term_info_reader = TermInfoValueReader::default();
        let num_bytes: usize = term_info_reader.load(&buffer[..]).unwrap();
        // Every term info is checked, not just the first one: the other ones
        // are rebuilt from the accumulated lengths.
        for (idx, expected) in term_infos.iter().enumerate() {
            assert_eq!(term_info_reader.value(idx), expected, "term info {idx}");
        }
        assert_eq!(buffer.len(), num_bytes);
    }
}


================================================
FILE: src/termdict/tests.rs
================================================
use std::path::PathBuf;
use std::{io, str};

use super::{TermDictionary, TermDictionaryBuilder, TermStreamer};
use crate::directory::{Directory, FileSlice, RamDirectory, TerminatingWrite};
use crate::postings::TermInfo;

// NOTE(review): presumably the number of terms per block assumed by the tests
// further down in this file — confirm against its usages.
const BLOCK_SIZE: usize = 1_500;

/// Builds a deterministic `TermInfo` for the term of ordinal `term_ord`.
///
/// The doc freq is the ordinal itself. The postings range of an ordinal ends
/// where the range of the next ordinal starts, and the positions range is the
/// postings range with both bounds doubled.
fn make_term_info(term_ord: u64) -> TermInfo {
    let offset_at = |ord: u64| (ord * 100 + ord * ord) as usize;
    let (start, end) = (offset_at(term_ord), offset_at(term_ord + 1));
    TermInfo {
        doc_freq: term_ord as u32,
        postings_range: start..end,
        positions_range: start * 2..end * 2,
    }
}

/// Streaming an empty dictionary yields no term.
#[test]
fn test_empty_term_dictionary() {
    let empty_dict = TermDictionary::empty();
    let mut stream = empty_dict.stream().unwrap();
    assert!(stream.next().is_none());
}

/// Terms inserted in sorted order get consecutive ordinals starting at 0, and
/// `term_ord` / `ord_to_term` are inverse of each other.
#[test]
fn test_term_ordinals() -> crate::Result<()> {
    const COUNTRIES: [&str; 7] = [
        "San Marino",
        "Serbia",
        "Slovakia",
        "Slovenia",
        "Spain",
        "Sweden",
        "Switzerland",
    ];
    let directory = RamDirectory::create();
    let path = PathBuf::from("TermDictionary");
    {
        let write = directory.open_write(&path)?;
        let mut builder = TermDictionaryBuilder::create(write)?;
        // The term info does not matter here: only the ordinals are checked.
        let term_info = make_term_info(0u64);
        for country in &COUNTRIES {
            builder.insert(country.as_bytes(), &term_info)?;
        }
        builder.finish()?.terminate()?;
    }
    let term_file = directory.open_read(&path)?;
    let term_dict: TermDictionary = TermDictionary::open(term_file)?;
    for (expected_ord, country) in (0u64..).zip(COUNTRIES.iter()) {
        assert_eq!(term_dict.term_ord(country)?, Some(expected_ord));
        let mut bytes = vec![];
        assert!(term_dict.ord_to_term(expected_ord, &mut bytes)?);
        assert_eq!(bytes, country.as_bytes());
    }
    Ok(())
}

/// Two terms can be looked up by key, and are streamed back in order with
/// `key()` / `value()` reflecting the last item returned by `next()`.
#[test]
fn test_term_dictionary_simple() -> crate::Result<()> {
    let directory = RamDirectory::create();
    let path = PathBuf::from("TermDictionary");
    {
        let write = directory.open_write(&path)?;
        let mut builder = TermDictionaryBuilder::create(write)?;
        builder.insert("abc".as_bytes(), &make_term_info(34u64))?;
        builder.insert("abcd".as_bytes(), &make_term_info(346u64))?;
        builder.finish()?.terminate()?;
    }
    let file = directory.open_read(&path)?;
    let term_dict: TermDictionary = TermDictionary::open(file)?;
    assert_eq!(term_dict.get("abc")?.unwrap().doc_freq, 34u32);
    assert_eq!(term_dict.get("abcd")?.unwrap().doc_freq, 346u32);
    let mut stream = term_dict.stream()?;
    for (expected_key, expected_doc_freq) in [("abc", 34u32), ("abcd", 346u32)] {
        {
            let (key, term_info) = stream.next().unwrap();
            assert_eq!(key, expected_key.as_bytes());
            assert_eq!(term_info.doc_freq, expected_doc_freq);
        }
        // The cursor accessors keep pointing at the item that was just returned.
        assert_eq!(stream.key(), expected_key.as_bytes());
        assert_eq!(stream.value().doc_freq, expected_doc_freq);
    }
    assert!(!stream.advance());
    Ok(())
}

// Streams a 10_000-term dictionary and checks that every inserted entry comes
// back, in insertion order, with the `TermInfo` it was stored with. Also spot
// checks one point lookup.
#[test]
fn test_term_dictionary_stream() -> crate::Result<()> {
    let ids: Vec<_> = (0u32..10_000u32)
        .map(|i| (format!("doc{i:0>6}"), i))
        .collect();
    let buffer: Vec<u8> = {
        let mut term_dictionary_builder = TermDictionaryBuilder::create(vec![])?;
        for (id, i) in &ids {
            term_dictionary_builder.insert(id.as_bytes(), &make_term_info(*i as u64))?;
        }
        term_dictionary_builder.finish()?
    };
    let term_file = FileSlice::from(buffer);
    let term_dictionary: TermDictionary = TermDictionary::open(term_file)?;
    {
        let mut streamer = term_dictionary.stream()?;
        let mut num_streamed = 0;
        while let Some((streamer_k, streamer_v)) = streamer.next() {
            let (key, v) = &ids[num_streamed];
            assert_eq!(streamer_k, key.as_bytes());
            assert_eq!(streamer_v, &make_term_info(*v as u64));
            num_streamed += 1;
        }
        // Without this check a stream that stops early (or yields nothing at
        // all) would pass the loop above vacuously.
        assert_eq!(num_streamed, ids.len());
    }

    let (key, val) = &ids[2047];
    assert_eq!(
        term_dictionary.get(key.as_bytes())?,
        Some(make_term_info(*val as u64))
    );
    Ok(())
}

// Streams three terms, two of which share a long common prefix, and checks
// that keys and values come back intact and in order.
#[test]
fn test_stream_high_range_prefix_suffix() -> crate::Result<()> {
    // term requires more than 16bits
    let terms: [(&str, u64); 3] = [
        ("abcdefghijklmnopqrstuvwxy", 1),
        ("abcdefghijklmnopqrstuvwxyz", 2),
        ("abr", 3),
    ];
    let buffer: Vec<u8> = {
        let mut builder = TermDictionaryBuilder::create(vec![]).unwrap();
        for &(term, ord) in terms.iter() {
            builder.insert(term, &make_term_info(ord))?;
        }
        builder.finish()?
    };
    let term_dictionary: TermDictionary = TermDictionary::open(FileSlice::from(buffer))?;
    let mut kv_stream = term_dictionary.stream()?;
    for &(term, ord) in terms.iter() {
        assert!(kv_stream.advance());
        assert_eq!(kv_stream.key(), term.as_bytes());
        assert_eq!(kv_stream.value(), &make_term_info(ord));
    }
    // The stream must be exhausted after the last inserted term.
    assert!(!kv_stream.advance());
    Ok(())
}

// Exercises bounded range streams (`ge`, `gt`, and `ge` + `lt`) over a
// 10_000-term dictionary, probing around several start positions.
#[test]
fn test_stream_range() -> crate::Result<()> {
    let mut ids: Vec<(String, u32)> = Vec::with_capacity(10_000);
    for i in 0u32..10_000u32 {
        ids.push((format!("doc{i:0>6}"), i));
    }
    let buffer: Vec<u8> = {
        let mut builder = TermDictionaryBuilder::create(vec![]).unwrap();
        for (id, i) in &ids {
            builder
                .insert(id.as_bytes(), &make_term_info(*i as u64))
                .unwrap();
        }
        builder.finish()?
    };
    let term_dictionary: TermDictionary = TermDictionary::open(FileSlice::from(buffer))?;

    // Inclusive lower bound: the stream starts at the target term itself.
    for start in (0..20).chain(6000..8_000) {
        let mut streamer = term_dictionary
            .range()
            .ge(ids[start].0.as_bytes())
            .into_stream()?;
        for (expected_key, expected_ord) in &ids[start..start + 3] {
            let (streamer_k, streamer_v) = streamer.next().unwrap();
            assert_eq!(str::from_utf8(streamer_k).unwrap(), expected_key);
            assert_eq!(streamer_v.doc_freq, *expected_ord);
            assert_eq!(streamer_v, &make_term_info(*expected_ord as u64));
        }
    }

    // Exclusive lower bound: the stream starts right after the target term.
    for start in (0..20).chain((BLOCK_SIZE - 10)..(BLOCK_SIZE + 10)) {
        let mut streamer = term_dictionary
            .range()
            .gt(ids[start].0.as_bytes())
            .into_stream()?;
        for (expected_key, expected_ord) in &ids[start + 1..start + 4] {
            let (streamer_k, streamer_v) = streamer.next().unwrap();
            assert_eq!(streamer_k, expected_key.as_bytes());
            assert_eq!(streamer_v.doc_freq, *expected_ord);
        }
    }

    // Half-open window `[start, start + width)`: exactly `width` entries.
    for start in (0..20).chain((BLOCK_SIZE - 10)..(BLOCK_SIZE + 10)) {
        for width in 0..3 {
            let lower = ids[start].0.as_bytes();
            let upper = ids[start + width].0.as_bytes();
            let mut streamer = term_dictionary
                .range()
                .ge(lower)
                .lt(upper)
                .into_stream()?;
            for _ in 0..width {
                assert!(streamer.next().is_some());
            }
            assert!(streamer.next().is_none());
        }
    }
    Ok(())
}

// The empty key is a valid term: it must be stored and streamed back first,
// followed by the single-byte key `[1]`.
#[test]
fn test_empty_string() -> crate::Result<()> {
    let buffer: Vec<u8> = {
        let mut builder = TermDictionaryBuilder::create(vec![]).unwrap();
        builder.insert([], &make_term_info(1_u64)).unwrap();
        builder.insert([1u8], &make_term_info(2_u64)).unwrap();
        builder.finish()?
    };
    let term_dictionary: TermDictionary = TermDictionary::open(FileSlice::from(buffer))?;
    let mut stream = term_dictionary.stream()?;

    // First entry: the empty key.
    assert!(stream.advance());
    assert!(stream.key().is_empty());

    // Second entry: the one-byte key.
    assert!(stream.advance());
    assert_eq!(stream.key(), &[1u8]);

    // Nothing left.
    assert!(!stream.advance());
    Ok(())
}

/// Builds an in-memory dictionary holding the ten single-byte terms `[0]`
/// through `[9]`, each associated with `make_term_info` of its own value.
fn stream_range_test_dict() -> io::Result<TermDictionary> {
    let mut builder = TermDictionaryBuilder::create(Vec::new())?;
    for byte in 0u8..10u8 {
        builder.insert([byte], &make_term_info(u64::from(byte)))?;
    }
    let buffer: Vec<u8> = builder.finish()?;
    TermDictionary::open(FileSlice::from(buffer))
}

// Checks which entries each kind of bound (`ge`, `gt`, `lt`, `le`, and a
// `ge` + `lt` pair) lets through on a forward stream over terms `[0]..=[9]`.
#[test]
fn test_stream_range_boundaries_forward() -> crate::Result<()> {
    let term_dictionary = stream_range_test_dict()?;
    // Drains a stream and returns the `doc_freq` of every entry, in order.
    let doc_freqs = |mut streamer: TermStreamer<'_>| {
        let mut collected: Vec<u32> = Vec::new();
        while let Some((_, term_info)) = streamer.next() {
            collected.push(term_info.doc_freq);
        }
        collected
    };

    let at_least_two = term_dictionary.range().ge([2u8]).into_stream()?;
    assert_eq!(doc_freqs(at_least_two), (2u32..10u32).collect::<Vec<u32>>());

    let above_two = term_dictionary.range().gt([2u8]).into_stream()?;
    assert_eq!(doc_freqs(above_two), (3u32..10u32).collect::<Vec<u32>>());

    let below_six = term_dictionary.range().lt([6u8]).into_stream()?;
    assert_eq!(doc_freqs(below_six), (0u32..6u32).collect::<Vec<u32>>());

    let at_most_six = term_dictionary.range().le([6u8]).into_stream()?;
    assert_eq!(doc_freqs(at_most_six), (0u32..7u32).collect::<Vec<u32>>());

    let zero_to_five = term_dictionary.range().ge([0u8]).lt([5u8]).into_stream()?;
    assert_eq!(doc_freqs(zero_to_five), (0u32..5u32).collect::<Vec<u32>>());

    Ok(())
}

// Same boundary checks as the forward variant, on `backward()` streams. The
// collected values are reversed before comparison, so the expected lists are
// written in ascending order.
#[cfg(not(feature = "quickwit"))]
#[test]
fn test_stream_range_boundaries_backward() -> crate::Result<()> {
    let term_dictionary = stream_range_test_dict()?;
    // Drains a stream and returns its `doc_freq`s in reverse streaming order.
    let reversed_doc_freqs = |mut streamer: TermStreamer<'_>| {
        let mut collected: Vec<u32> = Vec::new();
        while let Some((_, term_info)) = streamer.next() {
            collected.push(term_info.doc_freq);
        }
        collected.into_iter().rev().collect::<Vec<u32>>()
    };

    let unbounded = term_dictionary.range().backward().into_stream()?;
    assert_eq!(
        reversed_doc_freqs(unbounded),
        (0u32..10u32).collect::<Vec<u32>>()
    );

    let at_least_two = term_dictionary.range().ge([2u8]).backward().into_stream()?;
    assert_eq!(
        reversed_doc_freqs(at_least_two),
        (2u32..10u32).collect::<Vec<u32>>()
    );

    let above_two = term_dictionary.range().gt([2u8]).backward().into_stream()?;
    assert_eq!(
        reversed_doc_freqs(above_two),
        (3u32..10u32).collect::<Vec<u32>>()
    );

    let below_six = term_dictionary.range().lt([6u8]).backward().into_stream()?;
    assert_eq!(
        reversed_doc_freqs(below_six),
        (0u32..6u32).collect::<Vec<u32>>()
    );

    let at_most_six = term_dictionary.range().le([6u8]).backward().into_stream()?;
    assert_eq!(
        reversed_doc_freqs(at_most_six),
        (0u32..7u32).collect::<Vec<u32>>()
    );

    let zero_to_five = term_dictionary
        .range()
        .ge([0u8])
        .lt([5u8])
        .backward()
        .into_stream()?;
    assert_eq!(
        reversed_doc_freqs(zero_to_five),
        (0u32..5u32).collect::<Vec<u32>>()
    );

    Ok(())
}

// Every ordinal of the ten-term fixture must resolve back to its single-byte
// term. The same output buffer is reused across calls on purpose, so the
// comparison also checks that stale bytes from the previous call do not leak
// into the result.
#[test]
fn test_ord_to_term() -> crate::Result<()> {
    let termdict = stream_range_test_dict()?;
    let mut bytes = vec![];
    for b in 0u8..10u8 {
        // The returned flag was previously discarded; `test_term_ordinals`
        // asserts it for existing ordinals, so do the same here.
        assert!(termdict.ord_to_term(b as u64, &mut bytes)?);
        assert_eq!(&bytes, &[b]);
    }
    Ok(())
}

// While streaming the ten-term fixture, `term_ord()` must report the rank of
// the current entry and `key()` the matching single-byte term.
#[test]
fn test_stream_term_ord() -> crate::Result<()> {
    let termdict = stream_range_test_dict()?;
    let mut stream = termdict.stream()?;
    for expected_ord in 0u64..10u64 {
        assert!(stream.advance());
        assert_eq!(stream.term_ord(), expected_ord);
        assert_eq!(stream.key(), &[expected_ord as u8]);
    }
    // The fixture holds exactly ten terms.
    assert!(!stream.advance());
    Ok(())
}

// Searches a small vocabulary with a Levenshtein DFA built for the misspelled
// query "Spaen" and expects "Spain" to be the one and only match.
#[test]
fn test_automaton_search() -> crate::Result<()> {
    use levenshtein_automata::LevenshteinAutomatonBuilder;

    use crate::query::DfaWrapper;

    const COUNTRIES: [&str; 7] = [
        "San Marino",
        "Serbia",
        "Slovakia",
        "Slovenia",
        "Spain",
        "Sweden",
        "Switzerland",
    ];

    let directory = RamDirectory::create();
    let path = PathBuf::from("TermDictionary");
    {
        let mut builder = TermDictionaryBuilder::create(directory.open_write(&path)?)?;
        for country in COUNTRIES.iter() {
            builder.insert(country.as_bytes(), &make_term_info(0u64))?;
        }
        builder.finish()?.terminate()?;
    }
    let term_dict: TermDictionary = TermDictionary::open(directory.open_read(&path)?)?;

    // Build the DFA for the query.
    // NOTE(review): the `(2, true)` arguments are presumably "max edit
    // distance 2, transpositions cost one edit" — confirm against the
    // levenshtein_automata documentation.
    let dfa = LevenshteinAutomatonBuilder::new(2, true).build_dfa("Spaen");
    let mut matches = term_dict.search(DfaWrapper(dfa)).into_stream()?;

    // Exactly one term is expected to match.
    assert!(matches.advance());
    assert_eq!("Spain".as_bytes(), matches.key());
    assert!(!matches.advance());
    Ok(())
}


================================================
FILE: src/tokenizer/alphanum_only.rs
================================================
//! # Example
//! ```rust
//! use tantivy::tokenizer::*;
//!
//! let mut tokenizer = TextAnalyzer::builder(RawTokenizer::default())
//!   .filter(AlphaNumOnlyFilter)
//!   .build();
//!
//! let mut stream = tokenizer.token_stream("hello there");
//! // is none because the raw tokenizer emits one token that
//! // contains a space
//! assert!(stream.next().is_none());
//!
//! let mut tokenizer = TextAnalyzer::builder(SimpleTokenizer::default())
//!   .filter(AlphaNumOnlyFilter)
//!   .build();
//!
//! let mut stream = tokenizer.token_stream("hello there 💣");
//! assert!(stream.next().is_some());
//! assert!(stream.next().is_some());
//! // the "emoji" is dropped because it's not an alphanum
//! assert!(stream.next().is_none());
//! ```
use super::{Token, TokenFilter, TokenStream, Tokenizer};

/// `TokenFilter` that removes all tokens that contain non
/// ascii alphanumeric characters.
///
/// A token is kept only if every character of its text is an ASCII letter or
/// digit; a token with an empty text therefore passes the filter.
#[derive(Clone)]
pub struct AlphaNumOnlyFilter;

/// Token stream that forwards only those tokens of the wrapped stream whose
/// text consists exclusively of ASCII alphanumeric characters.
pub struct AlphaNumOnlyFilterStream<T> {
    /// The wrapped token stream being filtered.
    tail: T,
}

impl<T> AlphaNumOnlyFilterStream<T> {
    /// Returns `true` if `token` should be kept, i.e. if its text contains
    /// nothing but ASCII letters and digits.
    fn predicate(&self, token: &Token) -> bool {
        // Every byte of a non-ASCII character's UTF-8 encoding is >= 0x80,
        // and therefore never ASCII alphanumeric, so checking bytes is
        // equivalent to checking chars.
        token
            .text
            .bytes()
            .all(|byte| byte.is_ascii_alphanumeric())
    }
}

impl TokenFilter for AlphaNumOnlyFilter {
    // Tokenizer type produced once this filter is applied on top of `T`.
    type Tokenizer<T: Tokenizer> = AlphaNumOnlyFilterWrapper<T>;

    /// Wraps `tokenizer` so that the token streams it produces go through the
    /// ASCII-alphanumeric filter.
    fn transform<T: Tokenizer>(self, tokenizer: T) -> AlphaNumOnlyFilterWrapper<T> {
        AlphaNumOnlyFilterWrapper(tokenizer)
    }
}

/// Tokenizer adapter created by `AlphaNumOnlyFilter::transform`: it owns the
/// wrapped tokenizer and filters every token stream that tokenizer produces.
#[derive(Clone)]
pub struct AlphaNumOnlyFilterWrapper<T>(T);

impl<T: Tokenizer> Tokenizer for AlphaNumOnlyFilterWrapper<T> {
    type TokenStream<'a> = AlphaNumOnlyFilterStream<T::TokenStream<'a>>;

    /// Tokenizes `text` with the wrapped tokenizer and returns its stream
    /// wrapped in the filtering stream.
    fn token_stream<'a>(&'a mut self, text: &'a str) -> Self::TokenStream<'a> {
        let tail = self.0.token_stream(text);
        AlphaNumOnlyFilterStream { tail }
    }
}

impl<T: TokenStream> TokenStream for AlphaNumOnlyFilterStream<T> {
    /// Moves to the next token accepted by the filter.
    ///
    /// Returns `false` once the wrapped stream is exhausted.
    fn advance(&mut self) -> bool {
        loop {
            if !self.tail.advance() {
                return false;
            }
            if self.predicate(self.tail.token()) {
                return true;
            }
            // Rejected token: keep pulling from the wrapped stream.
        }
    }

    /// Current token, borrowed straight from the wrapped stream.
    fn token(&self) -> &Token {
        self.tail.token()
    }

    /// Mutable access to the current token of the wrapped stream.
    fn token_mut(&mut self) -> &mut Token {
        self.tail.token_mut()
    }
}

#[cfg(test)]
mod tests {
    use crate::tokenizer::tests::assert_token;
    use crate::tokenizer::{AlphaNumOnlyFilter, SimpleTokenizer, TextAnalyzer, Token};

    /// Runs `text` through `SimpleTokenizer` followed by `AlphaNumOnlyFilter`
    /// and returns a copy of every token that survives.
    fn token_stream_helper(text: &str) -> Vec<Token> {
        let mut analyzer = TextAnalyzer::builder(SimpleTokenizer::default())
            .filter(AlphaNumOnlyFilter)
            .build();
        let mut collected: Vec<Token> = Vec::new();
        let mut token_stream = analyzer.token_stream(text);
        token_stream.process(&mut |token: &Token| collected.push(token.clone()));
        collected
    }

    #[test]
    fn test_alphanum_only() {
        let tokens = token_stream_helper("I am a cat. 我輩は猫である。(1906)");
        // (position, text, offset_from, offset_to) of each expected token.
        // Position 4 is absent: the token at that position is filtered out.
        let expected = [
            (0, "I", 0, 1),
            (1, "am", 2, 4),
            (2, "a", 5, 6),
            (3, "cat", 7, 10),
            (5, "1906", 37, 41),
        ];
        assert_eq!(tokens.len(), 5);
        for (token, &(position, text, from, to)) in tokens.iter().zip(expected.iter()) {
            assert_token(token, position, text, from, to);
        }
    }
}


================================================
FILE: src/tokenizer/ascii_folding_filter.rs
================================================
use std::mem;

use super::{Token, TokenFilter, TokenStream, Tokenizer};

/// This filter converts alphabetic, numeric, and symbolic Unicode characters
/// which are not in the first 127 ASCII characters (the "Basic Latin" Unicode
/// block) into their ASCII equivalents, if one exists.
///
/// Tokens whose text is already pure ASCII are passed through untouched.
#[derive(Clone)]
pub struct AsciiFoldingFilter;

impl TokenFilter for AsciiFoldingFilter {
    type Tokenizer<T: Tokenizer> = AsciiFoldingFilterWrapper<T>;

    /// Wraps `tokenizer`, pairing it with an initially empty scratch buffer
    /// that the resulting token streams borrow.
    fn transform<T: Tokenizer>(self, tokenizer: T) -> AsciiFoldingFilterWrapper<T> {
        let buffer = String::new();
        AsciiFoldingFilterWrapper { tokenizer, buffer }
    }
}

/// Tokenizer adapter created by `AsciiFoldingFilter::transform`.
#[derive(Clone)]
pub struct AsciiFoldingFilterWrapper<T> {
    /// The wrapped tokenizer whose tokens get folded.
    tokenizer: T,
    /// Scratch string cleared at the start of every `token_stream` call and
    /// lent to the token stream it returns.
    buffer: String,
}

impl<T: Tokenizer> Tokenizer for AsciiFoldingFilterWrapper<T> {
    type TokenStream<'a> = AsciiFoldingFilterTokenStream<'a, T::TokenStream<'a>>;

    /// Tokenizes `text` with the wrapped tokenizer and returns a folding
    /// stream that borrows this wrapper's (freshly cleared) scratch buffer.
    fn token_stream<'a>(&'a mut self, text: &'a str) -> Self::TokenStream<'a> {
        self.buffer.clear();
        let tail = self.tokenizer.token_stream(text);
        AsciiFoldingFilterTokenStream {
            buffer: &mut self.buffer,
            tail,
        }
    }
}

/// Token stream that replaces the text of each non-ASCII token of the wrapped
/// stream with the output of `to_ascii`.
pub struct AsciiFoldingFilterTokenStream<'a, T> {
    /// Scratch string borrowed from the wrapper; it is passed to `to_ascii`
    /// and then swapped with the token text.
    buffer: &'a mut String,
    /// The wrapped token stream.
    tail: T,
}

impl<T: TokenStream> TokenStream for AsciiFoldingFilterTokenStream<'_, T> {
    /// Advances the wrapped stream and folds the new token's text if needed.
    ///
    /// Returns `false` once the wrapped stream is exhausted.
    fn advance(&mut self) -> bool {
        if !self.tail.advance() {
            return false;
        }
        // Text that is already pure ASCII needs no folding and is left as is;
        // only the remaining tokens are rewritten. The check is read-only, so
        // it goes through `token()` rather than `token_mut()`.
        if !self.tail.token().text.is_ascii() {
            // NOTE(review): `to_ascii` is defined further down in this file;
            // presumably it writes the folded form of its first argument into
            // the buffer — confirm.
            to_ascii(&self.tail.token().text, self.buffer);
            // Swap instead of copying: the token takes over the buffer's
            // contents, and the buffer receives the token's previous string.
            mem::swap(&mut self.tail.token_mut().text, self.buffer);
        }
        true
    }

    /// Current token, borrowed from the wrapped stream.
    fn token(&self) -> &Token {
        self.tail.token()
    }

    /// Mutable access to the current token of the wrapped stream.
    fn token_mut(&mut self) -> &mut Token {
        self.tail.token_mut()
    }
}

// Returns a string that represents the ascii folded version of
// the character. If the `char` does not require ascii folding
// (e.g. simple ASCII chars like `A`) or if the `char`
// does not have a sensible ascii equivalent (e.g. Kanjis like 馬),
// this function returns `None`.
fn fold_non_ascii_char(c: char) -> Option<&'static str> {
    match c {
        '\u{00C0}' | // À  [LATIN CAPITAL LETTER A WITH GRAVE]
        '\u{00C1}' | // Á  [LATIN CAPITAL LETTER A WITH ACUTE]
        '\u{00C2}' | // Â  [LATIN CAPITAL LETTER A WITH CIRCUMFLEX]
        '\u{00C3}' | // Ã  [LATIN CAPITAL LETTER A WITH TILDE]
        '\u{00C4}' | // Ä  [LATIN CAPITAL LETTER A WITH DIAERESIS]
        '\u{00C5}' | // Å  [LATIN CAPITAL LETTER A WITH RING ABOVE]
        '\u{0100}' | // Ā  [LATIN CAPITAL LETTER A WITH MACRON]
        '\u{0102}' | // Ă  [LATIN CAPITAL LETTER A WITH BREVE]
        '\u{0104}' | // Ą  [LATIN CAPITAL LETTER A WITH OGONEK]
        '\u{018F}' | // Ə  http://en.wikipedia.org/wiki/Schwa  [LATIN CAPITAL LETTER SCHWA]
        '\u{01CD}' | // Ǎ  [LATIN CAPITAL LETTER A WITH CARON]
        '\u{01DE}' | // Ǟ  [LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON]
        '\u{01E0}' | // Ǡ  [LATIN CAPITAL LETTER A WITH DOT ABOVE AND MACRON]
        '\u{01FA}' | // Ǻ  [LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE]
        '\u{0200}' | // Ȁ  [LATIN CAPITAL LETTER A WITH DOUBLE GRAVE]
        '\u{0202}' | // Ȃ  [LATIN CAPITAL LETTER A WITH INVERTED BREVE]
        '\u{0226}' | // Ȧ  [LATIN CAPITAL LETTER A WITH DOT ABOVE]
        '\u{023A}' | // Ⱥ  [LATIN CAPITAL LETTER A WITH STROKE]
        '\u{1D00}' | // ᴀ  [LATIN LETTER SMALL CAPITAL A]
        '\u{1E00}' | // Ḁ  [LATIN CAPITAL LETTER A WITH RING BELOW]
        '\u{1EA0}' | // Ạ  [LATIN CAPITAL LETTER A WITH DOT BELOW]
        '\u{1EA2}' | // Ả  [LATIN CAPITAL LETTER A WITH HOOK ABOVE]
        '\u{1EA4}' | // Ấ  [LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND ACUTE]
        '\u{1EA6}' | // Ầ  [LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND GRAVE]
        '\u{1EA8}' | // Ẩ  [LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND HOOK ABOVE]
        '\u{1EAA}' | // Ẫ  [LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND TILDE]
        '\u{1EAC}' | // Ậ  [LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND DOT BELOW]
        '\u{1EAE}' | // Ắ  [LATIN CAPITAL LETTER A WITH BREVE AND ACUTE]
        '\u{1EB0}' | // Ằ  [LATIN CAPITAL LETTER A WITH BREVE AND GRAVE]
        '\u{1EB2}' | // Ẳ  [LATIN CAPITAL LETTER A WITH BREVE AND HOOK ABOVE]
        '\u{1EB4}' | // Ẵ  [LATIN CAPITAL LETTER A WITH BREVE AND TILDE]
        '\u{1EB6}' | // Ặ  [LATIN CAPITAL LETTER A WITH BREVE AND DOT BELOW]
        '\u{24B6}' | // Ⓐ  [CIRCLED LATIN CAPITAL LETTER A]
        '\u{FF21}'  // Ａ  [FULLWIDTH LATIN CAPITAL LETTER A]
        => Some("A"),
        '\u{00E0}' | // à  [LATIN SMALL LETTER A WITH GRAVE]
        '\u{00E1}' | // á  [LATIN SMALL LETTER A WITH ACUTE]
        '\u{00E2}' | // â  [LATIN SMALL LETTER A WITH CIRCUMFLEX]
        '\u{00E3}' | // ã  [LATIN SMALL LETTER A WITH TILDE]
        '\u{00E4}' | // ä  [LATIN SMALL LETTER A WITH DIAERESIS]
        '\u{00E5}' | // å  [LATIN SMALL LETTER A WITH RING ABOVE]
        '\u{0101}' | // ā  [LATIN SMALL LETTER A WITH MACRON]
        '\u{0103}' | // ă  [LATIN SMALL LETTER A WITH BREVE]
        '\u{0105}' | // ą  [LATIN SMALL LETTER A WITH OGONEK]
        '\u{01CE}' | // ǎ  [LATIN SMALL LETTER A WITH CARON]
        '\u{01DF}' | // ǟ  [LATIN SMALL LETTER A WITH DIAERESIS AND MACRON]
        '\u{01E1}' | // ǡ  [LATIN SMALL LETTER A WITH DOT ABOVE AND MACRON]
        '\u{01FB}' | // ǻ  [LATIN SMALL LETTER A WITH RING ABOVE AND ACUTE]
        '\u{0201}' | // ȁ  [LATIN SMALL LETTER A WITH DOUBLE GRAVE]
        '\u{0203}' | // ȃ  [LATIN SMALL LETTER A WITH INVERTED BREVE]
        '\u{0227}' | // ȧ  [LATIN SMALL LETTER A WITH DOT ABOVE]
        '\u{0250}' | // ɐ  [LATIN SMALL LETTER TURNED A]
        '\u{0259}' | // ə  [LATIN SMALL LETTER SCHWA]
        '\u{025A}' | // ɚ  [LATIN SMALL LETTER SCHWA WITH HOOK]
        '\u{1D8F}' | // ᶏ  [LATIN SMALL LETTER A WITH RETROFLEX HOOK]
        '\u{1D95}' | // ᶕ  [LATIN SMALL LETTER SCHWA WITH RETROFLEX HOOK]
        '\u{1E01}' | // ạ  [LATIN SMALL LETTER A WITH RING BELOW]
        '\u{1E9A}' | // ả  [LATIN SMALL LETTER A WITH RIGHT HALF RING]
        '\u{1EA1}' | // ạ  [LATIN SMALL LETTER A WITH DOT BELOW]
        '\u{1EA3}' | // ả  [LATIN SMALL LETTER A WITH HOOK ABOVE]
        '\u{1EA5}' | // ấ  [LATIN SMALL LETTER A WITH CIRCUMFLEX AND ACUTE]
        '\u{1EA7}' | // ầ  [LATIN SMALL LETTER A WITH CIRCUMFLEX AND GRAVE]
        '\u{1EA9}' | // ẩ  [LATIN SMALL LETTER A WITH CIRCUMFLEX AND HOOK ABOVE]
        '\u{1EAB}' | // ẫ  [LATIN SMALL LETTER A WITH CIRCUMFLEX AND TILDE]
        '\u{1EAD}' | // ậ  [LATIN SMALL LETTER A WITH CIRCUMFLEX AND DOT BELOW]
        '\u{1EAF}' | // ắ  [LATIN SMALL LETTER A WITH BREVE AND ACUTE]
        '\u{1EB1}' | // ằ  [LATIN SMALL LETTER A WITH BREVE AND GRAVE]
        '\u{1EB3}' | // ẳ  [LATIN SMALL LETTER A WITH BREVE AND HOOK ABOVE]
        '\u{1EB5}' | // ẵ  [LATIN SMALL LETTER A WITH BREVE AND TILDE]
        '\u{1EB7}' | // ặ  [LATIN SMALL LETTER A WITH BREVE AND DOT BELOW]
        '\u{2090}' | // ₐ  [LATIN SUBSCRIPT SMALL LETTER A]
        '\u{2094}' | // ₔ  [LATIN SUBSCRIPT SMALL LETTER SCHWA]
        '\u{24D0}' | // ⓐ  [CIRCLED LATIN SMALL LETTER A]
        '\u{2C65}' | // ⱥ  [LATIN SMALL LETTER A WITH STROKE]
        '\u{2C6F}' | // Ɐ  [LATIN CAPITAL LETTER TURNED A]
        '\u{FF41}'  // ａ  [FULLWIDTH LATIN SMALL LETTER A]
        => Some("a"),
        '\u{A732}'  // Ꜳ  [LATIN CAPITAL LETTER AA]
        => Some("AA"),
        '\u{00C6}' | // Æ  [LATIN CAPITAL LETTER AE]
        '\u{01E2}' | // Ǣ  [LATIN CAPITAL LETTER AE WITH MACRON]
        '\u{01FC}' | // Ǽ  [LATIN CAPITAL LETTER AE WITH ACUTE]
        '\u{1D01}' // ᴁ  [LATIN LETTER SMALL CAPITAL AE]
        => Some("AE"),
        '\u{A734}' // Ꜵ  [LATIN CAPITAL LETTER AO]
        => Some("AO"),
        '\u{A736}'  // Ꜷ  [LATIN CAPITAL LETTER AU]
        => Some("AU"),
        '\u{A738}' | // Ꜹ  [LATIN CAPITAL LETTER AV]
        '\u{A73A}'  // Ꜻ  [LATIN CAPITAL LETTER AV WITH HORIZONTAL BAR]
        => Some("AV"),
        '\u{A73C}'  // Ꜽ  [LATIN CAPITAL LETTER AY]
        => Some("AY"),
        '\u{249C}'  // ⒜  [PARENTHESIZED LATIN SMALL LETTER A]
        => Some("(a)"),
        '\u{A733}' // ꜳ  [LATIN SMALL LETTER AA]
        => Some("aa"),
        '\u{00E6}' | // æ  [LATIN SMALL LETTER AE]
        '\u{01E3}' | // ǣ  [LATIN SMALL LETTER AE WITH MACRON]
        '\u{01FD}' | // ǽ  [LATIN SMALL LETTER AE WITH ACUTE]
        '\u{1D02}' // ᴂ  [LATIN SMALL LETTER TURNED AE]
        => Some("ae"),
        '\u{A735}' // ꜵ  [LATIN SMALL LETTER AO]
        => Some("ao"),
        '\u{A737}' // ꜷ  [LATIN SMALL LETTER AU]
        => Some("au"),
        '\u{A739}' | // ꜹ  [LATIN SMALL LETTER AV]
        '\u{A73B}' // ꜻ  [LATIN SMALL LETTER AV WITH HORIZONTAL BAR]
        => Some("av"),
        '\u{A73D}' // ꜽ  [LATIN SMALL LETTER AY]
        => Some("ay"),
        '\u{0181}' | // Ɓ  [LATIN CAPITAL LETTER B WITH HOOK]
        '\u{0182}' | // Ƃ  [LATIN CAPITAL LETTER B WITH TOPBAR]
        '\u{0243}' | // Ƀ  [LATIN CAPITAL LETTER B WITH STROKE]
        '\u{0299}' | // ʙ  [LATIN LETTER SMALL CAPITAL B]
        '\u{1D03}' | // ᴃ  [LATIN LETTER SMALL CAPITAL BARRED B]
        '\u{1E02}' | // Ḃ  [LATIN CAPITAL LETTER B WITH DOT ABOVE]
        '\u{1E04}' | // Ḅ  [LATIN CAPITAL LETTER B WITH DOT BELOW]
        '\u{1E06}' | // Ḇ  [LATIN CAPITAL LETTER B WITH LINE BELOW]
        '\u{24B7}' | // Ⓑ  [CIRCLED LATIN CAPITAL LETTER B]
        '\u{FF22}' // Ｂ  [FULLWIDTH LATIN CAPITAL LETTER B]
        => Some("B"),
        '\u{0180}' | // ƀ  [LATIN SMALL LETTER B WITH STROKE]
        '\u{0183}' | // ƃ  [LATIN SMALL LETTER B WITH TOPBAR]
        '\u{0253}' | // ɓ  [LATIN SMALL LETTER B WITH HOOK]
        '\u{1D6C}' | // ᵬ  [LATIN SMALL LETTER B WITH MIDDLE TILDE]
        '\u{1D80}' | // ᶀ  [LATIN SMALL LETTER B WITH PALATAL HOOK]
        '\u{1E03}' | // ḃ  [LATIN SMALL LETTER B WITH DOT ABOVE]
        '\u{1E05}' | // ḅ  [LATIN SMALL LETTER B WITH DOT BELOW]
        '\u{1E07}' | // ḇ  [LATIN SMALL LETTER B WITH LINE BELOW]
        '\u{24D1}' | // ⓑ  [CIRCLED LATIN SMALL LETTER B]
        '\u{FF42}' // ｂ  [FULLWIDTH LATIN SMALL LETTER B]
        => Some("b"),
        '\u{249D}' // ⒝  [PARENTHESIZED LATIN SMALL LETTER B]
        => Some("(b)"),
        '\u{00C7}' | // Ç  [LATIN CAPITAL LETTER C WITH CEDILLA]
        '\u{0106}' | // Ć  [LATIN CAPITAL LETTER C WITH ACUTE]
        '\u{0108}' | // Ĉ  [LATIN CAPITAL LETTER C WITH CIRCUMFLEX]
        '\u{010A}' | // Ċ  [LATIN CAPITAL LETTER C WITH DOT ABOVE]
        '\u{010C}' | // Č  [LATIN CAPITAL LETTER C WITH CARON]
        '\u{0187}' | // Ƈ  [LATIN CAPITAL LETTER C WITH HOOK]
        '\u{023B}' | // Ȼ  [LATIN CAPITAL LETTER C WITH STROKE]
        '\u{0297}' | // ʗ  [LATIN LETTER STRETCHED C]
        '\u{1D04}' | // ᴄ  [LATIN LETTER SMALL CAPITAL C]
        '\u{1E08}' | // Ḉ  [LATIN CAPITAL LETTER C WITH CEDILLA AND ACUTE]
        '\u{24B8}' | // Ⓒ  [CIRCLED LATIN CAPITAL LETTER C]
        '\u{FF23}' // Ｃ  [FULLWIDTH LATIN CAPITAL LETTER C]
        => Some("C"),
        '\u{00E7}' | // ç  [LATIN SMALL LETTER C WITH CEDILLA]
        '\u{0107}' | // ć  [LATIN SMALL LETTER C WITH ACUTE]
        '\u{0109}' | // ĉ  [LATIN SMALL LETTER C WITH CIRCUMFLEX]
        '\u{010B}' | // ċ  [LATIN SMALL LETTER C WITH DOT ABOVE]
        '\u{010D}' | // č  [LATIN SMALL LETTER C WITH CARON]
        '\u{0188}' | // ƈ  [LATIN SMALL LETTER C WITH HOOK]
        '\u{023C}' | // ȼ  [LATIN SMALL LETTER C WITH STROKE]
        '\u{0255}' | // ɕ  [LATIN SMALL LETTER C WITH CURL]
        '\u{1E09}' | // ḉ  [LATIN SMALL LETTER C WITH CEDILLA AND ACUTE]
        '\u{2184}' | // ↄ  [LATIN SMALL LETTER REVERSED C]
        '\u{24D2}' | // ⓒ  [CIRCLED LATIN SMALL LETTER C]
        '\u{A73E}' | // Ꜿ  [LATIN CAPITAL LETTER REVERSED C WITH DOT]
        '\u{A73F}' | // ꜿ  [LATIN SMALL LETTER REVERSED C WITH DOT]
        '\u{FF43}' // ｃ  [FULLWIDTH LATIN SMALL LETTER C]
        => Some("c"),
        '\u{249E}' // ⒞  [PARENTHESIZED LATIN SMALL LETTER C]
        => Some("(c)"),
        '\u{00D0}' | // Ð  [LATIN CAPITAL LETTER ETH]
        '\u{010E}' | // Ď  [LATIN CAPITAL LETTER D WITH CARON]
        '\u{0110}' | // Đ  [LATIN CAPITAL LETTER D WITH STROKE]
        '\u{0189}' | // Ɖ  [LATIN CAPITAL LETTER AFRICAN D]
        '\u{018A}' | // Ɗ  [LATIN CAPITAL LETTER D WITH HOOK]
        '\u{018B}' | // Ƌ  [LATIN CAPITAL LETTER D WITH TOPBAR]
        '\u{1D05}' | // ᴅ  [LATIN LETTER SMALL CAPITAL D]
        '\u{1D06}' | // ᴆ  [LATIN LETTER SMALL CAPITAL ETH]
        '\u{1E0A}' | // Ḋ  [LATIN CAPITAL LETTER D WITH DOT ABOVE]
        '\u{1E0C}' | // Ḍ  [LATIN CAPITAL LETTER D WITH DOT BELOW]
        '\u{1E0E}' | // Ḏ  [LATIN CAPITAL LETTER D WITH LINE BELOW]
        '\u{1E10}' | // Ḑ  [LATIN CAPITAL LETTER D WITH CEDILLA]
        '\u{1E12}' | // Ḓ  [LATIN CAPITAL LETTER D WITH CIRCUMFLEX BELOW]
        '\u{24B9}' | // Ⓓ  [CIRCLED LATIN CAPITAL LETTER D]
        '\u{A779}' | // Ꝺ  [LATIN CAPITAL LETTER INSULAR D]
        '\u{FF24}' // Ｄ  [FULLWIDTH LATIN CAPITAL LETTER D]
        => Some("D"),
        '\u{00F0}' | // ð  [LATIN SMALL LETTER ETH]
        '\u{010F}' | // ď  [LATIN SMALL LETTER D WITH CARON]
        '\u{0111}' | // đ  [LATIN SMALL LETTER D WITH STROKE]
        '\u{018C}' | // ƌ  [LATIN SMALL LETTER D WITH TOPBAR]
        '\u{0221}' | // ȡ  [LATIN SMALL LETTER D WITH CURL]
        '\u{0256}' | // ɖ  [LATIN SMALL LETTER D WITH TAIL]
        '\u{0257}' | // ɗ  [LATIN SMALL LETTER D WITH HOOK]
        '\u{1D6D}' | // ᵭ  [LATIN SMALL LETTER D WITH MIDDLE TILDE]
        '\u{1D81}' | // ᶁ  [LATIN SMALL LETTER D WITH PALATAL HOOK]
        '\u{1D91}' | // ᶑ  [LATIN SMALL LETTER D WITH HOOK AND TAIL]
        '\u{1E0B}' | // ḋ  [LATIN SMALL LETTER D WITH DOT ABOVE]
        '\u{1E0D}' | // ḍ  [LATIN SMALL LETTER D WITH DOT BELOW]
        '\u{1E0F}' | // ḏ  [LATIN SMALL LETTER D WITH LINE BELOW]
        '\u{1E11}' | // ḑ  [LATIN SMALL LETTER D WITH CEDILLA]
        '\u{1E13}' | // ḓ  [LATIN SMALL LETTER D WITH CIRCUMFLEX BELOW]
        '\u{24D3}' | // ⓓ  [CIRCLED LATIN SMALL LETTER D]
        '\u{A77A}' | // ꝺ  [LATIN SMALL LETTER INSULAR D]
        '\u{FF44}' // ｄ  [FULLWIDTH LATIN SMALL LETTER D]
        => Some("d"),
        '\u{01C4}' | // Ǆ  [LATIN CAPITAL LETTER DZ WITH CARON]
        '\u{01F1}' // Ǳ  [LATIN CAPITAL LETTER DZ]
        => Some("DZ"),
        '\u{01C5}' | // ǅ  [LATIN CAPITAL LETTER D WITH SMALL LETTER Z WITH CARON]
        '\u{01F2}' // ǲ  [LATIN CAPITAL LETTER D WITH SMALL LETTER Z]
        => Some("Dz"),
        '\u{249F}' // ⒟  [PARENTHESIZED LATIN SMALL LETTER D]
        => Some("(d)"),
        '\u{0238}' // ȸ  [LATIN SMALL LETTER DB DIGRAPH]
        => Some("db"),
        '\u{01C6}' | // ǆ  [LATIN SMALL LETTER DZ WITH CARON]
        '\u{01F3}' | // ǳ  [LATIN SMALL LETTER DZ]
        '\u{02A3}' | // ʣ  [LATIN SMALL LETTER DZ DIGRAPH]
        '\u{02A5}' // ʥ  [LATIN SMALL LETTER DZ DIGRAPH WITH CURL]
        => Some("dz"),
        '\u{00C8}' | // È  [LATIN CAPITAL LETTER E WITH GRAVE]
        '\u{00C9}' | // É  [LATIN CAPITAL LETTER E WITH ACUTE]
        '\u{00CA}' | // Ê  [LATIN CAPITAL LETTER E WITH CIRCUMFLEX]
        '\u{00CB}' | // Ë  [LATIN CAPITAL LETTER E WITH DIAERESIS]
        '\u{0112}' | // Ē  [LATIN CAPITAL LETTER E WITH MACRON]
        '\u{0114}' | // Ĕ  [LATIN CAPITAL LETTER E WITH BREVE]
        '\u{0116}' | // Ė  [LATIN CAPITAL LETTER E WITH DOT ABOVE]
        '\u{0118}' | // Ę  [LATIN CAPITAL LETTER E WITH OGONEK]
        '\u{011A}' | // Ě  [LATIN CAPITAL LETTER E WITH CARON]
        '\u{018E}' | // Ǝ  [LATIN CAPITAL LETTER REVERSED E]
        '\u{0190}' | // Ɛ  [LATIN CAPITAL LETTER OPEN E]
        '\u{0204}' | // Ȅ  [LATIN CAPITAL LETTER E WITH DOUBLE GRAVE]
        '\u{0206}' | // Ȇ  [LATIN CAPITAL LETTER E WITH INVERTED BREVE]
        '\u{0228}' | // Ȩ  [LATIN CAPITAL LETTER E WITH CEDILLA]
        '\u{0246}' | // Ɇ  [LATIN CAPITAL LETTER E WITH STROKE]
        '\u{1D07}' | // ᴇ  [LATIN LETTER SMALL CAPITAL E]
        '\u{1E14}' | // Ḕ  [LATIN CAPITAL LETTER E WITH MACRON AND GRAVE]
        '\u{1E16}' | // Ḗ  [LATIN CAPITAL LETTER E WITH MACRON AND ACUTE]
        '\u{1E18}' | // Ḙ  [LATIN CAPITAL LETTER E WITH CIRCUMFLEX BELOW]
        '\u{1E1A}' | // Ḛ  [LATIN CAPITAL LETTER E WITH TILDE BELOW]
        '\u{1E1C}' | // Ḝ  [LATIN CAPITAL LETTER E WITH CEDILLA AND BREVE]
        '\u{1EB8}' | // Ẹ  [LATIN CAPITAL LETTER E WITH DOT BELOW]
        '\u{1EBA}' | // Ẻ  [LATIN CAPITAL LETTER E WITH HOOK ABOVE]
        '\u{1EBC}' | // Ẽ  [LATIN CAPITAL LETTER E WITH TILDE]
        '\u{1EBE}' | // Ế  [LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND ACUTE]
        '\u{1EC0}' | // Ề  [LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND GRAVE]
        '\u{1EC2}' | // Ể  [LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND HOOK ABOVE]
        '\u{1EC4}' | // Ễ  [LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND TILDE]
        '\u{1EC6}' | // Ệ  [LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND DOT BELOW]
        '\u{24BA}' | // Ⓔ  [CIRCLED LATIN CAPITAL LETTER E]
        '\u{2C7B}' | // ⱻ  [LATIN LETTER SMALL CAPITAL TURNED E]
        '\u{FF25}' // Ｅ  [FULLWIDTH LATIN CAPITAL LETTER E]
        => Some("E"),
        '\u{00E8}' | // è  [LATIN SMALL LETTER E WITH GRAVE]
        '\u{00E9}' | // é  [LATIN SMALL LETTER E WITH ACUTE]
        '\u{00EA}' | // ê  [LATIN SMALL LETTER E WITH CIRCUMFLEX]
        '\u{00EB}' | // ë  [LATIN SMALL LETTER E WITH DIAERESIS]
        '\u{0113}' | // ē  [LATIN SMALL LETTER E WITH MACRON]
        '\u{0115}' | // ĕ  [LATIN SMALL LETTER E WITH BREVE]
        '\u{0117}' | // ė  [LATIN SMALL LETTER E WITH DOT ABOVE]
        '\u{0119}' | // ę  [LATIN SMALL LETTER E WITH OGONEK]
        '\u{011B}' | // ě  [LATIN SMALL LETTER E WITH CARON]
        '\u{01DD}' | // ǝ  [LATIN SMALL LETTER TURNED E]
        '\u{0205}' | // ȅ  [LATIN SMALL LETTER E WITH DOUBLE GRAVE]
        '\u{0207}' | // ȇ  [LATIN SMALL LETTER E WITH INVERTED BREVE]
        '\u{0229}' | // ȩ  [LATIN SMALL LETTER E WITH CEDILLA]
        '\u{0247}' | // ɇ  [LATIN SMALL LETTER E WITH STROKE]
        '\u{0258}' | // ɘ  [LATIN SMALL LETTER REVERSED E]
        '\u{025B}' | // ɛ  [LATIN SMALL LETTER OPEN E]
        '\u{025C}' | // ɜ  [LATIN SMALL LETTER REVERSED OPEN E]
        '\u{025D}' | // ɝ  [LATIN SMALL LETTER REVERSED OPEN E WITH HOOK]
        '\u{025E}' | // ɞ  [LATIN SMALL LETTER CLOSED REVERSED OPEN E]
        '\u{029A}' | // ʚ  [LATIN SMALL LETTER CLOSED OPEN E]
        '\u{1D08}' | // ᴈ  [LATIN SMALL LETTER TURNED OPEN E]
        '\u{1D92}' | // ᶒ  [LATIN SMALL LETTER E WITH RETROFLEX HOOK]
        '\u{1D93}' | // ᶓ  [LATIN SMALL LETTER OPEN E WITH RETROFLEX HOOK]
        '\u{1D94}' | // ᶔ  [LATIN SMALL LETTER REVERSED OPEN E WITH RETROFLEX HOOK]
        '\u{1E15}' | // ḕ  [LATIN SMALL LETTER E WITH MACRON AND GRAVE]
        '\u{1E17}' | // ḗ  [LATIN SMALL LETTER E WITH MACRON AND ACUTE]
        '\u{1E19}' | // ḙ  [LATIN SMALL LETTER E WITH CIRCUMFLEX BELOW]
        '\u{1E1B}' | // ḛ  [LATIN SMALL LETTER E WITH TILDE BELOW]
        '\u{1E1D}' | // ḝ  [LATIN SMALL LETTER E WITH CEDILLA AND BREVE]
        '\u{1EB9}' | // ẹ  [LATIN SMALL LETTER E WITH DOT BELOW]
        '\u{1EBB}' | // ẻ  [LATIN SMALL LETTER E WITH HOOK ABOVE]
        '\u{1EBD}' | // ẽ  [LATIN SMALL LETTER E WITH TILDE]
        '\u{1EBF}' | // ế  [LATIN SMALL LETTER E WITH CIRCUMFLEX AND ACUTE]
        '\u{1EC1}' | // ề  [LATIN SMALL LETTER E WITH CIRCUMFLEX AND GRAVE]
        '\u{1EC3}' | // ể  [LATIN SMALL LETTER E WITH CIRCUMFLEX AND HOOK ABOVE]
        '\u{1EC5}' | // ễ  [LATIN SMALL LETTER E WITH CIRCUMFLEX AND TILDE]
        '\u{1EC7}' | // ệ  [LATIN SMALL LETTER E WITH CIRCUMFLEX AND DOT BELOW]
        '\u{2091}' | // ₑ  [LATIN SUBSCRIPT SMALL LETTER E]
        '\u{24D4}' | // ⓔ  [CIRCLED LATIN SMALL LETTER E]
        '\u{2C78}' | // ⱸ  [LATIN SMALL LETTER E WITH NOTCH]
        '\u{FF45}' // ｅ  [FULLWIDTH LATIN SMALL LETTER E]
        => Some("e"),
        '\u{24A0}' // ⒠  [PARENTHESIZED LATIN SMALL LETTER E]
        => Some("(e)"),
        '\u{0191}' | // Ƒ  [LATIN CAPITAL LETTER F WITH HOOK]
        '\u{1E1E}' | // Ḟ  [LATIN CAPITAL LETTER F WITH DOT ABOVE]
        '\u{24BB}' | // Ⓕ  [CIRCLED LATIN CAPITAL LETTER F]
        '\u{A730}' | // ꜰ  [LATIN LETTER SMALL CAPITAL F]
        '\u{A77B}' | // Ꝼ  [LATIN CAPITAL LETTER INSULAR F]
        '\u{A7FB}' | // ꟻ  [LATIN EPIGRAPHIC LETTER REVERSED F]
        '\u{FF26}' // Ｆ  [FULLWIDTH LATIN CAPITAL LETTER F]
        => Some("F"),
        '\u{0192}' | // ƒ  [LATIN SMALL LETTER F WITH HOOK]
        '\u{1D6E}' | // ᵮ  [LATIN SMALL LETTER F WITH MIDDLE TILDE]
        '\u{1D82}' | // ᶂ  [LATIN SMALL LETTER F WITH PALATAL HOOK]
        '\u{1E1F}' | // ḟ  [LATIN SMALL LETTER F WITH DOT ABOVE]
        '\u{1E9B}' | // ẛ  [LATIN SMALL LETTER LONG S WITH DOT ABOVE]
        '\u{24D5}' | // ⓕ  [CIRCLED LATIN SMALL LETTER F]
        '\u{A77C}' | // ꝼ  [LATIN SMALL LETTER INSULAR F]
        '\u{FF46}' // ｆ  [FULLWIDTH LATIN SMALL LETTER F]
        => Some("f"),
        '\u{24A1}' // ⒡  [PARENTHESIZED LATIN SMALL LETTER F]
        => Some("(f)"),
        '\u{FB00}' // ﬀ  [LATIN SMALL LIGATURE FF]
        => Some("ff"),
        '\u{FB03}' // ﬃ  [LATIN SMALL LIGATURE FFI]
        => Some("ffi"),
        '\u{FB04}' // ﬄ  [LATIN SMALL LIGATURE FFL]
        => Some("ffl"),
        '\u{FB01}' // ﬁ  [LATIN SMALL LIGATURE FI]
        => Some("fi"),
        '\u{FB02}' // ﬂ  [LATIN SMALL LIGATURE FL]
        => Some("fl"),
        '\u{011C}' | // Ĝ  [LATIN CAPITAL LETTER G WITH CIRCUMFLEX]
        '\u{011E}' | // Ğ  [LATIN CAPITAL LETTER G WITH BREVE]
        '\u{0120}' | // Ġ  [LATIN CAPITAL LETTER G WITH DOT ABOVE]
        '\u{0122}' | // Ģ  [LATIN CAPITAL LETTER G WITH CEDILLA]
        '\u{0193}' | // Ɠ  [LATIN CAPITAL LETTER G WITH HOOK]
        '\u{01E4}' | // Ǥ  [LATIN CAPITAL LETTER G WITH STROKE]
        '\u{01E5}' | // ǥ  [LATIN SMALL LETTER G WITH STROKE]
        '\u{01E6}' | // Ǧ  [LATIN CAPITAL LETTER G WITH CARON]
        '\u{01E7}' | // ǧ  [LATIN SMALL LETTER G WITH CARON]
        '\u{01F4}' | // Ǵ  [LATIN CAPITAL LETTER G WITH ACUTE]
        '\u{0262}' | // ɢ  [LATIN LETTER SMALL CAPITAL G]
        '\u{029B}' | // ʛ  [LATIN LETTER SMALL CAPITAL G WITH HOOK]
        '\u{1E20}' | // Ḡ  [LATIN CAPITAL LETTER G WITH MACRON]
        '\u{24BC}' | // Ⓖ  [CIRCLED LATIN CAPITAL LETTER G]
        '\u{A77D}' | // Ᵹ  [LATIN CAPITAL LETTER INSULAR G]
        '\u{A77E}' | // Ꝿ  [LATIN CAPITAL LETTER TURNED INSULAR G]
        '\u{FF27}' // Ｇ  [FULLWIDTH LATIN CAPITAL LETTER G]
        => Some("G"),
        '\u{011D}' | // ĝ  [LATIN SMALL LETTER G WITH CIRCUMFLEX]
        '\u{011F}' | // ğ  [LATIN SMALL LETTER G WITH BREVE]
        '\u{0121}' | // ġ  [LATIN SMALL LETTER G WITH DOT ABOVE]
        '\u{0123}' | // ģ  [LATIN SMALL LETTER G WITH CEDILLA]
        '\u{01F5}' | // ǵ  [LATIN SMALL LETTER G WITH ACUTE]
        '\u{0260}' | // ɠ  [LATIN SMALL LETTER G WITH HOOK]
        '\u{0261}' | // ɡ  [LATIN SMALL LETTER SCRIPT G]
        '\u{1D77}' | // ᵷ  [LATIN SMALL LETTER TURNED G]
        '\u{1D79}' | // ᵹ  [LATIN SMALL LETTER INSULAR G]
        '\u{1D83}' | // ᶃ  [LATIN SMALL LETTER G WITH PALATAL HOOK]
        '\u{1E21}' | // ḡ  [LATIN SMALL LETTER G WITH MACRON]
        '\u{24D6}' | // ⓖ  [CIRCLED LATIN SMALL LETTER G]
        '\u{A77F}' | // ꝿ  [LATIN SMALL LETTER TURNED INSULAR G]
        '\u{FF47}' // ｇ  [FULLWIDTH LATIN SMALL LETTER G]
        => Some("g"),
        '\u{24A2}' // ⒢  [PARENTHESIZED LATIN SMALL LETTER G]
        => Some("(g)"),
        '\u{0124}' | // Ĥ  [LATIN CAPITAL LETTER H WITH CIRCUMFLEX]
        '\u{0126}' | // Ħ  [LATIN CAPITAL LETTER H WITH STROKE]
        '\u{021E}' | // Ȟ  [LATIN CAPITAL LETTER H WITH CARON]
        '\u{029C}' | // ʜ  [LATIN LETTER SMALL CAPITAL H]
        '\u{1E22}' | // Ḣ  [LATIN CAPITAL LETTER H WITH DOT ABOVE]
        '\u{1E24}' | // Ḥ  [LATIN CAPITAL LETTER H WITH DOT BELOW]
        '\u{1E26}' | // Ḧ  [LATIN CAPITAL LETTER H WITH DIAERESIS]
        '\u{1E28}' | // Ḩ  [LATIN CAPITAL LETTER H WITH CEDILLA]
        '\u{1E2A}' | // Ḫ  [LATIN CAPITAL LETTER H WITH BREVE BELOW]
        '\u{24BD}' | // Ⓗ  [CIRCLED LATIN CAPITAL LETTER H]
        '\u{2C67}' | // Ⱨ  [LATIN CAPITAL LETTER H WITH DESCENDER]
        '\u{2C75}' | // Ⱶ  [LATIN CAPITAL LETTER HALF H]
        '\u{FF28}' // Ｈ  [FULLWIDTH LATIN CAPITAL LETTER H]
        => Some("H"),
        '\u{0125}' | // ĥ  [LATIN SMALL LETTER H WITH CIRCUMFLEX]
        '\u{0127}' | // ħ  [LATIN SMALL LETTER H WITH STROKE]
        '\u{021F}' | // ȟ  [LATIN SMALL LETTER H WITH CARON]
        '\u{0265}' | // ɥ  [LATIN SMALL LETTER TURNED H]
        '\u{0266}' | // ɦ  [LATIN SMALL LETTER H WITH HOOK]
        '\u{02AE}' | // ʮ  [LATIN SMALL LETTER TURNED H WITH FISHHOOK]
        '\u{02AF}' | // ʯ  [LATIN SMALL LETTER TURNED H WITH FISHHOOK AND TAIL]
        '\u{1E23}' | // ḣ  [LATIN SMALL LETTER H WITH DOT ABOVE]
        '\u{1E25}' | // ḥ  [LATIN SMALL LETTER H WITH DOT BELOW]
        '\u{1E27}' | // ḧ  [LATIN SMALL LETTER H WITH DIAERESIS]
        '\u{1E29}' | // ḩ  [LATIN SMALL LETTER H WITH CEDILLA]
        '\u{1E2B}' | // ḫ  [LATIN SMALL LETTER H WITH BREVE BELOW]
        '\u{1E96}' | // ẖ  [LATIN SMALL LETTER H WITH LINE BELOW]
        '\u{24D7}' | // ⓗ  [CIRCLED LATIN SMALL LETTER H]
        '\u{2C68}' | // ⱨ  [LATIN SMALL LETTER H WITH DESCENDER]
        '\u{2C76}' | // ⱶ  [LATIN SMALL LETTER HALF H]
        '\u{FF48}' // ｈ  [FULLWIDTH LATIN SMALL LETTER H]
        => Some("h"),
        '\u{01F6}' // Ƕ  http://en.wikipedia.org/wiki/Hwair  [LATIN CAPITAL LETTER HWAIR]
        => Some("HV"),
        '\u{24A3}' // ⒣  [PARENTHESIZED LATIN SMALL LETTER H]
        => Some("(h)"),
        '\u{0195}' // ƕ  [LATIN SMALL LETTER HV]
        => Some("hv"),
        '\u{00CC}' | // Ì  [LATIN CAPITAL LETTER I WITH GRAVE]
        '\u{00CD}' | // Í  [LATIN CAPITAL LETTER I WITH ACUTE]
        '\u{00CE}' | // Î  [LATIN CAPITAL LETTER I WITH CIRCUMFLEX]
        '\u{00CF}' | // Ï  [LATIN CAPITAL LETTER I WITH DIAERESIS]
        '\u{0128}' | // Ĩ  [LATIN CAPITAL LETTER I WITH TILDE]
        '\u{012A}' | // Ī  [LATIN CAPITAL LETTER I WITH MACRON]
        '\u{012C}' | // Ĭ  [LATIN CAPITAL LETTER I WITH BREVE]
        '\u{012E}' | // Į  [LATIN CAPITAL LETTER I WITH OGONEK]
        '\u{0130}' | // İ  [LATIN CAPITAL LETTER I WITH DOT ABOVE]
        '\u{0196}' | // Ɩ  [LATIN CAPITAL LETTER IOTA]
        '\u{0197}' | // Ɨ  [LATIN CAPITAL LETTER I WITH STROKE]
        '\u{01CF}' | // Ǐ  [LATIN CAPITAL LETTER I WITH CARON]
        '\u{0208}' | // Ȉ  [LATIN CAPITAL LETTER I WITH DOUBLE GRAVE]
        '\u{020A}' | // Ȋ  [LATIN CAPITAL LETTER I WITH INVERTED BREVE]
        '\u{026A}' | // ɪ  [LATIN LETTER SMALL CAPITAL I]
        '\u{1D7B}' | // ᵻ  [LATIN SMALL CAPITAL LETTER I WITH STROKE]
        '\u{1E2C}' | // Ḭ  [LATIN CAPITAL LETTER I WITH TILDE BELOW]
        '\u{1E2E}' | // Ḯ  [LATIN CAPITAL LETTER I WITH DIAERESIS AND ACUTE]
        '\u{1EC8}' | // Ỉ  [LATIN CAPITAL LETTER I WITH HOOK ABOVE]
        '\u{1ECA}' | // Ị  [LATIN CAPITAL LETTER I WITH DOT BELOW]
        '\u{24BE}' | // Ⓘ  [CIRCLED LATIN CAPITAL LETTER I]
        '\u{A7FE}' | // ꟾ  [LATIN EPIGRAPHIC LETTER I LONGA]
        '\u{FF29}' // Ｉ  [FULLWIDTH LATIN CAPITAL LETTER I]
        => Some("I"),
        '\u{00EC}' | // ì  [LATIN SMALL LETTER I WITH GRAVE]
        '\u{00ED}' | // í  [LATIN SMALL LETTER I WITH ACUTE]
        '\u{00EE}' | // î  [LATIN SMALL LETTER I WITH CIRCUMFLEX]
        '\u{00EF}' | // ï  [LATIN SMALL LETTER I WITH DIAERESIS]
        '\u{0129}' | // ĩ  [LATIN SMALL LETTER I WITH TILDE]
        '\u{012B}' | // ī  [LATIN SMALL LETTER I WITH MACRON]
        '\u{012D}' | // ĭ  [LATIN SMALL LETTER I WITH BREVE]
        '\u{012F}' | // į  [LATIN SMALL LETTER I WITH OGONEK]
        '\u{0131}' | // ı  [LATIN SMALL LETTER DOTLESS I]
        '\u{01D0}' | // ǐ  [LATIN SMALL LETTER I WITH CARON]
        '\u{0209}' | // ȉ  [LATIN SMALL LETTER I WITH DOUBLE GRAVE]
        '\u{020B}' | // ȋ  [LATIN SMALL LETTER I WITH INVERTED BREVE]
        '\u{0268}' | // ɨ  [LATIN SMALL LETTER I WITH STROKE]
        '\u{1D09}' | // ᴉ  [LATIN SMALL LETTER TURNED I]
        '\u{1D62}' | // ᵢ  [LATIN SUBSCRIPT SMALL LETTER I]
        '\u{1D7C}' | // ᵼ  [LATIN SMALL LETTER IOTA WITH STROKE]
        '\u{1D96}' | // ᶖ  [LATIN SMALL LETTER I WITH RETROFLEX HOOK]
        '\u{1E2D}' | // ḭ  [LATIN SMALL LETTER I WITH TILDE BELOW]
        '\u{1E2F}' | // ḯ  [LATIN SMALL LETTER I WITH DIAERESIS AND ACUTE]
        '\u{1EC9}' | // ỉ  [LATIN SMALL LETTER I WITH HOOK ABOVE]
        '\u{1ECB}' | // ị  [LATIN SMALL LETTER I WITH DOT BELOW]
        '\u{2071}' | // ⁱ  [SUPERSCRIPT LATIN SMALL LETTER I]
        '\u{24D8}' | // ⓘ  [CIRCLED LATIN SMALL LETTER I]
        '\u{FF49}' // ｉ  [FULLWIDTH LATIN SMALL LETTER I]
        => Some("i"),
        '\u{0132}' // Ĳ  [LATIN CAPITAL LIGATURE IJ]
        => Some("IJ"),
        '\u{24A4}' // ⒤  [PARENTHESIZED LATIN SMALL LETTER I]
        => Some("(i)"),
        '\u{0133}' // ĳ  [LATIN SMALL LIGATURE IJ]
        => Some("ij"),
        '\u{0134}' | // Ĵ  [LATIN CAPITAL LETTER J WITH CIRCUMFLEX]
        '\u{0248}' | // Ɉ  [LATIN CAPITAL LETTER J WITH STROKE]
        '\u{1D0A}' | // ᴊ  [LATIN LETTER SMALL CAPITAL J]
        '\u{24BF}' | // Ⓙ  [CIRCLED LATIN CAPITAL LETTER J]
        '\u{FF2A}' // Ｊ  [FULLWIDTH LATIN CAPITAL LETTER J]
        => Some("J"),
        '\u{0135}' | // ĵ  [LATIN SMALL LETTER J WITH CIRCUMFLEX]
        '\u{01F0}' | // ǰ  [LATIN SMALL LETTER J WITH CARON]
        '\u{0237}' | // ȷ  [LATIN SMALL LETTER DOTLESS J]
        '\u{0249}' | // ɉ  [LATIN SMALL LETTER J WITH STROKE]
        '\u{025F}' | // ɟ  [LATIN SMALL LETTER DOTLESS J WITH STROKE]
        '\u{0284}' | // ʄ  [LATIN SMALL LETTER DOTLESS J WITH STROKE AND HOOK]
        '\u{029D}' | // ʝ  [LATIN SMALL LETTER J WITH CROSSED-TAIL]
        '\u{24D9}' | // ⓙ  [CIRCLED LATIN SMALL LETTER J]
        '\u{2C7C}' | // ⱼ  [LATIN SUBSCRIPT SMALL LETTER J]
        '\u{FF4A}' // ｊ  [FULLWIDTH LATIN SMALL LETTER J]
        => Some("j"),
        '\u{24A5}' // ⒥  [PARENTHESIZED LATIN SMALL LETTER J]
        => Some("(j)"),
        '\u{0136}' | // Ķ  [LATIN CAPITAL LETTER K WITH CEDILLA]
        '\u{0198}' | // Ƙ  [LATIN CAPITAL LETTER K WITH HOOK]
        '\u{01E8}' | // Ǩ  [LATIN CAPITAL LETTER K WITH CARON]
        '\u{1D0B}' | // ᴋ  [LATIN LETTER SMALL CAPITAL K]
        '\u{1E30}' | // Ḱ  [LATIN CAPITAL LETTER K WITH ACUTE]
        '\u{1E32}' | // Ḳ  [LATIN CAPITAL LETTER K WITH DOT BELOW]
        '\u{1E34}' | // Ḵ  [LATIN CAPITAL LETTER K WITH LINE BELOW]
        '\u{24C0}' | // Ⓚ  [CIRCLED LATIN CAPITAL LETTER K]
        '\u{2C69}' | // Ⱪ  [LATIN CAPITAL LETTER K WITH DESCENDER]
        '\u{A740}' | // Ꝁ  [LATIN CAPITAL LETTER K WITH STROKE]
        '\u{A742}' | // Ꝃ  [LATIN CAPITAL LETTER K WITH DIAGONAL STROKE]
        '\u{A744}' | // Ꝅ  [LATIN CAPITAL LETTER K WITH STROKE AND DIAGONAL STROKE]
        '\u{FF2B}' // Ｋ  [FULLWIDTH LATIN CAPITAL LETTER K]
        => Some("K"),
        '\u{0137}' | // ķ  [LATIN SMALL LETTER K WITH CEDILLA]
        '\u{0199}' | // ƙ  [LATIN SMALL LETTER K WITH HOOK]
        '\u{01E9}' | // ǩ  [LATIN SMALL LETTER K WITH CARON]
        '\u{029E}' | // ʞ  [LATIN SMALL LETTER TURNED K]
        '\u{1D84}' | // ᶄ  [LATIN SMALL LETTER K WITH PALATAL HOOK]
        '\u{1E31}' | // ḱ  [LATIN SMALL LETTER K WITH ACUTE]
        '\u{1E33}' | // ḳ  [LATIN SMALL LETTER K WITH DOT BELOW]
        '\u{1E35}' | // ḵ  [LATIN SMALL LETTER K WITH LINE BELOW]
        '\u{24DA}' | // ⓚ  [CIRCLED LATIN SMALL LETTER K]
        '\u{2C6A}' | // ⱪ  [LATIN SMALL LETTER K WITH DESCENDER]
        '\u{A741}' | // ꝁ  [LATIN SMALL LETTER K WITH STROKE]
        '\u{A743}' | // ꝃ  [LATIN SMALL LETTER K WITH DIAGONAL STROKE]
        '\u{A745}' | // ꝅ  [LATIN SMALL LETTER K WITH STROKE AND DIAGONAL STROKE]
        '\u{FF4B}' // ｋ  [FULLWIDTH LATIN SMALL LETTER K]
        => Some("k"),
        '\u{24A6}' // ⒦  [PARENTHESIZED LATIN SMALL LETTER K]
        => Some("(k)"),
        '\u{0139}' | // Ĺ  [LATIN CAPITAL LETTER L WITH ACUTE]
        '\u{013B}' | // Ļ  [LATIN CAPITAL LETTER L WITH CEDILLA]
        '\u{013D}' | // Ľ  [LATIN CAPITAL LETTER L WITH CARON]
        '\u{013F}' | // Ŀ  [LATIN CAPITAL LETTER L WITH MIDDLE DOT]
        '\u{0141}' | // Ł  [LATIN CAPITAL LETTER L WITH STROKE]
        '\u{023D}' | // Ƚ  [LATIN CAPITAL LETTER L WITH BAR]
        '\u{029F}' | // ʟ  [LATIN LETTER SMALL CAPITAL L]
        '\u{1D0C}' | // ᴌ  [LATIN LETTER SMALL CAPITAL L WITH STROKE]
        '\u{1E36}' | // Ḷ  [LATIN CAPITAL LETTER L WITH DOT BELOW]
        '\u{1E38}' | // Ḹ  [LATIN CAPITAL LETTER L WITH DOT BELOW AND MACRON]
        '\u{1E3A}' | // Ḻ  [LATIN CAPITAL LETTER L WITH LINE BELOW]
        '\u{1E3C}' | // Ḽ  [LATIN CAPITAL LETTER L WITH CIRCUMFLEX BELOW]
        '\u{24C1}' | // Ⓛ  [CIRCLED LATIN CAPITAL LETTER L]
        '\u{2C60}' | // Ⱡ  [LATIN CAPITAL LETTER L WITH DOUBLE BAR]
        '\u{2C62}' | // Ɫ  [LATIN CAPITAL LETTER L WITH MIDDLE TILDE]
        '\u{A746}' | // Ꝇ  [LATIN CAPITAL LETTER BROKEN L]
        '\u{A748}' | // Ꝉ  [LATIN CAPITAL LETTER L WITH HIGH STROKE]
        '\u{A780}' | // Ꞁ  [LATIN CAPITAL LETTER TURNED L]
        '\u{FF2C}' // Ｌ  [FULLWIDTH LATIN CAPITAL LETTER L]
        => Some("L"),
        '\u{013A}' | // ĺ  [LATIN SMALL LETTER L WITH ACUTE]
        '\u{013C}' | // ļ  [LATIN SMALL LETTER L WITH CEDILLA]
        '\u{013E}' | // ľ  [LATIN SMALL LETTER L WITH CARON]
        '\u{0140}' | // ŀ  [LATIN SMALL LETTER L WITH MIDDLE DOT]
        '\u{0142}' | // ł  [LATIN SMALL LETTER L WITH STROKE]
        '\u{019A}' | // ƚ  [LATIN SMALL LETTER L WITH BAR]
        '\u{0234}' | // ȴ  [LATIN SMALL LETTER L WITH CURL]
        '\u{026B}' | // ɫ  [LATIN SMALL LETTER L WITH MIDDLE TILDE]
        '\u{026C}' | // ɬ  [LATIN SMALL LETTER L WITH BELT]
        '\u{026D}' | // ɭ  [LATIN SMALL LETTER L WITH RETROFLEX HOOK]
        '\u{1D85}' | // ᶅ  [LATIN SMALL LETTER L WITH PALATAL HOOK]
        '\u{1E37}' | // ḷ  [LATIN SMALL LETTER L WITH DOT BELOW]
        '\u{1E39}' | // ḹ  [LATIN SMALL LETTER L WITH DOT BELOW AND MACRON]
        '\u{1E3B}' | // ḻ  [LATIN SMALL LETTER L WITH LINE BELOW]
        '\u{1E3D}' | // ḽ  [LATIN SMALL LETTER L WITH CIRCUMFLEX BELOW]
        '\u{24DB}' | // ⓛ  [CIRCLED LATIN SMALL LETTER L]
        '\u{2C61}' | // ⱡ  [LATIN SMALL LETTER L WITH DOUBLE BAR]
        '\u{A747}' | // ꝇ  [LATIN SMALL LETTER BROKEN L]
        '\u{A749}' | // ꝉ  [LATIN SMALL LETTER L WITH HIGH STROKE]
        '\u{A781}' | // ꞁ  [LATIN SMALL LETTER TURNED L]
        '\u{FF4C}' // ｌ  [FULLWIDTH LATIN SMALL LETTER L]
        => Some("l"),
        '\u{01C7}' // Ǉ  [LATIN CAPITAL LETTER LJ]
        => Some("LJ"),
        '\u{1EFA}' // Ỻ  [LATIN CAPITAL LETTER MIDDLE-WELSH LL]
        => Some("LL"),
        '\u{01C8}' // ǈ  [LATIN CAPITAL LETTER L WITH SMALL LETTER J]
        => Some("Lj"),
        '\u{24A7}' // ⒧  [PARENTHESIZED LATIN SMALL LETTER L]
        => Some("(l)"),
        '\u{01C9}' // ǉ  [LATIN SMALL LETTER LJ]
        => Some("lj"),
        '\u{1EFB}' // ỻ  [LATIN SMALL LETTER MIDDLE-WELSH LL]
        => Some("ll"),
        '\u{02AA}' // ʪ  [LATIN SMALL LETTER LS DIGRAPH]
        => Some("ls"),
        '\u{02AB}' // ʫ  [LATIN SMALL LETTER LZ DIGRAPH]
        => Some("lz"),
        '\u{019C}' | // Ɯ  [LATIN CAPITAL LETTER TURNED M]
        '\u{1D0D}' | // ᴍ  [LATIN LETTER SMALL CAPITAL M]
        '\u{1E3E}' | // Ḿ  [LATIN CAPITAL LETTER M WITH ACUTE]
        '\u{1E40}' | // Ṁ  [LATIN CAPITAL LETTER M WITH DOT ABOVE]
        '\u{1E42}' | // Ṃ  [LATIN CAPITAL LETTER M WITH DOT BELOW]
        '\u{24C2}' | // Ⓜ  [CIRCLED LATIN CAPITAL LETTER M]
        '\u{2C6E}' | // Ɱ  [LATIN CAPITAL LETTER M WITH HOOK]
        '\u{A7FD}' | // ꟽ  [LATIN EPIGRAPHIC LETTER INVERTED M]
        '\u{A7FF}' | // ꟿ  [LATIN EPIGRAPHIC LETTER ARCHAIC M]
        '\u{FF2D}' // Ｍ  [FULLWIDTH LATIN CAPITAL LETTER M]
        => Some("M"),
        '\u{026F}' | // ɯ  [LATIN SMALL LETTER TURNED M]
        '\u{0270}' | // ɰ  [LATIN SMALL LETTER TURNED M WITH LONG LEG]
        '\u{0271}' | // ɱ  [LATIN SMALL LETTER M WITH HOOK]
        '\u{1D6F}' | // ᵯ  [LATIN SMALL LETTER M WITH MIDDLE TILDE]
        '\u{1D86}' | // ᶆ  [LATIN SMALL LETTER M WITH PALATAL HOOK]
        '\u{1E3F}' | // ḿ  [LATIN SMALL LETTER M WITH ACUTE]
        '\u{1E41}' | // ṁ  [LATIN SMALL LETTER M WITH DOT ABOVE]
        '\u{1E43}' | // ṃ  [LATIN SMALL LETTER M WITH DOT BELOW]
        '\u{24DC}' | // ⓜ  [CIRCLED LATIN SMALL LETTER M]
        '\u{FF4D}' // ｍ  [FULLWIDTH LATIN SMALL LETTER M]
        => Some("m"),
        '\u{24A8}' // ⒨  [PARENTHESIZED LATIN SMALL LETTER M]
        => Some("(m)"),
        '\u{00D1}' | // Ñ  [LATIN CAPITAL LETTER N WITH TILDE]
        '\u{0143}' | // Ń  [LATIN CAPITAL LETTER N WITH ACUTE]
        '\u{0145}' | // Ņ  [LATIN CAPITAL LETTER N WITH CEDILLA]
        '\u{0147}' | // Ň  [LATIN CAPITAL LETTER N WITH CARON]
        '\u{014A}' | // Ŋ  http://en.wikipedia.org/wiki/Eng_(letter)  [LATIN CAPITAL LETTER ENG]
        '\u{019D}' | // Ɲ  [LATIN CAPITAL LETTER N WITH LEFT HOOK]
        '\u{01F8}' | // Ǹ  [LATIN CAPITAL LETTER N WITH GRAVE]
        '\u{0220}' | // Ƞ  [LATIN CAPITAL LETTER N WITH LONG RIGHT LEG]
        '\u{0274}' | // ɴ  [LATIN LETTER SMALL CAPITAL N]
        '\u{1D0E}' | // ᴎ  [LATIN LETTER SMALL CAPITAL REVERSED N]
        '\u{1E44}' | // Ṅ  [LATIN CAPITAL LETTER N WITH DOT ABOVE]
        '\u{1E46}' | // Ṇ  [LATIN CAPITAL LETTER N WITH DOT BELOW]
        '\u{1E48}' | // Ṉ  [LATIN CAPITAL LETTER N WITH LINE BELOW]
        '\u{1E4A}' | // Ṋ  [LATIN CAPITAL LETTER N WITH CIRCUMFLEX BELOW]
        '\u{24C3}' | // Ⓝ  [CIRCLED LATIN CAPITAL LETTER N]
        '\u{FF2E}' // Ｎ  [FULLWIDTH LATIN CAPITAL LETTER N]
        => Some("N"),
        '\u{00F1}' | // ñ  [LATIN SMALL LETTER N WITH TILDE]
        '\u{0144}' | // ń  [LATIN SMALL LETTER N WITH ACUTE]
        '\u{0146}' | // ņ  [LATIN SMALL LETTER N WITH CEDILLA]
        '\u{0148}' | // ň  [LATIN SMALL LETTER N WITH CARON]
        '\u{0149}' | // ŉ  [LATIN SMALL LETTER N PRECEDED BY APOSTROPHE]
        '\u{014B}' | // ŋ  http://en.wikipedia.org/wiki/Eng_(letter)  [LATIN SMALL LETTER ENG]
        '\u{019E}' | // ƞ  [LATIN SMALL LETTER N WITH LONG RIGHT LEG]
        '\u{01F9}' | // ǹ  [LATIN SMALL LETTER N WITH GRAVE]
        '\u{0235}' | // ȵ  [LATIN SMALL LETTER N WITH CURL]
        '\u{0272}' | // ɲ  [LATIN SMALL LETTER N WITH LEFT HOOK]
        '\u{0273}' | // ɳ  [LATIN SMALL LETTER N WITH RETROFLEX HOOK]
        '\u{1D70}' | // ᵰ  [LATIN SMALL LETTER N WITH MIDDLE TILDE]
        '\u{1D87}' | // ᶇ  [LATIN SMALL LETTER N WITH PALATAL HOOK]
        '\u{1E45}' | // ṅ  [LATIN SMALL LETTER N WITH DOT ABOVE]
        '\u{1E47}' | // ṇ  [LATIN SMALL LETTER N WITH DOT BELOW]
        '\u{1E49}' | // ṉ  [LATIN SMALL LETTER N WITH LINE BELOW]
        '\u{1E4B}' | // ṋ  [LATIN SMALL LETTER N WITH CIRCUMFLEX BELOW]
        '\u{207F}' | // ⁿ  [SUPERSCRIPT LATIN SMALL LETTER N]
        '\u{24DD}' | // ⓝ  [CIRCLED LATIN SMALL LETTER N]
        '\u{FF4E}' // ｎ  [FULLWIDTH LATIN SMALL LETTER N]
        => Some("n"),
        '\u{01CA}' // Ǌ  [LATIN CAPITAL LETTER NJ]
        => Some("NJ"),
        '\u{01CB}' // ǋ  [LATIN CAPITAL LETTER N WITH SMALL LETTER J]
        => Some("Nj"),
        '\u{24A9}' // ⒩  [PARENTHESIZED LATIN SMALL LETTER N]
        => Some("(n)"),
        '\u{01CC}' // ǌ  [LATIN SMALL LETTER NJ]
        => Some("nj"),
        '\u{00D2}' | // Ò  [LATIN CAPITAL LETTER O WITH GRAVE]
        '\u{00D3}' | // Ó  [LATIN CAPITAL LETTER O WITH ACUTE]
        '\u{00D4}' | // Ô  [LATIN CAPITAL LETTER O WITH CIRCUMFLEX]
        '\u{00D5}' | // Õ  [LATIN CAPITAL LETTER O WITH TILDE]
        '\u{00D6}' | // Ö  [LATIN CAPITAL LETTER O WITH DIAERESIS]
        '\u{00D8}' | // Ø  [LATIN CAPITAL LETTER O WITH STROKE]
        '\u{014C}' | // Ō  [LATIN CAPITAL LETTER O WITH MACRON]
        '\u{014E}' | // Ŏ  [LATIN CAPITAL LETTER O WITH BREVE]
        '\u{0150}' | // Ő  [LATIN CAPITAL LETTER O WITH DOUBLE ACUTE]
        '\u{0186}' | // Ɔ  [LATIN CAPITAL LETTER OPEN O]
        '\u{019F}' | // Ɵ  [LATIN CAPITAL LETTER O WITH MIDDLE TILDE]
        '\u{01A0}' | // Ơ  [LATIN CAPITAL LETTER O WITH HORN]
        '\u{01D1}' | // Ǒ  [LATIN CAPITAL LETTER O WITH CARON]
        '\u{01EA}' | // Ǫ  [LATIN CAPITAL LETTER O WITH OGONEK]
        '\u{01EC}' | // Ǭ  [LATIN CAPITAL LETTER O WITH OGONEK AND MACRON]
        '\u{01FE}' | // Ǿ  [LATIN CAPITAL LETTER O WITH STROKE AND ACUTE]
        '\u{020C}' | // Ȍ  [LATIN CAPITAL LETTER O WITH DOUBLE GRAVE]
        '\u{020E}' | // Ȏ  [LATIN CAPITAL LETTER O WITH INVERTED BREVE]
        '\u{022A}' | // Ȫ  [LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON]
        '\u{022C}' | // Ȭ  [LATIN CAPITAL LETTER O WITH TILDE AND MACRON]
        '\u{022E}' | // Ȯ  [LATIN CAPITAL LETTER O WITH DOT ABOVE]
        '\u{0230}' | // Ȱ  [LATIN CAPITAL LETTER O WITH DOT ABOVE AND MACRON]
        '\u{1D0F}' | // ᴏ  [LATIN LETTER SMALL CAPITAL O]
        '\u{1D10}' | // ᴐ  [LATIN LETTER SMALL CAPITAL OPEN O]
        '\u{1E4C}' | // Ṍ  [LATIN CAPITAL LETTER O WITH TILDE AND ACUTE]
        '\u{1E4E}' | // Ṏ  [LATIN CAPITAL LETTER O WITH TILDE AND DIAERESIS]
        '\u{1E50}' | // Ṑ  [LATIN CAPITAL LETTER O WITH MACRON AND GRAVE]
        '\u{1E52}' | // Ṓ  [LATIN CAPITAL LETTER O WITH MACRON AND ACUTE]
        '\u{1ECC}' | // Ọ  [LATIN CAPITAL LETTER O WITH DOT BELOW]
        '\u{1ECE}' | // Ỏ  [LATIN CAPITAL LETTER O WITH HOOK ABOVE]
        '\u{1ED0}' | // Ố  [LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND ACUTE]
        '\u{1ED2}' | // Ồ  [LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND GRAVE]
        '\u{1ED4}' | // Ổ  [LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND HOOK ABOVE]
        '\u{1ED6}' | // Ỗ  [LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND TILDE]
        '\u{1ED8}' | // Ộ  [LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND DOT BELOW]
        '\u{1EDA}' | // Ớ  [LATIN CAPITAL LETTER O WITH HORN AND ACUTE]
        '\u{1EDC}' | // Ờ  [LATIN CAPITAL LETTER O WITH HORN AND GRAVE]
        '\u{1EDE}' | // Ở  [LATIN CAPITAL LETTER O WITH HORN AND HOOK ABOVE]
        '\u{1EE0}' | // Ỡ  [LATIN CAPITAL LETTER O WITH HORN AND TILDE]
        '\u{1EE2}' | // Ợ  [LATIN CAPITAL LETTER O WITH HORN AND DOT BELOW]
        '\u{24C4}' | // Ⓞ  [CIRCLED LATIN CAPITAL LETTER O]
        '\u{A74A}' | // Ꝋ  [LATIN CAPITAL LETTER O WITH LONG STROKE OVERLAY]
        '\u{A74C}' | // Ꝍ  [LATIN CAPITAL LETTER O WITH LOOP]
        '\u{FF2F}' // Ｏ  [FULLWIDTH LATIN CAPITAL LETTER O]
        => Some("O"),
        '\u{00F2}' | // ò  [LATIN SMALL LETTER O WITH GRAVE]
        '\u{00F3}' | // ó  [LATIN SMALL LETTER O WITH ACUTE]
        '\u{00F4}' | // ô  [LATIN SMALL LETTER O WITH CIRCUMFLEX]
        '\u{00F5}' | // õ  [LATIN SMALL LETTER O WITH TILDE]
        '\u{00F6}' | // ö  [LATIN SMALL LETTER O WITH DIAERESIS]
        '\u{00F8}' | // ø  [LATIN SMALL LETTER O WITH STROKE]
        '\u{014D}' | // ō  [LATIN SMALL LETTER O WITH MACRON]
        '\u{014F}' | // ŏ  [LATIN SMALL LETTER O WITH BREVE]
        '\u{0151}' | // ő  [LATIN SMALL LETTER O WITH DOUBLE ACUTE]
        '\u{01A1}' | // ơ  [LATIN SMALL LETTER O WITH HORN]
        '\u{01D2}' | // ǒ  [LATIN SMALL LETTER O WITH CARON]
        '\u{01EB}' | // ǫ  [LATIN SMALL LETTER O WITH OGONEK]
        '\u{01ED}' | // ǭ  [LATIN SMALL LETTER O WITH OGONEK AND MACRON]
        '\u{01FF}' | // ǿ  [LATIN SMALL LETTER O WITH STROKE AND ACUTE]
        '\u{020D}' | // ȍ  [LATIN SMALL LETTER O WITH DOUBLE GRAVE]
        '\u{020F}' | // ȏ  [LATIN SMALL LETTER O WITH INVERTED BREVE]
        '\u{022B}' | // ȫ  [LATIN SMALL LETTER O WITH DIAERESIS AND MACRON]
        '\u{022D}' | // ȭ  [LATIN SMALL LETTER O WITH TILDE AND MACRON]
        '\u{022F}' | // ȯ  [LATIN SMALL LETTER O WITH DOT ABOVE]
        '\u{0231}' | // ȱ  [LATIN SMALL LETTER O WITH DOT ABOVE AND MACRON]
        '\u{0254}' | // ɔ  [LATIN SMALL LETTER OPEN O]
        '\u{0275}' | // ɵ  [LATIN SMALL LETTER BARRED O]
        '\u{1D16}' | // ᴖ  [LATIN SMALL LETTER TOP HALF O]
        '\u{1D17}' | // ᴗ  [LATIN SMALL LETTER BOTTOM HALF O]
        '\u{1D97}' | // ᶗ  [LATIN SMALL LETTER OPEN O WITH RETROFLEX HOOK]
        '\u{1E4D}' | // ṍ  [LATIN SMALL LETTER O WITH TILDE AND ACUTE]
        '\u{1E4F}' | // ṏ  [LATIN SMALL LETTER O WITH TILDE AND DIAERESIS]
        '\u{1E51}' | // ṑ  [LATIN SMALL LETTER O WITH MACRON AND GRAVE]
        '\u{1E53}' | // ṓ  [LATIN SMALL LETTER O WITH MACRON AND ACUTE]
        '\u{1ECD}' | // ọ  [LATIN SMALL LETTER O WITH DOT BELOW]
        '\u{1ECF}' | // ỏ  [LATIN SMALL LETTER O WITH HOOK ABOVE]
        '\u{1ED1}' | // ố  [LATIN SMALL LETTER O WITH CIRCUMFLEX AND ACUTE]
        '\u{1ED3}' | // ồ  [LATIN SMALL LETTER O WITH CIRCUMFLEX AND GRAVE]
        '\u{1ED5}' | // ổ  [LATIN SMALL LETTER O WITH CIRCUMFLEX AND HOOK ABOVE]
        '\u{1ED7}' | // ỗ  [LATIN SMALL LETTER O WITH CIRCUMFLEX AND TILDE]
        '\u{1ED9}' | // ộ  [LATIN SMALL LETTER O WITH CIRCUMFLEX AND DOT BELOW]
        '\u{1EDB}' | // ớ  [LATIN SMALL LETTER O WITH HORN AND ACUTE]
        '\u{1EDD}' | // ờ  [LATIN SMALL LETTER O WITH HORN AND GRAVE]
        '\u{1EDF}' | // ở  [LATIN SMALL LETTER O WITH HORN AND HOOK ABOVE]
        '\u{1EE1}' | // ỡ  [LATIN SMALL LETTER O WITH HORN AND TILDE]
        '\u{1EE3}' | // ợ  [LATIN SMALL LETTER O WITH HORN AND DOT BELOW]
        '\u{2092}' | // ₒ  [LATIN SUBSCRIPT SMALL LETTER O]
        '\u{24DE}' | // ⓞ  [CIRCLED LATIN SMALL LETTER O]
        '\u{2C7A}' | // ⱺ  [LATIN SMALL LETTER O WITH LOW RING INSIDE]
        '\u{A74B}' | // ꝋ  [LATIN SMALL LETTER O WITH LONG STROKE OVERLAY]
        '\u{A74D}' | // ꝍ  [LATIN SMALL LETTER O WITH LOOP]
        '\u{FF4F}' // ｏ  [FULLWIDTH LATIN SMALL LETTER O]
        => Some("o"),
        '\u{0152}' | // Œ  [LATIN CAPITAL LIGATURE OE]
        '\u{0276}' // ɶ  [LATIN LETTER SMALL CAPITAL OE]
        => Some("OE"),
        '\u{A74E}' // Ꝏ  [LATIN CAPITAL LETTER OO]
        => Some("OO"),
        '\u{0222}' | // Ȣ  http://en.wikipedia.org/wiki/OU  [LATIN CAPITAL LETTER OU]
        '\u{1D15}' // ᴕ  [LATIN LETTER SMALL CAPITAL OU]
        => Some("OU"),
        '\u{24AA}' // ⒪  [PARENTHESIZED LATIN SMALL LETTER O]
        => Some("(o)"),
        '\u{0153}' | // œ  [LATIN SMALL LIGATURE OE]
        '\u{1D14}' // ᴔ  [LATIN SMALL LETTER TURNED OE]
        => Some("oe"),
        '\u{A74F}' // ꝏ  [LATIN SMALL LETTER OO]
        => Some("oo"),
        '\u{0223}' // ȣ  http://en.wikipedia.org/wiki/OU  [LATIN SMALL LETTER OU]
        => Some("ou"),
        '\u{01A4}' | // Ƥ  [LATIN CAPITAL LETTER P WITH HOOK]
        '\u{1D18}' | // ᴘ  [LATIN LETTER SMALL CAPITAL P]
        '\u{1E54}' | // Ṕ  [LATIN CAPITAL LETTER P WITH ACUTE]
        '\u{1E56}' | // Ṗ  [LATIN CAPITAL LETTER P WITH DOT ABOVE]
        '\u{24C5}' | // Ⓟ  [CIRCLED LATIN CAPITAL LETTER P]
        '\u{2C63}' | // Ᵽ  [LATIN CAPITAL LETTER P WITH STROKE]
        '\u{A750}' | // Ꝑ  [LATIN CAPITAL LETTER P WITH STROKE THROUGH DESCENDER]
        '\u{A752}' | // Ꝓ  [LATIN CAPITAL LETTER P WITH FLOURISH]
        '\u{A754}' | // Ꝕ  [LATIN CAPITAL LETTER P WITH SQUIRREL TAIL]
        '\u{FF30}' // Ｐ  [FULLWIDTH LATIN CAPITAL LETTER P]
        => Some("P"),
        '\u{01A5}' | // ƥ  [LATIN SMALL LETTER P WITH HOOK]
        '\u{1D71}' | // ᵱ  [LATIN SMALL LETTER P WITH MIDDLE TILDE]
        '\u{1D7D}' | // ᵽ  [LATIN SMALL LETTER P WITH STROKE]
        '\u{1D88}' | // ᶈ  [LATIN SMALL LETTER P WITH PALATAL HOOK]
        '\u{1E55}' | // ṕ  [LATIN SMALL LETTER P WITH ACUTE]
        '\u{1E57}' | // ṗ  [LATIN SMALL LETTER P WITH DOT ABOVE]
        '\u{24DF}' | // ⓟ  [CIRCLED LATIN SMALL LETTER P]
        '\u{A751}' | // ꝑ  [LATIN SMALL LETTER P WITH STROKE THROUGH DESCENDER]
        '\u{A753}' | // ꝓ  [LATIN SMALL LETTER P WITH FLOURISH]
        '\u{A755}' | // ꝕ  [LATIN SMALL LETTER P WITH SQUIRREL TAIL]
        '\u{A7FC}' | // ꟼ  [LATIN EPIGRAPHIC LETTER REVERSED P]
        '\u{FF50}' // ｐ  [FULLWIDTH LATIN SMALL LETTER P]
        => Some("p"),
        '\u{24AB}' // ⒫  [PARENTHESIZED LATIN SMALL LETTER P]
        => Some("(p)"),
        '\u{024A}' | // Ɋ  [LATIN CAPITAL LETTER SMALL Q WITH HOOK TAIL]
        '\u{24C6}' | // Ⓠ  [CIRCLED LATIN CAPITAL LETTER Q]
        '\u{A756}' | // Ꝗ  [LATIN CAPITAL LETTER Q WITH STROKE THROUGH DESCENDER]
        '\u{A758}' | // Ꝙ  [LATIN CAPITAL LETTER Q WITH DIAGONAL STROKE]
        '\u{FF31}' // Ｑ  [FULLWIDTH LATIN CAPITAL LETTER Q]
        => Some("Q"),
        '\u{0138}' | // ĸ  http://en.wikipedia.org/wiki/Kra_(letter)  [LATIN SMALL LETTER KRA]
        '\u{024B}' | // ɋ  [LATIN SMALL LETTER Q WITH HOOK TAIL]
        '\u{02A0}' | // ʠ  [LATIN SMALL LETTER Q WITH HOOK]
        '\u{24E0}' | // ⓠ  [CIRCLED LATIN SMALL LETTER Q]
        '\u{A757}' | // ꝗ  [LATIN SMALL LETTER Q WITH STROKE THROUGH DESCENDER]
        '\u{A759}' | // ꝙ  [LATIN SMALL LETTER Q WITH DIAGONAL STROKE]
        '\u{FF51}' // ｑ  [FULLWIDTH LATIN SMALL LETTER Q]
        => Some("q"),
        '\u{24AC}' // ⒬  [PARENTHESIZED LATIN SMALL LETTER Q]
        => Some("(q)"),
        '\u{0239}' // ȹ  [LATIN SMALL LETTER QP DIGRAPH]
        => Some("qp"),
        '\u{0154}' | // Ŕ  [LATIN CAPITAL LETTER R WITH ACUTE]
        '\u{0156}' | // Ŗ  [LATIN CAPITAL LETTER R WITH CEDILLA]
        '\u{0158}' | // Ř  [LATIN CAPITAL LETTER R WITH CARON]
        '\u{0210}' | // Ȑ  [LATIN CAPITAL LETTER R WITH DOUBLE GRAVE]
        '\u{0212}' | // Ȓ  [LATIN CAPITAL LETTER R WITH INVERTED BREVE]
        '\u{024C}' | // Ɍ  [LATIN CAPITAL LETTER R WITH STROKE]
        '\u{0280}' | // ʀ  [LATIN LETTER SMALL CAPITAL R]
        '\u{0281}' | // ʁ  [LATIN LETTER SMALL CAPITAL INVERTED R]
        '\u{1D19}' | // ᴙ  [LATIN LETTER SMALL CAPITAL REVERSED R]
        '\u{1D1A}' | // ᴚ  [LATIN LETTER SMALL CAPITAL TURNED R]
        '\u{1E58}' | // Ṙ  [LATIN CAPITAL LETTER R WITH DOT ABOVE]
        '\u{1E5A}' | // Ṛ  [LATIN CAPITAL LETTER R WITH DOT BELOW]
        '\u{1E5C}' | // Ṝ  [LATIN CAPITAL LETTER R WITH DOT BELOW AND MACRON]
        '\u{1E5E}' | // Ṟ  [LATIN CAPITAL LETTER R WITH LINE BELOW]
        '\u{24C7}' | // Ⓡ  [CIRCLED LATIN CAPITAL LETTER R]
        '\u{2C64}' | // Ɽ  [LATIN CAPITAL LETTER R WITH TAIL]
        '\u{A75A}' | // Ꝛ  [LATIN CAPITAL LETTER R ROTUNDA]
        '\u{A782}' | // Ꞃ  [LATIN CAPITAL LETTER INSULAR R]
        '\u{FF32}' // Ｒ  [FULLWIDTH LATIN CAPITAL LETTER R]
        => Some("R"),
        '\u{0155}' | // ŕ  [LATIN SMALL LETTER R WITH ACUTE]
        '\u{0157}' | // ŗ  [LATIN SMALL LETTER R WITH CEDILLA]
        '\u{0159}' | // ř  [LATIN SMALL LETTER R WITH CARON]
        '\u{0211}' | // ȑ  [LATIN SMALL LETTER R WITH DOUBLE GRAVE]
        '\u{0213}' | // ȓ  [LATIN SMALL LETTER R WITH INVERTED BREVE]
        '\u{024D}' | // ɍ  [LATIN SMALL LETTER R WITH STROKE]
        '\u{027C}' | // ɼ  [LATIN SMALL LETTER R WITH LONG LEG]
        '\u{027D}' | // ɽ  [LATIN SMALL LETTER R WITH TAIL]
        '\u{027E}' | // ɾ  [LATIN SMALL LETTER R WITH FISHHOOK]
        '\u{027F}' | // ɿ  [LATIN SMALL LETTER REVERSED R WITH FISHHOOK]
        '\u{1D63}' | // ᵣ  [LATIN SUBSCRIPT SMALL LETTER R]
        '\u{1D72}' | // ᵲ  [LATIN SMALL LETTER R WITH MIDDLE TILDE]
        '\u{1D73}' | // ᵳ  [LATIN SMALL LETTER R WITH FISHHOOK AND MIDDLE TILDE]
        '\u{1D89}' | // ᶉ  [LATIN SMALL LETTER R WITH PALATAL HOOK]
        '\u{1E59}' | // ṙ  [LATIN SMALL LETTER R WITH DOT ABOVE]
        '\u{1E5B}' | // ṛ  [LATIN SMALL LETTER R WITH DOT BELOW]
        '\u{1E5D}' | // ṝ  [LATIN SMALL LETTER R WITH DOT BELOW AND MACRON]
        '\u{1E5F}' | // ṟ  [LATIN SMALL LETTER R WITH LINE BELOW]
        '\u{24E1}' | // ⓡ  [CIRCLED LATIN SMALL LETTER R]
        '\u{A75B}' | // ꝛ  [LATIN SMALL LETTER R ROTUNDA]
        '\u{A783}' | // ꞃ  [LATIN SMALL LETTER INSULAR R]
        '\u{FF52}' // ｒ  [FULLWIDTH LATIN SMALL LETTER R]
        => Some("r"),
        '\u{24AD}' // ⒭  [PARENTHESIZED LATIN SMALL LETTER R]
        => Some("(r)"),
        '\u{015A}' | // Ś  [LATIN CAPITAL LETTER S WITH ACUTE]
        '\u{015C}' | // Ŝ  [LATIN CAPITAL LETTER S WITH CIRCUMFLEX]
        '\u{015E}' | // Ş  [LATIN CAPITAL LETTER S WITH CEDILLA]
        '\u{0160}' | // Š  [LATIN CAPITAL LETTER S WITH CARON]
        '\u{0218}' | // Ș  [LATIN CAPITAL LETTER S WITH COMMA BELOW]
        '\u{1E60}' | // Ṡ  [LATIN CAPITAL LETTER S WITH DOT ABOVE]
        '\u{1E62}' | // Ṣ  [LATIN CAPITAL LETTER S WITH DOT BELOW]
        '\u{1E64}' | // Ṥ  [LATIN CAPITAL LETTER S WITH ACUTE AND DOT ABOVE]
        '\u{1E66}' | // Ṧ  [LATIN CAPITAL LETTER S WITH CARON AND DOT ABOVE]
        '\u{1E68}' | // Ṩ  [LATIN CAPITAL LETTER S WITH DOT BELOW AND DOT ABOVE]
        '\u{24C8}' | // Ⓢ  [CIRCLED LATIN CAPITAL LETTER S]
        '\u{A731}' | // ꜱ  [LATIN LETTER SMALL CAPITAL S]
        '\u{A785}' | // ꞅ  [LATIN SMALL LETTER INSULAR S]
        '\u{FF33}' // Ｓ  [FULLWIDTH LATIN CAPITAL LETTER S]
        => Some("S"),
        '\u{015B}' | // ś  [LATIN SMALL LETTER S WITH ACUTE]
        '\u{015D}' | // ŝ  [LATIN SMALL LETTER S WITH CIRCUMFLEX]
        '\u{015F}' | // ş  [LATIN SMALL LETTER S WITH CEDILLA]
        '\u{0161}' | // š  [LATIN SMALL LETTER S WITH CARON]
        '\u{017F}' | // ſ  http://en.wikipedia.org/wiki/Long_S  [LATIN SMALL LETTER LONG S]
        '\u{0219}' | // ș  [LATIN SMALL LETTER S WITH COMMA BELOW]
        '\u{023F}' | // ȿ  [LATIN SMALL LETTER S WITH SWASH TAIL]
        '\u{0282}' | // ʂ  [LATIN SMALL LETTER S WITH HOOK]
        '\u{1D74}' | // ᵴ  [LATIN SMALL LETTER S WITH MIDDLE TILDE]
        '\u{1D8A}' | // ᶊ  [LATIN SMALL LETTER S WITH PALATAL HOOK]
        '\u{1E61}' | // ṡ  [LATIN SMALL LETTER S WITH DOT ABOVE]
        '\u{1E63}' | // ṣ  [LATIN SMALL LETTER S WITH DOT BELOW]
        '\u{1E65}' | // ṥ  [LATIN SMALL LETTER S WITH ACUTE AND DOT ABOVE]
        '\u{1E67}' | // ṧ  [LATIN SMALL LETTER S WITH CARON AND DOT ABOVE]
        '\u{1E69}' | // ṩ  [LATIN SMALL LETTER S WITH DOT BELOW AND DOT ABOVE]
        '\u{1E9C}' | // ẜ  [LATIN SMALL LETTER LONG S WITH DIAGONAL STROKE]
        '\u{1E9D}' | // ẝ  [LATIN SMALL LETTER LONG S WITH HIGH STROKE]
        '\u{24E2}' | // ⓢ  [CIRCLED LATIN SMALL LETTER S]
        '\u{A784}' | // Ꞅ  [LATIN CAPITAL LETTER INSULAR S]
        '\u{FF53}' // ｓ  [FULLWIDTH LATIN SMALL LETTER S]
        => Some("s"),
        '\u{1E9E}' // ẞ  [LATIN CAPITAL LETTER SHARP S]
        => Some("SS"),
        '\u{24AE}' // ⒮  [PARENTHESIZED LATIN SMALL LETTER S]
        => Some("(s)"),
        '\u{00DF}' // ß  [LATIN SMALL LETTER SHARP S]
        => Some("ss"),
        '\u{FB06}' // ﬆ  [LATIN SMALL LIGATURE ST]
        => Some("st"),
        '\u{0162}' | // Ţ  [LATIN CAPITAL LETTER T WITH CEDILLA]
        '\u{0164}' | // Ť  [LATIN CAPITAL LETTER T WITH CARON]
        '\u{0166}' | // Ŧ  [LATIN CAPITAL LETTER T WITH STROKE]
        '\u{01AC}' | // Ƭ  [LATIN CAPITAL LETTER T WITH HOOK]
        '\u{01AE}' | // Ʈ  [LATIN CAPITAL LETTER T WITH RETROFLEX HOOK]
        '\u{021A}' | // Ț  [LATIN CAPITAL LETTER T WITH COMMA BELOW]
        '\u{023E}' | // Ⱦ  [LATIN CAPITAL LETTER T WITH DIAGONAL STROKE]
        '\u{1D1B}' | // ᴛ  [LATIN LETTER SMALL CAPITAL T]
        '\u{1E6A}' | // Ṫ  [LATIN CAPITAL LETTER T WITH DOT ABOVE]
        '\u{1E6C}' | // Ṭ  [LATIN CAPITAL LETTER T WITH DOT BELOW]
        '\u{1E6E}' | // Ṯ  [LATIN CAPITAL LETTER T WITH LINE BELOW]
        '\u{1E70}' | // Ṱ  [LATIN CAPITAL LETTER T WITH CIRCUMFLEX BELOW]
        '\u{24C9}' | // Ⓣ  [CIRCLED LATIN CAPITAL LETTER T]
        '\u{A786}' | // Ꞇ  [LATIN CAPITAL LETTER INSULAR T]
        '\u{FF34}' // Ｔ  [FULLWIDTH LATIN CAPITAL LETTER T]
        => Some("T"),
        '\u{0163}' | // ţ  [LATIN SMALL LETTER T WITH CEDILLA]
        '\u{0165}' | // ť  [LATIN SMALL LETTER T WITH CARON]
        '\u{0167}' | // ŧ  [LATIN SMALL LETTER T WITH STROKE]
        '\u{01AB}' | // ƫ  [LATIN SMALL LETTER T WITH PALATAL HOOK]
        '\u{01AD}' | // ƭ  [LATIN SMALL LETTER T WITH HOOK]
        '\u{021B}' | // ț  [LATIN SMALL LETTER T WITH COMMA BELOW]
        '\u{0236}' | // ȶ  [LATIN SMALL LETTER T WITH CURL]
        '\u{0287}' | // ʇ  [LATIN SMALL LETTER TURNED T]
        '\u{0288}' | // ʈ  [LATIN SMALL LETTER T WITH RETROFLEX HOOK]
        '\u{1D75}' | // ᵵ  [LATIN SMALL LETTER T WITH MIDDLE TILDE]
        '\u{1E6B}' | // ṫ  [LATIN SMALL LETTER T WITH DOT ABOVE]
        '\u{1E6D}' | // ṭ  [LATIN SMALL LETTER T WITH DOT BELOW]
        '\u{1E6F}' | // ṯ  [LATIN SMALL LETTER T WITH LINE BELOW]
        '\u{1E71}' | // ṱ  [LATIN SMALL LETTER T WITH CIRCUMFLEX BELOW]
        '\u{1E97}' | // ẗ  [LATIN SMALL LETTER T WITH DIAERESIS]
        '\u{24E3}' | // ⓣ  [CIRCLED LATIN SMALL LETTER T]
        '\u{2C66}' | // ⱦ  [LATIN SMALL LETTER T WITH DIAGONAL STROKE]
        '\u{FF54}' // ｔ  [FULLWIDTH LATIN SMALL LETTER T]
        => Some("t"),
        '\u{00DE}' | // Þ  [LATIN CAPITAL LETTER THORN]
        '\u{A766}' // Ꝧ  [LATIN CAPITAL LETTER THORN WITH STROKE THROUGH DESCENDER]
        => Some("TH"),
        '\u{A728}' // Ꜩ  [LATIN CAPITAL LETTER TZ]
        => Some("TZ"),
        '\u{24AF}' // ⒯  [PARENTHESIZED LATIN SMALL LETTER T]
        => Some("(t)"),
        '\u{02A8}' // ʨ  [LATIN SMALL LETTER TC DIGRAPH WITH CURL]
        => Some("tc"),
        '\u{00FE}' | // þ  [LATIN SMALL LETTER THORN]
        '\u{1D7A}' | // ᵺ  [LATIN SMALL LETTER TH WITH STRIKETHROUGH]
        '\u{A767}' // ꝧ  [LATIN SMALL LETTER THORN WITH STROKE THROUGH DESCENDER]
        => Some("th"),
        '\u{02A6}' // ʦ  [LATIN SMALL LETTER TS DIGRAPH]
        => Some("ts"),
        '\u{A729}' // ꜩ  [LATIN SMALL LETTER TZ]
        => Some("tz"),
        '\u{00D9}' | // Ù  [LATIN CAPITAL LETTER U WITH GRAVE]
        '\u{00DA}' | // Ú  [LATIN CAPITAL LETTER U WITH ACUTE]
        '\u{00DB}' | // Û  [LATIN CAPITAL LETTER U WITH CIRCUMFLEX]
        '\u{00DC}' | // Ü  [LATIN CAPITAL LETTER U WITH DIAERESIS]
        '\u{0168}' | // Ũ  [LATIN CAPITAL LETTER U WITH TILDE]
        '\u{016A}' | // Ū  [LATIN CAPITAL LETTER U WITH MACRON]
        '\u{016C}' | // Ŭ  [LATIN CAPITAL LETTER U WITH BREVE]
        '\u{016E}' | // Ů  [LATIN CAPITAL LETTER U WITH RING ABOVE]
        '\u{0170}' | // Ű  [LATIN CAPITAL LETTER U WITH DOUBLE ACUTE]
        '\u{0172}' | // Ų  [LATIN CAPITAL LETTER U WITH OGONEK]
        '\u{01AF}' | // Ư  [LATIN CAPITAL LETTER U WITH HORN]
        '\u{01D3}' | // Ǔ  [LATIN CAPITAL LETTER U WITH CARON]
        '\u{01D5}' | // Ǖ  [LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON]
        '\u{01D7}' | // Ǘ  [LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE]
        '\u{01D9}' | // Ǚ  [LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON]
        '\u{01DB}' | // Ǜ  [LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE]
        '\u{0214}' | // Ȕ  [LATIN CAPITAL LETTER U WITH DOUBLE GRAVE]
        '\u{0216}' | // Ȗ  [LATIN CAPITAL LETTER U WITH INVERTED BREVE]
        '\u{0244}' | // Ʉ  [LATIN CAPITAL LETTER U BAR]
        '\u{1D1C}' | // ᴜ  [LATIN LETTER SMALL CAPITAL U]
        '\u{1D7E}' | // ᵾ  [LATIN SMALL CAPITAL LETTER U WITH STROKE]
        '\u{1E72}' | // Ṳ  [LATIN CAPITAL LETTER U WITH DIAERESIS BELOW]
        '\u{1E74}' | // Ṵ  [LATIN CAPITAL LETTER U WITH TILDE BELOW]
        '\u{1E76}' | // Ṷ  [LATIN CAPITAL LETTER U WITH CIRCUMFLEX BELOW]
        '\u{1E78}' | // Ṹ  [LATIN CAPITAL LETTER U WITH TILDE AND ACUTE]
        '\u{1E7A}' | // Ṻ  [LATIN CAPITAL LETTER U WITH MACRON AND DIAERESIS]
        '\u{1EE4}' | // Ụ  [LATIN CAPITAL LETTER U WITH DOT BELOW]
        '\u{1EE6}' | // Ủ  [LATIN CAPITAL LETTER U WITH HOOK ABOVE]
        '\u{1EE8}' | // Ứ  [LATIN CAPITAL LETTER U WITH HORN AND ACUTE]
        '\u{1EEA}' | // Ừ  [LATIN CAPITAL LETTER U WITH HORN AND GRAVE]
        '\u{1EEC}' | // Ử  [LATIN CAPITAL LETTER U WITH HORN AND HOOK ABOVE]
        '\u{1EEE}' | // Ữ  [LATIN CAPITAL LETTER U WITH HORN AND TILDE]
        '\u{1EF0}' | // Ự  [LATIN CAPITAL LETTER U WITH HORN AND DOT BELOW]
        '\u{24CA}' | // Ⓤ  [CIRCLED LATIN CAPITAL LETTER U]
        '\u{FF35}' // Ｕ  [FULLWIDTH LATIN CAPITAL LETTER U]
        => Some("U"),
        '\u{00F9}' | // ù  [LATIN SMALL LETTER U WITH GRAVE]
        '\u{00FA}' | // ú  [LATIN SMALL LETTER U WITH ACUTE]
        '\u{00FB}' | // û  [LATIN SMALL LETTER U WITH CIRCUMFLEX]
        '\u{00FC}' | // ü  [LATIN SMALL LETTER U WITH DIAERESIS]
        '\u{0169}' | // ũ  [LATIN SMALL LETTER U WITH TILDE]
        '\u{016B}' | // ū  [LATIN SMALL LETTER U WITH MACRON]
        '\u{016D}' | // ŭ  [LATIN SMALL LETTER U WITH BREVE]
        '\u{016F}' | // ů  [LATIN SMALL LETTER U WITH RING ABOVE]
        '\u{0171}' | // ű  [LATIN SMALL LETTER U WITH DOUBLE ACUTE]
        '\u{0173}' | // ų  [LATIN SMALL LETTER U WITH OGONEK]
        '\u{01B0}' | // ư  [LATIN SMALL LETTER U WITH HORN]
        '\u{01D4}' | // ǔ  [LATIN SMALL LETTER U WITH CARON]
        '\u{01D6}' | // ǖ  [LATIN SMALL LETTER U WITH DIAERESIS AND MACRON]
        '\u{01D8}' | // ǘ  [LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE]
        '\u{01DA}' | // ǚ  [LATIN SMALL LETTER U WITH DIAERESIS AND CARON]
        '\u{01DC}' | // ǜ  [LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE]
        '\u{0215}' | // ȕ  [LATIN SMALL LETTER U WITH DOUBLE GRAVE]
        '\u{0217}' | // ȗ  [LATIN SMALL LETTER U WITH INVERTED BREVE]
        '\u{0289}' | // ʉ  [LATIN SMALL LETTER U BAR]
        '\u{1D64}' | // ᵤ  [LATIN SUBSCRIPT SMALL LETTER U]
        '\u{1D99}' | // ᶙ  [LATIN SMALL LETTER U WITH RETROFLEX HOOK]
        '\u{1E73}' | // ṳ  [LATIN SMALL LETTER U WITH DIAERESIS BELOW]
        '\u{1E75}' | // ṵ  [LATIN SMALL LETTER U WITH TILDE BELOW]
        '\u{1E77}' | // ṷ  [LATIN SMALL LETTER U WITH CIRCUMFLEX BELOW]
        '\u{1E79}' | // ṹ  [LATIN SMALL LETTER U WITH TILDE AND ACUTE]
        '\u{1E7B}' | // ṻ  [LATIN SMALL LETTER U WITH MACRON AND DIAERESIS]
        '\u{1EE5}' | // ụ  [LATIN SMALL LETTER U WITH DOT BELOW]
        '\u{1EE7}' | // ủ  [LATIN SMALL LETTER U WITH HOOK ABOVE]
        '\u{1EE9}' | // ứ  [LATIN SMALL LETTER U WITH HORN AND ACUTE]
        '\u{1EEB}' | // ừ  [LATIN SMALL LETTER U WITH HORN AND GRAVE]
        '\u{1EED}' | // ử  [LATIN SMALL LETTER U WITH HORN AND HOOK ABOVE]
        '\u{1EEF}' | // ữ  [LATIN SMALL LETTER U WITH HORN AND TILDE]
        '\u{1EF1}' | // ự  [LATIN SMALL LETTER U WITH HORN AND DOT BELOW]
        '\u{24E4}' | // ⓤ  [CIRCLED LATIN SMALL LETTER U]
        '\u{FF55}' // ｕ  [FULLWIDTH LATIN SMALL LETTER U]
        => Some("u"),
        '\u{24B0}' // ⒰  [PARENTHESIZED LATIN SMALL LETTER U]
        => Some("(u)"),
        '\u{1D6B}' // ᵫ  [LATIN SMALL LETTER UE]
        => Some("ue"),
        '\u{01B2}' | // Ʋ  [LATIN CAPITAL LETTER V WITH HOOK]
        '\u{0245}' | // Ʌ  [LATIN CAPITAL LETTER TURNED V]
        '\u{1D20}' | // ᴠ  [LATIN LETTER SMALL CAPITAL V]
        '\u{1E7C}' | // Ṽ  [LATIN CAPITAL LETTER V WITH TILDE]
        '\u{1E7E}' | // Ṿ  [LATIN CAPITAL LETTER V WITH DOT BELOW]
        '\u{1EFC}' | // Ỽ  [LATIN CAPITAL LETTER MIDDLE-WELSH V]
        '\u{24CB}' | // Ⓥ  [CIRCLED LATIN CAPITAL LETTER V]
        '\u{A75E}' | // Ꝟ  [LATIN CAPITAL LETTER V WITH DIAGONAL STROKE]
        '\u{A768}' | // Ꝩ  [LATIN CAPITAL LETTER VEND]
        '\u{FF36}' // Ｖ  [FULLWIDTH LATIN CAPITAL LETTER V]
        => Some("V"),
        '\u{028B}' | // ʋ  [LATIN SMALL LETTER V WITH HOOK]
        '\u{028C}' | // ʌ  [LATIN SMALL LETTER TURNED V]
        '\u{1D65}' | // ᵥ  [LATIN SUBSCRIPT SMALL LETTER V]
        '\u{1D8C}' | // ᶌ  [LATIN SMALL LETTER V WITH PALATAL HOOK]
        '\u{1E7D}' | // ṽ  [LATIN SMALL LETTER V WITH TILDE]
        '\u{1E7F}' | // ṿ  [LATIN SMALL LETTER V WITH DOT BELOW]
        '\u{24E5}' | // ⓥ  [CIRCLED LATIN SMALL LETTER V]
        '\u{2C71}' | // ⱱ  [LATIN SMALL LETTER V WITH RIGHT HOOK]
        '\u{2C74}' | // ⱴ  [LATIN SMALL LETTER V WITH CURL]
        '\u{A75F}' | // ꝟ  [LATIN SMALL LETTER V WITH DIAGONAL STROKE]
        '\u{FF56}' // ｖ  [FULLWIDTH LATIN SMALL LETTER V]
        => Some("v"),
        '\u{A760}' // Ꝡ  [LATIN CAPITAL LETTER VY]
        => Some("VY"),
        '\u{24B1}' // ⒱  [PARENTHESIZED LATIN SMALL LETTER V]
        => Some("(v)"),
        '\u{A761}' // ꝡ  [LATIN SMALL LETTER VY]
        => Some("vy"),
        '\u{0174}' | // Ŵ  [LATIN CAPITAL LETTER W WITH CIRCUMFLEX]
        '\u{01F7}' | // Ƿ  http://en.wikipedia.org/wiki/Wynn  [LATIN CAPITAL LETTER WYNN]
        '\u{1D21}' | // ᴡ  [LATIN LETTER SMALL CAPITAL W]
        '\u{1E80}' | // Ẁ  [LATIN CAPITAL LETTER W WITH GRAVE]
        '\u{1E82}' | // Ẃ  [LATIN CAPITAL LETTER W WITH ACUTE]
        '\u{1E84}' | // Ẅ  [LATIN CAPITAL LETTER W WITH DIAERESIS]
        '\u{1E86}' | // Ẇ  [LATIN CAPITAL LETTER W WITH DOT ABOVE]
        '\u{1E88}' | // Ẉ  [LATIN CAPITAL LETTER W WITH DOT BELOW]
        '\u{24CC}' | // Ⓦ  [CIRCLED LATIN CAPITAL LETTER W]
        '\u{2C72}' | // Ⱳ  [LATIN CAPITAL LETTER W WITH HOOK]
        '\u{FF37}' // Ｗ  [FULLWIDTH LATIN CAPITAL LETTER W]
        => Some("W"),
        '\u{0175}' | // ŵ  [LATIN SMALL LETTER W WITH CIRCUMFLEX]
        '\u{01BF}' | // ƿ  http://en.wikipedia.org/wiki/Wynn  [LATIN LETTER WYNN]
        '\u{028D}' | // ʍ  [LATIN SMALL LETTER TURNED W]
        '\u{1E81}' | // ẁ  [LATIN SMALL LETTER W WITH GRAVE]
        '\u{1E83}' | // ẃ  [LATIN SMALL LETTER W WITH ACUTE]
        '\u{1E85}' | // ẅ  [LATIN SMALL LETTER W WITH DIAERESIS]
        '\u{1E87}' | // ẇ  [LATIN SMALL LETTER W WITH DOT ABOVE]
        '\u{1E89}' | // ẉ  [LATIN SMALL LETTER W WITH DOT BELOW]
        '\u{1E98}' | // ẘ  [LATIN SMALL LETTER W WITH RING ABOVE]
        '\u{24E6}' | // ⓦ  [CIRCLED LATIN SMALL LETTER W]
        '\u{2C73}' | // ⱳ  [LATIN SMALL LETTER W WITH HOOK]
        '\u{FF57}' // ｗ  [FULLWIDTH LATIN SMALL LETTER W]
        => Some("w"),
        '\u{24B2}' // ⒲  [PARENTHESIZED LATIN SMALL LETTER W]
        => Some("(w)"),
        '\u{1E8A}' | // Ẋ  [LATIN CAPITAL LETTER X WITH DOT ABOVE]
        '\u{1E8C}' | // Ẍ  [LATIN CAPITAL LETTER X WITH DIAERESIS]
        '\u{24CD}' | // Ⓧ  [CIRCLED LATIN CAPITAL LETTER X]
        '\u{FF38}' // Ｘ  [FULLWIDTH LATIN CAPITAL LETTER X]
        => Some("X"),
        '\u{1D8D}' | // ᶍ  [LATIN SMALL LETTER X WITH PALATAL HOOK]
        '\u{1E8B}' | // ẋ  [LATIN SMALL LETTER X WITH DOT ABOVE]
        '\u{1E8D}' | // ẍ  [LATIN SMALL LETTER X WITH DIAERESIS]
        '\u{2093}' | // ₓ  [LATIN SUBSCRIPT SMALL LETTER X]
        '\u{24E7}' | // ⓧ  [CIRCLED LATIN SMALL LETTER X]
        '\u{FF58}' // ｘ  [FULLWIDTH LATIN SMALL LETTER X]
        => Some("x"),
        '\u{24B3}' // ⒳  [PARENTHESIZED LATIN SMALL LETTER X]
        => Some("(x)"),
        '\u{00DD}' | // Ý  [LATIN CAPITAL LETTER Y WITH ACUTE]
        '\u{0176}' | // Ŷ  [LATIN CAPITAL LETTER Y WITH CIRCUMFLEX]
        '\u{0178}' | // Ÿ  [LATIN CAPITAL LETTER Y WITH DIAERESIS]
        '\u{01B3}' | // Ƴ  [LATIN CAPITAL LETTER Y WITH HOOK]
        '\u{0232}' | // Ȳ  [LATIN CAPITAL LETTER Y WITH MACRON]
        '\u{024E}' | // Ɏ  [LATIN CAPITAL LETTER Y WITH STROKE]
        '\u{028F}' | // ʏ  [LATIN LETTER SMALL CAPITAL Y]
        '\u{1E8E}' | // Ẏ  [LATIN CAPITAL LETTER Y WITH DOT ABOVE]
        '\u{1EF2}' | // Ỳ  [LATIN CAPITAL LETTER Y WITH GRAVE]
        '\u{1EF4}' | // Ỵ  [LATIN CAPITAL LETTER Y WITH DOT BELOW]
        '\u{1EF6}' | // Ỷ  [LATIN CAPITAL LETTER Y WITH HOOK ABOVE]
        '\u{1EF8}' | // Ỹ  [LATIN CAPITAL LETTER Y WITH TILDE]
        '\u{1EFE}' | // Ỿ  [LATIN CAPITAL LETTER Y WITH LOOP]
        '\u{24CE}' | // Ⓨ  [CIRCLED LATIN CAPITAL LETTER Y]
        '\u{FF39}' // Ｙ  [FULLWIDTH LATIN CAPITAL LETTER Y]
        => Some("Y"),
        '\u{00FD}' | // ý  [LATIN SMALL LETTER Y WITH ACUTE]
        '\u{00FF}' | // ÿ  [LATIN SMALL LETTER Y WITH DIAERESIS]
        '\u{0177}' | // ŷ  [LATIN SMALL LETTER Y WITH CIRCUMFLEX]
        '\u{01B4}' | // ƴ  [LATIN SMALL LETTER Y WITH HOOK]
        '\u{0233}' | // ȳ  [LATIN SMALL LETTER Y WITH MACRON]
        '\u{024F}' | // ɏ  [LATIN SMALL LETTER Y WITH STROKE]
        '\u{028E}' | // ʎ  [LATIN SMALL LETTER TURNED Y]
        '\u{1E8F}' | // ẏ  [LATIN SMALL LETTER Y WITH DOT ABOVE]
        '\u{1E99}' | // ẙ  [LATIN SMALL LETTER Y WITH RING ABOVE]
        '\u{1EF3}' | // ỳ  [LATIN SMALL LETTER Y WITH GRAVE]
        '\u{1EF5}' | // ỵ  [LATIN SMALL LETTER Y WITH DOT BELOW]
        '\u{1EF7}' | // ỷ  [LATIN SMALL LETTER Y WITH HOOK ABOVE]
        '\u{1EF9}' | // ỹ  [LATIN SMALL LETTER Y WITH TILDE]
        '\u{1EFF}' | // ỿ  [LATIN SMALL LETTER Y WITH LOOP]
        '\u{24E8}' | // ⓨ  [CIRCLED LATIN SMALL LETTER Y]
        '\u{FF59}' // ｙ  [FULLWIDTH LATIN SMALL LETTER Y]
        => Some("y"),
        '\u{24B4}' // ⒴  [PARENTHESIZED LATIN SMALL LETTER Y]
        => Some("(y)"),
        '\u{0179}' | // Ź  [LATIN CAPITAL LETTER Z WITH ACUTE]
        '\u{017B}' | // Ż  [LATIN CAPITAL LETTER Z WITH DOT ABOVE]
        '\u{017D}' | // Ž  [LATIN CAPITAL LETTER Z WITH CARON]
        '\u{01B5}' | // Ƶ  [LATIN CAPITAL LETTER Z WITH STROKE]
        '\u{021C}' | // Ȝ  http://en.wikipedia.org/wiki/Yogh  [LATIN CAPITAL LETTER YOGH]
        '\u{0224}' | // Ȥ  [LATIN CAPITAL LETTER Z WITH HOOK]
        '\u{1D22}' | // ᴢ  [LATIN LETTER SMALL CAPITAL Z]
        '\u{1E90}' | // Ẑ  [LATIN CAPITAL LETTER Z WITH CIRCUMFLEX]
        '\u{1E92}' | // Ẓ  [LATIN CAPITAL LETTER Z WITH DOT BELOW]
        '\u{1E94}' | // Ẕ  [LATIN CAPITAL LETTER Z WITH LINE BELOW]
        '\u{24CF}' | // Ⓩ  [CIRCLED LATIN CAPITAL LETTER Z]
        '\u{2C6B}' | // Ⱬ  [LATIN CAPITAL LETTER Z WITH DESCENDER]
        '\u{A762}' | // Ꝣ  [LATIN CAPITAL LETTER VISIGOTHIC Z]
        '\u{FF3A}' // Ｚ  [FULLWIDTH LATIN CAPITAL LETTER Z]
        => Some("Z"),
        '\u{017A}' | // ź  [LATIN SMALL LETTER Z WITH ACUTE]
        '\u{017C}' | // ż  [LATIN SMALL LETTER Z WITH DOT ABOVE]
        '\u{017E}' | // ž  [LATIN SMALL LETTER Z WITH CARON]
        '\u{01B6}' | // ƶ  [LATIN SMALL LETTER Z WITH STROKE]
        '\u{021D}' | // ȝ  http://en.wikipedia.org/wiki/Yogh  [LATIN SMALL LETTER YOGH]
        '\u{0225}' | // ȥ  [LATIN SMALL LETTER Z WITH HOOK]
        '\u{0240}' | // ɀ  [LATIN SMALL LETTER Z WITH SWASH TAIL]
        '\u{0290}' | // ʐ  [LATIN SMALL LETTER Z WITH RETROFLEX HOOK]
        '\u{0291}' | // ʑ  [LATIN SMALL LETTER Z WITH CURL]
        '\u{1D76}' | // ᵶ  [LATIN SMALL LETTER Z WITH MIDDLE TILDE]
        '\u{1D8E}' | // ᶎ  [LATIN SMALL LETTER Z WITH PALATAL HOOK]
        '\u{1E91}' | // ẑ  [LATIN SMALL LETTER Z WITH CIRCUMFLEX]
        '\u{1E93}' | // ẓ  [LATIN SMALL LETTER Z WITH DOT BELOW]
        '\u{1E95}' | // ẕ  [LATIN SMALL LETTER Z WITH LINE BELOW]
        '\u{24E9}' | // ⓩ  [CIRCLED LATIN SMALL LETTER Z]
        '\u{2C6C}' | // ⱬ  [LATIN SMALL LETTER Z WITH DESCENDER]
        '\u{A763}' | // ꝣ  [LATIN SMALL LETTER VISIGOTHIC Z]
        '\u{FF5A}' // ｚ  [FULLWIDTH LATIN SMALL LETTER Z]
        => Some("z"),
        '\u{24B5}' // ⒵  [PARENTHESIZED LATIN SMALL LETTER Z]
        => Some("(z)"),
        '\u{2070}' | // ⁰  [SUPERSCRIPT ZERO]
        '\u{2080}' | // ₀  [SUBSCRIPT ZERO]
        '\u{24EA}' | // ⓪  [CIRCLED DIGIT ZERO]
        '\u{24FF}' | // ⓿  [NEGATIVE CIRCLED DIGIT ZERO]
        '\u{FF10}' // ０  [FULLWIDTH DIGIT ZERO]
        => Some("0"),
        '\u{00B9}' | // ¹  [SUPERSCRIPT ONE]
        '\u{2081}' | // ₁  [SUBSCRIPT ONE]
        '\u{2460}' | // ①  [CIRCLED DIGIT ONE]
        '\u{24F5}' | // ⓵  [DOUBLE CIRCLED DIGIT ONE]
        '\u{2776}' | // ❶  [DINGBAT NEGATIVE CIRCLED DIGIT ONE]
        '\u{2780}' | // ➀  [DINGBAT CIRCLED SANS-SERIF DIGIT ONE]
        '\u{278A}' | // ➊  [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT ONE]
        '\u{FF11}' // １  [FULLWIDTH DIGIT ONE]
        => Some("1"),
        '\u{2488}' // ⒈  [DIGIT ONE FULL STOP]
        => Some("1."),
        '\u{2474}' // ⑴  [PARENTHESIZED DIGIT ONE]
        => Some("(1)"),
        '\u{00B2}' | // ²  [SUPERSCRIPT TWO]
        '\u{2082}' | // ₂  [SUBSCRIPT TWO]
        '\u{2461}' | // ②  [CIRCLED DIGIT TWO]
        '\u{24F6}' | // ⓶  [DOUBLE CIRCLED DIGIT TWO]
        '\u{2777}' | // ❷  [DINGBAT NEGATIVE CIRCLED DIGIT TWO]
        '\u{2781}' | // ➁  [DINGBAT CIRCLED SANS-SERIF DIGIT TWO]
        '\u{278B}' | // ➋  [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT TWO]
        '\u{FF12}' // ２  [FULLWIDTH DIGIT TWO]
        => Some("2"),
        '\u{2489}' // ⒉  [DIGIT TWO FULL STOP]
        => Some("2."),
        '\u{2475}' // ⑵  [PARENTHESIZED DIGIT TWO]
        => Some("(2)"),
        '\u{00B3}' | // ³  [SUPERSCRIPT THREE]
        '\u{2083}' | // ₃  [SUBSCRIPT THREE]
        '\u{2462}' | // ③  [CIRCLED DIGIT THREE]
        '\u{24F7}' | // ⓷  [DOUBLE CIRCLED DIGIT THREE]
        '\u{2778}' | // ❸  [DINGBAT NEGATIVE CIRCLED DIGIT THREE]
        '\u{2782}' | // ➂  [DINGBAT CIRCLED SANS-SERIF DIGIT THREE]
        '\u{278C}' | // ➌  [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT THREE]
        '\u{FF13}' // ３  [FULLWIDTH DIGIT THREE]
        => Some("3"),
        '\u{248A}' // ⒊  [DIGIT THREE FULL STOP]
        => Some("3."),
        '\u{2476}' // ⑶  [PARENTHESIZED DIGIT THREE]
        => Some("(3)"),
        '\u{2074}' | // ⁴  [SUPERSCRIPT FOUR]
        '\u{2084}' | // ₄  [SUBSCRIPT FOUR]
        '\u{2463}' | // ④  [CIRCLED DIGIT FOUR]
        '\u{24F8}' | // ⓸  [DOUBLE CIRCLED DIGIT FOUR]
        '\u{2779}' | // ❹  [DINGBAT NEGATIVE CIRCLED DIGIT FOUR]
        '\u{2783}' | // ➃  [DINGBAT CIRCLED SANS-SERIF DIGIT FOUR]
        '\u{278D}' | // ➍  [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT FOUR]
        '\u{FF14}' // ４  [FULLWIDTH DIGIT FOUR]
        => Some("4"),
        '\u{248B}' // ⒋  [DIGIT FOUR FULL STOP]
        => Some("4."),
        '\u{2477}' // ⑷  [PARENTHESIZED DIGIT FOUR]
        => Some("(4)"),
        '\u{2075}' | // ⁵  [SUPERSCRIPT FIVE]
        '\u{2085}' | // ₅  [SUBSCRIPT FIVE]
        '\u{2464}' | // ⑤  [CIRCLED DIGIT FIVE]
        '\u{24F9}' | // ⓹  [DOUBLE CIRCLED DIGIT FIVE]
        '\u{277A}' | // ❺  [DINGBAT NEGATIVE CIRCLED DIGIT FIVE]
        '\u{2784}' | // ➄  [DINGBAT CIRCLED SANS-SERIF DIGIT FIVE]
        '\u{278E}' | // ➎  [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT FIVE]
        '\u{FF15}' // ５  [FULLWIDTH DIGIT FIVE]
        => Some("5"),
        '\u{248C}' // ⒌  [DIGIT FIVE FULL STOP]
        => Some("5."),
        '\u{2478}' // ⑸  [PARENTHESIZED DIGIT FIVE]
        => Some("(5)"),
        '\u{2076}' | // ⁶  [SUPERSCRIPT SIX]
        '\u{2086}' | // ₆  [SUBSCRIPT SIX]
        '\u{2465}' | // ⑥  [CIRCLED DIGIT SIX]
        '\u{24FA}' | // ⓺  [DOUBLE CIRCLED DIGIT SIX]
        '\u{277B}' | // ❻  [DINGBAT NEGATIVE CIRCLED DIGIT SIX]
        '\u{2785}' | // ➅  [DINGBAT CIRCLED SANS-SERIF DIGIT SIX]
        '\u{278F}' | // ➏  [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT SIX]
        '\u{FF16}' // ６  [FULLWIDTH DIGIT SIX]
        => Some("6"),
        '\u{248D}' // ⒍  [DIGIT SIX FULL STOP]
        => Some("6."),
        '\u{2479}' // ⑹  [PARENTHESIZED DIGIT SIX]
        => Some("(6)"),
        '\u{2077}' | // ⁷  [SUPERSCRIPT SEVEN]
        '\u{2087}' | // ₇  [SUBSCRIPT SEVEN]
        '\u{2466}' | // ⑦  [CIRCLED DIGIT SEVEN]
        '\u{24FB}' | // ⓻  [DOUBLE CIRCLED DIGIT SEVEN]
        '\u{277C}' | // ❼  [DINGBAT NEGATIVE CIRCLED DIGIT SEVEN]
        '\u{2786}' | // ➆  [DINGBAT CIRCLED SANS-SERIF DIGIT SEVEN]
        '\u{2790}' | // ➐  [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT SEVEN]
        '\u{FF17}' // ７  [FULLWIDTH DIGIT SEVEN]
        => Some("7"),
        '\u{248E}' // ⒎  [DIGIT SEVEN FULL STOP]
        => Some("7."),
        '\u{247A}' // ⑺  [PARENTHESIZED DIGIT SEVEN]
        => Some("(7)"),
        '\u{2078}' | // ⁸  [SUPERSCRIPT EIGHT]
        '\u{2088}' | // ₈  [SUBSCRIPT EIGHT]
        '\u{2467}' | // ⑧  [CIRCLED DIGIT EIGHT]
        '\u{24FC}' | // ⓼  [DOUBLE CIRCLED DIGIT EIGHT]
        '\u{277D}' | // ❽  [DINGBAT NEGATIVE CIRCLED DIGIT EIGHT]
        '\u{2787}' | // ➇  [DINGBAT CIRCLED SANS-SERIF DIGIT EIGHT]
        '\u{2791}' | // ➑  [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT EIGHT]
        '\u{FF18}' // ８  [FULLWIDTH DIGIT EIGHT]
        => Some("8"),
        '\u{248F}' // ⒏  [DIGIT EIGHT FULL STOP]
        => Some("8."),
        '\u{247B}' // ⑻  [PARENTHESIZED DIGIT EIGHT]
        => Some("(8)"),
        '\u{2079}' | // ⁹  [SUPERSCRIPT NINE]
        '\u{2089}' | // ₉  [SUBSCRIPT NINE]
        '\u{2468}' | // ⑨  [CIRCLED DIGIT NINE]
        '\u{24FD}' | // ⓽  [DOUBLE CIRCLED DIGIT NINE]
        '\u{277E}' | // ❾  [DINGBAT NEGATIVE CIRCLED DIGIT NINE]
        '\u{2788}' | // ➈  [DINGBAT CIRCLED SANS-SERIF DIGIT NINE]
        '\u{2792}' | // ➒  [DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT NINE]
        '\u{FF19}' // ９  [FULLWIDTH DIGIT NINE]
        => Some("9"),
        '\u{2490}' // ⒐  [DIGIT NINE FULL STOP]
        => Some("9."),
        '\u{247C}' // ⑼  [PARENTHESIZED DIGIT NINE]
        => Some("(9)"),
        '\u{2469}' | // ⑩  [CIRCLED NUMBER TEN]
        '\u{24FE}' | // ⓾  [DOUBLE CIRCLED NUMBER TEN]
        '\u{277F}' | // ❿  [DINGBAT NEGATIVE CIRCLED NUMBER TEN]
        '\u{2789}' | // ➉  [DINGBAT CIRCLED SANS-SERIF NUMBER TEN]
        '\u{2793}' // ➓  [DINGBAT NEGATIVE CIRCLED SANS-SERIF NUMBER TEN]
        => Some("10"),
        '\u{2491}' // ⒑  [NUMBER TEN FULL STOP]
        => Some("10."),
        '\u{247D}' // ⑽  [PARENTHESIZED NUMBER TEN]
        => Some("(10)"),
        '\u{246A}' | // ⑪  [CIRCLED NUMBER ELEVEN]
        '\u{24EB}' // ⓫  [NEGATIVE CIRCLED NUMBER ELEVEN]
        => Some("11"),
        '\u{2492}' // ⒒  [NUMBER ELEVEN FULL STOP]
        => Some("11."),
        '\u{247E}' // ⑾  [PARENTHESIZED NUMBER ELEVEN]
        => Some("(11)"),
        '\u{246B}' | // ⑫  [CIRCLED NUMBER TWELVE]
        '\u{24EC}' // ⓬  [NEGATIVE CIRCLED NUMBER TWELVE]
        => Some("12"),
        '\u{2493}' // ⒓  [NUMBER TWELVE FULL STOP]
        => Some("12."),
        '\u{247F}' // ⑿  [PARENTHESIZED NUMBER TWELVE]
        => Some("(12)"),
        '\u{246C}' | // ⑬  [CIRCLED NUMBER THIRTEEN]
        '\u{24ED}' // ⓭  [NEGATIVE CIRCLED NUMBER THIRTEEN]
        => Some("13"),
        '\u{2494}' // ⒔  [NUMBER THIRTEEN FULL STOP]
        => Some("13."),
        '\u{2480}' // ⒀  [PARENTHESIZED NUMBER THIRTEEN]
        => Some("(13)"),
        '\u{246D}' | // ⑭  [CIRCLED NUMBER FOURTEEN]
        '\u{24EE}' // ⓮  [NEGATIVE CIRCLED NUMBER FOURTEEN]
        => Some("14"),
        '\u{2495}' // ⒕  [NUMBER FOURTEEN FULL STOP]
        => Some("14."),
        '\u{2481}' // ⒁  [PARENTHESIZED NUMBER FOURTEEN]
        => Some("(14)"),
        '\u{246E}' | // ⑮  [CIRCLED NUMBER FIFTEEN]
        '\u{24EF}' // ⓯  [NEGATIVE CIRCLED NUMBER FIFTEEN]
        => Some("15"),
        '\u{2496}' // ⒖  [NUMBER FIFTEEN FULL STOP]
        => Some("15."),
        '\u{2482}' // ⒂  [PARENTHESIZED NUMBER FIFTEEN]
        => Some("(15)"),
        '\u{246F}' | // ⑯  [CIRCLED NUMBER SIXTEEN]
        '\u{24F0}' // ⓰  [NEGATIVE CIRCLED NUMBER SIXTEEN]
        => Some("16"),
        '\u{2497}' // ⒗  [NUMBER SIXTEEN FULL STOP]
        => Some("16."),
        '\u{2483}' // ⒃  [PARENTHESIZED NUMBER SIXTEEN]
        => Some("(16)"),
        '\u{2470}' | // ⑰  [CIRCLED NUMBER SEVENTEEN]
        '\u{24F1}' // ⓱  [NEGATIVE CIRCLED NUMBER SEVENTEEN]
        => Some("17"),
        '\u{2498}' // ⒘  [NUMBER SEVENTEEN FULL STOP]
        => Some("17."),
        '\u{2484}' // ⒄  [PARENTHESIZED NUMBER SEVENTEEN]
        => Some("(17)"),
        '\u{2471}' | // ⑱  [CIRCLED NUMBER EIGHTEEN]
        '\u{24F2}' // ⓲  [NEGATIVE CIRCLED NUMBER EIGHTEEN]
        => Some("18"),
        '\u{2499}' // ⒙  [NUMBER EIGHTEEN FULL STOP]
        => Some("18."),
        '\u{2485}' // ⒅  [PARENTHESIZED NUMBER EIGHTEEN]
        => Some("(18)"),
        '\u{2472}' | // ⑲  [CIRCLED NUMBER NINETEEN]
        '\u{24F3}' // ⓳  [NEGATIVE CIRCLED NUMBER NINETEEN]
        => Some("19"),
        '\u{249A}' // ⒚  [NUMBER NINETEEN FULL STOP]
        => Some("19."),
        '\u{2486}' // ⒆  [PARENTHESIZED NUMBER NINETEEN]
        => Some("(19)"),
        '\u{2473}' | // ⑳  [CIRCLED NUMBER TWENTY]
        '\u{24F4}' // ⓴  [NEGATIVE CIRCLED NUMBER TWENTY]
        => Some("20"),
        '\u{249B}' // ⒛  [NUMBER TWENTY FULL STOP]
        => Some("20."),
        '\u{2487}' // ⒇  [PARENTHESIZED NUMBER TWENTY]
        => Some("(20)"),
        '\u{00AB}' | // «  [LEFT-POINTING DOUBLE ANGLE QUOTATION MARK]
        '\u{00BB}' | // »  [RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK]
        '\u{201C}' | // “  [LEFT DOUBLE QUOTATION MARK]
        '\u{201D}' | // ”  [RIGHT DOUBLE QUOTATION MARK]
        '\u{201E}' | // „  [DOUBLE LOW-9 QUOTATION MARK]
        '\u{2033}' | // ″  [DOUBLE PRIME]
        '\u{2036}' | // ‶  [REVERSED DOUBLE PRIME]
        '\u{275D}' | // ❝  [HEAVY DOUBLE TURNED COMMA QUOTATION MARK ORNAMENT]
        '\u{275E}' | // ❞  [HEAVY DOUBLE COMMA QUOTATION MARK ORNAMENT]
        '\u{276E}' | // ❮  [HEAVY LEFT-POINTING ANGLE QUOTATION MARK ORNAMENT]
        '\u{276F}' | // ❯  [HEAVY RIGHT-POINTING ANGLE QUOTATION MARK ORNAMENT]
        '\u{FF02}' // ＂  [FULLWIDTH QUOTATION MARK]
        => Some("\""),
        '\u{2018}' | // ‘  [LEFT SINGLE QUOTATION MARK]
        '\u{2019}' | // ’  [RIGHT SINGLE QUOTATION MARK]
        '\u{201A}' | // ‚  [SINGLE LOW-9 QUOTATION MARK]
        '\u{201B}' | // ‛  [SINGLE HIGH-REVERSED-9 QUOTATION MARK]
        '\u{2032}' | // ′  [PRIME]
        '\u{2035}' | // ‵  [REVERSED PRIME]
        '\u{2039}' | // ‹  [SINGLE LEFT-POINTING ANGLE QUOTATION MARK]
        '\u{203A}' | // ›  [SINGLE RIGHT-POINTING ANGLE QUOTATION MARK]
        '\u{275B}' | // ❛  [HEAVY SINGLE TURNED COMMA QUOTATION MARK ORNAMENT]
        '\u{275C}' | // ❜  [HEAVY SINGLE COMMA QUOTATION MARK ORNAMENT]
        '\u{FF07}' // ＇  [FULLWIDTH APOSTROPHE]
        => Some("\'"),
        '\u{2010}' | // ‐  [HYPHEN]
        '\u{2011}' | // ‑  [NON-BREAKING HYPHEN]
        '\u{2012}' | // ‒  [FIGURE DASH]
        '\u{2013}' | // –  [EN DASH]
        '\u{2014}' | // —  [EM DASH]
        '\u{207B}' | // ⁻  [SUPERSCRIPT MINUS]
        '\u{208B}' | // ₋  [SUBSCRIPT MINUS]
        '\u{FF0D}' // －  [FULLWIDTH HYPHEN-MINUS]
        => Some("-"),
        '\u{2045}' | // ⁅  [LEFT SQUARE BRACKET WITH QUILL]
        '\u{2772}' | // ❲  [LIGHT LEFT TORTOISE SHELL BRACKET ORNAMENT]
        '\u{FF3B}' // ［  [FULLWIDTH LEFT SQUARE BRACKET]
        => Some("["),
        '\u{2046}' | // ⁆  [RIGHT SQUARE BRACKET WITH QUILL]
        '\u{2773}' | // ❳  [LIGHT RIGHT TORTOISE SHELL BRACKET ORNAMENT]
        '\u{FF3D}' // ］  [FULLWIDTH RIGHT SQUARE BRACKET]
        => Some("]"),
        '\u{207D}' | // ⁽  [SUPERSCRIPT LEFT PARENTHESIS]
        '\u{208D}' | // ₍  [SUBSCRIPT LEFT PARENTHESIS]
        '\u{2768}' | // ❨  [MEDIUM LEFT PARENTHESIS ORNAMENT]
        '\u{276A}' | // ❪  [MEDIUM FLATTENED LEFT PARENTHESIS ORNAMENT]
        '\u{FF08}' // （  [FULLWIDTH LEFT PARENTHESIS]
        => Some("("),
        '\u{2E28}' // ⸨  [LEFT DOUBLE PARENTHESIS]
        => Some("(("),
        '\u{207E}' | // ⁾  [SUPERSCRIPT RIGHT PARENTHESIS]
        '\u{208E}' | // ₎  [SUBSCRIPT RIGHT PARENTHESIS]
        '\u{2769}' | // ❩  [MEDIUM RIGHT PARENTHESIS ORNAMENT]
        '\u{276B}' | // ❫  [MEDIUM FLATTENED RIGHT PARENTHESIS ORNAMENT]
        '\u{FF09}' // ）  [FULLWIDTH RIGHT PARENTHESIS]
        => Some(")"),
        '\u{2E29}' // ⸩  [RIGHT DOUBLE PARENTHESIS]
        => Some("))"),
        '\u{276C}' | // ❬  [MEDIUM LEFT-POINTING ANGLE BRACKET ORNAMENT]
        '\u{2770}' | // ❰  [HEAVY LEFT-POINTING ANGLE BRACKET ORNAMENT]
        '\u{FF1C}' // ＜  [FULLWIDTH LESS-THAN SIGN]
        => Some("<"),
        '\u{276D}' | // ❭  [MEDIUM RIGHT-POINTING ANGLE BRACKET ORNAMENT]
        '\u{2771}' | // ❱  [HEAVY RIGHT-POINTING ANGLE BRACKET ORNAMENT]
        '\u{FF1E}' // ＞  [FULLWIDTH GREATER-THAN SIGN]
        => Some(">"),
        '\u{2774}' | // ❴  [MEDIUM LEFT CURLY BRACKET ORNAMENT]
        '\u{FF5B}' // ｛  [FULLWIDTH LEFT CURLY BRACKET]
        => Some("{"),
        '\u{2775}' | // ❵  [MEDIUM RIGHT CURLY BRACKET ORNAMENT]
        '\u{FF5D}' // ｝  [FULLWIDTH RIGHT CURLY BRACKET]
        => Some("}"),
        '\u{207A}' | // ⁺  [SUPERSCRIPT PLUS SIGN]
        '\u{208A}' | // ₊  [SUBSCRIPT PLUS SIGN]
        '\u{FF0B}' // ＋  [FULLWIDTH PLUS SIGN]
        => Some("+"),
        '\u{207C}' | // ⁼  [SUPERSCRIPT EQUALS SIGN]
        '\u{208C}' | // ₌  [SUBSCRIPT EQUALS SIGN]
        '\u{FF1D}' // ＝  [FULLWIDTH EQUALS SIGN]
        => Some("="),
        '\u{FF01}' // ！  [FULLWIDTH EXCLAMATION MARK]
        => Some("!"),
        '\u{203C}' // ‼  [DOUBLE EXCLAMATION MARK]
        => Some("!!"),
        '\u{2049}' // ⁉  [EXCLAMATION QUESTION MARK]
        => Some("!?"),
        '\u{FF03}' // ＃  [FULLWIDTH NUMBER SIGN]
        => Some("#"),
        '\u{FF04}' // ＄  [FULLWIDTH DOLLAR SIGN]
        => Some("$"),
        '\u{2052}' | // ⁒  [COMMERCIAL MINUS SIGN]
        '\u{FF05}' // ％  [FULLWIDTH PERCENT SIGN]
        => Some("%"),
        '\u{FF06}' // ＆  [FULLWIDTH AMPERSAND]
        => Some("&"),
        '\u{204E}' | // ⁎  [LOW ASTERISK]
        '\u{FF0A}' // ＊  [FULLWIDTH ASTERISK]
        => Some("*"),
        '\u{FF0C}' // ，  [FULLWIDTH COMMA]
        => Some(","),
        '\u{FF0E}' // ．  [FULLWIDTH FULL STOP]
        => Some("."),
        '\u{2044}' | // ⁄  [FRACTION SLASH]
        '\u{FF0F}' // ／  [FULLWIDTH SOLIDUS]
        => Some("/"),
        '\u{FF1A}' // ：  [FULLWIDTH COLON]
        => Some(":"),
        '\u{204F}' | // ⁏  [REVERSED SEMICOLON]
        '\u{FF1B}' // ；  [FULLWIDTH SEMICOLON]
        => Some(";"),
        '\u{FF1F}' // ？  [FULLWIDTH QUESTION MARK]
        => Some("?"),
        '\u{2047}' // ⁇  [DOUBLE QUESTION MARK]
        => Some("??"),
        '\u{2048}' // ⁈  [QUESTION EXCLAMATION MARK]
        => Some("?!"),
        '\u{FF20}' // ＠  [FULLWIDTH COMMERCIAL AT]
        => Some("@"),
        '\u{FF3C}' // ＼  [FULLWIDTH REVERSE SOLIDUS]
        => Some("\\"),
        '\u{2038}' | // ‸  [CARET]
        '\u{FF3E}' // ＾  [FULLWIDTH CIRCUMFLEX ACCENT]
        => Some("^"),
        '\u{FF3F}' // ＿  [FULLWIDTH LOW LINE]
        => Some("_"),
        '\u{2053}' | // ⁓  [SWUNG DASH]
        '\u{FF5E}' // ～  [FULLWIDTH TILDE]
        => Some("~"),
        _ => None
    }
}

// https://github.com/apache/lucene-solr/blob/master/lucene/analysis/common/src/java/org/apache/lucene/analysis/miscellaneous/ASCIIFoldingFilter.java#L187
/// Writes an ASCII-folded copy of `text` into `output`.
///
/// `output` is cleared first, so anything it held before the call is
/// discarded. Each character of `text` is then looked up with
/// `fold_non_ascii_char`: when a replacement exists it is appended in place of
/// the character, otherwise the character itself is appended unchanged.
fn to_ascii(text: &str, output: &mut String) {
    output.clear();

    text.chars().for_each(|ch| match fold_non_ascii_char(ch) {
        // A replacement may be longer than one character (e.g. "(15)").
        Some(replacement) => output.push_str(replacement),
        None => output.push(ch),
    });
}

#[cfg(test)]
mod tests {

    use super::to_ascii;
    use crate::tokenizer::{AsciiFoldingFilter, RawTokenizer, SimpleTokenizer, TextAnalyzer};

    /// Accented letters in single-word inputs are folded to plain ASCII.
    #[test]
    fn test_ascii_folding() {
        // (input, the single token expected back)
        let cases = [
            ("Ràmon", "Ramon"),
            ("accentué", "accentue"),
            ("âäàéè", "aaaee"),
        ];
        for (input, expected) in cases {
            assert_eq!(folding_helper(input), [expected]);
        }
    }

    /// A word that is already plain ASCII comes back unchanged.
    #[test]
    fn test_no_change() {
        let tokens = folding_helper("Usagi");
        assert_eq!(tokens, ["Usagi"]);
    }

    /// Runs `text` through a `SimpleTokenizer` + `AsciiFoldingFilter` analyzer
    /// and returns the text of every token, in the order the stream hands
    /// them to the sink.
    fn folding_helper(text: &str) -> Vec<String> {
        let mut analyzer = TextAnalyzer::builder(SimpleTokenizer::default())
            .filter(AsciiFoldingFilter)
            .build();
        let mut stream = analyzer.token_stream(text);

        let mut collected = Vec::new();
        stream.process(&mut |token| collected.push(token.text.clone()));
        collected
    }

    /// Runs `text` through a `RawTokenizer` + `AsciiFoldingFilter` analyzer,
    /// advances the resulting stream once, and returns the text of the token
    /// the stream then exposes.
    fn folding_using_raw_tokenizer_helper(text: &str) -> String {
        let mut analyzer = TextAnalyzer::builder(RawTokenizer::default())
            .filter(AsciiFoldingFilter)
            .build();
        let mut stream = analyzer.token_stream(text);

        // Whatever `advance()` returns is ignored; the call is only needed to
        // move the stream before reading its current token.
        stream.advance();
        let current = stream.token();
        current.text.clone()
    }

    /// Folds a sentence full of accented letters, digraphs and ligatures and
    /// checks every token that comes out.
    #[test]
    fn test_latin1_characters() {
        let latin1_string = "Des mot clés À LA CHAÎNE À Á Â Ã Ä Å Æ Ç È É Ê Ë Ì Í Î Ï Ĳ Ð Ñ
                   Ò Ó Ô Õ Ö Ø Œ Þ Ù Ú Û Ü Ý Ÿ à á â ã ä å æ ç è é ê ë ì í î ï ĳ
                   ð ñ ò ó ô õ ö ø œ ß þ ù ú û ü ý ÿ ﬁ ﬂ";

        // Run-length description of the expected tokens:
        // (token, how many times it appears consecutively).
        let runs: &[(&str, usize)] = &[
            ("Des", 1),
            ("mot", 1),
            ("cles", 1),
            ("A", 1),
            ("LA", 1),
            ("CHAINE", 1),
            // Upper-case letters.
            ("A", 6),
            ("AE", 1),
            ("C", 1),
            ("E", 4),
            ("I", 4),
            ("IJ", 1),
            ("D", 1),
            ("N", 1),
            ("O", 6),
            ("OE", 1),
            ("TH", 1),
            ("U", 4),
            ("Y", 2),
            // Lower-case letters and ligatures.
            ("a", 6),
            ("ae", 1),
            ("c", 1),
            ("e", 4),
            ("i", 4),
            ("ij", 1),
            ("d", 1),
            ("n", 1),
            ("o", 6),
            ("oe", 1),
            ("ss", 1),
            ("th", 1),
            ("u", 4),
            ("y", 2),
            ("fi", 1),
            ("fl", 1),
        ];
        let expected: Vec<&str> = runs
            .iter()
            .flat_map(|&(token, count)| std::iter::repeat_n(token, count))
            .collect();

        assert_eq!(folding_helper(latin1_string), expected);
    }

    /// Checks that `§ ¦ ¤ END` comes back from the filter exactly as it went in.
    #[test]
    fn test_unmodified_letters() {
        let untouched = "§ ¦ ¤ END";
        assert_eq!(folding_using_raw_tokenizer_helper(untouched), untouched);
    }

    /// Exercises `to_ascii` directly, without going through a tokenizer.
    #[test]
    fn test_to_ascii() {
        let mut folded = String::new();
        to_ascii("Rámon", &mut folded);
        assert_eq!(folded, "Ramon");
    }

    #[test]
    fn test_all_foldings() {
        // These foldings are a copy of
        // https://github.com/apache/lucene-solr/blob/28d187acd1e391723eb6e1b5445f22abf5580a80/lucene/analysis/common/src/test/org/apache/lucene/analysis/miscellaneous/TestASCIIFoldingFilter.java
        // useful regex to adapt to a Rust structure:
        // 1. Preg and replace folded:
        //    - **REGEX** |,"(.){3,5}", // Folded result|
        //    - **REPLACEMENT** ], "$1".to_string(), ), ( vec![
        // 2. Preg and replace characters:
        //    - **REGEX** |[\+]{0,1} "(.{1,3})"  // U\+|
        //    - **REPLACEMENT** "$1",  // U+
        let foldings: Vec<(&[&str], &str)> = vec![
            (
                &[
                    "À",  // U+00C0: LATIN CAPITAL LETTER A WITH GRAVE
                    "Á",  // U+00C1: LATIN CAPITAL LETTER A WITH ACUTE
                    "Â",  // U+00C2: LATIN CAPITAL LETTER A WITH CIRCUMFLEX
                    "Ã",  // U+00C3: LATIN CAPITAL LETTER A WITH TILDE
                    "Ä",  // U+00C4: LATIN CAPITAL LETTER A WITH DIAERESIS
                    "Å",  // U+00C5: LATIN CAPITAL LETTER A WITH RING ABOVE
                    "Ā",  // U+0100: LATIN CAPITAL LETTER A WITH MACRON
                    "Ă",  // U+0102: LATIN CAPITAL LETTER A WITH BREVE
                    "Ą",  // U+0104: LATIN CAPITAL LETTER A WITH OGONEK
                    "Ə",  // U+018F: LATIN CAPITAL LETTER SCHWA
                    "Ǎ",  // U+01CD: LATIN CAPITAL LETTER A WITH CARON
                    "Ǟ",  // U+01DE: LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON
                    "Ǡ",  // U+01E0: LATIN CAPITAL LETTER A WITH DOT ABOVE AND MACRON
                    "Ǻ",  // U+01FA: LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE
                    "Ȁ",  // U+0200: LATIN CAPITAL LETTER A WITH DOUBLE GRAVE
                    "Ȃ",  // U+0202: LATIN CAPITAL LETTER A WITH INVERTED BREVE
                    "Ȧ",  // U+0226: LATIN CAPITAL LETTER A WITH DOT ABOVE
                    "Ⱥ",  // U+023A: LATIN CAPITAL LETTER A WITH STROKE
                    "ᴀ",  // U+1D00: LATIN LETTER SMALL CAPITAL A
                    "Ḁ",  // U+1E00: LATIN CAPITAL LETTER A WITH RING BELOW
                    "Ạ",  // U+1EA0: LATIN CAPITAL LETTER A WITH DOT BELOW
                    "Ả",  // U+1EA2: LATIN CAPITAL LETTER A WITH HOOK ABOVE
                    "Ấ",  // U+1EA4: LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND ACUTE
                    "Ầ",  // U+1EA6: LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND GRAVE
                    "Ẩ",  // U+1EA8: LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND HOOK ABOVE
                    "Ẫ",  // U+1EAA: LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND TILDE
                    "Ậ",  // U+1EAC: LATIN CAPITAL LETTER A WITH CIRCUMFLEX AND DOT BELOW
                    "Ắ",  // U+1EAE: LATIN CAPITAL LETTER A WITH BREVE AND ACUTE
                    "Ằ",  // U+1EB0: LATIN CAPITAL LETTER A WITH BREVE AND GRAVE
                    "Ẳ",  // U+1EB2: LATIN CAPITAL LETTER A WITH BREVE AND HOOK ABOVE
                    "Ẵ",  // U+1EB4: LATIN CAPITAL LETTER A WITH BREVE AND TILDE
                    "Ặ",  // U+1EB6: LATIN CAPITAL LETTER A WITH BREVE AND DOT BELOW
                    "Ⓐ",  // U+24B6: CIRCLED LATIN CAPITAL LETTER A
                    "Ａ", // U+FF21: FULLWIDTH LATIN CAPITAL LETTER A
                ],
                "A",
            ),
            (
                &[
                    "à",  // U+00E0: LATIN SMALL LETTER A WITH GRAVE
                    "á",  // U+00E1: LATIN SMALL LETTER A WITH ACUTE
                    "â",  // U+00E2: LATIN SMALL LETTER A WITH CIRCUMFLEX
                    "ã",  // U+00E3: LATIN SMALL LETTER A WITH TILDE
                    "ä",  // U+00E4: LATIN SMALL LETTER A WITH DIAERESIS
                    "å",  // U+00E5: LATIN SMALL LETTER A WITH RING ABOVE
                    "ā",  // U+0101: LATIN SMALL LETTER A WITH MACRON
                    "ă",  // U+0103: LATIN SMALL LETTER A WITH BREVE
                    "ą",  // U+0105: LATIN SMALL LETTER A WITH OGONEK
                    "ǎ",  // U+01CE: LATIN SMALL LETTER A WITH CARON
                    "ǟ",  // U+01DF: LATIN SMALL LETTER A WITH DIAERESIS AND MACRON
                    "ǡ",  // U+01E1: LATIN SMALL LETTER A WITH DOT ABOVE AND MACRON
                    "ǻ",  // U+01FB: LATIN SMALL LETTER A WITH RING ABOVE AND ACUTE
                    "ȁ",  // U+0201: LATIN SMALL LETTER A WITH DOUBLE GRAVE
                    "ȃ",  // U+0203: LATIN SMALL LETTER A WITH INVERTED BREVE
                    "ȧ",  // U+0227: LATIN SMALL LETTER A WITH DOT ABOVE
                    "ɐ",  // U+0250: LATIN SMALL LETTER TURNED A
                    "ə",  // U+0259: LATIN SMALL LETTER SCHWA
                    "ɚ",  // U+025A: LATIN SMALL LETTER SCHWA WITH HOOK
                    "ᶏ",  // U+1D8F: LATIN SMALL LETTER A WITH RETROFLEX HOOK
                    "ḁ",  // U+1E01: LATIN SMALL LETTER A WITH RING BELOW
                    "ᶕ",  // U+1D95: LATIN SMALL LETTER SCHWA WITH RETROFLEX HOOK
                    "ẚ",  // U+1E9A: LATIN SMALL LETTER A WITH RIGHT HALF RING
                    "ạ",  // U+1EA1: LATIN SMALL LETTER A WITH DOT BELOW
                    "ả",  // U+1EA3: LATIN SMALL LETTER A WITH HOOK ABOVE
                    "ấ",  // U+1EA5: LATIN SMALL LETTER A WITH CIRCUMFLEX AND ACUTE
                    "ầ",  // U+1EA7: LATIN SMALL LETTER A WITH CIRCUMFLEX AND GRAVE
                    "ẩ",  // U+1EA9: LATIN SMALL LETTER A WITH CIRCUMFLEX AND HOOK ABOVE
                    "ẫ",  // U+1EAB: LATIN SMALL LETTER A WITH CIRCUMFLEX AND TILDE
                    "ậ",  // U+1EAD: LATIN SMALL LETTER A WITH CIRCUMFLEX AND DOT BELOW
                    "ắ",  // U+1EAF: LATIN SMALL LETTER A WITH BREVE AND ACUTE
                    "ằ",  // U+1EB1: LATIN SMALL LETTER A WITH BREVE AND GRAVE
                    "ẳ",  // U+1EB3: LATIN SMALL LETTER A WITH BREVE AND HOOK ABOVE
                    "ẵ",  // U+1EB5: LATIN SMALL LETTER A WITH BREVE AND TILDE
                    "ặ",  // U+1EB7: LATIN SMALL LETTER A WITH BREVE AND DOT BELOW
                    "ₐ",  // U+2090: LATIN SUBSCRIPT SMALL LETTER A
                    "ₔ",  // U+2094: LATIN SUBSCRIPT SMALL LETTER SCHWA
                    "ⓐ",  // U+24D0: CIRCLED LATIN SMALL LETTER A
                    "ⱥ",  // U+2C65: LATIN SMALL LETTER A WITH STROKE
                    "Ɐ",  // U+2C6F: LATIN CAPITAL LETTER TURNED A
                    "ａ", // U+FF41: FULLWIDTH LATIN SMALL LETTER A
                ],
                "a",
            ),
            (
                &[
                    "Ꜳ", // U+A732: LATIN CAPITAL LETTER AA
                ],
                "AA",
            ),
            (
                &[
                    "Æ", // U+00C6: LATIN CAPITAL LETTER AE
                    "Ǣ", // U+01E2: LATIN CAPITAL LETTER AE WITH MACRON
                    "Ǽ", // U+01FC: LATIN CAPITAL LETTER AE WITH ACUTE
                    "ᴁ", // U+1D01: LATIN LETTER SMALL CAPITAL AE
                ],
                "AE",
            ),
            (
                &[
                    "Ꜵ", // U+A734: LATIN CAPITAL LETTER AO
                ],
                "AO",
            ),
            (
                &[
                    "Ꜷ", // U+A736: LATIN CAPITAL LETTER AU
                ],
                "AU",
            ),
            (
                &[
                    "Ꜹ", // U+A738: LATIN CAPITAL LETTER AV
                    "Ꜻ", // U+A73A: LATIN CAPITAL LETTER AV WITH HORIZONTAL BAR
                ],
                "AV",
            ),
            (
                &[
                    "Ꜽ", // U+A73C: LATIN CAPITAL LETTER AY
                ],
                "AY",
            ),
            (
                &[
                    "⒜", // U+249C: PARENTHESIZED LATIN SMALL LETTER A
                ],
                "(a)",
            ),
            (
                &[
                    "ꜳ", // U+A733: LATIN SMALL LETTER AA
                ],
                "aa",
            ),
            (
                &[
                    "æ", // U+00E6: LATIN SMALL LETTER AE
                    "ǣ", // U+01E3: LATIN SMALL LETTER AE WITH MACRON
                    "ǽ", // U+01FD: LATIN SMALL LETTER AE WITH ACUTE
                    "ᴂ", // U+1D02: LATIN SMALL LETTER TURNED AE
                ],
                "ae",
            ),
            (
                &[
                    "ꜵ", // U+A735: LATIN SMALL LETTER AO
                ],
                "ao",
            ),
            (
                &[
                    "ꜷ", // U+A737: LATIN SMALL LETTER AU
                ],
                "au",
            ),
            (
                &[
                    "ꜹ", // U+A739: LATIN SMALL LETTER AV
                    "ꜻ", // U+A73B: LATIN SMALL LETTER AV WITH HORIZONTAL BAR
                ],
                "av",
            ),
            (
                &[
                    "ꜽ", // U+A73D: LATIN SMALL LETTER AY
                ],
                "ay",
            ),
            (
                &[
                    "Ɓ",  // U+0181: LATIN CAPITAL LETTER B WITH HOOK
                    "Ƃ",  // U+0182: LATIN CAPITAL LETTER B WITH TOPBAR
                    "Ƀ",  // U+0243: LATIN CAPITAL LETTER B WITH STROKE
                    "ʙ",  // U+0299: LATIN LETTER SMALL CAPITAL B
                    "ᴃ",  // U+1D03: LATIN LETTER SMALL CAPITAL BARRED B
                    "Ḃ",  // U+1E02: LATIN CAPITAL LETTER B WITH DOT ABOVE
                    "Ḅ",  // U+1E04: LATIN CAPITAL LETTER B WITH DOT BELOW
                    "Ḇ",  // U+1E06: LATIN CAPITAL LETTER B WITH LINE BELOW
                    "Ⓑ",  // U+24B7: CIRCLED LATIN CAPITAL LETTER B
                    "Ｂ", // U+FF22: FULLWIDTH LATIN CAPITAL LETTER B
                ],
                "B",
            ),
            (
                &[
                    "ƀ",  // U+0180: LATIN SMALL LETTER B WITH STROKE
                    "ƃ",  // U+0183: LATIN SMALL LETTER B WITH TOPBAR
                    "ɓ",  // U+0253: LATIN SMALL LETTER B WITH HOOK
                    "ᵬ",  // U+1D6C: LATIN SMALL LETTER B WITH MIDDLE TILDE
                    "ᶀ",  // U+1D80: LATIN SMALL LETTER B WITH PALATAL HOOK
                    "ḃ",  // U+1E03: LATIN SMALL LETTER B WITH DOT ABOVE
                    "ḅ",  // U+1E05: LATIN SMALL LETTER B WITH DOT BELOW
                    "ḇ",  // U+1E07: LATIN SMALL LETTER B WITH LINE BELOW
                    "ⓑ",  // U+24D1: CIRCLED LATIN SMALL LETTER B
                    "ｂ", // U+FF42: FULLWIDTH LATIN SMALL LETTER B
                ],
                "b",
            ),
            (
                &[
                    "⒝", // U+249D: PARENTHESIZED LATIN SMALL LETTER B
                ],
                "(b)",
            ),
            (
                &[
                    "Ç",  // U+00C7: LATIN CAPITAL LETTER C WITH CEDILLA
                    "Ć",  // U+0106: LATIN CAPITAL LETTER C WITH ACUTE
                    "Ĉ",  // U+0108: LATIN CAPITAL LETTER C WITH CIRCUMFLEX
                    "Ċ",  // U+010A: LATIN CAPITAL LETTER C WITH DOT ABOVE
                    "Č",  // U+010C: LATIN CAPITAL LETTER C WITH CARON
                    "Ƈ",  // U+0187: LATIN CAPITAL LETTER C WITH HOOK
                    "Ȼ",  // U+023B: LATIN CAPITAL LETTER C WITH STROKE
                    "ʗ",  // U+0297: LATIN LETTER STRETCHED C
                    "ᴄ",  // U+1D04: LATIN LETTER SMALL CAPITAL C
                    "Ḉ",  // U+1E08: LATIN CAPITAL LETTER C WITH CEDILLA AND ACUTE
                    "Ⓒ",  // U+24B8: CIRCLED LATIN CAPITAL LETTER C
                    "Ｃ", // U+FF23: FULLWIDTH LATIN CAPITAL LETTER C
                ],
                "C",
            ),
            (
                &[
                    "ç",  // U+00E7: LATIN SMALL LETTER C WITH CEDILLA
                    "ć",  // U+0107: LATIN SMALL LETTER C WITH ACUTE
                    "ĉ",  // U+0109: LATIN SMALL LETTER C WITH CIRCUMFLEX
                    "ċ",  // U+010B: LATIN SMALL LETTER C WITH DOT ABOVE
                    "č",  // U+010D: LATIN SMALL LETTER C WITH CARON
                    "ƈ",  // U+0188: LATIN SMALL LETTER C WITH HOOK
                    "ȼ",  // U+023C: LATIN SMALL LETTER C WITH STROKE
                    "ɕ",  // U+0255: LATIN SMALL LETTER C WITH CURL
                    "ḉ",  // U+1E09: LATIN SMALL LETTER C WITH CEDILLA AND ACUTE
                    "ↄ",  // U+2184: LATIN SMALL LETTER REVERSED C
                    "ⓒ",  // U+24D2: CIRCLED LATIN SMALL LETTER C
                    "Ꜿ",  // U+A73E: LATIN CAPITAL LETTER REVERSED C WITH DOT
                    "ꜿ",  // U+A73F: LATIN SMALL LETTER REVERSED C WITH DOT
                    "ｃ", // U+FF43: FULLWIDTH LATIN SMALL LETTER C
                ],
                "c",
            ),
            (
                &[
                    "⒞", // U+249E: PARENTHESIZED LATIN SMALL LETTER C
                ],
                "(c)",
            ),
            (
                &[
                    "Ð",  // U+00D0: LATIN CAPITAL LETTER ETH
                    "Ď",  // U+010E: LATIN CAPITAL LETTER D WITH CARON
                    "Đ",  // U+0110: LATIN CAPITAL LETTER D WITH STROKE
                    "Ɖ",  // U+0189: LATIN CAPITAL LETTER AFRICAN D
                    "Ɗ",  // U+018A: LATIN CAPITAL LETTER D WITH HOOK
                    "Ƌ",  // U+018B: LATIN CAPITAL LETTER D WITH TOPBAR
                    "ᴅ",  // U+1D05: LATIN LETTER SMALL CAPITAL D
                    "ᴆ",  // U+1D06: LATIN LETTER SMALL CAPITAL ETH
                    "Ḋ",  // U+1E0A: LATIN CAPITAL LETTER D WITH DOT ABOVE
                    "Ḍ",  // U+1E0C: LATIN CAPITAL LETTER D WITH DOT BELOW
                    "Ḏ",  // U+1E0E: LATIN CAPITAL LETTER D WITH LINE BELOW
                    "Ḑ",  // U+1E10: LATIN CAPITAL LETTER D WITH CEDILLA
                    "Ḓ",  // U+1E12: LATIN CAPITAL LETTER D WITH CIRCUMFLEX BELOW
                    "Ⓓ",  // U+24B9: CIRCLED LATIN CAPITAL LETTER D
                    "Ꝺ",  // U+A779: LATIN CAPITAL LETTER INSULAR D
                    "Ｄ", // U+FF24: FULLWIDTH LATIN CAPITAL LETTER D
                ],
                "D",
            ),
            (
                &[
                    "ð",  // U+00F0: LATIN SMALL LETTER ETH
                    "ď",  // U+010F: LATIN SMALL LETTER D WITH CARON
                    "đ",  // U+0111: LATIN SMALL LETTER D WITH STROKE
                    "ƌ",  // U+018C: LATIN SMALL LETTER D WITH TOPBAR
                    "ȡ",  // U+0221: LATIN SMALL LETTER D WITH CURL
                    "ɖ",  // U+0256: LATIN SMALL LETTER D WITH TAIL
                    "ɗ",  // U+0257: LATIN SMALL LETTER D WITH HOOK
                    "ᵭ",  // U+1D6D: LATIN SMALL LETTER D WITH MIDDLE TILDE
                    "ᶁ",  // U+1D81: LATIN SMALL LETTER D WITH PALATAL HOOK
                    "ᶑ",  // U+1D91: LATIN SMALL LETTER D WITH HOOK AND TAIL
                    "ḋ",  // U+1E0B: LATIN SMALL LETTER D WITH DOT ABOVE
                    "ḍ",  // U+1E0D: LATIN SMALL LETTER D WITH DOT BELOW
                    "ḏ",  // U+1E0F: LATIN SMALL LETTER D WITH LINE BELOW
                    "ḑ",  // U+1E11: LATIN SMALL LETTER D WITH CEDILLA
                    "ḓ",  // U+1E13: LATIN SMALL LETTER D WITH CIRCUMFLEX BELOW
                    "ⓓ",  // U+24D3: CIRCLED LATIN SMALL LETTER D
                    "ꝺ",  // U+A77A: LATIN SMALL LETTER INSULAR D
                    "ｄ", // U+FF44: FULLWIDTH LATIN SMALL LETTER D
                ],
                "d",
            ),
            (
                &[
                    "Ǆ", // U+01C4: LATIN CAPITAL LETTER DZ WITH CARON
                    "Ǳ", // U+01F1: LATIN CAPITAL LETTER DZ
                ],
                "DZ",
            ),
            (
                &[
                    "ǅ", // U+01C5: LATIN CAPITAL LETTER D WITH SMALL LETTER Z WITH CARON
                    "ǲ", // U+01F2: LATIN CAPITAL LETTER D WITH SMALL LETTER Z
                ],
                "Dz",
            ),
            (
                &[
                    "⒟", // U+249F: PARENTHESIZED LATIN SMALL LETTER D
                ],
                "(d)",
            ),
            (
                &[
                    "ȸ", // U+0238: LATIN SMALL LETTER DB DIGRAPH
                ],
                "db",
            ),
            (
                &[
                    "ǆ", // U+01C6: LATIN SMALL LETTER DZ WITH CARON
                    "ǳ", // U+01F3: LATIN SMALL LETTER DZ
                    "ʣ", // U+02A3: LATIN SMALL LETTER DZ DIGRAPH
                    "ʥ", // U+02A5: LATIN SMALL LETTER DZ DIGRAPH WITH CURL
                ],
                "dz",
            ),
            (
                &[
                    "È",  // U+00C8: LATIN CAPITAL LETTER E WITH GRAVE
                    "É",  // U+00C9: LATIN CAPITAL LETTER E WITH ACUTE
                    "Ê",  // U+00CA: LATIN CAPITAL LETTER E WITH CIRCUMFLEX
                    "Ë",  // U+00CB: LATIN CAPITAL LETTER E WITH DIAERESIS
                    "Ē",  // U+0112: LATIN CAPITAL LETTER E WITH MACRON
                    "Ĕ",  // U+0114: LATIN CAPITAL LETTER E WITH BREVE
                    "Ė",  // U+0116: LATIN CAPITAL LETTER E WITH DOT ABOVE
                    "Ę",  // U+0118: LATIN CAPITAL LETTER E WITH OGONEK
                    "Ě",  // U+011A: LATIN CAPITAL LETTER E WITH CARON
                    "Ǝ",  // U+018E: LATIN CAPITAL LETTER REVERSED E
                    "Ɛ",  // U+0190: LATIN CAPITAL LETTER OPEN E
                    "Ȅ",  // U+0204: LATIN CAPITAL LETTER E WITH DOUBLE GRAVE
                    "Ȇ",  // U+0206: LATIN CAPITAL LETTER E WITH INVERTED BREVE
                    "Ȩ",  // U+0228: LATIN CAPITAL LETTER E WITH CEDILLA
                    "Ɇ",  // U+0246: LATIN CAPITAL LETTER E WITH STROKE
                    "ᴇ",  // U+1D07: LATIN LETTER SMALL CAPITAL E
                    "Ḕ",  // U+1E14: LATIN CAPITAL LETTER E WITH MACRON AND GRAVE
                    "Ḗ",  // U+1E16: LATIN CAPITAL LETTER E WITH MACRON AND ACUTE
                    "Ḙ",  // U+1E18: LATIN CAPITAL LETTER E WITH CIRCUMFLEX BELOW
                    "Ḛ",  // U+1E1A: LATIN CAPITAL LETTER E WITH TILDE BELOW
                    "Ḝ",  // U+1E1C: LATIN CAPITAL LETTER E WITH CEDILLA AND BREVE
                    "Ẹ",  // U+1EB8: LATIN CAPITAL LETTER E WITH DOT BELOW
                    "Ẻ",  // U+1EBA: LATIN CAPITAL LETTER E WITH HOOK ABOVE
                    "Ẽ",  // U+1EBC: LATIN CAPITAL LETTER E WITH TILDE
                    "Ế",  // U+1EBE: LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND ACUTE
                    "Ề",  // U+1EC0: LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND GRAVE
                    "Ể",  // U+1EC2: LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND HOOK ABOVE
                    "Ễ",  // U+1EC4: LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND TILDE
                    "Ệ",  // U+1EC6: LATIN CAPITAL LETTER E WITH CIRCUMFLEX AND DOT BELOW
                    "Ⓔ",  // U+24BA: CIRCLED LATIN CAPITAL LETTER E
                    "ⱻ",  // U+2C7B: LATIN LETTER SMALL CAPITAL TURNED E
                    "Ｅ", // U+FF25: FULLWIDTH LATIN CAPITAL LETTER E
                ],
                "E",
            ),
            (
                &[
                    "è",  // U+00E8: LATIN SMALL LETTER E WITH GRAVE
                    "é",  // U+00E9: LATIN SMALL LETTER E WITH ACUTE
                    "ê",  // U+00EA: LATIN SMALL LETTER E WITH CIRCUMFLEX
                    "ë",  // U+00EB: LATIN SMALL LETTER E WITH DIAERESIS
                    "ē",  // U+0113: LATIN SMALL LETTER E WITH MACRON
                    "ĕ",  // U+0115: LATIN SMALL LETTER E WITH BREVE
                    "ė",  // U+0117: LATIN SMALL LETTER E WITH DOT ABOVE
                    "ę",  // U+0119: LATIN SMALL LETTER E WITH OGONEK
                    "ě",  // U+011B: LATIN SMALL LETTER E WITH CARON
                    "ǝ",  // U+01DD: LATIN SMALL LETTER TURNED E
                    "ȅ",  // U+0205: LATIN SMALL LETTER E WITH DOUBLE GRAVE
                    "ȇ",  // U+0207: LATIN SMALL LETTER E WITH INVERTED BREVE
                    "ȩ",  // U+0229: LATIN SMALL LETTER E WITH CEDILLA
                    "ɇ",  // U+0247: LATIN SMALL LETTER E WITH STROKE
                    "ɘ",  // U+0258: LATIN SMALL LETTER REVERSED E
                    "ɛ",  // U+025B: LATIN SMALL LETTER OPEN E
                    "ɜ",  // U+025C: LATIN SMALL LETTER REVERSED OPEN E
                    "ɝ",  // U+025D: LATIN SMALL LETTER REVERSED OPEN E WITH HOOK
                    "ɞ",  // U+025E: LATIN SMALL LETTER CLOSED REVERSED OPEN E
                    "ʚ",  // U+029A: LATIN SMALL LETTER CLOSED OPEN E
                    "ᴈ",  // U+1D08: LATIN SMALL LETTER TURNED OPEN E
                    "ᶒ",  // U+1D92: LATIN SMALL LETTER E WITH RETROFLEX HOOK
                    "ᶓ",  // U+1D93: LATIN SMALL LETTER OPEN E WITH RETROFLEX HOOK
                    "ᶔ",  // U+1D94: LATIN SMALL LETTER REVERSED OPEN E WITH RETROFLEX HOOK
                    "ḕ",  // U+1E15: LATIN SMALL LETTER E WITH MACRON AND GRAVE
                    "ḗ",  // U+1E17: LATIN SMALL LETTER E WITH MACRON AND ACUTE
                    "ḙ",  // U+1E19: LATIN SMALL LETTER E WITH CIRCUMFLEX BELOW
                    "ḛ",  // U+1E1B: LATIN SMALL LETTER E WITH TILDE BELOW
                    "ḝ",  // U+1E1D: LATIN SMALL LETTER E WITH CEDILLA AND BREVE
                    "ẹ",  // U+1EB9: LATIN SMALL LETTER E WITH DOT BELOW
                    "ẻ",  // U+1EBB: LATIN SMALL LETTER E WITH HOOK ABOVE
                    "ẽ",  // U+1EBD: LATIN SMALL LETTER E WITH TILDE
                    "ế",  // U+1EBF: LATIN SMALL LETTER E WITH CIRCUMFLEX AND ACUTE
                    "ề",  // U+1EC1: LATIN SMALL LETTER E WITH CIRCUMFLEX AND GRAVE
                    "ể",  // U+1EC3: LATIN SMALL LETTER E WITH CIRCUMFLEX AND HOOK ABOVE
                    "ễ",  // U+1EC5: LATIN SMALL LETTER E WITH CIRCUMFLEX AND TILDE
                    "ệ",  // U+1EC7: LATIN SMALL LETTER E WITH CIRCUMFLEX AND DOT BELOW
                    "ₑ",  // U+2091: LATIN SUBSCRIPT SMALL LETTER E
                    "ⓔ",  // U+24D4: CIRCLED LATIN SMALL LETTER E
                    "ⱸ",  // U+2C78: LATIN SMALL LETTER E WITH NOTCH
                    "ｅ", // U+FF45: FULLWIDTH LATIN SMALL LETTER E
                ],
                "e",
            ),
            (
                &[
                    "⒠", // U+24A0: PARENTHESIZED LATIN SMALL LETTER E
                ],
                "(e)",
            ),
            (
                &[
                    "Ƒ",  // U+0191: LATIN CAPITAL LETTER F WITH HOOK
                    "Ḟ",  // U+1E1E: LATIN CAPITAL LETTER F WITH DOT ABOVE
                    "Ⓕ",  // U+24BB: CIRCLED LATIN CAPITAL LETTER F
                    "ꜰ",  // U+A730: LATIN LETTER SMALL CAPITAL F
                    "Ꝼ",  // U+A77B: LATIN CAPITAL LETTER INSULAR F
                    "ꟻ",  // U+A7FB: LATIN EPIGRAPHIC LETTER REVERSED F
                    "Ｆ", // U+FF26: FULLWIDTH LATIN CAPITAL LETTER F
                ],
                "F",
            ),
            (
                &[
                    "ƒ",  // U+0192: LATIN SMALL LETTER F WITH HOOK
                    "ᵮ",  // U+1D6E: LATIN SMALL LETTER F WITH MIDDLE TILDE
                    "ᶂ",  // U+1D82: LATIN SMALL LETTER F WITH PALATAL HOOK
                    "ḟ",  // U+1E1F: LATIN SMALL LETTER F WITH DOT ABOVE
                    "ẛ",  // U+1E9B: LATIN SMALL LETTER LONG S WITH DOT ABOVE
                    "ⓕ",  // U+24D5: CIRCLED LATIN SMALL LETTER F
                    "ꝼ",  // U+A77C: LATIN SMALL LETTER INSULAR F
                    "ｆ", // U+FF46: FULLWIDTH LATIN SMALL LETTER F
                ],
                "f",
            ),
            (
                &[
                    "⒡", // U+24A1: PARENTHESIZED LATIN SMALL LETTER F
                ],
                "(f)",
            ),
            (
                &[
                    "ﬀ", // U+FB00: LATIN SMALL LIGATURE FF
                ],
                "ff",
            ),
            (
                &[
                    "ﬃ", // U+FB03: LATIN SMALL LIGATURE FFI
                ],
                "ffi",
            ),
            (
                &[
                    "ﬄ", // U+FB04: LATIN SMALL LIGATURE FFL
                ],
                "ffl",
            ),
            (
                &[
                    "ﬁ", // U+FB01: LATIN SMALL LIGATURE FI
                ],
                "fi",
            ),
            (
                &[
                    "ﬂ", // U+FB02: LATIN SMALL LIGATURE FL
                ],
                "fl",
            ),
            (
                &[
                    "Ĝ",  // U+011C: LATIN CAPITAL LETTER G WITH CIRCUMFLEX
                    "Ğ",  // U+011E: LATIN CAPITAL LETTER G WITH BREVE
                    "Ġ",  // U+0120: LATIN CAPITAL LETTER G WITH DOT ABOVE
                    "Ģ",  // U+0122: LATIN CAPITAL LETTER G WITH CEDILLA
                    "Ɠ",  // U+0193: LATIN CAPITAL LETTER G WITH HOOK
                    "Ǥ",  // U+01E4: LATIN CAPITAL LETTER G WITH STROKE
                    "ǥ",  // U+01E5: LATIN SMALL LETTER G WITH STROKE
                    "Ǧ",  // U+01E6: LATIN CAPITAL LETTER G WITH CARON
                    "ǧ",  // U+01E7: LATIN SMALL LETTER G WITH CARON
                    "Ǵ",  // U+01F4: LATIN CAPITAL LETTER G WITH ACUTE
                    "ɢ",  // U+0262: LATIN LETTER SMALL CAPITAL G
                    "ʛ",  // U+029B: LATIN LETTER SMALL CAPITAL G WITH HOOK
                    "Ḡ",  // U+1E20: LATIN CAPITAL LETTER G WITH MACRON
                    "Ⓖ",  // U+24BC: CIRCLED LATIN CAPITAL LETTER G
                    "Ᵹ",  // U+A77D: LATIN CAPITAL LETTER INSULAR G
                    "Ꝿ",  // U+A77E: LATIN CAPITAL LETTER TURNED INSULAR G
                    "Ｇ", // U+FF27: FULLWIDTH LATIN CAPITAL LETTER G
                ],
                "G",
            ),
            (
                &[
                    "ĝ",  // U+011D: LATIN SMALL LETTER G WITH CIRCUMFLEX
                    "ğ",  // U+011F: LATIN SMALL LETTER G WITH BREVE
                    "ġ",  // U+0121: LATIN SMALL LETTER G WITH DOT ABOVE
                    "ģ",  // U+0123: LATIN SMALL LETTER G WITH CEDILLA
                    "ǵ",  // U+01F5: LATIN SMALL LETTER G WITH ACUTE
                    "ɠ",  // U+0260: LATIN SMALL LETTER G WITH HOOK
                    "ɡ",  // U+0261: LATIN SMALL LETTER SCRIPT G
                    "ᵷ",  // U+1D77: LATIN SMALL LETTER TURNED G
                    "ᵹ",  // U+1D79: LATIN SMALL LETTER INSULAR G
                    "ᶃ",  // U+1D83: LATIN SMALL LETTER G WITH PALATAL HOOK
                    "ḡ",  // U+1E21: LATIN SMALL LETTER G WITH MACRON
                    "ⓖ",  // U+24D6: CIRCLED LATIN SMALL LETTER G
                    "ꝿ",  // U+A77F: LATIN SMALL LETTER TURNED INSULAR G
                    "ｇ", // U+FF47: FULLWIDTH LATIN SMALL LETTER G
                ],
                "g",
            ),
            (
                &[
                    "⒢", // U+24A2: PARENTHESIZED LATIN SMALL LETTER G
                ],
                "(g)",
            ),
            (
                &[
                    "Ĥ",  // U+0124: LATIN CAPITAL LETTER H WITH CIRCUMFLEX
                    "Ħ",  // U+0126: LATIN CAPITAL LETTER H WITH STROKE
                    "Ȟ",  // U+021E: LATIN CAPITAL LETTER H WITH CARON
                    "ʜ",  // U+029C: LATIN LETTER SMALL CAPITAL H
                    "Ḣ",  // U+1E22: LATIN CAPITAL LETTER H WITH DOT ABOVE
                    "Ḥ",  // U+1E24: LATIN CAPITAL LETTER H WITH DOT BELOW
                    "Ḧ",  // U+1E26: LATIN CAPITAL LETTER H WITH DIAERESIS
                    "Ḩ",  // U+1E28: LATIN CAPITAL LETTER H WITH CEDILLA
                    "Ḫ",  // U+1E2A: LATIN CAPITAL LETTER H WITH BREVE BELOW
                    "Ⓗ",  // U+24BD: CIRCLED LATIN CAPITAL LETTER H
                    "Ⱨ",  // U+2C67: LATIN CAPITAL LETTER H WITH DESCENDER
                    "Ⱶ",  // U+2C75: LATIN CAPITAL LETTER HALF H
                    "Ｈ", // U+FF28: FULLWIDTH LATIN CAPITAL LETTER H
                ],
                "H",
            ),
            (
                &[
                    "ĥ",  // U+0125: LATIN SMALL LETTER H WITH CIRCUMFLEX
                    "ħ",  // U+0127: LATIN SMALL LETTER H WITH STROKE
                    "ȟ",  // U+021F: LATIN SMALL LETTER H WITH CARON
                    "ɥ",  // U+0265: LATIN SMALL LETTER TURNED H
                    "ɦ",  // U+0266: LATIN SMALL LETTER H WITH HOOK
                    "ʮ",  // U+02AE: LATIN SMALL LETTER TURNED H WITH FISHHOOK
                    "ʯ",  // U+02AF: LATIN SMALL LETTER TURNED H WITH FISHHOOK AND TAIL
                    "ḣ",  // U+1E23: LATIN SMALL LETTER H WITH DOT ABOVE
                    "ḥ",  // U+1E25: LATIN SMALL LETTER H WITH DOT BELOW
                    "ḧ",  // U+1E27: LATIN SMALL LETTER H WITH DIAERESIS
                    "ḩ",  // U+1E29: LATIN SMALL LETTER H WITH CEDILLA
                    "ḫ",  // U+1E2B: LATIN SMALL LETTER H WITH BREVE BELOW
                    "ẖ",  // U+1E96: LATIN SMALL LETTER H WITH LINE BELOW
                    "ⓗ",  // U+24D7: CIRCLED LATIN SMALL LETTER H
                    "ⱨ",  // U+2C68: LATIN SMALL LETTER H WITH DESCENDER
                    "ⱶ",  // U+2C76: LATIN SMALL LETTER HALF H
                    "ｈ", // U+FF48: FULLWIDTH LATIN SMALL LETTER H
                ],
                "h",
            ),
            (
                &[
                    "Ƕ", // U+01F6: LATIN CAPITAL LETTER HWAIR
                ],
                "HV",
            ),
            (
                &[
                    "⒣", // U+24A3: PARENTHESIZED LATIN SMALL LETTER H
                ],
                "(h)",
            ),
            (
                &[
                    "ƕ", // U+0195: LATIN SMALL LETTER HV
                ],
                "hv",
            ),
            (
                &[
                    "Ì",  // U+00CC: LATIN CAPITAL LETTER I WITH GRAVE
                    "Í",  // U+00CD: LATIN CAPITAL LETTER I WITH ACUTE
                    "Î",  // U+00CE: LATIN CAPITAL LETTER I WITH CIRCUMFLEX
                    "Ï",  // U+00CF: LATIN CAPITAL LETTER I WITH DIAERESIS
                    "Ĩ",  // U+0128: LATIN CAPITAL LETTER I WITH TILDE
                    "Ī",  // U+012A: LATIN CAPITAL LETTER I WITH MACRON
                    "Ĭ",  // U+012C: LATIN CAPITAL LETTER I WITH BREVE
                    "Į",  // U+012E: LATIN CAPITAL LETTER I WITH OGONEK
                    "İ",  // U+0130: LATIN CAPITAL LETTER I WITH DOT ABOVE
                    "Ɩ",  // U+0196: LATIN CAPITAL LETTER IOTA
                    "Ɨ",  // U+0197: LATIN CAPITAL LETTER I WITH STROKE
                    "Ǐ",  // U+01CF: LATIN CAPITAL LETTER I WITH CARON
                    "Ȉ",  // U+0208: LATIN CAPITAL LETTER I WITH DOUBLE GRAVE
                    "Ȋ",  // U+020A: LATIN CAPITAL LETTER I WITH INVERTED BREVE
                    "ɪ",  // U+026A: LATIN LETTER SMALL CAPITAL I
                    "ᵻ",  // U+1D7B: LATIN SMALL CAPITAL LETTER I WITH STROKE
                    "Ḭ",  // U+1E2C: LATIN CAPITAL LETTER I WITH TILDE BELOW
                    "Ḯ",  // U+1E2E: LATIN CAPITAL LETTER I WITH DIAERESIS AND ACUTE
                    "Ỉ",  // U+1EC8: LATIN CAPITAL LETTER I WITH HOOK ABOVE
                    "Ị",  // U+1ECA: LATIN CAPITAL LETTER I WITH DOT BELOW
                    "Ⓘ",  // U+24BE: CIRCLED LATIN CAPITAL LETTER I
                    "ꟾ",  // U+A7FE: LATIN EPIGRAPHIC LETTER I LONGA
                    "Ｉ", // U+FF29: FULLWIDTH LATIN CAPITAL LETTER I
                ],
                "I",
            ),
            (
                &[
                    "ì",  // U+00EC: LATIN SMALL LETTER I WITH GRAVE
                    "í",  // U+00ED: LATIN SMALL LETTER I WITH ACUTE
                    "î",  // U+00EE: LATIN SMALL LETTER I WITH CIRCUMFLEX
                    "ï",  // U+00EF: LATIN SMALL LETTER I WITH DIAERESIS
                    "ĩ",  // U+0129: LATIN SMALL LETTER I WITH TILDE
                    "ī",  // U+012B: LATIN SMALL LETTER I WITH MACRON
                    "ĭ",  // U+012D: LATIN SMALL LETTER I WITH BREVE
                    "į",  // U+012F: LATIN SMALL LETTER I WITH OGONEK
                    "ı",  // U+0131: LATIN SMALL LETTER DOTLESS I
                    "ǐ",  // U+01D0: LATIN SMALL LETTER I WITH CARON
                    "ȉ",  // U+0209: LATIN SMALL LETTER I WITH DOUBLE GRAVE
                    "ȋ",  // U+020B: LATIN SMALL LETTER I WITH INVERTED BREVE
                    "ɨ",  // U+0268: LATIN SMALL LETTER I WITH STROKE
                    "ᴉ",  // U+1D09: LATIN SMALL LETTER TURNED I
                    "ᵢ",  // U+1D62: LATIN SUBSCRIPT SMALL LETTER I
                    "ᵼ",  // U+1D7C: LATIN SMALL LETTER IOTA WITH STROKE
                    "ᶖ",  // U+1D96: LATIN SMALL LETTER I WITH RETROFLEX HOOK
                    "ḭ",  // U+1E2D: LATIN SMALL LETTER I WITH TILDE BELOW
                    "ḯ",  // U+1E2F: LATIN SMALL LETTER I WITH DIAERESIS AND ACUTE
                    "ỉ",  // U+1EC9: LATIN SMALL LETTER I WITH HOOK ABOVE
                    "ị",  // U+1ECB: LATIN SMALL LETTER I WITH DOT BELOW
                    "ⁱ",  // U+2071: SUPERSCRIPT LATIN SMALL LETTER I
                    "ⓘ",  // U+24D8: CIRCLED LATIN SMALL LETTER I
                    "ｉ", // U+FF49: FULLWIDTH LATIN SMALL LETTER I
                ],
                "i",
            ),
            (
                &[
                    "Ĳ", // U+0132: LATIN CAPITAL LIGATURE IJ
                ],
                "IJ",
            ),
            (
                &[
                    "⒤", // U+24A4: PARENTHESIZED LATIN SMALL LETTER I
                ],
                "(i)",
            ),
            (
                &[
                    "ĳ", // U+0133: LATIN SMALL LIGATURE IJ
                ],
                "ij",
            ),
            (
                &[
                    "Ĵ",  // U+0134: LATIN CAPITAL LETTER J WITH CIRCUMFLEX
                    "Ɉ",  // U+0248: LATIN CAPITAL LETTER J WITH STROKE
                    "ᴊ",  // U+1D0A: LATIN LETTER SMALL CAPITAL J
                    "Ⓙ",  // U+24BF: CIRCLED LATIN CAPITAL LETTER J
                    "Ｊ", // U+FF2A: FULLWIDTH LATIN CAPITAL LETTER J
                ],
                "J",
            ),
            (
                &[
                    "ĵ",  // U+0135: LATIN SMALL LETTER J WITH CIRCUMFLEX
                    "ǰ",  // U+01F0: LATIN SMALL LETTER J WITH CARON
                    "ȷ",  // U+0237: LATIN SMALL LETTER DOTLESS J
                    "ɉ",  // U+0249: LATIN SMALL LETTER J WITH STROKE
                    "ɟ",  // U+025F: LATIN SMALL LETTER DOTLESS J WITH STROKE
                    "ʄ",  // U+0284: LATIN SMALL LETTER DOTLESS J WITH STROKE AND HOOK
                    "ʝ",  // U+029D: LATIN SMALL LETTER J WITH CROSSED-TAIL
                    "ⓙ",  // U+24D9: CIRCLED LATIN SMALL LETTER J
                    "ⱼ",  // U+2C7C: LATIN SUBSCRIPT SMALL LETTER J
                    "ｊ", // U+FF4A: FULLWIDTH LATIN SMALL LETTER J
                ],
                "j",
            ),
            (
                &[
                    "⒥", // U+24A5: PARENTHESIZED LATIN SMALL LETTER J
                ],
                "(j)",
            ),
            (
                &[
                    "Ķ",  // U+0136: LATIN CAPITAL LETTER K WITH CEDILLA
                    "Ƙ",  // U+0198: LATIN CAPITAL LETTER K WITH HOOK
                    "Ǩ",  // U+01E8: LATIN CAPITAL LETTER K WITH CARON
                    "ᴋ",  // U+1D0B: LATIN LETTER SMALL CAPITAL K
                    "Ḱ",  // U+1E30: LATIN CAPITAL LETTER K WITH ACUTE
                    "Ḳ",  // U+1E32: LATIN CAPITAL LETTER K WITH DOT BELOW
                    "Ḵ",  // U+1E34: LATIN CAPITAL LETTER K WITH LINE BELOW
                    "Ⓚ",  // U+24C0: CIRCLED LATIN CAPITAL LETTER K
                    "Ⱪ",  // U+2C69: LATIN CAPITAL LETTER K WITH DESCENDER
                    "Ꝁ",  // U+A740: LATIN CAPITAL LETTER K WITH STROKE
                    "Ꝃ",  // U+A742: LATIN CAPITAL LETTER K WITH DIAGONAL STROKE
                    "Ꝅ",  // U+A744: LATIN CAPITAL LETTER K WITH STROKE AND DIAGONAL STROKE
                    "Ｋ", // U+FF2B: FULLWIDTH LATIN CAPITAL LETTER K
                ],
                "K",
            ),
            (
                &[
                    "ķ",  // U+0137: LATIN SMALL LETTER K WITH CEDILLA
                    "ƙ",  // U+0199: LATIN SMALL LETTER K WITH HOOK
                    "ǩ",  // U+01E9: LATIN SMALL LETTER K WITH CARON
                    "ʞ",  // U+029E: LATIN SMALL LETTER TURNED K
                    "ᶄ",  // U+1D84: LATIN SMALL LETTER K WITH PALATAL HOOK
                    "ḱ",  // U+1E31: LATIN SMALL LETTER K WITH ACUTE
                    "ḳ",  // U+1E33: LATIN SMALL LETTER K WITH DOT BELOW
                    "ḵ",  // U+1E35: LATIN SMALL LETTER K WITH LINE BELOW
                    "ⓚ",  // U+24DA: CIRCLED LATIN SMALL LETTER K
                    "ⱪ",  // U+2C6A: LATIN SMALL LETTER K WITH DESCENDER
                    "ꝁ",  // U+A741: LATIN SMALL LETTER K WITH STROKE
                    "ꝃ",  // U+A743: LATIN SMALL LETTER K WITH DIAGONAL STROKE
                    "ꝅ",  // U+A745: LATIN SMALL LETTER K WITH STROKE AND DIAGONAL STROKE
                    "ｋ", // U+FF4B: FULLWIDTH LATIN SMALL LETTER K
                ],
                "k",
            ),
            (
                &[
                    "⒦", // U+24A6: PARENTHESIZED LATIN SMALL LETTER K
                ],
                "(k)",
            ),
            (
                &[
                    "Ĺ",  // U+0139: LATIN CAPITAL LETTER L WITH ACUTE
                    "Ļ",  // U+013B: LATIN CAPITAL LETTER L WITH CEDILLA
                    "Ľ",  // U+013D: LATIN CAPITAL LETTER L WITH CARON
                    "Ŀ",  // U+013F: LATIN CAPITAL LETTER L WITH MIDDLE DOT
                    "Ł",  // U+0141: LATIN CAPITAL LETTER L WITH STROKE
                    "Ƚ",  // U+023D: LATIN CAPITAL LETTER L WITH BAR
                    "ʟ",  // U+029F: LATIN LETTER SMALL CAPITAL L
                    "ᴌ",  // U+1D0C: LATIN LETTER SMALL CAPITAL L WITH STROKE
                    "Ḷ",  // U+1E36: LATIN CAPITAL LETTER L WITH DOT BELOW
                    "Ḹ",  // U+1E38: LATIN CAPITAL LETTER L WITH DOT BELOW AND MACRON
                    "Ḻ",  // U+1E3A: LATIN CAPITAL LETTER L WITH LINE BELOW
                    "Ḽ",  // U+1E3C: LATIN CAPITAL LETTER L WITH CIRCUMFLEX BELOW
                    "Ⓛ",  // U+24C1: CIRCLED LATIN CAPITAL LETTER L
                    "Ⱡ",  // U+2C60: LATIN CAPITAL LETTER L WITH DOUBLE BAR
                    "Ɫ",  // U+2C62: LATIN CAPITAL LETTER L WITH MIDDLE TILDE
                    "Ꝇ",  // U+A746: LATIN CAPITAL LETTER BROKEN L
                    "Ꝉ",  // U+A748: LATIN CAPITAL LETTER L WITH HIGH STROKE
                    "Ꞁ",  // U+A780: LATIN CAPITAL LETTER TURNED L
                    "Ｌ", // U+FF2C: FULLWIDTH LATIN CAPITAL LETTER L
                ],
                "L",
            ),
            (
                &[
                    "ĺ",  // U+013A: LATIN SMALL LETTER L WITH ACUTE
                    "ļ",  // U+013C: LATIN SMALL LETTER L WITH CEDILLA
                    "ľ",  // U+013E: LATIN SMALL LETTER L WITH CARON
                    "ŀ",  // U+0140: LATIN SMALL LETTER L WITH MIDDLE DOT
                    "ł",  // U+0142: LATIN SMALL LETTER L WITH STROKE
                    "ƚ",  // U+019A: LATIN SMALL LETTER L WITH BAR
                    "ȴ",  // U+0234: LATIN SMALL LETTER L WITH CURL
                    "ɫ",  // U+026B: LATIN SMALL LETTER L WITH MIDDLE TILDE
                    "ɬ",  // U+026C: LATIN SMALL LETTER L WITH BELT
                    "ɭ",  // U+026D: LATIN SMALL LETTER L WITH RETROFLEX HOOK
                    "ᶅ",  // U+1D85: LATIN SMALL LETTER L WITH PALATAL HOOK
                    "ḷ",  // U+1E37: LATIN SMALL LETTER L WITH DOT BELOW
                    "ḹ",  // U+1E39: LATIN SMALL LETTER L WITH DOT BELOW AND MACRON
                    "ḻ",  // U+1E3B: LATIN SMALL LETTER L WITH LINE BELOW
                    "ḽ",  // U+1E3D: LATIN SMALL LETTER L WITH CIRCUMFLEX BELOW
                    "ⓛ",  // U+24DB: CIRCLED LATIN SMALL LETTER L
                    "ⱡ",  // U+2C61: LATIN SMALL LETTER L WITH DOUBLE BAR
                    "ꝇ",  // U+A747: LATIN SMALL LETTER BROKEN L
                    "ꝉ",  // U+A749: LATIN SMALL LETTER L WITH HIGH STROKE
                    "ꞁ",  // U+A781: LATIN SMALL LETTER TURNED L
                    "ｌ", // U+FF4C: FULLWIDTH LATIN SMALL LETTER L
                ],
                "l",
            ),
            (
                &[
                    "Ǉ", // U+01C7: LATIN CAPITAL LETTER LJ
                ],
                "LJ",
            ),
            (
                &[
                    "Ỻ", // U+1EFA: LATIN CAPITAL LETTER MIDDLE-WELSH LL
                ],
                "LL",
            ),
            (
                &[
                    "ǈ", // U+01C8: LATIN CAPITAL LETTER L WITH SMALL LETTER J
                ],
                "Lj",
            ),
            (
                &[
                    "⒧", // U+24A7: PARENTHESIZED LATIN SMALL LETTER L
                ],
                "(l)",
            ),
            (
                &[
                    "ǉ", // U+01C9: LATIN SMALL LETTER LJ
                ],
                "lj",
            ),
            (
                &[
                    "ỻ", // U+1EFB: LATIN SMALL LETTER MIDDLE-WELSH LL
                ],
                "ll",
            ),
            (
                &[
                    "ʪ", // U+02AA: LATIN SMALL LETTER LS DIGRAPH
                ],
                "ls",
            ),
            (
                &[
                    "ʫ", // U+02AB: LATIN SMALL LETTER LZ DIGRAPH
                ],
                "lz",
            ),
            (
                &[
                    "Ɯ",  // U+019C: LATIN CAPITAL LETTER TURNED M
                    "ᴍ",  // U+1D0D: LATIN LETTER SMALL CAPITAL M
                    "Ḿ",  // U+1E3E: LATIN CAPITAL LETTER M WITH ACUTE
                    "Ṁ",  // U+1E40: LATIN CAPITAL LETTER M WITH DOT ABOVE
                    "Ṃ",  // U+1E42: LATIN CAPITAL LETTER M WITH DOT BELOW
                    "Ⓜ",  // U+24C2: CIRCLED LATIN CAPITAL LETTER M
                    "Ɱ",  // U+2C6E: LATIN CAPITAL LETTER M WITH HOOK
                    "ꟽ",  // U+A7FD: LATIN EPIGRAPHIC LETTER INVERTED M
                    "ꟿ",  // U+A7FF: LATIN EPIGRAPHIC LETTER ARCHAIC M
                    "Ｍ", // U+FF2D: FULLWIDTH LATIN CAPITAL LETTER M
                ],
                "M",
            ),
            (
                &[
                    "ɯ",  // U+026F: LATIN SMALL LETTER TURNED M
                    "ɰ",  // U+0270: LATIN SMALL LETTER TURNED M WITH LONG LEG
                    "ɱ",  // U+0271: LATIN SMALL LETTER M WITH HOOK
                    "ᵯ",  // U+1D6F: LATIN SMALL LETTER M WITH MIDDLE TILDE
                    "ᶆ",  // U+1D86: LATIN SMALL LETTER M WITH PALATAL HOOK
                    "ḿ",  // U+1E3F: LATIN SMALL LETTER M WITH ACUTE
                    "ṁ",  // U+1E41: LATIN SMALL LETTER M WITH DOT ABOVE
                    "ṃ",  // U+1E43: LATIN SMALL LETTER M WITH DOT BELOW
                    "ⓜ",  // U+24DC: CIRCLED LATIN SMALL LETTER M
                    "ｍ", // U+FF4D: FULLWIDTH LATIN SMALL LETTER M
                ],
                "m",
            ),
            (
                &[
                    "⒨", // U+24A8: PARENTHESIZED LATIN SMALL LETTER M
                ],
                "(m)",
            ),
            (
                &[
                    "Ñ",  // U+00D1: LATIN CAPITAL LETTER N WITH TILDE
                    "Ń",  // U+0143: LATIN CAPITAL LETTER N WITH ACUTE
                    "Ņ",  // U+0145: LATIN CAPITAL LETTER N WITH CEDILLA
                    "Ň",  // U+0147: LATIN CAPITAL LETTER N WITH CARON
                    "Ŋ",  // U+014A: LATIN CAPITAL LETTER ENG
                    "Ɲ",  // U+019D: LATIN CAPITAL LETTER N WITH LEFT HOOK
                    "Ǹ",  // U+01F8: LATIN CAPITAL LETTER N WITH GRAVE
                    "Ƞ",  // U+0220: LATIN CAPITAL LETTER N WITH LONG RIGHT LEG
                    "ɴ",  // U+0274: LATIN LETTER SMALL CAPITAL N
                    "ᴎ",  // U+1D0E: LATIN LETTER SMALL CAPITAL REVERSED N
                    "Ṅ",  // U+1E44: LATIN CAPITAL LETTER N WITH DOT ABOVE
                    "Ṇ",  // U+1E46: LATIN CAPITAL LETTER N WITH DOT BELOW
                    "Ṉ",  // U+1E48: LATIN CAPITAL LETTER N WITH LINE BELOW
                    "Ṋ",  // U+1E4A: LATIN CAPITAL LETTER N WITH CIRCUMFLEX BELOW
                    "Ⓝ",  // U+24C3: CIRCLED LATIN CAPITAL LETTER N
                    "Ｎ", // U+FF2E: FULLWIDTH LATIN CAPITAL LETTER N
                ],
                "N",
            ),
            (
                &[
                    "ñ",  // U+00F1: LATIN SMALL LETTER N WITH TILDE
                    "ń",  // U+0144: LATIN SMALL LETTER N WITH ACUTE
                    "ņ",  // U+0146: LATIN SMALL LETTER N WITH CEDILLA
                    "ň",  // U+0148: LATIN SMALL LETTER N WITH CARON
                    "ŉ",  // U+0149: LATIN SMALL LETTER N PRECEDED BY APOSTROPHE
                    "ŋ",  // U+014B: LATIN SMALL LETTER ENG
                    "ƞ",  // U+019E: LATIN SMALL LETTER N WITH LONG RIGHT LEG
                    "ǹ",  // U+01F9: LATIN SMALL LETTER N WITH GRAVE
                    "ȵ",  // U+0235: LATIN SMALL LETTER N WITH CURL
                    "ɲ",  // U+0272: LATIN SMALL LETTER N WITH LEFT HOOK
                    "ɳ",  // U+0273: LATIN SMALL LETTER N WITH RETROFLEX HOOK
                    "ᵰ",  // U+1D70: LATIN SMALL LETTER N WITH MIDDLE TILDE
                    "ᶇ",  // U+1D87: LATIN SMALL LETTER N WITH PALATAL HOOK
                    "ṅ",  // U+1E45: LATIN SMALL LETTER N WITH DOT ABOVE
                    "ṇ",  // U+1E47: LATIN SMALL LETTER N WITH DOT BELOW
                    "ṉ",  // U+1E49: LATIN SMALL LETTER N WITH LINE BELOW
                    "ṋ",  // U+1E4B: LATIN SMALL LETTER N WITH CIRCUMFLEX BELOW
                    "ⁿ",  // U+207F: SUPERSCRIPT LATIN SMALL LETTER N
                    "ⓝ",  // U+24DD: CIRCLED LATIN SMALL LETTER N
                    "ｎ", // U+FF4E: FULLWIDTH LATIN SMALL LETTER N
                ],
                "n",
            ),
            (
                &[
                    "Ǌ", // U+01CA: LATIN CAPITAL LETTER NJ
                ],
                "NJ",
            ),
            (
                &[
                    "ǋ", // U+01CB: LATIN CAPITAL LETTER N WITH SMALL LETTER J
                ],
                "Nj",
            ),
            (
                &[
                    "⒩", // U+24A9: PARENTHESIZED LATIN SMALL LETTER N
                ],
                "(n)",
            ),
            (
                &[
                    "ǌ", // U+01CC: LATIN SMALL LETTER NJ
                ],
                "nj",
            ),
            (
                &[
                    "Ò",  // U+00D2: LATIN CAPITAL LETTER O WITH GRAVE
                    "Ó",  // U+00D3: LATIN CAPITAL LETTER O WITH ACUTE
                    "Ô",  // U+00D4: LATIN CAPITAL LETTER O WITH CIRCUMFLEX
                    "Õ",  // U+00D5: LATIN CAPITAL LETTER O WITH TILDE
                    "Ö",  // U+00D6: LATIN CAPITAL LETTER O WITH DIAERESIS
                    "Ø",  // U+00D8: LATIN CAPITAL LETTER O WITH STROKE
                    "Ō",  // U+014C: LATIN CAPITAL LETTER O WITH MACRON
                    "Ŏ",  // U+014E: LATIN CAPITAL LETTER O WITH BREVE
                    "Ő",  // U+0150: LATIN CAPITAL LETTER O WITH DOUBLE ACUTE
                    "Ɔ",  // U+0186: LATIN CAPITAL LETTER OPEN O
                    "Ɵ",  // U+019F: LATIN CAPITAL LETTER O WITH MIDDLE TILDE
                    "Ơ",  // U+01A0: LATIN CAPITAL LETTER O WITH HORN
                    "Ǒ",  // U+01D1: LATIN CAPITAL LETTER O WITH CARON
                    "Ǫ",  // U+01EA: LATIN CAPITAL LETTER O WITH OGONEK
                    "Ǭ",  // U+01EC: LATIN CAPITAL LETTER O WITH OGONEK AND MACRON
                    "Ǿ",  // U+01FE: LATIN CAPITAL LETTER O WITH STROKE AND ACUTE
                    "Ȍ",  // U+020C: LATIN CAPITAL LETTER O WITH DOUBLE GRAVE
                    "Ȏ",  // U+020E: LATIN CAPITAL LETTER O WITH INVERTED BREVE
                    "Ȫ",  // U+022A: LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON
                    "Ȭ",  // U+022C: LATIN CAPITAL LETTER O WITH TILDE AND MACRON
                    "Ȯ",  // U+022E: LATIN CAPITAL LETTER O WITH DOT ABOVE
                    "Ȱ",  // U+0230: LATIN CAPITAL LETTER O WITH DOT ABOVE AND MACRON
                    "ᴏ",  // U+1D0F: LATIN LETTER SMALL CAPITAL O
                    "ᴐ",  // U+1D10: LATIN LETTER SMALL CAPITAL OPEN O
                    "Ṍ",  // U+1E4C: LATIN CAPITAL LETTER O WITH TILDE AND ACUTE
                    "Ṏ",  // U+1E4E: LATIN CAPITAL LETTER O WITH TILDE AND DIAERESIS
                    "Ṑ",  // U+1E50: LATIN CAPITAL LETTER O WITH MACRON AND GRAVE
                    "Ṓ",  // U+1E52: LATIN CAPITAL LETTER O WITH MACRON AND ACUTE
                    "Ọ",  // U+1ECC: LATIN CAPITAL LETTER O WITH DOT BELOW
                    "Ỏ",  // U+1ECE: LATIN CAPITAL LETTER O WITH HOOK ABOVE
                    "Ố",  // U+1ED0: LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND ACUTE
                    "Ồ",  // U+1ED2: LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND GRAVE
                    "Ổ",  // U+1ED4: LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND HOOK ABOVE
                    "Ỗ",  // U+1ED6: LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND TILDE
                    "Ộ",  // U+1ED8: LATIN CAPITAL LETTER O WITH CIRCUMFLEX AND DOT BELOW
                    "Ớ",  // U+1EDA: LATIN CAPITAL LETTER O WITH HORN AND ACUTE
                    "Ờ",  // U+1EDC: LATIN CAPITAL LETTER O WITH HORN AND GRAVE
                    "Ở",  // U+1EDE: LATIN CAPITAL LETTER O WITH HORN AND HOOK ABOVE
                    "Ỡ",  // U+1EE0: LATIN CAPITAL LETTER O WITH HORN AND TILDE
                    "Ợ",  // U+1EE2: LATIN CAPITAL LETTER O WITH HORN AND DOT BELOW
                    "Ⓞ",  // U+24C4: CIRCLED LATIN CAPITAL LETTER O
                    "Ꝋ",  // U+A74A: LATIN CAPITAL LETTER O WITH LONG STROKE OVERLAY
                    "Ꝍ",  // U+A74C: LATIN CAPITAL LETTER O WITH LOOP
                    "Ｏ", // U+FF2F: FULLWIDTH LATIN CAPITAL LETTER O
                ],
                "O",
            ),
            (
                &[
                    "ò",  // U+00F2: LATIN SMALL LETTER O WITH GRAVE
                    "ó",  // U+00F3: LATIN SMALL LETTER O WITH ACUTE
                    "ô",  // U+00F4: LATIN SMALL LETTER O WITH CIRCUMFLEX
                    "õ",  // U+00F5: LATIN SMALL LETTER O WITH TILDE
                    "ö",  // U+00F6: LATIN SMALL LETTER O WITH DIAERESIS
                    "ø",  // U+00F8: LATIN SMALL LETTER O WITH STROKE
                    "ō",  // U+014D: LATIN SMALL LETTER O WITH MACRON
                    "ŏ",  // U+014F: LATIN SMALL LETTER O WITH BREVE
                    "ő",  // U+0151: LATIN SMALL LETTER O WITH DOUBLE ACUTE
                    "ơ",  // U+01A1: LATIN SMALL LETTER O WITH HORN
                    "ǒ",  // U+01D2: LATIN SMALL LETTER O WITH CARON
                    "ǫ",  // U+01EB: LATIN SMALL LETTER O WITH OGONEK
                    "ǭ",  // U+01ED: LATIN SMALL LETTER O WITH OGONEK AND MACRON
                    "ǿ",  // U+01FF: LATIN SMALL LETTER O WITH STROKE AND ACUTE
                    "ȍ",  // U+020D: LATIN SMALL LETTER O WITH DOUBLE GRAVE
                    "ȏ",  // U+020F: LATIN SMALL LETTER O WITH INVERTED BREVE
                    "ȫ",  // U+022B: LATIN SMALL LETTER O WITH DIAERESIS AND MACRON
                    "ȭ",  // U+022D: LATIN SMALL LETTER O WITH TILDE AND MACRON
                    "ȯ",  // U+022F: LATIN SMALL LETTER O WITH DOT ABOVE
                    "ȱ",  // U+0231: LATIN SMALL LETTER O WITH DOT ABOVE AND MACRON
                    "ɔ",  // U+0254: LATIN SMALL LETTER OPEN O
                    "ɵ",  // U+0275: LATIN SMALL LETTER BARRED O
                    "ᴖ",  // U+1D16: LATIN SMALL LETTER TOP HALF O
                    "ᴗ",  // U+1D17: LATIN SMALL LETTER BOTTOM HALF O
                    "ᶗ",  // U+1D97: LATIN SMALL LETTER OPEN O WITH RETROFLEX HOOK
                    "ṍ",  // U+1E4D: LATIN SMALL LETTER O WITH TILDE AND ACUTE
                    "ṏ",  // U+1E4F: LATIN SMALL LETTER O WITH TILDE AND DIAERESIS
                    "ṑ",  // U+1E51: LATIN SMALL LETTER O WITH MACRON AND GRAVE
                    "ṓ",  // U+1E53: LATIN SMALL LETTER O WITH MACRON AND ACUTE
                    "ọ",  // U+1ECD: LATIN SMALL LETTER O WITH DOT BELOW
                    "ỏ",  // U+1ECF: LATIN SMALL LETTER O WITH HOOK ABOVE
                    "ố",  // U+1ED1: LATIN SMALL LETTER O WITH CIRCUMFLEX AND ACUTE
                    "ồ",  // U+1ED3: LATIN SMALL LETTER O WITH CIRCUMFLEX AND GRAVE
                    "ổ",  // U+1ED5: LATIN SMALL LETTER O WITH CIRCUMFLEX AND HOOK ABOVE
                    "ỗ",  // U+1ED7: LATIN SMALL LETTER O WITH CIRCUMFLEX AND TILDE
                    "ộ",  // U+1ED9: LATIN SMALL LETTER O WITH CIRCUMFLEX AND DOT BELOW
                    "ớ",  // U+1EDB: LATIN SMALL LETTER O WITH HORN AND ACUTE
                    "ờ",  // U+1EDD: LATIN SMALL LETTER O WITH HORN AND GRAVE
                    "ở",  // U+1EDF: LATIN SMALL LETTER O WITH HORN AND HOOK ABOVE
                    "ỡ",  // U+1EE1: LATIN SMALL LETTER O WITH HORN AND TILDE
                    "ợ",  // U+1EE3: LATIN SMALL LETTER O WITH HORN AND DOT BELOW
                    "ₒ",  // U+2092: LATIN SUBSCRIPT SMALL LETTER O
                    "ⓞ",  // U+24DE: CIRCLED LATIN SMALL LETTER O
                    "ⱺ",  // U+2C7A: LATIN SMALL LETTER O WITH LOW RING INSIDE
                    "ꝋ",  // U+A74B: LATIN SMALL LETTER O WITH LONG STROKE OVERLAY
                    "ꝍ",  // U+A74D: LATIN SMALL LETTER O WITH LOOP
                    "ｏ", // U+FF4F: FULLWIDTH LATIN SMALL LETTER O
                ],
                "o",
            ),
            (
                &[
                    "Œ", // U+0152: LATIN CAPITAL LIGATURE OE
                    "ɶ", // U+0276: LATIN LETTER SMALL CAPITAL OE
                ],
                "OE",
            ),
            (
                &[
                    "Ꝏ", // U+A74E: LATIN CAPITAL LETTER OO
                ],
                "OO",
            ),
            (
                &[
                    "Ȣ", // U+0222: LATIN CAPITAL LETTER OU
                    "ᴕ", // U+1D15: LATIN LETTER SMALL CAPITAL OU
                ],
                "OU",
            ),
            (
                &[
                    "⒪", // U+24AA: PARENTHESIZED LATIN SMALL LETTER O
                ],
                "(o)",
            ),
            (
                &[
                    "œ", // U+0153: LATIN SMALL LIGATURE OE
                    "ᴔ", // U+1D14: LATIN SMALL LETTER TURNED OE
                ],
                "oe",
            ),
            (
                &[
                    "ꝏ", // U+A74F: LATIN SMALL LETTER OO
                ],
                "oo",
            ),
            (
                &[
                    "ȣ", // U+0223: LATIN SMALL LETTER OU
                ],
                "ou",
            ),
            (
                &[
                    "Ƥ",  // U+01A4: LATIN CAPITAL LETTER P WITH HOOK
                    "ᴘ",  // U+1D18: LATIN LETTER SMALL CAPITAL P
                    "Ṕ",  // U+1E54: LATIN CAPITAL LETTER P WITH ACUTE
                    "Ṗ",  // U+1E56: LATIN CAPITAL LETTER P WITH DOT ABOVE
                    "Ⓟ",  // U+24C5: CIRCLED LATIN CAPITAL LETTER P
                    "Ᵽ",  // U+2C63: LATIN CAPITAL LETTER P WITH STROKE
                    "Ꝑ",  // U+A750: LATIN CAPITAL LETTER P WITH STROKE THROUGH DESCENDER
                    "Ꝓ",  // U+A752: LATIN CAPITAL LETTER P WITH FLOURISH
                    "Ꝕ",  // U+A754: LATIN CAPITAL LETTER P WITH SQUIRREL TAIL
                    "Ｐ", // U+FF30: FULLWIDTH LATIN CAPITAL LETTER P
                ],
                "P",
            ),
            (
                &[
                    "ƥ",  // U+01A5: LATIN SMALL LETTER P WITH HOOK
                    "ᵱ",  // U+1D71: LATIN SMALL LETTER P WITH MIDDLE TILDE
                    "ᵽ",  // U+1D7D: LATIN SMALL LETTER P WITH STROKE
                    "ᶈ",  // U+1D88: LATIN SMALL LETTER P WITH PALATAL HOOK
                    "ṕ",  // U+1E55: LATIN SMALL LETTER P WITH ACUTE
                    "ṗ",  // U+1E57: LATIN SMALL LETTER P WITH DOT ABOVE
                    "ⓟ",  // U+24DF: CIRCLED LATIN SMALL LETTER P
                    "ꝑ",  // U+A751: LATIN SMALL LETTER P WITH STROKE THROUGH DESCENDER
                    "ꝓ",  // U+A753: LATIN SMALL LETTER P WITH FLOURISH
                    "ꝕ",  // U+A755: LATIN SMALL LETTER P WITH SQUIRREL TAIL
                    "ꟼ",  // U+A7FC: LATIN EPIGRAPHIC LETTER REVERSED P
                    "ｐ", // U+FF50: FULLWIDTH LATIN SMALL LETTER P
                ],
                "p",
            ),
            (
                &[
                    "⒫", // U+24AB: PARENTHESIZED LATIN SMALL LETTER P
                ],
                "(p)",
            ),
            (
                &[
                    "Ɋ",  // U+024A: LATIN CAPITAL LETTER SMALL Q WITH HOOK TAIL
                    "Ⓠ",  // U+24C6: CIRCLED LATIN CAPITAL LETTER Q
                    "Ꝗ",  // U+A756: LATIN CAPITAL LETTER Q WITH STROKE THROUGH DESCENDER
                    "Ꝙ",  // U+A758: LATIN CAPITAL LETTER Q WITH DIAGONAL STROKE
                    "Ｑ", // U+FF31: FULLWIDTH LATIN CAPITAL LETTER Q
                ],
                "Q",
            ),
            (
                &[
                    "ĸ",  // U+0138: LATIN SMALL LETTER KRA
                    "ɋ",  // U+024B: LATIN SMALL LETTER Q WITH HOOK TAIL
                    "ʠ",  // U+02A0: LATIN SMALL LETTER Q WITH HOOK
                    "ⓠ",  // U+24E0: CIRCLED LATIN SMALL LETTER Q
                    "ꝗ",  // U+A757: LATIN SMALL LETTER Q WITH STROKE THROUGH DESCENDER
                    "ꝙ",  // U+A759: LATIN SMALL LETTER Q WITH DIAGONAL STROKE
                    "ｑ", // U+FF51: FULLWIDTH LATIN SMALL LETTER Q
                ],
                "q",
            ),
            (
                &[
                    "⒬", // U+24AC: PARENTHESIZED LATIN SMALL LETTER Q
                ],
                "(q)",
            ),
            (
                &[
                    "ȹ", // U+0239: LATIN SMALL LETTER QP DIGRAPH
                ],
                "qp",
            ),
            (
                &[
                    "Ŕ",  // U+0154: LATIN CAPITAL LETTER R WITH ACUTE
                    "Ŗ",  // U+0156: LATIN CAPITAL LETTER R WITH CEDILLA
                    "Ř",  // U+0158: LATIN CAPITAL LETTER R WITH CARON
                    "Ȑ",  // U+0210: LATIN CAPITAL LETTER R WITH DOUBLE GRAVE
                    "Ȓ",  // U+0212: LATIN CAPITAL LETTER R WITH INVERTED BREVE
                    "Ɍ",  // U+024C: LATIN CAPITAL LETTER R WITH STROKE
                    "ʀ",  // U+0280: LATIN LETTER SMALL CAPITAL R
                    "ʁ",  // U+0281: LATIN LETTER SMALL CAPITAL INVERTED R
                    "ᴙ",  // U+1D19: LATIN LETTER SMALL CAPITAL REVERSED R
                    "ᴚ",  // U+1D1A: LATIN LETTER SMALL CAPITAL TURNED R
                    "Ṙ",  // U+1E58: LATIN CAPITAL LETTER R WITH DOT ABOVE
                    "Ṛ",  // U+1E5A: LATIN CAPITAL LETTER R WITH DOT BELOW
                    "Ṝ",  // U+1E5C: LATIN CAPITAL LETTER R WITH DOT BELOW AND MACRON
                    "Ṟ",  // U+1E5E: LATIN CAPITAL LETTER R WITH LINE BELOW
                    "Ⓡ",  // U+24C7: CIRCLED LATIN CAPITAL LETTER R
                    "Ɽ",  // U+2C64: LATIN CAPITAL LETTER R WITH TAIL
                    "Ꝛ",  // U+A75A: LATIN CAPITAL LETTER R ROTUNDA
                    "Ꞃ",  // U+A782: LATIN CAPITAL LETTER INSULAR R
                    "Ｒ", // U+FF32: FULLWIDTH LATIN CAPITAL LETTER R
                ],
                "R",
            ),
            (
                &[
                    "ŕ",  // U+0155: LATIN SMALL LETTER R WITH ACUTE
                    "ŗ",  // U+0157: LATIN SMALL LETTER R WITH CEDILLA
                    "ř",  // U+0159: LATIN SMALL LETTER R WITH CARON
                    "ȑ",  // U+0211: LATIN SMALL LETTER R WITH DOUBLE GRAVE
                    "ȓ",  // U+0213: LATIN SMALL LETTER R WITH INVERTED BREVE
                    "ɍ",  // U+024D: LATIN SMALL LETTER R WITH STROKE
                    "ɼ",  // U+027C: LATIN SMALL LETTER R WITH LONG LEG
                    "ɽ",  // U+027D: LATIN SMALL LETTER R WITH TAIL
                    "ɾ",  // U+027E: LATIN SMALL LETTER R WITH FISHHOOK
                    "ɿ",  // U+027F: LATIN SMALL LETTER REVERSED R WITH FISHHOOK
                    "ᵣ",  // U+1D63: LATIN SUBSCRIPT SMALL LETTER R
                    "ᵲ",  // U+1D72: LATIN SMALL LETTER R WITH MIDDLE TILDE
                    "ᵳ",  // U+1D73: LATIN SMALL LETTER R WITH FISHHOOK AND MIDDLE TILDE
                    "ᶉ",  // U+1D89: LATIN SMALL LETTER R WITH PALATAL HOOK
                    "ṙ",  // U+1E59: LATIN SMALL LETTER R WITH DOT ABOVE
                    "ṛ",  // U+1E5B: LATIN SMALL LETTER R WITH DOT BELOW
                    "ṝ",  // U+1E5D: LATIN SMALL LETTER R WITH DOT BELOW AND MACRON
                    "ṟ",  // U+1E5F: LATIN SMALL LETTER R WITH LINE BELOW
                    "ⓡ",  // U+24E1: CIRCLED LATIN SMALL LETTER R
                    "ꝛ",  // U+A75B: LATIN SMALL LETTER R ROTUNDA
                    "ꞃ",  // U+A783: LATIN SMALL LETTER INSULAR R
                    "ｒ", // U+FF52: FULLWIDTH LATIN SMALL LETTER R
                ],
                "r",
            ),
            (
                &[
                    "⒭", // U+24AD: PARENTHESIZED LATIN SMALL LETTER R
                ],
                "(r)",
            ),
            (
                &[
                    "Ś",  // U+015A: LATIN CAPITAL LETTER S WITH ACUTE
                    "Ŝ",  // U+015C: LATIN CAPITAL LETTER S WITH CIRCUMFLEX
                    "Ş",  // U+015E: LATIN CAPITAL LETTER S WITH CEDILLA
                    "Š",  // U+0160: LATIN CAPITAL LETTER S WITH CARON
                    "Ș",  // U+0218: LATIN CAPITAL LETTER S WITH COMMA BELOW
                    "Ṡ",  // U+1E60: LATIN CAPITAL LETTER S WITH DOT ABOVE
                    "Ṣ",  // U+1E62: LATIN CAPITAL LETTER S WITH DOT BELOW
                    "Ṥ",  // U+1E64: LATIN CAPITAL LETTER S WITH ACUTE AND DOT ABOVE
                    "Ṧ",  // U+1E66: LATIN CAPITAL LETTER S WITH CARON AND DOT ABOVE
                    "Ṩ",  // U+1E68: LATIN CAPITAL LETTER S WITH DOT BELOW AND DOT ABOVE
                    "Ⓢ",  // U+24C8: CIRCLED LATIN CAPITAL LETTER S
                    "ꜱ",  // U+A731: LATIN LETTER SMALL CAPITAL S
                    "ꞅ",  // U+A785: LATIN SMALL LETTER INSULAR S
                    "Ｓ", // U+FF33: FULLWIDTH LATIN CAPITAL LETTER S
                ],
                "S",
            ),
            (
                &[
                    "ś",  // U+015B: LATIN SMALL LETTER S WITH ACUTE
                    "ŝ",  // U+015D: LATIN SMALL LETTER S WITH CIRCUMFLEX
                    "ş",  // U+015F: LATIN SMALL LETTER S WITH CEDILLA
                    "š",  // U+0161: LATIN SMALL LETTER S WITH CARON
                    "ſ",  // U+017F: LATIN SMALL LETTER LONG S
                    "ș",  // U+0219: LATIN SMALL LETTER S WITH COMMA BELOW
                    "ȿ",  // U+023F: LATIN SMALL LETTER S WITH SWASH TAIL
                    "ʂ",  // U+0282: LATIN SMALL LETTER S WITH HOOK
                    "ᵴ",  // U+1D74: LATIN SMALL LETTER S WITH MIDDLE TILDE
                    "ᶊ",  // U+1D8A: LATIN SMALL LETTER S WITH PALATAL HOOK
                    "ṡ",  // U+1E61: LATIN SMALL LETTER S WITH DOT ABOVE
                    "ṣ",  // U+1E63: LATIN SMALL LETTER S WITH DOT BELOW
                    "ṥ",  // U+1E65: LATIN SMALL LETTER S WITH ACUTE AND DOT ABOVE
                    "ṧ",  // U+1E67: LATIN SMALL LETTER S WITH CARON AND DOT ABOVE
                    "ṩ",  // U+1E69: LATIN SMALL LETTER S WITH DOT BELOW AND DOT ABOVE
                    "ẜ",  // U+1E9C: LATIN SMALL LETTER LONG S WITH DIAGONAL STROKE
                    "ẝ",  // U+1E9D: LATIN SMALL LETTER LONG S WITH HIGH STROKE
                    "ⓢ",  // U+24E2: CIRCLED LATIN SMALL LETTER S
                    "Ꞅ",  // U+A784: LATIN CAPITAL LETTER INSULAR S
                    "ｓ", // U+FF53: FULLWIDTH LATIN SMALL LETTER S
                ],
                "s",
            ),
            (
                &[
                    "ẞ", // U+1E9E: LATIN CAPITAL LETTER SHARP S
                ],
                "SS",
            ),
            (
                &[
                    "⒮", // U+24AE: PARENTHESIZED LATIN SMALL LETTER S
                ],
                "(s)",
            ),
            (
                &[
                    "ß", // U+00DF: LATIN SMALL LETTER SHARP S
                ],
                "ss",
            ),
            (
                &[
                    "ﬆ", // U+FB06: LATIN SMALL LIGATURE ST
                ],
                "st",
            ),
            (
                &[
                    "Ţ",  // U+0162: LATIN CAPITAL LETTER T WITH CEDILLA
                    "Ť",  // U+0164: LATIN CAPITAL LETTER T WITH CARON
                    "Ŧ",  // U+0166: LATIN CAPITAL LETTER T WITH STROKE
                    "Ƭ",  // U+01AC: LATIN CAPITAL LETTER T WITH HOOK
                    "Ʈ",  // U+01AE: LATIN CAPITAL LETTER T WITH RETROFLEX HOOK
                    "Ț",  // U+021A: LATIN CAPITAL LETTER T WITH COMMA BELOW
                    "Ⱦ",  // U+023E: LATIN CAPITAL LETTER T WITH DIAGONAL STROKE
                    "ᴛ",  // U+1D1B: LATIN LETTER SMALL CAPITAL T
                    "Ṫ",  // U+1E6A: LATIN CAPITAL LETTER T WITH DOT ABOVE
                    "Ṭ",  // U+1E6C: LATIN CAPITAL LETTER T WITH DOT BELOW
                    "Ṯ",  // U+1E6E: LATIN CAPITAL LETTER T WITH LINE BELOW
                    "Ṱ",  // U+1E70: LATIN CAPITAL LETTER T WITH CIRCUMFLEX BELOW
                    "Ⓣ",  // U+24C9: CIRCLED LATIN CAPITAL LETTER T
                    "Ꞇ",  // U+A786: LATIN CAPITAL LETTER INSULAR T
                    "Ｔ", // U+FF34: FULLWIDTH LATIN CAPITAL LETTER T
                ],
                "T",
            ),
            (
                &[
                    "ţ",  // U+0163: LATIN SMALL LETTER T WITH CEDILLA
                    "ť",  // U+0165: LATIN SMALL LETTER T WITH CARON
                    "ŧ",  // U+0167: LATIN SMALL LETTER T WITH STROKE
                    "ƫ",  // U+01AB: LATIN SMALL LETTER T WITH PALATAL HOOK
                    "ƭ",  // U+01AD: LATIN SMALL LETTER T WITH HOOK
                    "ț",  // U+021B: LATIN SMALL LETTER T WITH COMMA BELOW
                    "ȶ",  // U+0236: LATIN SMALL LETTER T WITH CURL
                    "ʇ",  // U+0287: LATIN SMALL LETTER TURNED T
                    "ʈ",  // U+0288: LATIN SMALL LETTER T WITH RETROFLEX HOOK
                    "ᵵ",  // U+1D75: LATIN SMALL LETTER T WITH MIDDLE TILDE
                    "ṫ",  // U+1E6B: LATIN SMALL LETTER T WITH DOT ABOVE
                    "ṭ",  // U+1E6D: LATIN SMALL LETTER T WITH DOT BELOW
                    "ṯ",  // U+1E6F: LATIN SMALL LETTER T WITH LINE BELOW
                    "ṱ",  // U+1E71: LATIN SMALL LETTER T WITH CIRCUMFLEX BELOW
                    "ẗ",  // U+1E97: LATIN SMALL LETTER T WITH DIAERESIS
                    "ⓣ",  // U+24E3: CIRCLED LATIN SMALL LETTER T
                    "ⱦ",  // U+2C66: LATIN SMALL LETTER T WITH DIAGONAL STROKE
                    "ｔ", // U+FF54: FULLWIDTH LATIN SMALL LETTER T
                ],
                "t",
            ),
            (
                &[
                    "Þ", // U+00DE: LATIN CAPITAL LETTER THORN
                    "Ꝧ", // U+A766: LATIN CAPITAL LETTER THORN WITH STROKE THROUGH DESCENDER
                ],
                "TH",
            ),
            (
                &[
                    "Ꜩ", // U+A728: LATIN CAPITAL LETTER TZ
                ],
                "TZ",
            ),
            (
                &[
                    "⒯", // U+24AF: PARENTHESIZED LATIN SMALL LETTER T
                ],
                "(t)",
            ),
            (
                &[
                    "ʨ", // U+02A8: LATIN SMALL LETTER TC DIGRAPH WITH CURL
                ],
                "tc",
            ),
            (
                &[
                    "þ", // U+00FE: LATIN SMALL LETTER THORN
                    "ᵺ", // U+1D7A: LATIN SMALL LETTER TH WITH STRIKETHROUGH
                    "ꝧ", // U+A767: LATIN SMALL LETTER THORN WITH STROKE THROUGH DESCENDER
                ],
                "th",
            ),
            (
                &[
                    "ʦ", // U+02A6: LATIN SMALL LETTER TS DIGRAPH
                ],
                "ts",
            ),
            (
                &[
                    "ꜩ", // U+A729: LATIN SMALL LETTER TZ
                ],
                "tz",
            ),
            (
                &[
                    "Ù",  // U+00D9: LATIN CAPITAL LETTER U WITH GRAVE
                    "Ú",  // U+00DA: LATIN CAPITAL LETTER U WITH ACUTE
                    "Û",  // U+00DB: LATIN CAPITAL LETTER U WITH CIRCUMFLEX
                    "Ü",  // U+00DC: LATIN CAPITAL LETTER U WITH DIAERESIS
                    "Ũ",  // U+0168: LATIN CAPITAL LETTER U WITH TILDE
                    "Ū",  // U+016A: LATIN CAPITAL LETTER U WITH MACRON
                    "Ŭ",  // U+016C: LATIN CAPITAL LETTER U WITH BREVE
                    "Ů",  // U+016E: LATIN CAPITAL LETTER U WITH RING ABOVE
                    "Ű",  // U+0170: LATIN CAPITAL LETTER U WITH DOUBLE ACUTE
                    "Ų",  // U+0172: LATIN CAPITAL LETTER U WITH OGONEK
                    "Ư",  // U+01AF: LATIN CAPITAL LETTER U WITH HORN
                    "Ǔ",  // U+01D3: LATIN CAPITAL LETTER U WITH CARON
                    "Ǖ",  // U+01D5: LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON
                    "Ǘ",  // U+01D7: LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE
                    "Ǚ",  // U+01D9: LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON
                    "Ǜ",  // U+01DB: LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE
                    "Ȕ",  // U+0214: LATIN CAPITAL LETTER U WITH DOUBLE GRAVE
                    "Ȗ",  // U+0216: LATIN CAPITAL LETTER U WITH INVERTED BREVE
                    "Ʉ",  // U+0244: LATIN CAPITAL LETTER U BAR
                    "ᴜ",  // U+1D1C: LATIN LETTER SMALL CAPITAL U
                    "ᵾ",  // U+1D7E: LATIN SMALL CAPITAL LETTER U WITH STROKE
                    "Ṳ",  // U+1E72: LATIN CAPITAL LETTER U WITH DIAERESIS BELOW
                    "Ṵ",  // U+1E74: LATIN CAPITAL LETTER U WITH TILDE BELOW
                    "Ṷ",  // U+1E76: LATIN CAPITAL LETTER U WITH CIRCUMFLEX BELOW
                    "Ṹ",  // U+1E78: LATIN CAPITAL LETTER U WITH TILDE AND ACUTE
                    "Ṻ",  // U+1E7A: LATIN CAPITAL LETTER U WITH MACRON AND DIAERESIS
                    "Ụ",  // U+1EE4: LATIN CAPITAL LETTER U WITH DOT BELOW
                    "Ủ",  // U+1EE6: LATIN CAPITAL LETTER U WITH HOOK ABOVE
                    "Ứ",  // U+1EE8: LATIN CAPITAL LETTER U WITH HORN AND ACUTE
                    "Ừ",  // U+1EEA: LATIN CAPITAL LETTER U WITH HORN AND GRAVE
                    "Ử",  // U+1EEC: LATIN CAPITAL LETTER U WITH HORN AND HOOK ABOVE
                    "Ữ",  // U+1EEE: LATIN CAPITAL LETTER U WITH HORN AND TILDE
                    "Ự",  // U+1EF0: LATIN CAPITAL LETTER U WITH HORN AND DOT BELOW
                    "Ⓤ",  // U+24CA: CIRCLED LATIN CAPITAL LETTER U
                    "Ｕ", // U+FF35: FULLWIDTH LATIN CAPITAL LETTER U
                ],
                "U",
            ),
            (
                &[
                    "ù",  // U+00F9: LATIN SMALL LETTER U WITH GRAVE
                    "ú",  // U+00FA: LATIN SMALL LETTER U WITH ACUTE
                    "û",  // U+00FB: LATIN SMALL LETTER U WITH CIRCUMFLEX
                    "ü",  // U+00FC: LATIN SMALL LETTER U WITH DIAERESIS
                    "ũ",  // U+0169: LATIN SMALL LETTER U WITH TILDE
                    "ū",  // U+016B: LATIN SMALL LETTER U WITH MACRON
                    "ŭ",  // U+016D: LATIN SMALL LETTER U WITH BREVE
                    "ů",  // U+016F: LATIN SMALL LETTER U WITH RING ABOVE
                    "ű",  // U+0171: LATIN SMALL LETTER U WITH DOUBLE ACUTE
                    "ų",  // U+0173: LATIN SMALL LETTER U WITH OGONEK
                    "ư",  // U+01B0: LATIN SMALL LETTER U WITH HORN
                    "ǔ",  // U+01D4: LATIN SMALL LETTER U WITH CARON
                    "ǖ",  // U+01D6: LATIN SMALL LETTER U WITH DIAERESIS AND MACRON
                    "ǘ",  // U+01D8: LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE
                    "ǚ",  // U+01DA: LATIN SMALL LETTER U WITH DIAERESIS AND CARON
                    "ǜ",  // U+01DC: LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE
                    "ȕ",  // U+0215: LATIN SMALL LETTER U WITH DOUBLE GRAVE
                    "ȗ",  // U+0217: LATIN SMALL LETTER U WITH INVERTED BREVE
                    "ʉ",  // U+0289: LATIN SMALL LETTER U BAR
                    "ᵤ",  // U+1D64: LATIN SUBSCRIPT SMALL LETTER U
                    "ᶙ",  // U+1D99: LATIN SMALL LETTER U WITH RETROFLEX HOOK
                    "ṳ",  // U+1E73: LATIN SMALL LETTER U WITH DIAERESIS BELOW
                    "ṵ",  // U+1E75: LATIN SMALL LETTER U WITH TILDE BELOW
                    "ṷ",  // U+1E77: LATIN SMALL LETTER U WITH CIRCUMFLEX BELOW
                    "ṹ",  // U+1E79: LATIN SMALL LETTER U WITH TILDE AND ACUTE
                    "ṻ",  // U+1E7B: LATIN SMALL LETTER U WITH MACRON AND DIAERESIS
                    "ụ",  // U+1EE5: LATIN SMALL LETTER U WITH DOT BELOW
                    "ủ",  // U+1EE7: LATIN SMALL LETTER U WITH HOOK ABOVE
                    "ứ",  // U+1EE9: LATIN SMALL LETTER U WITH HORN AND ACUTE
                    "ừ",  // U+1EEB: LATIN SMALL LETTER U WITH HORN AND GRAVE
                    "ử",  // U+1EED: LATIN SMALL LETTER U WITH HORN AND HOOK ABOVE
                    "ữ",  // U+1EEF: LATIN SMALL LETTER U WITH HORN AND TILDE
                    "ự",  // U+1EF1: LATIN SMALL LETTER U WITH HORN AND DOT BELOW
                    "ⓤ",  // U+24E4: CIRCLED LATIN SMALL LETTER U
                    "ｕ", // U+FF55: FULLWIDTH LATIN SMALL LETTER U
                ],
                "u",
            ),
            (
                &[
                    "⒰", // U+24B0: PARENTHESIZED LATIN SMALL LETTER U
                ],
                "(u)",
            ),
            (
                &[
                    "ᵫ", // U+1D6B: LATIN SMALL LETTER UE
                ],
                "ue",
            ),
            (
                &[
                    "Ʋ",  // U+01B2: LATIN CAPITAL LETTER V WITH HOOK
                    "Ʌ",  // U+0245: LATIN CAPITAL LETTER TURNED V
                    "ᴠ",  // U+1D20: LATIN LETTER SMALL CAPITAL V
                    "Ṽ",  // U+1E7C: LATIN CAPITAL LETTER V WITH TILDE
                    "Ṿ",  // U+1E7E: LATIN CAPITAL LETTER V WITH DOT BELOW
                    "Ỽ",  // U+1EFC: LATIN CAPITAL LETTER MIDDLE-WELSH V
                    "Ⓥ",  // U+24CB: CIRCLED LATIN CAPITAL LETTER V
                    "Ꝟ",  // U+A75E: LATIN CAPITAL LETTER V WITH DIAGONAL STROKE
                    "Ꝩ",  // U+A768: LATIN CAPITAL LETTER VEND
                    "Ｖ", // U+FF36: FULLWIDTH LATIN CAPITAL LETTER V
                ],
                "V",
            ),
            (
                &[
                    "ʋ",  // U+028B: LATIN SMALL LETTER V WITH HOOK
                    "ʌ",  // U+028C: LATIN SMALL LETTER TURNED V
                    "ᵥ",  // U+1D65: LATIN SUBSCRIPT SMALL LETTER V
                    "ᶌ",  // U+1D8C: LATIN SMALL LETTER V WITH PALATAL HOOK
                    "ṽ",  // U+1E7D: LATIN SMALL LETTER V WITH TILDE
                    "ṿ",  // U+1E7F: LATIN SMALL LETTER V WITH DOT BELOW
                    "ⓥ",  // U+24E5: CIRCLED LATIN SMALL LETTER V
                    "ⱱ",  // U+2C71: LATIN SMALL LETTER V WITH RIGHT HOOK
                    "ⱴ",  // U+2C74: LATIN SMALL LETTER V WITH CURL
                    "ꝟ",  // U+A75F: LATIN SMALL LETTER V WITH DIAGONAL STROKE
                    "ｖ", // U+FF56: FULLWIDTH LATIN SMALL LETTER V
                ],
                "v",
            ),
            (
                &[
                    "Ꝡ", // U+A760: LATIN CAPITAL LETTER VY
                ],
                "VY",
            ),
            (
                &[
                    "⒱", // U+24B1: PARENTHESIZED LATIN SMALL LETTER V
                ],
                "(v)",
            ),
            (
                &[
                    "ꝡ", // U+A761: LATIN SMALL LETTER VY
                ],
                "vy",
            ),
            (
                &[
                    "Ŵ",  // U+0174: LATIN CAPITAL LETTER W WITH CIRCUMFLEX
                    "Ƿ",  // U+01F7: LATIN CAPITAL LETTER WYNN
                    "ᴡ",  // U+1D21: LATIN LETTER SMALL CAPITAL W
                    "Ẁ",  // U+1E80: LATIN CAPITAL LETTER W WITH GRAVE
                    "Ẃ",  // U+1E82: LATIN CAPITAL LETTER W WITH ACUTE
                    "Ẅ",  // U+1E84: LATIN CAPITAL LETTER W WITH DIAERESIS
                    "Ẇ",  // U+1E86: LATIN CAPITAL LETTER W WITH DOT ABOVE
                    "Ẉ",  // U+1E88: LATIN CAPITAL LETTER W WITH DOT BELOW
                    "Ⓦ",  // U+24CC: CIRCLED LATIN CAPITAL LETTER W
                    "Ⱳ",  // U+2C72: LATIN CAPITAL LETTER W WITH HOOK
                    "Ｗ", // U+FF37: FULLWIDTH LATIN CAPITAL LETTER W
                ],
                "W",
            ),
            (
                &[
                    "ŵ",  // U+0175: LATIN SMALL LETTER W WITH CIRCUMFLEX
                    "ƿ",  // U+01BF: LATIN LETTER WYNN
                    "ʍ",  // U+028D: LATIN SMALL LETTER TURNED W
                    "ẁ",  // U+1E81: LATIN SMALL LETTER W WITH GRAVE
                    "ẃ",  // U+1E83: LATIN SMALL LETTER W WITH ACUTE
                    "ẅ",  // U+1E85: LATIN SMALL LETTER W WITH DIAERESIS
                    "ẇ",  // U+1E87: LATIN SMALL LETTER W WITH DOT ABOVE
                    "ẉ",  // U+1E89: LATIN SMALL LETTER W WITH DOT BELOW
                    "ẘ",  // U+1E98: LATIN SMALL LETTER W WITH RING ABOVE
                    "ⓦ",  // U+24E6: CIRCLED LATIN SMALL LETTER W
                    "ⱳ",  // U+2C73: LATIN SMALL LETTER W WITH HOOK
                    "ｗ", // U+FF57: FULLWIDTH LATIN SMALL LETTER W
                ],
                "w",
            ),
            (
                &[
                    "⒲", // U+24B2: PARENTHESIZED LATIN SMALL LETTER W
                ],
                "(w)",
            ),
            (
                &[
                    "Ẋ",  // U+1E8A: LATIN CAPITAL LETTER X WITH DOT ABOVE
                    "Ẍ",  // U+1E8C: LATIN CAPITAL LETTER X WITH DIAERESIS
                    "Ⓧ",  // U+24CD: CIRCLED LATIN CAPITAL LETTER X
                    "Ｘ", // U+FF38: FULLWIDTH LATIN CAPITAL LETTER X
                ],
                "X",
            ),
            (
                &[
                    "ᶍ",  // U+1D8D: LATIN SMALL LETTER X WITH PALATAL HOOK
                    "ẋ",  // U+1E8B: LATIN SMALL LETTER X WITH DOT ABOVE
                    "ẍ",  // U+1E8D: LATIN SMALL LETTER X WITH DIAERESIS
                    "ₓ",  // U+2093: LATIN SUBSCRIPT SMALL LETTER X
                    "ⓧ",  // U+24E7: CIRCLED LATIN SMALL LETTER X
                    "ｘ", // U+FF58: FULLWIDTH LATIN SMALL LETTER X
                ],
                "x",
            ),
            (
                &[
                    "⒳", // U+24B3: PARENTHESIZED LATIN SMALL LETTER X
                ],
                "(x)",
            ),
            (
                &[
                    "Ý",  // U+00DD: LATIN CAPITAL LETTER Y WITH ACUTE
                    "Ŷ",  // U+0176: LATIN CAPITAL LETTER Y WITH CIRCUMFLEX
                    "Ÿ",  // U+0178: LATIN CAPITAL LETTER Y WITH DIAERESIS
                    "Ƴ",  // U+01B3: LATIN CAPITAL LETTER Y WITH HOOK
                    "Ȳ",  // U+0232: LATIN CAPITAL LETTER Y WITH MACRON
                    "Ɏ",  // U+024E: LATIN CAPITAL LETTER Y WITH STROKE
                    "ʏ",  // U+028F: LATIN LETTER SMALL CAPITAL Y
                    "Ẏ",  // U+1E8E: LATIN CAPITAL LETTER Y WITH DOT ABOVE
                    "Ỳ",  // U+1EF2: LATIN CAPITAL LETTER Y WITH GRAVE
                    "Ỵ",  // U+1EF4: LATIN CAPITAL LETTER Y WITH DOT BELOW
                    "Ỷ",  // U+1EF6: LATIN CAPITAL LETTER Y WITH HOOK ABOVE
                    "Ỹ",  // U+1EF8: LATIN CAPITAL LETTER Y WITH TILDE
                    "Ỿ",  // U+1EFE: LATIN CAPITAL LETTER Y WITH LOOP
                    "Ⓨ",  // U+24CE: CIRCLED LATIN CAPITAL LETTER Y
                    "Ｙ", // U+FF39: FULLWIDTH LATIN CAPITAL LETTER Y
                ],
                "Y",
            ),
            (
                &[
                    "ý",  // U+00FD: LATIN SMALL LETTER Y WITH ACUTE
                    "ÿ",  // U+00FF: LATIN SMALL LETTER Y WITH DIAERESIS
                    "ŷ",  // U+0177: LATIN SMALL LETTER Y WITH CIRCUMFLEX
                    "ƴ",  // U+01B4: LATIN SMALL LETTER Y WITH HOOK
                    "ȳ",  // U+0233: LATIN SMALL LETTER Y WITH MACRON
                    "ɏ",  // U+024F: LATIN SMALL LETTER Y WITH STROKE
                    "ʎ",  // U+028E: LATIN SMALL LETTER TURNED Y
                    "ẏ",  // U+1E8F: LATIN SMALL LETTER Y WITH DOT ABOVE
                    "ẙ",  // U+1E99: LATIN SMALL LETTER Y WITH RING ABOVE
                    "ỳ",  // U+1EF3: LATIN SMALL LETTER Y WITH GRAVE
                    "ỵ",  // U+1EF5: LATIN SMALL LETTER Y WITH DOT BELOW
                    "ỷ",  // U+1EF7: LATIN SMALL LETTER Y WITH HOOK ABOVE
                    "ỹ",  // U+1EF9: LATIN SMALL LETTER Y WITH TILDE
                    "ỿ",  // U+1EFF: LATIN SMALL LETTER Y WITH LOOP
                    "ⓨ",  // U+24E8: CIRCLED LATIN SMALL LETTER Y
                    "ｙ", // U+FF59: FULLWIDTH LATIN SMALL LETTER Y
                ],
                "y",
            ),
            (
                &[
                    "⒴", // U+24B4: PARENTHESIZED LATIN SMALL LETTER Y
                ],
                "(y)",
            ),
            (
                &[
                    "Ź",  // U+0179: LATIN CAPITAL LETTER Z WITH ACUTE
                    "Ż",  // U+017B: LATIN CAPITAL LETTER Z WITH DOT ABOVE
                    "Ž",  // U+017D: LATIN CAPITAL LETTER Z WITH CARON
                    "Ƶ",  // U+01B5: LATIN CAPITAL LETTER Z WITH STROKE
                    "Ȝ",  // U+021C: LATIN CAPITAL LETTER YOGH
                    "Ȥ",  // U+0224: LATIN CAPITAL LETTER Z WITH HOOK
                    "ᴢ",  // U+1D22: LATIN LETTER SMALL CAPITAL Z
                    "Ẑ",  // U+1E90: LATIN CAPITAL LETTER Z WITH CIRCUMFLEX
                    "Ẓ",  // U+1E92: LATIN CAPITAL LETTER Z WITH DOT BELOW
                    "Ẕ",  // U+1E94: LATIN CAPITAL LETTER Z WITH LINE BELOW
                    "Ⓩ",  // U+24CF: CIRCLED LATIN CAPITAL LETTER Z
                    "Ⱬ",  // U+2C6B: LATIN CAPITAL LETTER Z WITH DESCENDER
                    "Ꝣ",  // U+A762: LATIN CAPITAL LETTER VISIGOTHIC Z
                    "Ｚ", // U+FF3A: FULLWIDTH LATIN CAPITAL LETTER Z
                ],
                "Z",
            ),
            (
                &[
                    "ź",  // U+017A: LATIN SMALL LETTER Z WITH ACUTE
                    "ż",  // U+017C: LATIN SMALL LETTER Z WITH DOT ABOVE
                    "ž",  // U+017E: LATIN SMALL LETTER Z WITH CARON
                    "ƶ",  // U+01B6: LATIN SMALL LETTER Z WITH STROKE
                    "ȝ",  // U+021D: LATIN SMALL LETTER YOGH
                    "ȥ",  // U+0225: LATIN SMALL LETTER Z WITH HOOK
                    "ɀ",  // U+0240: LATIN SMALL LETTER Z WITH SWASH TAIL
                    "ʐ",  // U+0290: LATIN SMALL LETTER Z WITH RETROFLEX HOOK
                    "ʑ",  // U+0291: LATIN SMALL LETTER Z WITH CURL
                    "ᵶ",  // U+1D76: LATIN SMALL LETTER Z WITH MIDDLE TILDE
                    "ᶎ",  // U+1D8E: LATIN SMALL LETTER Z WITH PALATAL HOOK
                    "ẑ",  // U+1E91: LATIN SMALL LETTER Z WITH CIRCUMFLEX
                    "ẓ",  // U+1E93: LATIN SMALL LETTER Z WITH DOT BELOW
                    "ẕ",  // U+1E95: LATIN SMALL LETTER Z WITH LINE BELOW
                    "ⓩ",  // U+24E9: CIRCLED LATIN SMALL LETTER Z
                    "ⱬ",  // U+2C6C: LATIN SMALL LETTER Z WITH DESCENDER
                    "ꝣ",  // U+A763: LATIN SMALL LETTER VISIGOTHIC Z
                    "ｚ", // U+FF5A: FULLWIDTH LATIN SMALL LETTER Z
                ],
                "z",
            ),
            (
                &[
                    "⒵", // U+24B5: PARENTHESIZED LATIN SMALL LETTER Z
                ],
                "(z)",
            ),
            (
                &[
                    "⁰",  // U+2070: SUPERSCRIPT ZERO
                    "₀",  // U+2080: SUBSCRIPT ZERO
                    "⓪",  // U+24EA: CIRCLED DIGIT ZERO
                    "⓿",  // U+24FF: NEGATIVE CIRCLED DIGIT ZERO
                    "０", // U+FF10: FULLWIDTH DIGIT ZERO
                ],
                "0",
            ),
            (
                &[
                    "¹",  // U+00B9: SUPERSCRIPT ONE
                    "₁",  // U+2081: SUBSCRIPT ONE
                    "①",  // U+2460: CIRCLED DIGIT ONE
                    "⓵",  // U+24F5: DOUBLE CIRCLED DIGIT ONE
                    "❶",  // U+2776: DINGBAT NEGATIVE CIRCLED DIGIT ONE
                    "➀",  // U+2780: DINGBAT CIRCLED SANS-SERIF DIGIT ONE
                    "➊",  // U+278A: DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT ONE
                    "１", // U+FF11: FULLWIDTH DIGIT ONE
                ],
                "1",
            ),
            (
                &[
                    "⒈", // U+2488: DIGIT ONE FULL STOP
                ],
                "1.",
            ),
            (
                &[
                    "⑴", // U+2474: PARENTHESIZED DIGIT ONE
                ],
                "(1)",
            ),
            (
                &[
                    "²",  // U+00B2: SUPERSCRIPT TWO
                    "₂",  // U+2082: SUBSCRIPT TWO
                    "②",  // U+2461: CIRCLED DIGIT TWO
                    "⓶",  // U+24F6: DOUBLE CIRCLED DIGIT TWO
                    "❷",  // U+2777: DINGBAT NEGATIVE CIRCLED DIGIT TWO
                    "➁",  // U+2781: DINGBAT CIRCLED SANS-SERIF DIGIT TWO
                    "➋",  // U+278B: DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT TWO
                    "２", // U+FF12: FULLWIDTH DIGIT TWO
                ],
                "2",
            ),
            (
                &[
                    "⒉", // U+2489: DIGIT TWO FULL STOP
                ],
                "2.",
            ),
            (
                &[
                    "⑵", // U+2475: PARENTHESIZED DIGIT TWO
                ],
                "(2)",
            ),
            (
                &[
                    "³",  // U+00B3: SUPERSCRIPT THREE
                    "₃",  // U+2083: SUBSCRIPT THREE
                    "③",  // U+2462: CIRCLED DIGIT THREE
                    "⓷",  // U+24F7: DOUBLE CIRCLED DIGIT THREE
                    "❸",  // U+2778: DINGBAT NEGATIVE CIRCLED DIGIT THREE
                    "➂",  // U+2782: DINGBAT CIRCLED SANS-SERIF DIGIT THREE
                    "➌",  // U+278C: DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT THREE
                    "３", // U+FF13: FULLWIDTH DIGIT THREE
                ],
                "3",
            ),
            (
                &[
                    "⒊", // U+248A: DIGIT THREE FULL STOP
                ],
                "3.",
            ),
            (
                &[
                    "⑶", // U+2476: PARENTHESIZED DIGIT THREE
                ],
                "(3)",
            ),
            (
                &[
                    "⁴",  // U+2074: SUPERSCRIPT FOUR
                    "₄",  // U+2084: SUBSCRIPT FOUR
                    "④",  // U+2463: CIRCLED DIGIT FOUR
                    "⓸",  // U+24F8: DOUBLE CIRCLED DIGIT FOUR
                    "❹",  // U+2779: DINGBAT NEGATIVE CIRCLED DIGIT FOUR
                    "➃",  // U+2783: DINGBAT CIRCLED SANS-SERIF DIGIT FOUR
                    "➍",  // U+278D: DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT FOUR
                    "４", // U+FF14: FULLWIDTH DIGIT FOUR
                ],
                "4",
            ),
            (
                &[
                    "⒋", // U+248B: DIGIT FOUR FULL STOP
                ],
                "4.",
            ),
            (
                &[
                    "⑷", // U+2477: PARENTHESIZED DIGIT FOUR
                ],
                "(4)",
            ),
            (
                &[
                    "⁵",  // U+2075: SUPERSCRIPT FIVE
                    "₅",  // U+2085: SUBSCRIPT FIVE
                    "⑤",  // U+2464: CIRCLED DIGIT FIVE
                    "⓹",  // U+24F9: DOUBLE CIRCLED DIGIT FIVE
                    "❺",  // U+277A: DINGBAT NEGATIVE CIRCLED DIGIT FIVE
                    "➄",  // U+2784: DINGBAT CIRCLED SANS-SERIF DIGIT FIVE
                    "➎",  // U+278E: DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT FIVE
                    "５", // U+FF15: FULLWIDTH DIGIT FIVE
                ],
                "5",
            ),
            (
                &[
                    "⒌", // U+248C: DIGIT FIVE FULL STOP
                ],
                "5.",
            ),
            (
                &[
                    "⑸", // U+2478: PARENTHESIZED DIGIT FIVE
                ],
                "(5)",
            ),
            (
                &[
                    "⁶",  // U+2076: SUPERSCRIPT SIX
                    "₆",  // U+2086: SUBSCRIPT SIX
                    "⑥",  // U+2465: CIRCLED DIGIT SIX
                    "⓺",  // U+24FA: DOUBLE CIRCLED DIGIT SIX
                    "❻",  // U+277B: DINGBAT NEGATIVE CIRCLED DIGIT SIX
                    "➅",  // U+2785: DINGBAT CIRCLED SANS-SERIF DIGIT SIX
                    "➏",  // U+278F: DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT SIX
                    "６", // U+FF16: FULLWIDTH DIGIT SIX
                ],
                "6",
            ),
            (
                &[
                    "⒍", // U+248D: DIGIT SIX FULL STOP
                ],
                "6.",
            ),
            (
                &[
                    "⑹", // U+2479: PARENTHESIZED DIGIT SIX
                ],
                "(6)",
            ),
            (
                &[
                    "⁷",  // U+2077: SUPERSCRIPT SEVEN
                    "₇",  // U+2087: SUBSCRIPT SEVEN
                    "⑦",  // U+2466: CIRCLED DIGIT SEVEN
                    "⓻",  // U+24FB: DOUBLE CIRCLED DIGIT SEVEN
                    "❼",  // U+277C: DINGBAT NEGATIVE CIRCLED DIGIT SEVEN
                    "➆",  // U+2786: DINGBAT CIRCLED SANS-SERIF DIGIT SEVEN
                    "➐",  // U+2790: DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT SEVEN
                    "７", // U+FF17: FULLWIDTH DIGIT SEVEN
                ],
                "7",
            ),
            (
                &[
                    "⒎", // U+248E: DIGIT SEVEN FULL STOP
                ],
                "7.",
            ),
            (
                &[
                    "⑺", // U+247A: PARENTHESIZED DIGIT SEVEN
                ],
                "(7)",
            ),
            (
                &[
                    "⁸",  // U+2078: SUPERSCRIPT EIGHT
                    "₈",  // U+2088: SUBSCRIPT EIGHT
                    "⑧",  // U+2467: CIRCLED DIGIT EIGHT
                    "⓼",  // U+24FC: DOUBLE CIRCLED DIGIT EIGHT
                    "❽",  // U+277D: DINGBAT NEGATIVE CIRCLED DIGIT EIGHT
                    "➇",  // U+2787: DINGBAT CIRCLED SANS-SERIF DIGIT EIGHT
                    "➑",  // U+2791: DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT EIGHT
                    "８", // U+FF18: FULLWIDTH DIGIT EIGHT
                ],
                "8",
            ),
            (
                &[
                    "⒏", // U+248F: DIGIT EIGHT FULL STOP
                ],
                "8.",
            ),
            (
                &[
                    "⑻", // U+247B: PARENTHESIZED DIGIT EIGHT
                ],
                "(8)",
            ),
            (
                &[
                    "⁹",  // U+2079: SUPERSCRIPT NINE
                    "₉",  // U+2089: SUBSCRIPT NINE
                    "⑨",  // U+2468: CIRCLED DIGIT NINE
                    "⓽",  // U+24FD: DOUBLE CIRCLED DIGIT NINE
                    "❾",  // U+277E: DINGBAT NEGATIVE CIRCLED DIGIT NINE
                    "➈",  // U+2788: DINGBAT CIRCLED SANS-SERIF DIGIT NINE
                    "➒",  // U+2792: DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT NINE
                    "９", // U+FF19: FULLWIDTH DIGIT NINE
                ],
                "9",
            ),
            (
                &[
                    "⒐", // U+2490: DIGIT NINE FULL STOP
                ],
                "9.",
            ),
            (
                &[
                    "⑼", // U+247C: PARENTHESIZED DIGIT NINE
                ],
                "(9)",
            ),
            (
                &[
                    "⑩", // U+2469: CIRCLED NUMBER TEN
                    "⓾", // U+24FE: DOUBLE CIRCLED NUMBER TEN
                    "❿", // U+277F: DINGBAT NEGATIVE CIRCLED NUMBER TEN
                    "➉", // U+2789: DINGBAT CIRCLED SANS-SERIF NUMBER TEN
                    "➓", // U+2793: DINGBAT NEGATIVE CIRCLED SANS-SERIF NUMBER TEN
                ],
                "10",
            ),
            (
                &[
                    "⒑", // U+2491: NUMBER TEN FULL STOP
                ],
                "10.",
            ),
            (
                &[
                    "⑽", // U+247D: PARENTHESIZED NUMBER TEN
                ],
                "(10)",
            ),
            (
                &[
                    "⑪", // U+246A: CIRCLED NUMBER ELEVEN
                    "⓫", // U+24EB: NEGATIVE CIRCLED NUMBER ELEVEN
                ],
                "11",
            ),
            (
                &[
                    "⒒", // U+2492: NUMBER ELEVEN FULL STOP
                ],
                "11.",
            ),
            (
                &[
                    "⑾", // U+247E: PARENTHESIZED NUMBER ELEVEN
                ],
                "(11)",
            ),
            (
                &[
                    "⑫", // U+246B: CIRCLED NUMBER TWELVE
                    "⓬", // U+24EC: NEGATIVE CIRCLED NUMBER TWELVE
                ],
                "12",
            ),
            (
                &[
                    "⒓", // U+2493: NUMBER TWELVE FULL STOP
                ],
                "12.",
            ),
            (
                &[
                    "⑿", // U+247F: PARENTHESIZED NUMBER TWELVE
                ],
                "(12)",
            ),
            (
                &[
                    "⑬", // U+246C: CIRCLED NUMBER THIRTEEN
                    "⓭", // U+24ED: NEGATIVE CIRCLED NUMBER THIRTEEN
                ],
                "13",
            ),
            (
                &[
                    "⒔", // U+2494: NUMBER THIRTEEN FULL STOP
                ],
                "13.",
            ),
            (
                &[
                    "⒀", // U+2480: PARENTHESIZED NUMBER THIRTEEN
                ],
                "(13)",
            ),
            (
                &[
                    "⑭", // U+246D: CIRCLED NUMBER FOURTEEN
                    "⓮", // U+24EE: NEGATIVE CIRCLED NUMBER FOURTEEN
                ],
                "14",
            ),
            (
                &[
                    "⒕", // U+2495: NUMBER FOURTEEN FULL STOP
                ],
                "14.",
            ),
            (
                &[
                    "⒁", // U+2481: PARENTHESIZED NUMBER FOURTEEN
                ],
                "(14)",
            ),
            (
                &[
                    "⑮", // U+246E: CIRCLED NUMBER FIFTEEN
                    "⓯", // U+24EF: NEGATIVE CIRCLED NUMBER FIFTEEN
                ],
                "15",
            ),
            (
                &[
                    "⒖", // U+2496: NUMBER FIFTEEN FULL STOP
                ],
                "15.",
            ),
            (
                &[
                    "⒂", // U+2482: PARENTHESIZED NUMBER FIFTEEN
                ],
                "(15)",
            ),
            (
                &[
                    "⑯", // U+246F: CIRCLED NUMBER SIXTEEN
                    "⓰", // U+24F0: NEGATIVE CIRCLED NUMBER SIXTEEN
                ],
                "16",
            ),
            (
                &[
                    "⒗", // U+2497: NUMBER SIXTEEN FULL STOP
                ],
                "16.",
            ),
            (
                &[
                    "⒃", // U+2483: PARENTHESIZED NUMBER SIXTEEN
                ],
                "(16)",
            ),
            (
                &[
                    "⑰", // U+2470: CIRCLED NUMBER SEVENTEEN
                    "⓱", // U+24F1: NEGATIVE CIRCLED NUMBER SEVENTEEN
                ],
                "17",
            ),
            (
                &[
                    "⒘", // U+2498: NUMBER SEVENTEEN FULL STOP
                ],
                "17.",
            ),
            (
                &[
                    "⒄", // U+2484: PARENTHESIZED NUMBER SEVENTEEN
                ],
                "(17)",
            ),
            (
                &[
                    "⑱", // U+2471: CIRCLED NUMBER EIGHTEEN
                    "⓲", // U+24F2: NEGATIVE CIRCLED NUMBER EIGHTEEN
                ],
                "18",
            ),
            (
                &[
                    "⒙", // U+2499: NUMBER EIGHTEEN FULL STOP
                ],
                "18.",
            ),
            (
                &[
                    "⒅", // U+2485: PARENTHESIZED NUMBER EIGHTEEN
                ],
                "(18)",
            ),
            (
                &[
                    "⑲", // U+2472: CIRCLED NUMBER NINETEEN
                    "⓳", // U+24F3: NEGATIVE CIRCLED NUMBER NINETEEN
                ],
                "19",
            ),
            (
                &[
                    "⒚", // U+249A: NUMBER NINETEEN FULL STOP
                ],
                "19.",
            ),
            (
                &[
                    "⒆", // U+2486: PARENTHESIZED NUMBER NINETEEN
                ],
                "(19)",
            ),
            (
                &[
                    "⑳", // U+2473: CIRCLED NUMBER TWENTY
                    "⓴", // U+24F4: NEGATIVE CIRCLED NUMBER TWENTY
                ],
                "20",
            ),
            (
                &[
                    "⒛", // U+249B: NUMBER TWENTY FULL STOP
                ],
                "20.",
            ),
            (
                &[
                    "⒇", // U+2487: PARENTHESIZED NUMBER TWENTY
                ],
                "(20)",
            ),
            (
                &[
                    "«",  // U+00AB: LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
                    "»",  // U+00BB: RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
                    "“",  // U+201C: LEFT DOUBLE QUOTATION MARK
                    "”",  // U+201D: RIGHT DOUBLE QUOTATION MARK
                    "„",  // U+201E: DOUBLE LOW-9 QUOTATION MARK
                    "″",  // U+2033: DOUBLE PRIME
                    "‶",  // U+2036: REVERSED DOUBLE PRIME
                    "❝",  // U+275D: HEAVY DOUBLE TURNED COMMA QUOTATION MARK ORNAMENT
                    "❞",  // U+275E: HEAVY DOUBLE COMMA QUOTATION MARK ORNAMENT
                    "❮",  // U+276E: HEAVY LEFT-POINTING ANGLE QUOTATION MARK ORNAMENT
                    "❯",  // U+276F: HEAVY RIGHT-POINTING ANGLE QUOTATION MARK ORNAMENT
                    "＂", // U+FF02: FULLWIDTH QUOTATION MARK
                ],
                "\"",
            ),
            (
                &[
                    "‘",  // U+2018: LEFT SINGLE QUOTATION MARK
                    "’",  // U+2019: RIGHT SINGLE QUOTATION MARK
                    "‚",  // U+201A: SINGLE LOW-9 QUOTATION MARK
                    "‛",  // U+201B: SINGLE HIGH-REVERSED-9 QUOTATION MARK
                    "′",  // U+2032: PRIME
                    "‵",  // U+2035: REVERSED PRIME
                    "‹",  // U+2039: SINGLE LEFT-POINTING ANGLE QUOTATION MARK
                    "›",  // U+203A: SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
                    "❛",  // U+275B: HEAVY SINGLE TURNED COMMA QUOTATION MARK ORNAMENT
                    "❜",  // U+275C: HEAVY SINGLE COMMA QUOTATION MARK ORNAMENT
                    "＇", // U+FF07: FULLWIDTH APOSTROPHE
                ],
                "'",
            ),
            (
                &[
                    "‐",  // U+2010: HYPHEN
                    "‑",  // U+2011: NON-BREAKING HYPHEN
                    "‒",  // U+2012: FIGURE DASH
                    "–",  // U+2013: EN DASH
                    "—",  // U+2014: EM DASH
                    "⁻",  // U+207B: SUPERSCRIPT MINUS
                    "₋",  // U+208B: SUBSCRIPT MINUS
                    "－", // U+FF0D: FULLWIDTH HYPHEN-MINUS
                ],
                "-",
            ),
            (
                &[
                    "⁅",  // U+2045: LEFT SQUARE BRACKET WITH QUILL
                    "❲",  // U+2772: LIGHT LEFT TORTOISE SHELL BRACKET ORNAMENT
                    "［", // U+FF3B: FULLWIDTH LEFT SQUARE BRACKET
                ],
                "[",
            ),
            (
                &[
                    "⁆",  // U+2046: RIGHT SQUARE BRACKET WITH QUILL
                    "❳",  // U+2773: LIGHT RIGHT TORTOISE SHELL BRACKET ORNAMENT
                    "］", // U+FF3D: FULLWIDTH RIGHT SQUARE BRACKET
                ],
                "]",
            ),
            (
                &[
                    "⁽",  // U+207D: SUPERSCRIPT LEFT PARENTHESIS
                    "₍",  // U+208D: SUBSCRIPT LEFT PARENTHESIS
                    "❨",  // U+2768: MEDIUM LEFT PARENTHESIS ORNAMENT
                    "❪",  // U+276A: MEDIUM FLATTENED LEFT PARENTHESIS ORNAMENT
                    "（", // U+FF08: FULLWIDTH LEFT PARENTHESIS
                ],
                "(",
            ),
            (
                &[
                    "⸨", // U+2E28: LEFT DOUBLE PARENTHESIS
                ],
                "((",
            ),
            (
                &[
                    "⁾",  // U+207E: SUPERSCRIPT RIGHT PARENTHESIS
                    "₎",  // U+208E: SUBSCRIPT RIGHT PARENTHESIS
                    "❩",  // U+2769: MEDIUM RIGHT PARENTHESIS ORNAMENT
                    "❫",  // U+276B: MEDIUM FLATTENED RIGHT PARENTHESIS ORNAMENT
                    "）", // U+FF09: FULLWIDTH RIGHT PARENTHESIS
                ],
                ")",
            ),
            (
                &[
                    "⸩", // U+2E29: RIGHT DOUBLE PARENTHESIS
                ],
                "))",
            ),
            (
                &[
                    "❬",  // U+276C: MEDIUM LEFT-POINTING ANGLE BRACKET ORNAMENT
                    "❰",  // U+2770: HEAVY LEFT-POINTING ANGLE BRACKET ORNAMENT
                    "＜", // U+FF1C: FULLWIDTH LESS-THAN SIGN
                ],
                "<",
            ),
            (
                &[
                    "❭",  // U+276D: MEDIUM RIGHT-POINTING ANGLE BRACKET ORNAMENT
                    "❱",  // U+2771: HEAVY RIGHT-POINTING ANGLE BRACKET ORNAMENT
                    "＞", // U+FF1E: FULLWIDTH GREATER-THAN SIGN
                ],
                ">",
            ),
            (
                &[
                    "❴",  // U+2774: MEDIUM LEFT CURLY BRACKET ORNAMENT
                    "｛", // U+FF5B: FULLWIDTH LEFT CURLY BRACKET
                ],
                "{",
            ),
            (
                &[
                    "❵",  // U+2775: MEDIUM RIGHT CURLY BRACKET ORNAMENT
                    "｝", // U+FF5D: FULLWIDTH RIGHT CURLY BRACKET
                ],
                "}",
            ),
            (
                &[
                    "⁺",  // U+207A: SUPERSCRIPT PLUS SIGN
                    "₊",  // U+208A: SUBSCRIPT PLUS SIGN
                    "＋", // U+FF0B: FULLWIDTH PLUS SIGN
                ],
                "+",
            ),
            (
                &[
                    "⁼",  // U+207C: SUPERSCRIPT EQUALS SIGN
                    "₌",  // U+208C: SUBSCRIPT EQUALS SIGN
                    "＝", // U+FF1D: FULLWIDTH EQUALS SIGN
                ],
                "=",
            ),
            (
                &[
                    "！", // U+FF01: FULLWIDTH EXCLAMATION MARK
                ],
                "!",
            ),
            (
                &[
                    "‼", // U+203C: DOUBLE EXCLAMATION MARK
                ],
                "!!",
            ),
            (
                &[
                    "⁉", // U+2049: EXCLAMATION QUESTION MARK
                ],
                "!?",
            ),
            (
                &[
                    "＃", // U+FF03: FULLWIDTH NUMBER SIGN
                ],
                "#",
            ),
            (
                &[
                    "＄", // U+FF04: FULLWIDTH DOLLAR SIGN
                ],
                "$",
            ),
            (
                &[
                    "⁒",  // U+2052: COMMERCIAL MINUS SIGN
                    "％", // U+FF05: FULLWIDTH PERCENT SIGN
                ],
                "%",
            ),
            (
                &[
                    "＆", // U+FF06: FULLWIDTH AMPERSAND
                ],
                "&",
            ),
            (
                &[
                    "⁎",  // U+204E: LOW ASTERISK
                    "＊", // U+FF0A: FULLWIDTH ASTERISK
                ],
                "*",
            ),
            (
                &[
                    "，", // U+FF0C: FULLWIDTH COMMA
                ],
                ",",
            ),
            (
                &[
                    "．", // U+FF0E: FULLWIDTH FULL STOP
                ],
                ".",
            ),
            (
                &[
                    "⁄",  // U+2044: FRACTION SLASH
                    "／", // U+FF0F: FULLWIDTH SOLIDUS
                ],
                "/",
            ),
            (
                &[
                    "：", // U+FF1A: FULLWIDTH COLON
                ],
                ":",
            ),
            (
                &[
                    "⁏",  // U+204F: REVERSED SEMICOLON
                    "；", // U+FF1B: FULLWIDTH SEMICOLON
                ],
                ";",
            ),
            (
                &[
                    "？", // U+FF1F: FULLWIDTH QUESTION MARK
                ],
                "?",
            ),
            (
                &[
                    "⁇", // U+2047: DOUBLE QUESTION MARK
                ],
                "??",
            ),
            (
                &[
                    "⁈", // U+2048: QUESTION EXCLAMATION MARK
                ],
                "?!",
            ),
            (
                &[
                    "＠", // U+FF20: FULLWIDTH COMMERCIAL AT
                ],
                "@",
            ),
            (
                &[
                    "＼", // U+FF3C: FULLWIDTH REVERSE SOLIDUS
                ],
                "\\",
            ),
            (
                &[
                    "‸",  // U+2038: CARET
                    "＾", // U+FF3E: FULLWIDTH CIRCUMFLEX ACCENT
                ],
                "^",
            ),
            (
                &[
                    "＿", // U+FF3F: FULLWIDTH LOW LINE
                ],
                "_",
            ),
            (
                &[
                    "⁓",  // U+2053: SWUNG DASH
                    "～", // U+FF5E: FULLWIDTH TILDE
                ],
                "~",
            ),
        ];

        for (characters, folded) in foldings {
            for &c in characters {
                assert_eq!(
                    folding_using_raw_tokenizer_helper(c),
                    folded,
                    "testing that character \"{c}\" becomes \"{folded}\""
                );
            }
        }
    }
}


================================================
FILE: src/tokenizer/empty_tokenizer.rs
================================================
use crate::tokenizer::{Token, TokenStream, Tokenizer};

/// Tokenizer whose token streams never produce a token, whatever the input text.
#[derive(Clone)]
pub(crate) struct EmptyTokenizer;

impl Tokenizer for EmptyTokenizer {
    type TokenStream<'a> = EmptyTokenStream;

    /// Ignores `_text` and hands back a default-constructed stream.
    fn token_stream(&mut self, _text: &str) -> EmptyTokenStream {
        Default::default()
    }
}

/// Token stream whose `advance` always returns `false`.
#[derive(Default)]
pub struct EmptyTokenStream {
    // Default-constructed token handed out by `token()` / `token_mut()`;
    // `advance` never writes to it.
    token: Token,
}

impl TokenStream for EmptyTokenStream {
    /// Always returns `false`: this stream never yields a token.
    fn advance(&mut self) -> bool {
        false
    }

    /// Returns a shared reference to the stored token.
    fn token(&self) -> &super::Token {
        &self.token
    }

    /// Returns a mutable reference to the stored token.
    fn token_mut(&mut self) -> &mut super::Token {
        &mut self.token
    }
}

#[cfg(test)]
mod tests {
    use crate::tokenizer::{TokenStream, Tokenizer};

    /// The stream must report exhaustion on the very first `advance` call.
    #[test]
    fn test_empty_tokenizer() {
        let mut empty_tokenizer = super::EmptyTokenizer;
        let mut stream = empty_tokenizer.token_stream("whatever string");
        let produced_token = stream.advance();
        assert!(!produced_token);
    }
}


================================================
FILE: src/tokenizer/facet_tokenizer.rs
================================================
use super::{Token, TokenStream, Tokenizer};
use crate::schema::FACET_SEP_BYTE;

/// The `FacetTokenizer` processes a `Facet` binary representation
/// and emits one token for the root facet, followed by one token for each
/// of its parents, ending with the facet itself.
///
/// For instance,  `/america/north_america/canada`
/// will emit the four following tokens, in this order
///     - `/`
///     - `/america`
///     - `/america/north_america`
///     - `/america/north_america/canada`
#[derive(Clone, Default)]
pub struct FacetTokenizer {
    // Token lent to every stream created by `token_stream`, which resets it first.
    token: Token,
}

/// Progress of a `FacetTokenStream` through the encoded facet text.
#[derive(Debug)]
enum State {
    /// Nothing has been emitted yet; the next `advance` emits the root facet.
    RootFacetNotEmitted,
    /// We already emitted the facet prefix up to `&text[..cursor]`.
    UpToPosition(usize),
    /// Every prefix has been emitted; `advance` returns `false` from now on.
    Terminated,
}

/// Token stream created by `FacetTokenizer::token_stream`.
///
/// Each successful `advance` appends the next facet segment to the token text,
/// so the token holds a progressively longer prefix of `text`.
pub struct FacetTokenStream<'a> {
    // Encoded facet being tokenized.
    text: &'a str,
    // How much of `text` has already been emitted.
    state: State,
    // Token borrowed from the tokenizer; its text accumulates the emitted prefix.
    token: &'a mut Token,
}

impl Tokenizer for FacetTokenizer {
    type TokenStream<'a> = FacetTokenStream<'a>;

    /// Starts a stream over the encoded facet `text`, reusing this tokenizer's token.
    ///
    /// The token is reset and its position set to 0 before it is lent to the stream.
    fn token_stream<'a>(&'a mut self, text: &'a str) -> FacetTokenStream<'a> {
        let token = &mut self.token;
        token.reset();
        token.position = 0;
        FacetTokenStream {
            text,
            // The first `advance` emits the root facet (empty token text).
            state: State::RootFacetNotEmitted,
            token,
        }
    }
}

impl TokenStream for FacetTokenStream<'_> {
    /// Moves to the next facet prefix.
    ///
    /// The first call emits the root facet (the token text is left as it was
    /// handed over by the tokenizer). Every following call appends one more
    /// segment of `text` to the token, up to the next separator byte or, when
    /// no separator is left, up to the end of `text`. Returns `false` once the
    /// whole facet has been emitted.
    fn advance(&mut self) -> bool {
        let cursor = match self.state {
            State::Terminated => return false,
            State::RootFacetNotEmitted => {
                // An empty text is the root facet itself: nothing else to emit.
                self.state = if self.text.is_empty() {
                    State::Terminated
                } else {
                    State::UpToPosition(0)
                };
                return true;
            }
            State::UpToPosition(cursor) => cursor,
        };

        // Skip the byte at `cursor`: it is either the first byte of the text
        // or the separator that ended the previously emitted segment.
        let search_start = cursor + 1;
        let next_separator = self.text.as_bytes()[search_start..]
            .iter()
            .position(|&byte| byte == FACET_SEP_BYTE)
            .map(|offset| search_start + offset);

        let (segment_end, next_state) = match next_separator {
            Some(separator_pos) => (separator_pos, State::UpToPosition(separator_pos)),
            None => (self.text.len(), State::Terminated),
        };
        self.token.text.push_str(&self.text[cursor..segment_end]);
        self.state = next_state;
        true
    }

    /// Returns the token currently held by the stream.
    fn token(&self) -> &Token {
        self.token
    }

    /// Returns the token currently held by the stream, mutably.
    fn token_mut(&mut self) -> &mut Token {
        self.token
    }
}

#[cfg(test)]
mod tests {

    use super::FacetTokenizer;
    use crate::schema::Facet;
    use crate::tokenizer::{Token, TokenStream, Tokenizer};

    /// Runs `facet` through a fresh `FacetTokenizer` and renders every emitted
    /// token back into its displayed facet path.
    fn emitted_facet_paths(facet: &Facet) -> Vec<String> {
        let mut paths = Vec::new();
        let mut record = |token: &Token| {
            let emitted = Facet::from_encoded(token.text.as_bytes().to_owned()).unwrap();
            paths.push(emitted.to_string());
        };
        FacetTokenizer::default()
            .token_stream(facet.encoded_str())
            .process(&mut record);
        paths
    }

    #[test]
    fn test_facet_tokenizer() {
        let facet = Facet::from_path(vec!["top", "a", "b"]);
        let paths = emitted_facet_paths(&facet);
        assert_eq!(paths, ["/", "/top", "/top/a", "/top/a/b"]);
    }

    #[test]
    fn test_facet_tokenizer_root_facets() {
        let paths = emitted_facet_paths(&Facet::root());
        assert_eq!(paths, ["/"]);
    }
}


================================================
FILE: src/tokenizer/lower_caser.rs
================================================
use std::mem;

use super::{Token, TokenFilter, TokenStream, Tokenizer};

/// Token filter that lowercases terms.
#[derive(Clone)]
pub struct LowerCaser;

impl TokenFilter for LowerCaser {
    type Tokenizer<T: Tokenizer> = LowerCaserFilter<T>;

    /// Wraps `tokenizer` so that every token it produces gets lowercased.
    fn transform<T: Tokenizer>(self, tokenizer: T) -> Self::Tokenizer<T> {
        // Scratch space for the non-ASCII path; starts out empty.
        let buffer = String::new();
        LowerCaserFilter { tokenizer, buffer }
    }
}

/// Tokenizer built by `LowerCaser::transform`: wraps another tokenizer and
/// lowercases the tokens of the streams it creates.
#[derive(Clone)]
pub struct LowerCaserFilter<T> {
    // The wrapped tokenizer.
    tokenizer: T,
    // Scratch string lent to each token stream for non-ASCII lowercasing.
    buffer: String,
}

impl<T: Tokenizer> Tokenizer for LowerCaserFilter<T> {
    type TokenStream<'a> = LowerCaserTokenStream<'a, T::TokenStream<'a>>;

    /// Creates the wrapped tokenizer's stream over `text` and pairs it with
    /// this filter's (freshly cleared) scratch buffer.
    fn token_stream<'a>(&'a mut self, text: &'a str) -> Self::TokenStream<'a> {
        self.buffer.clear();
        let tail = self.tokenizer.token_stream(text);
        LowerCaserTokenStream {
            buffer: &mut self.buffer,
            tail,
        }
    }
}

/// Token stream that lowercases the text of each token produced by `tail`.
pub struct LowerCaserTokenStream<'a, T> {
    // Scratch string borrowed from the `LowerCaserFilter`; swapped with the
    // token text after a non-ASCII lowercasing.
    buffer: &'a mut String,
    // The wrapped token stream.
    tail: T,
}

/// Replaces the contents of `output` with a lowercased version of `text`.
///
/// Every char is lowercased on its own through `char::to_lowercase`, so,
/// contrary to the std `str::to_lowercase`, the sigma special case is not
/// handled. This has a normalization effect, which is ok for search.
fn to_lowercase_unicode(text: &str, output: &mut String) {
    output.clear();
    output.reserve(50);
    output.extend(text.chars().flat_map(char::to_lowercase));
}

impl<T: TokenStream> TokenStream for LowerCaserTokenStream<'_, T> {
    /// Advances the wrapped stream and, when it produced a token, lowercases
    /// that token's text in place.
    fn advance(&mut self) -> bool {
        let advanced = self.tail.advance();
        if advanced {
            if self.token_mut().text.is_ascii() {
                // ASCII-only text can be lowercased in place, without the buffer.
                self.token_mut().text.make_ascii_lowercase();
            } else {
                // Lowercase into the scratch buffer, then trade it for the
                // token text so the old allocation becomes the next scratch.
                to_lowercase_unicode(&self.tail.token().text, self.buffer);
                mem::swap(&mut self.tail.token_mut().text, self.buffer);
            }
        }
        advanced
    }

    /// Returns the wrapped stream's current token.
    fn token(&self) -> &Token {
        self.tail.token()
    }

    /// Returns the wrapped stream's current token, mutably.
    fn token_mut(&mut self) -> &mut Token {
        self.tail.token_mut()
    }
}

#[cfg(test)]
mod tests {
    use crate::tokenizer::tests::assert_token;
    use crate::tokenizer::{LowerCaser, SimpleTokenizer, TextAnalyzer, Token};

    /// Tokenizes `text` with `SimpleTokenizer` + `LowerCaser` and collects
    /// a copy of every emitted token.
    fn token_stream_helper(text: &str) -> Vec<Token> {
        let mut analyzer = TextAnalyzer::builder(SimpleTokenizer::default())
            .filter(LowerCaser)
            .build();
        let mut stream = analyzer.token_stream(text);

        let mut collected = Vec::new();
        let mut keep = |token: &Token| collected.push(token.clone());
        stream.process(&mut keep);
        collected
    }

    #[test]
    fn test_to_lower_case() {
        // ASCII fast path.
        let ascii_tokens = token_stream_helper("Tree");
        assert_eq!(ascii_tokens.len(), 1);
        assert_token(&ascii_tokens[0], 0, "tree", 0, 4);

        // Non-ASCII path.
        let cyrillic_tokens = token_stream_helper("Русский текст");
        assert_eq!(cyrillic_tokens.len(), 2);
        assert_token(&cyrillic_tokens[0], 0, "русский", 0, 14);
        assert_token(&cyrillic_tokens[1], 1, "текст", 15, 25);
    }
}


================================================
FILE: src/tokenizer/mod.rs
================================================
//! Tokenizers are in charge of chopping text into a stream of tokens
//! ready for indexing.
//!
//! You must define in your schema which tokenizer should be used for
//! each of your fields :
//!
//! ```rust
//! use tantivy::schema::*;
//!
//! let mut schema_builder = Schema::builder();
//!
//! let text_options = TextOptions::default()
//!     .set_indexing_options(
//!         TextFieldIndexing::default()
//!             .set_tokenizer("en_stem")
//!             .set_index_option(IndexRecordOption::Basic)
//!     )
//!     .set_stored();
//!
//! let id_options = TextOptions::default()
//!     .set_indexing_options(
//!         TextFieldIndexing::default()
//!             .set_tokenizer("raw_ids")
//!             .set_index_option(IndexRecordOption::WithFreqsAndPositions)
//!     )
//!     .set_stored();
//!
//! schema_builder.add_text_field("title", text_options.clone());
//! schema_builder.add_text_field("text", text_options);
//! schema_builder.add_text_field("uuid", id_options);
//!
//! let schema = schema_builder.build();
//! ```
//!
//! By default, `tantivy` offers the following tokenizers:
//!
//! ## `default`
//!
//! `default` is the tokenizer that will be used if you do not
//! assign a specific tokenizer to your text field.
//! It chops your text on punctuation and whitespace,
//! removes tokens that are longer than 40 chars, and lowercases your text.
//!
//! ## `raw`
//! Does not actually tokenize your text. It keeps it entirely unprocessed.
//! It can be useful to index uuids, or urls for instance.
//!
//! ## `en_stem`
//!
//! In addition to what `default` does, the `en_stem` tokenizer also
//! applies stemming to your tokens. Stemming consists in trimming words to
//! remove their inflection. This tokenizer is slower than the default one,
//! but is recommended to improve recall.
//!
//! # Custom tokenizer library
//! If you are writing a library of custom tokenizers, avoid depending on `tantivy` itself
//! and depend on `tantivy-tokenizer-api` instead.
//!
//! # Custom tokenizers
//!
//! You can write your own tokenizer by implementing the [`Tokenizer`] trait
//! or you can extend an existing [`Tokenizer`] by chaining it with several
//! [`TokenFilter`]s.
//!
//! For instance, the `en_stem` is defined as follows.
//!
//! ```rust
//! use tantivy::tokenizer::*;
//!
//! let en_stem = TextAnalyzer::builder(SimpleTokenizer::default())
//!     .filter(RemoveLongFilter::limit(40))
//!     .filter(LowerCaser)
//!     .filter(Stemmer::new(Language::English))
//!     .build();
//! ```
//!
//! Once your tokenizer is defined, you need to
//! register it with a name in your index's [`TokenizerManager`].
//!
//! ```rust
//! # use tantivy::schema::Schema;
//! # use tantivy::tokenizer::*;
//! # use tantivy::Index;
//! #
//! let custom_en_tokenizer = SimpleTokenizer::default();
//! # let schema = Schema::builder().build();
//! let index = Index::create_in_ram(schema);
//! index.tokenizers()
//!      .register("custom_en", custom_en_tokenizer);
//! ```
//!
//! If you built your schema programmatically, a complete example
//! could look like this for instance.
//!
//! Note that tokens with a len greater or equal to
//! [`MAX_TOKEN_LEN`] are simply ignored downstream.
//!
//! # Example
//!
//! ```rust
//! use tantivy::schema::{Schema, IndexRecordOption, TextOptions, TextFieldIndexing};
//! use tantivy::tokenizer::*;
//! use tantivy::Index;
//!
//! let mut schema_builder = Schema::builder();
//! let text_field_indexing = TextFieldIndexing::default()
//!     .set_tokenizer("custom_en")
//!     .set_index_option(IndexRecordOption::WithFreqsAndPositions);
//! let text_options = TextOptions::default()
//!     .set_indexing_options(text_field_indexing)
//!     .set_stored();
//! schema_builder.add_text_field("title", text_options);
//! let schema = schema_builder.build();
//! let index = Index::create_in_ram(schema);
//!
//! // We need to register our tokenizer :
//! let custom_en_tokenizer = TextAnalyzer::builder(SimpleTokenizer::default())
//!     .filter(RemoveLongFilter::limit(40))
//!     .filter(LowerCaser)
//!     .build();
//! index
//!     .tokenizers()
//!     .register("custom_en", custom_en_tokenizer);
//! ```
mod alphanum_only;
mod ascii_folding_filter;
mod empty_tokenizer;
mod facet_tokenizer;
mod lower_caser;
mod ngram_tokenizer;
mod raw_tokenizer;
mod regex_tokenizer;
mod remove_long;
mod simple_tokenizer;
mod split_compound_words;
mod stop_word_filter;
mod tokenized_string;
mod tokenizer;
mod tokenizer_manager;
mod whitespace_tokenizer;

#[cfg(feature = "stemmer")]
mod stemmer;
pub use tokenizer_api::{BoxTokenStream, Token, TokenFilter, TokenStream, Tokenizer};

pub use self::alphanum_only::AlphaNumOnlyFilter;
pub use self::ascii_folding_filter::AsciiFoldingFilter;
pub use self::facet_tokenizer::FacetTokenizer;
pub use self::lower_caser::LowerCaser;
pub use self::ngram_tokenizer::NgramTokenizer;
pub use self::raw_tokenizer::RawTokenizer;
pub use self::regex_tokenizer::RegexTokenizer;
pub use self::remove_long::RemoveLongFilter;
pub use self::simple_tokenizer::{SimpleTokenStream, SimpleTokenizer};
pub use self::split_compound_words::SplitCompoundWords;
#[cfg(feature = "stemmer")]
pub use self::stemmer::{Language, Stemmer};
pub use self::stop_word_filter::StopWordFilter;
pub use self::tokenized_string::{PreTokenizedStream, PreTokenizedString};
pub use self::tokenizer::{TextAnalyzer, TextAnalyzerBuilder};
pub use self::tokenizer_manager::TokenizerManager;
pub use self::whitespace_tokenizer::WhitespaceTokenizer;

/// Maximum authorized len (in bytes) for a token.
///
/// The value is `u16::MAX - 5`, i.e. `2^16 - 1 - 5 = 65_530` bytes.
///
/// Tokenizers are in charge of not emitting tokens larger than this value.
/// Currently, if a faulty tokenizer implementation emits tokens with a length larger than
/// `2^16 - 1 - 5`, the token will simply be ignored downstream.
pub const MAX_TOKEN_LEN: usize = u16::MAX as usize - 5;

#[cfg(test)]
pub(crate) mod tests {
    use super::{Token, TokenizerManager};

    /// Test helper, shared with the other tokenizer test modules, that checks a
    /// token's position, text and byte offsets (in that order).
    pub fn assert_token(token: &Token, position: usize, text: &str, from: usize, to: usize) {
        assert_eq!(
            token.position, position,
            "expected position {position} but {token:?}"
        );
        assert_eq!(token.text, text, "expected text {text} but {token:?}");
        assert_eq!(
            token.offset_from, from,
            "expected offset_from {from} but {token:?}"
        );
        assert_eq!(token.offset_to, to, "expected offset_to {to} but {token:?}");
    }

    #[test]
    fn test_raw_tokenizer2() {
        let manager = TokenizerManager::default();
        let mut raw_tokenizer = manager.get("raw").unwrap();
        let mut collected: Vec<Token> = Vec::new();
        raw_tokenizer
            .token_stream("Hello, happy tax payer!")
            .process(&mut |token: &Token| collected.push(token.clone()));

        // The raw tokenizer emits the whole input as one token.
        assert_eq!(collected.len(), 1);
        assert_token(&collected[0], 0, "Hello, happy tax payer!", 0, 23);
    }

    #[test]
    fn test_tokenizer_does_not_exist() {
        let manager = TokenizerManager::default();
        let lookup = manager.get("en_doesnotexist");
        assert!(lookup.is_none());
    }

    #[test]
    fn test_tokenizer_empty() {
        let manager = TokenizerManager::default();
        let mut default_tokenizer = manager.get("default").unwrap();
        // The same tokenizer instance is used twice in a row on purpose.
        for _ in 0..2 {
            let mut collected: Vec<Token> = Vec::new();
            default_tokenizer
                .token_stream(" ")
                .process(&mut |token: &Token| collected.push(token.clone()));
            assert!(collected.is_empty());
        }
    }

    #[test]
    fn test_whitespace_tokenizer() {
        let manager = TokenizerManager::default();
        let mut ws_tokenizer = manager.get("whitespace").unwrap();
        let mut collected: Vec<Token> = Vec::new();
        ws_tokenizer
            .token_stream("Hello, happy tax payer!")
            .process(&mut |token: &Token| collected.push(token.clone()));

        // (text, offset_from, offset_to); the position is the index in the list.
        let expected = [
            ("Hello,", 0, 6),
            ("happy", 7, 12),
            ("tax", 13, 16),
            ("payer!", 17, 23),
        ];
        assert_eq!(collected.len(), 4);
        for (position, &(text, from, to)) in expected.iter().enumerate() {
            assert_token(&collected[position], position, text, from, to);
        }
    }
}


================================================
FILE: src/tokenizer/ngram_tokenizer.rs
================================================
use super::{Token, TokenStream, Tokenizer};
use crate::TantivyError;

/// Tokenize the text by splitting words into n-grams of the given size(s)
///
/// With this tokenizer, the `position` is always 0.
/// Beware however: in the presence of multiple values for the same field,
/// the position will be `POSITION_GAP * index of value`.
///
/// Example 1: `hello` would be tokenized as (min_gram: 2, max_gram: 3, prefix_only: false)
///
/// | Term     | he  | hel | el  | ell | ll  | llo | lo |
/// |----------|-----|-----|-----|-----|-----|-----|----|
/// | Position | 0   | 0   | 0   | 0   | 0   | 0   | 0  |
/// | Offsets  | 0,2 | 0,3 | 1,3 | 1,4 | 2,4 | 2,5 | 3,5|
///
/// Example 2: `hello` would be tokenized as (min_gram: 2, max_gram: 5, prefix_only: **true**)
///
/// | Term     | he  | hel | hell  | hello |
/// |----------|-----|-----|-------|-------|
/// | Position | 0   | 0   | 0     | 0     |
/// | Offsets  | 0,2 | 0,3 | 0,4   | 0,5   |
///
/// Example 3: `hεllo` (non-ascii) would be tokenized as (min_gram: 2, max_gram: 5, prefix_only:
/// **true**)
///
/// | Term     | hε  | hεl | hεll  | hεllo |
/// |----------|-----|-----|-------|-------|
/// | Position | 0   | 0   | 0     | 0     |
/// | Offsets  | 0,3 | 0,4 | 0,5   | 0,6   |
///
/// # Example
///
/// ```rust
/// use tantivy::tokenizer::*;
///
/// let mut tokenizer = NgramTokenizer::new(2, 3, false).unwrap();
/// let mut stream = tokenizer.token_stream("hello");
/// {
///     let token = stream.next().unwrap();
///     assert_eq!(token.text, "he");
///     assert_eq!(token.offset_from, 0);
///     assert_eq!(token.offset_to, 2);
/// }
/// {
///   let token = stream.next().unwrap();
///     assert_eq!(token.text, "hel");
///     assert_eq!(token.offset_from, 0);
///     assert_eq!(token.offset_to, 3);
/// }
/// {
///   let token = stream.next().unwrap();
///     assert_eq!(token.text, "el");
///     assert_eq!(token.offset_from, 1);
///     assert_eq!(token.offset_to, 3);
/// }
/// {
///   let token = stream.next().unwrap();
///     assert_eq!(token.text, "ell");
///     assert_eq!(token.offset_from, 1);
///     assert_eq!(token.offset_to, 4);
/// }
/// {
///   let token = stream.next().unwrap();
///     assert_eq!(token.text, "ll");
///     assert_eq!(token.offset_from, 2);
///     assert_eq!(token.offset_to, 4);
/// }
/// {
///   let token = stream.next().unwrap();
///     assert_eq!(token.text, "llo");
///     assert_eq!(token.offset_from, 2);
///     assert_eq!(token.offset_to, 5);
/// }
/// {
///   let token = stream.next().unwrap();
///   assert_eq!(token.text, "lo");
///   assert_eq!(token.offset_from, 3);
///   assert_eq!(token.offset_to, 5);
/// }
/// assert!(stream.next().is_none());
/// ```
#[derive(Clone, Debug)]
pub struct NgramTokenizer {
    /// min size of the n-gram
    min_gram: usize,
    /// max size of the n-gram
    max_gram: usize,
    /// if true, will only parse the leading edge of the input
    prefix_only: bool,
    /// Token buffer lent (by mutable reference) to every stream created by
    /// `token_stream`; it is reset each time a new stream is created.
    token: Token,
}

impl NgramTokenizer {
    /// Configures a new Ngram tokenizer.
    ///
    /// # Errors
    ///
    /// Returns `TantivyError::InvalidArgument` if `min_gram` is 0 or if
    /// `min_gram` is greater than `max_gram`.
    pub fn new(
        min_gram: usize,
        max_gram: usize,
        prefix_only: bool,
    ) -> crate::Result<NgramTokenizer> {
        // `min_gram == 0` is checked first, so it wins when both rules are violated.
        let rejection = if min_gram == 0 {
            Some("min_gram must be greater than 0")
        } else if min_gram > max_gram {
            Some("min_gram must not be greater than max_gram")
        } else {
            None
        };
        match rejection {
            Some(reason) => Err(TantivyError::InvalidArgument(reason.to_string())),
            None => Ok(NgramTokenizer {
                min_gram,
                max_gram,
                prefix_only,
                token: Token::default(),
            }),
        }
    }

    /// Create a `NGramTokenizer` which generates tokens for all inner ngrams.
    ///
    /// This is as opposed to only prefix ngrams.
    pub fn all_ngrams(min_gram: usize, max_gram: usize) -> crate::Result<NgramTokenizer> {
        let prefix_only = false;
        Self::new(min_gram, max_gram, prefix_only)
    }

    /// Create a `NGramTokenizer` which only generates tokens for the
    /// prefix ngrams.
    pub fn prefix_only(min_gram: usize, max_gram: usize) -> crate::Result<NgramTokenizer> {
        let prefix_only = true;
        Self::new(min_gram, max_gram, prefix_only)
    }
}

/// TokenStream associated with the `NgramTokenizer`.
pub struct NgramTokenStream<'a> {
    /// Source of the `(offset_from, offset_to)` byte offsets of each ngram.
    ngram_charidx_iterator: StutteringIterator<CodepointFrontiers<'a>>,
    /// true if the NgramTokenStream is in prefix mode.
    prefix_only: bool,
    /// Input text; each ngram is sliced out of it.
    text: &'a str,
    /// Output token, overwritten on every successful `advance`.
    token: &'a mut Token,
}

impl Tokenizer for NgramTokenizer {
    type TokenStream<'a> = NgramTokenStream<'a>;

    /// Resets the tokenizer's token and returns a stream producing the ngrams of `text`.
    fn token_stream<'a>(&'a mut self, text: &'a str) -> NgramTokenStream<'a> {
        self.token.reset();
        // Byte offsets of every codepoint boundary of `text`...
        let frontiers = CodepointFrontiers::for_str(text);
        // ... paired up into `(from, to)` ranges spanning `min_gram..=max_gram` codepoints.
        let ngram_charidx_iterator =
            StutteringIterator::new(frontiers, self.min_gram, self.max_gram);
        NgramTokenStream {
            ngram_charidx_iterator,
            prefix_only: self.prefix_only,
            text,
            token: &mut self.token,
        }
    }
}

impl TokenStream for NgramTokenStream<'_> {
    /// Moves to the next ngram and writes it into the token.
    ///
    /// Returns `false` once the offsets iterator is exhausted or, in prefix
    /// mode, as soon as an ngram that does not start at offset 0 comes up.
    fn advance(&mut self) -> bool {
        let Some((offset_from, offset_to)) = self.ngram_charidx_iterator.next() else {
            return false;
        };
        if self.prefix_only && offset_from > 0 {
            return false;
        }
        let token = &mut *self.token;
        token.position = 0;
        token.offset_from = offset_from;
        token.offset_to = offset_to;
        token.text.clear();
        token.text.push_str(&self.text[offset_from..offset_to]);
        true
    }

    fn token(&self) -> &Token {
        self.token
    }

    fn token_mut(&mut self) -> &mut Token {
        self.token
    }
}

/// This iterator takes an underlying Iterator
/// and emits all of the pairs `(a,b)` such that
/// a and b are items emitted by the iterator at
/// an interval between `min_gram` and `max_gram`.
///
/// The elements are emitted in the order of appearance
/// of `a` first, `b` then.
///
/// For instance, over `0..4` with `min_gram = 1` and `max_gram = 2`, it emits
/// `(0, 1), (0, 2), (1, 2), (1, 3), (2, 3)`.
///
/// Once `None` has been returned, every further call to `next` returns `None`
/// without touching the internal state again.
struct StutteringIterator<T> {
    /// Iterator providing the items to pair up.
    underlying: T,
    /// Smallest distance (in items) between the two members of a pair.
    min_gram: usize,
    /// Largest distance (in items) between the two members of a pair.
    /// It shrinks as the underlying iterator runs dry.
    max_gram: usize,

    /// Ring buffer holding the last `max_gram + 1` items of `underlying`.
    memory: Vec<usize>,
    /// Index in `memory` of the first member of the pairs being emitted.
    cursor: usize,
    /// Distance between the two members of the next pair to emit.
    gram_len: usize,
}

impl<T> StutteringIterator<T>
where T: Iterator<Item = usize>
{
    /// Creates the iterator, eagerly pulling up to `max_gram + 1` items out of `underlying`.
    ///
    /// If `underlying` yields `min_gram` items or fewer, the result is an empty iterator.
    ///
    /// # Panics
    ///
    /// Panics if `min_gram` is 0.
    pub fn new(mut underlying: T, min_gram: usize, max_gram: usize) -> StutteringIterator<T> {
        assert!(min_gram > 0);
        // `max_gram + 1` would overflow for `max_gram == usize::MAX`.
        let window_len = max_gram.saturating_add(1);
        let memory: Vec<usize> = underlying.by_ref().take(window_len).collect();
        if memory.len() <= min_gram {
            // returns an empty iterator
            StutteringIterator {
                underlying,
                min_gram: 1,
                max_gram: 0,
                memory,
                cursor: 0,
                gram_len: 0,
            }
        } else {
            StutteringIterator {
                underlying,
                min_gram,
                // The input may be shorter than the requested window.
                max_gram: memory.len() - 1,
                memory,
                cursor: 0,
                gram_len: min_gram,
            }
        }
    }
}

impl<T> Iterator for StutteringIterator<T>
where T: Iterator<Item = usize>
{
    type Item = (usize, usize);

    fn next(&mut self) -> Option<(usize, usize)> {
        // Exhausted (or built empty): stay exhausted. Without this guard, calling
        // `next` again after `None` would keep decrementing `max_gram` below zero.
        if self.max_gram < self.min_gram {
            return None;
        }
        if self.gram_len > self.max_gram {
            // we have exhausted all options
            // starting at `self.memory[self.cursor]`.
            //
            // Time to advance.
            self.gram_len = self.min_gram;
            if let Some(next_val) = self.underlying.next() {
                // Overwrite the slot we are leaving with the newest item.
                self.memory[self.cursor] = next_val;
            } else {
                // No new item: the window shrinks by one.
                // Cannot underflow, `max_gram >= min_gram >= 1` holds here.
                self.max_gram -= 1;
            }
            self.cursor += 1;
            if self.cursor >= self.memory.len() {
                self.cursor = 0;
            }
            if self.max_gram < self.min_gram {
                return None;
            }
        }
        let ring_len = self.memory.len();
        let start = self.memory[self.cursor % ring_len];
        let stop = self.memory[(self.cursor + self.gram_len) % ring_len];
        self.gram_len += 1;
        Some((start, stop))
    }
}

/// Iterator over the byte offsets at which a codepoint of a string starts
/// or ends.
///
/// By convention, `[0]` is emitted for the empty string.
struct CodepointFrontiers<'a> {
    /// Part of the string that has not been walked over yet.
    s: &'a str,
    /// Offset to emit on the next call, `None` once the end was emitted.
    next_el: Option<usize>,
}

impl<'a> CodepointFrontiers<'a> {
    /// Starts at offset 0 of `s`.
    fn for_str(s: &'a str) -> Self {
        Self {
            s,
            next_el: Some(0),
        }
    }
}

impl Iterator for CodepointFrontiers<'_> {
    type Item = usize;

    fn next(&mut self) -> Option<usize> {
        let offset = self.next_el?;
        // Prepare the following frontier before handing out the current one.
        self.next_el = match self.s.as_bytes().first().copied() {
            Some(lead_byte) => {
                let width = utf8_codepoint_width(lead_byte);
                self.s = &self.s[width..];
                Some(offset + width)
            }
            // Nothing left: `offset` was the end of the string.
            None => None,
        };
        Some(offset)
    }
}

// Width of a codepoint, indexed by the 4 most significant bits of its first byte.
const CODEPOINT_UTF8_WIDTH: [u8; 16] = [1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 3, 4];

// Number of bytes used to encode a codepoint in UTF-8, given
// its first byte.
//
// Only the 4 most significant bits of the byte are needed: they are
// looked up in `CODEPOINT_UTF8_WIDTH`.
fn utf8_codepoint_width(b: u8) -> usize {
    let high_nibble = usize::from(b >> 4);
    usize::from(CODEPOINT_UTF8_WIDTH[high_nibble])
}

#[cfg(test)]
mod tests {

    use super::{utf8_codepoint_width, CodepointFrontiers, NgramTokenizer, StutteringIterator};
    use crate::tokenizer::tests::assert_token;
    use crate::tokenizer::{Token, TokenStream, Tokenizer};

    /// Drains `stream` and returns a copy of every token it produced.
    fn test_helper<T: TokenStream>(mut stream: T) -> Vec<Token> {
        let mut collected: Vec<Token> = Vec::new();
        stream.process(&mut |token: &Token| collected.push(token.clone()));
        collected
    }

    /// Checks `tokens` against `expected`, given as `(text, offset_from, offset_to)`
    /// triples. Every token is expected to sit at position 0.
    fn assert_ngrams(tokens: &[Token], expected: &[(&str, usize, usize)]) {
        assert_eq!(tokens.len(), expected.len());
        for (token, &(text, from, to)) in tokens.iter().zip(expected) {
            assert_token(token, 0, text, from, to);
        }
    }

    #[test]
    fn test_utf8_codepoint_width() {
        // 0xxx
        for byte in 0u8..0x80 {
            assert_eq!(utf8_codepoint_width(byte), 1);
        }
        // 110xx
        for byte in 0xC0u8..0xE0 {
            assert_eq!(utf8_codepoint_width(byte), 2);
        }
        // 1110xx
        for byte in 0xE0u8..0xF0 {
            assert_eq!(utf8_codepoint_width(byte), 3);
        }
        // 1111xx
        for byte in 0xF0u8..=0xFF {
            assert_eq!(utf8_codepoint_width(byte), 4);
        }
    }

    #[test]
    fn test_codepoint_frontiers() {
        let frontiers_of = |text| CodepointFrontiers::for_str(text).collect::<Vec<usize>>();
        assert_eq!(frontiers_of(""), vec![0]);
        assert_eq!(frontiers_of("abcd"), vec![0, 1, 2, 3, 4]);
        assert_eq!(frontiers_of("aあ"), vec![0, 1, 4]);
    }

    #[test]
    fn test_ngram_tokenizer_1_2_false() {
        let mut tokenizer = NgramTokenizer::all_ngrams(1, 2).unwrap();
        let tokens = test_helper(tokenizer.token_stream("hello"));
        assert_ngrams(
            &tokens,
            &[
                ("h", 0, 1),
                ("he", 0, 2),
                ("e", 1, 2),
                ("el", 1, 3),
                ("l", 2, 3),
                ("ll", 2, 4),
                ("l", 3, 4),
                ("lo", 3, 5),
                ("o", 4, 5),
            ],
        );
    }

    #[test]
    fn test_ngram_tokenizer_min_max_equal() {
        let mut tokenizer = NgramTokenizer::all_ngrams(3, 3).unwrap();
        let tokens = test_helper(tokenizer.token_stream("hello"));
        assert_ngrams(&tokens, &[("hel", 0, 3), ("ell", 1, 4), ("llo", 2, 5)]);
    }

    #[test]
    fn test_ngram_tokenizer_2_5_prefix() {
        let mut tokenizer = NgramTokenizer::prefix_only(2, 5).unwrap();
        let tokens = test_helper(tokenizer.token_stream("frankenstein"));
        assert_ngrams(
            &tokens,
            &[
                ("fr", 0, 2),
                ("fra", 0, 3),
                ("fran", 0, 4),
                ("frank", 0, 5),
            ],
        );
    }

    #[test]
    fn test_ngram_non_ascii_1_2() {
        let mut tokenizer = NgramTokenizer::all_ngrams(1, 2).unwrap();
        let tokens = test_helper(tokenizer.token_stream("hεllo"));
        assert_ngrams(
            &tokens,
            &[
                ("h", 0, 1),
                ("hε", 0, 3),
                ("ε", 1, 3),
                ("εl", 1, 4),
                ("l", 3, 4),
                ("ll", 3, 5),
                ("l", 4, 5),
                ("lo", 4, 6),
                ("o", 5, 6),
            ],
        );
    }

    #[test]
    fn test_ngram_non_ascii_2_5_prefix() {
        let mut tokenizer = NgramTokenizer::prefix_only(2, 5).unwrap();
        let tokens = test_helper(tokenizer.token_stream("hεllo"));
        assert_ngrams(
            &tokens,
            &[
                ("hε", 0, 3),
                ("hεl", 0, 4),
                ("hεll", 0, 5),
                ("hεllo", 0, 6),
            ],
        );
    }

    #[test]
    fn test_ngram_empty() {
        for min_gram in [1, 2] {
            let mut tokenizer = NgramTokenizer::all_ngrams(min_gram, 5).unwrap();
            let tokens = test_helper(tokenizer.token_stream(""));
            assert!(tokens.is_empty());
        }
    }

    #[test]
    #[should_panic(expected = "min_gram must be greater than 0")]
    fn test_ngram_min_max_interval_empty() {
        // The `unwrap` is what panics: `min_gram == 0` is rejected at construction.
        let mut tokenizer = NgramTokenizer::all_ngrams(0, 2).unwrap();
        test_helper(tokenizer.token_stream("hellossss"));
    }

    #[test]
    #[should_panic(expected = "min_gram must not be greater than max_gram")]
    fn test_invalid_interval_should_panic_if_smaller() {
        let rejected = NgramTokenizer::all_ngrams(2, 1);
        rejected.unwrap();
    }

    #[test]
    fn test_stuttering_iterator_empty() {
        // A single frontier cannot form any pair.
        let single_frontier: Vec<usize> = vec![0];
        let mut pairs = StutteringIterator::new(single_frontier.into_iter(), 1, 2);
        assert_eq!(pairs.next(), None);
    }

    #[test]
    fn test_stuterring_iterator() {
        let pairs: Vec<(usize, usize)> = StutteringIterator::new(0..10, 1, 2).collect();
        let expected: Vec<(usize, usize)> = vec![
            (0, 1),
            (0, 2),
            (1, 2),
            (1, 3),
            (2, 3),
            (2, 4),
            (3, 4),
            (3, 5),
            (4, 5),
            (4, 6),
            (5, 6),
            (5, 7),
            (6, 7),
            (6, 8),
            (7, 8),
            (7, 9),
            (8, 9),
        ];
        assert_eq!(pairs, expected);
    }
}


================================================
FILE: src/tokenizer/raw_tokenizer.rs
================================================
use super::{Token, TokenStream, Tokenizer};

/// For each value of the field, emit a single unprocessed token.
#[derive(Clone, Default)]
pub struct RawTokenizer {
    /// Token buffer lent (by mutable reference) to the streams created by
    /// `token_stream`, which fills it with the whole input text.
    token: Token,
}

/// TokenStream returned by `RawTokenizer`: it yields exactly one token.
pub struct RawTokenStream<'a> {
    /// The single token, already filled in when the stream is created.
    token: &'a mut Token,
    /// `true` until the token has been handed out by `advance`.
    has_token: bool,
}

impl Tokenizer for RawTokenizer {
    type TokenStream<'a> = RawTokenStream<'a>;

    /// Loads the whole `text` into the tokenizer's token, spanning bytes
    /// `0..text.len()` at position 0, and returns a stream yielding it once.
    fn token_stream<'a>(&'a mut self, text: &str) -> RawTokenStream<'a> {
        let token = &mut self.token;
        token.reset();
        token.position = 0;
        token.position_length = 1;
        token.offset_from = 0;
        token.offset_to = text.len();
        token.text.clear();
        token.text.push_str(text);
        RawTokenStream {
            token,
            has_token: true,
        }
    }
}

impl TokenStream for RawTokenStream<'_> {
    /// Returns `true` on the first call only.
    fn advance(&mut self) -> bool {
        // Hand out the flag and clear it in one go.
        std::mem::replace(&mut self.has_token, false)
    }

    fn token(&self) -> &Token {
        self.token
    }

    fn token_mut(&mut self) -> &mut Token {
        self.token
    }
}

#[cfg(test)]
mod tests {
    use crate::tokenizer::tests::assert_token;
    use crate::tokenizer::{RawTokenizer, TextAnalyzer, Token};

    /// Tokenizes `text` with a `RawTokenizer` and collects the emitted tokens.
    fn token_stream_helper(text: &str) -> Vec<Token> {
        let mut analyzer = TextAnalyzer::from(RawTokenizer::default());
        let mut collected: Vec<Token> = Vec::new();
        analyzer
            .token_stream(text)
            .process(&mut |token: &Token| collected.push(token.clone()));
        collected
    }

    #[test]
    fn test_raw_tokenizer() {
        let input = "Hello, happy tax payer!";
        let tokens = token_stream_helper(input);
        // The whole input comes back as a single token.
        assert_eq!(tokens.len(), 1);
        assert_token(&tokens[0], 0, "Hello, happy tax payer!", 0, 23);
    }
}


================================================
FILE: src/tokenizer/regex_tokenizer.rs
================================================
use regex::Regex;

use super::{Token, TokenStream, Tokenizer};
use crate::TantivyError;

/// Tokenize the text by using a regex pattern to split.
///
/// Each match of the regex emits a distinct token, empty tokens will not be emitted. Anchors such
/// as `\A` will match the text from the part where the last token was emitted or the beginning of
/// the complete text if no token was emitted yet.
///
/// Example: `` 'aaa' bbb 'ccc' 'ddd' `` with the pattern `` '(?:\w*)' `` will be tokenized as
/// follows (the quotes are part of the match, hence part of the term):
///
/// | Term     | 'aaa' | 'ccc'  | 'ddd' |
/// |----------|-------|--------|-------|
/// | Position | 0     | 1      | 2     |
/// | Offsets  | 0,5   | 10,15  | 16,21 |
///
///
/// # Example
///
/// ```rust
/// use tantivy::tokenizer::*;
///
/// let mut tokenizer = RegexTokenizer::new(r"'(?:\w*)'").unwrap();
/// let mut stream = tokenizer.token_stream("'aaa' bbb 'ccc' 'ddd'");
/// {
///     let token = stream.next().unwrap();
///     assert_eq!(token.text, "'aaa'");
///     assert_eq!(token.offset_from, 0);
///     assert_eq!(token.offset_to, 5);
/// }
/// {
///   let token = stream.next().unwrap();
///     assert_eq!(token.text, "'ccc'");
///     assert_eq!(token.offset_from, 10);
///     assert_eq!(token.offset_to, 15);
/// }
/// {
///   let token = stream.next().unwrap();
///     assert_eq!(token.text, "'ddd'");
///     assert_eq!(token.offset_from, 16);
///     assert_eq!(token.offset_to, 21);
/// }
/// assert!(stream.next().is_none());
/// ```
#[derive(Clone)]
pub struct RegexTokenizer {
    /// Compiled pattern; each non-empty match of it is emitted as a token.
    regex: Regex,
    /// Token buffer lent (by mutable reference) to the streams created by
    /// `token_stream`.
    token: Token,
}

impl RegexTokenizer {
    /// Creates a new RegexTokenizer.
    pub fn new(regex_pattern: &str) -> crate::Result<RegexTokenizer> {
        Regex::new(regex_pattern)
            .map_err(|_| TantivyError::InvalidArgument(regex_pattern.to_owned()))
            .map(|regex| Self {
                regex,
                token: Token::default(),
            })
    }
}

impl Tokenizer for RegexTokenizer {
    type TokenStream<'a> = RegexTokenStream<'a>;

    /// Resets the tokenizer's token and returns a stream over the matches of
    /// the pattern in `text`. The stream works on its own clone of the regex.
    fn token_stream<'a>(&'a mut self, text: &'a str) -> RegexTokenStream<'a> {
        let regex = self.regex.clone();
        self.token.reset();
        RegexTokenStream {
            regex,
            text,
            token: &mut self.token,
            cursor: 0,
        }
    }
}

/// TokenStream returned by `RegexTokenizer`.
pub struct RegexTokenStream<'a> {
    /// Pattern searched for in `text`.
    regex: Regex,
    /// Part of the input that has not been consumed yet; it is re-sliced
    /// past each match.
    text: &'a str,
    /// Output token, overwritten on every successful `advance`.
    token: &'a mut Token,
    /// Number of bytes of the original input consumed so far; it is used to
    /// turn match offsets (relative to `text`) into offsets in the full input.
    cursor: usize,
}

impl TokenStream for RegexTokenStream<'_> {
    /// Looks for the next match in the unconsumed text and stores it in the token.
    ///
    /// Returns `false` when there is no further match, or when the next
    /// match is empty.
    fn advance(&mut self) -> bool {
        // Match bounds, relative to the unconsumed text.
        let (match_start, match_end) = match self.regex.find(self.text) {
            Some(found) if !found.as_str().is_empty() => (found.start(), found.end()),
            _ => return false,
        };
        let token = &mut *self.token;
        token.text.clear();
        token.text.push_str(&self.text[match_start..match_end]);

        // Offsets are reported relative to the full input.
        token.offset_from = self.cursor + match_start;
        self.cursor += match_end;
        token.offset_to = self.cursor;

        token.position = token.position.wrapping_add(1);

        // Resume the search right after this match.
        self.text = &self.text[match_end..];
        true
    }

    fn token(&self) -> &Token {
        self.token
    }

    fn token_mut(&mut self) -> &mut Token {
        self.token
    }
}

#[cfg(test)]
mod tests {
    use crate::tokenizer::regex_tokenizer::RegexTokenizer;
    use crate::tokenizer::tests::assert_token;
    use crate::tokenizer::{TextAnalyzer, Token};

    /// Tokenizes `text` with a `RegexTokenizer` built from `pattern` and
    /// collects the emitted tokens.
    fn token_stream_helper(text: &str, pattern: &str) -> Vec<Token> {
        let tokenizer = RegexTokenizer::new(pattern).unwrap();
        let mut analyzer = TextAnalyzer::from(tokenizer);
        let mut collected: Vec<Token> = Vec::new();
        analyzer
            .token_stream(text)
            .process(&mut |token: &Token| collected.push(token.clone()));
        collected
    }

    #[test]
    fn test_regex_tokenizer() {
        let tokens = token_stream_helper("'aaa' bbb 'ccc' 'ddd'", r"'(?:\w*)'");
        // (text, offset_from, offset_to); the position is the index in the list.
        let expected = [("'aaa'", 0, 5), ("'ccc'", 10, 15), ("'ddd'", 16, 21)];
        assert_eq!(tokens.len(), 3);
        for (position, &(text, from, to)) in expected.iter().enumerate() {
            assert_token(&tokens[position], position, text, from, to);
        }
    }

    #[test]
    fn test_regexp_tokenizer_no_match_on_input_data() {
        let tokens = token_stream_helper("aaa", r"'(?:\w*)'");
        assert!(tokens.is_empty());
    }

    #[test]
    fn test_regexp_tokenizer_no_input_data() {
        let tokens = token_stream_helper("", r"'(?:\w*)'");
        assert!(tokens.is_empty());
    }

    #[test]
    fn test_regexp_tokenizer_error_on_invalid_regex() {
        let outcome = RegexTokenizer::new(r"\@(");
        assert!(outcome.is_err());
        let message = outcome.err().unwrap().to_string();
        assert_eq!(message, "An invalid argument was passed: '\\@('");
    }
}


================================================
FILE: src/tokenizer/remove_long.rs
================================================
//! # Example
//! ```rust
//! use tantivy::tokenizer::*;
//!
//! let mut tokenizer = TextAnalyzer::builder(SimpleTokenizer::default())
//!   .filter(RemoveLongFilter::limit(5))
//!   .build();
//!
//! let mut stream = tokenizer.token_stream("toolong nice");
//! // because `toolong` is more than 5 characters, it is filtered
//! // out of the token stream.
//! assert_eq!(stream.next().unwrap().text, "nice");
//! assert!(stream.next().is_none());
//! ```
use super::{Token, TokenFilter, TokenStream, Tokenizer};

/// `RemoveLongFilter` drops tokens that are too long, the length being
/// measured in bytes of the UTF-8 representation.
///
/// A token is kept only if its length is strictly below the limit.
///
/// It is especially useful when indexing unconstrained content.
/// e.g. Mail containing base-64 encoded pictures etc.
#[derive(Clone)]
pub struct RemoveLongFilter {
    /// Length (in bytes) from which a token is dropped.
    length_limit: usize,
}

impl RemoveLongFilter {
    /// Creates a `RemoveLongFilter` given a limit in bytes of the UTF-8 representation.
    pub fn limit(length_limit: usize) -> RemoveLongFilter {
        Self { length_limit }
    }
}

impl<T> RemoveLongFilterStream<T> {
    /// Returns `true` if `token` must be kept, i.e. if the byte length of
    /// its text is strictly below the limit.
    fn predicate(&self, token: &Token) -> bool {
        let byte_len = token.text.len();
        byte_len < self.token_length_limit
    }
}

impl TokenFilter for RemoveLongFilter {
    type Tokenizer<T: Tokenizer> = RemoveLongFilterWrapper<T>;

    fn transform<T: Tokenizer>(self, tokenizer: T) -> RemoveLongFilterWrapper<T> {
        RemoveLongFilterWrapper {
            length_limit: self.length_limit,
            inner: tokenizer,
        }
    }
}

/// Tokenizer produced by `RemoveLongFilter::transform`: it pairs the wrapped
/// tokenizer with the byte-length limit of the filter.
#[derive(Clone)]
pub struct RemoveLongFilterWrapper<T: Tokenizer> {
    /// Byte-length limit handed over to every stream created by this wrapper.
    length_limit: usize,
    /// The wrapped tokenizer whose tokens get filtered.
    inner: T,
}

impl<T: Tokenizer> Tokenizer for RemoveLongFilterWrapper<T> {
    type TokenStream<'a> = RemoveLongFilterStream<T::TokenStream<'a>>;

    /// Creates the inner token stream for `text` and wraps it in a
    /// `RemoveLongFilterStream` carrying this wrapper's length limit.
    fn token_stream<'a>(&'a mut self, text: &'a str) -> Self::TokenStream<'a> {
        let tail = self.inner.token_stream(text);
        RemoveLongFilterStream {
            token_length_limit: self.length_limit,
            tail,
        }
    }
}

/// Token stream that forwards the tokens of `tail` whose text is strictly
/// shorter than `token_length_limit` bytes and skips all the others.
pub struct RemoveLongFilterStream<T> {
    /// Tokens whose text is this many bytes or longer are skipped.
    token_length_limit: usize,
    /// The underlying token stream being filtered.
    tail: T,
}

impl<T: TokenStream> TokenStream for RemoveLongFilterStream<T> {
    /// Advances the underlying stream until it yields a token accepted by
    /// `predicate`. Returns `false` once the underlying stream is exhausted.
    fn advance(&mut self) -> bool {
        loop {
            if !self.tail.advance() {
                return false;
            }
            if self.predicate(self.tail.token()) {
                return true;
            }
        }
    }

    /// Current token of the underlying stream.
    fn token(&self) -> &Token {
        self.tail.token()
    }

    /// Mutable access to the current token of the underlying stream.
    fn token_mut(&mut self) -> &mut Token {
        self.tail.token_mut()
    }
}

#[cfg(test)]
mod tests {
    use crate::tokenizer::tests::assert_token;
    use crate::tokenizer::{RemoveLongFilter, SimpleTokenizer, TextAnalyzer, Token};

    /// Runs `text` through a `SimpleTokenizer` followed by
    /// `RemoveLongFilter::limit(6)` and collects the surviving tokens.
    fn token_stream_helper(text: &str) -> Vec<Token> {
        let mut analyzer = TextAnalyzer::builder(SimpleTokenizer::default())
            .filter(RemoveLongFilter::limit(6))
            .build();
        let mut kept: Vec<Token> = Vec::new();
        analyzer
            .token_stream(text)
            .process(&mut |token: &Token| kept.push(token.clone()));
        kept
    }

    /// "tantivy" (7 bytes) and "searching" (9 bytes) are dropped, while the
    /// remaining tokens keep their original positions and offsets.
    #[test]
    fn test_remove_long() {
        let tokens = token_stream_helper("hello tantivy, happy searching!");
        assert_eq!(tokens.len(), 2);
        assert_token(&tokens[0], 0, "hello", 0, 5);
        assert_token(&tokens[1], 2, "happy", 15, 20);
    }
}


================================================
FILE: src/tokenizer/simple_tokenizer.rs
================================================
use std::str::CharIndices;

use super::{Token, TokenStream, Tokenizer};

/// Tokenize the text by splitting on whitespaces and punctuation.
///
/// More precisely, a token is a maximal run of alphanumeric characters;
/// every non-alphanumeric character acts as a separator.
#[derive(Clone, Default)]
pub struct SimpleTokenizer {
    /// Token buffer lent to the streams; it is reset at the start of every
    /// `token_stream` call.
    token: Token,
}

/// TokenStream produced by the `SimpleTokenizer`.
pub struct SimpleTokenStream<'a> {
    /// The text being tokenized.
    text: &'a str,
    /// Iterator over the not yet consumed `(byte offset, char)` pairs of `text`.
    chars: CharIndices<'a>,
    /// Token borrowed from the tokenizer and overwritten on every `advance`.
    token: &'a mut Token,
}

impl Tokenizer for SimpleTokenizer {
    type TokenStream<'a> = SimpleTokenStream<'a>;

    /// Resets the shared token and returns a stream over `text` that writes
    /// its tokens into it.
    fn token_stream<'a>(&'a mut self, text: &'a str) -> SimpleTokenStream<'a> {
        let token = &mut self.token;
        token.reset();
        SimpleTokenStream {
            text,
            chars: text.char_indices(),
            token,
        }
    }
}

impl SimpleTokenStream<'_> {
    // Consumes characters up to and including the first non-alphanumeric one
    // and returns its byte offset, which is the end of the current token.
    // Returns the length of the text if the end of the input is reached first.
    fn search_token_end(&mut self) -> usize {
        for (offset, c) in &mut self.chars {
            if !c.is_alphanumeric() {
                return offset;
            }
        }
        self.text.len()
    }
}

impl TokenStream for SimpleTokenStream<'_> {
    /// Moves to the next run of alphanumeric characters, if any, and stores
    /// its text, byte offsets and position in the shared token.
    fn advance(&mut self) -> bool {
        self.token.text.clear();
        self.token.position = self.token.position.wrapping_add(1);

        // Skip separators until an alphanumeric character starts a new token.
        let token_start = loop {
            match self.chars.next() {
                Some((offset, c)) if c.is_alphanumeric() => break offset,
                Some(_) => continue,
                None => return false,
            }
        };
        let token_end = self.search_token_end();

        self.token.offset_from = token_start;
        self.token.offset_to = token_end;
        self.token.text.push_str(&self.text[token_start..token_end]);
        true
    }

    /// The token filled in by the last call to `advance`.
    fn token(&self) -> &Token {
        &*self.token
    }

    /// Mutable access to the token filled in by the last call to `advance`.
    fn token_mut(&mut self) -> &mut Token {
        &mut *self.token
    }
}

#[cfg(test)]
mod tests {
    use crate::tokenizer::tests::assert_token;
    use crate::tokenizer::{SimpleTokenizer, TextAnalyzer, Token};

    /// Tokenizes `text` with a bare `SimpleTokenizer` and collects the tokens.
    fn token_stream_helper(text: &str) -> Vec<Token> {
        let mut analyzer = TextAnalyzer::from(SimpleTokenizer::default());
        let mut collected: Vec<Token> = Vec::new();
        analyzer
            .token_stream(text)
            .process(&mut |token: &Token| collected.push(token.clone()));
        collected
    }

    /// Punctuation and whitespace separate tokens and never show up in them.
    #[test]
    fn test_simple_tokenizer() {
        let tokens = token_stream_helper("Hello, happy tax payer!");
        assert_eq!(tokens.len(), 4);
        assert_token(&tokens[0], 0, "Hello", 0, 5);
        assert_token(&tokens[1], 1, "happy", 7, 12);
        assert_token(&tokens[2], 2, "tax", 13, 16);
        assert_token(&tokens[3], 3, "payer", 17, 22);
    }
}


================================================
FILE: src/tokenizer/split_compound_words.rs
================================================
use aho_corasick::{AhoCorasick, AhoCorasickBuilder, MatchKind};

use super::{Token, TokenFilter, TokenStream, Tokenizer};

/// A [`TokenFilter`] which splits compound words into their parts
/// based on a given dictionary.
///
/// Words will only be split if they can be fully decomposed into
/// consecutive matches against the given dictionary. Each part only gets
/// its own text: all other token fields (e.g. offsets and position) are
/// copied from the token that was split.
///
/// This is mostly useful to split [compound nouns][compound] common to many
/// Germanic languages into their constituents.
///
/// # Example
///
/// The quality of the dictionary determines the quality of the splits,
/// e.g. the missing stem "back" of "backen" implies that "brotbackautomat"
/// is not split in the following example.
///
/// ```rust
/// use tantivy::tokenizer::{SimpleTokenizer, SplitCompoundWords, TextAnalyzer};
///
/// let mut tokenizer =
///        TextAnalyzer::builder(SimpleTokenizer::default())
///        .filter(
///            SplitCompoundWords::from_dictionary([
///                 "dampf", "schiff", "fahrt", "brot", "backen", "automat",
///            ])
///            .unwrap()
///        )
///        .build();
/// {
///     let mut stream = tokenizer.token_stream("dampfschifffahrt");
///     assert_eq!(stream.next().unwrap().text, "dampf");
///     assert_eq!(stream.next().unwrap().text, "schiff");
///     assert_eq!(stream.next().unwrap().text, "fahrt");
///     assert_eq!(stream.next(), None);
/// }
/// let mut stream = tokenizer.token_stream("brotbackautomat");
/// assert_eq!(stream.next().unwrap().text, "brotbackautomat");
/// assert_eq!(stream.next(), None);
/// ```
///
/// [compound]: https://en.wikipedia.org/wiki/Compound_(linguistics)
#[derive(Clone)]
pub struct SplitCompoundWords {
    /// Automaton matching the dictionary words.
    dict: AhoCorasick,
}

impl SplitCompoundWords {
    /// Builds a filter from the words of `dict`.
    ///
    /// An [`AhoCorasick`] automaton using leftmost-longest matching is built
    /// from the dictionary. Use [`from_automaton`][Self::from_automaton] when
    /// more control over the construction of the automaton is needed.
    ///
    /// # Errors
    ///
    /// Returns `TantivyError::InvalidArgument` if the automaton cannot be built.
    pub fn from_dictionary<I, P>(dict: I) -> crate::Result<Self>
    where
        I: IntoIterator<Item = P>,
        P: AsRef<[u8]>,
    {
        let build_result = AhoCorasickBuilder::new()
            .match_kind(MatchKind::LeftmostLongest)
            .build(dict);

        match build_result {
            Ok(automaton) => Ok(Self::from_automaton(automaton)),
            Err(err) => Err(crate::TantivyError::InvalidArgument(format!(
                "Failed to build Aho-Corasick automaton from dictionary: {err}"
            ))),
        }
    }

    /// Builds a filter from an already constructed automaton.
    ///
    /// The automaton should use one of the leftmost match kinds
    /// (`from_dictionary` uses `MatchKind::LeftmostLongest`)
    /// and it should not be anchored.
    pub fn from_automaton(dict: AhoCorasick) -> Self {
        Self { dict }
    }
}

impl TokenFilter for SplitCompoundWords {
    type Tokenizer<T: Tokenizer> = SplitCompoundWordsFilter<T>;

    fn transform<T: Tokenizer>(self, tokenizer: T) -> SplitCompoundWordsFilter<T> {
        SplitCompoundWordsFilter {
            dict: self.dict,
            inner: tokenizer,
            cuts: Vec::new(),
            parts: Vec::new(),
        }
    }
}

/// Tokenizer produced by `SplitCompoundWords::transform`.
///
/// It owns the scratch buffers `cuts` and `parts`, which are cleared and lent
/// to every token stream it creates.
#[derive(Clone)]
pub struct SplitCompoundWordsFilter<T> {
    /// Automaton matching the dictionary words.
    dict: AhoCorasick,
    /// The wrapped tokenizer.
    inner: T,
    /// Scratch buffer holding the byte offsets at which a token is cut.
    cuts: Vec<usize>,
    /// Scratch buffer holding the parts of the token currently being yielded.
    parts: Vec<Token>,
}

impl<T: Tokenizer> Tokenizer for SplitCompoundWordsFilter<T> {
    type TokenStream<'a> = SplitCompoundWordsTokenStream<'a, T::TokenStream<'a>>;

    /// Clears the scratch buffers and returns a stream over `text` that
    /// borrows them and holds a clone of the dictionary automaton.
    fn token_stream<'a>(&'a mut self, text: &'a str) -> Self::TokenStream<'a> {
        self.parts.clear();
        self.cuts.clear();

        let dict = self.dict.clone();
        let tail = self.inner.token_stream(text);
        SplitCompoundWordsTokenStream {
            dict,
            tail,
            cuts: &mut self.cuts,
            parts: &mut self.parts,
        }
    }
}

/// Token stream yielding the parts of every token of `tail` that can be fully
/// decomposed into dictionary words, and the unmodified token otherwise.
pub struct SplitCompoundWordsTokenStream<'a, T> {
    /// Automaton matching the dictionary words.
    dict: AhoCorasick,
    /// The underlying token stream.
    tail: T,
    /// Byte offsets at which the current token of `tail` is cut.
    cuts: &'a mut Vec<usize>,
    /// Parts of the current token still to be yielded, stored in reverse
    /// order so that the last element is the current one.
    parts: &'a mut Vec<Token>,
}

impl<T: TokenStream> SplitCompoundWordsTokenStream<'_, T> {
    // Fills `self.parts` (using `self.cuts` as scratch space) if the text of
    // `self.tail.token()` is entirely covered by consecutive matches against
    // `self.dict`. Leaves `self.parts` untouched otherwise.
    fn split(&mut self) {
        let token = self.tail.token();
        let full_text = token.text.as_str();

        // Record the start of every match for as long as the matches are
        // contiguous, i.e. each one starts where the previous one ended.
        self.cuts.clear();
        let mut covered = 0;
        for found in self.dict.find_iter(full_text) {
            if found.start() != covered {
                break;
            }
            self.cuts.push(covered);
            covered = found.end();
        }

        // A gap or an unmatched remainder means the token is not split.
        if covered != full_text.len() {
            return;
        }

        // Peel the parts off from the end of the text: `self.parts` is filled
        // in reverse order so that `self.parts.pop()` yields the parts in
        // their original order.
        let mut remaining = full_text;
        for &cut in self.cuts.iter().rev() {
            let (prefix, suffix) = remaining.split_at(cut);
            remaining = prefix;
            self.parts.push(Token {
                text: suffix.to_owned(),
                ..*token
            });
        }
    }
}

impl<T: TokenStream> TokenStream for SplitCompoundWordsTokenStream<'_, T> {
    /// Moves to the next part of the current token, or to the next token of
    /// the underlying stream once all parts have been yielded.
    fn advance(&mut self) -> bool {
        // Discard the part yielded by the previous call, if there was one.
        self.parts.pop();

        if self.parts.is_empty() {
            if !self.tail.advance() {
                return false;
            }
            // From now on either `self.parts.last()` is yielded, or
            // `self.tail.token()` if the new token could not be split.
            self.split();
        }
        true
    }

    /// The current part if the current token was split, the token of the
    /// underlying stream otherwise.
    fn token(&self) -> &Token {
        match self.parts.last() {
            Some(part) => part,
            None => self.tail.token(),
        }
    }

    /// Mutable counterpart of `token`.
    fn token_mut(&mut self) -> &mut Token {
        match self.parts.last_mut() {
            Some(part) => part,
            None => self.tail.token_mut(),
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::tokenizer::{SimpleTokenizer, TextAnalyzer};

    /// Asserts that tokenizing `text` yields exactly the token texts listed
    /// in `expected`, in that order, and then ends.
    fn assert_token_texts(tokenizer: &mut TextAnalyzer, text: &str, expected: &[&str]) {
        let mut stream = tokenizer.token_stream(text);
        for &expected_text in expected {
            assert_eq!(stream.next().unwrap().text, expected_text);
        }
        assert_eq!(stream.next(), None);
    }

    #[test]
    fn splitting_compound_words_works() {
        let mut tokenizer = TextAnalyzer::builder(SimpleTokenizer::default())
            .filter(SplitCompoundWords::from_dictionary(["foo", "bar"]).unwrap())
            .build();

        // Each case is an input text paired with the expected token texts.
        let cases: &[(&str, &[&str])] = &[
            ("", &[]),
            ("foo bar", &["foo", "bar"]),
            ("foobar", &["foo", "bar"]),
            ("foobarbaz", &["foobarbaz"]),
            ("baz foobar qux", &["baz", "foo", "bar", "qux"]),
            ("foobar foobar", &["foo", "bar", "foo", "bar"]),
            (
                "foobar foo bar foobar",
                &["foo", "bar", "foo", "bar", "foo", "bar"],
            ),
            (
                "foobazbar foo bar foobar",
                &["foobazbar", "foo", "bar", "foo", "bar"],
            ),
            ("foobar qux foobar", &["foo", "bar", "qux", "foo", "bar"]),
            ("barfoo", &["bar", "foo"]),
        ];

        for &(text, expected) in cases {
            assert_token_texts(&mut tokenizer, text, expected);
        }
    }
}


================================================
FILE: src/tokenizer/stemmer.rs
================================================
use std::borrow::Cow;
use std::mem;

use rust_stemmers::Algorithm;
use serde::{Deserialize, Serialize};

use super::{Token, TokenFilter, TokenStream, Tokenizer};

/// Available stemmer languages.
///
/// Every variant maps to the `rust_stemmers` algorithm of the same name.
#[derive(Debug, Serialize, Deserialize, Eq, PartialEq, Copy, Clone, Hash)]
#[allow(missing_docs)]
pub enum Language {
    Arabic,
    Danish,
    Dutch,
    English,
    Finnish,
    French,
    German,
    Greek,
    Hungarian,
    Italian,
    Norwegian,
    Portuguese,
    Romanian,
    Russian,
    Spanish,
    Swedish,
    Tamil,
    Turkish,
}

impl Language {
    fn algorithm(self) -> Algorithm {
        use self::Language::*;
        match self {
            Arabic => Algorithm::Arabic,
            Danish => Algorithm::Danish,
            Dutch => Algorithm::Dutch,
            English => Algorithm::English,
            Finnish => Algorithm::Finnish,
            French => Algorithm::French,
            German => Algorithm::German,
            Greek => Algorithm::Greek,
            Hungarian => Algorithm::Hungarian,
            Italian => Algorithm::Italian,
            Norwegian => Algorithm::Norwegian,
            Portuguese => Algorithm::Portuguese,
            Romanian => Algorithm::Romanian,
            Russian => Algorithm::Russian,
            Spanish => Algorithm::Spanish,
            Swedish => Algorithm::Swedish,
            Tamil => Algorithm::Tamil,
            Turkish => Algorithm::Turkish,
        }
    }
}

/// `Stemmer` token filter. Several languages are supported, see [`Language`] for the available
/// languages.
/// Tokens are expected to be lowercased beforehand.
#[derive(Clone)]
pub struct Stemmer {
    /// Stemming algorithm selected from the [`Language`] given at construction.
    stemmer_algorithm: Algorithm,
}

impl Stemmer {
    /// Creates a new `Stemmer` [`TokenFilter`] for a given language algorithm.
    pub fn new(language: Language) -> Stemmer {
        Stemmer {
            stemmer_algorithm: language.algorithm(),
        }
    }
}

impl Default for Stemmer {
    /// The default `Stemmer` [`TokenFilter`] stems [`Language::English`].
    fn default() -> Self {
        Self::new(Language::English)
    }
}

impl TokenFilter for Stemmer {
    type Tokenizer<T: Tokenizer> = StemmerFilter<T>;

    fn transform<T: Tokenizer>(self, tokenizer: T) -> StemmerFilter<T> {
        StemmerFilter {
            stemmer_algorithm: self.stemmer_algorithm,
            inner: tokenizer,
        }
    }
}

/// Tokenizer produced by `Stemmer::transform`: the wrapped tokenizer plus the
/// stemming algorithm applied to its tokens.
#[derive(Clone)]
pub struct StemmerFilter<T> {
    /// Algorithm used to create the stemmer of every token stream.
    stemmer_algorithm: Algorithm,
    /// The wrapped tokenizer.
    inner: T,
}

impl<T: Tokenizer> Tokenizer for StemmerFilter<T> {
    type TokenStream<'a> = StemmerTokenStream<T::TokenStream<'a>>;

    /// Creates a fresh stemmer for the configured algorithm and wraps the
    /// inner token stream over `text` with it.
    fn token_stream<'a>(&'a mut self, text: &'a str) -> Self::TokenStream<'a> {
        StemmerTokenStream {
            stemmer: rust_stemmers::Stemmer::create(self.stemmer_algorithm),
            tail: self.inner.token_stream(text),
            buffer: String::new(),
        }
    }
}

/// Token stream replacing the text of every token of `tail` by its stem.
pub struct StemmerTokenStream<T> {
    /// The underlying token stream.
    tail: T,
    /// Stemmer applied to the text of every token.
    stemmer: rust_stemmers::Stemmer,
    /// Scratch string swapped with the token text when the stemmer returns a
    /// borrowed result.
    buffer: String,
}

impl<T: TokenStream> TokenStream for StemmerTokenStream<T> {
    /// Advances the underlying stream and replaces the text of the new token
    /// by its stem. Returns `false` once the underlying stream is exhausted.
    fn advance(&mut self) -> bool {
        let advanced = self.tail.advance();
        if advanced {
            let token = self.tail.token_mut();
            let stem = self.stemmer.stem(&token.text);
            match stem {
                Cow::Borrowed(borrowed_stem) => {
                    // The stem borrows from the token text, so it is copied
                    // into the scratch buffer, which then trades places with
                    // the token text.
                    self.buffer.clear();
                    self.buffer.push_str(borrowed_stem);
                    mem::swap(&mut token.text, &mut self.buffer);
                }
                Cow::Owned(owned_stem) => token.text = owned_stem,
            }
        }
        advanced
    }

    /// Current (stemmed) token.
    fn token(&self) -> &Token {
        self.tail.token()
    }

    /// Mutable access to the current (stemmed) token.
    fn token_mut(&mut self) -> &mut Token {
        self.tail.token_mut()
    }
}

#[cfg(test)]
mod tests {
    use tokenizer_api::Token;

    use super::*;
    use crate::tokenizer::tests::assert_token;
    use crate::tokenizer::{LowerCaser, SimpleTokenizer, TextAnalyzer, TokenizerManager};

    /// Tokenizes `text` with `analyzer` and returns a clone of every token.
    fn collect_tokens(analyzer: &mut TextAnalyzer, text: &str) -> Vec<Token> {
        let mut tokens: Vec<Token> = Vec::new();
        analyzer
            .token_stream(text)
            .process(&mut |token: &Token| tokens.push(token.clone()));
        tokens
    }

    /// The built-in "en_stem" tokenizer lowercases and stems English text.
    #[test]
    fn test_en_stem() {
        let tokenizer_manager = TokenizerManager::default();
        let mut en_tokenizer = tokenizer_manager.get("en_stem").unwrap();
        let tokens = collect_tokens(&mut en_tokenizer, "Dogs are the bests!");

        assert_eq!(tokens.len(), 4);
        assert_token(&tokens[0], 0, "dog", 0, 4);
        assert_token(&tokens[1], 1, "are", 5, 8);
        assert_token(&tokens[2], 2, "the", 9, 12);
        assert_token(&tokens[3], 3, "best", 13, 18);
    }

    /// A custom analyzer stemming Greek; the offsets are byte offsets.
    #[test]
    fn test_non_en_stem() {
        let tokenizer_manager = TokenizerManager::default();
        let el_analyzer = TextAnalyzer::builder(SimpleTokenizer::default())
            .filter(LowerCaser)
            .filter(Stemmer::new(Language::Greek))
            .build();
        tokenizer_manager.register("el_stem", el_analyzer);

        let mut el_tokenizer = tokenizer_manager.get("el_stem").unwrap();
        let tokens = collect_tokens(&mut el_tokenizer, "Καλημέρα, χαρούμενε φορολογούμενε!");

        assert_eq!(tokens.len(), 3);
        assert_token(&tokens[0], 0, "καλημερ", 0, 16);
        assert_token(&tokens[1], 1, "χαρουμεν", 18, 36);
        assert_token(&tokens[2], 2, "φορολογουμεν", 37, 63);
    }
}


================================================
FILE: src/tokenizer/stop_word_filter/gen_stopwords.py
================================================
import requests

# Languages for which a Snowball stop word list is downloaded. Each entry is
# used in the download URL and, upper-cased, as the name of the generated
# Rust constant.
LANGUAGES = [
    "danish",
    "dutch",
    "finnish",
    "french",
    "german",
    "hungarian",
    "italian",
    "norwegian",
    "portuguese",
    "russian",
    "spanish",
    "swedish",
]

# Generate `stopwords.rs` in the current working directory.
#
# The file is opened explicitly as UTF-8: Rust source files must be UTF-8 and
# the lists contain non-ASCII words, whereas `open()` would otherwise fall back
# to a locale-dependent encoding.
with requests.Session() as sess, open("stopwords.rs", "w", encoding="utf-8") as mod:
    # Start with a block comment holding the attribution and the license text.
    mod.write("/*\n")
    mod.write(
        "These stop word lists are from the Snowball project (https://snowballstem.org/)\nwhich carries the following copyright and license:\n\n"
    )

    resp = sess.get(
        "https://raw.githubusercontent.com/snowballstem/snowball/master/COPYING"
    )
    resp.raise_for_status()
    mod.write(resp.text)
    mod.write("*/\n\n")

    # Emit one `pub const <LANG>: &[&str]` per language.
    for lang in LANGUAGES:
        resp = sess.get(f"https://snowballstem.org/algorithms/{lang}/stop.txt")
        resp.raise_for_status()

        mod.write(f"pub const {lang.upper()}: &[&str] = &[\n")

        for line in resp.text.splitlines():
            # Everything after a `|` is dropped; the rest of the line is
            # split on whitespace into words.
            line, _, _ = line.partition("|")

            for word in line.split():
                mod.write(f'    "{word}",\n')

        mod.write("];\n\n")


================================================
FILE: src/tokenizer/stop_word_filter/mod.rs
================================================
//! # Example
//! ```rust
//! use tantivy::tokenizer::*;
//!
//! let mut tokenizer = TextAnalyzer::builder(SimpleTokenizer::default())
//!   .filter(StopWordFilter::remove(vec!["the".to_string(), "is".to_string()]))
//!   .build();
//!
//! let mut stream = tokenizer.token_stream("the fox is crafty");
//! assert_eq!(stream.next().unwrap().text, "fox");
//! assert_eq!(stream.next().unwrap().text, "crafty");
//! assert!(stream.next().is_none());
//! ```
#[cfg(feature = "stopwords")]
#[rustfmt::skip]
mod stopwords;

use std::sync::Arc;

use rustc_hash::FxHashSet;

#[cfg(feature = "stopwords")]
use super::Language;
use super::{Token, TokenFilter, TokenStream, Tokenizer};

/// `TokenFilter` that removes stop words from a token stream
///
/// A token is removed when its text is exactly equal to one of the stop words.
#[derive(Clone)]
pub struct StopWordFilter {
    /// The stop words, shared with the tokenizers and streams built from this filter.
    words: Arc<FxHashSet<String>>,
}

impl StopWordFilter {
    /// Creates a new [`StopWordFilter`] for the given [`Language`]
    ///
    /// Returns `Some` if a list of stop words is available and `None` otherwise.
    #[cfg(feature = "stopwords")]
    pub fn new(language: Language) -> Option<Self> {
        let words = match language {
            Language::Danish => stopwords::DANISH,
            Language::Dutch => stopwords::DUTCH,
            Language::English => {
                // This is the same list of words used by the Apache-licensed Lucene project,
                // c.f. https://github.com/apache/lucene/blob/d5d6dc079395c47cd6d12dcce3bcfdd2c7d9dc63/lucene/analysis/common/src/java/org/apache/lucene/analysis/en/EnglishAnalyzer.java#L46
                &[
                    "a", "an", "and", "are", "as", "at", "be", "but", "by", "for", "if", "in",
                    "into", "is", "it", "no", "not", "of", "on", "or", "such", "that", "the",
                    "their", "then", "there", "these", "they", "this", "to", "was", "will", "with",
                ]
            }
            Language::Finnish => stopwords::FINNISH,
            Language::French => stopwords::FRENCH,
            Language::German => stopwords::GERMAN,
            Language::Hungarian => stopwords::HUNGARIAN,
            Language::Italian => stopwords::ITALIAN,
            Language::Norwegian => stopwords::NORWEGIAN,
            Language::Portuguese => stopwords::PORTUGUESE,
            Language::Russian => stopwords::RUSSIAN,
            Language::Spanish => stopwords::SPANISH,
            Language::Swedish => stopwords::SWEDISH,
            _ => return None,
        };

        Some(Self::remove(words.iter().map(|&word| word.to_owned())))
    }

    /// Creates a `StopWordFilter` given a list of words to remove
    pub fn remove<W: IntoIterator<Item = String>>(words: W) -> StopWordFilter {
        StopWordFilter {
            words: Arc::new(words.into_iter().collect()),
        }
    }
}

impl TokenFilter for StopWordFilter {
    type Tokenizer<T: Tokenizer> = StopWordFilterWrapper<T>;

    fn transform<T: Tokenizer>(self, tokenizer: T) -> StopWordFilterWrapper<T> {
        StopWordFilterWrapper {
            words: self.words,
            inner: tokenizer,
        }
    }
}

/// Tokenizer produced by `StopWordFilter::transform`: the wrapped tokenizer
/// plus the shared set of stop words.
#[derive(Clone)]
pub struct StopWordFilterWrapper<T> {
    /// The stop words to remove.
    words: Arc<FxHashSet<String>>,
    /// The wrapped tokenizer.
    inner: T,
}

impl<T: Tokenizer> Tokenizer for StopWordFilterWrapper<T> {
    type TokenStream<'a> = StopWordFilterStream<T::TokenStream<'a>>;

    fn token_stream<'a>(&'a mut self, text: &'a str) -> Self::TokenStream<'a> {
        StopWordFilterStream {
            words: self.words.clone(),
            tail: self.inner.token_stream(text),
        }
    }
}

/// Token stream forwarding the tokens of `tail` whose text is not a stop word.
pub struct StopWordFilterStream<T> {
    /// The stop words to skip.
    words: Arc<FxHashSet<String>>,
    /// The underlying token stream being filtered.
    tail: T,
}

impl<T> StopWordFilterStream<T> {
    /// Returns `true` if `token` must be kept, i.e. if its text is not one of
    /// the stop words.
    fn predicate(&self, token: &Token) -> bool {
        let is_stop_word = self.words.contains(&token.text);
        !is_stop_word
    }
}

impl<T: TokenStream> TokenStream for StopWordFilterStream<T> {
    /// Advances the underlying stream until it yields a token that is not a
    /// stop word. Returns `false` once the underlying stream is exhausted.
    fn advance(&mut self) -> bool {
        loop {
            if !self.tail.advance() {
                return false;
            }
            if self.predicate(self.tail.token()) {
                return true;
            }
        }
    }

    /// Current token of the underlying stream.
    fn token(&self) -> &Token {
        self.tail.token()
    }

    /// Mutable access to the current token of the underlying stream.
    fn token_mut(&mut self) -> &mut Token {
        self.tail.token_mut()
    }
}

#[cfg(test)]
mod tests {
    use crate::tokenizer::tests::assert_token;
    use crate::tokenizer::{SimpleTokenizer, StopWordFilter, TextAnalyzer, Token};

    /// Tokenizes `text` with a `SimpleTokenizer` whose output is filtered by
    /// the stop words "a", "as", "am" and "i", and collects the result.
    fn token_stream_helper(text: &str) -> Vec<Token> {
        let stops: Vec<String> = ["a", "as", "am", "i"]
            .iter()
            .map(|word| word.to_string())
            .collect();
        let mut analyzer = TextAnalyzer::builder(SimpleTokenizer::default())
            .filter(StopWordFilter::remove(stops))
            .build();
        let mut kept: Vec<Token> = Vec::new();
        analyzer
            .token_stream(text)
            .process(&mut |token: &Token| kept.push(token.clone()));
        kept
    }

    /// Removed stop words leave gaps in the positions of the kept tokens.
    #[test]
    fn test_stop_word() {
        let tokens = token_stream_helper("i am a cat. as yet i have no name.");
        assert_eq!(tokens.len(), 5);
        assert_token(&tokens[0], 3, "cat", 7, 10);
        assert_token(&tokens[1], 5, "yet", 15, 18);
        assert_token(&tokens[2], 7, "have", 21, 25);
        assert_token(&tokens[3], 8, "no", 26, 28);
        assert_token(&tokens[4], 9, "name", 29, 33);
    }
}


================================================
FILE: src/tokenizer/stop_word_filter/stopwords.rs
================================================
/*
These stop word lists are from the Snowball project (https://snowballstem.org/)
which carries the following copyright and license:

Copyright (c) 2001, Dr Martin Porter
Copyright (c) 2004,2005, Richard Boulton
Copyright (c) 2013, Yoshiki Shibukawa
Copyright (c) 2006,2007,2009,2010,2011,2014-2019, Olly Betts
All rights reserved.

Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions
are met:

  1. Redistributions of source code must retain the above copyright notice,
     this list of conditions and the following disclaimer.
  2. Redistributions in binary form must reproduce the above copyright notice,
     this list of conditions and the following disclaimer in the documentation
     and/or other materials provided with the distribution.
  3. Neither the name of the Snowball project nor the names of its contributors
     may be used to endorse or promote products derived from this software
     without specific prior written permission.

THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/

/// Danish stop words from the Snowball project, used by
/// `StopWordFilter::new` for `Language::Danish`.
pub const DANISH: &[&str] = &[
    "og",
    "i",
    "jeg",
    "det",
    "at",
    "en",
    "den",
    "til",
    "er",
    "som",
    "på",
    "de",
    "med",
    "han",
    "af",
    "for",
    "ikke",
    "der",
    "var",
    "mig",
    "sig",
    "men",
    "et",
    "har",
    "om",
    "vi",
    "min",
    "havde",
    "ham",
    "hun",
    "nu",
    "over",
    "da",
    "fra",
    "du",
    "ud",
    "sin",
    "dem",
    "os",
    "op",
    "man",
    "hans",
    "hvor",
    "eller",
    "hvad",
    "skal",
    "selv",
    "her",
    "alle",
    "vil",
    "blev",
    "kunne",
    "ind",
    "når",
    "være",
    "dog",
    "noget",
    "ville",
    "jo",
    "deres",
    "efter",
    "ned",
    "skulle",
    "denne",
    "end",
    "dette",
    "mit",
    "også",
    "under",
    "have",
    "dig",
    "anden",
    "hende",
    "mine",
    "alt",
    "meget",
    "sit",
    "sine",
    "vor",
    "mod",
    "disse",
    "hvis",
    "din",
    "nogle",
    "hos",
    "blive",
    "mange",
    "ad",
    "bliver",
    "hendes",
    "været",
    "thi",
    "jer",
    "sådan",
];

/// Dutch stop words from the Snowball project, used by
/// `StopWordFilter::new` for `Language::Dutch`.
pub const DUTCH: &[&str] = &[
    "de",
    "en",
    "van",
    "ik",
    "te",
    "dat",
    "die",
    "in",
    "een",
    "hij",
    "het",
    "niet",
    "zijn",
    "is",
    "was",
    "op",
    "aan",
    "met",
    "als",
    "voor",
    "had",
    "er",
    "maar",
    "om",
    "hem",
    "dan",
    "zou",
    "of",
    "wat",
    "mijn",
    "men",
    "dit",
    "zo",
    "door",
    "over",
    "ze",
    "zich",
    "bij",
    "ook",
    "tot",
    "je",
    "mij",
    "uit",
    "der",
    "daar",
    "haar",
    "naar",
    "heb",
    "hoe",
    "heeft",
    "hebben",
    "deze",
    "u",
    "want",
    "nog",
    "zal",
    "me",
    "zij",
    "nu",
    "ge",
    "geen",
    "omdat",
    "iets",
    "worden",
    "toch",
    "al",
    "waren",
    "veel",
    "meer",
    "doen",
    "toen",
    "moet",
    "ben",
    "zonder",
    "kan",
    "hun",
    "dus",
    "alles",
    "onder",
    "ja",
    "eens",
    "hier",
    "wie",
    "werd",
    "altijd",
    "doch",
    "wordt",
    "wezen",
    "kunnen",
    "ons",
    "zelf",
    "tegen",
    "na",
    "reeds",
    "wil",
    "kon",
    "niets",
    "uw",
    "iemand",
    "geweest",
    "andere",
];

/// Finnish word list.
///
/// A static slice of lowercase Finnish words: forms of `olla`, negation verbs, personal,
/// demonstrative, interrogative and relative pronouns in their case forms, and conjunctions.
// NOTE(review): presumably the built-in Finnish stop-word list — confirm against the consumer.
// NOTE(review): the slice is not duplicate-free: "minä", "sinä", "sillä", "ketkä" and "minkä"
// each occur twice, so callers must not rely on entries being unique.
pub const FINNISH: &[&str] = &[
    "olla",
    "olen",
    "olet",
    "on",
    "olemme",
    "olette",
    "ovat",
    "ole",
    "oli",
    "olisi",
    "olisit",
    "olisin",
    "olisimme",
    "olisitte",
    "olisivat",
    "olit",
    "olin",
    "olimme",
    "olitte",
    "olivat",
    "ollut",
    "olleet",
    "en",
    "et",
    "ei",
    "emme",
    "ette",
    "eivät",
    "minä",
    "minun",
    "minut",
    "minua",
    "minussa",
    "minusta",
    "minuun",
    "minulla",
    "minulta",
    "minulle",
    "sinä",
    "sinun",
    "sinut",
    "sinua",
    "sinussa",
    "sinusta",
    "sinuun",
    "sinulla",
    "sinulta",
    "sinulle",
    "hän",
    "hänen",
    "hänet",
    "häntä",
    "hänessä",
    "hänestä",
    "häneen",
    "hänellä",
    "häneltä",
    "hänelle",
    "me",
    "meidän",
    "meidät",
    "meitä",
    "meissä",
    "meistä",
    "meihin",
    "meillä",
    "meiltä",
    "meille",
    "te",
    "teidän",
    "teidät",
    "teitä",
    "teissä",
    "teistä",
    "teihin",
    "teillä",
    "teiltä",
    "teille",
    "he",
    "heidän",
    "heidät",
    "heitä",
    "heissä",
    "heistä",
    "heihin",
    "heillä",
    "heiltä",
    "heille",
    "tämä",
    "tämän",
    "tätä",
    "tässä",
    "tästä",
    "tähän",
    "tällä",
    "tältä",
    "tälle",
    "tänä",
    "täksi",
    "tuo",
    "tuon",
    "tuota",
    "tuossa",
    "tuosta",
    "tuohon",
    "tuolla",
    "tuolta",
    "tuolle",
    "tuona",
    "tuoksi",
    "se",
    "sen",
    "sitä",
    "siinä",
    "siitä",
    "siihen",
    "sillä",
    "siltä",
    "sille",
    "sinä",
    "siksi",
    "nämä",
    "näiden",
    "näitä",
    "näissä",
    "näistä",
    "näihin",
    "näillä",
    "näiltä",
    "näille",
    "näinä",
    "näiksi",
    "nuo",
    "noiden",
    "noita",
    "noissa",
    "noista",
    "noihin",
    "noilla",
    "noilta",
    "noille",
    "noina",
    "noiksi",
    "ne",
    "niiden",
    "niitä",
    "niissä",
    "niistä",
    "niihin",
    "niillä",
    "niiltä",
    "niille",
    "niinä",
    "niiksi",
    "kuka",
    "kenen",
    "kenet",
    "ketä",
    "kenessä",
    "kenestä",
    "keneen",
    "kenellä",
    "keneltä",
    "kenelle",
    "kenenä",
    "keneksi",
    "ketkä",
    "keiden",
    "ketkä",
    "keitä",
    "keissä",
    "keistä",
    "keihin",
    "keillä",
    "keiltä",
    "keille",
    "keinä",
    "keiksi",
    "mikä",
    "minkä",
    "minkä",
    "mitä",
    "missä",
    "mistä",
    "mihin",
    "millä",
    "miltä",
    "mille",
    "minä",
    "miksi",
    "mitkä",
    "joka",
    "jonka",
    "jota",
    "jossa",
    "josta",
    "johon",
    "jolla",
    "jolta",
    "jolle",
    "jona",
    "joksi",
    "jotka",
    "joiden",
    "joita",
    "joissa",
    "joista",
    "joihin",
    "joilla",
    "joilta",
    "joille",
    "joina",
    "joiksi",
    "että",
    "ja",
    "jos",
    "koska",
    "kuin",
    "mutta",
    "niin",
    "sekä",
    "sillä",
    "tai",
    "vaan",
    "vai",
    "vaikka",
    "kanssa",
    "mukaan",
    "noin",
    "poikki",
    "yli",
    "kun",
    "nyt",
    "itse",
];

/// French word list.
///
/// A static slice of lowercase French words: articles, pronouns, prepositions, conjunctions,
/// bare elided forms (`c`, `d`, `j`, `l`, `m`, `n`, `s`, `t`, `qu`) and conjugated forms of
/// `être` and `avoir`.
// NOTE(review): presumably the built-in French stop-word list — confirm against the consumer.
pub const FRENCH: &[&str] = &[
    "au",
    "aux",
    "avec",
    "ce",
    "ces",
    "dans",
    "de",
    "des",
    "du",
    "elle",
    "en",
    "et",
    "eux",
    "il",
    "je",
    "la",
    "le",
    "leur",
    "lui",
    "ma",
    "mais",
    "me",
    "même",
    "mes",
    "moi",
    "mon",
    "ne",
    "nos",
    "notre",
    "nous",
    "on",
    "ou",
    "par",
    "pas",
    "pour",
    "qu",
    "que",
    "qui",
    "sa",
    "se",
    "ses",
    "sur",
    "ta",
    "te",
    "tes",
    "toi",
    "ton",
    "tu",
    "un",
    "une",
    "vos",
    "votre",
    "vous",
    "c",
    "d",
    "j",
    "l",
    "à",
    "m",
    "n",
    "s",
    "t",
    "y",
    "étée",
    "étées",
    "étant",
    "suis",
    "es",
    "êtes",
    "sont",
    "serai",
    "seras",
    "sera",
    "serons",
    "serez",
    "seront",
    "serais",
    "serait",
    "serions",
    "seriez",
    "seraient",
    "étais",
    "était",
    "étions",
    "étiez",
    "étaient",
    "fus",
    "fut",
    "fûmes",
    "fûtes",
    "furent",
    "sois",
    "soit",
    "soyons",
    "soyez",
    "soient",
    "fusse",
    "fusses",
    "fussions",
    "fussiez",
    "fussent",
    "ayant",
    "eu",
    "eue",
    "eues",
    "eus",
    "ai",
    "avons",
    "avez",
    "ont",
    "aurai",
    "aurons",
    "aurez",
    "auront",
    "aurais",
    "aurait",
    "aurions",
    "auriez",
    "auraient",
    "avais",
    "avait",
    "aviez",
    "avaient",
    "eut",
    "eûmes",
    "eûtes",
    "eurent",
    "aie",
    "aies",
    "ait",
    "ayons",
    "ayez",
    "aient",
    "eusse",
    "eusses",
    "eût",
    "eussions",
    "eussiez",
    "eussent",
    "ceci",
    "cela",
    "celà",
    "cet",
    "cette",
    "ici",
    "ils",
    "les",
    "leurs",
    "quel",
    "quels",
    "quelle",
    "quelles",
    "sans",
    "soi",
];

/// German word list.
///
/// A static slice of lowercase German words: articles, pronouns and determiners in their
/// inflected forms, prepositions, conjunctions and common auxiliary/modal verb forms.
// NOTE(review): presumably the built-in German stop-word list — confirm against the consumer.
pub const GERMAN: &[&str] = &[
    "aber",
    "alle",
    "allem",
    "allen",
    "aller",
    "alles",
    "als",
    "also",
    "am",
    "an",
    "ander",
    "andere",
    "anderem",
    "anderen",
    "anderer",
    "anderes",
    "anderm",
    "andern",
    "anderr",
    "anders",
    "auch",
    "auf",
    "aus",
    "bei",
    "bin",
    "bis",
    "bist",
    "da",
    "damit",
    "dann",
    "der",
    "den",
    "des",
    "dem",
    "die",
    "das",
    "daß",
    "derselbe",
    "derselben",
    "denselben",
    "desselben",
    "demselben",
    "dieselbe",
    "dieselben",
    "dasselbe",
    "dazu",
    "dein",
    "deine",
    "deinem",
    "deinen",
    "deiner",
    "deines",
    "denn",
    "derer",
    "dessen",
    "dich",
    "dir",
    "du",
    "dies",
    "diese",
    "diesem",
    "diesen",
    "dieser",
    "dieses",
    "doch",
    "dort",
    "durch",
    "ein",
    "eine",
    "einem",
    "einen",
    "einer",
    "eines",
    "einig",
    "einige",
    "einigem",
    "einigen",
    "einiger",
    "einiges",
    "einmal",
    "er",
    "ihn",
    "ihm",
    "es",
    "etwas",
    "euer",
    "eure",
    "eurem",
    "euren",
    "eurer",
    "eures",
    "für",
    "gegen",
    "gewesen",
    "hab",
    "habe",
    "haben",
    "hat",
    "hatte",
    "hatten",
    "hier",
    "hin",
    "hinter",
    "ich",
    "mich",
    "mir",
    "ihr",
    "ihre",
    "ihrem",
    "ihren",
    "ihrer",
    "ihres",
    "euch",
    "im",
    "in",
    "indem",
    "ins",
    "ist",
    "jede",
    "jedem",
    "jeden",
    "jeder",
    "jedes",
    "jene",
    "jenem",
    "jenen",
    "jener",
    "jenes",
    "jetzt",
    "kann",
    "kein",
    "keine",
    "keinem",
    "keinen",
    "keiner",
    "keines",
    "können",
    "könnte",
    "machen",
    "man",
    "manche",
    "manchem",
    "manchen",
    "mancher",
    "manches",
    "mein",
    "meine",
    "meinem",
    "meinen",
    "meiner",
    "meines",
    "mit",
    "muss",
    "musste",
    "nach",
    "nicht",
    "nichts",
    "noch",
    "nun",
    "nur",
    "ob",
    "oder",
    "ohne",
    "sehr",
    "sein",
    "seine",
    "seinem",
    "seinen",
    "seiner",
    "seines",
    "selbst",
    "sich",
    "sie",
    "ihnen",
    "sind",
    "so",
    "solche",
    "solchem",
    "solchen",
    "solcher",
    "solches",
    "soll",
    "sollte",
    "sondern",
    "sonst",
    "über",
    "um",
    "und",
    "uns",
    "unse",
    "unsem",
    "unsen",
    "unser",
    "unses",
    "unter",
    "viel",
    "vom",
    "von",
    "vor",
    "während",
    "war",
    "waren",
    "warst",
    "was",
    "weg",
    "weil",
    "weiter",
    "welche",
    "welchem",
    "welchen",
    "welcher",
    "welches",
    "wenn",
    "werde",
    "werden",
    "wie",
    "wieder",
    "will",
    "wir",
    "wird",
    "wirst",
    "wo",
    "wollen",
    "wollte",
    "würde",
    "würden",
    "zu",
    "zum",
    "zur",
    "zwar",
    "zwischen",
];

/// Hungarian word list.
///
/// A static slice of lowercase Hungarian words.
// NOTE(review): presumably the built-in Hungarian stop-word list — confirm against the consumer.
// NOTE(review): "majd" occurs twice, and "ill." is the only entry containing punctuation
// (the bare "ill" is listed as well); callers must not assume unique, purely alphabetic entries.
pub const HUNGARIAN: &[&str] = &[
    "a",
    "ahogy",
    "ahol",
    "aki",
    "akik",
    "akkor",
    "alatt",
    "által",
    "általában",
    "amely",
    "amelyek",
    "amelyekben",
    "amelyeket",
    "amelyet",
    "amelynek",
    "ami",
    "amit",
    "amolyan",
    "amíg",
    "amikor",
    "át",
    "abban",
    "ahhoz",
    "annak",
    "arra",
    "arról",
    "az",
    "azok",
    "azon",
    "azt",
    "azzal",
    "azért",
    "aztán",
    "azután",
    "azonban",
    "bár",
    "be",
    "belül",
    "benne",
    "cikk",
    "cikkek",
    "cikkeket",
    "csak",
    "de",
    "e",
    "eddig",
    "egész",
    "egy",
    "egyes",
    "egyetlen",
    "egyéb",
    "egyik",
    "egyre",
    "ekkor",
    "el",
    "elég",
    "ellen",
    "elő",
    "először",
    "előtt",
    "első",
    "én",
    "éppen",
    "ebben",
    "ehhez",
    "emilyen",
    "ennek",
    "erre",
    "ez",
    "ezt",
    "ezek",
    "ezen",
    "ezzel",
    "ezért",
    "és",
    "fel",
    "felé",
    "hanem",
    "hiszen",
    "hogy",
    "hogyan",
    "igen",
    "így",
    "illetve",
    "ill.",
    "ill",
    "ilyen",
    "ilyenkor",
    "ison",
    "ismét",
    "itt",
    "jó",
    "jól",
    "jobban",
    "kell",
    "kellett",
    "keresztül",
    "keressünk",
    "ki",
    "kívül",
    "között",
    "közül",
    "legalább",
    "lehet",
    "lehetett",
    "legyen",
    "lenne",
    "lenni",
    "lesz",
    "lett",
    "maga",
    "magát",
    "majd",
    "majd",
    "már",
    "más",
    "másik",
    "meg",
    "még",
    "mellett",
    "mert",
    "mely",
    "melyek",
    "mi",
    "mit",
    "míg",
    "miért",
    "milyen",
    "mikor",
    "minden",
    "mindent",
    "mindenki",
    "mindig",
    "mint",
    "mintha",
    "mivel",
    "most",
    "nagy",
    "nagyobb",
    "nagyon",
    "ne",
    "néha",
    "nekem",
    "neki",
    "nem",
    "néhány",
    "nélkül",
    "nincs",
    "olyan",
    "ott",
    "össze",
    "ő",
    "ők",
    "őket",
    "pedig",
    "persze",
    "rá",
    "s",
    "saját",
    "sem",
    "semmi",
    "sok",
    "sokat",
    "sokkal",
    "számára",
    "szemben",
    "szerint",
    "szinte",
    "talán",
    "tehát",
    "teljes",
    "tovább",
    "továbbá",
    "több",
    "úgy",
    "ugyanis",
    "új",
    "újabb",
    "újra",
    "után",
    "utána",
    "utolsó",
    "vagy",
    "vagyis",
    "valaki",
    "valami",
    "valamint",
    "való",
    "vagyok",
    "van",
    "vannak",
    "volt",
    "voltam",
    "voltak",
    "voltunk",
    "vissza",
    "vele",
    "viszont",
    "volna",
];

/// Italian word list.
///
/// A static slice of lowercase Italian words: prepositions and their articulated/elided forms
/// (`dell`, `nell`, `sugl`, ...), pronouns, possessives, conjunctions, and conjugated forms of
/// `avere`, `essere`, `fare` and `stare`.
// NOTE(review): presumably the built-in Italian stop-word list — confirm against the consumer.
pub const ITALIAN: &[&str] = &[
    "ad",
    "al",
    "allo",
    "ai",
    "agli",
    "all",
    "agl",
    "alla",
    "alle",
    "con",
    "col",
    "coi",
    "da",
    "dal",
    "dallo",
    "dai",
    "dagli",
    "dall",
    "dagl",
    "dalla",
    "dalle",
    "di",
    "del",
    "dello",
    "dei",
    "degli",
    "dell",
    "degl",
    "della",
    "delle",
    "in",
    "nel",
    "nello",
    "nei",
    "negli",
    "nell",
    "negl",
    "nella",
    "nelle",
    "su",
    "sul",
    "sullo",
    "sui",
    "sugli",
    "sull",
    "sugl",
    "sulla",
    "sulle",
    "per",
    "tra",
    "contro",
    "io",
    "tu",
    "lui",
    "lei",
    "noi",
    "voi",
    "loro",
    "mio",
    "mia",
    "miei",
    "mie",
    "tuo",
    "tua",
    "tuoi",
    "tue",
    "suo",
    "sua",
    "suoi",
    "sue",
    "nostro",
    "nostra",
    "nostri",
    "nostre",
    "vostro",
    "vostra",
    "vostri",
    "vostre",
    "mi",
    "ti",
    "ci",
    "vi",
    "lo",
    "la",
    "li",
    "le",
    "gli",
    "ne",
    "il",
    "un",
    "uno",
    "una",
    "ma",
    "ed",
    "se",
    "perché",
    "anche",
    "come",
    "dov",
    "dove",
    "che",
    "chi",
    "cui",
    "non",
    "più",
    "quale",
    "quanto",
    "quanti",
    "quanta",
    "quante",
    "quello",
    "quelli",
    "quella",
    "quelle",
    "questo",
    "questi",
    "questa",
    "queste",
    "si",
    "tutto",
    "tutti",
    "a",
    "c",
    "e",
    "i",
    "l",
    "o",
    "ho",
    "hai",
    "ha",
    "abbiamo",
    "avete",
    "hanno",
    "abbia",
    "abbiate",
    "abbiano",
    "avrò",
    "avrai",
    "avrà",
    "avremo",
    "avrete",
    "avranno",
    "avrei",
    "avresti",
    "avrebbe",
    "avremmo",
    "avreste",
    "avrebbero",
    "avevo",
    "avevi",
    "aveva",
    "avevamo",
    "avevate",
    "avevano",
    "ebbi",
    "avesti",
    "ebbe",
    "avemmo",
    "aveste",
    "ebbero",
    "avessi",
    "avesse",
    "avessimo",
    "avessero",
    "avendo",
    "avuto",
    "avuta",
    "avuti",
    "avute",
    "sono",
    "sei",
    "è",
    "siamo",
    "siete",
    "sia",
    "siate",
    "siano",
    "sarò",
    "sarai",
    "sarà",
    "saremo",
    "sarete",
    "saranno",
    "sarei",
    "saresti",
    "sarebbe",
    "saremmo",
    "sareste",
    "sarebbero",
    "ero",
    "eri",
    "era",
    "eravamo",
    "eravate",
    "erano",
    "fui",
    "fosti",
    "fu",
    "fummo",
    "foste",
    "furono",
    "fossi",
    "fosse",
    "fossimo",
    "fossero",
    "essendo",
    "faccio",
    "fai",
    "facciamo",
    "fanno",
    "faccia",
    "facciate",
    "facciano",
    "farò",
    "farai",
    "farà",
    "faremo",
    "farete",
    "faranno",
    "farei",
    "faresti",
    "farebbe",
    "faremmo",
    "fareste",
    "farebbero",
    "facevo",
    "facevi",
    "faceva",
    "facevamo",
    "facevate",
    "facevano",
    "feci",
    "facesti",
    "fece",
    "facemmo",
    "faceste",
    "fecero",
    "facessi",
    "facesse",
    "facessimo",
    "facessero",
    "facendo",
    "sto",
    "stai",
    "sta",
    "stiamo",
    "stanno",
    "stia",
    "stiate",
    "stiano",
    "starò",
    "starai",
    "starà",
    "staremo",
    "starete",
    "staranno",
    "starei",
    "staresti",
    "starebbe",
    "staremmo",
    "stareste",
    "starebbero",
    "stavo",
    "stavi",
    "stava",
    "stavamo",
    "stavate",
    "stavano",
    "stetti",
    "stesti",
    "stette",
    "stemmo",
    "steste",
    "stettero",
    "stessi",
    "stesse",
    "stessimo",
    "stessero",
    "stando",
];

/// Norwegian word list.
///
/// A static slice of lowercase Norwegian words. Variant spellings are listed side by side
/// (for example `ikke`/`ikkje`, `selv`/`sjøl`, `ble`/`blei`).
// NOTE(review): presumably the built-in Norwegian stop-word list, apparently mixing Bokmål and
// Nynorsk forms — confirm against the consumer.
pub const NORWEGIAN: &[&str] = &[
    "og",
    "i",
    "jeg",
    "det",
    "at",
    "en",
    "et",
    "den",
    "til",
    "er",
    "som",
    "på",
    "de",
    "med",
    "han",
    "av",
    "ikke",
    "ikkje",
    "der",
    "så",
    "var",
    "meg",
    "seg",
    "men",
    "ett",
    "har",
    "om",
    "vi",
    "min",
    "mitt",
    "ha",
    "hadde",
    "hun",
    "nå",
    "over",
    "da",
    "ved",
    "fra",
    "du",
    "ut",
    "sin",
    "dem",
    "oss",
    "opp",
    "man",
    "kan",
    "hans",
    "hvor",
    "eller",
    "hva",
    "skal",
    "selv",
    "sjøl",
    "her",
    "alle",
    "vil",
    "bli",
    "ble",
    "blei",
    "blitt",
    "kunne",
    "inn",
    "når",
    "være",
    "kom",
    "noen",
    "noe",
    "ville",
    "dere",
    "deres",
    "kun",
    "ja",
    "etter",
    "ned",
    "skulle",
    "denne",
    "for",
    "deg",
    "si",
    "sine",
    "sitt",
    "mot",
    "å",
    "meget",
    "hvorfor",
    "dette",
    "disse",
    "uten",
    "hvordan",
    "ingen",
    "din",
    "ditt",
    "blir",
    "samme",
    "hvilken",
    "hvilke",
    "sånn",
    "inni",
    "mellom",
    "vår",
    "hver",
    "hvem",
    "vors",
    "hvis",
    "både",
    "bare",
    "enn",
    "fordi",
    "før",
    "mange",
    "også",
    "slik",
    "vært",
    "båe",
    "begge",
    "siden",
    "dykk",
    "dykkar",
    "dei",
    "deira",
    "deires",
    "deim",
    "di",
    "då",
    "eg",
    "ein",
    "eit",
    "eitt",
    "elles",
    "honom",
    "hjå",
    "ho",
    "hoe",
    "henne",
    "hennar",
    "hennes",
    "hoss",
    "hossen",
    "ingi",
    "inkje",
    "korleis",
    "korso",
    "kva",
    "kvar",
    "kvarhelst",
    "kven",
    "kvi",
    "kvifor",
    "me",
    "medan",
    "mi",
    "mine",
    "mykje",
    "no",
    "nokon",
    "noka",
    "nokor",
    "noko",
    "nokre",
    "sia",
    "sidan",
    "so",
    "somt",
    "somme",
    "um",
    "upp",
    "vere",
    "vore",
    "verte",
    "vort",
    "varte",
    "vart",
];

/// Portuguese word list.
///
/// A static slice of lowercase Portuguese words: articles, prepositions and their contractions,
/// pronouns, possessives, and conjugated forms of `estar`, `haver`, `ser` and `ter`.
// NOTE(review): presumably the built-in Portuguese stop-word list — confirm against the consumer.
// NOTE(review): the entry "tém" (between "temos" and "tinha") looks like a misspelling of "têm";
// verify against the upstream word list before changing it, since editing an entry changes
// which tokens match.
pub const PORTUGUESE: &[&str] = &[
    "de",
    "a",
    "o",
    "que",
    "e",
    "do",
    "da",
    "em",
    "um",
    "para",
    "com",
    "não",
    "uma",
    "os",
    "no",
    "se",
    "na",
    "por",
    "mais",
    "as",
    "dos",
    "como",
    "mas",
    "ao",
    "ele",
    "das",
    "à",
    "seu",
    "sua",
    "ou",
    "quando",
    "muito",
    "nos",
    "já",
    "eu",
    "também",
    "só",
    "pelo",
    "pela",
    "até",
    "isso",
    "ela",
    "entre",
    "depois",
    "sem",
    "mesmo",
    "aos",
    "seus",
    "quem",
    "nas",
    "me",
    "esse",
    "eles",
    "você",
    "essa",
    "num",
    "nem",
    "suas",
    "meu",
    "às",
    "minha",
    "numa",
    "pelos",
    "elas",
    "qual",
    "nós",
    "lhe",
    "deles",
    "essas",
    "esses",
    "pelas",
    "este",
    "dele",
    "tu",
    "te",
    "vocês",
    "vos",
    "lhes",
    "meus",
    "minhas",
    "teu",
    "tua",
    "teus",
    "tuas",
    "nosso",
    "nossa",
    "nossos",
    "nossas",
    "dela",
    "delas",
    "esta",
    "estes",
    "estas",
    "aquele",
    "aquela",
    "aqueles",
    "aquelas",
    "isto",
    "aquilo",
    "estou",
    "está",
    "estamos",
    "estão",
    "estive",
    "esteve",
    "estivemos",
    "estiveram",
    "estava",
    "estávamos",
    "estavam",
    "estivera",
    "estivéramos",
    "esteja",
    "estejamos",
    "estejam",
    "estivesse",
    "estivéssemos",
    "estivessem",
    "estiver",
    "estivermos",
    "estiverem",
    "hei",
    "há",
    "havemos",
    "hão",
    "houve",
    "houvemos",
    "houveram",
    "houvera",
    "houvéramos",
    "haja",
    "hajamos",
    "hajam",
    "houvesse",
    "houvéssemos",
    "houvessem",
    "houver",
    "houvermos",
    "houverem",
    "houverei",
    "houverá",
    "houveremos",
    "houverão",
    "houveria",
    "houveríamos",
    "houveriam",
    "sou",
    "somos",
    "são",
    "era",
    "éramos",
    "eram",
    "fui",
    "foi",
    "fomos",
    "foram",
    "fora",
    "fôramos",
    "seja",
    "sejamos",
    "sejam",
    "fosse",
    "fôssemos",
    "fossem",
    "for",
    "formos",
    "forem",
    "serei",
    "será",
    "seremos",
    "serão",
    "seria",
    "seríamos",
    "seriam",
    "tenho",
    "tem",
    "temos",
    "tém",
    "tinha",
    "tínhamos",
    "tinham",
    "tive",
    "teve",
    "tivemos",
    "tiveram",
    "tivera",
    "tivéramos",
    "tenha",
    "tenhamos",
    "tenham",
    "tivesse",
    "tivéssemos",
    "tivessem",
    "tiver",
    "tivermos",
    "tiverem",
    "terei",
    "terá",
    "teremos",
    "terão",
    "teria",
    "teríamos",
    "teriam",
];

/// Russian word list.
///
/// A static slice of lowercase Russian words written in Cyrillic.
// NOTE(review): presumably the built-in Russian stop-word list — confirm against the consumer.
pub const RUSSIAN: &[&str] = &[
    "и",
    "в",
    "во",
    "не",
    "что",
    "он",
    "на",
    "я",
    "с",
    "со",
    "как",
    "а",
    "то",
    "все",
    "она",
    "так",
    "его",
    "но",
    "да",
    "ты",
    "к",
    "у",
    "же",
    "вы",
    "за",
    "бы",
    "по",
    "только",
    "ее",
    "мне",
    "было",
    "вот",
    "от",
    "меня",
    "еще",
    "нет",
    "о",
    "из",
    "ему",
    "теперь",
    "когда",
    "даже",
    "ну",
    "вдруг",
    "ли",
    "если",
    "уже",
    "или",
    "ни",
    "быть",
    "был",
    "него",
    "до",
    "вас",
    "нибудь",
    "опять",
    "уж",
    "вам",
    "сказал",
    "ведь",
    "там",
    "потом",
    "себя",
    "ничего",
    "ей",
    "может",
    "они",
    "тут",
    "где",
    "есть",
    "надо",
    "ней",
    "для",
    "мы",
    "тебя",
    "их",
    "чем",
    "была",
    "сам",
    "чтоб",
    "без",
    "будто",
    "человек",
    "чего",
    "раз",
    "тоже",
    "себе",
    "под",
    "жизнь",
    "будет",
    "ж",
    "тогда",
    "кто",
    "этот",
    "говорил",
    "того",
    "потому",
    "этого",
    "какой",
    "совсем",
    "ним",
    "здесь",
    "этом",
    "один",
    "почти",
    "мой",
    "тем",
    "чтобы",
    "нее",
    "кажется",
    "сейчас",
    "были",
    "куда",
    "зачем",
    "сказать",
    "всех",
    "никогда",
    "сегодня",
    "можно",
    "при",
    "наконец",
    "два",
    "об",
    "другой",
    "хоть",
    "после",
    "над",
    "больше",
    "тот",
    "через",
    "эти",
    "нас",
    "про",
    "всего",
    "них",
    "какая",
    "много",
    "разве",
    "сказала",
    "три",
    "эту",
    "моя",
    "впрочем",
    "хорошо",
    "свою",
    "этой",
    "перед",
    "иногда",
    "лучше",
    "чуть",
    "том",
    "нельзя",
    "такой",
    "им",
    "более",
    "всегда",
    "конечно",
    "всю",
    "между",
];

/// Spanish word list.
///
/// A static slice of lowercase Spanish words: articles, prepositions, pronouns, possessives,
/// conjunctions, and conjugated forms of `estar`, `haber`, `ser` and `tener`. Accented and
/// unaccented spellings are distinct entries (for example `tu`/`tú`, `mi`/`mí`).
// NOTE(review): presumably the built-in Spanish stop-word list — confirm against the consumer.
pub const SPANISH: &[&str] = &[
    "de",
    "la",
    "que",
    "el",
    "en",
    "y",
    "a",
    "los",
    "del",
    "se",
    "las",
    "por",
    "un",
    "para",
    "con",
    "no",
    "una",
    "su",
    "al",
    "lo",
    "como",
    "más",
    "pero",
    "sus",
    "le",
    "ya",
    "o",
    "este",
    "sí",
    "porque",
    "esta",
    "entre",
    "cuando",
    "muy",
    "sin",
    "sobre",
    "también",
    "me",
    "hasta",
    "hay",
    "donde",
    "quien",
    "desde",
    "todo",
    "nos",
    "durante",
    "todos",
    "uno",
    "les",
    "ni",
    "contra",
    "otros",
    "ese",
    "eso",
    "ante",
    "ellos",
    "e",
    "esto",
    "mí",
    "antes",
    "algunos",
    "qué",
    "unos",
    "yo",
    "otro",
    "otras",
    "otra",
    "él",
    "tanto",
    "esa",
    "estos",
    "mucho",
    "quienes",
    "nada",
    "muchos",
    "cual",
    "poco",
    "ella",
    "estar",
    "estas",
    "algunas",
    "algo",
    "nosotros",
    "mi",
    "mis",
    "tú",
    "te",
    "ti",
    "tu",
    "tus",
    "ellas",
    "nosotras",
    "vosotros",
    "vosotras",
    "os",
    "mío",
    "mía",
    "míos",
    "mías",
    "tuyo",
    "tuya",
    "tuyos",
    "tuyas",
    "suyo",
    "suya",
    "suyos",
    "suyas",
    "nuestro",
    "nuestra",
    "nuestros",
    "nuestras",
    "vuestro",
    "vuestra",
    "vuestros",
    "vuestras",
    "esos",
    "esas",
    "estoy",
    "estás",
    "está",
    "estamos",
    "estáis",
    "están",
    "esté",
    "estés",
    "estemos",
    "estéis",
    "estén",
    "estaré",
    "estarás",
    "estará",
    "estaremos",
    "estaréis",
    "estarán",
    "estaría",
    "estarías",
    "estaríamos",
    "estaríais",
    "estarían",
    "estaba",
    "estabas",
    "estábamos",
    "estabais",
    "estaban",
    "estuve",
    "estuviste",
    "estuvo",
    "estuvimos",
    "estuvisteis",
    "estuvieron",
    "estuviera",
    "estuvieras",
    "estuviéramos",
    "estuvierais",
    "estuvieran",
    "estuviese",
    "estuvieses",
    "estuviésemos",
    "estuvieseis",
    "estuviesen",
    "estando",
    "estado",
    "estada",
    "estados",
    "estadas",
    "estad",
    "he",
    "has",
    "ha",
    "hemos",
    "habéis",
    "han",
    "haya",
    "hayas",
    "hayamos",
    "hayáis",
    "hayan",
    "habré",
    "habrás",
    "habrá",
    "habremos",
    "habréis",
    "habrán",
    "habría",
    "habrías",
    "habríamos",
    "habríais",
    "habrían",
    "había",
    "habías",
    "habíamos",
    "habíais",
    "habían",
    "hube",
    "hubiste",
    "hubo",
    "hubimos",
    "hubisteis",
    "hubieron",
    "hubiera",
    "hubieras",
    "hubiéramos",
    "hubierais",
    "hubieran",
    "hubiese",
    "hubieses",
    "hubiésemos",
    "hubieseis",
    "hubiesen",
    "habiendo",
    "habido",
    "habida",
    "habidos",
    "habidas",
    "soy",
    "eres",
    "es",
    "somos",
    "sois",
    "son",
    "sea",
    "seas",
    "seamos",
    "seáis",
    "sean",
    "seré",
    "serás",
    "será",
    "seremos",
    "seréis",
    "serán",
    "sería",
    "serías",
    "seríamos",
    "seríais",
    "serían",
    "era",
    "eras",
    "éramos",
    "erais",
    "eran",
    "fui",
    "fuiste",
    "fue",
    "fuimos",
    "fuisteis",
    "fueron",
    "fuera",
    "fueras",
    "fuéramos",
    "fuerais",
    "fueran",
    "fuese",
    "fueses",
    "fuésemos",
    "fueseis",
    "fuesen",
    "siendo",
    "sido",
    "tengo",
    "tienes",
    "tiene",
    "tenemos",
    "tenéis",
    "tienen",
    "tenga",
    "tengas",
    "tengamos",
    "tengáis",
    "tengan",
    "tendré",
    "tendrás",
    "tendrá",
    "tendremos",
    "tendréis",
    "tendrán",
    "tendría",
    "tendrías",
    "tendríamos",
    "tendríais",
    "tendrían",
    "tenía",
    "tenías",
    "teníamos",
    "teníais",
    "tenían",
    "tuve",
    "tuviste",
    "tuvo",
    "tuvimos",
    "tuvisteis",
    "tuvieron",
    "tuviera",
    "tuvieras",
    "tuviéramos",
    "tuvierais",
    "tuvieran",
    "tuviese",
    "tuvieses",
    "tuviésemos",
    "tuvieseis",
    "tuviesen",
    "teniendo",
    "tenido",
    "tenida",
    "tenidos",
    "tenidas",
    "tened",
];

/// Swedish word list.
///
/// A static slice of lowercase Swedish words: pronouns, possessives, prepositions,
/// conjunctions and common auxiliary verb forms.
// NOTE(review): presumably the built-in Swedish stop-word list — confirm against the consumer.
pub const SWEDISH: &[&str] = &[
    "och",
    "det",
    "att",
    "i",
    "en",
    "jag",
    "hon",
    "som",
    "han",
    "på",
    "den",
    "med",
    "var",
    "sig",
    "för",
    "så",
    "till",
    "är",
    "men",
    "ett",
    "om",
    "hade",
    "de",
    "av",
    "icke",
    "mig",
    "du",
    "henne",
    "då",
    "sin",
    "nu",
    "har",
    "inte",
    "hans",
    "honom",
    "skulle",
    "hennes",
    "där",
    "min",
    "man",
    "ej",
    "vid",
    "kunde",
    "något",
    "från",
    "ut",
    "när",
    "efter",
    "upp",
    "vi",
    "dem",
    "vara",
    "vad",
    "över",
    "än",
    "dig",
    "kan",
    "sina",
    "här",
    "ha",
    "mot",
    "alla",
    "under",
    "någon",
    "eller",
    "allt",
    "mycket",
    "sedan",
    "ju",
    "denna",
    "själv",
    "detta",
    "åt",
    "utan",
    "varit",
    "hur",
    "ingen",
    "mitt",
    "ni",
    "bli",
    "blev",
    "oss",
    "din",
    "dessa",
    "några",
    "deras",
    "blir",
    "mina",
    "samma",
    "vilken",
    "er",
    "sådan",
    "vår",
    "blivit",
    "dess",
    "inom",
    "mellan",
    "sådant",
    "varför",
    "varje",
    "vilka",
    "ditt",
    "vem",
    "vilket",
    "sitt",
    "sådana",
    "vart",
    "dina",
    "vars",
    "vårt",
    "våra",
    "ert",
    "era",
    "vilkas",
];


================================================
FILE: src/tokenizer/tokenized_string.rs
================================================
use std::cmp::Ordering;
use std::io;
use std::io::{Read, Write};

use common::*;

use crate::tokenizer::{Token, TokenStream};

/// A text bundled with the tokens that were already extracted from it.
///
/// The derived `Eq`/`PartialEq` compare both `text` and `tokens`; the type is also
/// serializable and deserializable through `serde`.
#[derive(Debug, Clone, serde::Serialize, serde::Deserialize, Eq, PartialEq)]
pub struct PreTokenizedString {
    /// Original text
    pub text: String,
    /// Tokens derived from the text
    pub tokens: Vec<Token>,
}

impl Ord for PreTokenizedString {
    /// Orders two values by their `text` alone; `tokens` are never consulted.
    // NOTE(review): the derived `Eq` also compares `tokens`, so two values can compare
    // `Ordering::Equal` here while being unequal under `==`. Confirm this is intended.
    fn cmp(&self, other: &Self) -> Ordering {
        let (lhs, rhs) = (&self.text, &other.text);
        Ord::cmp(lhs, rhs)
    }
}

impl PartialOrd for PreTokenizedString {
    /// Always returns `Some`: delegates to the total order defined by the `Ord` impl.
    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
        Some(Ord::cmp(self, other))
    }
}

impl BinarySerializable for PreTokenizedString {
    /// Encodes `self` as a JSON string and writes that string with the `String`
    /// implementation of `BinarySerializable`.
    ///
    /// # Errors
    ///
    /// Returns an `io::Error` if the JSON encoding fails (the underlying serde error is
    /// discarded) or if writing the string fails.
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        let json_text = serde_json::to_string(self)
            .map_err(|_| io::Error::other("Failed to dump PreTokenizedString to json."))?;
        <String as BinarySerializable>::serialize(&json_text, writer)
    }

    /// Reads a string with the `String` implementation of `BinarySerializable` and parses it
    /// as the JSON form of a `PreTokenizedString`.
    ///
    /// # Errors
    ///
    /// Returns an `io::Error` if reading the string fails or if it is not valid JSON for this
    /// type (the underlying serde error is discarded).
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        let json_text = <String as BinarySerializable>::deserialize(reader)?;

        serde_json::from_str(&json_text)
            .map_err(|_| io::Error::other("Failed to parse string data as PreTokenizedString."))
    }
}

/// [`TokenStream`] implementation which wraps [`PreTokenizedString`]
///
/// The stream owns the pre-tokenized string and hands out its tokens one by one.
pub struct PreTokenizedStream {
    // The wrapped text and its tokens.
    tokenized_string: PreTokenizedString,
    // Index into `tokenized_string.tokens` of the token currently exposed. Signed because the
    // `From<PreTokenizedString>` conversion starts it at -1, i.e. before `advance()` has been
    // called for the first time.
    current_token: i64,
}

impl From<PreTokenizedString> for PreTokenizedStream {
    fn from(s: PreTokenizedString) -> PreTokenizedStream {
        PreTokenizedStream {
            tokenized_string: s,
            current_token: -1,
        }
    }
}

impl PreTokenizedStream {
    /// Returns the cursor as a `usize` index.
    ///
    /// Panics if `advance()` has never been called (the cursor is still negative).
    fn cursor(&self) -> usize {
        if self.current_token < 0 {
            panic!("TokenStream not initialized. You should call advance() at least once.");
        }
        self.current_token as usize
    }
}

impl TokenStream for PreTokenizedStream {
    /// Moves the cursor to the next token and reports whether it now points at a token.
    fn advance(&mut self) -> bool {
        self.current_token += 1;
        let token_count = self.tokenized_string.tokens.len() as i64;
        self.current_token < token_count
    }

    /// Borrows the token under the cursor.
    ///
    /// Panics if `advance()` has not been called yet, and (through slice indexing) if the
    /// cursor has moved past the last token.
    fn token(&self) -> &Token {
        let idx = self.cursor();
        &self.tokenized_string.tokens[idx]
    }

    /// Mutably borrows the token under the cursor.
    ///
    /// Panics under the same conditions as `token()`.
    fn token_mut(&mut self) -> &mut Token {
        let idx = self.cursor();
        &mut self.tokenized_string.tokens[idx]
    }
}

#[cfg(test)]
mod tests {

    use super::*;

    /// A stream built from a `PreTokenizedString` yields its tokens in order and then
    /// reports exhaustion.
    #[test]
    fn test_tokenized_stream() {
        let expected_tokens = vec![
            Token {
                offset_from: 0,
                offset_to: 1,
                position: 0,
                text: String::from("A"),
                position_length: 1,
            },
            Token {
                offset_from: 2,
                offset_to: 3,
                position: 1,
                text: String::from("a"),
                position_length: 1,
            },
        ];
        let pre_tokenized = PreTokenizedString {
            text: String::from("A a"),
            tokens: expected_tokens.clone(),
        };

        let mut token_stream = PreTokenizedStream::from(pre_tokenized);

        for expected_token in &expected_tokens {
            assert!(token_stream.advance());
            assert_eq!(token_stream.token(), expected_token);
        }
        assert!(!token_stream.advance());
    }
}


================================================
FILE: src/tokenizer/tokenizer.rs
================================================
/// The tokenizer module contains all of the tools used to process
/// text in `tantivy`.
use tokenizer_api::{BoxTokenStream, TokenFilter, Tokenizer};

use crate::tokenizer::empty_tokenizer::EmptyTokenizer;

/// `TextAnalyzer` tokenizes an input text into tokens and modifies the resulting `TokenStream`.
///
/// It stores a single type-erased tokenizer. Cloning the analyzer clones that tokenizer via
/// `BoxableTokenizer::box_clone`.
#[derive(Clone)]
pub struct TextAnalyzer {
    // Type-erased tokenizer that produces the token stream.
    tokenizer: Box<dyn BoxableTokenizer>,
}

impl Tokenizer for Box<dyn BoxableTokenizer> {
    type TokenStream<'a> = BoxTokenStream<'a>;

    /// Produces the boxed token stream of the tokenizer stored inside the box.
    // Note: the call is made on the inner `dyn BoxableTokenizer` (hence the explicit
    // double dereference), never on the `Box` itself. The `Box` also implements
    // `BoxableTokenizer` through the blanket impl, and dispatching on it would recurse
    // back into this method until the stack overflows.
    fn token_stream<'a>(&'a mut self, text: &'a str) -> Self::TokenStream<'a> {
        <dyn BoxableTokenizer as BoxableTokenizer>::box_token_stream(&mut **self, text)
    }
}

impl Clone for Box<dyn BoxableTokenizer> {
    // Note: we want to call `box_clone` on the concrete `Tokenizer`
    // implementation in order to clone the concrete `Tokenizer`.
    fn clone(&self) -> Self {
        (**self).box_clone()
    }
}

/// A boxable `Tokenizer`, with its `TokenStream` type erased.
///
/// Every `Tokenizer` gets this trait through a blanket implementation, which is what allows
/// tokenizers of different concrete types to be stored as `Box<dyn BoxableTokenizer>`.
pub trait BoxableTokenizer: 'static + Send + Sync {
    /// Creates a boxed token stream for a given `str`.
    ///
    /// The returned stream borrows both the tokenizer and `text` for `'a`.
    fn box_token_stream<'a>(&'a mut self, text: &'a str) -> BoxTokenStream<'a>;
    /// Clone this tokenizer.
    ///
    /// Returns the copy as a new boxed trait object.
    fn box_clone(&self) -> Box<dyn BoxableTokenizer>;
}

impl<T: Tokenizer> BoxableTokenizer for T {
    fn box_token_stream<'a>(&'a mut self, text: &'a str) -> BoxTokenStream<'a> {
        BoxTokenStream::new(self.token_stream(text))
    }
    fn box_clone(&self) -> Box<dyn BoxableTokenizer> {
        Box::new(self.clone())
    }
}

impl Default for TextAnalyzer {
    /// The default analyzer wraps an `EmptyTokenizer` and has no filters.
    fn default() -> Self {
        EmptyTokenizer.into()
    }
}

impl<T: Tokenizer + Clone> From<T> for TextAnalyzer {
    fn from(tokenizer: T) -> Self {
        TextAnalyzer::builder(tokenizer).build()
    }
}

impl TextAnalyzer {
    /// Create a new TextAnalyzerBuilder
    pub fn builder<T: Tokenizer>(tokenizer: T) -> TextAnalyzerBuilder<T> {
        TextAnalyzerBuilder { tokenizer }
    }

    /// Creates a token stream for a given `str`.
    pub fn token_stream<'a>(&'a mut self, text: &'a str) -> BoxTokenStream<'a> {
        self.tokenizer.token_stream(text)
    }
}

/// Builder helper for [`TextAnalyzer`]
///
/// `T` is the type of the tokenizer pipeline built so far. It defaults to the
/// boxed, type-erased tokenizer, which is the type produced by `dynamic()` and
/// `filter_dynamic()`.
pub struct TextAnalyzerBuilder<T = Box<dyn BoxableTokenizer>> {
    // Tokenizer with all the filters appended so far already applied.
    tokenizer: T,
}

impl<T: Tokenizer> TextAnalyzerBuilder<T> {
    /// Appends a token filter to the current builder.
    ///
    /// # Example
    ///
    /// ```rust
    /// use tantivy::tokenizer::*;
    ///
    /// let en_stem = TextAnalyzer::builder(SimpleTokenizer::default())
    ///     .filter(RemoveLongFilter::limit(40))
    ///     .filter(LowerCaser)
    ///     .filter(Stemmer::default())
    ///     .build();
    /// ```
    pub fn filter<F: TokenFilter>(self, token_filter: F) -> TextAnalyzerBuilder<F::Tokenizer<T>> {
        TextAnalyzerBuilder {
            tokenizer: token_filter.transform(self.tokenizer),
        }
    }

    /// Boxes the internal tokenizer. This is useful for adding dynamic filters.
    /// Note: this will be less performant than the non boxed version.
    pub fn dynamic(self) -> TextAnalyzerBuilder {
        let boxed_tokenizer = Box::new(self.tokenizer);
        TextAnalyzerBuilder {
            tokenizer: boxed_tokenizer,
        }
    }

    /// Appends a token filter to the current builder and returns a boxed version of the
    /// tokenizer. This is useful when you want to build a `TextAnalyzer` dynamically.
    /// Prefer using `TextAnalyzer::builder(tokenizer).filter(token_filter).build()` if
    /// possible as it will be more performant and create less boxes.
    pub fn filter_dynamic<F: TokenFilter>(self, token_filter: F) -> TextAnalyzerBuilder {
        self.filter(token_filter).dynamic()
    }

    /// Finalize building the TextAnalyzer
    pub fn build(self) -> TextAnalyzer {
        TextAnalyzer {
            tokenizer: Box::new(self.tokenizer),
        }
    }
}

#[cfg(test)]
mod tests {

    use super::*;
    use crate::tokenizer::{LowerCaser, RemoveLongFilter, SimpleTokenizer};

    // Statically typed filter chain: the first two emitted tokens are checked.
    #[test]
    fn test_text_analyzer_builder() {
        let builder = TextAnalyzer::builder(SimpleTokenizer::default())
            .filter(RemoveLongFilter::limit(40))
            .filter(LowerCaser);
        let mut text_analyzer = builder.build();
        let mut tokens = text_analyzer.token_stream("- first bullet point");
        assert_eq!(tokens.next().unwrap().text, "first");
        assert_eq!(tokens.next().unwrap().text, "bullet");
    }

    #[test]
    fn test_text_analyzer_with_filters_boxed() {
        // This test shows how one can build a TextAnalyzer dynamically, by stacking a list
        // of parametrizable token filters.
        //
        // The following enum is the thing that would be serializable.
        // Note that token filters can have their own parameters, too, like the RemoveLongFilter
        enum SerializableTokenFilterEnum {
            LowerCaser(LowerCaser),
            RemoveLongFilter(RemoveLongFilter),
        }
        // Note that everything below is dynamic.
        let filters: Vec<SerializableTokenFilterEnum> = vec![
            SerializableTokenFilterEnum::LowerCaser(LowerCaser),
            SerializableTokenFilterEnum::RemoveLongFilter(RemoveLongFilter::limit(12)),
        ];
        let base_builder: TextAnalyzerBuilder = TextAnalyzer::builder(SimpleTokenizer::default())
            .filter_dynamic(RemoveLongFilter::limit(40))
            .filter_dynamic(LowerCaser);
        // Stack every dynamic filter on top of the boxed builder, in list order.
        let full_builder: TextAnalyzerBuilder =
            filters
                .into_iter()
                .fold(base_builder, |builder, filter| match filter {
                    SerializableTokenFilterEnum::LowerCaser(lower_caser) => {
                        builder.filter_dynamic(lower_caser)
                    }
                    SerializableTokenFilterEnum::RemoveLongFilter(remove_long_filter) => {
                        builder.filter_dynamic(remove_long_filter)
                    }
                });
        let mut text_analyzer = full_builder.build();
        let mut tokens = text_analyzer.token_stream("first bullet point");
        assert_eq!(tokens.next().unwrap().text, "first");
        assert_eq!(tokens.next().unwrap().text, "bullet");
    }
}


================================================
FILE: src/tokenizer/tokenizer_manager.rs
================================================
use std::collections::HashMap;
use std::sync::{Arc, RwLock};

use crate::tokenizer::tokenizer::TextAnalyzer;
use crate::tokenizer::{
    LowerCaser, RawTokenizer, RemoveLongFilter, SimpleTokenizer, WhitespaceTokenizer,
};

/// The tokenizer manager serves as a store for
/// all of the pre-configured tokenizer pipelines.
///
/// By default, it is populated with the following tokenizers.
///
/// - `raw` : does not process nor tokenize the text.
/// - `default` : Chops the text according to whitespace and punctuation, removes tokens that are
///   too long, and lowercases tokens.
/// - `en_stem` : Like `default`, but also applies stemming on the resulting tokens. Stemming can
///   improve the recall of your search engine. Only registered when the `stemmer` feature is
///   enabled.
/// - `whitespace` : Splits the text on whitespaces.
///
/// Cloning the manager is cheap: clones share the same underlying registry.
#[derive(Clone)]
pub struct TokenizerManager {
    // Name -> analyzer registry, shared between clones and guarded by a read/write lock.
    tokenizers: Arc<RwLock<HashMap<String, TextAnalyzer>>>,
}

impl TokenizerManager {
    /// Creates an empty tokenizer manager.
    pub fn new() -> Self {
        let tokenizers = Arc::new(RwLock::new(HashMap::new()));
        Self { tokenizers }
    }

    /// Registers a new tokenizer associated with a given name.
    ///
    /// A tokenizer previously registered under the same name is replaced.
    pub fn register<T>(&self, tokenizer_name: &str, tokenizer: T)
    where TextAnalyzer: From<T> {
        // Convert before taking the lock so the critical section stays minimal.
        let analyzer = TextAnalyzer::from(tokenizer);
        let mut registry = self
            .tokenizers
            .write()
            .expect("Acquiring the lock should never fail");
        registry.insert(tokenizer_name.to_string(), analyzer);
    }

    /// Accessing a tokenizer given its name.
    ///
    /// Returns a clone of the registered analyzer, or `None` if the name is unknown.
    pub fn get(&self, tokenizer_name: &str) -> Option<TextAnalyzer> {
        let registry = self
            .tokenizers
            .read()
            .expect("Acquiring the lock should never fail");
        registry.get(tokenizer_name).cloned()
    }
}

impl Default for TokenizerManager {
    /// Creates an `TokenizerManager` prepopulated with
    /// the default pre-configured tokenizers of `tantivy`.
    fn default() -> TokenizerManager {
        let manager = TokenizerManager::new();

        manager.register("raw", RawTokenizer::default());

        let default_analyzer = TextAnalyzer::builder(SimpleTokenizer::default())
            .filter(RemoveLongFilter::limit(40))
            .filter(LowerCaser)
            .build();
        manager.register("default", default_analyzer);

        #[cfg(feature = "stemmer")]
        {
            use crate::tokenizer::stemmer::{Language, Stemmer};
            let en_stem_analyzer = TextAnalyzer::builder(SimpleTokenizer::default())
                .filter(RemoveLongFilter::limit(40))
                .filter(LowerCaser) // The stemmer does not lowercase
                .filter(Stemmer::new(Language::English))
                .build();
            manager.register("en_stem", en_stem_analyzer);
        }

        manager.register("whitespace", WhitespaceTokenizer::default());

        manager
    }
}


================================================
FILE: src/tokenizer/whitespace_tokenizer.rs
================================================
use std::str::CharIndices;

use super::{Token, TokenStream, Tokenizer};

/// Tokenize the text by splitting on whitespaces.
///
/// Only ASCII whitespace characters are treated as separators.
#[derive(Clone, Default)]
pub struct WhitespaceTokenizer {
    // Token buffer lent to each token stream: it is reset, then mutably borrowed,
    // every time `token_stream` is called.
    token: Token,
}

/// Token stream produced by [`WhitespaceTokenizer`].
pub struct WhitespaceTokenStream<'a> {
    // Full input text; token text is sliced out of it by byte offsets.
    text: &'a str,
    // Cursor over the (byte offset, char) pairs that remain to be scanned.
    chars: CharIndices<'a>,
    // Token owned by the tokenizer and overwritten on each `advance`.
    token: &'a mut Token,
}

impl Tokenizer for WhitespaceTokenizer {
    type TokenStream<'a> = WhitespaceTokenStream<'a>;

    // Resets the shared token, then lends it to a fresh stream over `text`.
    fn token_stream<'a>(&'a mut self, text: &'a str) -> WhitespaceTokenStream<'a> {
        let token = &mut self.token;
        token.reset();
        let chars = text.char_indices();
        WhitespaceTokenStream { text, chars, token }
    }
}

impl WhitespaceTokenStream<'_> {
    // Consumes characters up to and including the next ASCII whitespace and returns
    // the byte offset of that whitespace, or the text length if there is none.
    fn search_token_end(&mut self) -> usize {
        let text_len = self.text.len();
        match self.chars.find(|(_, c)| c.is_ascii_whitespace()) {
            Some((offset, _)) => offset,
            None => text_len,
        }
    }
}

impl TokenStream for WhitespaceTokenStream<'_> {
    // Moves to the next token. Returns `false` once the text is exhausted.
    fn advance(&mut self) -> bool {
        self.token.text.clear();
        self.token.position = self.token.position.wrapping_add(1);

        // Skip leading ASCII whitespace; the first other character starts the token.
        let token_start = self.chars.find(|(_, c)| !c.is_ascii_whitespace());
        let Some((offset_from, _)) = token_start else {
            return false;
        };

        let offset_to = self.search_token_end();
        self.token.offset_from = offset_from;
        self.token.offset_to = offset_to;
        self.token.text.push_str(&self.text[offset_from..offset_to]);
        true
    }

    fn token(&self) -> &Token {
        &*self.token
    }

    fn token_mut(&mut self) -> &mut Token {
        &mut *self.token
    }
}

#[cfg(test)]
mod tests {
    use crate::tokenizer::tests::assert_token;
    use crate::tokenizer::{TextAnalyzer, Token, WhitespaceTokenizer};

    // Punctuation stays attached to the words: only whitespace separates tokens.
    #[test]
    fn test_whitespace_tokenizer() {
        let tokens = token_stream_helper("Hello, happy tax payer!");
        assert_eq!(tokens.len(), 4);
        assert_token(&tokens[0], 0, "Hello,", 0, 6);
        assert_token(&tokens[1], 1, "happy", 7, 12);
        assert_token(&tokens[2], 2, "tax", 13, 16);
        assert_token(&tokens[3], 3, "payer!", 17, 23);
    }

    // Runs the whitespace tokenizer over `text` and collects every emitted token.
    fn token_stream_helper(text: &str) -> Vec<Token> {
        let mut analyzer = TextAnalyzer::from(WhitespaceTokenizer::default());
        let mut token_stream = analyzer.token_stream(text);
        let mut collected: Vec<Token> = Vec::new();
        token_stream.process(&mut |token: &Token| collected.push(token.clone()));
        collected
    }
}


================================================
FILE: sstable/Cargo.toml
================================================
[package]
name = "tantivy-sstable"
version = "0.6.0"
edition = "2024"
license = "MIT"
homepage = "https://github.com/quickwit-oss/tantivy"
repository = "https://github.com/quickwit-oss/tantivy"
keywords = ["search", "information", "retrieval", "sstable"]
categories = ["database-implementations", "data-structures", "compression"]
description = "sstables for tantivy"

[dependencies]
common = {version= "0.10", path="../common", package="tantivy-common"}
futures-util = "0.3.30"
itertools = "0.14.0"
tantivy-bitpacker = { version= "0.9", path="../bitpacker" }
tantivy-fst = "0.5"
# experimental gives us access to Decompressor::upper_bound
zstd = { version = "0.13", optional = true, features = ["experimental"] }

[features]
zstd-compression = ["zstd"]

[dev-dependencies]
proptest = "1"
criterion = { version = "0.5", default-features = false }
names = "0.14"
rand = "0.9"

[[bench]]
name = "stream_bench"
harness = false

[[bench]]
name = "ord_to_term"
harness = false


================================================
FILE: sstable/README.md
================================================
# SSTable

The `tantivy-sstable` crate is yet another sstable crate.

It has been designed to be used in `quickwit`:
- as an alternative to the default tantivy fst dictionary.
- as a way to store the column index for dynamic fast fields.

The benefit compared to the fst crate is locality.
Searching a key in the fst crate requires downloading the entire dictionary.

Once the sstable index is downloaded, running a `get` in the sstable
crate only requires a single fetch.

Right now, the block index and the default block size have been designed
with quickwit in mind, and the performance of a single `get` is very bad.

# Sorted strings?

SSTable stands for Sorted String Table.
Strings have to be inserted in sorted order.

That sorted order is used in different ways:
- it makes gets and streaming ranges of keys
possible.
- it allows incremental encoding of the keys
- the front compression is leveraged to optimize
the intersection with an automaton

# On disk format

Overview of the SSTable format. Unless noted otherwise, numbers are little-endian.

### SSTable
```
+-------+-------+-----+--------+
| Block | Block | ... | Footer |
+-------+-------+-----+--------+
|----( # of blocks)---|
```
- Block(`SSTBlock`): list of independent blocks, terminated by a single empty block.
- Footer(`SSTFooter`)

### SSTBlock
```
+----------+----------+--------+-------+-------+-----+
| BlockLen | Compress | Values | Delta | Delta | ... |
+----------+----------+--------+-------+-------+-----+
                      |        |----( # of deltas)---|
                      |------(maybe compressed)------|
```
- BlockLen(u32): length of the block, including the compress byte.
- Compress(u8): indicate whether block is compressed. 0 if not compressed, 1 if compressed.
- Values: an application-defined format storing a sequence of values, capable of determining its own length
- Delta

### Delta
```
+---------+--------+
| KeepAdd | Suffix |
+---------+--------+
```
- KeepAdd
- Suffix: KeepAdd.add bytes of key suffix

### KeepAdd
KeepAdd can be encoded in two different representations: a very compact 1-byte one, which is enough for most usages, and a longer variable-length one used when required.

When keep < 16 and add < 16
```
+-----+------+
| Add | Keep |
+-----+------+
```
- Add(u4): number of bytes to push
- Keep(u4): number of bytes to pop

Otherwise:
```
+------+------+-----+
| 0x01 | Keep | Add |
+------+------+-----+
```
- Add(VInt): number of bytes to push
- Keep(VInt): number of bytes to pop


Note: as the SSTable does not support redundant keys, there is no ambiguity between the two representations. Add is always guaranteed to be non-zero, except for the very first key of an SSTable, where Keep is guaranteed to be zero.

### SSTFooter
```
+-----+----------------+-------------+-------------+---------+---------+
| Fst | BlockAddrStore | StoreOffset | IndexOffset | NumTerm | Version |
+-----+----------------+-------------+-------------+---------+---------+
```
- Fst(Fst): finite state transducer mapping keys to a block number
- BlockAddrStore(BlockAddrStore): store mapping a block number to its BlockAddr
- StoreOffset(u64): Offset to start of the BlockAddrStore. If zero, see the SingleBlockSStable section
- IndexOffset(u64): Offset to the start of the SSTFooter
- NumTerm(u64): number of terms in the sstable
- Version(u32): Currently equal to 3

### Fst

Fst is in the format of tantivy\_fst

### BlockAddrStore

```
+---------+-----------+-----------+-----+-----------+-----------+-----+
| MetaLen | BlockMeta | BlockMeta | ... | BlockData | BlockData | ... |
+---------+-----------+-----------+-----+-----------+-----------+-----+
          |---------(N blocks)----------|---------(N blocks)----------|
```

- MetaLen(u64): length of the BlockMeta section
- BlockMeta(BlockAddrBlockMetadata): metadata to seek through BlockData
- BlockData(CompactedBlockAddr): bitpacked per block metadata

### BlockAddrBlockMetadata

```
+--------+------------+--------------+------------+--------------+-------------------+-----------------+----------+
| Offset | RangeStart | FirstOrdinal | RangeSlope | OrdinalSlope | FirstOrdinalNBits | RangeStartNBits | BlockLen |
+--------+------------+--------------+------------+--------------+-------------------+-----------------+----------+
```

- Offset(u64): offset of the corresponding BlockData in the datastream
- RangeStart(u64): the start position of the first block
- FirstOrdinal(u64): the first ordinal of the first block
- RangeSlope(u32): slope predicted for start range evolution (see computation in BlockData)
- OrdinalSlope(u64): slope predicted for first ordinal evolution (see computation in BlockData)
- FirstOrdinalNBits(u8): number of bits per ordinal in datastream (see computation in BlockData)
- RangeStartNBits(u8): number of bits per range start in datastream (see computation in BlockData)

### BlockData

```
+-----------------+-------------------+---------------+
| RangeStartDelta | FirstOrdinalDelta | FinalRangeEnd |
+-----------------+-------------------+---------------+
|------(BlockLen repetitions)---------|
```

- RangeStartDelta(var): RangeStartNBits *bits* of little endian number. See below for decoding
- FirstOrdinalDelta(var): FirstOrdinalNBits *bits* of little endian number. See below for decoding
- FinalRangeEnd(var): RangeStartNBits *bits* of integer. See below for decoding

Converting a BlockData of index Index and a BlockAddrBlockMetadata to an actual block address is done as follows:
```
range_prediction := RangeStart + Index * RangeSlope;
range_derivation := RangeStartDelta - (1 << (RangeStartNBits-1));
range_start := range_prediction + range_derivation
```

The same computation can be done for ordinal.

Note that `range_derivation` can take negative value. `RangeStartDelta` is just its translation to a positive range.


## SingleBlockSStable

The format used for the index is meant to be compact; however, it has a constant cost of around 70
bytes, which isn't negligible for a table containing very few keys.
To limit the impact of that constant cost, single block sstables omit the Fst and BlockAddrStore from
their index. Instead, a block with a first ordinal of 0, a range start of 0 and a range end of IndexOffset
is implicitly used for every operation.


================================================
FILE: sstable/benches/ord_to_term.rs
================================================
use std::sync::Arc;

use common::OwnedBytes;
use common::file_slice::FileSlice;
use criterion::{Criterion, criterion_group, criterion_main};
use tantivy_sstable::{Dictionary, MonotonicU64SSTable};

fn make_test_sstable(suffix: &str) -> FileSlice {
    let mut builder = Dictionary::<MonotonicU64SSTable>::builder(Vec::new()).unwrap();

    // 125 mio elements
    for elem in 0..125_000_000 {
        let key = format!("prefix.{elem:07X}{suffix}").into_bytes();
        builder.insert(&key, &elem).unwrap();
    }

    let table = builder.finish().unwrap();
    let table = Arc::new(OwnedBytes::new(table));
    common::file_slice::FileSlice::new(table.clone())
}

/// Benchmarks ordinal -> term (`ord_to_term`) and term -> ordinal (`term_ord`)
/// lookups on a large sstable.
///
/// Two tables are built: one whose keys end with `.suffix` and one without any
/// suffix. For each table, every lookup is measured twice: against an already
/// opened dictionary, and with the cost of `Dictionary::open` included
/// (`open_and_*` benchmarks).
pub fn criterion_benchmark(c: &mut Criterion) {
    // Keys of the form `prefix.XXXXXXX.suffix`.
    {
        let slice = make_test_sstable(".suffix");
        let dict = Dictionary::<MonotonicU64SSTable>::open(slice.clone()).unwrap();
        c.bench_function("ord_to_term_suffix", |b| {
            // Output buffer reused across iterations.
            let mut res = Vec::new();
            b.iter(|| {
                assert!(dict.ord_to_term(100_000, &mut res).unwrap());
                assert!(dict.ord_to_term(19_000_000, &mut res).unwrap());
            })
        });
        c.bench_function("open_and_ord_to_term_suffix", |b| {
            let mut res = Vec::new();
            b.iter(|| {
                let dict = Dictionary::<MonotonicU64SSTable>::open(slice.clone()).unwrap();
                assert!(dict.ord_to_term(100_000, &mut res).unwrap());
                assert!(dict.ord_to_term(19_000_000, &mut res).unwrap());
            })
        });
        c.bench_function("term_ord_suffix", |b| {
            b.iter(|| {
                // 0x00186A0 == 100_000 and 0x121EAC0 == 19_000_000.
                assert_eq!(
                    dict.term_ord(b"prefix.00186A0.suffix").unwrap().unwrap(),
                    100_000
                );
                assert_eq!(
                    dict.term_ord(b"prefix.121EAC0.suffix").unwrap().unwrap(),
                    19_000_000
                );
            })
        });
        c.bench_function("open_and_term_ord_suffix", |b| {
            b.iter(|| {
                let dict = Dictionary::<MonotonicU64SSTable>::open(slice.clone()).unwrap();
                assert_eq!(
                    dict.term_ord(b"prefix.00186A0.suffix").unwrap().unwrap(),
                    100_000
                );
                assert_eq!(
                    dict.term_ord(b"prefix.121EAC0.suffix").unwrap().unwrap(),
                    19_000_000
                );
            })
        });
    }
    // Same benchmarks with keys of the form `prefix.XXXXXXX` (no suffix).
    {
        let slice = make_test_sstable("");
        let dict = Dictionary::<MonotonicU64SSTable>::open(slice.clone()).unwrap();
        c.bench_function("ord_to_term", |b| {
            let mut res = Vec::new();
            b.iter(|| {
                assert!(dict.ord_to_term(100_000, &mut res).unwrap());
                assert!(dict.ord_to_term(19_000_000, &mut res).unwrap());
            })
        });
        c.bench_function("open_and_ord_to_term", |b| {
            let mut res = Vec::new();
            b.iter(|| {
                let dict = Dictionary::<MonotonicU64SSTable>::open(slice.clone()).unwrap();
                assert!(dict.ord_to_term(100_000, &mut res).unwrap());
                assert!(dict.ord_to_term(19_000_000, &mut res).unwrap());
            })
        });
        c.bench_function("term_ord", |b| {
            b.iter(|| {
                assert_eq!(dict.term_ord(b"prefix.00186A0").unwrap().unwrap(), 100_000);
                assert_eq!(
                    dict.term_ord(b"prefix.121EAC0").unwrap().unwrap(),
                    19_000_000
                );
            })
        });
        c.bench_function("open_and_term_ord", |b| {
            b.iter(|| {
                let dict = Dictionary::<MonotonicU64SSTable>::open(slice.clone()).unwrap();
                assert_eq!(dict.term_ord(b"prefix.00186A0").unwrap().unwrap(), 100_000);
                assert_eq!(
                    dict.term_ord(b"prefix.121EAC0").unwrap().unwrap(),
                    19_000_000
                );
            })
        });
    }
}

// Registers `criterion_benchmark` in the `benches` group and lets criterion
// provide the entry point (the bench is declared with `harness = false`).
criterion_group!(benches, criterion_benchmark);
criterion_main!(benches);


================================================
FILE: sstable/benches/stream_bench.rs
================================================
use std::collections::BTreeSet;
use std::io;

use common::file_slice::FileSlice;
use criterion::{Criterion, criterion_group, criterion_main};
use rand::rngs::StdRng;
use rand::{Rng, SeedableRng};
use tantivy_sstable::{Dictionary, MonotonicU64SSTable};

// Alphabet the random benchmark keys are drawn from.
const CHARSET: &[u8] = b"abcdefghij";

/// Generates a random key of 3 to 11 characters, each drawn from `CHARSET`.
fn generate_key(rng: &mut impl Rng) -> String {
    // The length is drawn first, then one index per character.
    let len: usize = rng.random_range(3..12);
    (0..len)
        .map(|_| {
            let idx = rng.random_range(0..CHARSET.len());
            char::from(CHARSET[idx])
        })
        .collect()
}

/// Builds a dictionary of 100,000 distinct random keys, each mapped to its rank
/// in sorted order. The RNG seed is fixed so that the content is reproducible.
fn prepare_sstable() -> io::Result<Dictionary<MonotonicU64SSTable>> {
    let mut rng = StdRng::from_seed([3u8; 32]);

    // The ordered set both deduplicates the keys and yields them sorted.
    let mut keys = BTreeSet::new();
    while keys.len() < 100_000 {
        keys.insert(generate_key(&mut rng));
    }

    let mut builder = Dictionary::<MonotonicU64SSTable>::builder(Vec::new())?;
    for (word, ord) in keys.iter().zip(0u64..) {
        builder.insert(word, &ord)?;
    }
    let serialized = builder.finish()?;

    let dictionary = Dictionary::open(FileSlice::from(serialized))?;
    Ok(dictionary)
}

/// Opens a stream over the keys in `[lower, upper)` and, when `do_scan` is set,
/// walks it to the end and returns the number of entries seen.
///
/// With `do_scan == false` the stream is still created (so its setup cost is
/// measured) and `0` is returned.
fn stream_bench(
    dictionary: &Dictionary<MonotonicU64SSTable>,
    lower: &[u8],
    upper: &[u8],
    do_scan: bool,
) -> usize {
    let range = dictionary.range().ge(lower).lt(upper);
    let mut stream = range.into_stream().unwrap();
    if do_scan {
        let mut num_entries = 0;
        while stream.advance() {
            num_entries += 1;
        }
        num_entries
    } else {
        0
    }
}

/// Benchmarks range streaming over the dictionary built by `prepare_sstable`:
/// stream creation alone, a short range scan, and full scans with and without
/// explicit bounds.
pub fn criterion_benchmark(c: &mut Criterion) {
    let dict = prepare_sstable().unwrap();
    // Only measures the creation of the stream (`do_scan == false`).
    c.bench_function("short_scan_init", |b| {
        b.iter(|| stream_bench(&dict, b"fa", b"fana", false))
    });
    // The expected counts below depend on the fixed RNG seed used to build the table.
    c.bench_function("short_scan_init_and_scan", |b| {
        b.iter(|| {
            assert_eq!(stream_bench(&dict, b"fa", b"faz", true), 971);
        })
    });
    // Every key is made of the letters `a` to `j`, so `["", "z")` covers the whole table.
    c.bench_function("full_scan_init_and_scan_full_with_bound", |b| {
        b.iter(|| {
            assert_eq!(stream_bench(&dict, b"", b"z", true), 100_000);
        })
    });
    c.bench_function("full_scan_init_and_scan_full_no_bounds", |b| {
        b.iter(|| {
            let mut stream = dict.stream().unwrap();
            let mut count = 0;
            while stream.advance() {
                count += 1;
            }
            // Returned from the closure so that the result is handed to criterion.
            count
        })
    });
}

// Registers `criterion_benchmark` in the `benches` group and lets criterion
// provide the entry point (the bench is declared with `harness = false`).
criterion_group!(benches, criterion_benchmark);
criterion_main!(benches);


================================================
FILE: sstable/src/block_match_automaton.rs
================================================
use tantivy_fst::Automaton;

/// Tells whether a block may contain a key accepted by `automaton`, judging only
/// from the bounds of the block.
///
/// `start_key_opt` is the exclusive lower bound; it is `None` for the first block,
/// which has no predecessor. `end_key` is the inclusive, mandatory upper bound.
pub(crate) fn can_block_match_automaton(
    start_key_opt: Option<&[u8]>,
    end_key: &[u8],
    automaton: &impl Automaton,
) -> bool {
    let lower_bound: &[u8] = match start_key_opt {
        Some(start_key) => start_key,
        None => {
            // Without a lower bound, the empty string itself belongs to the block:
            // an automaton accepting it is a match right away.
            if automaton.is_match(&automaton.start()) {
                return true;
            }
            &[]
        }
    };
    can_block_match_automaton_with_start(lower_bound, end_key, automaton)
}

// Similar to can_block_match_automaton, ignoring the edge case of the initial block.
//
// Returns whether the automaton may accept some key in the range (start_key, end_key],
// i.e. start_key is exclusive and end_key is inclusive. Returns false when the range
// is empty (start_key >= end_key).
fn can_block_match_automaton_with_start(
    start_key: &[u8],
    end_key: &[u8],
    automaton: &impl Automaton,
) -> bool {
    // notation: in loops, we use `kb` to denote a key byte (a byte taken from the start/end key),
    // and `rb`, a range byte (usually all values higher than a `kb` when comparing with
    // start_key, or all values lower than a `kb` when comparing with end_key)

    if start_key >= end_key {
        return false;
    }

    let common_prefix_len = crate::common_prefix_len(start_key, end_key);

    // feed the prefix shared by both bounds to the automaton
    let mut base_state = automaton.start();
    for kb in &start_key[0..common_prefix_len] {
        base_state = automaton.accept(&base_state, *kb);
    }

    // this is not required for correctness, but allows dodging more expensive checks
    if !automaton.can_match(&base_state) {
        return false;
    }

    // we have 3 distinct cases:
    // - keys are `abc` and `abcd` => we test for abc[\0-d].*
    // - keys are `abcd` and `abce` => we test for abc[d-e].*
    // - keys are `abcd` and `abc` => contradiction with start_key < end_key.
    //
    // ideally for (abc, abcde] we could test for abc([\0-c].*|d([\0-d].*|e)?)
    // but let's start simple (and correct), and tighten our bounds later
    //
    // and for (abcde, abcfg] we could test for abc(d(e.+|[f-\xff].*)|e.*|f([\0-f].*|g)?)
    // abc (
    //  d(e.+|[f-\xff].*) |
    //  e.* |
    //  f([\0-f].*|g)?
    // )
    //
    // these are all written as regex, but can be converted to operations we can do:
    // - [x-y] is a for c in x..=y
    // - .* is a can_match()
    // - .+ is a for c in 0..=255 { accept(c).can_match() }
    // - ? is either the thing before can_match(), or current state.is_match()
    // - | means test both sides

    // we have two cases, either start_key is a prefix of end_key (e.g. (abc, abcjp]),
    // or it is not (e.g. (abcdg, abcjp]). It is not possible however that end_key be a prefix of
    // start_key (or that both are equal) because we already handled start_key >= end_key.
    //
    // if we are in the first case, we want to visit the following states:
    // abc (
    //   [\0-i].* |
    //   j (
    //     [\0-o].* |
    //     p
    //   )?
    // )
    // Everything after `abc` is handled by `match_range_end`
    //
    // if we are in the 2nd case, we want to visit the following states:
    // abc (
    //   d(g.+|[h-\xff].*) | // this is handled by match_range_start
    //
    //   [e-i].* |           // this is handled here
    //
    //   j (                 // this is handled by match_range_end (but contrary to the other
    //    [\0-o].* |         // case, j is already consumed, so we do not check [\0-i].* )
    //    p
    //   )?
    // )

    // first case: start_key is exhausted, so it is a strict prefix of end_key
    let Some(start_range) = start_key.get(common_prefix_len) else {
        return match_range_end(&end_key[common_prefix_len..], &automaton, base_state);
    };

    // second case: both keys have a byte at common_prefix_len, and since
    // start_key < end_key, start_range < end_range
    let end_range = end_key[common_prefix_len];

    // things starting with start_range are handled by match_range_start below,
    // things starting with end_range are handled by match_range_end below.
    // this loop covers the bytes strictly in between; it can run for 0 iterations
    // in cases such as (abc, abd]
    for rb in (start_range + 1)..end_range {
        let new_state = automaton.accept(&base_state, rb);
        if automaton.can_match(&new_state) {
            return true;
        }
    }

    // keys sharing the diverging byte of start_key and sorting after start_key
    let state_for_start = automaton.accept(&base_state, *start_range);
    if match_range_start(
        &start_key[common_prefix_len + 1..],
        &automaton,
        state_for_start,
    ) {
        return true;
    }

    // keys sharing the diverging byte of end_key and sorting before or at end_key;
    // the key made of the common prefix plus end_range alone is checked first
    let state_for_end = automaton.accept(&base_state, end_range);
    if automaton.is_match(&state_for_end) {
        return true;
    }
    match_range_end(&end_key[common_prefix_len + 1..], &automaton, state_for_end)
}

/// Tells whether the automaton may accept a key sorting strictly after `start_key`.
///
/// `start_key` is the part of the lower bound that has not been fed to the
/// automaton yet, and `state` is the automaton state reached after the part that
/// has already been consumed.
fn match_range_start<S, A: Automaton<State = S>>(
    start_key: &[u8],
    automaton: &A,
    mut state: S,
) -> bool {
    // case (abcdgj, abcpqr], `abcd` is already consumed, we need to handle:
    // - [h-\xff].*
    // - g[k-\xff].*
    // - gj.+ == gj[\0-\xff].*

    for &key_byte in start_key {
        // optimisation only, not needed for correctness
        if !automaton.can_match(&state) {
            return false;
        }

        // the `[h-\xff].*` part: any byte strictly above the key byte. When the key
        // byte is 255 that range is empty, and `checked_add` yields `None`.
        if let Some(first_above) = key_byte.checked_add(1) {
            let any_above_can_match = (first_above..=u8::MAX)
                .any(|rb| automaton.can_match(&automaton.accept(&state, rb)));
            if any_above_can_match {
                return true;
            }
        }

        // consume the key byte itself (push g)
        state = automaton.accept(&state, key_byte);
    }

    // not required for correctness, but may save the 256 transitions below
    if !automaton.can_match(&state) {
        return false;
    }

    // the final `.+`, which is the same as `[\0-\xff].*`
    (0..=u8::MAX).any(|rb| automaton.can_match(&automaton.accept(&state, rb)))
}

/// Tells whether the automaton may accept a non-empty key sorting before or at
/// `end_key`.
///
/// `end_key` is the part of the upper bound that has not been fed to the automaton
/// yet, and `state` is the automaton state reached after the part that has already
/// been consumed. The empty continuation is not checked here.
fn match_range_end<S, A: Automaton<State = S>>(
    end_key: &[u8],
    automaton: &A,
    mut state: S,
) -> bool {
    // for (abcdef, abcmps]. the prefix `abcm` has been consumed, `[d-l].*` was handled elsewhere,
    // we just need to handle
    // - [\0-o].*
    // - p
    // - p[\0-r].*
    // - ps
    for &key_byte in end_key {
        // optimisation only, not needed for correctness
        if !automaton.can_match(&state) {
            return false;
        }

        // the `[\0-o].*` part: any byte strictly below the key byte
        let any_below_can_match =
            (0..key_byte).any(|rb| automaton.can_match(&automaton.accept(&state, rb)));
        if any_below_can_match {
            return true;
        }

        // consume the key byte itself (push p), then check the exact `p` case
        state = automaton.accept(&state, key_byte);
        if automaton.is_match(&state) {
            return true;
        }
    }
    false
}

#[cfg(test)]
pub(crate) mod tests {
    use proptest::prelude::*;
    use tantivy_fst::Automaton;

    use super::*;

    // Test automaton accepting exactly one byte string: the wrapped buffer.
    pub(crate) struct EqBuffer(pub Vec<u8>);

    impl Automaton for EqBuffer {
        // `Some(n)`: the first `n` bytes of the buffer were matched so far.
        // `None`: a mismatch occurred, nothing can match anymore.
        type State = Option<usize>;

        fn start(&self) -> Self::State {
            Some(0)
        }

        fn is_match(&self, state: &Self::State) -> bool {
            *state == Some(self.0.len())
        }

        fn accept(&self, state: &Self::State, byte: u8) -> Self::State {
            // Advance only if `byte` is the next expected byte; past the end of the
            // buffer `get` returns `None`, so any extra byte is a mismatch.
            state
                .filter(|pos| self.0.get(*pos) == Some(&byte))
                .map(|pos| pos + 1)
        }

        fn can_match(&self, state: &Self::State) -> bool {
            state.is_some()
        }

        fn will_always_match(&self, _state: &Self::State) -> bool {
            false
        }
    }

    fn gen_key_strategy() -> impl Strategy<Value = Vec<u8>> {
        // we only generate bytes in [0, 1, 2, 254, 255] to reduce the search space without
        // ignoring edge cases that might occur with integer over/underflow
        proptest::collection::vec(prop_oneof![0u8..=2, 254u8..=255], 0..5)
    }

    proptest! {
        #![proptest_config(ProptestConfig {
            cases: 10000, .. ProptestConfig::default()
        })]

        // With an automaton matching exactly `key`, a block (start, end] can match
        // if and only if `key` lies in that range.
        #[test]
        fn test_proptest_automaton_match_block(start in gen_key_strategy(), end in gen_key_strategy(), key in gen_key_strategy()) {
            let expected = start < key && end >= key;
            let automaton = EqBuffer(key);

            assert_eq!(can_block_match_automaton(Some(&start), &end, &automaton), expected);
        }

        // The first block has no lower bound: only the upper bound constrains `key`.
        #[test]
        fn test_proptest_automaton_match_first_block(end in gen_key_strategy(), key in gen_key_strategy()) {
            let expected = end >= key;
            let automaton = EqBuffer(key);
            assert_eq!(can_block_match_automaton(None, &end, &automaton), expected);
        }
    }
}


================================================
FILE: sstable/src/block_reader.rs
================================================
use std::io::{self, Read};
use std::ops::Range;

use common::OwnedBytes;
#[cfg(feature = "zstd-compression")]
use zstd::bulk::Decompressor;

/// Reads length-prefixed (and optionally zstd-compressed) blocks out of one or several
/// byte slices, exposing the content of the current block as a plain byte buffer.
pub struct BlockReader {
    /// Decoded content of the block loaded by the last successful `read_block` call.
    buffer: Vec<u8>,
    /// Raw, not yet consumed bytes of the input slice currently being read.
    reader: OwnedBytes,
    /// Input slices to switch to once `reader` is exhausted.
    next_readers: std::vec::IntoIter<OwnedBytes>,
    /// Read position inside `buffer`.
    offset: usize,
}

impl BlockReader {
    /// Creates a reader over a single slice of serialized blocks.
    pub fn new(reader: OwnedBytes) -> BlockReader {
        BlockReader {
            buffer: Vec::new(),
            reader,
            next_readers: Vec::new().into_iter(),
            offset: 0,
        }
    }

    /// Creates a reader over several slices of serialized blocks, consumed one after
    /// the other.
    ///
    /// An empty `readers` list yields a reader that contains no block.
    pub fn from_multiple_blocks(readers: Vec<OwnedBytes>) -> BlockReader {
        let mut next_readers = readers.into_iter();
        let reader = next_readers.next().unwrap_or_else(OwnedBytes::empty);
        BlockReader {
            buffer: Vec::new(),
            reader,
            next_readers,
            offset: 0,
        }
    }

    /// Decodes a vint-encoded `u64` at the current position of the block and moves
    /// past it.
    pub fn deserialize_u64(&mut self) -> u64 {
        let (num_bytes, val) = super::vint::deserialize_read(self.buffer());
        self.advance(num_bytes);
        val
    }

    /// Returns the bytes of the current block located at `range`.
    ///
    /// `range` is relative to the start of the block, not to the current offset.
    #[inline(always)]
    pub fn buffer_from_to(&self, range: Range<usize>) -> &[u8] {
        &self.buffer[range]
    }

    /// Loads the next block into the internal buffer and resets the offset to 0.
    ///
    /// Returns `Ok(true)` if a block was loaded. Returns `Ok(false)` when no block is
    /// left: either every input slice is exhausted, or a block length of 0 or 1 (that
    /// is, a block without payload) is encountered.
    ///
    /// # Errors
    ///
    /// - `UnexpectedEof` if the input stops in the middle of a length prefix or of a
    ///   block,
    /// - `Unsupported` if the block is compressed and the `zstd-compression` feature is
    ///   disabled,
    /// - any error reported by the decompressor.
    pub fn read_block(&mut self) -> io::Result<bool> {
        self.offset = 0;
        self.buffer.clear();

        loop {
            let block_len = match self.reader.len() {
                0 => {
                    // we are out of data for this block. Check if we have another block after
                    match self.next_readers.next() {
                        Some(new_reader) => {
                            self.reader = new_reader;
                            continue;
                        }
                        _ => {
                            return Ok(false);
                        }
                    }
                }
                1..=3 => {
                    return Err(io::Error::new(
                        io::ErrorKind::UnexpectedEof,
                        "failed to read block_len",
                    ));
                }
                _ => self.reader.read_u32() as usize,
            };
            if block_len <= 1 {
                return Ok(false);
            }
            // `block_len` counts the compression flag byte plus the payload. Check that all
            // of it is available *before* reading the flag: `read_u8` has no way to report a
            // failure, so an input truncated right after the length prefix has to be
            // rejected here (it presumably panicked inside `read_u8` otherwise).
            if self.reader.len() < block_len {
                return Err(io::Error::new(
                    io::ErrorKind::UnexpectedEof,
                    "failed to read block content",
                ));
            }
            let compress = self.reader.read_u8();
            let block_len = block_len - 1;

            if compress == 1 {
                #[cfg(feature = "zstd-compression")]
                {
                    // Fall back to 1MiB when the decompressed size cannot be derived from
                    // the compressed payload.
                    let required_capacity =
                        Decompressor::upper_bound(&self.reader[..block_len]).unwrap_or(1024 * 1024);
                    self.buffer.reserve(required_capacity);
                    Decompressor::new()?
                        .decompress_to_buffer(&self.reader[..block_len], &mut self.buffer)?;

                    self.reader.advance(block_len);
                }

                if cfg!(not(feature = "zstd-compression")) {
                    return Err(io::Error::new(
                        io::ErrorKind::Unsupported,
                        "zstd-compression feature is not enabled",
                    ));
                }
            } else {
                self.buffer.resize(block_len, 0u8);
                self.reader.read_exact(&mut self.buffer[..])?;
            }

            return Ok(true);
        }
    }

    /// Current read position inside the block.
    #[inline(always)]
    pub fn offset(&self) -> usize {
        self.offset
    }

    /// Moves the read position forward by `num_bytes`.
    ///
    /// No bound check is performed here: advancing past the end of the block makes the
    /// next call to `buffer()` panic.
    #[inline(always)]
    pub fn advance(&mut self, num_bytes: usize) {
        self.offset += num_bytes;
    }

    /// Bytes of the current block that have not been consumed yet.
    #[inline(always)]
    pub fn buffer(&self) -> &[u8] {
        &self.buffer[self.offset..]
    }
}

/// Reads from the not yet consumed part of the current block only.
///
/// None of these methods loads a further block: once the current block is exhausted,
/// `read` returns `Ok(0)`.
impl io::Read for BlockReader {
    /// Copies as many remaining bytes of the block as fit into `buf`.
    fn read(&mut self, buf: &mut [u8]) -> io::Result<usize> {
        let len = self.buffer().read(buf)?;
        self.advance(len);
        Ok(len)
    }

    /// Appends every remaining byte of the block to `buf` and returns how many bytes
    /// were appended.
    fn read_to_end(&mut self, buf: &mut Vec<u8>) -> io::Result<usize> {
        // Only the bytes after the current offset are left to read. Using the length of
        // the whole block here would over-report the count and push the offset past the
        // end of the block.
        let remaining = self.buffer();
        let len = remaining.len();
        buf.extend_from_slice(remaining);
        self.advance(len);
        Ok(len)
    }

    /// Fills `buf` entirely, or fails with `UnexpectedEof` if the block does not hold
    /// enough remaining bytes (in which case the offset is left untouched).
    fn read_exact(&mut self, buf: &mut [u8]) -> io::Result<()> {
        self.buffer().read_exact(buf)?;
        self.advance(buf.len());
        Ok(())
    }
}


================================================
FILE: sstable/src/delta.rs
================================================
use std::io::{self, BufWriter, Write};
use std::ops::Range;

use common::{CountingWriter, OwnedBytes};
#[cfg(feature = "zstd-compression")]
use zstd::bulk::Compressor;

use super::value::ValueWriter;
use super::{BlockReader, value, vint};

/// Keep/add lengths strictly below this limit are packed together into a single byte.
const FOUR_BIT_LIMITS: usize = 1 << 4;
/// Marker byte announcing that the keep/add lengths follow as two vints.
const VINT_MODE: u8 = 1u8;
/// Default size (in bytes) of the key buffer above which a block gets flushed.
const BLOCK_LEN: usize = 4_000;

/// Writes blocks of delta-encoded keys along with their values.
pub struct DeltaWriter<W, TValueWriter>
where W: io::Write
{
    /// Delta-encoded keys of the block being built (also reused as the compression
    /// output buffer while flushing).
    block: Vec<u8>,
    /// Destination of the serialized blocks; counts the bytes written so far.
    write: CountingWriter<BufWriter<W>>,
    /// Accumulates the values of the block being built.
    value_writer: TValueWriter,
    // Only here to avoid allocations.
    stateless_buffer: Vec<u8>,
    /// Size of `block` above which `flush_block_if_required` flushes.
    block_len: usize,
}

impl<W, TValueWriter> DeltaWriter<W, TValueWriter>
where
    W: io::Write,
    TValueWriter: ValueWriter,
{
    /// Creates a writer emitting its blocks into `wrt` (through a `BufWriter`).
    pub fn new(wrt: W) -> Self {
        let write = CountingWriter::wrap(BufWriter::new(wrt));
        DeltaWriter {
            block: Vec::with_capacity(BLOCK_LEN * 2),
            write,
            value_writer: TValueWriter::default(),
            stateless_buffer: Vec::new(),
            block_len: BLOCK_LEN,
        }
    }

    /// Overrides the key buffer size above which blocks get flushed.
    pub fn set_block_len(&mut self, block_len: usize) {
        self.block_len = block_len;
    }

    /// Writes the pending block, if any, and returns the byte range it occupies in the
    /// output.
    ///
    /// A block is serialized as a little-endian `u32` holding `payload length + 1`, a flag
    /// byte (1 if the payload is zstd-compressed, 0 otherwise), then the payload: the
    /// serialized values followed by the delta-encoded keys.
    ///
    /// Returns `Ok(None)` without writing anything if no key is pending.
    pub fn flush_block(&mut self) -> io::Result<Option<Range<usize>>> {
        if self.block.is_empty() {
            return Ok(None);
        }
        let start_offset = self.write.written_bytes() as usize;

        let scratch: &mut Vec<u8> = &mut self.stateless_buffer;
        self.value_writer.serialize_block(scratch);
        self.value_writer.clear();

        let block_len = scratch.len() + self.block.len();
        // Compression is only attempted on blocks larger than 2048 bytes.
        let try_compression = cfg!(feature = "zstd-compression") && block_len > 2048;

        if !try_compression {
            let header = (block_len as u32 + 1).to_le_bytes();
            self.write.write_all(&header)?;
            self.write.write_all(&[0])?;
            self.write.write_all(scratch.as_slice())?;
            self.write.write_all(self.block.as_slice())?;
        } else {
            #[cfg(feature = "zstd-compression")]
            {
                // Gather values and keys in `scratch`, so that `block` can receive the
                // compressed output.
                scratch.extend_from_slice(&self.block);
                self.block.clear();

                let max_len = zstd::zstd_safe::compress_bound(scratch.len());
                self.block.reserve(max_len);
                Compressor::new(3)?.compress_to_buffer(scratch.as_slice(), &mut self.block)?;

                // only keep the compressed form if it is actually smaller
                let compression_helped = self.block.len() < scratch.len();
                if compression_helped {
                    let header = (self.block.len() as u32 + 1).to_le_bytes();
                    self.write.write_all(&header)?;
                    self.write.write_all(&[1])?;
                    self.write.write_all(self.block.as_slice())?;
                } else {
                    let header = (block_len as u32 + 1).to_le_bytes();
                    self.write.write_all(&header)?;
                    self.write.write_all(&[0])?;
                    self.write.write_all(scratch.as_slice())?;
                }
            }
        }

        let end_offset = self.write.written_bytes() as usize;
        self.block.clear();
        scratch.clear();
        Ok(Some(start_offset..end_offset))
    }

    /// Appends the `(keep_len, add_len)` header of a key to the block.
    ///
    /// When both lengths are below `FOUR_BIT_LIMITS`, they share a single byte (`keep_len`
    /// in the low nibble, `add_len` in the high one). Otherwise the `VINT_MODE` marker is
    /// written, followed by both lengths as vints.
    fn encode_keep_add(&mut self, keep_len: usize, add_len: usize) {
        let fits_in_nibbles = keep_len < FOUR_BIT_LIMITS && add_len < FOUR_BIT_LIMITS;
        if fits_in_nibbles {
            self.block.push((keep_len | (add_len << 4)) as u8);
            return;
        }
        let mut buf = [VINT_MODE; 20];
        let keep_end = 1 + vint::serialize(keep_len as u64, &mut buf[1..]);
        let add_end = keep_end + vint::serialize(add_len as u64, &mut buf[keep_end..]);
        self.block.extend_from_slice(&buf[..add_end]);
    }

    /// Appends a key, expressed as the number of leading bytes it shares with the previous
    /// key (`common_prefix_len`) and the bytes that follow (`suffix`).
    pub(crate) fn write_suffix(&mut self, common_prefix_len: usize, suffix: &[u8]) {
        self.encode_keep_add(common_prefix_len, suffix.len());
        self.block.extend_from_slice(suffix);
    }

    /// Hands `value` over to the value writer of the current block.
    pub(crate) fn write_value(&mut self, value: &TValueWriter::Value) {
        self.value_writer.write(value);
    }

    /// Flushes the pending block if its keys outgrew the configured block length.
    ///
    /// Returns the byte range of the flushed block, or `Ok(None)` if nothing was flushed.
    pub fn flush_block_if_required(&mut self) -> io::Result<Option<Range<usize>>> {
        if self.block.len() <= self.block_len {
            return Ok(None);
        }
        self.flush_block()
    }

    /// Consumes the writer and returns the underlying output.
    ///
    /// The pending block is NOT flushed by this call.
    pub fn finish(self) -> CountingWriter<BufWriter<W>> {
        self.write
    }
}

/// Iterates over the delta-encoded (key, value) entries of a sequence of blocks.
pub struct DeltaReader<TValueReader> {
    /// Number of leading bytes the current key shares with the previous one.
    common_prefix_len: usize,
    /// Location, inside the current block, of the bytes the current key adds.
    suffix_range: Range<usize>,
    /// Holds the values of the current block.
    value_reader: TValueReader,
    /// Source of the blocks.
    block_reader: BlockReader,
    /// Index of the current entry within the current block.
    idx: usize,
}

impl<TValueReader> DeltaReader<TValueReader>
where TValueReader: value::ValueReader
{
    pub fn new(reader: OwnedBytes) -> Self {
        DeltaReader {
            idx: 0,
            common_prefix_len: 0,
            suffix_range: 0..0,
            value_reader: TValueReader::default(),
            block_reader: BlockReader::new(reader),
        }
    }

    pub fn from_multiple_blocks(reader: Vec<OwnedBytes>) -> Self {
        DeltaReader {
            idx: 0,
            common_prefix_len: 0,
            suffix_range: 0..0,
            value_reader: TValueReader::default(),
            block_reader: BlockReader::from_multiple_blocks(reader),
        }
    }

    pub fn empty() -> Self {
        DeltaReader::new(OwnedBytes::empty())
    }

    fn deserialize_vint(&mut self) -> u64 {
        self.block_reader.deserialize_u64()
    }

    fn read_keep_add(&mut self) -> Option<(usize, usize)> {
        let b = {
            let buf = &self.block_reader.buffer();
            if buf.is_empty() {
                return None;
            }
            buf[0]
        };
        self.block_reader.advance(1);
        match b {
            VINT_MODE => {
                let keep = self.deserialize_vint() as usize;
                let add = self.deserialize_vint() as usize;
                Some((keep, add))
            }
            b => {
                let keep = (b & 0b1111) as usize;
                let add = (b >> 4) as usize;
                Some((keep, add))
            }
        }
    }

    fn read_delta_key(&mut self) -> bool {
        let Some((keep, add)) = self.read_keep_add() else {
            return false;
        };
        self.common_prefix_len = keep;
        let suffix_start = self.block_reader.offset();
        self.suffix_range = suffix_start..(suffix_start + add);
        self.block_reader.advance(add);
        true
    }

    pub fn advance(&mut self) -> io::Result<bool> {
        if self.block_reader.buffer().is_empty() {
            if !self.block_reader.read_block()? {
                return Ok(false);
            }
            let consumed_len = self.value_reader.load(self.block_reader.buffer())?;
            self.block_reader.advance(consumed_len);
            self.idx = 0;
        } else {
            self.idx += 1;
        }
        if !self.read_delta_key() {
            return Ok(false);
        }
        Ok(true)
    }

    #[inline(always)]
    pub fn common_prefix_len(&self) -> usize {
        self.common_prefix_len
    }

    #[inline(always)]
    pub fn suffix(&self) -> &[u8] {
        self.block_reader.buffer_from_to(self.suffix_range.clone())
    }

    #[inline(always)]
    pub fn value(&self) -> &TValueReader::Value {
        self.value_reader.value(self.idx)
    }
}

#[cfg(test)]
mod tests {
    use super::DeltaReader;
    use crate::value::U64MonotonicValueReader;

    /// An empty reader reports the absence of entries instead of failing.
    #[test]
    fn test_empty() {
        let mut reader = DeltaReader::<U64MonotonicValueReader>::empty();
        let has_entry = reader.advance().unwrap();
        assert!(!has_entry);
    }
}


================================================
FILE: sstable/src/dictionary.rs
================================================
#![allow(clippy::needless_borrows_for_generic_args)]

use std::cmp::Ordering;
use std::io;
use std::marker::PhantomData;
use std::ops::{Bound, RangeBounds};
use std::sync::Arc;

use common::bounds::{TransformBound, transform_bound_inner_res};
use common::file_slice::FileSlice;
use common::{BinarySerializable, ByteCount, OwnedBytes};
use futures_util::{StreamExt, TryStreamExt, stream};
use itertools::Itertools;
use tantivy_fst::Automaton;
use tantivy_fst::automaton::AlwaysMatch;

use crate::sstable_index_v3::SSTableIndexV3Empty;
use crate::streamer::{Streamer, StreamerBuilder};
use crate::{
    BlockAddr, DeltaReader, Reader, SSTable, SSTableIndex, SSTableIndexV3, TermOrdinal, VoidSSTable,
};

/// An SSTable is a sorted map that associates sorted `&[u8]` keys
/// to any kind of typed values.
///
/// The SSTable is organized in blocks.
/// In each block, keys and values are encoded separately.
///
/// The keys are encoded using incremental encoding.
/// The values on the other hand, are encoded according to a value-specific
/// codec defined in the TSSTable generic argument.
///
/// Finally, an index is joined to the Dictionary to make it possible,
/// given a key, to identify which block contains this key.
///
/// The codec was designed in such a way that the sstable
/// reader is not aware of blocks, and yet can read any sequence of blocks,
/// as long as the slice of bytes it is given starts and stops at
/// a block boundary.
///
/// (See also README.md)
#[derive(Debug, Clone)]
pub struct Dictionary<TSSTable: SSTable = VoidSSTable> {
    /// Part of the file holding the blocks (everything located before the index).
    pub sstable_slice: FileSlice,
    /// Index used to locate the block of a given key or ordinal.
    pub sstable_index: SSTableIndex,
    /// Size of the whole dictionary file, index and footer included.
    num_bytes: ByteCount,
    /// Number of terms, as recorded in the footer.
    num_terms: u64,
    phantom_data: PhantomData<TSSTable>,
}

impl Dictionary<VoidSSTable> {
    /// Builds an in-memory dictionary holding `terms` (with no associated value).
    ///
    /// The terms do not need to be sorted: a sorted copy is inserted.
    ///
    /// # Panics
    ///
    /// Panics if building or re-opening the dictionary fails.
    pub fn build_for_tests(terms: &[&str]) -> Dictionary {
        let mut sorted_terms: Vec<&str> = terms.to_vec();
        sorted_terms.sort();

        let mut serialized = Vec::new();
        let mut writer = Self::builder(&mut serialized).unwrap();
        for term in sorted_terms {
            writer.insert(term, &()).unwrap();
        }
        writer.finish().unwrap();

        let bytes = OwnedBytes::new(serialized);
        Dictionary::from_bytes(bytes).unwrap()
    }
}

/// Outcome of looking a term up: either its own ordinal, or the ordinal of the term
/// that comes right after it.
#[derive(Debug, Clone, PartialEq, Eq)]
pub enum TermOrdHit {
    /// Exact term ord hit
    Exact(TermOrdinal),
    /// Next best term ordinal
    Next(TermOrdinal),
}

impl TermOrdHit {
    /// Keeps the ordinal of an exact hit and discards a "next" hit.
    fn into_exact(self) -> Option<TermOrdinal> {
        if let Self::Exact(ord) = self {
            Some(ord)
        } else {
            None
        }
    }

    /// Applies `f` to the ordinal while preserving the kind of hit.
    fn map<F: FnOnce(TermOrdinal) -> TermOrdinal>(self, f: F) -> Self {
        match self {
            Self::Exact(ord) => Self::Exact(f(ord)),
            Self::Next(ord) => Self::Next(f(ord)),
        }
    }
}

impl<TSSTable: SSTable> Dictionary<TSSTable> {
    /// Creates a writer serializing a dictionary of this sstable type into `wrt`.
    pub fn builder<W: io::Write>(wrt: W) -> io::Result<crate::Writer<W, TSSTable::ValueWriter>> {
        let writer = TSSTable::writer(wrt);
        Ok(writer)
    }

    pub(crate) fn sstable_reader_block(
        &self,
        block_addr: BlockAddr,
    ) -> io::Result<Reader<TSSTable::ValueReader>> {
        let data = self.sstable_slice.read_bytes_slice(block_addr.byte_range)?;
        Ok(TSSTable::reader(data))
    }

    /// Asynchronously builds a `DeltaReader` over the blocks that may hold keys of
    /// `key_range` accepted by `automaton`.
    ///
    /// If the automaton accepts everything, one contiguous slice is read (honoring `limit`).
    /// Otherwise only the blocks the automaton may match are fetched, up to 5 reads at a
    /// time, and blocks separated by at most `merge_holes_under_bytes` bytes are fetched
    /// as one read. `limit` is not used in that second case.
    pub(crate) async fn sstable_delta_reader_for_key_range_async(
        &self,
        key_range: impl RangeBounds<[u8]>,
        limit: Option<u64>,
        automaton: &impl Automaton,
        merge_holes_under_bytes: usize,
    ) -> io::Result<DeltaReader<TSSTable::ValueReader>> {
        if automaton.will_always_match(&automaton.start()) {
            let data = self
                .file_slice_for_range(key_range, limit)
                .read_bytes_async()
                .await?;
            return Ok(TSSTable::delta_reader(data));
        }

        let block_addrs = self.get_block_iterator_for_range_and_automaton(
            key_range,
            automaton,
            merge_holes_under_bytes,
        );
        let data = stream::iter(block_addrs)
            .map(|block_addr| {
                self.sstable_slice
                    .read_bytes_slice_async(block_addr.byte_range)
            })
            .buffered(5)
            .try_collect::<Vec<_>>()
            .await?;
        Ok(DeltaReader::from_multiple_blocks(data))
    }

    /// Builds a `DeltaReader` over the blocks that may hold keys of `key_range` accepted
    /// by `automaton`.
    ///
    /// If the automaton accepts everything, one contiguous slice is read (honoring `limit`).
    /// Otherwise only the blocks the automaton may match are read, one by one; `limit` is
    /// not used in that case.
    pub(crate) fn sstable_delta_reader_for_key_range(
        &self,
        key_range: impl RangeBounds<[u8]>,
        limit: Option<u64>,
        automaton: &impl Automaton,
    ) -> io::Result<DeltaReader<TSSTable::ValueReader>> {
        if automaton.will_always_match(&automaton.start()) {
            let data = self.file_slice_for_range(key_range, limit).read_bytes()?;
            return Ok(TSSTable::delta_reader(data));
        }

        // Sync reads are assumed to have close to no latency, so there is no point in
        // merging blocks across holes (hence the 0).
        let mut data = Vec::new();
        for block_addr in self.get_block_iterator_for_range_and_automaton(key_range, automaton, 0)
        {
            data.push(self.sstable_slice.read_bytes_slice(block_addr.byte_range)?);
        }
        Ok(DeltaReader::from_multiple_blocks(data))
    }

    pub(crate) fn sstable_delta_reader_block(
        &self,
        block_addr: BlockAddr,
    ) -> io::Result<DeltaReader<TSSTable::ValueReader>> {
        let data = self.sstable_slice.read_bytes_slice(block_addr.byte_range)?;
        Ok(TSSTable::delta_reader(data))
    }

    pub(crate) async fn sstable_delta_reader_block_async(
        &self,
        block_addr: BlockAddr,
    ) -> io::Result<DeltaReader<TSSTable::ValueReader>> {
        let data = self
            .sstable_slice
            .read_bytes_slice_async(block_addr.byte_range)
            .await?;
        Ok(TSSTable::delta_reader(data))
    }

    /// Returns a file slice covering the sstable blocks that include the key range
    /// passed as argument. When `limit` is set, the slice may be cut short so as to
    /// only cover blocks for up to `limit` matching terms.
    ///
    /// It works by identifying
    /// - `first_block`: the block containing the start boundary key
    /// - `last_block`: the block containing the end boundary key.
    ///
    /// And then returning the range that spans over all the blocks in between,
    /// `first_block` and `last_block` included, aka:
    /// `[first_block.start_offset .. last_block.end_offset)`
    ///
    /// An empty slice is returned if no block can be located for the start key.
    ///
    /// Technically this function does not provide the tightest fit, as
    /// for simplification, it treats the start bound of the `key_range`
    /// as if it was inclusive, even if it is exclusive.
    /// In the rare edge case where a user asks for `(start_key, end_key]`
    /// and `start_key` happens to be the last key of a block, the returned
    /// slice includes that first block even though it was not necessary.
    pub fn file_slice_for_range(
        &self,
        key_range: impl RangeBounds<[u8]>,
        limit: Option<u64>,
    ) -> FileSlice {
        let first_block_id = match key_range.start_bound() {
            Bound::Unbounded => None,
            Bound::Included(key) | Bound::Excluded(key) => {
                match self.sstable_index.locate_with_key(key) {
                    Some(block_id) => Some(block_id),
                    None => return FileSlice::empty(),
                }
            }
        };

        let key_last_block_id = match key_range.end_bound() {
            Bound::Unbounded => None,
            Bound::Included(key) | Bound::Excluded(key) => self.sstable_index.locate_with_key(key),
        };

        let start_bound = match first_block_id {
            None => Bound::Unbounded,
            Some(block_id) => match self.sstable_index.get_block(block_id) {
                Some(block_addr) => Bound::Included(block_addr.byte_range.start),
                None => return FileSlice::empty(),
            },
        };

        // Block in which the `limit`-th term counted from the start of the second block
        // lies, if a limit was requested and that second block exists.
        let limit_last_block_id = limit.and_then(|limit| {
            let second_block_id = first_block_id.map_or(0, |id| id + 1);
            let second_block_addr = self.sstable_index.get_block(second_block_id)?;
            let ordinal_limit = second_block_addr.first_ordinal + limit;
            Some(self.sstable_index.locate_with_ord(ordinal_limit))
        });

        // Stop at whichever comes first: the end key or the limit.
        let last_block_id = match (key_last_block_id, limit_last_block_id) {
            (Some(by_key), Some(by_limit)) => Some(by_key.min(by_limit)),
            (by_key, by_limit) => by_limit.or(by_key),
        };

        let end_bound = match last_block_id.and_then(|id| self.sstable_index.get_block(id)) {
            Some(block_addr) => Bound::Excluded(block_addr.byte_range.end),
            None => Bound::Unbounded,
        };

        self.sstable_slice.slice((start_bound, end_bound))
    }

    /// Iterates over the addresses of the blocks that both overlap `key_range` and are
    /// reported by the index as possibly matching `automaton`.
    ///
    /// Successive blocks whose gap is at most `merge_holes_under_bytes` bytes are merged
    /// into a single address spanning both of them (and whatever lies in between).
    fn get_block_iterator_for_range_and_automaton<'a>(
        &'a self,
        key_range: impl RangeBounds<[u8]>,
        automaton: &'a impl Automaton,
        merge_holes_under_bytes: usize,
    ) -> impl Iterator<Item = BlockAddr> + 'a {
        // Block id for a bound of the key range. A key for which no block is located maps
        // to `u64::MAX`.
        let locate_or = |bound: Bound<&[u8]>, unbounded_default: u64| match bound {
            Bound::Included(key) | Bound::Excluded(key) => {
                self.sstable_index.locate_with_key(key).unwrap_or(u64::MAX)
            }
            Bound::Unbounded => unbounded_default,
        };
        let first_block_id = locate_or(key_range.start_bound(), 0);
        let last_block_id = locate_or(key_range.end_bound(), u64::MAX);
        let block_range = first_block_id..=last_block_id;

        self.sstable_index
            .get_block_for_automaton(automaton)
            .filter(move |(block_id, _)| block_range.contains(block_id))
            .map(|(_, block_addr)| block_addr)
            .coalesce(move |first, second| {
                let hole_is_small =
                    first.byte_range.end + merge_holes_under_bytes >= second.byte_range.start;
                if !hole_is_small {
                    return Err((first, second));
                }
                Ok(BlockAddr {
                    first_ordinal: first.first_ordinal,
                    byte_range: first.byte_range.start..second.byte_range.end,
                })
            })
    }

    /// Opens a `TermDictionary`.
    ///
    /// The file ends with a 20-byte footer: the offset of the index (`u64`), the number
    /// of terms (`u64`) and the format version (`u32`). Versions 2 and 3 are supported.
    ///
    /// # Errors
    ///
    /// Fails if the file cannot be read, if the index cannot be loaded (`InvalidData`),
    /// or if the version is not supported.
    pub fn open(term_dictionary_file: FileSlice) -> io::Result<Self> {
        fn corruption_error() -> io::Error {
            io::Error::new(io::ErrorKind::InvalidData, "SSTable corruption")
        }

        let num_bytes = term_dictionary_file.num_bytes();
        let (main_slice, footer_slice) = term_dictionary_file.split_from_end(20);
        let mut footer_bytes: OwnedBytes = footer_slice.read_bytes()?;
        let index_offset = u64::deserialize(&mut footer_bytes)?;
        let num_terms = u64::deserialize(&mut footer_bytes)?;
        let version = u32::deserialize(&mut footer_bytes)?;
        let (sstable_slice, index_slice) = main_slice.split(index_offset as usize);
        let sstable_index_bytes = index_slice.read_bytes()?;

        let sstable_index = match version {
            2 => {
                let index = crate::sstable_index_v2::SSTableIndex::load(sstable_index_bytes)
                    .map_err(|_| corruption_error())?;
                SSTableIndex::V2(index)
            }
            3 => {
                // the v3 index is followed by its own 8-byte footer
                let (sstable_index_bytes, mut store_offset_bytes) = sstable_index_bytes.rsplit(8);
                let store_offset = u64::deserialize(&mut store_offset_bytes)?;
                if store_offset == 0 {
                    // if store_offset is zero, there is no index, so we build a pseudo-index
                    // assuming a single block of sstable covering everything.
                    SSTableIndex::V3Empty(SSTableIndexV3Empty::load(index_offset as usize))
                } else {
                    let index = SSTableIndexV3::load(sstable_index_bytes, store_offset)
                        .map_err(|_| corruption_error())?;
                    SSTableIndex::V3(index)
                }
            }
            _ => {
                return Err(io::Error::other(format!(
                    "Unsupported sstable version, expected one of [2, 3], found {version}"
                )));
            }
        };

        Ok(Dictionary {
            sstable_slice,
            sstable_index,
            num_bytes,
            num_terms,
            phantom_data: PhantomData,
        })
    }

    /// Creates a term dictionary from the supplied bytes.
    pub fn from_bytes(owned_bytes: OwnedBytes) -> io::Result<Self> {
        Dictionary::open(FileSlice::new(Arc::new(owned_bytes)))
    }

    /// Creates a term dictionary holding no term at all.
    ///
    /// It is obtained by serializing an empty dictionary in memory and opening the result.
    pub fn empty() -> Self {
        let writer = Self::builder(Vec::<u8>::new())
            .expect("Creating a TermDictionaryBuilder in a Vec<u8> should never fail");
        let term_dictionary_data: Vec<u8> = writer
            .finish()
            .expect("Writing in a Vec<u8> should never fail");
        Dictionary::open(FileSlice::from(term_dictionary_data)).unwrap()
    }

    /// Number of terms held by the dictionary.
    ///
    /// Valid term ordinals are `0..num_terms()`.
    pub fn num_terms(&self) -> usize {
        let num_terms: u64 = self.num_terms;
        num_terms as usize
    }

    /// Returns the total number of bytes used by the dictionary on disk.
    pub fn num_bytes(&self) -> ByteCount {
        self.num_bytes
    }

    /// Advances `sstable_delta_reader` up to `key` and returns the number of entries
    /// that precede it in the reader.
    ///
    /// Returns `Ok(None)` if the key was not found.
    /// After a successful lookup, `DeltaReader::value` gives access to the value
    /// associated with the key.
    fn decode_up_to_key<K: AsRef<[u8]>>(
        &self,
        key: K,
        sstable_delta_reader: &mut DeltaReader<TSSTable::ValueReader>,
    ) -> io::Result<Option<TermOrdinal>> {
        let hit = self.decode_up_to_or_next(key, sstable_delta_reader)?;
        Ok(hit.into_exact())
    }
    /// Decode a DeltaReader up to key, returning the number of terms traversed
    ///
    /// If the key was found, the number of entries preceding it is returned as
    /// `TermOrdHit::Exact`. If the key was not found, it returns (as `TermOrdHit::Next`)
    /// the position of the first entry greater than the key, or the number of entries
    /// read if there is no such entry.
    ///
    /// The returned ordinal is relative to the first entry yielded by the reader.
    fn decode_up_to_or_next<K: AsRef<[u8]>>(
        &self,
        key: K,
        sstable_delta_reader: &mut DeltaReader<TSSTable::ValueReader>,
    ) -> io::Result<TermOrdHit> {
        let mut term_ord = 0;
        let key_bytes = key.as_ref();
        // Number of leading bytes of `key` known to be shared with the entries decoded so
        // far. Entries are never materialized: only prefix lengths and suffixes are compared.
        let mut ok_bytes = 0;
        while sstable_delta_reader.advance()? {
            let prefix_len = sstable_delta_reader.common_prefix_len();
            let suffix = sstable_delta_reader.suffix();

            match prefix_len.cmp(&ok_bytes) {
                Ordering::Less => return Ok(TermOrdHit::Next(term_ord)), /* popped bytes already matched => too far */
                Ordering::Equal => (),
                Ordering::Greater => {
                    // the ok prefix is less than current entry prefix => continue to next elem
                    term_ord += 1;
                    continue;
                }
            }

            // we have ok_bytes byte of common prefix, check if this key adds more
            for (key_byte, suffix_byte) in key_bytes[ok_bytes..].iter().zip(suffix) {
                match suffix_byte.cmp(key_byte) {
                    Ordering::Less => break,          // byte too small
                    Ordering::Equal => ok_bytes += 1, // new matching byte
                    Ordering::Greater => return Ok(TermOrdHit::Next(term_ord)), // too far
                }
            }

            // every byte of the key has been matched: this entry either is the key, or
            // merely starts with it
            if ok_bytes == key_bytes.len() {
                if prefix_len + suffix.len() == ok_bytes {
                    return Ok(TermOrdHit::Exact(term_ord));
                } else {
                    // current key is a prefix of current element, not a match
                    return Ok(TermOrdHit::Next(term_ord));
                }
            }

            term_ord += 1;
        }

        // the reader was exhausted without reaching the key
        Ok(TermOrdHit::Next(term_ord))
    }

    /// Looks up the ordinal of `key`.
    ///
    /// Returns `Ok(None)` if the key is not in the dictionary.
    pub fn term_ord<K: AsRef<[u8]>>(&self, key: K) -> io::Result<Option<TermOrdinal>> {
        let key_bytes = key.as_ref();

        let block_addr = match self.sstable_index.get_block_with_key(key_bytes) {
            Some(block_addr) => block_addr,
            None => return Ok(None),
        };

        // The lookup inside the block is relative to the first ordinal of that block.
        let first_ordinal = block_addr.first_ordinal;
        let mut delta_reader = self.sstable_delta_reader_block(block_addr)?;
        let ord_in_block = self.decode_up_to_key(key_bytes, &mut delta_reader)?;
        Ok(ord_in_block.map(|ord| ord + first_ordinal))
    }

    /// Looks up the ordinal of `key`, falling back to the ordinal of the closest
    /// following term if the key is not in the dictionary.
    ///
    /// That following term may not exist. In particular, `TermOrdHit::Next(u64::MAX)` is
    /// returned when no block can be located for the key.
    pub fn term_ord_or_next<K: AsRef<[u8]>>(&self, key: K) -> io::Result<TermOrdHit> {
        let key_bytes = key.as_ref();

        let block_addr = match self.sstable_index.get_block_with_key(key_bytes) {
            Some(block_addr) => block_addr,
            // TODO: Would be more consistent to return last_term id + 1
            None => return Ok(TermOrdHit::Next(u64::MAX)),
        };

        // The lookup inside the block is relative to the first ordinal of that block.
        let first_ordinal = block_addr.first_ordinal;
        let mut delta_reader = self.sstable_delta_reader_block(block_addr)?;
        let hit_in_block = self.decode_up_to_or_next(key_bytes, &mut delta_reader)?;
        Ok(hit_in_block.map(|ord| ord + first_ordinal))
    }

    /// Converts a pair of term bounds into a pair of term ordinal bounds.
    ///
    /// Special care is taken of bounds that are not exactly in the dictionary:
    /// the ordinal of the next term is used, and the kind of bound is adjusted.
    /// e.g. [bbb, ddd]
    /// lower_bound: Bound::Included(aaa) => Included(0) // "Next" term id
    /// lower_bound: Bound::Excluded(aaa) => Included(0) // "Next" term id + Change the Bounds
    /// lower_bound: Bound::Included(ccc) => Included(1) // "Next" term id
    /// lower_bound: Bound::Excluded(ccc) => Included(1) // "Next" term id + Change the Bounds
    /// lower_bound: Bound::Included(zzz) => Included(2) // "Next" term id
    /// lower_bound: Bound::Excluded(zzz) => Included(2) // "Next" term id + Change the Bounds
    /// For zzz we should have some post processing to return an empty query
    ///
    /// upper_bound: Bound::Included(aaa) => Excluded(0) // "Next" term id + Change the bounds
    /// upper_bound: Bound::Excluded(aaa) => Excluded(0) // "Next" term id
    /// upper_bound: Bound::Included(ccc) => Excluded(1) // Next term id + Change the bounds
    /// upper_bound: Bound::Excluded(ccc) => Excluded(1) // Next term id
    /// upper_bound: Bound::Included(zzz) => Excluded(2) // Next term id + Change the bounds
    /// upper_bound: Bound::Excluded(zzz) => Excluded(2) // Next term id
    pub fn term_bounds_to_ord<K: AsRef<[u8]>>(
        &self,
        lower_bound: Bound<K>,
        upper_bound: Bound<K>,
    ) -> io::Result<(Bound<TermOrdinal>, Bound<TermOrdinal>)> {
        let lower_ord_bound = transform_bound_inner_res(&lower_bound, |start_bound_bytes| {
            Ok(match self.term_ord_or_next(start_bound_bytes)? {
                TermOrdHit::Exact(ord) => TransformBound::Existing(ord),
                // missing term: the range starts at the next term, which is included
                TermOrdHit::Next(ord) => TransformBound::NewBound(Bound::Included(ord)),
            })
        })?;
        let upper_ord_bound = transform_bound_inner_res(&upper_bound, |end_bound_bytes| {
            Ok(match self.term_ord_or_next(end_bound_bytes)? {
                TermOrdHit::Exact(ord) => TransformBound::Existing(ord),
                // missing term: the range stops before the next term, which is excluded
                TermOrdHit::Next(ord) => TransformBound::NewBound(Bound::Excluded(ord)),
            })
        })?;
        Ok((lower_ord_bound, upper_ord_bound))
    }

    /// Writes the term of ordinal `ord` into `bytes`.
    ///
    /// Term ordinals are defined as the position of the term in
    /// the sorted list of terms.
    ///
    /// Returns true if and only if the term has been found.
    ///
    /// Regardless of whether the term is found or not,
    /// the buffer may be modified.
    pub fn ord_to_term(&self, ord: TermOrdinal, bytes: &mut Vec<u8>) -> io::Result<bool> {
        // locate the block in which the term would be
        let block_addr = self.sstable_index.get_block_with_ord(ord);
        let block_first_ordinal = block_addr.first_ordinal;

        // Keys are delta-encoded, so every key of the block up to `ord` has to be replayed
        // into `bytes` to rebuild the requested term.
        let mut delta_reader = self.sstable_delta_reader_block(block_addr)?;
        for _current_ord in block_first_ordinal..=ord {
            let has_entry = delta_reader.advance()?;
            if !has_entry {
                return Ok(false);
            }
            let kept_len = delta_reader.common_prefix_len();
            bytes.truncate(kept_len);
            bytes.extend_from_slice(delta_reader.suffix());
        }
        Ok(true)
    }

    /// Returns the terms for a _sorted_ list of term ordinals.
    ///
    /// `cb` is invoked once per ordinal yielded by `ords` (duplicates included), with the bytes
    /// of the matching term. An error returned by `cb` stops the iteration and is propagated.
    ///
    /// Returns true if and only if all terms have been found. An empty `ords` iterator
    /// returns true without calling `cb`.
    ///
    /// # Panics
    ///
    /// Panics if `ords` yields an ordinal smaller than the previous one.
    pub fn sorted_ords_to_term_cb<F: FnMut(&[u8]) -> io::Result<()>>(
        &self,
        mut ords: impl Iterator<Item = TermOrdinal>,
        mut cb: F,
    ) -> io::Result<bool> {
        let Some(mut ord) = ords.next() else {
            return Ok(true);
        };

        // Open the block for the first ordinal.
        let mut bytes = Vec::new();
        let mut current_block_addr = self.sstable_index.get_block_with_ord(ord);
        let mut current_sstable_delta_reader =
            self.sstable_delta_reader_block(current_block_addr.clone())?;
        // Ordinal of the next entry the delta reader will decode.
        let mut current_block_ordinal = current_block_addr.first_ordinal;

        loop {
            // move to the ord inside the current block
            while current_block_ordinal <= ord {
                if !current_sstable_delta_reader.advance()? {
                    // The block ran out of entries before reaching `ord`.
                    return Ok(false);
                }
                // Rebuild the full key: keep the shared prefix, append the new suffix.
                bytes.truncate(current_sstable_delta_reader.common_prefix_len());
                bytes.extend_from_slice(current_sstable_delta_reader.suffix());
                current_block_ordinal += 1;
            }
            cb(&bytes)?;

            // fetch the next ordinal
            let Some(next_ord) = ords.next() else {
                return Ok(true);
            };

            // advance forward if the new ord is different than the one we just processed
            //
            // this allows the input TermOrdinal iterator to contain duplicates, so long as it's
            // still sorted
            if next_ord < ord {
                panic!("Ordinals were not sorted: received {next_ord} after {ord}");
            } else if next_ord > ord {
                // check if block changed for new term_ord
                let new_block_addr = self.sstable_index.get_block_with_ord(next_ord);
                if new_block_addr != current_block_addr {
                    // Switch to the new block and restart decoding from its first entry.
                    current_block_addr = new_block_addr;
                    current_block_ordinal = current_block_addr.first_ordinal;
                    current_sstable_delta_reader =
                        self.sstable_delta_reader_block(current_block_addr.clone())?;
                    bytes.clear();
                }
                ord = next_ord;
            } else {
                // The next ord is equal to the previous ord: no need to seek or advance.
            }
        }
    }

    /// Returns the value associated with the term at ordinal `term_ord`.
    ///
    /// Returns `Ok(None)` if the block that should contain `term_ord` runs out of entries
    /// before reaching that ordinal.
    pub fn term_info_from_ord(&self, term_ord: TermOrdinal) -> io::Result<Option<TSSTable::Value>> {
        // Only the block that would hold `term_ord` needs to be decoded.
        let block_addr = self.sstable_index.get_block_with_ord(term_ord);
        let block_start_ord = block_addr.first_ordinal;
        let mut reader = self.sstable_reader_block(block_addr)?;

        // Step through the block until the reader sits on `term_ord`.
        for _ in block_start_ord..=term_ord {
            let has_entry = reader.advance()?;
            if !has_entry {
                return Ok(None);
            }
        }
        let value = reader.value().clone();
        Ok(Some(value))
    }

    /// Looks up the value stored for `key`.
    ///
    /// Returns `Ok(None)` when the index finds no block that could hold `key`, or when the
    /// key is absent from that block.
    pub fn get<K: AsRef<[u8]>>(&self, key: K) -> io::Result<Option<TSSTable::Value>> {
        let Some(block_addr) = self.sstable_index.get_block_with_key(key.as_ref()) else {
            return Ok(None);
        };
        let delta_reader = self.sstable_delta_reader_block(block_addr)?;
        self.do_get(key, delta_reader)
    }

    /// Looks up the value stored for `key`, loading the relevant block asynchronously.
    ///
    /// Returns `Ok(None)` when the index finds no block that could hold `key`, or when the
    /// key is absent from that block.
    pub async fn get_async<K: AsRef<[u8]>>(&self, key: K) -> io::Result<Option<TSSTable::Value>> {
        let Some(block_addr) = self.sstable_index.get_block_with_key(key.as_ref()) else {
            return Ok(None);
        };
        let delta_reader = self.sstable_delta_reader_block_async(block_addr).await?;
        self.do_get(key, delta_reader)
    }

    /// Decodes `reader` up to `key` and, if the key is found, returns a clone of the value
    /// the reader is positioned on.
    fn do_get<K: AsRef<[u8]>>(
        &self,
        key: K,
        mut reader: DeltaReader<TSSTable::ValueReader>,
    ) -> io::Result<Option<TSSTable::Value>> {
        let found_ord = self.decode_up_to_key(key, &mut reader)?;
        // The ordinal itself is not needed, only whether the key was found.
        Ok(found_ord.map(|_ord| reader.value().clone()))
    }

    /// Returns a range builder, to stream all of the terms
    /// within an interval.
    ///
    /// The builder is created with the `AlwaysMatch` automaton; bounds are added by the
    /// caller through the builder's own methods.
    pub fn range(&self) -> StreamerBuilder<'_, TSSTable> {
        StreamerBuilder::new(self, AlwaysMatch)
    }

    /// Returns a range builder restricted to the keys starting with `prefix`.
    ///
    /// The range is `[prefix, successor)`, where `successor` is `prefix` stripped of its
    /// trailing `255` bytes and with its last remaining byte incremented. When no byte can be
    /// incremented (empty prefix, or only `255` bytes), the range has no upper bound.
    pub fn prefix_range<K: AsRef<[u8]>>(&self, prefix: K) -> StreamerBuilder<'_, TSSTable> {
        let lower_bound = prefix.as_ref();

        // Compute the smallest byte string greater than every key starting with `prefix`.
        let mut upper_bound = lower_bound.to_vec();
        while let Some(&last_byte) = upper_bound.last() {
            upper_bound.pop();
            if last_byte != 255 {
                upper_bound.push(last_byte + 1);
                break;
            }
        }

        let builder = self.range().ge(lower_bound);
        if upper_bound.is_empty() {
            builder
        } else {
            builder.lt(upper_bound)
        }
    }

    /// A stream of all the sorted terms.
    ///
    /// Shorthand for `self.range().into_stream()`, i.e. a range with no bound set.
    pub fn stream(&self) -> io::Result<Streamer<'_, TSSTable>> {
        self.range().into_stream()
    }

    /// Returns a search builder, to stream all of the terms
    /// within the Automaton
    ///
    /// The returned builder borrows the dictionary and takes ownership of `automaton`.
    pub fn search<'a, A: Automaton + 'a>(
        &'a self,
        automaton: A,
    ) -> StreamerBuilder<'a, TSSTable, A>
    where
        A::State: Clone,
    {
        StreamerBuilder::<TSSTable, A>::new(self, automaton)
    }

    /// Asynchronously reads the whole sstable slice and discards the resulting bytes.
    ///
    /// NOTE(review): presumably meant to populate an underlying cache ahead of synchronous
    /// reads — confirm against the `FileSlice` implementation in use.
    #[doc(hidden)]
    pub async fn warm_up_dictionary(&self) -> io::Result<()> {
        self.sstable_slice.read_bytes_async().await?;
        Ok(())
    }
}

#[cfg(test)]
mod tests {
    use std::ops::{Bound, Range};
    use std::sync::{Arc, Mutex};

    use common::OwnedBytes;

    use super::Dictionary;
    use crate::MonotonicU64SSTable;
    use crate::dictionary::TermOrdHit;

    /// In-memory file handle that only serves reads falling inside a configurable byte range.
    ///
    /// Tests use it to check which parts of the sstable an operation actually reads.
    #[derive(Debug)]
    struct PermissionedHandle {
        // Full content of the fake file.
        bytes: OwnedBytes,
        // Byte range reads are currently allowed to touch.
        allowed_range: Mutex<Range<usize>>,
    }

    impl PermissionedHandle {
        /// Wraps `bytes`, initially allowing reads over the whole content.
        fn new(bytes: Vec<u8>) -> Self {
            let bytes = OwnedBytes::new(bytes);
            PermissionedHandle {
                allowed_range: Mutex::new(0..bytes.len()),
                bytes,
            }
        }

        /// Replaces the range that subsequent reads are allowed to touch.
        fn restrict(&self, range: Range<usize>) {
            *self.allowed_range.lock().unwrap() = range;
        }
    }

    impl common::HasLen for PermissionedHandle {
        /// Length of the full content, regardless of the currently allowed range.
        fn len(&self) -> usize {
            self.bytes.len()
        }
    }

    impl common::file_slice::FileHandle for PermissionedHandle {
        /// Returns the bytes in `range`, or an error if `range` is not entirely contained in
        /// the currently allowed range.
        fn read_bytes(&self, range: Range<usize>) -> std::io::Result<OwnedBytes> {
            let allowed_range = self.allowed_range.lock().unwrap();
            // Compare the bounds directly instead of probing `range.end - 1`, which underflows
            // for an empty range ending at 0. For non-empty ranges this is the same check.
            let is_allowed = allowed_range.start <= range.start && range.end <= allowed_range.end;
            if !is_allowed {
                return Err(std::io::Error::other(format!(
                    "invalid range, allowed {allowed_range:?}, requested {range:?}"
                )));
            }

            Ok(self.bytes.slice(range))
        }
    }

    /// Builds a multi-block dictionary of `0x3ffff` keys, together with the permissioned
    /// handle backing it.
    ///
    /// Key `i` is `i` formatted as 5 uppercase hex digits, and its value is `i` as well, so
    /// that the value of a key equals its term ordinal.
    fn make_test_sstable() -> (Dictionary<MonotonicU64SSTable>, Arc<PermissionedHandle>) {
        let mut builder = Dictionary::<MonotonicU64SSTable>::builder(Vec::new()).unwrap();

        // this makes 256k keys, enough to fill multiple blocks.
        for elem in 0..0x3ffff {
            let key = format!("{elem:05X}").into_bytes();
            builder.insert(&key, &elem).unwrap();
        }

        let table = builder.finish().unwrap();
        let table = Arc::new(PermissionedHandle::new(table));
        let slice = common::file_slice::FileSlice::new(table.clone());

        let dictionary = Dictionary::<MonotonicU64SSTable>::open(slice).unwrap();

        // if the last block is id 0, tests are meaningless
        assert_ne!(dictionary.sstable_index.locate_with_ord(u64::MAX), 0);
        assert_eq!(dictionary.num_terms(), 0x3ffff);
        (dictionary, table)
    }

    /// Checks `term_ord_or_next` on a tiny, two-term dictionary.
    #[test]
    fn test_term_to_ord_or_next() {
        let dict = {
            let mut builder = Dictionary::<MonotonicU64SSTable>::builder(Vec::new()).unwrap();

            // Ordinals are positions in the sorted key list ("bbb" => 0, "ddd" => 1); they are
            // unrelated to the values inserted here.
            builder.insert(b"bbb", &1).unwrap();
            builder.insert(b"ddd", &2).unwrap();

            let table = builder.finish().unwrap();
            let table = Arc::new(PermissionedHandle::new(table));
            let slice = common::file_slice::FileSlice::new(table.clone());

            Dictionary::<MonotonicU64SSTable>::open(slice).unwrap()
        };

        assert_eq!(dict.term_ord_or_next(b"aaa").unwrap(), TermOrdHit::Next(0));
        assert_eq!(dict.term_ord_or_next(b"bbb").unwrap(), TermOrdHit::Exact(0));
        assert_eq!(dict.term_ord_or_next(b"bb").unwrap(), TermOrdHit::Next(0));
        assert_eq!(dict.term_ord_or_next(b"bbbb").unwrap(), TermOrdHit::Next(1));
        assert_eq!(dict.term_ord_or_next(b"dd").unwrap(), TermOrdHit::Next(1));
        assert_eq!(dict.term_ord_or_next(b"ddd").unwrap(), TermOrdHit::Exact(1));
        assert_eq!(dict.term_ord_or_next(b"dddd").unwrap(), TermOrdHit::Next(2));

        // This is not u64::MAX because for very small sstables (only one block),
        // we don't store an index, and the pseudo-index always replies that the
        // answer lies in block number 0
        assert_eq!(
            dict.term_ord_or_next(b"zzzzzzz").unwrap(),
            TermOrdHit::Next(2)
        );
    }
    /// Checks `term_ord_or_next` on a dictionary of 50_002 terms: "bbb", 50_000 "ccccc…" keys
    /// and "eee".
    #[test]
    fn test_term_to_ord_or_next_2() {
        let dict = {
            let mut builder = Dictionary::<MonotonicU64SSTable>::builder(Vec::new()).unwrap();

            // Each value is set to the ordinal of its key.
            let mut term_ord = 0;
            builder.insert(b"bbb", &term_ord).unwrap();

            // Fill blocks in between
            for elem in 0..50_000 {
                term_ord += 1;
                let key = format!("ccccc{elem:05X}").into_bytes();
                builder.insert(&key, &term_ord).unwrap();
            }

            term_ord += 1;
            builder.insert(b"eee", &term_ord).unwrap();

            let table = builder.finish().unwrap();
            let table = Arc::new(PermissionedHandle::new(table));
            let slice = common::file_slice::FileSlice::new(table.clone());

            Dictionary::<MonotonicU64SSTable>::open(slice).unwrap()
        };

        assert_eq!(dict.term_ord(b"bbb").unwrap(), Some(0));
        assert_eq!(dict.term_ord_or_next(b"bbb").unwrap(), TermOrdHit::Exact(0));
        assert_eq!(dict.term_ord_or_next(b"aaa").unwrap(), TermOrdHit::Next(0));
        assert_eq!(dict.term_ord_or_next(b"bb").unwrap(), TermOrdHit::Next(0));
        assert_eq!(dict.term_ord_or_next(b"bbbb").unwrap(), TermOrdHit::Next(1));
        assert_eq!(
            dict.term_ord_or_next(b"ee").unwrap(),
            TermOrdHit::Next(50001)
        );
        assert_eq!(
            dict.term_ord_or_next(b"eee").unwrap(),
            TermOrdHit::Exact(50001)
        );
        // Keys greater than the last term are reported as `Next(u64::MAX)` here, unlike in
        // the tiny dictionary of `test_term_to_ord_or_next`.
        assert_eq!(
            dict.term_ord_or_next(b"eeee").unwrap(),
            TermOrdHit::Next(u64::MAX)
        );

        assert_eq!(
            dict.term_ord_or_next(b"zzzzzzz").unwrap(),
            TermOrdHit::Next(u64::MAX)
        );
    }

    /// Checks how `term_bounds_to_ord` converts key bounds into ordinal bounds, for keys that
    /// are present in the dictionary and keys that are not.
    #[test]
    fn test_term_bounds_to_ord() {
        let dict = {
            let mut builder = Dictionary::<MonotonicU64SSTable>::builder(Vec::new()).unwrap();

            // Ordinals: "bbb" => 0, "ddd" => 1.
            builder.insert(b"bbb", &1).unwrap();
            builder.insert(b"ddd", &2).unwrap();

            let table = builder.finish().unwrap();
            let table = Arc::new(PermissionedHandle::new(table));
            let slice = common::file_slice::FileSlice::new(table.clone());

            Dictionary::<MonotonicU64SSTable>::open(slice).unwrap()
        };

        // Test cases for lower_bound
        let test_lower_bound = |bound, expected| {
            assert_eq!(
                dict.term_bounds_to_ord::<&[u8]>(bound, Bound::Included(b"ignored"))
                    .unwrap()
                    .0,
                expected
            );
        };

        // Missing keys resolve to the next ordinal, always as an included bound.
        test_lower_bound(Bound::Included(b"aaa".as_slice()), Bound::Included(0));
        test_lower_bound(Bound::Excluded(b"aaa".as_slice()), Bound::Included(0));

        // Existing keys keep the kind of bound requested by the caller.
        test_lower_bound(Bound::Included(b"bbb".as_slice()), Bound::Included(0));
        test_lower_bound(Bound::Excluded(b"bbb".as_slice()), Bound::Excluded(0));

        test_lower_bound(Bound::Included(b"ccc".as_slice()), Bound::Included(1));
        test_lower_bound(Bound::Excluded(b"ccc".as_slice()), Bound::Included(1));

        test_lower_bound(Bound::Included(b"zzz".as_slice()), Bound::Included(2));
        test_lower_bound(Bound::Excluded(b"zzz".as_slice()), Bound::Included(2));

        // Test cases for upper_bound
        let test_upper_bound = |bound, expected| {
            assert_eq!(
                dict.term_bounds_to_ord::<&[u8]>(Bound::Included(b"ignored"), bound,)
                    .unwrap()
                    .1,
                expected
            );
        };
        // Missing keys resolve to the next ordinal, always as an excluded bound.
        test_upper_bound(Bound::Included(b"ccc".as_slice()), Bound::Excluded(1));
        test_upper_bound(Bound::Excluded(b"ccc".as_slice()), Bound::Excluded(1));
        test_upper_bound(Bound::Included(b"zzz".as_slice()), Bound::Excluded(2));
        test_upper_bound(Bound::Excluded(b"zzz".as_slice()), Bound::Excluded(2));
        // Existing keys keep the kind of bound requested by the caller.
        test_upper_bound(Bound::Included(b"ddd".as_slice()), Bound::Included(1));
        test_upper_bound(Bound::Excluded(b"ddd".as_slice()), Bound::Excluded(1));
    }

    /// Checks the conversions between ordinals, keys and values, while restricting reads to
    /// the single block each lookup is expected to need.
    #[test]
    fn test_ord_term_conversion() {
        let (dic, slice) = make_test_sstable();

        // Only allow reads inside the block containing ordinal 100_000.
        let block = dic.sstable_index.get_block_with_ord(100_000);
        slice.restrict(block.byte_range);

        let mut res = Vec::new();

        // middle of a block
        assert!(dic.ord_to_term(100_000, &mut res).unwrap());
        assert_eq!(res, format!("{:05X}", 100_000).into_bytes());
        assert_eq!(dic.term_info_from_ord(100_000).unwrap().unwrap(), 100_000);
        assert_eq!(dic.get(&res).unwrap().unwrap(), 100_000);
        assert_eq!(dic.term_ord(&res).unwrap().unwrap(), 100_000);

        // start of a block
        assert!(dic.ord_to_term(block.first_ordinal, &mut res).unwrap());
        assert_eq!(res, format!("{:05X}", block.first_ordinal).into_bytes());
        assert_eq!(
            dic.term_info_from_ord(block.first_ordinal)
                .unwrap()
                .unwrap(),
            block.first_ordinal
        );
        assert_eq!(dic.get(&res).unwrap().unwrap(), block.first_ordinal);
        assert_eq!(dic.term_ord(&res).unwrap().unwrap(), block.first_ordinal);

        // end of a block
        // (the last ordinal of the block preceding the one used above)
        let ordinal = block.first_ordinal - 1;
        let new_range = dic.sstable_index.get_block_with_ord(ordinal).byte_range;
        slice.restrict(new_range);
        assert!(dic.ord_to_term(ordinal, &mut res).unwrap());
        assert_eq!(res, format!("{ordinal:05X}").into_bytes());
        assert_eq!(dic.term_info_from_ord(ordinal).unwrap().unwrap(), ordinal);
        assert_eq!(dic.get(&res).unwrap().unwrap(), ordinal);
        assert_eq!(dic.term_ord(&res).unwrap().unwrap(), ordinal);

        // before first block
        // 1st block must be loaded for key-related operations
        let block = dic.sstable_index.get_block_with_ord(0);
        slice.restrict(block.byte_range);

        assert!(dic.get(b"$$$").unwrap().is_none());
        assert!(dic.term_ord(b"$$$").unwrap().is_none());

        // after last block
        // last block must be loaded for ord related operations
        let ordinal = 0x40000 + 10;
        let new_range = dic.sstable_index.get_block_with_ord(ordinal).byte_range;
        slice.restrict(new_range);
        assert!(!dic.ord_to_term(ordinal, &mut res).unwrap());
        assert!(dic.term_info_from_ord(ordinal).unwrap().is_none());

        // last block isn't required to be loaded for key related operations
        slice.restrict(0..0);
        assert!(dic.get(b"~~~").unwrap().is_none());
        assert!(dic.term_ord(b"~~~").unwrap().is_none());

        // Lift the restriction for the remaining lookups.
        slice.restrict(0..slice.bytes.len());
        // between 1000F and 10010, test case where matched prefix > prefix kept
        assert!(dic.term_ord(b"1000G").unwrap().is_none());
        // shorter than 10000, tests prefix case
        assert!(dic.term_ord(b"1000").unwrap().is_none());
    }

    /// Checks `sorted_ords_to_term_cb` on single ordinals and on short runs of consecutive
    /// ordinals.
    #[test]
    fn test_ords_term() {
        let (dic, _slice) = make_test_sstable();

        // Single term
        let mut terms = Vec::new();
        assert!(
            dic.sorted_ords_to_term_cb(100_000..100_001, |term| {
                terms.push(term.to_vec());
                Ok(())
            })
            .unwrap()
        );
        assert_eq!(terms, vec![format!("{:05X}", 100_000).into_bytes(),]);
        // Single term
        let mut terms = Vec::new();
        assert!(
            dic.sorted_ords_to_term_cb(100_001..100_002, |term| {
                terms.push(term.to_vec());
                Ok(())
            })
            .unwrap()
        );
        assert_eq!(terms, vec![format!("{:05X}", 100_001).into_bytes(),]);
        // both terms
        let mut terms = Vec::new();
        assert!(
            dic.sorted_ords_to_term_cb(100_000..100_002, |term| {
                terms.push(term.to_vec());
                Ok(())
            })
            .unwrap()
        );
        assert_eq!(
            terms,
            vec![
                format!("{:05X}", 100_000).into_bytes(),
                format!("{:05X}", 100_001).into_bytes(),
            ]
        );
        // Test cross block
        // NOTE(review): presumably ordinals 98653..=98655 straddle a block boundary with the
        // default block length — confirm if the block size changes.
        let mut terms = Vec::new();
        assert!(
            dic.sorted_ords_to_term_cb(98653..=98655, |term| {
                terms.push(term.to_vec());
                Ok(())
            })
            .unwrap()
        );
        assert_eq!(
            terms,
            vec![
                format!("{:05X}", 98653).into_bytes(),
                format!("{:05X}", 98654).into_bytes(),
                format!("{:05X}", 98655).into_bytes(),
            ]
        );
    }

    /// Checks range streaming, and that a bounded or limited range only reads the blocks it
    /// needs.
    #[test]
    fn test_range() {
        let (dic, slice) = make_test_sstable();

        // Only allow reads from the block holding "10000" up to the block holding "18000".
        let start = dic
            .sstable_index
            .get_block_with_key(b"10000")
            .unwrap()
            .byte_range;
        let end = dic
            .sstable_index
            .get_block_with_key(b"18000")
            .unwrap()
            .byte_range;
        slice.restrict(start.start..end.end);

        let mut stream = dic.range().ge(b"10000").lt(b"18000").into_stream().unwrap();

        for i in 0x10000..0x18000 {
            assert!(stream.advance());
            assert_eq!(stream.term_ord(), i);
            assert_eq!(stream.value(), &i);
            assert_eq!(stream.key(), format!("{i:05X}").into_bytes());
        }
        assert!(!stream.advance());

        // verify limiting the number of results reduce the size read
        // (the last byte of the final block is now forbidden, so reading that block would fail)
        slice.restrict(start.start..(end.end - 1));

        let mut stream = dic
            .range()
            .ge(b"10000")
            .lt(b"18000")
            .limit(0xfff)
            .into_stream()
            .unwrap();

        for i in 0x10000..0x10fff {
            assert!(stream.advance());
            assert_eq!(stream.term_ord(), i);
            assert_eq!(stream.value(), &i);
            assert_eq!(stream.key(), format!("{i:05X}").into_bytes());
        }
        // there might be more successful elements after, though how many is undefined

        // Lift the restriction and stream the whole dictionary.
        slice.restrict(0..slice.bytes.len());

        let mut stream = dic.stream().unwrap();
        for i in 0..0x3ffff {
            assert!(stream.advance());
            assert_eq!(stream.term_ord(), i);
            assert_eq!(stream.value(), &i);
            assert_eq!(stream.key(), format!("{i:05X}").into_bytes());
        }
        assert!(!stream.advance());
    }

    /// Checks `prefix_range` with a one-character prefix, the empty prefix and a
    /// three-character prefix.
    #[test]
    fn test_prefix() {
        let (dic, _slice) = make_test_sstable();
        {
            // Every key starting with "1".
            let mut stream = dic.prefix_range("1").into_stream().unwrap();
            for i in 0x10000..0x20000 {
                assert!(stream.advance());
                assert_eq!(stream.term_ord(), i);
                assert_eq!(stream.value(), &i);
                assert_eq!(stream.key(), format!("{i:05X}").into_bytes());
            }
            assert!(!stream.advance());
        }
        {
            // The empty prefix matches every key.
            let mut stream = dic.prefix_range("").into_stream().unwrap();
            for i in 0..0x3ffff {
                assert!(stream.advance(), "failed at {i:05X}");
                assert_eq!(stream.term_ord(), i);
                assert_eq!(stream.value(), &i);
                assert_eq!(stream.key(), format!("{i:05X}").into_bytes());
            }
            assert!(!stream.advance());
        }
        {
            // Every key starting with "0FF".
            let mut stream = dic.prefix_range("0FF").into_stream().unwrap();
            for i in 0x0ff00..=0x0ffff {
                assert!(stream.advance(), "failed at {i:05X}");
                assert_eq!(stream.term_ord(), i);
                assert_eq!(stream.value(), &i);
                assert_eq!(stream.key(), format!("{i:05X}").into_bytes());
            }
            assert!(!stream.advance());
        }
    }

    /// Checks `prefix_range` with a prefix ending in byte 255, whose upper bound cannot be
    /// obtained by simply incrementing the last byte.
    #[test]
    fn test_prefix_edge() {
        let dict = {
            let mut builder = Dictionary::<MonotonicU64SSTable>::builder(Vec::new()).unwrap();
            builder.insert(&[0, 254], &0).unwrap();
            builder.insert(&[0, 255], &1).unwrap();
            builder.insert(&[0, 255, 12], &2).unwrap();
            builder.insert(&[1], &2).unwrap();
            builder.insert(&[1, 0], &2).unwrap();
            let table = builder.finish().unwrap();
            let table = Arc::new(PermissionedHandle::new(table));
            let slice = common::file_slice::FileSlice::new(table.clone());
            Dictionary::<MonotonicU64SSTable>::open(slice).unwrap()
        };

        // Only the two keys starting with [0, 255] must be returned; [1] must not be.
        let mut stream = dict.prefix_range(&[0, 255]).into_stream().unwrap();
        assert!(stream.advance());
        assert_eq!(stream.key(), &[0, 255]);
        assert!(stream.advance());
        assert_eq!(stream.key(), &[0, 255, 12]);
        assert!(!stream.advance());
    }
}


================================================
FILE: sstable/src/lib.rs
================================================
//! `tantivy_sstable` is a crate that provides a sorted string table data structure.
//!
//! It is used in `tantivy` to store the term dictionary.
//!
//! A `sstable` is a map of sorted `&[u8]` keys to values.
//! The keys are encoded using incremental encoding.
//!
//! Values and keys are compressed using zstd with the default feature flag `zstd-compression`.
//!
//! # Example
//!
//! Here is an example of how to create and search an `sstable`:
//!
//! ```rust
//! use common::OwnedBytes;
//! use tantivy_sstable::{Dictionary, MonotonicU64SSTable};
//!
//! // Create a new sstable in memory.
//! let mut builder = Dictionary::<MonotonicU64SSTable>::builder(Vec::new()).unwrap();
//! builder.insert(b"apple", &1).unwrap();
//! builder.insert(b"banana", &2).unwrap();
//! builder.insert(b"orange", &3).unwrap();
//! let sstable_bytes = builder.finish().unwrap();
//!
//! // Open the sstable.
//! let sstable =
//!     Dictionary::<MonotonicU64SSTable>::from_bytes(OwnedBytes::new(sstable_bytes)).unwrap();
//!
//! // Search for a key.
//! let value = sstable.get(b"banana").unwrap();
//! assert_eq!(value, Some(2));
//!
//! // Search for a non-existent key.
//! let value = sstable.get(b"grape").unwrap();
//! assert_eq!(value, None);
//! ```

use std::io::{self, Write};
use std::ops::Range;

use merge::ValueMerger;

mod block_match_automaton;
mod delta;
mod dictionary;
pub mod merge;
mod streamer;
pub mod value;

mod sstable_index_v3;
pub use sstable_index_v3::{BlockAddr, SSTableIndex, SSTableIndexBuilder, SSTableIndexV3};
mod sstable_index_v2;
pub(crate) mod vint;
pub use dictionary::{Dictionary, TermOrdHit};
pub use streamer::{Streamer, StreamerBuilder};

mod block_reader;
use common::{BinarySerializable, OwnedBytes};
use value::{VecU32ValueReader, VecU32ValueWriter};

pub use self::block_reader::BlockReader;
pub use self::delta::{DeltaReader, DeltaWriter};
pub use self::merge::VoidMerge;
use self::value::{U64MonotonicValueReader, U64MonotonicValueWriter, ValueReader, ValueWriter};
use crate::value::{RangeValueReader, RangeValueWriter};

/// Position of a term in the sorted list of terms of an sstable.
pub type TermOrdinal = u64;

// Initial capacity of the buffers holding the current key in `Reader` and `Writer`.
const DEFAULT_KEY_CAPACITY: usize = 50;
// NOTE(review): presumably the format version written in the sstable footer — confirm
// against the serialization code.
const SSTABLE_VERSION: u32 = 3;

/// Returns the number of leading bytes that `left` and `right` have in common.
fn common_prefix_len(left: &[u8], right: &[u8]) -> usize {
    // If no differing position exists, the shorter slice is a prefix of the other.
    let shortest_len = left.len().min(right.len());
    left.iter()
        .zip(right)
        .position(|(left_byte, right_byte)| left_byte != right_byte)
        .unwrap_or(shortest_len)
}

/// Marker type carrying no data.
///
/// NOTE(review): presumably used to signal that sstable data could not be decoded — confirm
/// against its users.
#[derive(Debug, Copy, Clone)]
pub struct SSTableDataCorruption;

/// SSTable makes it possible to read and write
/// sstables with typed values.
///
/// Implementors only pick the value type and its reader/writer; every method has a
/// default implementation.
pub trait SSTable: Sized {
    /// Type of the values associated with the keys.
    type Value: Clone;
    /// Decoder for `Self::Value`.
    type ValueReader: ValueReader<Value = Self::Value>;
    /// Encoder for `Self::Value`.
    type ValueWriter: ValueWriter<Value = Self::Value>;

    /// Creates a `DeltaWriter` writing to `write`.
    fn delta_writer<W: io::Write>(write: W) -> DeltaWriter<W, Self::ValueWriter> {
        DeltaWriter::new(write)
    }

    /// Creates a `Writer` writing to `wrt`.
    fn writer<W: io::Write>(wrt: W) -> Writer<W, Self::ValueWriter> {
        Writer::new(wrt)
    }

    /// Creates a `DeltaReader` over `reader`.
    fn delta_reader(reader: OwnedBytes) -> DeltaReader<Self::ValueReader> {
        DeltaReader::new(reader)
    }

    /// Creates a `Reader` over `reader`, starting with an empty key buffer.
    fn reader(reader: OwnedBytes) -> Reader<Self::ValueReader> {
        Reader {
            key: Vec::with_capacity(DEFAULT_KEY_CAPACITY),
            delta_reader: Self::delta_reader(reader),
        }
    }

    /// Returns an empty static reader.
    fn create_empty_reader() -> Reader<Self::ValueReader> {
        Self::reader(OwnedBytes::empty())
    }

    /// Merges the sstables given as raw bytes in `io_readers` and writes the result to `w`.
    ///
    /// NOTE(review): `merger` presumably decides how the values of a key present in several
    /// inputs are combined — confirm against `merge::merge_sstable`.
    fn merge<W: io::Write, M: ValueMerger<Self::Value>>(
        io_readers: Vec<OwnedBytes>,
        w: W,
        merger: M,
    ) -> io::Result<()> {
        let readers: Vec<_> = io_readers.into_iter().map(Self::reader).collect();
        let writer = Self::writer(w);
        merge::merge_sstable::<Self, _, _>(readers, writer, merger)
    }
}

/// SSTable whose values are `()`, i.e. an sstable that only stores keys.
pub struct VoidSSTable;

impl SSTable for VoidSSTable {
    type Value = ();
    type ValueReader = value::VoidValueReader;
    type ValueWriter = value::VoidValueWriter;
}

/// SSTable associating keys to `u64` values
/// sorted in the same order as the keys.
///
/// In other words, two keys `k1` and `k2`
/// such that `k1` <= `k2`, are required to observe
/// `range_sstable[k1] <= range_sstable[k2]`.
pub struct MonotonicU64SSTable;

impl SSTable for MonotonicU64SSTable {
    type Value = u64;

    type ValueReader = U64MonotonicValueReader;

    type ValueWriter = U64MonotonicValueWriter;
}

/// SSTable associating keys to ranges.
/// The ranges are required to partition the
/// space.
///
/// In other words, two consecutive keys `k1` and `k2`
/// are required to observe
/// `range_sstable[k1].end == range_sstable[k2].start`.
///
/// The first range is not required to start at `0`.
#[derive(Clone, Copy, Debug)]
pub struct RangeSSTable;

impl SSTable for RangeSSTable {
    type Value = Range<u64>;

    type ValueReader = RangeValueReader;

    type ValueWriter = RangeValueWriter;
}

/// SSTable associating keys to `Vec<u32>`.
pub struct VecU32ValueSSTable;

impl SSTable for VecU32ValueSSTable {
    type Value = Vec<u32>;
    type ValueReader = VecU32ValueReader;
    type ValueWriter = VecU32ValueWriter;
}

/// SSTable reader.
///
/// Wraps a `DeltaReader` and rebuilds the full key of the current entry from its
/// delta encoding.
pub struct Reader<TValueReader> {
    // Full key of the current entry.
    key: Vec<u8>,
    // Source of the (common prefix length, suffix, value) entries.
    delta_reader: DeltaReader<TValueReader>,
}

impl<TValueReader> Reader<TValueReader>
where TValueReader: ValueReader
{
    /// Moves to the next entry and rebuilds its full key from the delta encoding.
    ///
    /// Returns `Ok(false)` when the underlying delta reader has no entry left; the current
    /// key is then left untouched.
    pub fn advance(&mut self) -> io::Result<bool> {
        let has_entry = self.delta_reader.advance()?;
        if has_entry {
            let new_suffix = self.delta_reader.suffix();
            let shared_len = self.delta_reader.common_prefix_len();
            // Keep the bytes shared with the previous key and overwrite the rest.
            self.key.resize(shared_len + new_suffix.len(), 0u8);
            self.key[shared_len..].copy_from_slice(new_suffix);
        }
        Ok(has_entry)
    }

    /// Full key of the current entry.
    #[inline(always)]
    pub fn key(&self) -> &[u8] {
        self.key.as_slice()
    }

    /// Value of the current entry, as exposed by the underlying delta reader.
    #[inline(always)]
    pub fn value(&self) -> &TValueReader::Value {
        self.delta_reader.value()
    }
}

impl<TValueReader> AsRef<[u8]> for Reader<TValueReader> {
    /// Exposes the current key as a byte slice.
    #[inline(always)]
    fn as_ref(&self) -> &[u8] {
        &self.key
    }
}

/// SSTable writer: receives sorted `(key, value)` pairs, writes them block by block
/// through a `DeltaWriter`, and records each flushed block in an index builder.
pub struct Writer<W, TValueWriter>
where W: io::Write
{
    // Last key inserted in the current block; cleared when a block is flushed.
    previous_key: Vec<u8>,
    // Collects one entry per flushed block.
    index_builder: SSTableIndexBuilder,
    // Encodes the keys and values of the current block.
    delta_writer: DeltaWriter<W, TValueWriter>,
    // Number of values inserted so far.
    num_terms: u64,
    // Ordinal of the first term of the block being written.
    first_ordinal_of_the_block: u64,
}

impl<W, TValueWriter> Writer<W, TValueWriter>
where
    W: io::Write,
    TValueWriter: value::ValueWriter,
{
    /// Use `Self::new`. This method only exists to match its
    /// equivalent in fst.
    ///
    /// It never fails: the result is always `Ok`.
    /// TODO remove this function. (See Issue #1727)
    #[doc(hidden)]
    pub fn create(wrt: W) -> io::Result<Self> {
        Ok(Self::new(wrt))
    }

    /// Creates a new, empty `Writer` writing to `wrt`.
    pub fn new(wrt: W) -> Self {
        Writer {
            previous_key: Vec::with_capacity(DEFAULT_KEY_CAPACITY),
            num_terms: 0u64,
            index_builder: SSTableIndexBuilder::default(),
            delta_writer: DeltaWriter::new(wrt),
            first_ordinal_of_the_block: 0u64,
        }
    }

    /// Sets the target block length.
    ///
    /// The delta part of a block will generally be slightly larger than the requested `block_len`,
    /// however this does not account for the length of the Value part of the table.
    ///
    /// The setting is forwarded as is to the underlying `DeltaWriter`.
    pub fn set_block_len(&mut self, block_len: usize) {
        self.delta_writer.set_block_len(block_len)
    }

    /// Returns the last inserted key.
    /// If no key has been inserted yet, or the block was just
    /// flushed, this function returns "" (the key buffer is cleared on flush).
    #[inline(always)]
    pub(crate) fn last_inserted_key(&self) -> &[u8] {
        &self.previous_key[..]
    }

    /// Inserts a `(key, value)` pair in the term dictionary.
    /// Keys have to be inserted in order.
    ///
    /// This writes the key, then the value, and flushes the current block if required.
    ///
    /// # Panics
    ///
    /// Panics if keys are inserted in an invalid order.
    #[inline]
    pub fn insert<K: AsRef<[u8]>>(
        &mut self,
        key: K,
        value: &TValueWriter::Value,
    ) -> io::Result<()> {
        self.insert_key(key.as_ref())?;
        self.insert_value(value)?;
        Ok(())
    }

    /// Appends `key` to the current block, delta-encoded against the previously inserted key.
    ///
    /// # Warning
    ///
    /// Horribly dangerous internal API. See `.insert(...)`.
    ///
    /// # Panics
    ///
    /// Panics if `key` is not strictly greater than the previous key of the current block.
    /// The order cannot be checked against the last key of a block that was just flushed,
    /// since the previous key is cleared at that point.
    #[doc(hidden)]
    #[inline]
    pub fn insert_key(&mut self, key: &[u8]) -> io::Result<()> {
        // If this is the first key in the block, we use it to
        // shorten the last term in the last block.
        if self.first_ordinal_of_the_block == self.num_terms {
            self.index_builder
                .shorten_last_block_key_given_next_key(key);
        }
        let keep_len = common_prefix_len(&self.previous_key, key);
        // Checked access is required here: when `key` is equal to, or a prefix of, the previous
        // key, `key[keep_len]` does not exist and plain indexing would panic with an
        // out-of-bounds error instead of reaching the assertion below.
        let increasing_keys = self.previous_key.is_empty()
            || match (self.previous_key.get(keep_len), key.get(keep_len)) {
                // The previous key is a strict prefix of `key`.
                (None, Some(_)) => true,
                // Both keys diverge at `keep_len`: compare the first differing byte.
                (Some(previous_byte), Some(key_byte)) => previous_byte < key_byte,
                // `key` is equal to, or a prefix of, the previous key.
                (_, None) => false,
            };
        assert!(
            increasing_keys,
            "Keys should be increasing. ({:?} > {:?})",
            String::from_utf8_lossy(&self.previous_key),
            String::from_utf8_lossy(key),
        );
        // Only the bytes after the common prefix need to be copied and encoded.
        self.previous_key.resize(key.len(), 0u8);
        self.previous_key[keep_len..].copy_from_slice(&key[keep_len..]);
        self.delta_writer.write_suffix(keep_len, &key[keep_len..]);
        Ok(())
    }

    /// Writes the value half of a `(key, value)` pair and counts the term.
    ///
    /// Once the value is written, the current block is flushed if required.
    ///
    /// # Warning
    ///
    /// Horribly dangerous internal API. See `.insert(...)`.
    #[doc(hidden)]
    #[inline]
    pub fn insert_value(&mut self, value: &TValueWriter::Value) -> io::Result<()> {
        self.delta_writer.write_value(value);
        self.num_terms += 1;
        self.flush_block_if_required()?;
        Ok(())
    }

    /// Closes the current block if the delta writer decides a flush is due.
    ///
    /// When a block is flushed, it is registered in the index under the last inserted key,
    /// the next block starts at the current term count, and the previous key is reset.
    pub fn flush_block_if_required(&mut self) -> io::Result<()> {
        let Some(byte_range) = self.delta_writer.flush_block_if_required()? else {
            // Nothing was flushed: the current block keeps growing.
            return Ok(());
        };
        self.index_builder.add_block(
            self.previous_key.as_slice(),
            byte_range,
            self.first_ordinal_of_the_block,
        );
        self.first_ordinal_of_the_block = self.num_terms;
        self.previous_key.clear();
        Ok(())
    }

    /// Finalizes the sstable and returns the underlying writer.
    ///
    /// The pending block (if any) is flushed. The following are then written, in order: an
    /// empty block acting as end marker, the serialized index, the length returned by the
    /// index serialization, the offset at which the index starts, the number of terms, and
    /// the sstable version.
    pub fn finish(mut self) -> io::Result<W> {
        let pending_block = self.delta_writer.flush_block()?;
        if let Some(byte_range) = pending_block {
            self.index_builder.add_block(
                self.previous_key.as_slice(),
                byte_range,
                self.first_ordinal_of_the_block,
            );
            self.first_ordinal_of_the_block = self.num_terms;
        }
        let mut wrt = self.delta_writer.finish();
        // add a final empty block as an end marker
        wrt.write_all(&0u32.to_le_bytes())?;

        // Everything written so far is block data: the index starts at this offset.
        let offset = wrt.written_bytes();

        let fst_len: u64 = self.index_builder.serialize(&mut wrt)?;

        // Footer: fst length, index start offset, number of terms, version.
        wrt.write_all(&fst_len.to_le_bytes())?;
        wrt.write_all(&offset.to_le_bytes())?;
        wrt.write_all(&self.num_terms.to_le_bytes())?;
        SSTABLE_VERSION.serialize(&mut wrt)?;

        let wrt = wrt.finish();
        Ok(wrt.into_inner()?)
    }
}

/// Unit and property tests for the sstable writer, reader, merge and range streaming.
#[cfg(test)]
mod test {
    use std::io;
    use std::ops::Bound;

    use common::OwnedBytes;

    use super::{MonotonicU64SSTable, SSTable, VoidMerge, VoidSSTable, common_prefix_len};

    /// Checks that `common_prefix_len` returns `expect_len` for both argument orders.
    fn aux_test_common_prefix_len(left: &str, right: &str, expect_len: usize) {
        assert_eq!(
            common_prefix_len(left.as_bytes(), right.as_bytes()),
            expect_len
        );
        assert_eq!(
            common_prefix_len(right.as_bytes(), left.as_bytes()),
            expect_len
        );
    }

    #[test]
    fn test_common_prefix_len() {
        aux_test_common_prefix_len("a", "ab", 1);
        aux_test_common_prefix_len("", "ab", 0);
        aux_test_common_prefix_len("ab", "abc", 2);
        aux_test_common_prefix_len("abde", "abce", 2);
    }

    /// Round-trips keys whose lengths differ a lot (1024 bytes, 3 bytes, 299 bytes).
    #[test]
    fn test_long_key_diff() {
        let long_key = (0..1_024).map(|x| (x % 255) as u8).collect::<Vec<_>>();
        let long_key2 = (1..300).map(|x| (x % 255) as u8).collect::<Vec<_>>();
        let mut buffer = vec![];
        {
            let mut sstable_writer = VoidSSTable::writer(&mut buffer);
            assert!(sstable_writer.insert(&long_key[..], &()).is_ok());
            assert!(sstable_writer.insert([0, 3, 4], &()).is_ok());
            assert!(sstable_writer.insert(&long_key2[..], &()).is_ok());
            assert!(sstable_writer.finish().is_ok());
        }
        let buffer = OwnedBytes::new(buffer);
        let mut sstable_reader = VoidSSTable::reader(buffer);
        assert!(sstable_reader.advance().unwrap());
        assert_eq!(sstable_reader.key(), &long_key[..]);
        assert!(sstable_reader.advance().unwrap());
        assert_eq!(sstable_reader.key(), &[0, 3, 4]);
        assert!(sstable_reader.advance().unwrap());
        assert_eq!(sstable_reader.key(), &long_key2[..]);
        assert!(!sstable_reader.advance().unwrap());
    }

    /// Pins the exact serialized bytes of a three-key sstable, then reads it back.
    #[test]
    fn test_simple_sstable() {
        let mut buffer = vec![];
        {
            let mut sstable_writer = VoidSSTable::writer(&mut buffer);
            assert!(sstable_writer.insert([17u8], &()).is_ok());
            assert!(sstable_writer.insert([17u8, 18u8, 19u8], &()).is_ok());
            assert!(sstable_writer.insert([17u8, 20u8], &()).is_ok());
            assert!(sstable_writer.finish().is_ok());
        }
        assert_eq!(
            &buffer,
            &[
                // block
                8, 0, 0, 0, // size of block
                0, // compression
                16, 17, 33, 18, 19, 17, 20, // data block
                0, 0, 0, 0, // no more block
                // index
                0, 0, 0, 0, 0, 0, 0, 0, // fst length
                16, 0, 0, 0, 0, 0, 0, 0, // index start offset
                3, 0, 0, 0, 0, 0, 0, 0, // num term
                3, 0, 0, 0, // version
            ]
        );
        let buffer = OwnedBytes::new(buffer);
        let mut sstable_reader = VoidSSTable::reader(buffer);
        assert!(sstable_reader.advance().unwrap());
        assert_eq!(sstable_reader.key(), &[17u8]);
        assert!(sstable_reader.advance().unwrap());
        assert_eq!(sstable_reader.key(), &[17u8, 18u8, 19u8]);
        assert!(sstable_reader.advance().unwrap());
        assert_eq!(sstable_reader.key(), &[17u8, 20u8]);
        assert!(!sstable_reader.advance().unwrap());
    }

    /// Inserting a key smaller than the previous one must panic.
    #[test]
    #[should_panic]
    fn test_simple_sstable_non_increasing_key() {
        let mut buffer = vec![];
        let mut sstable_writer = VoidSSTable::writer(&mut buffer);
        assert!(sstable_writer.insert([17u8], &()).is_ok());
        assert!(sstable_writer.insert([16u8], &()).is_ok());
    }

    /// Merging an sstable with itself yields the very same bytes.
    #[test]
    fn test_merge_abcd_abe() {
        let mut buffer = Vec::new();
        {
            let mut writer = VoidSSTable::writer(&mut buffer);
            writer.insert(b"abcd", &()).unwrap();
            writer.insert(b"abe", &()).unwrap();
            writer.finish().unwrap();
        }
        let buffer = OwnedBytes::new(buffer);
        let mut output = Vec::new();
        assert!(
            VoidSSTable::merge(vec![buffer.clone(), buffer.clone()], &mut output, VoidMerge)
                .is_ok()
        );
        assert_eq!(&output[..], &buffer[..]);
    }

    /// Same scenario as `test_merge_abcd_abe`, additionally checking `last_inserted_key`
    /// before and after each insertion.
    #[test]
    fn test_sstable() {
        let mut buffer = Vec::new();
        {
            let mut writer = VoidSSTable::writer(&mut buffer);
            assert_eq!(writer.last_inserted_key(), b"");
            writer.insert(b"abcd", &()).unwrap();
            assert_eq!(writer.last_inserted_key(), b"abcd");
            writer.insert(b"abe", &()).unwrap();
            assert_eq!(writer.last_inserted_key(), b"abe");
            writer.finish().unwrap();
        }
        let buffer = OwnedBytes::new(buffer);
        let mut output = Vec::new();
        assert!(
            VoidSSTable::merge(vec![buffer.clone(), buffer.clone()], &mut output, VoidMerge)
                .is_ok()
        );
        assert_eq!(&output[..], &buffer[..]);
    }

    /// Round-trips keys together with `u64` values.
    #[test]
    fn test_sstable_u64() -> io::Result<()> {
        let mut buffer = Vec::new();
        let mut writer = MonotonicU64SSTable::writer(&mut buffer);
        writer.insert(b"abcd", &1u64)?;
        writer.insert(b"abe", &4u64)?;
        writer.insert(b"gogo", &4324234234234234u64)?;
        writer.finish()?;
        let buffer = OwnedBytes::new(buffer);
        let mut reader = MonotonicU64SSTable::reader(buffer);
        assert!(reader.advance()?);
        assert_eq!(reader.key(), b"abcd");
        assert_eq!(reader.value(), &1u64);
        assert!(reader.advance()?);
        assert_eq!(reader.key(), b"abe");
        assert_eq!(reader.value(), &4u64);
        assert!(reader.advance()?);
        assert_eq!(reader.key(), b"gogo");
        assert_eq!(reader.value(), &4324234234234234u64);
        assert!(!reader.advance()?);
        Ok(())
    }

    /// A reader created empty has nothing to advance to.
    #[test]
    fn test_sstable_empty() {
        let mut sstable_range_empty = crate::RangeSSTable::create_empty_reader();
        assert!(!sstable_range_empty.advance().unwrap());
    }

    use common::file_slice::FileSlice;
    use proptest::prelude::*;

    use crate::Dictionary;

    /// Generates an unbounded, included or excluded bound over short `[a-c]` strings.
    fn bound_strategy() -> impl Strategy<Value = Bound<String>> {
        prop_oneof![
            Just(Bound::<String>::Unbounded),
            "[a-c]{0,5}".prop_map(Bound::Included),
            "[a-c]{0,5}".prop_map(Bound::Excluded),
        ]
    }

    /// Returns the key carried by a bound, or `None` for `Unbounded`.
    fn extract_key(bound: Bound<&String>) -> Option<&str> {
        match bound.as_ref() {
            Bound::Included(key) => Some(key.as_str()),
            Bound::Excluded(key) => Some(key.as_str()),
            Bound::Unbounded => None,
        }
    }

    /// Generates a `(lower, upper)` pair of bounds.
    ///
    /// When both bounds carry a key, the pair is kept only if the lower key is strictly
    /// smaller than the upper key (the filter label says `<=`, the predicate uses `<`).
    fn bounds_strategy() -> impl Strategy<Value = (Bound<String>, Bound<String>)> {
        (bound_strategy(), bound_strategy()).prop_filter(
            "Lower bound <= Upper bound",
            |(left, right)| match (extract_key(left.as_ref()), extract_key(right.as_ref())) {
                (None, _) => true,
                (_, None) => true,
                (left, right) => left < right,
            },
        )
    }

    proptest! {
        /// Streaming a range out of a dictionary must yield the same keys as
        /// `BTreeSet::range` over the inserted words.
        #[test]
        fn test_proptest_sstable_ranges(words in prop::collection::btree_set("[a-c]{0,6}", 1..100),
            (lower_bound, upper_bound) in bounds_strategy(),
        ) {
            let mut builder = Dictionary::<VoidSSTable>::builder(Vec::new()).unwrap();
            // NOTE(review): small block length, presumably to spread the words over several
            // blocks — confirm.
            builder.set_block_len(16);
            for word in &words {
                builder.insert(word.as_bytes(), &()).unwrap();
            }
            let buffer: Vec<u8> = builder.finish().unwrap();
            let dictionary: Dictionary<VoidSSTable> = Dictionary::open(FileSlice::from(buffer)).unwrap();
            let mut range_builder = dictionary.range();
            range_builder = match lower_bound.as_ref() {
                Bound::Included(key) => range_builder.ge(key.as_bytes()),
                Bound::Excluded(key) => range_builder.gt(key.as_bytes()),
                Bound::Unbounded => range_builder,
            };
            range_builder = match upper_bound.as_ref() {
                Bound::Included(key) => range_builder.le(key.as_bytes()),
                Bound::Excluded(key) => range_builder.lt(key.as_bytes()),
                Bound::Unbounded => range_builder,
            };
            let mut stream = range_builder.into_stream().unwrap();
            // Reference result computed with the standard library.
            let mut btree_set_range = words.range((lower_bound, upper_bound));
            while stream.advance() {
                let val = btree_set_range.next().unwrap();
                assert_eq!(val.as_bytes(), stream.key());
            }
            // The stream must not stop before the reference iterator is exhausted.
            assert!(btree_set_range.next().is_none());
        }
    }
}


================================================
FILE: sstable/src/merge/heap_merge.rs
================================================
use std::cmp::Ordering;
use std::collections::BinaryHeap;
use std::collections::binary_heap::PeekMut;
use std::io;

use super::{SingleValueMerger, ValueMerger};
use crate::{Reader, SSTable, Writer};

/// Wrapper comparing its content by byte representation, in reverse order.
///
/// `BinaryHeap` is a max-heap: reversing the comparison makes the heap hand out the
/// lexicographically smallest item first.
struct HeapItem<B: AsRef<[u8]>>(B);

impl<B: AsRef<[u8]>> PartialEq for HeapItem<B> {
    fn eq(&self, other: &Self) -> bool {
        let (lhs, rhs): (&[u8], &[u8]) = (self.0.as_ref(), other.0.as_ref());
        lhs == rhs
    }
}

impl<B: AsRef<[u8]>> Eq for HeapItem<B> {}

impl<B: AsRef<[u8]>> PartialOrd for HeapItem<B> {
    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
        Some(Ord::cmp(self, other))
    }
}

impl<B: AsRef<[u8]>> Ord for HeapItem<B> {
    fn cmp(&self, other: &Self) -> Ordering {
        let (lhs, rhs): (&[u8], &[u8]) = (self.0.as_ref(), other.0.as_ref());
        // Reversed on purpose, see the type-level documentation.
        lhs.cmp(rhs).reverse()
    }
}

/// Merges several sstables into one, using a heap of readers.
///
/// Each reader that has at least one entry is pushed on a heap ordered by current key
/// (smallest first). The loop repeatedly:
/// - writes the key at the top of the heap and starts a value merger from its value,
/// - folds in the values of every other reader currently positioned on the same key,
/// - writes the merged value.
///
/// Readers are advanced as they are consumed and removed from the heap once exhausted.
///
/// # Errors
///
/// Returns any `io::Error` raised while advancing a reader or writing to `writer`.
pub fn merge_sstable<SST: SSTable, W: io::Write, M: ValueMerger<SST::Value>>(
    readers: Vec<Reader<SST::ValueReader>>,
    mut writer: Writer<W, SST::ValueWriter>,
    mut merger: M,
) -> io::Result<()> {
    let mut heap: BinaryHeap<HeapItem<Reader<SST::ValueReader>>> =
        BinaryHeap::with_capacity(readers.len());
    for mut reader in readers {
        // Readers without any entry never enter the heap.
        if reader.advance()? {
            heap.push(HeapItem(reader));
        }
    }
    loop {
        let len = heap.len();
        let mut value_merger;
        match heap.peek_mut() {
            Some(mut head) => {
                // Propagate the error instead of panicking: this function returns
                // `io::Result`.
                writer.insert_key(head.0.key())?;
                value_merger = merger.new_value(head.0.value());
                if !head.0.advance()? {
                    PeekMut::pop(head);
                }
            }
            _ => {
                break;
            }
        }
        // At most `len - 1` other readers can be positioned on the key just written.
        // `len >= 1` here, as an empty heap leaves the loop above.
        for _ in 0..len - 1 {
            if let Some(mut head) = heap.peek_mut()
                && head.0.key() == writer.last_inserted_key()
            {
                value_merger.add(head.0.value());
                if !head.0.advance()? {
                    PeekMut::pop(head);
                }
                continue;
            }
            break;
        }
        let value = value_merger.finish();
        writer.insert_value(&value)?;
        writer.flush_block_if_required()?;
    }
    writer.finish()?;
    Ok(())
}


================================================
FILE: sstable/src/merge/mod.rs
================================================
mod heap_merge;

pub use self::heap_merge::merge_sstable;

/// Accumulator merging the values associated with a single key.
pub trait SingleValueMerger<V> {
    /// Folds one more value into the accumulator.
    fn add(&mut self, v: &V);
    /// Consumes the accumulator and returns the merged value.
    fn finish(self) -> V;
}

/// Factory of [`SingleValueMerger`]s: one accumulator is created per merged key.
pub trait ValueMerger<V> {
    /// Accumulator type produced for each key.
    type TSingleValueMerger: SingleValueMerger<V>;
    /// Starts a new accumulator, seeded with the first value `v` seen for a key.
    fn new_value(&mut self, v: &V) -> Self::TSingleValueMerger;
}

/// Merge policy keeping, for each key, the first value encountered.
#[derive(Default)]
pub struct KeepFirst;

/// Accumulator holding the first value seen for a key.
pub struct FirstVal<V>(V);

impl<V: Clone> ValueMerger<V> for KeepFirst {
    type TSingleValueMerger = FirstVal<V>;

    fn new_value(&mut self, v: &V) -> FirstVal<V> {
        let first = V::clone(v);
        FirstVal(first)
    }
}

impl<V> SingleValueMerger<V> for FirstVal<V> {
    /// Later values are discarded.
    fn add(&mut self, _ignored: &V) {}

    fn finish(self) -> V {
        let FirstVal(first) = self;
        first
    }
}

/// Merge policy for sstables whose value type is `()`: there is nothing to merge.
pub struct VoidMerge;
impl ValueMerger<()> for VoidMerge {
    type TSingleValueMerger = ();

    /// Returns `()`, which serves as its own accumulator.
    fn new_value(&mut self, _: &()) {}
}

/// Merge policy summing the `u64` values associated with the same key.
pub struct U64Merge;

impl ValueMerger<u64> for U64Merge {
    type TSingleValueMerger = u64;

    /// The running sum starts at the first value.
    fn new_value(&mut self, val: &u64) -> u64 {
        *val
    }
}

/// A plain `u64` acts as the running sum.
impl SingleValueMerger<u64> for u64 {
    fn add(&mut self, val: &u64) {
        *self += val;
    }

    fn finish(self) -> u64 {
        self
    }
}

/// Accumulator for the unit value type: both operations do nothing.
impl SingleValueMerger<()> for () {
    fn add(&mut self, _: &()) {}

    fn finish(self) {}
}

/// Tests merging sstables, with unit values and with summed `u64` values.
#[cfg(test)]
mod tests {

    use std::collections::{BTreeMap, BTreeSet};
    use std::str;

    use common::OwnedBytes;

    use super::super::{MonotonicU64SSTable, SSTable, VoidSSTable};
    use super::{U64Merge, VoidMerge};

    /// Serializes `keys` (expected in insertion order) into a value-less sstable.
    fn write_sstable(keys: &[&'static str]) -> OwnedBytes {
        let mut buffer: Vec<u8> = vec![];
        {
            let mut sstable_writer = VoidSSTable::writer(&mut buffer);
            for &key in keys {
                assert!(sstable_writer.insert(key.as_bytes(), &()).is_ok());
            }
            assert!(sstable_writer.finish().is_ok());
        }
        OwnedBytes::new(buffer)
    }

    /// Serializes `(key, value)` pairs into a `u64`-valued sstable.
    fn write_sstable_u64(keys: &[(&'static str, u64)]) -> OwnedBytes {
        let mut buffer: Vec<u8> = vec![];
        {
            let mut sstable_writer = MonotonicU64SSTable::writer(&mut buffer);
            for (key, val) in keys {
                assert!(sstable_writer.insert(key.as_bytes(), val).is_ok());
            }
            assert!(sstable_writer.finish().is_ok());
        }
        OwnedBytes::new(buffer)
    }

    /// Merges one sstable per input array and checks that the result contains exactly the
    /// sorted union of all keys.
    fn merge_test_aux(arrs: &[&[&'static str]]) {
        let sstables = arrs.iter().cloned().map(write_sstable).collect::<Vec<_>>();
        // Reference result: a `BTreeSet` deduplicates and sorts the keys.
        let mut merged = BTreeSet::new();
        for &arr in arrs.iter() {
            for &s in arr {
                merged.insert(s.to_string());
            }
        }
        let mut w = Vec::new();
        assert!(VoidSSTable::merge(sstables, &mut w, VoidMerge).is_ok());
        let w = OwnedBytes::new(w);
        let mut reader = VoidSSTable::reader(w);
        for k in merged {
            assert!(reader.advance().unwrap());
            assert_eq!(reader.key(), k.as_bytes());
        }
        assert!(!reader.advance().unwrap());
    }

    /// Same as `merge_test_aux`, with values: the values of a key present in several inputs
    /// are expected to be summed.
    fn merge_test_u64_monotonic_aux(arrs: &[&[(&'static str, u64)]]) {
        let sstables = arrs
            .iter()
            .cloned()
            .map(write_sstable_u64)
            .collect::<Vec<_>>();
        // Reference result: per-key sum of the values.
        let mut merged = BTreeMap::new();
        for &arr in arrs.iter() {
            for (key, val) in arr {
                let entry = merged.entry(key.to_string()).or_insert(0u64);
                *entry += val;
            }
        }
        let mut w = Vec::new();
        assert!(MonotonicU64SSTable::merge(sstables, &mut w, U64Merge).is_ok());
        let w = OwnedBytes::new(w);
        let mut reader = MonotonicU64SSTable::reader(w);
        for (k, v) in merged {
            assert!(reader.advance().unwrap());
            assert_eq!(reader.key(), k.as_bytes());
            assert_eq!(reader.value(), &v);
        }
        assert!(!reader.advance().unwrap());
    }

    /// Writes a single-key sstable and reads it back, without any merge involved.
    #[test]
    fn test_merge_simple_reproduce() {
        let sstable_data = write_sstable(&["a"]);
        let mut reader = VoidSSTable::reader(sstable_data);
        assert!(reader.advance().unwrap());
        assert_eq!(reader.key(), b"a");
        assert!(!reader.advance().unwrap());
    }

    #[test]
    fn test_merge() {
        merge_test_aux(&[]);
        merge_test_aux(&[&["a"]]);
        merge_test_aux(&[&["a", "b"], &["ab"]]); // a, ab, b
        merge_test_aux(&[&["a", "b"], &["a", "b"]]);
        merge_test_aux(&[
            &["happy", "hello", "payer", "tax"],
            &["habitat", "hello", "zoo"],
            &[],
            &["a"],
        ]);
        merge_test_aux(&[&["a"]]);
        merge_test_aux(&[&["a", "b"], &["ab"]]);
        merge_test_aux(&[&["a", "b"], &["a", "b"]]);
    }

    #[test]
    fn test_merge_u64() {
        merge_test_u64_monotonic_aux(&[]);
        merge_test_u64_monotonic_aux(&[&[("a", 1u64)]]);
        merge_test_u64_monotonic_aux(&[&[("a", 1u64), ("b", 3u64)], &[("ab", 2u64)]]); // a, ab, b
        merge_test_u64_monotonic_aux(&[&[("a", 1u64), ("b", 2u64)], &[("a", 16u64), ("b", 23u64)]]);
    }
}


================================================
FILE: sstable/src/sstable_index_v2.rs
================================================
use common::OwnedBytes;
use tantivy_fst::Automaton;

use crate::block_match_automaton::can_block_match_automaton;
use crate::{BlockAddr, SSTable, SSTableDataCorruption, TermOrdinal};

/// Index of an sstable, held as the list of its blocks.
///
/// Lookups binary-search `blocks`, both by key and by first ordinal, so the list is
/// expected to be sorted accordingly.
#[derive(Default, Debug, Clone)]
pub struct SSTableIndex {
    pub(crate) blocks: Vec<BlockMeta>,
}

impl SSTableIndex {
    /// Load an index from its binary representation
    ///
    /// # Errors
    ///
    /// Returns [`SSTableDataCorruption`] if the underlying reader fails to advance.
    pub fn load(data: OwnedBytes) -> Result<SSTableIndex, SSTableDataCorruption> {
        let mut reader = IndexSSTable::reader(data);
        let mut blocks = Vec::new();

        while reader.advance().map_err(|_| SSTableDataCorruption)? {
            blocks.push(BlockMeta {
                last_key_or_greater: reader.key().to_vec(),
                block_addr: reader.value().clone(),
            });
        }

        Ok(SSTableIndex { blocks })
    }

    /// Get the [`BlockAddr`] of the requested block.
    ///
    /// Returns None if `block_id` is out of range.
    pub(crate) fn get_block(&self, block_id: usize) -> Option<BlockAddr> {
        self.blocks
            .get(block_id)
            .map(|block_meta| block_meta.block_addr.clone())
    }

    /// Get the block id of the block that would contain `key`.
    ///
    /// Returns None if `key` is lexicographically after the last key recorded.
    pub(crate) fn locate_with_key(&self, key: &[u8]) -> Option<usize> {
        let pos = self
            .blocks
            .binary_search_by_key(&key, |block| &block.last_key_or_greater);
        match pos {
            // `key` is exactly the recorded key of a block.
            Ok(pos) => Some(pos),
            // `key` falls before the recorded key of block `pos`.
            Err(pos) if pos < self.blocks.len() => Some(pos),
            // after end of last block: no block matches
            Err(_) => None,
        }
    }

    /// Get the [`BlockAddr`] of the block that would contain `key`.
    ///
    /// Returns None if `key` is lexicographically after the last key recorded.
    pub fn get_block_with_key(&self, key: &[u8]) -> Option<BlockAddr> {
        self.locate_with_key(key).and_then(|id| self.get_block(id))
    }

    /// Get the block id of the block containing the `ord`-th term.
    pub(crate) fn locate_with_ord(&self, ord: TermOrdinal) -> usize {
        let pos = self
            .blocks
            .binary_search_by_key(&ord, |block| block.block_addr.first_ordinal);

        match pos {
            Ok(pos) => pos,
            // Err(0) can't happen as the sstable starts with ordinal zero
            Err(pos) => pos - 1,
        }
    }

    /// Get the [`BlockAddr`] of the block containing the `ord`-th term.
    pub(crate) fn get_block_with_ord(&self, ord: TermOrdinal) -> BlockAddr {
        // locate_with_ord always returns an index within range
        self.get_block(self.locate_with_ord(ord)).unwrap()
    }

    /// Iterates over the blocks that may contain a key matching `automaton`.
    ///
    /// Each item is the block id along with the [`BlockAddr`] of the block. A block is
    /// tested using the recorded key of the previous block (None for the first block) and
    /// its own recorded key. An index without any block yields nothing.
    pub(crate) fn get_block_for_automaton<'a>(
        &'a self,
        automaton: &'a impl Automaton,
    ) -> impl Iterator<Item = (u64, BlockAddr)> + 'a {
        // The first block has no predecessor. `first()` is used rather than `blocks[0]` so
        // that an index without blocks does not panic.
        let first_block = self.blocks.first().map(|block| (None, block));
        first_block
            .into_iter()
            .chain(self.blocks.windows(2).map(|window| {
                let [prev, curr] = window else {
                    unreachable!();
                };
                (Some(&*prev.last_key_or_greater), curr)
            }))
            .enumerate()
            .filter_map(move |(pos, (prev_key, current_block))| {
                if can_block_match_automaton(
                    prev_key,
                    &current_block.last_key_or_greater,
                    automaton,
                ) {
                    Some((pos as u64, current_block.block_addr.clone()))
                } else {
                    None
                }
            })
    }
}

/// Index entry describing one block of the sstable.
#[derive(Debug, Clone)]
pub(crate) struct BlockMeta {
    /// Any byte string that is lexicographically greater or equal to
    /// the last key in the block,
    /// and yet strictly smaller than the first key in the next block.
    pub last_key_or_greater: Vec<u8>,
    /// Address of the block this entry describes.
    pub block_addr: BlockAddr,
}

/// SSTable representing an index
///
/// `last_key_or_greater` is used as the key, the value contains the
/// length and first ordinal of each block. The start offset is implicitly
/// obtained from lengths.
///
/// `SSTableIndex::load` reads the serialized index through this type.
struct IndexSSTable;

impl SSTable for IndexSSTable {
    type Value = BlockAddr;

    type ValueReader = crate::value::index::IndexValueReader;

    type ValueWriter = crate::value::index::IndexValueWriter;
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::block_match_automaton::tests::EqBuffer;

    /// Checks which blocks are selected for automatons built from `EqBuffer`, against a
    /// three-block index whose recorded keys are `[0, 1, 2]`, `[0, 2, 2]` and `[0, 3, 2]`.
    #[test]
    fn test_get_block_for_automaton() {
        let sstable = SSTableIndex {
            blocks: vec![
                BlockMeta {
                    last_key_or_greater: vec![0, 1, 2],
                    block_addr: BlockAddr {
                        first_ordinal: 0,
                        byte_range: 0..10,
                    },
                },
                BlockMeta {
                    last_key_or_greater: vec![0, 2, 2],
                    block_addr: BlockAddr {
                        first_ordinal: 5,
                        byte_range: 10..20,
                    },
                },
                BlockMeta {
                    last_key_or_greater: vec![0, 3, 2],
                    block_addr: BlockAddr {
                        first_ordinal: 10,
                        byte_range: 20..30,
                    },
                },
            ],
        };

        // `[0, 1, 1]` sorts before the first recorded key: only block 0 is selected.
        let res = sstable
            .get_block_for_automaton(&EqBuffer(vec![0, 1, 1]))
            .collect::<Vec<_>>();
        assert_eq!(
            res,
            vec![(
                0,
                BlockAddr {
                    first_ordinal: 0,
                    byte_range: 0..10
                }
            )]
        );
        // `[0, 2, 1]` sits between the first and second recorded keys: only block 1.
        let res = sstable
            .get_block_for_automaton(&EqBuffer(vec![0, 2, 1]))
            .collect::<Vec<_>>();
        assert_eq!(
            res,
            vec![(
                1,
                BlockAddr {
                    first_ordinal: 5,
                    byte_range: 10..20
                }
            )]
        );
        // `[0, 3, 1]` sits between the second and third recorded keys: only block 2.
        let res = sstable
            .get_block_for_automaton(&EqBuffer(vec![0, 3, 1]))
            .collect::<Vec<_>>();
        assert_eq!(
            res,
            vec![(
                2,
                BlockAddr {
                    first_ordinal: 10,
                    byte_range: 20..30
                }
            )]
        );
        // `[0, 4, 1]` sorts after the last recorded key: no block is selected.
        let res = sstable
            .get_block_for_automaton(&EqBuffer(vec![0, 4, 1]))
            .collect::<Vec<_>>();
        assert!(res.is_empty());

        // A union of two automatons selects the blocks of both.
        let complex_automaton = EqBuffer(vec![0, 1, 1]).union(EqBuffer(vec![0, 3, 1]));
        let res = sstable
            .get_block_for_automaton(&complex_automaton)
            .collect::<Vec<_>>();
        assert_eq!(
            res,
            vec![
                (
                    0,
                    BlockAddr {
                        first_ordinal: 0,
                        byte_range: 0..10
                    }
                ),
                (
                    2,
                    BlockAddr {
                        first_ordinal: 10,
                        byte_range: 20..30
                    }
                )
            ]
        );
    }
}


================================================
FILE: sstable/src/sstable_index_v3.rs
================================================
use std::io::{self, Read, Write};
use std::ops::Range;
use std::sync::Arc;

use common::{BinarySerializable, FixedSize, OwnedBytes};
use tantivy_bitpacker::{BitPacker, compute_num_bits};
use tantivy_fst::raw::Fst;
use tantivy_fst::{Automaton, IntoStreamer, Map, MapBuilder, Streamer};

use crate::block_match_automaton::can_block_match_automaton;
use crate::{SSTableDataCorruption, TermOrdinal, common_prefix_len};

/// Index of an sstable, in any of the supported representations.
///
/// Every method dispatches to the wrapped index. Block ids are exposed as `u64`; the v2
/// index uses `usize` internally and is converted at this boundary.
#[derive(Debug, Clone)]
pub enum SSTableIndex {
    V2(crate::sstable_index_v2::SSTableIndex),
    V3(SSTableIndexV3),
    V3Empty(SSTableIndexV3Empty),
}

impl SSTableIndex {
    /// Get the [`BlockAddr`] of the requested block.
    pub(crate) fn get_block(&self, block_id: u64) -> Option<BlockAddr> {
        match self {
            Self::V2(index) => index.get_block(block_id as usize),
            Self::V3(index) => index.get_block(block_id),
            Self::V3Empty(index) => index.get_block(block_id),
        }
    }

    /// Get the block id of the block that would contain `key`.
    ///
    /// Returns None if `key` is lexicographically after the last key recorded.
    pub(crate) fn locate_with_key(&self, key: &[u8]) -> Option<u64> {
        match self {
            Self::V2(index) => {
                let block_id = index.locate_with_key(key)?;
                Some(block_id as u64)
            }
            Self::V3(index) => index.locate_with_key(key),
            Self::V3Empty(index) => index.locate_with_key(key),
        }
    }

    /// Get the [`BlockAddr`] of the block that would contain `key`.
    ///
    /// Returns None if `key` is lexicographically after the last key recorded.
    pub fn get_block_with_key(&self, key: &[u8]) -> Option<BlockAddr> {
        match self {
            Self::V2(index) => index.get_block_with_key(key),
            Self::V3(index) => index.get_block_with_key(key),
            Self::V3Empty(index) => index.get_block_with_key(key),
        }
    }

    /// Get the block id of the block containing the `ord`-th term.
    pub(crate) fn locate_with_ord(&self, ord: TermOrdinal) -> u64 {
        match self {
            Self::V2(index) => index.locate_with_ord(ord) as u64,
            Self::V3(index) => index.locate_with_ord(ord),
            Self::V3Empty(index) => index.locate_with_ord(ord),
        }
    }

    /// Get the [`BlockAddr`] of the block containing the `ord`-th term.
    pub(crate) fn get_block_with_ord(&self, ord: TermOrdinal) -> BlockAddr {
        match self {
            Self::V2(index) => index.get_block_with_ord(ord),
            Self::V3(index) => index.get_block_with_ord(ord),
            Self::V3Empty(index) => index.get_block_with_ord(ord),
        }
    }

    /// Iterates over the `(block id, block address)` pairs of the blocks selected for
    /// `automaton`.
    ///
    /// The `V3Empty` variant always yields its single block, with id 0, without consulting
    /// the automaton.
    pub fn get_block_for_automaton<'a>(
        &'a self,
        automaton: &'a impl Automaton,
    ) -> impl Iterator<Item = (u64, BlockAddr)> + 'a {
        match self {
            Self::V2(index) => BlockIter::V2(index.get_block_for_automaton(automaton)),
            Self::V3(index) => BlockIter::V3(index.get_block_for_automaton(automaton)),
            Self::V3Empty(index) => {
                let only_block = (0, index.block_addr.clone());
                BlockIter::V3Empty(std::iter::once(only_block))
            }
        }
    }
}

/// Iterator unifying the block iterators of the different index representations, so that
/// a single concrete type can be returned.
enum BlockIter<V2, V3, T> {
    V2(V2),
    V3(V3),
    V3Empty(std::iter::Once<T>),
}

impl<V2, V3, T> Iterator for BlockIter<V2, V3, T>
where
    V2: Iterator<Item = T>,
    V3: Iterator<Item = T>,
{
    type Item = T;

    /// Forwards to the wrapped iterator.
    fn next(&mut self) -> Option<T> {
        match self {
            Self::V2(inner) => inner.next(),
            Self::V3(inner) => inner.next(),
            Self::V3Empty(single) => single.next(),
        }
    }
}

/// Index made of an fst mapping keys to block ids, and of a store giving the address of
/// each block.
#[derive(Debug, Clone)]
pub struct SSTableIndexV3 {
    fst_index: Arc<Map<OwnedBytes>>,
    block_addr_store: BlockAddrStore,
}

impl SSTableIndexV3 {
    /// Load an index from its binary representation
    ///
    /// The first `fst_length` bytes of `data` hold the fst, the rest holds the block
    /// address store.
    ///
    /// # Errors
    ///
    /// Returns [`SSTableDataCorruption`] if `fst_length` exceeds the length of `data`, or
    /// if either part fails to load.
    pub fn load(
        data: OwnedBytes,
        fst_length: u64,
    ) -> Result<SSTableIndexV3, SSTableDataCorruption> {
        // `fst_length` comes from the file: reject a value that does not fit in `usize` or
        // that points past the end of `data`, instead of handing an out-of-range offset
        // to `split`.
        let fst_length = usize::try_from(fst_length).map_err(|_| SSTableDataCorruption)?;
        if fst_length > data.len() {
            return Err(SSTableDataCorruption);
        }
        let (fst_slice, block_addr_store_slice) = data.split(fst_length);
        let fst_index = Fst::new(fst_slice)
            .map_err(|_| SSTableDataCorruption)?
            .into();
        let block_addr_store =
            BlockAddrStore::open(block_addr_store_slice).map_err(|_| SSTableDataCorruption)?;

        Ok(SSTableIndexV3 {
            fst_index: Arc::new(fst_index),
            block_addr_store,
        })
    }

    /// Get the [`BlockAddr`] of the requested block.
    pub(crate) fn get_block(&self, block_id: u64) -> Option<BlockAddr> {
        self.block_addr_store.get(block_id)
    }

    /// Get the block id of the block that would contain `key`.
    ///
    /// Returns None if `key` is lexicographically after the last key recorded.
    pub(crate) fn locate_with_key(&self, key: &[u8]) -> Option<u64> {
        // The first fst entry greater or equal to `key` designates the block.
        self.fst_index
            .range()
            .ge(key)
            .into_stream()
            .next()
            .map(|(_key, id)| id)
    }

    /// Get the [`BlockAddr`] of the block that would contain `key`.
    ///
    /// Returns None if `key` is lexicographically after the last key recorded.
    pub fn get_block_with_key(&self, key: &[u8]) -> Option<BlockAddr> {
        self.locate_with_key(key).and_then(|id| self.get_block(id))
    }

    /// Get the block id of the block containing the `ord`-th term.
    pub(crate) fn locate_with_ord(&self, ord: TermOrdinal) -> u64 {
        self.block_addr_store.binary_search_ord(ord).0
    }

    /// Get the [`BlockAddr`] of the block containing the `ord`-th term.
    pub(crate) fn get_block_with_ord(&self, ord: TermOrdinal) -> BlockAddr {
        self.block_addr_store.binary_search_ord(ord).1
    }

    /// Iterates over the `(block id, block address)` pairs of the blocks that may contain
    /// a key matching `automaton`.
    pub(crate) fn get_block_for_automaton<'a>(
        &'a self,
        automaton: &'a impl Automaton,
    ) -> impl Iterator<Item = (u64, BlockAddr)> + 'a {
        // this is more complicated than other index formats: we don't have a ready made list of
        // blocks, and instead need to stream-decode the sstable.

        GetBlockForAutomaton {
            streamer: self.fst_index.stream(),
            block_addr_store: &self.block_addr_store,
            prev_key: None,
            automaton,
        }
    }
}

// TODO we iterate over the entire Map to find matching blocks,
// we could manually iterate on the underlying Fst and skip whole branches if our Automaton says
// it cannot match. This isn't as bad as it sounds given the fst is a lot smaller than the rest of
// the sstable.
// To do that, we can't use tantivy_fst's Stream with an automaton, as we need to know 2
// consecutive fst keys to form a proper opinion on whether this is a match, which we would want
// to translate into a single automaton.
/// Iterator state used by `SSTableIndexV3::get_block_for_automaton`.
struct GetBlockForAutomaton<'a, A: Automaton> {
    /// Stream over every `(key, block id)` entry of the fst index.
    streamer: tantivy_fst::map::Stream<'a>,
    /// Store used to turn a block id into its [`BlockAddr`].
    block_addr_store: &'a BlockAddrStore,
    /// Key of the previously streamed entry; `None` until the first entry has been read.
    prev_key: Option<Vec<u8>>,
    /// Automaton the block boundaries are tested against.
    automaton: &'a A,
}

impl<A: Automaton> Iterator for GetBlockForAutomaton<'_, A> {
    type Item = (u64, BlockAddr);

    /// Advance the fst stream until a block that may match the automaton is found.
    ///
    /// Each block is delimited by the previously streamed key (absent for the very first
    /// block) and its own key. The remembered key is refreshed on every step, whether or not
    /// the block is yielded.
    fn next(&mut self) -> Option<Self::Item> {
        while let Some((new_key, block_id)) = self.streamer.next() {
            let may_match = match self.prev_key.as_mut() {
                Some(prev_key) => {
                    let verdict =
                        can_block_match_automaton(Some(prev_key), new_key, self.automaton);
                    // reuse the existing allocation to remember the new boundary
                    prev_key.clear();
                    prev_key.extend_from_slice(new_key);
                    verdict
                }
                None => {
                    self.prev_key = Some(new_key.to_owned());
                    can_block_match_automaton(None, new_key, self.automaton)
                }
            };
            if may_match {
                return Some((block_id, self.block_addr_store.get(block_id).unwrap()));
            }
        }
        None
    }
}

/// Index variant that knows a single block address and answers every lookup with it.
#[derive(Debug, Clone)]
pub struct SSTableIndexV3Empty {
    /// The one and only block address this index can return.
    block_addr: BlockAddr,
}

impl SSTableIndexV3Empty {
    pub fn load(index_start_pos: usize) -> SSTableIndexV3Empty {
        SSTableIndexV3Empty {
            block_addr: BlockAddr {
                first_ordinal: 0,
                byte_range: 0..index_start_pos,
            },
        }
    }

    /// Get the [`BlockAddr`] of the requested block.
    pub(crate) fn get_block(&self, _block_id: u64) -> Option<BlockAddr> {
        Some(self.block_addr.clone())
    }

    /// Get the block id of the block that would contain `key`.
    ///
    /// Returns None if `key` is lexicographically after the last key recorded.
    pub(crate) fn locate_with_key(&self, _key: &[u8]) -> Option<u64> {
        Some(0)
    }

    /// Get the [`BlockAddr`] of the block that would contain `key`.
    ///
    /// Returns None if `key` is lexicographically after the last key recorded.
    pub fn get_block_with_key(&self, _key: &[u8]) -> Option<BlockAddr> {
        Some(self.block_addr.clone())
    }

    pub(crate) fn locate_with_ord(&self, _ord: TermOrdinal) -> u64 {
        0
    }

    /// Get the [`BlockAddr`] of the block containing the `ord`-th term.
    pub(crate) fn get_block_with_ord(&self, _ord: TermOrdinal) -> BlockAddr {
        self.block_addr.clone()
    }
}
/// Location of one block: where its bytes are and which term ordinal it starts at.
#[derive(Clone, Eq, PartialEq, Debug)]
pub struct BlockAddr {
    /// Ordinal of the first term stored in the block.
    pub first_ordinal: u64,
    /// Byte range covered by the block.
    pub byte_range: Range<usize>,
}

impl BlockAddr {
    fn to_block_start(&self) -> BlockStartAddr {
        BlockStartAddr {
            first_ordinal: self.first_ordinal,
            byte_range_start: self.byte_range.start,
        }
    }
}

/// A [`BlockAddr`] without the end of its byte range.
#[derive(Debug, Clone, PartialEq, Eq)]
struct BlockStartAddr {
    /// Ordinal of the first term stored in the block.
    first_ordinal: u64,
    /// Offset of the first byte of the block.
    byte_range_start: usize,
}

impl BlockStartAddr {
    /// Complete this start address into a full [`BlockAddr`] ending at `byte_range_end`.
    fn to_block_addr(&self, byte_range_end: usize) -> BlockAddr {
        let byte_range = self.byte_range_start..byte_range_end;
        BlockAddr {
            first_ordinal: self.first_ordinal,
            byte_range,
        }
    }
}

/// Metadata recorded by the index builder for one block: a key bounding the block's content
/// and the block's address.
#[derive(Debug, Clone)]
pub(crate) struct BlockMeta {
    /// Any byte string that is lexicographically greater or equal to
    /// the last key in the block,
    /// and yet strictly smaller than the first key in the next block.
    pub last_key_or_greater: Vec<u8>,
    /// Address of the block this metadata describes.
    pub block_addr: BlockAddr,
}

impl BinarySerializable for BlockStartAddr {
    /// Write the byte range start (widened to `u64`), then the first ordinal.
    fn serialize<W: Write + ?Sized>(&self, writer: &mut W) -> io::Result<()> {
        (self.byte_range_start as u64).serialize(writer)?;
        self.first_ordinal.serialize(writer)?;
        Ok(())
    }

    /// Read back the two `u64`s in the order `serialize` wrote them.
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        let raw_range_start = u64::deserialize(reader)?;
        let first_ordinal = u64::deserialize(reader)?;
        Ok(Self {
            first_ordinal,
            byte_range_start: raw_range_start as usize,
        })
    }

    // Provided method, overridden because the size is a compile time constant.
    fn num_bytes(&self) -> u64 {
        Self::SIZE_IN_BYTES as u64
    }
}

// A serialized `BlockStartAddr` is made of two `u64`s: the byte range start and the first
// ordinal.
impl FixedSize for BlockStartAddr {
    const SIZE_IN_BYTES: usize = 2 * u64::SIZE_IN_BYTES;
}

/// Given that `left < right`,
/// mutates `left` into a byte string `left'`, no longer than `left`, such that
/// `left <= left' < right`.
///
/// # Panics
///
/// Panics if `left` is not strictly smaller than `right`.
fn find_shorter_str_in_between(left: &mut Vec<u8>, right: &[u8]) {
    assert!(&left[..] < right);
    let common_len = common_prefix_len(left, right);
    if left.len() == common_len {
        // `left` is a prefix of `right`: there is nothing to cut.
        return;
    }
    // It is possible to do one character shorter in some cases,
    // but it is not worth the extra complexity.
    //
    // We look, after the first differing byte, for the first byte that can be incremented
    // without overflowing, bump it and drop everything that follows.
    let bump_pos = left
        .iter()
        .enumerate()
        .skip(common_len + 1)
        .find(|&(_, &byte)| byte != u8::MAX)
        .map(|(pos, _)| pos);
    if let Some(pos) = bump_pos {
        left[pos] += 1;
        left.truncate(pos + 1);
    }
}

/// Accumulates the metadata of every block, and serializes them as an index.
#[derive(Default)]
pub struct SSTableIndexBuilder {
    /// Blocks in the order they were added.
    blocks: Vec<BlockMeta>,
}

impl SSTableIndexBuilder {
    /// In order to make the index as light as possible, we
    /// try to replace the key recorded for the last block with a shorter one
    /// that is still smaller than the next key.
    ///
    /// Does nothing when no block was added yet.
    pub(crate) fn shorten_last_block_key_given_next_key(&mut self, next_key: &[u8]) {
        let Some(last_block) = self.blocks.last_mut() else {
            return;
        };
        find_shorter_str_in_between(&mut last_block.last_key_or_greater, next_key);
    }

    /// Record a new block ending with `last_key`, stored at `byte_range`, and whose first
    /// term has the ordinal `first_ordinal`.
    pub fn add_block(&mut self, last_key: &[u8], byte_range: Range<usize>, first_ordinal: u64) {
        let block_addr = BlockAddr {
            byte_range,
            first_ordinal,
        };
        self.blocks.push(BlockMeta {
            last_key_or_greater: last_key.to_vec(),
            block_addr,
        })
    }

    /// Write the index to `wrt`: first an fst mapping each block key to its position, then
    /// the block address store.
    ///
    /// Returns the number of bytes taken by the fst. With at most one block nothing is
    /// written at all and `0` is returned.
    pub fn serialize<W: std::io::Write>(&self, wrt: W) -> io::Result<u64> {
        if self.blocks.len() <= 1 {
            return Ok(0);
        }

        // fst part: block key -> block position
        let fst_writer = common::CountingWriter::wrap(wrt);
        let mut map_builder = MapBuilder::new(fst_writer).map_err(fst_error_to_io_error)?;
        for (block_id, block_meta) in (0u64..).zip(&self.blocks) {
            map_builder
                .insert(&block_meta.last_key_or_greater, block_id)
                .map_err(fst_error_to_io_error)?;
        }
        let fst_writer = map_builder.into_inner().map_err(fst_error_to_io_error)?;
        let fst_len = fst_writer.written_bytes();
        let mut wrt = fst_writer.finish();

        // block address store part
        let mut addr_store_writer = BlockAddrStoreWriter::new();
        for block_meta in self.blocks.iter() {
            addr_store_writer.write_block_meta(block_meta.block_addr.clone())?;
        }
        addr_store_writer.serialize(&mut wrt)?;

        Ok(fst_len)
    }
}

fn fst_error_to_io_error(error: tantivy_fst::Error) -> io::Error {
    match error {
        tantivy_fst::Error::Fst(fst_error) => io::Error::other(fst_error),
        tantivy_fst::Error::Io(ioerror) => ioerror,
    }
}

/// Number of block addresses grouped under a single `BlockAddrBlockMetadata` entry of the
/// block address store.
const STORE_BLOCK_LEN: usize = 128;

/// Metadata describing one group of bit-packed block addresses.
///
/// Addresses inside a group are stored as the difference to a linear prediction starting at
/// `ref_block_addr`.
#[derive(Debug)]
struct BlockAddrBlockMetadata {
    /// Offset, in the address buffer, at which the bit-packed data of this group starts.
    offset: u64,
    /// Start address of the first block of the group, stored in full.
    ref_block_addr: BlockStartAddr,
    /// Slope used to predict the start of the byte range of each block.
    range_start_slope: u32,
    /// Slope used to predict the first ordinal of each block.
    first_ordinal_slope: u32,
    /// Number of bits used by each packed byte range value.
    range_start_nbits: u8,
    /// Number of bits used by each packed first ordinal value.
    first_ordinal_nbits: u8,
    /// Number of blocks in the group, not counting the reference block.
    block_len: u16,
    // these fields are computed on deserialization, and not stored
    /// `1 << (range_start_nbits - 1)`, subtracted from packed byte range values on read.
    range_shift: i64,
    /// `1 << (first_ordinal_nbits - 1)`, subtracted from packed ordinal values on read.
    ordinal_shift: i64,
}

impl BlockAddrBlockMetadata {
    /// Number of bits taken by one packed entry: a byte range value followed by a first
    /// ordinal value.
    fn num_bits(&self) -> u8 {
        self.first_ordinal_nbits + self.range_start_nbits
    }

    /// Decode the address of the `inner_offset`-th block of this group.
    ///
    /// `data` is the bit-packed buffer, starting at this group. `inner_offset == 0`
    /// designates the reference block itself. Returns `None` when `inner_offset` is past the
    /// end of the group, or when `data` is too short to hold the requested entry.
    fn deserialize_block_addr(&self, data: &[u8], inner_offset: usize) -> Option<BlockAddr> {
        if inner_offset == 0 {
            // The reference block start is stored in full; only its end needs decoding, from
            // the very first packed byte range value.
            let range_end = self.ref_block_addr.byte_range_start
                + extract_bits(data, 0, self.range_start_nbits) as usize
                + self.range_start_slope as usize
                - self.range_shift as usize;
            return Some(self.ref_block_addr.to_block_addr(range_end));
        }
        // From here on, `inner_offset` is the index of the packed entry.
        let inner_offset = inner_offset - 1;
        if inner_offset >= self.block_len as usize {
            return None;
        }
        let num_bits = self.num_bits() as usize;

        // Bit positions of the values we need. The end of this block's byte range is the byte
        // range value of the next entry.
        let range_start_addr = num_bits * inner_offset;
        let ordinal_addr = range_start_addr + self.range_start_nbits as usize;
        let range_end_addr = range_start_addr + num_bits;

        // Make sure the last value we read lies entirely inside `data`.
        if (range_end_addr + self.range_start_nbits as usize).div_ceil(8) > data.len() {
            return None;
        }

        // Each value is: reference + packed value + linear prediction - shift.
        let range_start = self.ref_block_addr.byte_range_start
            + extract_bits(data, range_start_addr, self.range_start_nbits) as usize
            + self.range_start_slope as usize * (inner_offset + 1)
            - self.range_shift as usize;
        let first_ordinal = self.ref_block_addr.first_ordinal
            + extract_bits(data, ordinal_addr, self.first_ordinal_nbits)
            + self.first_ordinal_slope as u64 * (inner_offset + 1) as u64
            - self.ordinal_shift as u64;
        let range_end = self.ref_block_addr.byte_range_start
            + extract_bits(data, range_end_addr, self.range_start_nbits) as usize
            + self.range_start_slope as usize * (inner_offset + 2)
            - self.range_shift as usize;

        Some(BlockAddr {
            first_ordinal,
            byte_range: range_start..range_end,
        })
    }

    /// Search this group for the block containing the term of ordinal `target_ord`.
    ///
    /// Returns the position of that block inside the group (`0` being the reference block)
    /// along with its address.
    fn bisect_for_ord(&self, data: &[u8], target_ord: TermOrdinal) -> (u64, BlockAddr) {
        // Ordinals are compared relative to the reference block.
        let inner_target_ord = target_ord - self.ref_block_addr.first_ordinal;
        let num_bits = self.num_bits() as usize;
        let range_start_nbits = self.range_start_nbits as usize;
        // Decodes the (relative) first ordinal of the packed entry at `index`.
        let get_ord = |index| {
            extract_bits(
                data,
                num_bits * index as usize + range_start_nbits,
                self.first_ordinal_nbits,
            ) + self.first_ordinal_slope as u64 * (index + 1)
                - self.ordinal_shift as u64
        };

        let inner_offset = match binary_search(self.block_len as u64, |index| {
            get_ord(index).cmp(&inner_target_ord)
        }) {
            // Packed entry `i` is the block at position `i + 1`, position 0 being the
            // reference block.
            Ok(inner_offset) => inner_offset + 1,
            // Entry `i` starts after the target: the target is in the block right before it,
            // which is at position `i`.
            Err(inner_offset) => inner_offset,
        };
        // we can unwrap because inner_offset <= self.block_len
        (
            inner_offset,
            self.deserialize_block_addr(data, inner_offset as usize)
                .unwrap(),
        )
    }
}

// TODO move this function to tantivy_common?
/// Read `num_bits` bits of `data`, starting at the bit position `addr_bits`, as a little
/// endian integer.
///
/// Bytes missing past the end of `data` are read as zeros.
///
/// # Panics
///
/// Panics if `num_bits > 56`, or if the first byte addressed lies beyond the end of `data`.
#[inline(always)]
fn extract_bits(data: &[u8], addr_bits: usize, num_bits: u8) -> u64 {
    assert!(num_bits <= 56);
    let first_byte = addr_bits / 8;
    let shift_in_byte = (addr_bits % 8) as u64;
    let word: [u8; 8] = match data.get(first_byte..first_byte + 8) {
        Some(full_word) => full_word.try_into().unwrap(),
        None => {
            // Fewer than 8 bytes are left: copy what remains into a zero padded buffer.
            let tail = &data[first_byte..];
            let mut padded = [0u8; 8];
            padded[..tail.len()].copy_from_slice(tail);
            padded
        }
    };
    let low_bits_mask = (1u64 << u64::from(num_bits)) - 1;
    (u64::from_le_bytes(word) >> shift_in_byte) & low_bits_mask
}

impl BinarySerializable for BlockAddrBlockMetadata {
    /// Write every stored field. `range_shift` and `ordinal_shift` are not written, as they
    /// are derived from the bit widths on deserialization.
    fn serialize<W: Write + ?Sized>(&self, write: &mut W) -> io::Result<()> {
        self.offset.serialize(write)?;
        self.ref_block_addr.serialize(write)?;
        self.range_start_slope.serialize(write)?;
        self.first_ordinal_slope.serialize(write)?;
        // Note the order: the ordinal width is written before the range width.
        write.write_all(&[self.first_ordinal_nbits, self.range_start_nbits])?;
        self.block_len.serialize(write)
    }

    /// Read back the stored fields, and recompute the derived shifts.
    ///
    /// # Errors
    ///
    /// Besides read errors, returns an [`io::ErrorKind::InvalidData`] error when a bit width
    /// is not in `1..=56`. A width of 0 would underflow while computing the shift, and a
    /// width above 56 cannot be decoded by `extract_bits`.
    fn deserialize<R: Read>(reader: &mut R) -> io::Result<Self> {
        let offset = u64::deserialize(reader)?;
        let ref_block_addr = BlockStartAddr::deserialize(reader)?;
        let range_start_slope = u32::deserialize(reader)?;
        let first_ordinal_slope = u32::deserialize(reader)?;
        let mut buffer = [0u8; 2];
        reader.read_exact(&mut buffer)?;
        let [first_ordinal_nbits, range_start_nbits] = buffer;
        for nbits in [first_ordinal_nbits, range_start_nbits] {
            if !(1..=56).contains(&nbits) {
                return Err(io::Error::new(
                    io::ErrorKind::InvalidData,
                    format!("invalid bit width in block address metadata: {nbits}"),
                ));
            }
        }
        let block_len = u16::deserialize(reader)?;
        Ok(BlockAddrBlockMetadata {
            offset,
            ref_block_addr,
            range_start_slope,
            first_ordinal_slope,
            range_start_nbits,
            first_ordinal_nbits,
            block_len,
            range_shift: 1 << (range_start_nbits - 1),
            ordinal_shift: 1 << (first_ordinal_nbits - 1),
        })
    }
}

// Sum of the sizes of the serialized fields, in the order they are written: the offset, the
// reference block address, the two slopes, the two bit widths (one byte each) and the block
// length.
impl FixedSize for BlockAddrBlockMetadata {
    const SIZE_IN_BYTES: usize = u64::SIZE_IN_BYTES
        + BlockStartAddr::SIZE_IN_BYTES
        + 2 * u32::SIZE_IN_BYTES
        + 2
        + u16::SIZE_IN_BYTES;
}

/// Read-only store giving the [`BlockAddr`] of every block from its id.
#[derive(Debug, Clone)]
struct BlockAddrStore {
    /// Fixed-size `BlockAddrBlockMetadata` records, one per group of blocks.
    block_meta_bytes: OwnedBytes,
    /// Bit-packed addresses, located through the `offset` of each metadata record.
    addr_bytes: OwnedBytes,
}

impl BlockAddrStore {
    /// Split the serialized store into its metadata and address sections.
    ///
    /// The first 8 bytes hold the length of the metadata section; the addresses take
    /// whatever follows that section.
    fn open(term_info_store_file: OwnedBytes) -> io::Result<BlockAddrStore> {
        let (mut header, payload) = term_info_store_file.split(8);
        let meta_len = u64::deserialize(&mut header)? as usize;
        let (block_meta_bytes, addr_bytes) = payload.split(meta_len);
        Ok(BlockAddrStore {
            block_meta_bytes,
            addr_bytes,
        })
    }

    /// Decode the metadata of the `store_block_id`-th group of blocks, or `None` if it
    /// cannot be read.
    fn get_block_meta(&self, store_block_id: usize) -> Option<BlockAddrBlockMetadata> {
        let meta_start = store_block_id * BlockAddrBlockMetadata::SIZE_IN_BYTES;
        let mut meta_bytes: &[u8] = self.block_meta_bytes.get(meta_start..)?;
        BlockAddrBlockMetadata::deserialize(&mut meta_bytes).ok()
    }

    /// Get the address of the block `block_id`.
    fn get(&self, block_id: u64) -> Option<BlockAddr> {
        let block_id = block_id as usize;
        let store_block_id = block_id / STORE_BLOCK_LEN;
        let inner_offset = block_id % STORE_BLOCK_LEN;
        let group_meta = self.get_block_meta(store_block_id)?;
        let packed_addrs = &self.addr_bytes[group_meta.offset as usize..];
        group_meta.deserialize_block_addr(packed_addrs, inner_offset)
    }

    /// Find the block containing the term of ordinal `ord`, returning its id and address.
    ///
    /// The right group is found first, by bisecting on the first ordinal of each group, then
    /// the block is searched inside that group.
    fn binary_search_ord(&self, ord: TermOrdinal) -> (u64, BlockAddr) {
        let group_len = STORE_BLOCK_LEN as u64;
        let num_groups =
            (self.block_meta_bytes.len() / BlockAddrBlockMetadata::SIZE_IN_BYTES) as u64;
        let first_ordinal_of_group = |group_id: u64| {
            // we can unwrap because group_id < num_groups
            self.get(group_id * group_len).unwrap().first_ordinal
        };
        let group_id = match binary_search(num_groups, |group_id| {
            first_ordinal_of_group(group_id).cmp(&ord)
        }) {
            Ok(exact_group_id) => {
                // `ord` is the very first ordinal of a group
                let block_id = exact_group_id * group_len;
                // we can unwrap because exact_group_id < num_groups
                return (block_id, self.get(block_id).unwrap());
            }
            Err(next_group_id) => next_group_id - 1,
        };

        // we can unwrap because group_id < num_groups
        let group_meta = self.get_block_meta(group_id as usize).unwrap();
        let packed_addrs = &self.addr_bytes[group_meta.offset as usize..];
        let (inner_offset, block_addr) = group_meta.bisect_for_ord(packed_addrs, ord);
        (group_id * group_len + inner_offset, block_addr)
    }
}

/// Binary search over the indexes `0..max`.
///
/// `cmp_fn(index)` tells how the element at `index` compares to the target. Returns
/// `Ok(index)` when an element comparing equal is found, and otherwise `Err(index)` with the
/// position at which the target would have to be inserted.
fn binary_search(max: u64, cmp_fn: impl Fn(u64) -> std::cmp::Ordering) -> Result<u64, u64> {
    use std::cmp::Ordering;
    let (mut low, mut high) = (0u64, max);
    while low < high {
        let probe = low + (high - low) / 2;
        match cmp_fn(probe) {
            Ordering::Less => low = probe + 1,
            Ordering::Greater => high = probe,
            Ordering::Equal => return Ok(probe),
        }
    }
    Err(low)
}

/// Builds the serialized form read by `BlockAddrStore`.
struct BlockAddrStoreWriter {
    /// Serialized `BlockAddrBlockMetadata` of the groups flushed so far.
    buffer_block_metas: Vec<u8>,
    /// Bit-packed addresses of the groups flushed so far.
    buffer_addrs: Vec<u8>,
    /// Addresses of the group being built, not flushed yet.
    block_addrs: Vec<BlockAddr>,
}

impl BlockAddrStoreWriter {
    /// Create an empty writer.
    fn new() -> Self {
        BlockAddrStoreWriter {
            buffer_block_metas: Vec::new(),
            buffer_addrs: Vec::new(),
            block_addrs: Vec::with_capacity(STORE_BLOCK_LEN),
        }
    }

    /// Encode the pending addresses as one group: a metadata record plus bit-packed values.
    ///
    /// Does nothing when there is no pending address.
    fn flush_block(&mut self) -> io::Result<()> {
        if self.block_addrs.is_empty() {
            return Ok(());
        }
        // The first block is the reference: it is stored in full in the metadata.
        let ref_block_addr = self.block_addrs[0].clone();

        // Make every address relative to the reference block.
        for block_addr in &mut self.block_addrs {
            block_addr.byte_range.start -= ref_block_addr.byte_range.start;
            block_addr.first_ordinal -= ref_block_addr.first_ordinal;
        }

        // we are only called if block_addrs is not empty
        let mut last_block_addr = self.block_addrs.last().unwrap().clone();
        // Only byte range starts are stored, so the end of the last block is kept as an extra
        // trailing value.
        last_block_addr.byte_range.end -= ref_block_addr.byte_range.start;

        // we skip(1), so we never give an index of 0 to find_best_slope
        let (range_start_slope, range_start_nbits) = find_best_slope(
            self.block_addrs
                .iter()
                .map(|block| block.byte_range.start as u64)
                .chain(std::iter::once(last_block_addr.byte_range.end as u64))
                .enumerate()
                .skip(1),
        );

        // we skip(1), so we never give an index of 0 to find_best_slope
        let (first_ordinal_slope, first_ordinal_nbits) = find_best_slope(
            self.block_addrs
                .iter()
                .map(|block| block.first_ordinal)
                .enumerate()
                .skip(1),
        );

        // Added to each difference to the prediction before packing it; the reader subtracts
        // it back.
        let range_shift = 1 << (range_start_nbits - 1);
        let ordinal_shift = 1 << (first_ordinal_nbits - 1);

        let block_addr_block_meta = BlockAddrBlockMetadata {
            offset: self.buffer_addrs.len() as u64,
            ref_block_addr: ref_block_addr.to_block_start(),
            range_start_slope,
            first_ordinal_slope,
            range_start_nbits,
            first_ordinal_nbits,
            // the reference block is not counted
            block_len: self.block_addrs.len() as u16 - 1,
            range_shift,
            ordinal_shift,
        };
        block_addr_block_meta.serialize(&mut self.buffer_block_metas)?;

        let mut bit_packer = BitPacker::new();

        // One entry per block after the reference: the byte range start then the first
        // ordinal, both as shifted differences to the linear prediction.
        for (i, block_addr) in self.block_addrs.iter().enumerate().skip(1) {
            let range_pred = (range_start_slope as usize * i) as i64;
            bit_packer.write(
                (block_addr.byte_range.start as i64 - range_pred + range_shift) as u64,
                range_start_nbits,
                &mut self.buffer_addrs,
            )?;
            let first_ordinal_pred = (first_ordinal_slope as u64 * i as u64) as i64;
            bit_packer.write(
                (block_addr.first_ordinal as i64 - first_ordinal_pred + ordinal_shift) as u64,
                first_ordinal_nbits,
                &mut self.buffer_addrs,
            )?;
        }

        // Trailing value: the end of the byte range of the last block.
        let range_pred = (range_start_slope as usize * self.block_addrs.len()) as i64;
        bit_packer.write(
            (last_block_addr.byte_range.end as i64 - range_pred + range_shift) as u64,
            range_start_nbits,
            &mut self.buffer_addrs,
        )?;
        bit_packer.flush(&mut self.buffer_addrs)?;

        self.block_addrs.clear();
        Ok(())
    }

    /// Append a block address, flushing a group once `STORE_BLOCK_LEN` addresses are
    /// pending.
    fn write_block_meta(&mut self, block_addr: BlockAddr) -> io::Result<()> {
        self.block_addrs.push(block_addr);
        if self.block_addrs.len() >= STORE_BLOCK_LEN {
            self.flush_block()?;
        }
        Ok(())
    }

    /// Flush the pending addresses, then write the store to `wrt`: the length of the
    /// metadata section as a `u64`, the metadata section, and finally the packed addresses.
    fn serialize<W: std::io::Write>(&mut self, wrt: &mut W) -> io::Result<()> {
        self.flush_block()?;
        let len = self.buffer_block_metas.len() as u64;
        len.serialize(wrt)?;
        wrt.write_all(&self.buffer_block_metas)?;
        wrt.write_all(&self.buffer_addrs)?;
        Ok(())
    }
}

/// Given an iterator over `(index, value)`, returns a slope, and the number of bits needed
/// to represent the error of the prediction `slope * index` for every value.
///
/// The iterator may be empty, but all the indexes it yields must be non-zero.
fn find_best_slope(elements: impl Iterator<Item = (usize, u64)> + Clone) -> (u32, u8) {
    // Points having the lowest and the highest `value / index` ratio, as
    // `(slope, index, value)`. On ties, the latest point wins.
    let mut lowest: (u32, usize, u64) = (u32::MAX, 1, 0);
    let mut highest: (u32, usize, u64) = (0, 1, 0);
    for (index, value) in elements.clone() {
        let slope = (value / index as u64) as u32;
        if slope <= lowest.0 {
            lowest = (slope, index, value);
        }
        if slope >= highest.0 {
            highest = (slope, index, value);
        }
    }
    let (_, min_slope_idx, min_slope_val) = lowest;
    let (_, max_slope_idx, max_slope_val) = highest;

    // The above is a heuristic giving the "highest" and "lowest" points. It is imperfect in
    // that a point appearing early might have a large slope deviation, and yet a smaller
    // absolute deviation than a later point.
    // The actual best values could be obtained with the simplex method, but the improvement
    // is likely minimal, and the computation is way more complex.
    //
    // Assuming these points are the furthest up and down, we look for the slope causing the
    // same positive deviation for the highest point as negative deviation for the lowest
    // one. A is the optimal slope, B is the deviation from the guess:
    //
    // 0 = min_slope_val - min_slope_idx * A - B
    // 0 = max_slope_val - max_slope_idx * A + B
    //
    // 0 = min_slope_val + max_slope_val - (min_slope_idx + max_slope_idx) * A
    // (min_slope_val + max_slope_val) / (min_slope_idx + max_slope_idx) = A
    //
    // Half the denominator is added before dividing, to round instead of truncating.
    let denominator = (min_slope_idx + max_slope_idx) as u64;
    let rounded_numerator = min_slope_val + max_slope_val + denominator / 2;
    let final_slope = (rounded_numerator / denominator) as u32;

    // We don't solve for B: as our choice of points is suboptimal, it would only be a lower
    // bound. We go through every point to find the actual worst deviation instead.
    let max_derivation: u64 = elements
        .map(|(index, value)| {
            let predicted = final_slope as i64 * index as i64;
            (value as i64 - predicted).unsigned_abs()
        })
        .fold(0u64, u64::max);

    (final_slope, compute_num_bits(max_derivation) + 1)
}

#[cfg(test)]
mod tests {
    use common::OwnedBytes;

    use super::*;
    use crate::SSTableDataCorruption;
    use crate::block_match_automaton::tests::EqBuffer;

    // Builds a four block index, reloads it, and checks lookups by key and by ordinal.
    #[test]
    fn test_sstable_index() {
        let mut sstable_builder = SSTableIndexBuilder::default();
        sstable_builder.add_block(b"aaa", 10..20, 0u64);
        sstable_builder.add_block(b"bbbbbbb", 20..30, 5u64);
        sstable_builder.add_block(b"ccc", 30..40, 10u64);
        sstable_builder.add_block(b"dddd", 40..50, 15u64);
        let mut buffer: Vec<u8> = Vec::new();
        let fst_len = sstable_builder.serialize(&mut buffer).unwrap();
        let buffer = OwnedBytes::new(buffer);
        let sstable_index = SSTableIndexV3::load(buffer, fst_len).unwrap();
        // "bbbde" sorts after "bbbbbbb" and before "ccc": it belongs to the third block.
        assert_eq!(
            sstable_index.get_block_with_key(b"bbbde"),
            Some(BlockAddr {
                first_ordinal: 10u64,
                byte_range: 30..40
            })
        );

        assert_eq!(sstable_index.locate_with_key(b"aa").unwrap(), 0);
        assert_eq!(sstable_index.locate_with_key(b"aaa").unwrap(), 0);
        assert_eq!(sstable_index.locate_with_key(b"aab").unwrap(), 1);
        assert_eq!(sstable_index.locate_with_key(b"ccc").unwrap(), 2);
        // past the last recorded key
        assert!(sstable_index.locate_with_key(b"e").is_none());

        assert_eq!(sstable_index.locate_with_ord(0), 0);
        assert_eq!(sstable_index.locate_with_ord(1), 0);
        assert_eq!(sstable_index.locate_with_ord(4), 0);
        assert_eq!(sstable_index.locate_with_ord(5), 1);
        // ordinals past the start of the last block resolve to the last block
        assert_eq!(sstable_index.locate_with_ord(100), 3);
    }

    // Overwriting a byte of the serialized index must be reported as data corruption on load.
    #[test]
    fn test_sstable_with_corrupted_data() {
        let mut sstable_builder = SSTableIndexBuilder::default();
        sstable_builder.add_block(b"aaa", 10..20, 0u64);
        sstable_builder.add_block(b"bbbbbbb", 20..30, 5u64);
        sstable_builder.add_block(b"ccc", 30..40, 10u64);
        sstable_builder.add_block(b"dddd", 40..50, 15u64);
        let mut buffer: Vec<u8> = Vec::new();
        let fst_len = sstable_builder.serialize(&mut buffer).unwrap();
        buffer[2] = 9u8;
        let buffer = OwnedBytes::new(buffer);
        let data_corruption_err = SSTableIndexV3::load(buffer, fst_len).err().unwrap();
        assert!(matches!(data_corruption_err, SSTableDataCorruption));
    }

    // Checks the contract of `find_shorter_str_in_between`: the result is not longer than
    // `left`, and satisfies `left <= result < right`.
    #[track_caller]
    fn test_find_shorter_str_in_between_aux(left: &[u8], right: &[u8]) {
        let mut left_buf = left.to_vec();
        super::find_shorter_str_in_between(&mut left_buf, right);
        assert!(left_buf.len() <= left.len());
        assert!(left <= &left_buf);
        assert!(&left_buf[..] < right);
    }

    // Hand picked cases, including an empty `left`, a `left` that is a prefix of `right`,
    // and bytes that cannot be incremented.
    #[test]
    fn test_find_shorter_str_in_between() {
        test_find_shorter_str_in_between_aux(b"", b"hello");
        test_find_shorter_str_in_between_aux(b"abc", b"abcd");
        test_find_shorter_str_in_between_aux(b"abcd", b"abd");
        test_find_shorter_str_in_between_aux(&[0, 0, 0], &[1]);
        test_find_shorter_str_in_between_aux(&[0, 0, 0], &[0, 0, 1]);
        test_find_shorter_str_in_between_aux(&[0, 0, 255, 255, 255, 0u8], &[0, 1]);
    }

    use proptest::prelude::*;

    // Same contract, checked on random inputs. Pairs not satisfying `left < right` are
    // ignored, as they violate the precondition.
    proptest! {
        #![proptest_config(ProptestConfig::with_cases(100))]
        #[test]
        fn test_proptest_find_shorter_str(left in any::<Vec<u8>>(), right in any::<Vec<u8>>()) {
            if left < right {
                test_find_shorter_str_in_between_aux(&left, &right);
            }
        }
    }

    // Degenerate inputs of `find_best_slope`: no point at all, and a single point.
    #[test]
    fn test_find_best_slop() {
        assert_eq!(super::find_best_slope(std::iter::empty()), (0, 1));
        assert_eq!(
            super::find_best_slope(std::iter::once((1, 12345))),
            (12345, 1)
        );
    }

    // Builds a three block index, and checks which blocks are reported for automatons
    // matching a single key, no key of the index, and keys of two distinct blocks.
    #[test]
    fn test_get_block_for_automaton() {
        let sstable_index_builder = SSTableIndexBuilder {
            blocks: vec![
                BlockMeta {
                    last_key_or_greater: vec![0, 1, 2],
                    block_addr: BlockAddr {
                        first_ordinal: 0,
                        byte_range: 0..10,
                    },
                },
                BlockMeta {
                    last_key_or_greater: vec![0, 2, 2],
                    block_addr: BlockAddr {
                        first_ordinal: 5,
                        byte_range: 10..20,
                    },
                },
                BlockMeta {
                    last_key_or_greater: vec![0, 3, 2],
                    block_addr: BlockAddr {
                        first_ordinal: 10,
                        byte_range: 20..30,
                    },
                },
            ],
        };

        let mut sstable_index_bytes = Vec::new();
        let fst_len = sstable_index_builder
            .serialize(&mut sstable_index_bytes)
            .unwrap();

        let sstable = SSTableIndexV3::load(OwnedBytes::new(sstable_index_bytes), fst_len).unwrap();

        // a key of the first block
        let res = sstable
            .get_block_for_automaton(&EqBuffer(vec![0, 1, 1]))
            .collect::<Vec<_>>();
        assert_eq!(
            res,
            vec![(
                0,
                BlockAddr {
                    first_ordinal: 0,
                    byte_range: 0..10
                }
            )]
        );
        // a key of the second block
        let res = sstable
            .get_block_for_automaton(&EqBuffer(vec![0, 2, 1]))
            .collect::<Vec<_>>();
        assert_eq!(
            res,
            vec![(
                1,
                BlockAddr {
                    first_ordinal: 5,
                    byte_range: 10..20
                }
            )]
        );
        // a key of the third block
        let res = sstable
            .get_block_for_automaton(&EqBuffer(vec![0, 3, 1]))
            .collect::<Vec<_>>();
        assert_eq!(
            res,
            vec![(
                2,
                BlockAddr {
                    first_ordinal: 10,
                    byte_range: 20..30
                }
            )]
        );
        // a key sorting after every block
        let res = sstable
            .get_block_for_automaton(&EqBuffer(vec![0, 4, 1]))
            .collect::<Vec<_>>();
        assert!(res.is_empty());

        // keys of the first and of the third block: the second block must be skipped
        let complex_automaton = EqBuffer(vec![0, 1, 1]).union(EqBuffer(vec![0, 3, 1]));
        let res = sstable
            .get_block_for_automaton(&complex_automaton)
            .collect::<Vec<_>>();
        assert_eq!(
            res,
            vec![
                (
                    0,
                    BlockAddr {
                        first_ordinal: 0,
                        byte_range: 0..10
                    }
                ),
                (
                    2,
                    BlockAddr {
                        first_ordinal: 10,
                        byte_range: 20..30
                    }
                )
            ]
        );
    }
}


================================================
FILE: sstable/src/streamer.rs
================================================
use std::io;
use std::ops::Bound;

use tantivy_fst::Automaton;
use tantivy_fst::automaton::AlwaysMatch;

use crate::dictionary::Dictionary;
use crate::{DeltaReader, SSTable, TermOrdinal};

/// `StreamerBuilder` is a helper object used to define
/// a range of terms that should be streamed.
///
/// A new builder has no bound and no limit; they are set with the `ge`, `gt`, `le`, `lt`
/// and `limit` methods.
pub struct StreamerBuilder<'a, TSSTable, A = AlwaysMatch>
where
    A: Automaton,
    A::State: Clone,
    TSSTable: SSTable,
{
    /// Dictionary the terms are streamed from.
    term_dict: &'a Dictionary<TSSTable>,
    /// Automaton given at construction.
    automaton: A,
    /// Lower bound of the range of terms.
    lower: Bound<Vec<u8>>,
    /// Upper bound of the range of terms.
    upper: Bound<Vec<u8>>,
    /// Number of matching entries requested through `limit`, if any.
    limit: Option<u64>,
}

/// Borrows a bound over an owned byte vector as a bound over a byte slice,
/// keeping the kind of bound (included / excluded / unbounded) unchanged.
fn bound_as_byte_slice(bound: &Bound<Vec<u8>>) -> Bound<&[u8]> {
    bound.as_ref().map(Vec::as_slice)
}

impl<'a, TSSTable, A> StreamerBuilder<'a, TSSTable, A>
where
    A: Automaton,
    A::State: Clone,
    TSSTable: SSTable,
{
    /// Creates a builder streaming from `term_dict` and filtered by `automaton`.
    ///
    /// Both key bounds start out unbounded and no limit is set.
    pub(crate) fn new(term_dict: &'a Dictionary<TSSTable>, automaton: A) -> Self {
        Self {
            term_dict,
            automaton,
            limit: None,
            lower: Bound::Unbounded,
            upper: Bound::Unbounded,
        }
    }

    /// Limit the range to terms greater than or equal to the bound.
    pub fn ge<T: AsRef<[u8]>>(mut self, bound: T) -> Self {
        let key = bound.as_ref().to_vec();
        self.lower = Bound::Included(key);
        self
    }

    /// Limit the range to terms strictly greater than the bound.
    pub fn gt<T: AsRef<[u8]>>(mut self, bound: T) -> Self {
        let key = bound.as_ref().to_vec();
        self.lower = Bound::Excluded(key);
        self
    }

    /// Limit the range to terms lesser than or equal to the bound.
    pub fn le<T: AsRef<[u8]>>(mut self, bound: T) -> Self {
        let key = bound.as_ref().to_vec();
        self.upper = Bound::Included(key);
        self
    }

    /// Limit the range to terms strictly lesser than the bound.
    pub fn lt<T: AsRef<[u8]>>(mut self, bound: T) -> Self {
        let key = bound.as_ref().to_vec();
        self.upper = Bound::Excluded(key);
        self
    }

    /// Load no more data than what's required to get `limit`
    /// matching entries.
    ///
    /// The resulting [`Streamer`] can still return marginally
    /// more than `limit` elements.
    pub fn limit(mut self, limit: u64) -> Self {
        self.limit = Some(limit);
        self
    }

    /// Borrows the configured bounds as a `(lower, upper)` pair of byte-slice bounds.
    fn key_range(&self) -> (Bound<&[u8]>, Bound<&[u8]>) {
        (
            bound_as_byte_slice(&self.lower),
            bound_as_byte_slice(&self.upper),
        )
    }

    /// Asks the dictionary for a delta reader over the configured key range,
    /// limit and automaton.
    fn delta_reader(&self) -> io::Result<DeltaReader<TSSTable::ValueReader>> {
        self.term_dict.sstable_delta_reader_for_key_range(
            self.key_range(),
            self.limit,
            &self.automaton,
        )
    }

    /// Async counterpart of `delta_reader`; `merge_holes_under_bytes` is
    /// forwarded unchanged to the dictionary.
    async fn delta_reader_async(
        &self,
        merge_holes_under_bytes: usize,
    ) -> io::Result<DeltaReader<TSSTable::ValueReader>> {
        let pending_reader = self.term_dict.sstable_delta_reader_for_key_range_async(
            self.key_range(),
            self.limit,
            &self.automaton,
            merge_holes_under_bytes,
        );
        pending_reader.await
    }

    /// Assembles the `Streamer` around an already built `delta_reader`.
    fn into_stream_given_delta_reader(
        self,
        delta_reader: DeltaReader<<TSSTable as SSTable>::ValueReader>,
    ) -> io::Result<Streamer<'a, TSSTable, A>> {
        let start_state = self.automaton.start();

        // First ordinal of the block the index returns for the lower bound key;
        // 0 when there is no lower bound or no block is returned.
        let first_term = match bound_as_byte_slice(&self.lower) {
            Bound::Unbounded => 0,
            Bound::Included(key) | Bound::Excluded(key) => {
                let block = self.term_dict.sstable_index.get_block_with_key(key);
                block.map_or(0, |block| block.first_ordinal)
            }
        };
        // `Streamer::advance` bumps the ordinal before exposing an entry, so the
        // counter starts one below the first ordinal (`None` standing for "below 0").
        let term_ord = first_term.checked_sub(1);

        Ok(Streamer {
            automaton: self.automaton,
            states: vec![start_state],
            delta_reader,
            key: Vec::new(),
            term_ord,
            lower_bound: self.lower,
            upper_bound: self.upper,
            _lifetime: std::marker::PhantomData,
        })
    }

    /// See `into_stream(..)`
    pub async fn into_stream_async(self) -> io::Result<Streamer<'a, TSSTable, A>> {
        let merge_holes_under_bytes = 0;
        self.into_stream_async_merging_holes(merge_holes_under_bytes)
            .await
    }

    /// Same as `into_stream_async`, but tries to issue a single io operation when requesting
    /// blocks that are not consecutive, but also less than `merge_holes_under_bytes` bytes apart.
    pub async fn into_stream_async_merging_holes(
        self,
        merge_holes_under_bytes: usize,
    ) -> io::Result<Streamer<'a, TSSTable, A>> {
        let delta_reader = self.delta_reader_async(merge_holes_under_bytes).await?;
        self.into_stream_given_delta_reader(delta_reader)
    }

    /// Creates the stream corresponding to the range
    /// of terms defined using the `StreamerBuilder`.
    pub fn into_stream(self) -> io::Result<Streamer<'a, TSSTable, A>> {
        let delta_reader = self.delta_reader()?;
        self.into_stream_given_delta_reader(delta_reader)
    }
}

/// `Streamer` acts as a cursor over a range of terms of a segment.
/// Terms are guaranteed to be sorted.
pub struct Streamer<'a, TSSTable, A = AlwaysMatch>
where
    A: Automaton,
    A::State: Clone,
    TSSTable: SSTable,
{
    /// Automaton fed with the bytes of every key; only keys it matches are yielded.
    automaton: A,
    /// Stack of automaton states for the current key: the start state followed by
    /// the state reached after each key byte. Empty for `Streamer::empty()`.
    states: Vec<A::State>,
    /// Source of the entries: each one is a suffix appended to a prefix shared
    /// with the previous key.
    delta_reader: crate::DeltaReader<TSSTable::ValueReader>,
    /// Bytes of the key the stream is currently positioned on.
    key: Vec<u8>,
    /// Ordinal counter, incremented for every entry read by `advance()`.
    /// `None` means that the next entry read gets ordinal 0.
    term_ord: Option<TermOrdinal>,
    /// Lower bound on the yielded keys; reset to `Bound::Unbounded` once a key passed it.
    lower_bound: Bound<Vec<u8>>,
    /// Upper bound on the yielded keys; `advance()` returns `false` when a key exceeds it.
    upper_bound: Bound<Vec<u8>>,
    // this field is used to please the type-interface of a dictionary in tantivy
    _lifetime: std::marker::PhantomData<&'a ()>,
}

impl<TSSTable> Streamer<'_, TSSTable, AlwaysMatch>
where TSSTable: SSTable
{
    /// Builds a streamer on top of `DeltaReader::empty()`, with no key bounds,
    /// an empty key and no automaton state recorded.
    pub fn empty() -> Self {
        Self {
            delta_reader: DeltaReader::empty(),
            automaton: AlwaysMatch,
            states: Vec::new(),
            key: Vec::new(),
            term_ord: None,
            upper_bound: Bound::Unbounded,
            lower_bound: Bound::Unbounded,
            _lifetime: std::marker::PhantomData,
        }
    }
}

impl<TSSTable, A> Streamer<'_, TSSTable, A>
where
    A: Automaton,
    A::State: Clone,
    TSSTable: SSTable,
{
    /// Positions the stream on the next entry that lies within the key bounds
    /// and is matched by the automaton.
    ///
    /// Returns `true` if such an entry was found, and `false` once the underlying
    /// reader is exhausted or a key beyond the upper bound has been read.
    /// Before the first call to `.advance()`, the stream is in an
    /// uninitialized state.
    ///
    /// # Panics
    ///
    /// Panics if the underlying `DeltaReader` returns an error while advancing.
    pub fn advance(&mut self) -> bool {
        while self.delta_reader.advance().unwrap() {
            let next_ord = self
                .term_ord
                .map_or(0u64, |previous_ord| previous_ord + 1u64);
            self.term_ord = Some(next_ord);

            // The new key shares its first `shared_len` bytes with the previous key:
            // keep those bytes and the automaton states recorded for them.
            let shared_len = self.delta_reader.common_prefix_len();
            self.key.truncate(shared_len);
            self.states.truncate(shared_len + 1);

            // Feed the remaining bytes to the automaton, recording every state on the way.
            let mut state: A::State = self.states.last().unwrap().clone();
            for &byte in self.delta_reader.suffix() {
                state = self.automaton.accept(&state, byte);
                self.states.push(state.clone());
            }
            self.key.extend_from_slice(self.delta_reader.suffix());

            let below_lower_bound = match &self.lower_bound {
                Bound::Included(lower_bound_key) => self.key[..] < lower_bound_key[..],
                Bound::Excluded(lower_bound_key) => self.key[..] <= lower_bound_key[..],
                Bound::Unbounded => false,
            };
            if below_lower_bound {
                continue;
            }
            // The lower bound only needs to be cleared once: keys come in sorted
            // order, so every later key clears it as well.
            self.lower_bound = Bound::Unbounded;

            let beyond_upper_bound = match &self.upper_bound {
                Bound::Included(upper_bound_key) => self.key[..] > upper_bound_key[..],
                Bound::Excluded(upper_bound_key) => self.key[..] >= upper_bound_key[..],
                Bound::Unbounded => false,
            };
            if beyond_upper_bound {
                return false;
            }
            if self.automaton.is_match(&state) {
                return true;
            }
        }
        false
    }

    /// Returns the `TermOrdinal` of the current term.
    ///
    /// Returns `0` when no ordinal has been recorded yet.
    pub fn term_ord(&self) -> TermOrdinal {
        match self.term_ord {
            Some(term_ord) => term_ord,
            None => 0u64,
        }
    }

    /// Accesses the current key.
    ///
    /// `.key()` returns the key that was returned by the last call to `.next()`.
    ///
    /// Once the end of the stream has been reached, `.key()` keeps returning
    /// the last key that was read.
    ///
    /// Before any call to `.next()`, `.key()` returns an empty slice.
    pub fn key(&self) -> &[u8] {
        self.key.as_slice()
    }

    /// Accesses the current value.
    ///
    /// The call is forwarded to `DeltaReader::value`, which also decides what is
    /// returned before the first call to `.advance()` or after the end of the stream.
    pub fn value(&self) -> &TSSTable::Value {
        self.delta_reader.value()
    }

    /// Advances the stream and returns the `(key, value)` pair it is then
    /// positioned on, or `None` if `.advance()` returned `false`.
    #[expect(clippy::should_implement_trait)]
    pub fn next(&mut self) -> Option<(&[u8], &TSSTable::Value)> {
        if !self.advance() {
            return None;
        }
        Some((self.key(), self.value()))
    }
}

#[cfg(test)]
mod tests {
    use std::io;

    use common::OwnedBytes;

    use crate::{Dictionary, MonotonicU64SSTable};

    /// Keys of the test dictionary, in sorted order; the key at index `i` is mapped to `i`.
    const TEST_KEYS: [&[u8]; 4] = [b"abaisance", b"abalation", b"abalienate", b"abandon"];

    /// Builds an in-memory dictionary holding `TEST_KEYS`.
    fn create_test_dictionary() -> io::Result<Dictionary<MonotonicU64SSTable>> {
        let mut dict_builder = Dictionary::<MonotonicU64SSTable>::builder(Vec::new())?;
        for (value, key) in (0u64..).zip(TEST_KEYS) {
            dict_builder.insert(key, &value)?;
        }
        let owned_bytes = OwnedBytes::new(dict_builder.finish()?);
        Dictionary::from_bytes(owned_bytes)
    }

    #[test]
    fn test_sstable_stream() -> io::Result<()> {
        let dict = create_test_dictionary()?;
        let mut streamer = dict.stream()?;
        for (expected_value, expected_key) in (0u64..).zip(TEST_KEYS) {
            assert!(streamer.advance());
            assert_eq!(streamer.key(), expected_key);
            assert_eq!(streamer.value(), &expected_value);
        }
        assert!(!streamer.advance());
        Ok(())
    }

    #[test]
    fn test_sstable_search() -> io::Result<()> {
        let term_dict = create_test_dictionary()?;
        let ptn = tantivy_fst::Regex::new("ab.*t.*").unwrap();
        let mut term_streamer = term_dict.search(ptn).into_stream()?;
        // The pattern is expected to match the keys stored under 1 and 2 only.
        for expected_value in [1u64, 2u64] {
            assert!(term_streamer.advance());
            assert_eq!(term_streamer.key(), TEST_KEYS[expected_value as usize]);
            assert_eq!(term_streamer.value(), &expected_value);
        }
        assert!(!term_streamer.advance());
        Ok(())
    }

    // TODO add test for sparse search with a block of poison (starts with 0xffffffff) => such a
    // block instantly causes an unexpected EOF error
}


================================================
FILE: sstable/src/value/index.rs
================================================
use std::io;

use crate::value::{ValueReader, ValueWriter, deserialize_vint_u64};
use crate::{BlockAddr, vint};

/// Decodes blocks of `BlockAddr` values.
///
/// A block holds the number of values and the byte offset at which the first
/// range starts, followed by one `(length, ordinal delta)` pair per value.
/// Every integer is vint-encoded.
#[derive(Default)]
pub(crate) struct IndexValueReader {
    vals: Vec<BlockAddr>,
}

impl ValueReader for IndexValueReader {
    type Value = BlockAddr;

    #[inline(always)]
    fn value(&self, idx: usize) -> &Self::Value {
        &self.vals[idx]
    }

    fn load(&mut self, mut data: &[u8]) -> io::Result<usize> {
        let initial_len = data.len();
        let num_vals = deserialize_vint_u64(&mut data) as usize;
        self.vals.clear();

        // Byte ranges are laid out back to back: each one starts where the previous ended.
        let mut range_start = deserialize_vint_u64(&mut data) as usize;
        let mut first_ordinal = 0u64;
        for _ in 0..num_vals {
            let range_len = deserialize_vint_u64(&mut data) as usize;
            first_ordinal += deserialize_vint_u64(&mut data);

            let range_end = range_start + range_len;
            self.vals.push(BlockAddr {
                byte_range: range_start..range_end,
                first_ordinal,
            });
            range_start = range_end;
        }
        Ok(initial_len - data.len())
    }
}

/// Accumulates `BlockAddr` values and serializes them as a single block.
#[derive(Default)]
pub(crate) struct IndexValueWriter {
    vals: Vec<BlockAddr>,
}

impl ValueWriter for IndexValueWriter {
    type Value = BlockAddr;

    fn write(&mut self, val: &Self::Value) {
        self.vals.push(val.clone());
    }

    fn serialize_block(&self, output: &mut Vec<u8>) {
        vint::serialize_into_vec(self.vals.len() as u64, output);

        let start_pos = self
            .vals
            .first()
            .map_or(0, |block_addr| block_addr.byte_range.start as u64);
        vint::serialize_into_vec(start_pos, output);

        let mut prev_ord = 0u64;
        for (idx, current) in self.vals.iter().enumerate() {
            // Every entry but the last is measured up to the start of its successor;
            // the last entry is measured up to its own end.
            let range_end = match self.vals.get(idx + 1) {
                Some(next) => next.byte_range.start,
                None => current.byte_range.end,
            };
            let len = range_end - current.byte_range.start;
            vint::serialize_into_vec(len as u64, output);
            vint::serialize_into_vec(current.first_ordinal - prev_ord, output);
            prev_ord = current.first_ordinal;
        }
    }

    fn clear(&mut self) {
        self.vals.clear();
    }
}

#[cfg(test)]
mod tests {
    use std::ops::Range;

    use super::*;

    /// Shorthand to build a `BlockAddr`.
    fn block_addr(byte_range: Range<usize>, first_ordinal: u64) -> BlockAddr {
        BlockAddr {
            byte_range,
            first_ordinal,
        }
    }

    /// Round-trips `block_addrs` through `IndexValueWriter` and `IndexValueReader`.
    fn check_roundtrip(block_addrs: &[BlockAddr]) {
        crate::value::tests::test_value_reader_writer::<_, IndexValueReader, IndexValueWriter>(
            block_addrs,
        );
    }

    #[test]
    fn test_index_reader_writer() {
        check_roundtrip(&[]);
        check_roundtrip(&[block_addr(0..10, 0)]);
        check_roundtrip(&[block_addr(0..10, 0), block_addr(10..20, 5)]);
        check_roundtrip(&[
            block_addr(0..10, 0),
            block_addr(10..20, 5),
            block_addr(20..30, 10),
        ]);
        check_roundtrip(&[block_addr(5..10, 2)]);
    }
}


================================================
FILE: sstable/src/value/mod.rs
================================================
pub(crate) mod index;
mod range;
mod u64_monotonic;
mod vec_u32;
mod void;

use std::io;

pub use range::{RangeValueReader, RangeValueWriter};
pub use u64_monotonic::{U64MonotonicValueReader, U64MonotonicValueWriter};
pub use vec_u32::{VecU32ValueReader, VecU32ValueWriter};
pub use void::{VoidValueReader, VoidValueWriter};

/// `ValueReader` is a trait describing the contract of something
/// reading blocks of values, and offering random access within these values.
pub trait ValueReader: Default {
    /// Type of the value being read.
    type Value;

    /// Access the value at index `idx`, in the last block that was loaded
    /// via a call to `ValueReader::load`.
    fn value(&self, idx: usize) -> &Self::Value;

    /// Loads a block located at the beginning of `data`.
    ///
    /// `data` is allowed to extend past the end of the block.
    ///
    /// Returns the number of bytes that were read.
    fn load(&mut self, data: &[u8]) -> io::Result<usize>;
}

/// `ValueWriter` is a trait to make it possible to write blocks
/// of values.
pub trait ValueWriter: Default {
    /// Type of the value being written.
    type Value;

    /// Records a new value.
    /// This method usually just accumulates data in a `Vec`,
    /// only to be serialized on the call to `ValueWriter::serialize_block`.
    fn write(&mut self, val: &Self::Value);

    /// Serializes the accumulated values by appending them to the output buffer.
    ///
    /// The accumulated values are left untouched: call `ValueWriter::clear`
    /// before starting a new block.
    fn serialize_block(&self, output: &mut Vec<u8>);

    /// Clears the `ValueWriter`. After a call to clear, the `ValueWriter`
    /// should behave like a fresh `ValueWriter::default()`.
    fn clear(&mut self);
}

/// Decodes one vint-encoded `u64` from the front of `data`, and advances
/// `data` past the bytes that were consumed.
fn deserialize_vint_u64(data: &mut &[u8]) -> u64 {
    let input: &[u8] = *data;
    let (consumed, decoded) = super::vint::deserialize_read(input);
    *data = &input[consumed..];
    decoded
}

#[cfg(test)]
pub(crate) mod tests {
    use std::fmt;

    use super::{ValueReader, ValueWriter};

    /// Writes `value_block` with `TWriter`, appends unrelated trailing bytes, and
    /// checks that `TReader` consumes exactly the serialized block and gives back
    /// the same values.
    pub(crate) fn test_value_reader_writer<
        V: Eq + fmt::Debug,
        TReader: ValueReader<Value = V>,
        TWriter: ValueWriter<Value = V>,
    >(
        value_block: &[V],
    ) {
        let mut writer = TWriter::default();
        value_block.iter().for_each(|value| writer.write(value));
        let mut buffer = Vec::new();
        writer.serialize_block(&mut buffer);
        writer.clear();

        // The reader must stop at the end of the block, whatever follows it.
        let block_len = buffer.len();
        buffer.extend_from_slice(b"extradata");

        let mut reader = TReader::default();
        let consumed = reader.load(&buffer).unwrap();
        assert_eq!(consumed, block_len);
        for (idx, expected) in value_block.iter().enumerate() {
            assert_eq!(reader.value(idx), expected);
        }
    }
}


================================================
FILE: sstable/src/value/range.rs
================================================
use std::io;
use std::ops::Range;

use crate::value::{ValueReader, ValueWriter, deserialize_vint_u64};

/// Reads blocks of `Range<u64>` values in which every range starts where the
/// previous one ends.
///
/// A block holds the number of range boundaries, the start of the first range,
/// and then the length of every range. Every integer is vint-encoded.
#[derive(Default)]
pub struct RangeValueReader {
    vals: Vec<Range<u64>>,
}

impl ValueReader for RangeValueReader {
    type Value = Range<u64>;

    #[inline(always)]
    fn value(&self, idx: usize) -> &Range<u64> {
        &self.vals[idx]
    }

    fn load(&mut self, mut data: &[u8]) -> io::Result<usize> {
        self.vals.clear();
        let initial_len = data.len();
        let num_boundaries = deserialize_vint_u64(&mut data) as usize;
        if num_boundaries > 0 {
            // The first boundary is stored as is; every following one as the
            // length of the range it closes.
            let mut range_start = deserialize_vint_u64(&mut data);
            for _ in 1..num_boundaries {
                let range_end = range_start + deserialize_vint_u64(&mut data);
                self.vals.push(range_start..range_end);
                range_start = range_end;
            }
        }
        Ok(initial_len - data.len())
    }
}

/// Range writer. The ranges are required to partition the space.
///
/// In other words, two consecutive keys `k1` and `k2`
/// are required to satisfy
/// `range_sstable[k1].end == range_sstable[k2].start`.
///
/// The writer panics if an inserted value does not follow
/// this property.
///
/// The first range is not required to start at `0`.
#[derive(Default)]
pub struct RangeValueWriter {
    // Range boundaries: the start of the first range, then the end of every range.
    vals: Vec<u64>,
}

impl ValueWriter for RangeValueWriter {
    type Value = Range<u64>;

    fn write(&mut self, val: &Range<u64>) {
        match self.vals.last().copied() {
            // Not the first range: it has to start where the previous one ended.
            Some(previous_offset) => assert_eq!(previous_offset, val.start),
            None => self.vals.push(val.start),
        }
        self.vals.push(val.end);
    }

    fn serialize_block(&self, writer: &mut Vec<u8>) {
        let mut previous_boundary = 0u64;
        crate::vint::serialize_into_vec(self.vals.len() as u64, writer);
        for &boundary in &self.vals {
            crate::vint::serialize_into_vec(boundary - previous_boundary, writer);
            previous_boundary = boundary;
        }
    }

    fn clear(&mut self) {
        self.vals.clear();
    }
}

#[cfg(test)]
#[expect(clippy::single_range_in_vec_init)]
mod tests {
    use super::*;

    /// Round-trips `ranges` through `RangeValueWriter` and `RangeValueReader`.
    fn check_roundtrip(ranges: &[Range<u64>]) {
        crate::value::tests::test_value_reader_writer::<_, RangeValueReader, RangeValueWriter>(
            ranges,
        );
    }

    #[test]
    fn test_range_reader_writer() {
        check_roundtrip(&[]);
        check_roundtrip(&[0..3]);
        check_roundtrip(&[0..3, 3..10]);
        check_roundtrip(&[0..0, 0..10]);
        check_roundtrip(&[100..110, 110..121, 121..1250]);
    }

    #[test]
    #[should_panic]
    fn test_range_reader_writer_panics() {
        // `4` does not match the end of the previous range: the writer must refuse it.
        check_roundtrip(&[1..3, 4..10]);
    }
}


================================================
FILE: sstable/src/value/u64_monotonic.rs
================================================
use std::io;

use crate::value::{ValueReader, ValueWriter, deserialize_vint_u64};
use crate::vint;

/// Reads blocks of `u64` values stored as the number of values followed by
/// the vint-encoded difference between each value and the previous one
/// (the first value being compared to `0`).
#[derive(Default)]
pub struct U64MonotonicValueReader {
    vals: Vec<u64>,
}

impl ValueReader for U64MonotonicValueReader {
    type Value = u64;

    #[inline(always)]
    fn value(&self, idx: usize) -> &Self::Value {
        &self.vals[idx]
    }

    fn load(&mut self, mut data: &[u8]) -> io::Result<usize> {
        let initial_len = data.len();
        let num_vals = deserialize_vint_u64(&mut data) as usize;
        self.vals.clear();
        // Running sum of the deltas, i.e. the value currently being rebuilt.
        let mut current_val = 0u64;
        for _ in 0..num_vals {
            current_val += deserialize_vint_u64(&mut data);
            self.vals.push(current_val);
        }
        Ok(initial_len - data.len())
    }
}

/// Writes blocks of `u64` values as the number of values followed by the
/// vint-encoded difference between each value and the previous one.
///
/// Values have to be written in non-decreasing order, otherwise computing the
/// difference underflows.
#[derive(Default)]
pub struct U64MonotonicValueWriter {
    vals: Vec<u64>,
}

impl ValueWriter for U64MonotonicValueWriter {
    type Value = u64;

    fn write(&mut self, val: &Self::Value) {
        self.vals.push(*val);
    }

    fn serialize_block(&self, output: &mut Vec<u8>) {
        let mut previous = 0u64;
        vint::serialize_into_vec(self.vals.len() as u64, output);
        for &current in &self.vals {
            vint::serialize_into_vec(current - previous, output);
            previous = current;
        }
    }

    fn clear(&mut self) {
        self.vals.clear();
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Round-trips `vals` through `U64MonotonicValueWriter` and `U64MonotonicValueReader`.
    fn check_roundtrip(vals: &[u64]) {
        crate::value::tests::test_value_reader_writer::<
            _,
            U64MonotonicValueReader,
            U64MonotonicValueWriter,
        >(vals);
    }

    #[test]
    fn test_u64_monotonic_reader_writer() {
        check_roundtrip(&[]);
        check_roundtrip(&[5]);
        check_roundtrip(&[1u64, 30u64]);
    }
}


================================================
FILE: sstable/src/value/vec_u32.rs
================================================
use std::io;

use super::{ValueReader, ValueWriter};

/// Reads blocks of `Vec<u32>` values.
///
/// A block is a sequence of little-endian `u32`: the number of values, then,
/// for each value, its number of elements followed by the elements themselves.
#[derive(Default)]
pub struct VecU32ValueReader {
    vals: Vec<Vec<u32>>,
}

impl ValueReader for VecU32ValueReader {
    type Value = Vec<u32>;

    #[inline(always)]
    fn value(&self, idx: usize) -> &Self::Value {
        &self.vals[idx]
    }

    /// Decodes the block located at the beginning of `data`, replacing the
    /// values loaded by a previous call.
    ///
    /// Returns the number of bytes consumed.
    ///
    /// # Errors
    ///
    /// Returns an error of kind `io::ErrorKind::UnexpectedEof` if `data` ends
    /// before the block is complete. In that case, the values decoded so far
    /// are left in the reader.
    fn load(&mut self, mut data: &[u8]) -> io::Result<usize> {
        /// Error reported when the block announces more bytes than `data` holds.
        fn truncated_block() -> io::Error {
            io::Error::new(
                io::ErrorKind::UnexpectedEof,
                "truncated VecU32 value block",
            )
        }

        /// Pops a little-endian `u32` off the front of `data`.
        fn read_u32(data: &mut &[u8]) -> io::Result<u32> {
            let bytes: [u8; 4] = data
                .get(..4)
                .and_then(|prefix| prefix.try_into().ok())
                .ok_or_else(truncated_block)?;
            *data = &data[4..];
            Ok(u32::from_le_bytes(bytes))
        }

        let original_num_bytes = data.len();
        self.vals.clear();

        let num_vals = read_u32(&mut data)? as usize;
        for _ in 0..num_vals {
            let num_elems = read_u32(&mut data)? as usize;

            // Make sure the announced payload is really there before allocating
            // for it: a corrupted length must not trigger a huge allocation.
            let payload_len = num_elems
                .checked_mul(4)
                .filter(|&payload_len| payload_len <= data.len())
                .ok_or_else(truncated_block)?;
            let (payload, rest) = data.split_at(payload_len);

            let elems = payload
                .chunks_exact(4)
                .map(|chunk| {
                    let bytes = chunk
                        .try_into()
                        .expect("chunks_exact(4) only yields 4-byte chunks");
                    u32::from_le_bytes(bytes)
                })
                .collect();
            self.vals.push(elems);
            data = rest;
        }

        Ok(original_num_bytes - data.len())
    }
}

/// Writes blocks of `Vec<u32>` values.
///
/// A block is a sequence of little-endian `u32`: the number of values, then,
/// for each value, its number of elements followed by the elements themselves.
#[derive(Default)]
pub struct VecU32ValueWriter {
    vals: Vec<Vec<u32>>,
}

impl ValueWriter for VecU32ValueWriter {
    type Value = Vec<u32>;

    fn write(&mut self, val: &Self::Value) {
        self.vals.push(val.clone());
    }

    fn serialize_block(&self, output: &mut Vec<u8>) {
        let num_vals = self.vals.len() as u32;
        output.extend_from_slice(&num_vals.to_le_bytes());
        for val in &self.vals {
            let num_elems = val.len() as u32;
            output.extend_from_slice(&num_elems.to_le_bytes());
            output.extend(val.iter().flat_map(|elem| elem.to_le_bytes()));
        }
    }

    fn clear(&mut self) {
        self.vals.clear();
    }
}


================================================
FILE: sstable/src/value/void.rs
================================================
use std::io;

use crate::value::{ValueReader, ValueWriter};

/// Value reader for sstables that carry no value: every value is `()`.
#[derive(Default)]
pub struct VoidValueReader;

impl ValueReader for VoidValueReader {
    type Value = ();

    /// Returns a reference to `()`, whatever `_idx` is.
    #[inline(always)]
    fn value(&self, _idx: usize) -> &() {
        &()
    }

    /// Reads nothing from `_data` and reports that zero bytes were consumed.
    fn load(&mut self, _data: &[u8]) -> io::Result<usize> {
        Ok(0)
    }
}

/// Value writer for sstables that carry no value: nothing is stored and
/// nothing is serialized.
#[derive(Default)]
pub struct VoidValueWriter;

impl ValueWriter for VoidValueWriter {
    type Value = ();

    /// No-op: there is nothing to record for a `()` value.
    fn write(&mut self, _val: &()) {}

    /// No-op: a block of `()` values takes zero bytes.
    fn serialize_block(&self, _output: &mut Vec<u8>) {}

    /// No-op: the writer holds no state.
    fn clear(&mut self) {}
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Round-trips `values` through `VoidValueWriter` and `VoidValueReader`.
    fn check_roundtrip(values: &[()]) {
        crate::value::tests::test_value_reader_writer::<_, VoidValueReader, VoidValueWriter>(
            values,
        );
    }

    // Named after the void reader/writer it exercises (the previous name,
    // `test_range_reader_writer`, belonged to the range value tests).
    #[test]
    fn test_void_reader_writer() {
        check_roundtrip(&[]);
        check_roundtrip(&[()]);
        check_roundtrip(&[(), (), ()]);
    }
}


================================================
FILE: sstable/src/vint.rs
================================================
// High bit of a vint byte: set on every byte except the last one of an encoded value.
const CONTINUE_BIT: u8 = 128u8;

/// Writes `val` as a vint at the beginning of `buffer`, 7 bits per byte,
/// least significant bits first.
///
/// Returns the number of bytes written. A `u64` takes at most 10 bytes; if
/// `buffer` runs out before `val` is fully written, `10` is returned.
pub fn serialize(mut val: u64, buffer: &mut [u8]) -> usize {
    let mut written = 0usize;
    for slot in buffer.iter_mut() {
        let low_bits = (val & 0x7f) as u8;
        val >>= 7;
        written += 1;
        if val == 0 {
            *slot = low_bits;
            return written;
        }
        *slot = low_bits | CONTINUE_BIT;
    }
    10 //< only reached when `buffer` is too short for `val`
}

/// Appends the vint encoding of `val` to `buffer`.
pub fn serialize_into_vec(val: u64, buffer: &mut Vec<u8>) {
    // 10 bytes is the longest encoding `serialize` produces for a `u64`.
    let mut scratch = [0u8; 10];
    let encoded_len = serialize(val, &mut scratch);
    buffer.extend_from_slice(&scratch[..encoded_len]);
}

// super slow but we don't care
/// Decodes the vint located at the beginning of `buf`.
///
/// Returns `(consumed, value)`, `consumed` being the number of bytes that were
/// read. Decoding stops at the first byte whose high (continuation) bit is
/// not set, at the end of `buf`, or after 10 bytes, whichever comes first.
///
/// A `u64` never takes more than 10 bytes, so longer runs of continuation
/// bytes can only come from corrupted data. Capping the decoding keeps the
/// shift below 64 bits instead of overflowing on such input.
pub fn deserialize_read(buf: &[u8]) -> (usize, u64) {
    // ceil(64 / 7): number of 7-bit groups needed to cover a `u64`.
    const MAX_VINT_LEN: usize = 10;

    let mut result = 0u64;
    let mut consumed = 0;

    for (idx, &b) in buf.iter().take(MAX_VINT_LEN).enumerate() {
        consumed = idx + 1;
        // The low 7 bits are payload, the high bit is the continuation flag.
        result |= u64::from(b & 0x7f) << (7 * idx);
        if (b & 0x80) == 0 {
            break;
        }
    }
    (consumed, result)
}

#[cfg(test)]
mod tests {
    use super::{deserialize_read, serialize};

    /// Checks that `val` is serialized on exactly `expect_len` bytes, and that
    /// decoding these bytes gives `val` back.
    fn aux_test_int(val: u64, expect_len: usize) {
        let mut buffer = [0u8; 14];
        let written = serialize(val, &mut buffer[..]);
        assert_eq!(written, expect_len);
        let decoded = deserialize_read(&buffer);
        assert_eq!(decoded, (expect_len, val));
    }

    #[test]
    fn test_vint() {
        let fixed_cases = [
            (0u64, 1usize),
            (17u64, 1),
            (127u64, 1),
            (128u64, 2),
            (123423418u64, 4),
        ];
        for (val, expect_len) in fixed_cases {
            aux_test_int(val, expect_len);
        }
        // Around every power of two: the encoding grows by one byte every 7 bits.
        for i in 1..63 {
            let power_of_two = 1u64 << i;
            aux_test_int(power_of_two + 1, (i / 7) + 1);
            aux_test_int(power_of_two, (i / 7) + 1);
            aux_test_int(power_of_two - 1, ((i - 1) / 7) + 1);
        }
        aux_test_int(u64::MAX, 10);
    }
}


================================================
FILE: sstable/tests/sstable_test.rs
================================================
use common::OwnedBytes;
use tantivy_sstable::{Dictionary, MonotonicU64SSTable, VecU32ValueSSTable};

#[test]
fn test_create_and_search_sstable() {
    // Build an sstable in memory, inserting the keys in sorted order.
    let mut builder = Dictionary::<MonotonicU64SSTable>::builder(Vec::new()).unwrap();
    let entries = [
        (&b"apple"[..], 1u64),
        (&b"banana"[..], 2u64),
        (&b"orange"[..], 3u64),
    ];
    for (key, value) in entries {
        builder.insert(key, &value).unwrap();
    }
    let sstable_bytes = OwnedBytes::new(builder.finish().unwrap());

    // Reopen it from the serialized bytes.
    let sstable = Dictionary::<MonotonicU64SSTable>::from_bytes(sstable_bytes).unwrap();

    // A key that was inserted is found with its value...
    assert_eq!(sstable.get(b"banana").unwrap(), Some(2));

    // ...while a key that was never inserted is reported as absent.
    assert_eq!(sstable.get(b"blub").unwrap(), None);
}

#[test]
fn test_custom_value_sstable() {
    let entries = [
        (&b"first"[..], vec![1u32, 2, 3]),
        (&b"second"[..], vec![4u32, 5]),
    ];

    // Build an sstable whose values are vectors of `u32`.
    let mut builder = Dictionary::<VecU32ValueSSTable>::builder(Vec::new()).unwrap();
    builder.set_block_len(4096); // Ensure both values are in the same block
    for (key, value) in &entries {
        builder.insert(*key, value).unwrap();
    }
    let sstable_bytes = OwnedBytes::new(builder.finish().unwrap());

    // Reopen it from the serialized bytes.
    let sstable = Dictionary::<VecU32ValueSSTable>::from_bytes(sstable_bytes).unwrap();

    // Streaming must give back every entry, in insertion order, and then stop.
    let mut stream = sstable.stream().unwrap();
    for (key, value) in &entries {
        assert!(stream.advance());
        assert_eq!(stream.key(), *key);
        assert_eq!(stream.value(), value);
    }
    assert!(!stream.advance());
}


================================================
FILE: stacker/Cargo.toml
================================================
[package]
name = "tantivy-stacker"
version = "0.6.0"
edition = "2024"
license = "MIT"
homepage = "https://github.com/quickwit-oss/tantivy"
repository = "https://github.com/quickwit-oss/tantivy"
description = "term hashmap used for indexing"

[dependencies]
murmurhash32 = "0.3"
common = { version = "0.10", path = "../common/", package = "tantivy-common" }
ahash = { version = "0.8.11", default-features = false, optional = true }


[[bench]]
harness = false
name = "bench"
path = "benches/bench.rs"

[[example]]
name = "hashmap"
path = "example/hashmap.rs"

[dev-dependencies]
rand = "0.9"
zipf = "7.0.0"
rustc-hash = "2.1.0"
proptest = "1.2.0"
binggan = { version = "0.14.0" }
rand_distr = "0.5"

[features]
compare_hash_only = ["ahash"] # Compare hash only, not the key in the Hashmap
unstable = [] # useful for benches.


================================================
FILE: stacker/Performance.md
================================================

# Notes

- `extend_from_slice(&key)` calls memcpy, which is relatively slow, since most keys are relatively short. For now there's a specialized version to avoid memcpy calls.
    Wild copy 16 bytes in a loop is faster, but would require a guard against overflow from the caller side. (We probably can do that). 
- Comparing two slices of unknown length calls memcmp. Same as above, we can do a specialized version.

fastcmp and fastcpy both employ the same trick to handle slices of odd length: e.g. for 7 bytes, 2 unconditional operations on 4 bytes each (overlapping by one byte), instead of 3 operations with conditionals (one 4-byte, one 2-byte, one 1-byte).
[1, 2, 3, 4, 5, 6, 7]
[1, 2, 3, 4]
         [4, 5, 6, 7]

- Since the hashmap writes the values on every key insert/update, the values like expull should be small. Therefore inlining of the values has been removed.
- Currently the first call to Expull will get a capacity of 0. It would be beneficial if it could be initialized with some memory, so that the first call doesn't have to allocate. But that would mean we don't have `Default` impls.


================================================
FILE: stacker/benches/bench.rs
================================================
use binggan::plugins::PeakMemAllocPlugin;
use binggan::{BenchRunner, INSTRUMENTED_SYSTEM, PeakMemAlloc, black_box};
use rand::SeedableRng;
use rustc_hash::FxHashMap;
use tantivy_stacker::{ArenaHashMap, ExpUnrolledLinkedList, MemoryArena};

const ALICE: &str = include_str!("../../benches/alice.txt");

#[global_allocator]
pub static GLOBAL: &PeakMemAlloc<std::alloc::System> = &INSTRUMENTED_SYSTEM;

/// Runs all hashmap benchmark groups.
///
/// Three families of inputs are measured, each with peak-memory reporting enabled:
/// - the whitespace-separated terms of `ALICE`,
/// - unique 8-byte little-endian numbers,
/// - 8-byte numbers drawn from a Zipf distribution (many repeated keys).
fn bench_vint() {
    let mut runner = BenchRunner::new();
    // Set the peak mem allocator. This will enable peak memory reporting.
    runner.add_plugin(PeakMemAllocPlugin::new(GLOBAL));

    {
        let input_bytes = ALICE.len();

        let alice_terms_as_bytes: Vec<&[u8]> = ALICE
            .split_ascii_whitespace()
            .map(|el| el.as_bytes())
            .collect();

        // Same terms, each paired with its position, used as a synthetic doc id.
        let alice_terms_as_bytes_with_docid: Vec<(u32, &[u8])> = ALICE
            .split_ascii_whitespace()
            .map(|el| el.as_bytes())
            .enumerate()
            .map(|(docid, el)| (docid as u32, el))
            .collect();

        // Alice benchmark
        let mut group = runner.new_group();
        // The label reports the number of terms, not the byte length of the text
        // (the byte length is reported separately through `set_input_size`).
        group.set_name(format!("alice (num terms: {})", alice_terms_as_bytes.len()));
        group.set_input_size(input_bytes);
        group.register_with_input("hashmap", &alice_terms_as_bytes, move |data| {
            black_box(create_hash_map(data.iter()));
        });
        group.register_with_input(
            "hasmap with postings",
            &alice_terms_as_bytes_with_docid,
            move |data| {
                black_box(create_hash_map_with_expull(data.iter().cloned()));
            },
        );
        group.register_with_input(
            "fxhashmap ref postings",
            &alice_terms_as_bytes,
            move |data| {
                black_box(create_fx_hash_ref_map_with_expull(data.iter().cloned()));
            },
        );
        group.register_with_input(
            "fxhasmap owned postings",
            &alice_terms_as_bytes,
            move |data| {
                black_box(create_fx_hash_owned_map_with_expull(data.iter().cloned()));
            },
        );
        group.run();
    }

    {
        for (num_numbers, num_numbers_label) in [
            (100_000u64, "100k"),
            (1_000_000, "1mio"),
            (2_000_000, "2mio"),
            (5_000_000, "5mio"),
        ] {
            // benchmark unique numbers
            {
                let numbers: Vec<[u8; 8]> = (0..num_numbers).map(|el| el.to_le_bytes()).collect();
                let numbers_with_doc: Vec<_> = numbers
                    .iter()
                    .enumerate()
                    .map(|(docid, el)| (docid as u32, el))
                    .collect();

                let input_bytes = numbers.len() * 8;
                let mut group = runner.new_group();
                group.set_name(format!("numbers unique {}", num_numbers_label));
                group.set_input_size(input_bytes);
                group.register_with_input("only hashmap", &numbers, move |data| {
                    black_box(create_hash_map(data.iter()));
                });
                group.register_with_input("hasmap with postings", &numbers_with_doc, move |data| {
                    black_box(create_hash_map_with_expull(data.iter().cloned()));
                });
                group.run();
            }
            // benchmark zipfs distribution numbers
            {
                use rand::distr::Distribution;
                use rand::rngs::StdRng;
                // Fixed seed so that every run benchmarks the same key sequence.
                let mut rng = StdRng::from_seed([3u8; 32]);
                let zipf = rand_distr::Zipf::new(10_000.0f64, 1.03).unwrap();
                let numbers: Vec<[u8; 8]> = (0..num_numbers)
                    .map(|_| zipf.sample(&mut rng).to_le_bytes())
                    .collect();
                let numbers_with_doc: Vec<_> = numbers
                    .iter()
                    .enumerate()
                    .map(|(docid, el)| (docid as u32, el))
                    .collect();

                let input_bytes = numbers.len() * 8;
                let mut group = runner.new_group();
                group.set_name(format!("zipfs numbers {}", num_numbers_label));
                group.set_input_size(input_bytes);
                group.register_with_input("hashmap", &numbers, move |data| {
                    black_box(create_hash_map(data.iter()));
                });
                group.register_with_input("hasmap with postings", &numbers_with_doc, move |data| {
                    black_box(create_hash_map_with_expull(data.iter().cloned()));
                });
                group.run();
            }
        }
    }
}

// Manual entry point: the `bench` target is declared with `harness = false`,
// so the benchmark binary has to provide its own `main`.
fn main() {
    bench_vint();
}

/// Initial capacity (32,768) passed to every map built in this benchmark, for both
/// `ArenaHashMap::with_capacity` and `FxHashMap::with_capacity_and_hasher`.
const HASHMAP_CAPACITY: usize = 1 << 15;

/// Minimal postings recorder: it keeps nothing but the list of doc ids.
#[derive(Clone, Copy, Default)]
pub struct DocIdRecorder {
    stack: ExpUnrolledLinkedList,
}

impl DocIdRecorder {
    /// Appends `doc` (vint-encoded) to the recorded list, storing the bytes in `arena`.
    fn new_doc(&mut self, doc: u32, arena: &mut MemoryArena) {
        let mut writer = self.stack.writer(arena);
        writer.write_u32_vint(doc);
    }
}

/// Builds an `ArenaHashMap` that counts how many times each term occurs.
fn create_hash_map<T: AsRef<[u8]>>(terms: impl Iterator<Item = T>) -> ArenaHashMap {
    let mut counts = ArenaHashMap::with_capacity(HASHMAP_CAPACITY);
    terms.for_each(|term| {
        // A missing entry starts at 1, an existing one is bumped by 1.
        counts.mutate_or_create(term.as_ref(), |previous: Option<u64>| match previous {
            Some(count) => count + 1,
            None => 1u64,
        });
    });
    counts
}

/// Builds an `ArenaHashMap` whose values are `DocIdRecorder`s, recording for each term
/// the doc id of every `(doc id, term)` pair yielded by `terms`.
///
/// The doc id is recorded on the first occurrence of a term as well. Without that,
/// inputs made of unique keys would never write a single posting, and the results
/// would not be comparable with the `FxHashMap` baselines, which push on every
/// occurrence.
///
/// The postings are written into a local `MemoryArena`, separate from the one owned by
/// the returned map, which is dropped when this function returns.
fn create_hash_map_with_expull<T: AsRef<[u8]>>(
    terms: impl Iterator<Item = (u32, T)>,
) -> ArenaHashMap {
    let mut memory_arena = MemoryArena::default();
    let mut map = ArenaHashMap::with_capacity(HASHMAP_CAPACITY);
    for (doc, term) in terms {
        map.mutate_or_create(term.as_ref(), |val: Option<DocIdRecorder>| {
            // Start from an empty recorder for a new term, then always record the doc.
            let mut rec = val.unwrap_or_default();
            rec.new_doc(doc, &mut memory_arena);
            rec
        });
    }

    map
}

/// Baseline: an `FxHashMap` keyed by borrowed terms, mapping each term to the list of
/// positions at which it occurs.
fn create_fx_hash_ref_map_with_expull(
    terms: impl Iterator<Item = &'static [u8]>,
) -> FxHashMap<&'static [u8], Vec<u32>> {
    let mut postings_by_term =
        FxHashMap::with_capacity_and_hasher(HASHMAP_CAPACITY, Default::default());
    for (position, term) in terms.enumerate() {
        let postings: &mut Vec<u32> = postings_by_term.entry(term).or_default();
        postings.push(position as u32);
    }
    postings_by_term
}

/// Baseline: an `FxHashMap` keyed by owned copies of the terms, mapping each term to
/// the list of positions at which it occurs. Every lookup allocates a key copy.
fn create_fx_hash_owned_map_with_expull(
    terms: impl Iterator<Item = &'static [u8]>,
) -> FxHashMap<Vec<u8>, Vec<u32>> {
    let mut postings_by_term =
        FxHashMap::with_capacity_and_hasher(HASHMAP_CAPACITY, Default::default());
    for (position, term) in terms.enumerate() {
        let owned_key: Vec<u8> = term.to_vec();
        let postings: &mut Vec<u32> = postings_by_term.entry(owned_key).or_default();
        postings.push(position as u32);
    }
    postings_by_term
}


================================================
FILE: stacker/example/hashmap.rs
================================================
use tantivy_stacker::ArenaHashMap;

const ALICE: &str = include_str!("../../benches/alice.txt");

/// Exercises the hashmap with one huge set of unique numeric terms, then repeatedly
/// with the (much smaller, repetitive) vocabulary of `ALICE`.
fn main() {
    let numeric_terms = (0..100_000_000).map(|number| number.to_string());
    create_hash_map(numeric_terms);

    for _round in 0..1000 {
        let alice_terms = ALICE.split_whitespace();
        create_hash_map(alice_terms);
    }
}

/// Builds an `ArenaHashMap` counting the occurrences of each term, starting from a
/// deliberately tiny table (capacity 4).
fn create_hash_map<T: AsRef<str>>(terms: impl Iterator<Item = T>) -> ArenaHashMap {
    let mut counts = ArenaHashMap::with_capacity(4);
    terms.for_each(|term| {
        let key = term.as_ref().as_bytes();
        // A missing entry starts at 1, an existing one is bumped by 1.
        counts.mutate_or_create(key, |previous: Option<u64>| match previous {
            Some(count) => count + 1,
            None => 1u64,
        });
    });
    counts
}


================================================
FILE: stacker/fuzz_test/Cargo.toml
================================================
[package]
name = "fuzz_test"
version = "0.1.0"
edition = "2021"

# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html

[dependencies]
ahash = "0.8.7"
rand = "0.9"
rand_distr = "0.5"
tantivy-stacker = { version = "0.2.0", path = ".." }

[workspace]


================================================
FILE: stacker/fuzz_test/src/main.rs
================================================
use ahash::AHashMap;
use rand::{rngs::StdRng, Rng, SeedableRng};
use rand_distr::Exp;
use tantivy_stacker::ArenaHashMap;

/// Runs one million fuzz rounds, each driven by a fresh random seed.
fn main() {
    (0..1_000_000).for_each(|_| {
        let seed = rand::random::<u64>();
        test_with_seed(seed);
    });
}

/// Runs one fuzz round: inserts random keys into both an `ArenaHashMap` and a reference
/// `AHashMap`, counting occurrences, then checks that both maps agree.
///
/// The whole round is derived from `seed`, which is printed so that a failure can be
/// reproduced.
///
/// # Panics
/// Panics if the two maps differ in size, if the `ArenaHashMap` contains a key unknown
/// to the reference map, or if the counts stored for a key differ.
fn test_with_seed(seed: u64) {
    let mut hash_map = AHashMap::new();
    let mut arena_hashmap = ArenaHashMap::default();
    let mut rng = StdRng::seed_from_u64(seed);
    let key_count = rng.random_range(1_000..=1_000_000);
    let exp = Exp::new(0.05).expect("0.05 is a valid rate for the exponential distribution");

    for _ in 0..key_count {
        // Exponentially distributed key length, clamped to [1, u16::MAX].
        let key_length = rng.sample::<f32, _>(exp).min(u16::MAX as f32).max(1.0) as usize;

        // `random` is the rand 0.9 name of the deprecated `gen`.
        let key: Vec<u8> = (0..key_length).map(|_| rng.random()).collect();

        arena_hashmap.mutate_or_create(&key, |current_count| {
            let count: u64 = current_count.unwrap_or(0);
            count + 1
        });
        hash_map.entry(key).and_modify(|e| *e += 1).or_insert(1);
    }

    println!(
        "Seed: {} \t {:.2}MB",
        seed,
        arena_hashmap.memory_arena.len() as f32 / 1024.0 / 1024.0
    );
    // Iterating the ArenaHashMap only proves that it is a subset of the reference map.
    // Comparing the sizes as well catches keys that were lost by the ArenaHashMap.
    assert_eq!(
        arena_hashmap.len(),
        hash_map.len(),
        "Seed: {}: number of distinct keys differs",
        seed
    );
    // Check the contents of the ArenaHashMap
    for (key, addr) in arena_hashmap.iter() {
        let count: u64 = arena_hashmap.read(addr);
        let count_expected = hash_map
            .get(key)
            .unwrap_or_else(|| panic!("NOT FOUND: Key: {:?}, Count: {}", key, count));
        assert_eq!(count, *count_expected);
    }
}


================================================
FILE: stacker/src/arena_hashmap.rs
================================================
use super::{Addr, MemoryArena};
use crate::shared_arena_hashmap::SharedArenaHashMap;

/// Customized `HashMap` with `&[u8]` keys
///
/// Its main particularity is that rather than storing its
/// keys in the heap, keys are stored in a memory arena
/// inline with the values.
///
/// The quirky API has the benefit of avoiding
/// the computation of the hash of the key twice,
/// or copying the key as long as there is no insert.
///
/// ArenaHashMap is like SharedArenaHashMap but takes ownership
/// of the memory arena. The memory arena stores the serialized
/// keys and values.
pub struct ArenaHashMap {
    // The underlying map. Every lookup, insert and iteration hands it `memory_arena`.
    shared_arena_hashmap: SharedArenaHashMap,
    // Arena owned by this map. It is public so that callers can read the values behind
    // the `Addr`s returned by `iter()` and inspect the arena directly.
    pub memory_arena: MemoryArena,
}

impl Default for ArenaHashMap {
    fn default() -> Self {
        ArenaHashMap::with_capacity(4)
    }
}

impl ArenaHashMap {
    /// Creates an empty map backed by a fresh `MemoryArena`.
    ///
    /// `table_size` is forwarded as is to `SharedArenaHashMap::with_capacity`.
    pub fn with_capacity(table_size: usize) -> ArenaHashMap {
        let memory_arena = MemoryArena::default();

        ArenaHashMap {
            shared_arena_hashmap: SharedArenaHashMap::with_capacity(table_size),
            memory_arena,
        }
    }

    /// Reads an `Item` from the memory arena at `addr`.
    ///
    /// `addr` is typically one of the addresses yielded by [`ArenaHashMap::iter`].
    #[inline]
    pub fn read<Item: Copy + 'static>(&self, addr: Addr) -> Item {
        self.memory_arena.read(addr)
    }

    /// Returns the sum of the memory usage reported by the hash table and by the
    /// memory arena.
    #[inline]
    pub fn mem_usage(&self) -> usize {
        self.shared_arena_hashmap.mem_usage() + self.memory_arena.mem_usage()
    }

    /// Returns `true` if the underlying hash table reports itself as empty.
    #[inline]
    pub fn is_empty(&self) -> bool {
        self.shared_arena_hashmap.is_empty()
    }

    /// Returns the length reported by the underlying hash table.
    #[inline]
    pub fn len(&self) -> usize {
        self.shared_arena_hashmap.len()
    }

    /// Iterates over the entries as `(key, addr)` pairs.
    ///
    /// The value itself is not returned: read it with [`ArenaHashMap::read`] at `addr`.
    #[inline]
    pub fn iter(&self) -> impl Iterator<Item = (&[u8], Addr)> {
        self.shared_arena_hashmap.iter(&self.memory_arena)
    }

    /// Get a value associated to a key.
    ///
    /// Returns `None` if the key is not present.
    #[inline]
    pub fn get<V>(&self, key: &[u8]) -> Option<V>
    where V: Copy + 'static {
        self.shared_arena_hashmap.get(key, &self.memory_arena)
    }

    /// `mutate_or_create` creates a new entry for a given key if it does not exist
    /// or updates the existing entry.
    ///
    /// The actual logic for this update is defined in the `updater`
    /// argument.
    ///
    /// If the key is not present, `updater` will receive `None` and
    /// will be in charge of returning a default value.
    /// If the key already has an associated value, then it will be passed
    /// `Some(previous_value)`.
    #[inline]
    pub fn mutate_or_create<V>(&mut self, key: &[u8], updater: impl FnMut(Option<V>) -> V)
    where V: Copy + 'static {
        self.shared_arena_hashmap
            .mutate_or_create(key, &mut self.memory_arena, updater);
    }
}

#[cfg(test)]
mod tests {

    use std::collections::HashMap;

    use super::ArenaHashMap;

    /// Inserts two keys, overwrites one of them, and checks both the number of
    /// entries and the values that ended up being stored.
    #[test]
    fn test_hash_map() {
        let mut hash_map: ArenaHashMap = ArenaHashMap::default();
        hash_map.mutate_or_create(b"abc", |opt_val: Option<u32>| {
            assert_eq!(opt_val, None);
            3u32
        });
        hash_map.mutate_or_create(b"abcd", |opt_val: Option<u32>| {
            assert_eq!(opt_val, None);
            4u32
        });
        hash_map.mutate_or_create(b"abc", |opt_val: Option<u32>| {
            assert_eq!(opt_val, Some(3u32));
            5u32
        });
        let mut vanilla_hash_map = HashMap::new();
        for (key, addr) in hash_map.iter() {
            let val: u32 = hash_map.read(addr);
            vanilla_hash_map.insert(key.to_owned(), val);
        }
        assert_eq!(vanilla_hash_map.len(), 2);
        // The update of "abc" must have replaced the value, "abcd" must be untouched.
        assert_eq!(vanilla_hash_map.get(&b"abc"[..]), Some(&5u32));
        assert_eq!(vanilla_hash_map.get(&b"abcd"[..]), Some(&4u32));
        assert_eq!(hash_map.len(), 2);
        assert_eq!(hash_map.get::<u32>(b"abc"), Some(5u32));
        assert_eq!(hash_map.get::<u32>(b"abcd"), Some(4u32));
    }

    /// Lookups on an empty map find nothing.
    #[test]
    fn test_empty_hashmap() {
        let hash_map: ArenaHashMap = ArenaHashMap::default();
        assert_eq!(hash_map.get::<u32>(b"abc"), None);
        assert!(hash_map.is_empty());
        assert_eq!(hash_map.len(), 0);
    }

    /// Inserts enough distinct keys to outgrow the default table several times and
    /// checks that iteration yields exactly the inserted keys.
    #[test]
    fn test_many_terms() {
        let mut terms: Vec<String> = (0..20_000).map(|val| val.to_string()).collect();
        let mut hash_map: ArenaHashMap = ArenaHashMap::default();
        for term in terms.iter() {
            hash_map.mutate_or_create(term.as_bytes(), |_opt_val: Option<u32>| 5u32);
        }
        let mut terms_back: Vec<String> = hash_map
            .iter()
            .map(|(bytes, _)| String::from_utf8(bytes.to_vec()).unwrap())
            .collect();
        terms_back.sort();
        terms.sort();

        // Comparing the lengths first catches both missing and spurious entries.
        assert_eq!(terms.len(), terms_back.len());
        for (expected, actual) in terms.iter().zip(&terms_back) {
            assert_eq!(expected, actual);
        }
    }
}


================================================
FILE: stacker/src/expull.rs
================================================
use std::mem;

use common::serialize_vint_u32;

use crate::fastcpy::fast_short_slice_copy;
use crate::{Addr, MemoryArena};

const FIRST_BLOCK_NUM: u32 = 2;

/// An exponential unrolled linked list.
///
/// The use case is as follows. Tantivy's indexer conceptually acts like a
/// `HashMap<Term, Vec<u32>>`. As we come across a given term in document
/// `D`, we lookup the term in the map and append the document id to its vector.
///
/// The vector is then only read when it is serialized.
///
/// The `ExpUnrolledLinkedList` offers a more efficient solution to this
/// problem.
///
/// It combines the idea of the unrolled linked list and tries to address the
/// problem of selecting an adequate block size using a strategy similar to
/// that of the `Vec` amortized resize strategy.
///
/// Data is stored in a linked list of blocks. The first block has a size of `8`
/// bytes and each block has a length of twice that of the previous block, up to
/// a maximum of `1 << 15` bytes (see `get_block_size`).
///
/// This strategy is a good trade off to handle numerous very rare terms
/// and avoid wasting half of the memory for very frequent terms.
#[derive(Debug, Clone, Copy)]
pub struct ExpUnrolledLinkedList {
    // Number of bytes still free in the last block.
    // u16 is enough, since the size of a block is capped at `1 << 15`.
    remaining_cap: u16,
    // `FIRST_BLOCK_NUM` + the number of blocks allocated so far.
    // It is incremented before each allocation and determines the size of the block.
    block_num: u32,
    // Address of the first block. Null until the first write.
    head: Addr,
    // Address of the next byte to write in the last block. Once that block is full,
    // this is where the address of the following block gets stored.
    tail: Addr,
}

impl Default for ExpUnrolledLinkedList {
    fn default() -> Self {
        Self {
            // 0 to trigger an initial allocation. Init with MemoryArena would be better.
            remaining_cap: 0,
            block_num: FIRST_BLOCK_NUM,
            head: Addr::null_pointer(),
            tail: Addr::null_pointer(),
        }
    }
}

/// Short-lived handle for appending bytes to an `ExpUnrolledLinkedList`.
///
/// It pairs the list metadata with the `MemoryArena` in which the blocks of the list
/// are allocated. It is created with `ExpUnrolledLinkedList::writer`.
pub struct ExpUnrolledLinkedListWriter<'a> {
    // Metadata of the list being written to (head, tail, remaining capacity, ...).
    eull: &'a mut ExpUnrolledLinkedList,
    // Arena holding the blocks of the list.
    arena: &'a mut MemoryArena,
}

/// Allocates a new block with `allocate` bytes of payload and makes it the last block
/// of `eull`.
///
/// The block is allocated with `size_of::<Addr>()` extra bytes, used later on to store
/// the address of the block that follows it. Unless this is the very first block, its
/// address is written at the current tail, that is, in the link slot of the previous
/// block.
#[inline]
fn ensure_capacity<'a>(
    eull: &'a mut ExpUnrolledLinkedList,
    arena: &'a mut MemoryArena,
    allocate: u32,
) {
    let block_len_with_link = allocate as usize + mem::size_of::<Addr>();
    let new_block_addr: Addr = arena.allocate_space(block_len_with_link);

    if !eull.head.is_null() {
        // Chain the new block after the previous one.
        arena.write_at(eull.tail, new_block_addr);
    } else {
        // First write ever: the new block is the head of the list.
        eull.head = new_block_addr;
    }

    eull.remaining_cap = allocate as u16;
    eull.tail = new_block_addr;
}

impl ExpUnrolledLinkedListWriter<'_> {
    /// Appends `val` to the list, encoded as a vint by `serialize_vint_u32`.
    #[inline]
    pub fn write_u32_vint(&mut self, val: u32) {
        // Scratch buffer for the encoded value; only the returned slice is appended.
        let mut buf = [0u8; 8];
        let data = serialize_vint_u32(val, &mut buf);
        self.extend_from_slice(data);
    }

    /// Appends all the bytes of `buf` to the list.
    ///
    /// The bytes are copied into the last block for as long as it has room. Whenever
    /// the block is full, a new and possibly larger block is allocated, so `buf` may
    /// end up split over several blocks.
    #[inline]
    pub fn extend_from_slice(&mut self, mut buf: &[u8]) {
        // Each iteration fills (part of) one block.
        while !buf.is_empty() {
            let add_len: usize;
            {
                if self.eull.remaining_cap == 0 {
                    // The last block is full (or there is no block yet): move on to the
                    // next block number, which determines the size of the new block.
                    self.eull.increment_num_blocks();
                    let block_size = get_block_size(self.eull.block_num);
                    ensure_capacity(self.eull, self.arena, block_size as u32);
                }

                // Free part of the last block, starting at the write position.
                let output_buf = self
                    .arena
                    .slice_mut(self.eull.tail, self.eull.remaining_cap as usize);
                // Copy as much as fits; the rest goes to the next iteration.
                add_len = buf.len().min(output_buf.len());
                let output_buf = &mut output_buf[..add_len];
                // Shadows the outer `buf` within this scope only.
                let buf = &buf[..add_len];

                fast_short_slice_copy(buf, output_buf);
            }
            // Advance the write position and drop the bytes that were just written.
            self.eull.remaining_cap -= add_len as u16;
            self.eull.tail = self.eull.tail.offset(add_len as u32);
            buf = &buf[add_len..];
        }
    }
}

/// Returns the size in bytes of the block with number `block_num`.
///
/// The size is `2^block_num`, capped at `2^15` (32KB) however large `block_num` gets.
/// The first block ever allocated by a list has number 3, hence a size of 8 bytes.
#[inline]
fn get_block_size(block_num: u32) -> u16 {
    // The largest exponent for which the result still fits in a u16.
    const MAX_EXP: u32 = 15;
    1u16 << block_num.min(MAX_EXP)
}

impl ExpUnrolledLinkedList {
    /// Moves on to the next block number.
    ///
    /// # Panics
    /// Panics if the block number would overflow `u32`. This is only a safety net:
    /// at 32KB per block (the maximum size), 4 billion blocks amount to 128 TB of data.
    #[inline(always)]
    pub fn increment_num_blocks(&mut self) {
        let next_block_num = self.block_num.checked_add(1);
        self.block_num = next_block_num
            .expect("ExpUnrolledLinkedList block count overflow - exceeded 4 billion blocks");
    }

    /// Returns a writer appending to this list, with its blocks allocated in `arena`.
    #[inline]
    pub fn writer<'a>(&'a mut self, arena: &'a mut MemoryArena) -> ExpUnrolledLinkedListWriter<'a> {
        ExpUnrolledLinkedListWriter { arena, eull: self }
    }

    /// Appends the whole content of the list to `output`.
    ///
    /// `arena` has to be the arena that was used to write the list.
    ///
    /// # Panics
    /// Panics if the remaining capacity exceeds the size of the last block, which can
    /// only happen if the metadata of the list is corrupted.
    pub fn read_to_end(&self, arena: &MemoryArena, output: &mut Vec<u8>) {
        if self.head.is_null() {
            // Nothing was ever written.
            return;
        }

        let block_size = get_block_size(self.block_num) as usize;
        let unused_in_last_block = self.remaining_cap as usize;

        // Safety check: if remaining_cap > block_size, the metadata is corrupted
        assert!(
            unused_in_last_block <= block_size,
            "ExpUnrolledLinkedList metadata corruption detected: remaining_cap ({}) > block_size \
             ({}). This indicates a serious bug, please report! (block_num={}, head={:?}, \
             tail={:?})",
            self.remaining_cap,
            block_size,
            self.block_num,
            self.head,
            self.tail
        );

        // Every block but the last one is full. Block numbers start at
        // FIRST_BLOCK_NUM + 1 (= 3), and `self.block_num` is the number of the last block.
        let mut block_addr = self.head;
        let full_block_lens =
            (FIRST_BLOCK_NUM + 1..self.block_num).map(|num| get_block_size(num) as usize);
        for block_len in full_block_lens {
            output.extend_from_slice(arena.slice(block_addr, block_len));
            // The address of the next block is stored right after the payload.
            block_addr = arena.read(block_addr.offset(block_len as u32));
        }

        // The last block is only filled up to the write position.
        let last_block_len = block_size.saturating_sub(unused_in_last_block);
        output.extend_from_slice(arena.slice(block_addr, last_block_len));
    }
}

#[cfg(test)]
mod tests {
    use common::{read_u32_vint, write_u32_vint};

    use super::*;

    /// Reading a list that was never written to yields nothing.
    #[test]
    fn test_eull_empty() {
        let arena = MemoryArena::default();
        let stack = ExpUnrolledLinkedList::default();
        {
            let mut buffer = Vec::new();
            stack.read_to_end(&arena, &mut buffer);
            assert_eq!(&buffer[..], &[] as &[u8]);
        }
    }

    /// Several small writes fitting in the first block are read back in order.
    #[test]
    fn test_eull1() {
        let mut arena = MemoryArena::default();
        let mut stack = ExpUnrolledLinkedList::default();
        stack.writer(&mut arena).extend_from_slice(&[1u8]);
        stack.writer(&mut arena).extend_from_slice(&[2u8]);
        stack.writer(&mut arena).extend_from_slice(&[3u8, 4u8]);
        stack.writer(&mut arena).extend_from_slice(&[5u8]);
        {
            let mut buffer = Vec::new();
            stack.read_to_end(&arena, &mut buffer);
            assert_eq!(&buffer[..], &[1u8, 2u8, 3u8, 4u8, 5u8]);
        }
    }

    /// Vints of every encoded length are written with `write_u32_vint` and decoded back.
    #[test]
    fn test_eull_vint1() {
        let mut arena = MemoryArena::default();
        let mut stack = ExpUnrolledLinkedList::default();
        // Values around the boundaries at which the vint encoding takes one more byte.
        let values = [0u32, 1, 2, 127, 128, 16_383, 16_384, 2_097_152, u32::MAX];
        for &val in &values {
            stack.writer(&mut arena).write_u32_vint(val);
        }
        let mut buffer = Vec::new();
        stack.read_to_end(&arena, &mut buffer);
        let mut remaining = &buffer[..];
        for &val in &values {
            assert_eq!(read_u32_vint(&mut remaining), val);
        }
        assert!(remaining.is_empty());
    }

    /// A first write larger than the first block (8 bytes) spills into a second block.
    #[test]
    fn test_eull_first_write_extends_cap() {
        let mut arena = MemoryArena::default();
        let mut stack = ExpUnrolledLinkedList::default();
        stack
            .writer(&mut arena)
            .extend_from_slice(&[1u8, 2, 3, 4, 5, 6, 7, 8, 9]);
        {
            let mut buffer = Vec::new();
            stack.read_to_end(&arena, &mut buffer);
            assert_eq!(&buffer[..], &[1u8, 2, 3, 4, 5, 6, 7, 8, 9]);
        }
    }

    #[test]
    fn test_eull_long() {
        let mut arena = MemoryArena::default();
        let mut eull = ExpUnrolledLinkedList::default();
        let data: Vec<u32> = (0..100).collect();
        for &el in &data {
            eull.writer(&mut arena).write_u32_vint(el);
        }
        let mut buffer = Vec::new();
        eull.read_to_end(&arena, &mut buffer);
        let mut result = vec![];
        let mut remaining = &buffer[..];
        while !remaining.is_empty() {
            result.push(read_u32_vint(&mut remaining));
        }
        assert_eq!(&result[..], &data[..]);
    }

    #[test]
    fn test_eull_limit() {
        let mut eull = ExpUnrolledLinkedList::default();
        for _ in 0..100 {
            eull.increment_num_blocks();
        }
        assert_eq!(get_block_size(eull.block_num), 1 << 15);
    }

    /// Two lists sharing one arena do not corrupt each other.
    #[test]
    fn test_eull_interlaced() {
        let mut arena = MemoryArena::default();
        let mut stack = ExpUnrolledLinkedList::default();
        let mut stack2 = ExpUnrolledLinkedList::default();

        let mut vec1: Vec<u8> = vec![];
        let mut vec2: Vec<u8> = vec![];

        for i in 0..9 {
            stack.writer(&mut arena).write_u32_vint(i);
            assert!(write_u32_vint(i, &mut vec1).is_ok());
            if i % 2 == 0 {
                stack2.writer(&mut arena).write_u32_vint(i);
                assert!(write_u32_vint(i, &mut vec2).is_ok());
            }
        }
        let mut res1 = vec![];
        let mut res2 = vec![];
        stack.read_to_end(&arena, &mut res1);
        stack2.read_to_end(&arena, &mut res2);
        assert_eq!(&vec1[..], &res1[..]);
        assert_eq!(&vec2[..], &res2[..]);
    }

    // Tests for u32 block_num fix (issue with large arrays)

    #[test]
    fn test_block_num_exceeds_u16_max() {
        // Test that we can handle more than 65,535 blocks (old u16 limit)
        let mut eull = ExpUnrolledLinkedList::default();

        // Simulate allocating 70,000 blocks (exceeds u16::MAX of 65,535)
        for _ in 0..70_000 {
            eull.increment_num_blocks();
        }

        // Verify block_num is correct
        assert_eq!(eull.block_num, FIRST_BLOCK_NUM + 70_000);

        // Verify we can still get block size (should be capped at 32KB)
        let block_size = get_block_size(eull.block_num);
        assert_eq!(block_size, 1 << 15); // 32KB max
    }

    #[test]
    fn test_large_dataset_simulation() {
        // Simulate the scenario: large arrays requiring many blocks
        // We write enough data to require thousands of blocks
        let mut arena = MemoryArena::default();
        let mut eull = ExpUnrolledLinkedList::default();

        // Write 100 MB of data (this will require roughly 3,000 blocks at 32KB each)
        // This is enough to validate the system works with large datasets
        // but not so much that the test is slow
        let bytes_per_write = 10_000;
        let num_writes = 10_000; // 10k * 10k = 100 MB

        let data: Vec<u8> = (0..bytes_per_write).map(|i| (i % 256) as u8).collect();
        for _ in 0..num_writes {
            eull.writer(&mut arena).extend_from_slice(&data);
        }

        // Verify we allocated many blocks (should be in the thousands)
        assert!(
            eull.block_num > 1000,
            "block_num ({}) should be > 1000 for this much data",
            eull.block_num
        );

        // Verify we can read back correctly
        let mut buffer = Vec::new();
        eull.read_to_end(&arena, &mut buffer);
        assert_eq!(buffer.len(), bytes_per_write * num_writes);

        // Verify data integrity of every write, not only of the first one: most of the
        // data lives in the 32KB blocks allocated later on.
        for (write_idx, chunk) in buffer.chunks_exact(bytes_per_write).enumerate() {
            assert!(
                chunk == &data[..],
                "data read back for write #{} differs from what was written",
                write_idx
            );
        }
    }

    #[test]
    fn test_get_block_size_with_large_block_num() {
        // Test that get_block_size handles large u32 values correctly

        // Small block numbers (under 15)
        assert_eq!(get_block_size(2), 4); // 2^2 = 4
        assert_eq!(get_block_size(3), 8); // 2^3 = 8
        assert_eq!(get_block_size(10), 1024); // 2^10 = 1KB

        // At the cap (15)
        assert_eq!(get_block_size(15), 32768); // 2^15 = 32KB

        // Beyond the cap (should stay at 32KB)
        assert_eq!(get_block_size(16), 32768);
        assert_eq!(get_block_size(100), 32768);
        assert_eq!(get_block_size(65_536), 32768); // Old u16::MAX + 1
        assert_eq!(get_block_size(100_000), 32768);
        assert_eq!(get_block_size(1_000_000), 32768);
    }

    #[test]
    fn test_increment_blocks_near_u16_boundary() {
        // Test incrementing around the old u16::MAX boundary
        let mut eull = ExpUnrolledLinkedList::default();

        // Set to just before old limit
        for _ in 0..65_533 {
            eull.increment_num_blocks();
        }
        assert_eq!(eull.block_num, FIRST_BLOCK_NUM + 65_533);

        // Cross the old u16::MAX boundary (this would have overflowed before)
        eull.increment_num_blocks(); // 65,534
        eull.increment_num_blocks(); // 65,535 (old max)
        eull.increment_num_blocks(); // 65,536 (would overflow u16)
        eull.increment_num_blocks(); // 65,537

        // Verify we're past the old limit
        assert_eq!(eull.block_num, FIRST_BLOCK_NUM + 65_537);
    }

    #[test]
    fn test_write_and_read_with_many_blocks() {
        // Test that a single write spanning several blocks of growing size works
        let mut arena = MemoryArena::default();
        let mut eull = ExpUnrolledLinkedList::default();

        // Write data that will span many blocks
        let test_data: Vec<u8> = (0..50_000).map(|i| (i % 256) as u8).collect();
        eull.writer(&mut arena).extend_from_slice(&test_data);

        // Read it back
        let mut buffer = Vec::new();
        eull.read_to_end(&arena, &mut buffer);

        // Verify data integrity
        assert_eq!(buffer.len(), test_data.len());
        assert_eq!(&buffer[..], &test_data[..]);
    }

    #[test]
    fn test_multiple_eull_with_large_block_counts() {
        // Test multiple ExpUnrolledLinkedLists with high block counts
        // (simulates parallel columnar writes)
        let mut arena = MemoryArena::default();
        let mut eull1 = ExpUnrolledLinkedList::default();
        let mut eull2 = ExpUnrolledLinkedList::default();

        // Write different data to each
        for i in 0..10_000u32 {
            eull1.writer(&mut arena).write_u32_vint(i);
            eull2.writer(&mut arena).write_u32_vint(i * 2);
        }

        // Read back and verify
        let mut buf1 = Vec::new();
        let mut buf2 = Vec::new();
        eull1.read_to_end(&arena, &mut buf1);
        eull2.read_to_end(&arena, &mut buf2);

        // Deserialize and check
        let mut cursor1 = &buf1[..];
        let mut cursor2 = &buf2[..];
        for i in 0..10_000u32 {
            assert_eq!(read_u32_vint(&mut cursor1), i);
            assert_eq!(read_u32_vint(&mut cursor2), i * 2);
        }
        // No trailing bytes: each list holds exactly what was written to it
        assert!(cursor1.is_empty());
        assert!(cursor2.is_empty());
    }

    #[test]
    fn test_block_size_stays_capped() {
        // Verify that even with massive block numbers, size stays at 32KB
        let mut eull = ExpUnrolledLinkedList::default();

        // Increment to a very large number
        for _ in 0..200_000 {
            eull.increment_num_blocks();
        }

        let block_size = get_block_size(eull.block_num);
        assert_eq!(block_size, 32768, "Block size should be capped at 32KB");
    }

    #[test]
    #[should_panic(expected = "ExpUnrolledLinkedList block count overflow")]
    fn test_increment_overflow_protection() {
        // Test that we panic gracefully if we somehow hit u32::MAX
        // This is extremely unlikely in practice (would require 128TB of data)
        let mut eull = ExpUnrolledLinkedList {
            block_num: u32::MAX,
            ..Default::default()
        };

        // This should panic with our custom error message
        eull.increment_num_blocks();
    }
}

/// Micro-benchmarks comparing plain `Vec`s with `ExpUnrolledLinkedList`s when
/// appending to many lists. Requires the `unstable` feature.
#[cfg(all(test, feature = "unstable"))]
mod bench {
    use std::iter;

    use test::Bencher;

    use super::super::MemoryArena;
    use super::ExpUnrolledLinkedList;

    // Number of lists that are written to.
    const NUM_STACK: usize = 10_000;
    // Number of values appended to a list each time it is selected.
    const STACK_SIZE: u32 = 1000;

    /// Baseline: one `Vec<u32>` per list.
    #[bench]
    fn bench_push_vec(bench: &mut Bencher) {
        bench.iter(|| {
            // Allocate the outer vector at its final size up front, so that the benchmark
            // measures the pushes into the inner vectors and not its reallocations.
            let mut vecs: Vec<Vec<u32>> = vec![Vec::new(); NUM_STACK];
            for s in 0..NUM_STACK {
                // Scatter the writes over the lists. The target only depends on `s`.
                let t = s * 392017 % NUM_STACK;
                for i in 0u32..STACK_SIZE {
                    vecs[t].push(i);
                }
            }
        });
    }

    /// Same workload, with one `ExpUnrolledLinkedList` per list and a shared arena.
    #[bench]
    fn bench_push_stack(bench: &mut Bencher) {
        bench.iter(|| {
            let mut arena = MemoryArena::default();
            let mut stacks: Vec<ExpUnrolledLinkedList> =
                iter::repeat_with(ExpUnrolledLinkedList::default)
                    .take(NUM_STACK)
                    .collect();
            for s in 0..NUM_STACK {
                // Scatter the writes over the lists. The target only depends on `s`.
                let t = s * 392017 % NUM_STACK;
                for i in 0u32..STACK_SIZE {
                    stacks[t]
                        .writer(&mut arena)
                        .extend_from_slice(&i.to_ne_bytes());
                }
            }
        });
    }
}


================================================
FILE: stacker/src/fastcmp.rs
================================================
/// fastcmp employs a trick to speed up the comparison of two slices of bytes.
/// It's also possible to inline compared to the memcmp call.
///
/// E.g. Comparing equality of slice length 7 in two steps, by comparing two 4 byte slices
/// unconditionally instead of comparing the remaining 3 bytes if the first comparison was equal.
/// [1, 2, 3, 4, 5, 6, 7]
/// [1, 2, 3, 4]
///          [4, 5, 6, 7]
///
/// This method uses the XMM register for bytes slices bigger than 16, else regular registers.
///
/// Returns `true` if both slices have the same length and the same content.
/// Depending on the length, the comparison is dispatched to:
/// - fewer than 4 bytes: `short_compare`,
/// - 4 to 7 bytes: `double_check_trick::<4>`,
/// - 8 to 16 bytes: `double_check_trick::<8>`,
/// - more than 16 bytes: `fast_nbyte_slice_compare::<16>`.
#[inline]
pub fn fast_short_slice_compare(left: &[u8], right: &[u8]) -> bool {
    let len = left.len();
    // Slices of different lengths are never equal. From here on, both have length `len`.
    if len != right.len() {
        return false;
    }

    // This could be less equals, but to make the job a little bit easier for the branch predictor
    // we put the length 8 into the bigger group (8-16 bytes), that compares two u64
    // assuming that range 8-16 are more common than 4-7

    // This weird branching is done on purpose to get the best assembly.
    // if len< 4 {
    // ..
    // if len < 8
    // will cause assembly inlined instead of jumps
    if len < 8 {
        if len >= 4 {
            return double_check_trick::<4>(left, right);
        } else {
            return short_compare(left, right);
        }
    }

    if len > 16 {
        return fast_nbyte_slice_compare::<16>(left, right);
    }

    // 8 <= len <= 16
    double_check_trick::<8>(left, right)
}

// Note: The straightforward left.chunks_exact(SIZE).zip(right.chunks_exact(SIZE)) produces slower
// assembly
/// Returns `true` if and only if `left` and `right` contain the same bytes, comparing them
/// `SIZE` bytes at a time.
///
/// The slices are walked in `SIZE`-byte chunks, and the (possibly overlapping) last `SIZE`
/// bytes are compared at the end to cover the remainder.
///
/// Slices of different lengths compare as not equal, and slices shorter than `SIZE` fall back
/// to a regular slice comparison. These two guards keep the unchecked accesses below in
/// bounds; they are redundant (and expected to be optimized away) when the function is inlined
/// into a caller that already checked the lengths.
///
/// `SIZE` must be non-zero.
#[inline]
pub fn fast_nbyte_slice_compare<const SIZE: usize>(left: &[u8], right: &[u8]) -> bool {
    let len = left.len();
    if len != right.len() {
        return false;
    }
    if len < SIZE {
        // Too short for the chunked loop: `len - SIZE` would underflow.
        return left == right;
    }

    // Largest multiple of `SIZE` that is <= `len`. Since `len >= SIZE`, `last >= SIZE`.
    let last = len - len % SIZE;
    let mut i = 0;
    loop {
        // SAFETY: `i` is a multiple of `SIZE` with `i < last`, hence `i + SIZE <= last <= len`,
        // and both slices have length `len`.
        if unsafe { left.get_unchecked(i..i + SIZE) != right.get_unchecked(i..i + SIZE) } {
            return false;
        }
        i += SIZE;
        if i >= last {
            break;
        }
    }
    // SAFETY: `len >= SIZE`, so `len - SIZE` does not underflow and is a valid start index for
    // both slices, which have the same length.
    unsafe { left.get_unchecked(len - SIZE..) == right.get_unchecked(len - SIZE..) }
}

/// Byte-by-byte comparison used for very short slices.
///
/// Only the common prefix of the two slices is inspected: the caller is expected to have
/// checked that both slices have the same length.
#[inline(always)]
fn short_compare(left: &[u8], right: &[u8]) -> bool {
    left.iter().zip(right).all(|(lhs, rhs)| lhs == rhs)
}

/// Compares the first `SIZE` bytes and the last `SIZE` bytes of both slices.
///
/// For equal-length slices of `SIZE..=2 * SIZE` bytes the two (possibly overlapping) windows
/// cover every byte, so this is a full equality check.
///
/// Panics if either slice is shorter than `SIZE`.
#[inline(always)]
fn double_check_trick<const SIZE: usize>(left: &[u8], right: &[u8]) -> bool {
    if left[..SIZE] != right[..SIZE] {
        return false;
    }
    let left_tail = &left[left.len() - SIZE..];
    let right_tail = &right[right.len() - SIZE..];
    left_tail == right_tail
}

// Unit and property tests for `fast_short_slice_compare`.
#[cfg(test)]
mod tests {
    use proptest::prelude::*;

    use super::*;

    // Length 8: lower bound of the branch using two 8-byte windows.
    #[test]
    fn test_slice_compare_bytes_len_8() {
        let a = &[1, 2, 3, 4, 5, 6, 7, 8];
        let b = &[1, 2, 3, 4, 5, 6, 7, 8];
        // Differs from `a` in the last byte only.
        let c = &[1, 2, 3, 4, 5, 6, 7, 7];

        assert!(fast_short_slice_compare(a, b));
        assert!(!fast_short_slice_compare(a, c));
    }

    // Length 9: the two 8-byte windows overlap.
    #[test]
    fn test_slice_compare_bytes_len_9() {
        let a = &[1, 2, 3, 4, 5, 6, 7, 8, 9];
        let b = &[1, 2, 3, 4, 5, 6, 7, 8, 9];
        // Differs from `a` in the first byte only.
        let c = &[0, 2, 3, 4, 5, 6, 7, 8, 9];

        assert!(fast_short_slice_compare(a, b));
        assert!(!fast_short_slice_compare(a, c));
    }

    // Length 16: upper bound of the branch using two 8-byte windows.
    #[test]
    fn test_slice_compare_bytes_len_16() {
        let a = &[1, 2, 3, 4, 5, 6, 7, 8, 1, 2, 3, 4, 5, 6, 7, 8];
        let b = &[1, 2, 3, 4, 5, 6, 7, 8, 1, 2, 3, 4, 5, 6, 7, 8];
        // Differs from `a` in the 8th byte only.
        let c = &[1, 2, 3, 4, 5, 6, 7, 7, 1, 2, 3, 4, 5, 6, 7, 8];

        assert!(fast_short_slice_compare(a, b));
        assert!(!fast_short_slice_compare(a, c));
    }

    // Lengths 4, 3 and 2: the 4-byte window branch and the byte-by-byte branch.
    #[test]
    fn test_slice_compare_bytes_short() {
        let a = &[1, 2, 3, 4];
        let b = &[1, 2, 3, 4];

        assert!(fast_short_slice_compare(a, b));

        let a = &[1, 2, 3];
        let b = &[1, 2, 3];

        assert!(fast_short_slice_compare(a, b));

        let a = &[1, 2];
        let b = &[1, 2];

        assert!(fast_short_slice_compare(a, b));
    }

    proptest! {
        // For arbitrary pairs of slices (0 to 99 bytes each), the result must agree with `==`.
        #[test]
        fn test_fast_short_slice_compare(left in prop::collection::vec(any::<u8>(), 0..100),
                                          right in prop::collection::vec(any::<u8>(), 0..100)) {
            let result = fast_short_slice_compare(&left, &right);
            let expected = left == right;
            prop_assert_eq!(result, expected, "left: {:?}, right: {:?}", left, right);
        }

        // Random pairs are almost never equal, so the equal case is exercised separately by
        // comparing a slice with itself.
        #[test]
        fn test_fast_short_slice_compare_equal(left in prop::collection::vec(any::<u8>(), 0..100),
                                          ) {
            let result = fast_short_slice_compare(&left, &left);
            let expected = left == left;
            prop_assert_eq!(result, expected, "left: {:?}, right: {:?}", left, left);
        }

    }
}


================================================
FILE: stacker/src/fastcpy.rs
================================================
/// Copies all bytes of `src` into `dst`, optimized for short slices.
///
/// For short inputs this avoids a call to memcpy:
/// - 1 to 3 bytes are copied by `short_copy`,
/// - 4 to 32 bytes (up to 64 when compiled with the `avx` target feature) are copied as two
///   fixed-size, possibly overlapping chunks (see `double_copy_trick`),
/// - anything larger falls back to `copy_from_slice`.
///
/// # Panics
///
/// Panics if `src` and `dst` do not have the same length.
#[inline]
pub fn fast_short_slice_copy(src: &[u8], dst: &mut [u8]) {
    // Kept out of line and marked cold so that the panic machinery does not bloat the inlined
    // fast path.
    #[inline(never)]
    #[cold]
    #[track_caller]
    fn len_mismatch_fail(dst_len: usize, src_len: usize) -> ! {
        panic!(
            "source slice length ({}) does not match destination slice length ({})",
            src_len, dst_len,
        );
    }

    if src.len() != dst.len() {
        // Argument order is (destination, source), matching the helper's signature, so that
        // the message reports each length under the right label.
        len_mismatch_fail(dst.len(), src.len());
    }
    let len = src.len();

    if src.is_empty() {
        return;
    }

    if len < 4 {
        short_copy(src, dst);
        return;
    }

    if len < 8 {
        double_copy_trick::<4>(src, dst);
        return;
    }

    if len <= 16 {
        double_copy_trick::<8>(src, dst);
        return;
    }

    if len <= 32 {
        double_copy_trick::<16>(src, dst);
        return;
    }

    // The code will use the vmovdqu instruction to copy 32 bytes at a time.
    #[cfg(target_feature = "avx")]
    {
        if len <= 64 {
            double_copy_trick::<32>(src, dst);
            return;
        }
    }

    // For larger sizes we use the default, which calls memcpy
    // memcpy does some virtual memory tricks to copy large chunks of memory.
    //
    // The theory should be that the checks above don't cost much relative to the copy call for
    // larger copies.
    // The bounds checks in `copy_from_slice` are elided.
    dst.copy_from_slice(src);
}

/// Copies 1 to 3 bytes from `src` to `dst`.
///
/// Both slices must be non-empty and have the same length (checked in debug builds only).
#[inline(always)]
fn short_copy(src: &[u8], dst: &mut [u8]) {
    debug_assert_ne!(src.len(), 0);
    debug_assert_eq!(src.len(), dst.len());
    let len = src.len();

    // length 1-3
    dst[0] = src[0];
    if len >= 2 {
        // Lengths 2 and 3 are covered by two (possibly overlapping) 2-byte copies.
        double_copy_trick::<2>(src, dst);
    }
}

/// Copies the first `SIZE` bytes and the last `SIZE` bytes of `src` to the same positions in
/// `dst`.
///
/// For equal-length slices of `SIZE..=2 * SIZE` bytes the two (possibly overlapping) chunks
/// cover the whole slice, so no length-dependent loop is needed.
#[inline(always)]
fn double_copy_trick<const SIZE: usize>(src: &[u8], dst: &mut [u8]) {
    debug_assert!(src.len() >= SIZE);
    debug_assert!(dst.len() >= SIZE);
    dst[0..SIZE].copy_from_slice(&src[0..SIZE]);
    dst[src.len() - SIZE..].copy_from_slice(&src[src.len() - SIZE..]);
}

// Unit tests for `fast_short_slice_copy`.
#[cfg(test)]
mod tests {
    use super::*;

    // Copies the bytes `0..SIZE` into a zeroed buffer of `SIZE` bytes and checks that the
    // destination matches the source.
    fn copy_test<const SIZE: usize>() {
        let src: Vec<u8> = (0..SIZE as u8).collect();
        let mut dst = [0u8; SIZE];
        fast_short_slice_copy(&src, &mut dst);
        assert_eq!(src, dst);
    }

    // Exercises lengths around the branch boundaries of `fast_short_slice_copy`
    // (1-3, 4-7, 8-16, 17-32 and above 32).
    #[test]
    fn copy_test_n() {
        copy_test::<1>();
        copy_test::<2>();
        copy_test::<3>();
        copy_test::<4>();
        copy_test::<5>();
        copy_test::<6>();
        copy_test::<7>();
        copy_test::<8>();
        copy_test::<9>();
        copy_test::<10>();
        copy_test::<11>();
        copy_test::<31>();
        copy_test::<32>();
        copy_test::<33>();
        copy_test::<47>();
        copy_test::<48>();
        copy_test::<49>();
    }
}


================================================
FILE: stacker/src/lib.rs
================================================
#![cfg_attr(all(feature = "unstable", test), feature(test))]

#[cfg(all(test, feature = "unstable"))]
extern crate test;

mod arena_hashmap;
mod expull;
mod fastcmp;
mod fastcpy;
mod memory_arena;
mod shared_arena_hashmap;

pub use self::arena_hashmap::ArenaHashMap;
pub use self::expull::ExpUnrolledLinkedList;
pub use self::memory_arena::{Addr, MemoryArena};
pub use self::shared_arena_hashmap::{SharedArenaHashMap, compute_table_memory_size};

/// When adding an element to an `ArenaHashMap`, we get a unique id associated with the given key.
pub type UnorderedId = u32;


================================================
FILE: stacker/src/memory_arena.rs
================================================
//! 32-bit memory arena for types implementing `Copy`.
//! This memory arena has been implemented to fit the use of tantivy's indexer
//! and has *twisted specifications*.
//!
//! - It works on stable rust.
//! - One can get an accurate figure of the memory usage of the arena.
//! - Allocations are very cheap.
//! - Allocations happening consecutively are very likely to have great locality.
//! - Addresses (`Addr`) are 32 bits.
//! - Dropping the whole `MemoryArena` is cheap.
//!
//! # Limitations
//!
//! - Your objects shall not implement `Drop`.
//! - `Addr`s into the arena are 32 bits. The maximum capacity of the arena is 4GB. *(Tantivy's
//!   indexer uses one arena per indexing thread.)*
//! - The arena only works for objects much smaller than `1MB`. Allocating more than `1MB` at a
//!   time will result in a panic, and allocating a lot of large objects (> 500KB) will result in
//!   fragmentation.
//! - Your objects are stored in an unaligned fashion. For this reason, the API does not let you
//!   access them as references.
//!
//! Instead, you store and access your data via `.write_at(...)` and `.read(...)`, which under
//! the hood store your object using `ptr::write_unaligned` and `ptr::read_unaligned`.
use std::{mem, ptr};

/// Number of low bits of an [`Addr`] used to address a byte within a page.
const NUM_BITS_PAGE_ADDR: usize = 20;
/// Size of a page in bytes: pages are 1 MB large.
const PAGE_SIZE: usize = 1 << NUM_BITS_PAGE_ADDR;

/// Represents a pointer into the `MemoryArena`.
///
/// Pointers are 32 bits wide and are split into two parts:
/// - the first (highest) 12 bits are the id of a page of memory,
/// - the last (lowest) 20 bits are an address within this page of memory.
///
/// The all-ones value (`u32::MAX`) is reserved as the null pointer.
#[derive(Copy, Clone, Debug)]
pub struct Addr(u32);

impl Addr {
    /// Creates a null pointer.
    #[inline]
    pub fn null_pointer() -> Addr {
        Addr(u32::MAX)
    }

    /// Returns the `Addr` object for `addr + offset`.
    ///
    /// The addition wraps around on overflow.
    #[inline]
    pub fn offset(self, offset: u32) -> Addr {
        let Addr(raw) = self;
        Addr(raw.wrapping_add(offset))
    }

    /// Packs a page id and an in-page address into an `Addr`.
    #[inline]
    fn new(page_id: usize, local_addr: usize) -> Addr {
        let packed = (page_id << NUM_BITS_PAGE_ADDR) | local_addr;
        Addr(packed as u32)
    }

    /// Returns the id of the page this address points into.
    #[inline]
    fn page_id(self) -> usize {
        let raw = self.0 as usize;
        raw >> NUM_BITS_PAGE_ADDR
    }

    /// Returns the byte offset of this address within its page.
    #[inline]
    fn page_local_addr(self) -> usize {
        let in_page_mask = PAGE_SIZE - 1;
        (self.0 as usize) & in_page_mask
    }

    /// Returns true if and only if the `Addr` is null.
    #[inline]
    pub fn is_null(self) -> bool {
        let Addr(raw) = self;
        raw == u32::MAX
    }
}

/// Writes the raw bytes of `val` at the start of `dest`, without any alignment requirement.
///
/// `dest` must be exactly `size_of::<Item>()` bytes long. This is only checked in debug
/// builds.
#[inline(always)]
pub fn store<Item: Copy + 'static>(dest: &mut [u8], val: Item) {
    debug_assert_eq!(dest.len(), std::mem::size_of::<Item>());
    let dest_ptr = dest.as_mut_ptr().cast::<Item>();
    // SAFETY: relies on the caller passing a slice of `size_of::<Item>()` bytes (see the debug
    // assertion above). `write_unaligned` does not require `dest_ptr` to be aligned.
    unsafe {
        ptr::write_unaligned(dest_ptr, val);
    }
}

/// Reads an `Item` from the raw bytes at the start of `data`, without any alignment
/// requirement.
///
/// `data` must be exactly `size_of::<Item>()` bytes long. This is only checked in debug
/// builds.
#[inline]
pub fn load<Item: Copy + 'static>(data: &[u8]) -> Item {
    debug_assert_eq!(data.len(), std::mem::size_of::<Item>());
    let src_ptr = data.as_ptr().cast::<Item>();
    // SAFETY: relies on the caller passing a slice of `size_of::<Item>()` bytes (see the debug
    // assertion above). `read_unaligned` does not require `src_ptr` to be aligned.
    unsafe { ptr::read_unaligned(src_ptr) }
}

/// The `MemoryArena`: a growing list of fixed-size pages in which byte ranges are allocated
/// sequentially and referred to by 32-bit [`Addr`]s.
pub struct MemoryArena {
    /// Pages in allocation order. Never empty; the last page is the one being filled.
    pages: Vec<Page>,
}

impl Default for MemoryArena {
    /// Creates an arena that already owns one (empty) page.
    fn default() -> MemoryArena {
        let first_page = Page::new(0);
        MemoryArena {
            pages: vec![first_page],
        }
    }
}

impl MemoryArena {
    /// Returns an estimate in number of bytes
    /// of resident memory consumed by the `MemoryArena`.
    ///
    /// Internally, it counts a number of `1MB` pages
    /// and therefore delivers an upperbound.
    pub fn mem_usage(&self) -> usize {
        self.pages.len() * PAGE_SIZE
    }

    /// Returns the number of bytes allocated in the arena.
    ///
    /// Every page but the last one is counted as full, so the unused tail of earlier pages
    /// is included in the result.
    pub fn len(&self) -> usize {
        self.pages.len().saturating_sub(1) * PAGE_SIZE + self.pages.last().unwrap().len
    }

    /// Returns true if and only if nothing has been allocated in the arena.
    pub fn is_empty(&self) -> bool {
        self.len() == 0
    }

    /// Writes `val` in the memory arena at the given address.
    ///
    /// `addr` must have been returned by [`MemoryArena::allocate_space`] on this arena, for an
    /// allocation of at least `size_of::<Item>()` bytes: the page lookup and the length of the
    /// destination are not bounds-checked.
    #[inline]
    pub fn write_at<Item: Copy + 'static>(&mut self, addr: Addr, val: Item) {
        let dest = self.slice_mut(addr, std::mem::size_of::<Item>());
        store(dest, val);
    }

    /// Read an item in the memory arena at the given `address`.
    ///
    /// `addr` must have been returned by [`MemoryArena::allocate_space`] on this arena, for an
    /// allocation of at least `size_of::<Item>()` bytes: the page lookup and the length of the
    /// source are not bounds-checked.
    #[inline]
    pub fn read<Item: Copy + 'static>(&self, addr: Addr) -> Item {
        load(self.slice(addr, mem::size_of::<Item>()))
    }

    /// Returns the page with the given id, without bounds check.
    #[inline]
    fn get_page(&self, page_id: usize) -> &Page {
        // SAFETY: relies on `page_id` coming from an `Addr` handed out by this arena, in which
        // case `page_id < self.pages.len()` (pages are never removed).
        unsafe { self.pages.get_unchecked(page_id) }
    }

    /// Mutable counterpart of `get_page`.
    #[inline]
    fn get_page_mut(&mut self, page_id: usize) -> &mut Page {
        // SAFETY: same requirement as in `get_page`.
        unsafe { self.pages.get_unchecked_mut(page_id) }
    }

    /// Returns the `len` bytes starting at `addr`.
    ///
    /// `addr` must come from this arena and the range must lie within its page.
    #[inline]
    pub fn slice(&self, addr: Addr, len: usize) -> &[u8] {
        self.get_page(addr.page_id())
            .slice(addr.page_local_addr(), len)
    }

    /// Returns all the bytes from `addr` up to the end of the page `addr` points into.
    #[inline]
    pub fn slice_from(&self, addr: Addr) -> &[u8] {
        self.get_page(addr.page_id())
            .slice_from(addr.page_local_addr())
    }

    /// Mutable counterpart of [`MemoryArena::slice_from`].
    #[inline]
    pub fn slice_from_mut(&mut self, addr: Addr) -> &mut [u8] {
        self.get_page_mut(addr.page_id())
            .slice_from_mut(addr.page_local_addr())
    }

    /// Mutable counterpart of [`MemoryArena::slice`].
    #[inline]
    pub fn slice_mut(&mut self, addr: Addr, len: usize) -> &mut [u8] {
        self.get_page_mut(addr.page_id())
            .slice_mut(addr.page_local_addr(), len)
    }

    /// Add a page and allocate len on it.
    /// Return the address
    ///
    /// # Panics
    ///
    /// Panics if `len` is larger than a page, or if the arena has run out of page ids.
    fn add_page(&mut self, len: usize) -> Addr {
        // A fresh page is the last resort: if the allocation does not fit in it, it cannot be
        // served at all. Without this check the new page would record a length larger than
        // its buffer and later unchecked slicing would go out of bounds.
        assert!(
            len <= PAGE_SIZE,
            "cannot allocate {} bytes in the memory arena: allocations are limited to the page \
             size ({} bytes)",
            len,
            PAGE_SIZE
        );
        let new_page_id = self.pages.len();
        let mut page = Page::new(new_page_id);
        page.len = len;
        self.pages.push(page);
        Addr::new(new_page_id, 0)
    }

    /// Allocates `len` bytes and returns the allocated address.
    ///
    /// The bytes are taken from the current (last) page if they fit; otherwise a new page is
    /// added and the remaining space of the current page is left unused.
    ///
    /// # Panics
    ///
    /// Panics if the allocation requires a new page and `len` is larger than a page, or if
    /// the arena has run out of page ids.
    #[inline]
    pub fn allocate_space(&mut self, len: usize) -> Addr {
        let page_id = self.pages.len() - 1;
        if let Some(addr) = self.get_page_mut(page_id).allocate_space(len) {
            return addr;
        }
        self.add_page(len)
    }
}

/// A fixed-size chunk of arena memory in which byte ranges are allocated sequentially.
struct Page {
    /// Index of this page within the arena.
    page_id: usize,
    /// Number of bytes already handed out from this page.
    len: usize,
    /// Backing storage.
    data: Box<[u8; PAGE_SIZE]>,
}

impl Page {
    /// Creates an empty, zero-filled page.
    ///
    /// # Panics
    ///
    /// Panics if `page_id` does not fit in the 12 bits reserved for it in an `Addr`.
    fn new(page_id: usize) -> Page {
        // We use 32-bits addresses.
        // - 20 bits for the in-page addressing
        // - 12 bits for the page id.
        // This limits us to 2^12 - 1=4095 for the page id.
        assert!(page_id < 4096);
        let zeroed: Box<[u8]> = vec![0u8; PAGE_SIZE].into_boxed_slice();
        Page {
            page_id,
            len: 0,
            data: zeroed.try_into().unwrap(),
        }
    }

    /// Returns true if `len` more bytes fit in this page.
    #[inline]
    fn is_available(&self, len: usize) -> bool {
        len + self.len <= PAGE_SIZE
    }

    /// Returns the `len` bytes starting at `local_addr`.
    ///
    /// The start is bounds-checked, the length is not.
    #[inline]
    fn slice(&self, local_addr: usize, len: usize) -> &[u8] {
        let tail = self.slice_from(local_addr);
        // SAFETY: relies on the caller requesting a range that lies within the page.
        unsafe { tail.get_unchecked(..len) }
    }

    /// Returns the bytes from `local_addr` up to the end of the page.
    #[inline]
    fn slice_from(&self, local_addr: usize) -> &[u8] {
        &self.data[local_addr..]
    }

    /// Mutable counterpart of `slice_from`.
    #[inline]
    fn slice_from_mut(&mut self, local_addr: usize) -> &mut [u8] {
        &mut self.data[local_addr..]
    }

    /// Mutable counterpart of `slice`.
    #[inline]
    fn slice_mut(&mut self, local_addr: usize, len: usize) -> &mut [u8] {
        let tail = &mut self.data[local_addr..];
        // SAFETY: relies on the caller requesting a range that lies within the page.
        unsafe { tail.get_unchecked_mut(..len) }
    }

    /// Reserves `len` bytes at the current end of the page and returns their address, or
    /// `None` if the page does not have enough room left.
    #[inline]
    fn allocate_space(&mut self, len: usize) -> Option<Addr> {
        if !self.is_available(len) {
            return None;
        }
        let addr = Addr::new(self.page_id, self.len);
        self.len += len;
        Some(addr)
    }
}

// Unit tests for `MemoryArena`.
#[cfg(test)]
mod tests {

    use super::MemoryArena;
    use crate::memory_arena::PAGE_SIZE;

    // Two consecutive allocations must not overlap: both byte strings are read back intact.
    #[test]
    fn test_arena_allocate_slice() {
        let mut arena = MemoryArena::default();
        let a = b"hello";
        let b = b"happy tax payer";

        let addr_a = arena.allocate_space(a.len());
        arena.slice_mut(addr_a, a.len()).copy_from_slice(a);

        let addr_b = arena.allocate_space(b.len());
        arena.slice_mut(addr_b, b.len()).copy_from_slice(b);

        assert_eq!(arena.slice(addr_a, a.len()), a);
        assert_eq!(arena.slice(addr_b, b.len()), b);
    }

    // Fills the first page up to its last two bytes, then allocates three single bytes: the
    // first two fit in the first page, the third one requires a new page.
    #[test]
    fn test_arena_allocate_end_of_page() {
        let mut arena = MemoryArena::default();

        // A big block
        let len_a = PAGE_SIZE - 2;
        let addr_a = arena.allocate_space(len_a);
        *arena.slice_mut(addr_a, len_a).last_mut().unwrap() = 1;

        // Single bytes
        let addr_b = arena.allocate_space(1);
        arena.slice_mut(addr_b, 1)[0] = 2;

        let addr_c = arena.allocate_space(1);
        arena.slice_mut(addr_c, 1)[0] = 3;

        let addr_d = arena.allocate_space(1);
        arena.slice_mut(addr_d, 1)[0] = 4;

        assert_eq!(arena.slice(addr_a, len_a)[len_a - 1], 1);
        assert_eq!(arena.slice(addr_b, 1)[0], 2);
        assert_eq!(arena.slice(addr_c, 1)[0], 3);
        assert_eq!(arena.slice(addr_d, 1)[0], 4);
    }

    // Sample `Copy` type with mixed field sizes, used to test typed reads and writes.
    #[derive(Clone, Copy, Debug, Eq, PartialEq)]
    struct MyTest {
        pub a: usize,
        pub b: u8,
        pub c: u32,
    }

    // Values written with `write_at` are read back unchanged with `read`.
    #[test]
    fn test_store_object() {
        let mut arena = MemoryArena::default();
        let a = MyTest {
            a: 143,
            b: 21,
            c: 32,
        };
        let b = MyTest {
            a: 113,
            b: 221,
            c: 12,
        };

        let num_bytes = std::mem::size_of::<MyTest>();
        let addr_a = arena.allocate_space(num_bytes);
        arena.write_at(addr_a, a);

        let addr_b = arena.allocate_space(num_bytes);
        arena.write_at(addr_b, b);

        assert_eq!(arena.read::<MyTest>(addr_a), a);
        assert_eq!(arena.read::<MyTest>(addr_b), b);
    }
}


================================================
FILE: stacker/src/shared_arena_hashmap.rs
================================================
use std::iter::{Cloned, Filter};
use std::mem;

use super::{Addr, MemoryArena};
use crate::fastcpy::fast_short_slice_copy;
use crate::memory_arena::store;

/// Returns the actual memory size in bytes
/// required to create a table with a given capacity.
///
/// This is the number of slots multiplied by the size of one table entry.
pub fn compute_table_memory_size(capacity: usize) -> usize {
    let slot_size = mem::size_of::<KeyValue>();
    capacity * slot_size
}

/// Hash stored alongside each table entry: 32 bits by default.
#[cfg(not(feature = "compare_hash_only"))]
type HashType = u32;

/// Hash stored alongside each table entry: 64 bits with the `compare_hash_only` feature.
#[cfg(feature = "compare_hash_only")]
type HashType = u64;

/// `KeyValue` is the item stored in the hash table.
///
/// The key and the value themselves live in an external memory arena: `key_value_addr` points
/// to the record holding both. An empty slot is represented by a null `key_value_addr`.
#[derive(Copy, Clone)]
struct KeyValue {
    /// Address of the key/value record in the memory arena, or null for an empty slot.
    key_value_addr: Addr,
    /// Hash of the key.
    hash: HashType,
}

impl Default for KeyValue {
    /// Returns an empty slot.
    fn default() -> Self {
        Self {
            key_value_addr: Addr::null_pointer(),
            hash: 0,
        }
    }
}

impl KeyValue {
    /// Returns true if this slot does not hold any entry.
    #[inline]
    fn is_empty(&self) -> bool {
        self.key_value_addr.is_null()
    }

    /// Returns true if this slot holds an entry.
    #[inline]
    fn is_not_empty_ref(&self) -> bool {
        !self.is_empty()
    }
}

/// Customized `HashMap` with `&[u8]` keys
///
/// Its main particularity is that rather than storing its
/// keys in the heap, keys are stored in a memory arena
/// inline with the values.
///
/// The quirky API has the benefit of avoiding
/// the computation of the hash of the key twice,
/// or copying the key as long as there is no insert.
///
/// SharedArenaHashMap is like ArenaHashMap but gets the memory arena
/// passed as an argument to the methods.
/// So one MemoryArena can be shared with multiple SharedArenaHashMap.
pub struct SharedArenaHashMap {
    // Slots of the hash table. Its length is a power of two.
    table: Vec<KeyValue>,
    // `table.len() - 1`, used to map a probe position to a slot index.
    mask: usize,
    // Number of occupied slots.
    len: usize,
}

/// Sequence of table slots visited when looking for a key, one slot after the other.
struct LinearProbing {
    /// Unmasked position of the last probe.
    pos: usize,
    /// Bit mask mapping a position to a slot index.
    mask: usize,
}

impl LinearProbing {
    /// Starts a probing sequence from `hash`.
    #[inline]
    fn compute(hash: HashType, mask: usize) -> LinearProbing {
        let pos = hash as usize;
        LinearProbing { pos, mask }
    }

    /// Advances to the next position and returns the matching slot index.
    ///
    /// The position is incremented before being used, so the first slot probed is the one
    /// right after `hash & mask`.
    #[inline]
    fn next_probe(&mut self) -> usize {
        // Not saving the masked version removes a dependency.
        let advanced = self.pos.wrapping_add(1);
        self.pos = advanced;
        advanced & self.mask
    }
}

/// Iterator over copies of the occupied slots of the table.
type IterNonEmpty<'a> = Filter<Cloned<std::slice::Iter<'a, KeyValue>>, fn(&KeyValue) -> bool>;

/// Iterator over the entries of a `SharedArenaHashMap`, in table order.
///
/// Yields, for each entry, the key bytes and the address of the value in the memory arena.
pub struct Iter<'a> {
    hashmap: &'a SharedArenaHashMap,
    memory_arena: &'a MemoryArena,
    inner: IterNonEmpty<'a>,
}

impl<'a> Iterator for Iter<'a> {
    type Item = (&'a [u8], Addr);

    fn next(&mut self) -> Option<Self::Item> {
        let occupied_slot = self.inner.next()?;
        let entry: (&'a [u8], Addr) = self
            .hashmap
            .get_key_value(occupied_slot.key_value_addr, self.memory_arena);
        Some(entry)
    }
}

/// Returns the greatest power of two lower or equal to `n`.
///
/// # Panics
///
/// Panics if `n == 0`.
fn compute_previous_power_of_two(n: usize) -> usize {
    assert!(n > 0);
    // Index of the most significant set bit of `n`.
    let highest_set_bit = usize::BITS - 1 - n.leading_zeros();
    1usize << highest_set_bit
}

impl Default for SharedArenaHashMap {
    /// Creates an empty map backed by a 4-slot table.
    fn default() -> Self {
        SharedArenaHashMap::with_capacity(4)
    }
}

impl SharedArenaHashMap {
    /// Creates an empty map whose table has the greatest power-of-two number of slots that is
    /// lower or equal to `table_size`.
    ///
    /// # Panics
    ///
    /// Panics if `table_size` is 0.
    pub fn with_capacity(table_size: usize) -> SharedArenaHashMap {
        let table_size_power_of_2 = compute_previous_power_of_two(table_size);
        let table = vec![KeyValue::default(); table_size_power_of_2];

        SharedArenaHashMap {
            table,
            mask: table_size_power_of_2 - 1,
            len: 0,
        }
    }

    /// Restricts `key` to its first `u16::MAX` bytes.
    ///
    /// Key lengths are stored on two bytes, so every entry point taking a key must apply the
    /// same truncation for lookups and insertions to agree.
    #[inline]
    fn truncate_key(key: &[u8]) -> &[u8] {
        &key[..key.len().min(u16::MAX as usize)]
    }

    /// Computes the hash of a key.
    #[inline]
    #[cfg(not(feature = "compare_hash_only"))]
    fn get_hash(&self, key: &[u8]) -> HashType {
        murmurhash32::murmurhash2(key)
    }

    /// Computes the hash of a key.
    #[inline]
    #[cfg(feature = "compare_hash_only")]
    fn get_hash(&self, key: &[u8]) -> HashType {
        // Since we compare only the hash we need a high quality hash.
        use std::hash::Hasher;
        let mut hasher = ahash::AHasher::default();
        hasher.write(key);
        hasher.finish() as HashType
    }

    /// Starts a probing sequence for the given hash over the current table.
    #[inline]
    fn probe(&self, hash: HashType) -> LinearProbing {
        LinearProbing::compute(hash, self.mask)
    }

    /// Returns the number of bytes used by the table itself. Keys and values stored in the
    /// memory arena are not included.
    #[inline]
    pub fn mem_usage(&self) -> usize {
        self.table.len() * mem::size_of::<KeyValue>()
    }

    /// Returns true once at least half of the slots are occupied.
    #[inline]
    fn is_saturated(&self) -> bool {
        self.table.len() <= self.len * 2
    }

    /// Decodes the record stored at `addr` and returns the key bytes together with the
    /// address of the value that follows them.
    ///
    /// A record is laid out as: key length (`u16`, little endian), key bytes, value.
    #[inline]
    fn get_key_value<'a>(&'a self, addr: Addr, memory_arena: &'a MemoryArena) -> (&'a [u8], Addr) {
        let data = memory_arena.slice_from(addr);
        // SAFETY: relies on `addr` pointing to a record written by `mutate_or_create`, which
        // allocates the two length bytes, the key and the value contiguously.
        let key_bytes_len_bytes = unsafe { data.get_unchecked(..2) };
        let key_bytes_len = u16::from_le_bytes(key_bytes_len_bytes.try_into().unwrap());
        // SAFETY: same requirement as above; the key bytes follow the length prefix.
        let key_bytes: &[u8] = unsafe { data.get_unchecked(2..2 + key_bytes_len as usize) };
        (key_bytes, addr.offset(2 + key_bytes_len as u32))
    }

    /// Returns the address of the value stored in the record at `addr` if its key is equal to
    /// `target_key`, and `None` otherwise.
    #[inline]
    #[cfg(not(feature = "compare_hash_only"))]
    fn get_value_addr_if_key_match(
        &self,
        target_key: &[u8],
        addr: Addr,
        memory_arena: &MemoryArena,
    ) -> Option<Addr> {
        use crate::fastcmp::fast_short_slice_compare;

        let (stored_key, value_addr) = self.get_key_value(addr, memory_arena);
        if fast_short_slice_compare(stored_key, target_key) {
            Some(value_addr)
        } else {
            None
        }
    }

    /// Returns the address of the value stored in the record at `addr`.
    ///
    /// With the `compare_hash_only` feature the key bytes are not compared: a matching hash
    /// is considered a match.
    #[inline]
    #[cfg(feature = "compare_hash_only")]
    fn get_value_addr_if_key_match(
        &self,
        _target_key: &[u8],
        addr: Addr,
        memory_arena: &MemoryArena,
    ) -> Option<Addr> {
        // For the compare_hash_only feature, it would make sense to store the keys at a different
        // memory location. Here they will just pollute the cache.
        let data = memory_arena.slice_from(addr);
        let key_bytes_len_bytes = &data[..2];
        let key_bytes_len = u16::from_le_bytes(key_bytes_len_bytes.try_into().unwrap());
        let value_addr = addr.offset(2 + key_bytes_len as u32);

        Some(value_addr)
    }

    /// Records a new entry in the (empty) slot `bucket`.
    #[inline]
    fn set_bucket(&mut self, hash: HashType, key_value_addr: Addr, bucket: usize) {
        self.len += 1;

        self.table[bucket] = KeyValue {
            key_value_addr,
            hash,
        };
    }

    /// Returns true if the map does not contain any entry.
    #[inline]
    pub fn is_empty(&self) -> bool {
        self.len() == 0
    }

    /// Returns the number of entries in the map.
    #[inline]
    pub fn len(&self) -> usize {
        self.len
    }

    /// Iterates over the entries of the map, in table order.
    ///
    /// `memory_arena` must be the arena that was used to insert the entries.
    #[inline]
    pub fn iter<'a>(&'a self, memory_arena: &'a MemoryArena) -> Iter<'a> {
        Iter {
            inner: self
                .table
                .iter()
                .cloned()
                .filter(KeyValue::is_not_empty_ref),
            hashmap: self,
            memory_arena,
        }
    }

    /// Doubles the size of the table (with a minimum of 8 slots) and re-inserts every entry
    /// using its stored hash. Keys and values stay where they are in the memory arena.
    fn resize(&mut self) {
        let new_len = (self.table.len() * 2).max(1 << 3);
        let mask = new_len - 1;
        self.mask = mask;
        let new_table = vec![KeyValue::default(); new_len];
        let old_table = mem::replace(&mut self.table, new_table);
        for key_value in old_table.into_iter().filter(KeyValue::is_not_empty_ref) {
            let mut probe = LinearProbing::compute(key_value.hash, mask);
            loop {
                let bucket = probe.next_probe();
                if self.table[bucket].is_empty() {
                    self.table[bucket] = key_value;
                    break;
                }
            }
        }
    }

    /// Get a value associated to a key.
    ///
    /// Returns `None` if the key is not present. `memory_arena` must be the arena that was
    /// used to insert the entries.
    ///
    /// Like in `mutate_or_create`, the key is truncated to `u16::MAX` bytes, so that an entry
    /// created from an over-long key can be found again with that same key.
    #[inline]
    pub fn get<V>(&self, key: &[u8], memory_arena: &MemoryArena) -> Option<V>
    where V: Copy + 'static {
        let key = Self::truncate_key(key);
        let hash = self.get_hash(key);
        let mut probe = self.probe(hash);
        loop {
            let bucket = probe.next_probe();
            let kv: KeyValue = self.table[bucket];
            if kv.is_empty() {
                // An empty slot ends the probing sequence: the key is absent.
                return None;
            } else if kv.hash == hash
                && let Some(val_addr) =
                    self.get_value_addr_if_key_match(key, kv.key_value_addr, memory_arena)
            {
                let v = memory_arena.read(val_addr);
                return Some(v);
            }
        }
    }

    /// `update` create a new entry for a given key if it does not exist
    /// or updates the existing entry.
    ///
    /// The actual logic for this update is define in the `updater`
    /// argument.
    ///
    /// If the key is not present, `updater` will receive `None` and
    /// will be in charge of returning a default value.
    /// If the key already as an associated value, then it will be passed
    /// `Some(previous_value)`.
    ///
    /// Returns the value produced by `updater`, which is also the value now stored in the map.
    ///
    /// The key will be truncated to u16::MAX bytes.
    #[inline]
    pub fn mutate_or_create<V>(
        &mut self,
        key: &[u8],
        memory_arena: &mut MemoryArena,
        mut updater: impl FnMut(Option<V>) -> V,
    ) -> V
    where
        V: Copy + 'static,
    {
        // Growing before probing guarantees that the table always has an empty slot, which is
        // what terminates the probing loop below.
        if self.is_saturated() {
            self.resize();
        }
        // Limit the key size to u16::MAX
        let key = Self::truncate_key(key);
        let hash = self.get_hash(key);
        let mut probe = self.probe(hash);
        let mut bucket = probe.next_probe();
        let mut kv: KeyValue = self.table[bucket];
        loop {
            if kv.is_empty() {
                // The key does not exist yet.
                let val = updater(None);
                // Record layout: key length (u16, little endian), key bytes, value.
                let num_bytes = std::mem::size_of::<u16>() + key.len() + std::mem::size_of::<V>();
                let key_addr = memory_arena.allocate_space(num_bytes);
                {
                    let data = memory_arena.slice_mut(key_addr, num_bytes);
                    let key_len_bytes: [u8; 2] = (key.len() as u16).to_le_bytes();
                    data[..2].copy_from_slice(&key_len_bytes);
                    let stop = 2 + key.len();
                    fast_short_slice_copy(key, &mut data[2..stop]);
                    store(&mut data[stop..], val);
                }

                self.set_bucket(hash, key_addr, bucket);
                return val;
            }
            if kv.hash == hash
                && let Some(val_addr) =
                    self.get_value_addr_if_key_match(key, kv.key_value_addr, memory_arena)
            {
                // The key exists: update its value in place.
                let v = memory_arena.read(val_addr);
                let new_v = updater(Some(v));
                memory_arena.write_at(val_addr, new_v);
                return new_v;
            }
            // This allows fetching the next bucket before the loop jmp
            bucket = probe.next_probe();
            kv = self.table[bucket];
        }
    }
}

// Unit tests for `SharedArenaHashMap`.
#[cfg(test)]
mod tests {

    use std::collections::HashMap;

    use super::{SharedArenaHashMap, compute_previous_power_of_two};
    use crate::MemoryArena;

    // Inserting two distinct keys and updating one of them leaves two entries in the map.
    #[test]
    fn test_hash_map() {
        let mut memory_arena = MemoryArena::default();
        let mut hash_map: SharedArenaHashMap = SharedArenaHashMap::default();
        hash_map.mutate_or_create(b"abc", &mut memory_arena, |opt_val: Option<u32>| {
            assert_eq!(opt_val, None);
            3u32
        });
        hash_map.mutate_or_create(b"abcd", &mut memory_arena, |opt_val: Option<u32>| {
            assert_eq!(opt_val, None);
            4u32
        });
        // Second call with "abc": the updater must see the value stored by the first call.
        hash_map.mutate_or_create(b"abc", &mut memory_arena, |opt_val: Option<u32>| {
            assert_eq!(opt_val, Some(3u32));
            5u32
        });
        let mut vanilla_hash_map = HashMap::new();
        let iter_values = hash_map.iter(&memory_arena);
        for (key, addr) in iter_values {
            let val: u32 = memory_arena.read(addr);
            vanilla_hash_map.insert(key.to_owned(), val);
        }
        assert_eq!(vanilla_hash_map.len(), 2);
    }

    #[test]
    fn test_long_key_truncation() {
        // Keys longer than u16::MAX are truncated.
        let mut memory_arena = MemoryArena::default();
        let mut hash_map: SharedArenaHashMap = SharedArenaHashMap::default();
        // Exactly u16::MAX bytes: the longest key stored without truncation.
        let key1 = (0..u16::MAX as usize).map(|i| i as u8).collect::<Vec<_>>();
        hash_map.mutate_or_create(&key1, &mut memory_arena, |opt_val: Option<u32>| {
            assert_eq!(opt_val, None);
            4u32
        });
        // Due to truncation, this key is the same as key1
        let key2 = (0..u16::MAX as usize + 1)
            .map(|i| i as u8)
            .collect::<Vec<_>>();
        hash_map.mutate_or_create(&key2, &mut memory_arena, |opt_val: Option<u32>| {
            assert_eq!(opt_val, Some(4));
            3u32
        });
        let mut vanilla_hash_map = HashMap::new();
        let iter_values = hash_map.iter(&memory_arena);
        for (key, addr) in iter_values {
            let val: u32 = memory_arena.read(addr);
            vanilla_hash_map.insert(key.to_owned(), val);
            assert_eq!(key.len(), key1[..].len());
            assert_eq!(key, &key1[..])
        }
        assert_eq!(vanilla_hash_map.len(), 1); // Both map to the same key
    }

    // Looking up a key in an empty map returns `None`.
    #[test]
    fn test_empty_hashmap() {
        let memory_arena = MemoryArena::default();
        let hash_map: SharedArenaHashMap = SharedArenaHashMap::default();
        assert_eq!(hash_map.get::<u32>(b"abc", &memory_arena), None);
    }

    #[test]
    fn test_compute_previous_power_of_two() {
        assert_eq!(compute_previous_power_of_two(8), 8);
        assert_eq!(compute_previous_power_of_two(9), 8);
        assert_eq!(compute_previous_power_of_two(7), 4);
        // NOTE(review): this expectation assumes a 64-bit `usize`.
        assert_eq!(compute_previous_power_of_two(u64::MAX as usize), 1 << 63);
    }

    // Inserts 20,000 distinct keys (forcing the table to grow several times) and checks that
    // iterating over the map gives back exactly the inserted keys.
    #[test]
    fn test_many_terms() {
        let mut memory_arena = MemoryArena::default();
        let mut terms: Vec<String> = (0..20_000).map(|val| val.to_string()).collect();
        let mut hash_map: SharedArenaHashMap = SharedArenaHashMap::default();
        for term in terms.iter() {
            hash_map.mutate_or_create(
                term.as_bytes(),
                &mut memory_arena,
                |_opt_val: Option<u32>| 5u32,
            );
        }
        let mut terms_back: Vec<String> = hash_map
            .iter(&memory_arena)
            .map(|(bytes, _)| String::from_utf8(bytes.to_vec()).unwrap())
            .collect();
        // The map iterates in table order, so both sides are sorted before comparing.
        terms_back.sort();
        terms.sort();

        for pos in 0..terms.len() {
            assert_eq!(terms[pos], terms_back[pos]);
        }
    }
}


================================================
FILE: tests/compat_tests_data/index_v6/.managed.json
================================================
["00000000000000000000000000000000.store","00000000000000000000000000000000.fast","00000000000000000000000000000000.fieldnorm","00000000000000000000000000000000.term","00000000000000000000000000000000.idx","meta.json","00000000000000000000000000000000.pos"]


================================================
FILE: tests/compat_tests_data/index_v6/meta.json
================================================
{
  "index_settings": {
    "docstore_compression": "lz4",
    "docstore_blocksize": 16384
  },
  "segments": [
    {
      "segment_id": "00000000-0000-0000-0000-000000000000",
      "max_doc": 1,
      "deletes": null
    }
  ],
  "schema": [
    {
      "name": "label",
      "type": "text",
      "options": {
        "indexing": {
          "record": "position",
          "fieldnorms": true,
          "tokenizer": "default"
        },
        "stored": true,
        "fast": false
      }
    },
    {
      "name": "date",
      "type": "date",
      "options": {
        "indexed": true,
        "fieldnorms": true,
        "fast": false,
        "stored": true,
        "precision": "seconds"
      }
    }
  ],
  "opstamp": 2
}


================================================
FILE: tests/compat_tests_data/index_v7/.managed.json
================================================
["meta.json","000002f0000000000000000000000000.fieldnorm","000002f0000000000000000000000000.pos","000002f0000000000000000000000000.store","000002f0000000000000000000000000.term","000002f0000000000000000000000000.fast","000002f0000000000000000000000000.idx"]


================================================
FILE: tests/compat_tests_data/index_v7/meta.json
================================================
{
  "index_settings": {
    "docstore_compression": "lz4",
    "docstore_blocksize": 16384
  },
  "segments": [
    {
      "segment_id": "000002f0-0000-0000-0000-000000000000",
      "max_doc": 1,
      "deletes": null
    }
  ],
  "schema": [
    {
      "name": "label",
      "type": "text",
      "options": {
        "indexing": {
          "record": "position",
          "fieldnorms": true,
          "tokenizer": "default"
        },
        "stored": true,
        "fast": false
      }
    },
    {
      "name": "date",
      "type": "date",
      "options": {
        "indexed": true,
        "fieldnorms": true,
        "fast": false,
        "stored": true,
        "precision": "seconds"
      }
    }
  ],
  "opstamp": 2
}


================================================
FILE: tests/failpoints/mod.rs
================================================
use std::path::Path;

use tantivy::directory::{Directory, ManagedDirectory, RamDirectory, TerminatingWrite};
use tantivy::schema::{Schema, TEXT};
use tantivy::{doc, Index, IndexWriter, Term};

/// A failed delete during garbage collection must leave the file registered
/// as managed, so that a later garbage collection can remove it.
#[test]
fn test_failpoints_managed_directory_gc_if_delete_fails() {
    let _scenario = fail::FailScenario::setup();

    let managed_file: &'static Path = Path::new("some_path_for_test");

    let mut directory = ManagedDirectory::wrap(Box::new(RamDirectory::create())).unwrap();
    // Create the file through the managed directory.
    let writer = directory.open_write(managed_file).unwrap();
    writer.terminate().unwrap();
    assert!(directory.exists(managed_file).unwrap());

    // Trigger a gc while the delete operation is configured to fail.
    //
    // The gc must not drop the file from managed.json, so that the file
    // is still a candidate for removal in the next gc.
    //
    // The leading `1*off` lets the removal of the lock file go through.
    fail::cfg("RamDirectory::delete", "1*off->1*return").unwrap();
    let first_gc = directory.garbage_collect(Default::default);
    assert!(first_gc.is_ok());
    assert!(directory.exists(managed_file).unwrap());

    // A second gc should now succeed in removing the file.
    let second_gc = directory.garbage_collect(Default::default);
    assert!(second_gc.is_ok());
    assert!(
        !directory.exists(managed_file).unwrap(),
        "The file should have been deleted"
    );
}

/// A commit that fails while saving the metas must not make its documents
/// visible: only the documents of the earlier, successful commit are found.
#[test]
fn test_write_commit_fails() -> tantivy::Result<()> {
    let _fail_scenario_guard = fail::FailScenario::setup();
    let mut schema_builder = Schema::builder();
    let text_field = schema_builder.add_text_field("text", TEXT);
    let index = Index::create_in_ram(schema_builder.build());

    let mut writer: IndexWriter = index.writer_with_num_threads(1, 15_000_000)?;

    // First batch: committed before the failpoint is armed.
    for _ in 0..100 {
        writer.add_document(doc!(text_field => "a"))?;
    }
    writer.commit()?;

    // Second batch: its commit is expected to fail at `save_metas`.
    fail::cfg("save_metas", "return(error_write_failed)").unwrap();
    for _ in 0..100 {
        writer.add_document(doc!(text_field => "b"))?;
    }
    let failed_commit = writer.commit();
    assert!(failed_commit.is_err());

    // Document frequency of `text` as seen by a freshly opened reader.
    let doc_freq_of = |text: &str| -> tantivy::Result<u64> {
        let term = Term::from_field_text(text_field, text);
        let searcher = index.reader()?.searcher();
        searcher.doc_freq(&term)
    };
    assert_eq!(doc_freq_of("a")?, 100);
    assert_eq!(doc_freq_of("b")?, 0);
    Ok(())
}

// Motivated by
// - https://github.com/quickwit-oss/quickwit/issues/730
// Details at
// - https://github.com/quickwit-oss/tantivy/issues/1198
/// With the `FieldSerializer::close_term` failpoint always returning an
/// error, `add_document` is expected to start failing at some point.
#[test]
fn test_fail_on_flush_segment() -> tantivy::Result<()> {
    let _fail_scenario_guard = fail::FailScenario::setup();
    let mut schema_builder = Schema::builder();
    let text_field = schema_builder.add_text_field("text", TEXT);
    let index = Index::create_in_ram(schema_builder.build());
    let index_writer: IndexWriter = index.writer_with_num_threads(1, 15_000_000)?;
    fail::cfg("FieldSerializer::close_term", "return(simulatederror)").unwrap();

    // `any` stops at the first document whose insertion is rejected.
    let saw_error = (0..100_000).any(|i| {
        let document = doc!(text_field => format!("hellohappytaxpayerlongtokenblabla{}", i));
        index_writer.add_document(document).is_err()
    });
    if !saw_error {
        panic!("add_document should have returned an error");
    }
    Ok(())
}

/// Same scenario as `test_fail_on_flush_segment`, but with two indexing
/// threads and a failpoint that fires only once: `add_document` is still
/// expected to end up returning an error.
#[test]
fn test_fail_on_flush_segment_but_one_worker_remains() -> tantivy::Result<()> {
    let _fail_scenario_guard = fail::FailScenario::setup();
    let mut schema_builder = Schema::builder();
    let text_field = schema_builder.add_text_field("text", TEXT);
    let index = Index::create_in_ram(schema_builder.build());
    let index_writer: IndexWriter = index.writer_with_num_threads(2, 30_000_000)?;
    fail::cfg("FieldSerializer::close_term", "1*return(simulatederror)").unwrap();
    for i in 0..100_000 {
        let text = format!("hellohappytaxpayerlongtokenblabla{}", i);
        match index_writer.add_document(doc!(text_field => text)) {
            Ok(_) => continue,
            // The first rejected document is the expected outcome.
            Err(_) => return Ok(()),
        }
    }
    panic!("add_document should have returned an error");
}

/// With the `FieldSerializer::close_term` failpoint armed, adding a handful
/// of documents succeeds but the subsequent commit must report an error.
#[test]
fn test_fail_on_commit_segment() -> tantivy::Result<()> {
    let _fail_scenario_guard = fail::FailScenario::setup();
    let mut schema_builder = Schema::builder();
    let text_field = schema_builder.add_text_field("text", TEXT);
    let index = Index::create_in_ram(schema_builder.build());
    let mut index_writer: IndexWriter = index.writer_with_num_threads(1, 15_000_000)?;
    fail::cfg("FieldSerializer::close_term", "return(simulatederror)").unwrap();

    // Any error while adding a document aborts the test through `?`.
    (0..10).try_for_each(|i| {
        let text = format!("hellohappytaxpayerlongtokenblabla{}", i);
        index_writer
            .add_document(doc!(text_field => text))
            .map(|_opstamp| ())
    })?;

    let commit_result = index_writer.commit();
    assert!(commit_result.is_err());
    Ok(())
}


================================================
FILE: tokenizer-api/Cargo.toml
================================================
[package]
name = "tantivy-tokenizer-api"
version = "0.6.0"
license = "MIT"
edition = "2021"
description = "Tokenizer API of tantivy"
homepage = "https://github.com/quickwit-oss/tantivy"
repository = "https://github.com/quickwit-oss/tantivy"

# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html

[dependencies]
serde = { version = "1.0.152", features = ["derive"] }


================================================
FILE: tokenizer-api/README.md
================================================

# Tokenizer-API

An API to interface a tokenizer with tantivy. 

The API will be kept stable in order to not break support for existing tokenizers.


================================================
FILE: tokenizer-api/src/lib.rs
================================================
//! Tokenizers are in charge of chopping text into a stream of tokens
//! ready for indexing. This is a separate crate from tantivy, so implementers don't need to update
//! for each new tantivy version.
//!
//! To add support for a tokenizer, implement the [`Tokenizer`] trait.
//! Check out the [tantivy repo](https://github.com/quickwit-oss/tantivy/tree/main/src/tokenizer) for some examples.

use std::borrow::{Borrow, BorrowMut};
use std::ops::{Deref, DerefMut};

use serde::{Deserialize, Serialize};

/// A single token, as exposed by a [`TokenStream`].
///
/// Besides its text, a token records the byte range it covers in the
/// source text and its position expressed in number of tokens.
#[derive(Debug, Clone, Serialize, Deserialize, Eq, PartialEq)]
pub struct Token {
    /// Offset (byte index) of the first character of the token.
    /// Offsets shall not be modified by token filters.
    pub offset_from: usize,
    /// Offset (byte index) of the last character of the token + 1.
    /// The text that generated the token should be obtained by
    /// `&text[token.offset_from..token.offset_to]`.
    pub offset_to: usize,
    /// Position, expressed in number of tokens.
    pub position: usize,
    /// Actual text content of the token.
    pub text: String,
    /// Length of the token, expressed in number of original tokens.
    pub position_length: usize,
}

impl Default for Token {
    fn default() -> Token {
        Token {
            offset_from: 0,
            offset_to: 0,
            position: usize::MAX,
            text: String::new(),
            position_length: 1,
        }
    }
}

impl Token {
    /// reset to default
    pub fn reset(&mut self) {
        self.offset_from = 0;
        self.offset_to = 0;
        self.position = usize::MAX;
        self.text.clear();
        self.position_length = 1;
    }
}

/// `Tokenizer`s are in charge of splitting text into a stream of tokens
/// before indexing.
///
/// Implementors must be `'static`, [`Clone`], [`Send`] and [`Sync`].
pub trait Tokenizer: 'static + Clone + Send + Sync {
    /// The token stream returned by this Tokenizer.
    ///
    /// The lifetime parameter allows the stream to borrow from the
    /// tokenizer and from the text being tokenized.
    type TokenStream<'a>: TokenStream;
    /// Creates a token stream for a given `str`.
    ///
    /// The tokenizer is borrowed mutably and `text` is borrowed for as
    /// long as the returned stream is alive.
    fn token_stream<'a>(&'a mut self, text: &'a str) -> Self::TokenStream<'a>;
}

/// Simple wrapper of `Box<dyn TokenStream + 'a>`.
///
/// It erases the concrete type of a token stream whose borrows live for
/// `'a`, while still being usable as a [`TokenStream`] itself.
pub struct BoxTokenStream<'a>(Box<dyn TokenStream + 'a>);

/// Every method simply forwards to the boxed token stream.
impl TokenStream for BoxTokenStream<'_> {
    fn advance(&mut self) -> bool {
        let inner = &mut *self.0;
        inner.advance()
    }

    fn token(&self) -> &Token {
        let inner = &*self.0;
        inner.token()
    }

    fn token_mut(&mut self) -> &mut Token {
        let inner = &mut *self.0;
        inner.token_mut()
    }
}

impl<'a> BoxTokenStream<'a> {
    /// Boxes `token_stream` and wraps it into a `BoxTokenStream`.
    pub fn new<T: TokenStream + 'a>(token_stream: T) -> BoxTokenStream<'a> {
        let boxed: Box<dyn TokenStream + 'a> = Box::new(token_stream);
        Self(boxed)
    }
}

/// Gives shared access to the boxed token stream.
impl<'a> Deref for BoxTokenStream<'a> {
    type Target = dyn TokenStream + 'a;

    fn deref(&self) -> &Self::Target {
        self.0.as_ref()
    }
}
/// Gives exclusive access to the boxed token stream.
impl DerefMut for BoxTokenStream<'_> {
    fn deref_mut(&mut self) -> &mut Self::Target {
        self.0.as_mut()
    }
}

/// Lets a boxed trait object be used wherever a `TokenStream` is expected.
///
/// Each method borrows the inner trait object out of the box and forwards
/// the call to it.
impl<'a> TokenStream for Box<dyn TokenStream + 'a> {
    fn advance(&mut self) -> bool {
        // The type annotation makes `borrow_mut` return the boxed trait
        // object rather than the `Box` itself.
        let token_stream: &mut dyn TokenStream = self.borrow_mut();
        token_stream.advance()
    }

    fn token<'b>(&'b self) -> &'b Token {
        // Same as in `advance`: borrow the trait object, not the `Box`.
        let token_stream: &'b (dyn TokenStream + 'a) = self.borrow();
        token_stream.token()
    }

    fn token_mut<'b>(&'b mut self) -> &'b mut Token {
        // Same as in `advance`: borrow the trait object, not the `Box`.
        let token_stream: &'b mut (dyn TokenStream + 'a) = self.borrow_mut();
        token_stream.token_mut()
    }
}

/// `TokenStream` is the result of the tokenization.
///
/// It is a consumable stream of `Token`s: call [`TokenStream::advance`]
/// to move to the next token, then [`TokenStream::token`] to read it.
pub trait TokenStream {
    /// Moves the stream to its next token.
    ///
    /// Returns `false` once there are no more tokens.
    fn advance(&mut self) -> bool;

    /// Gives read access to the current token.
    fn token(&self) -> &Token;

    /// Gives write access to the current token.
    fn token_mut(&mut self) -> &mut Token;

    /// Convenience helper chaining `.advance()` and `.token()`.
    ///
    /// Returns `None` when `.advance()` reports that the stream is
    /// exhausted.
    fn next(&mut self) -> Option<&Token> {
        if !self.advance() {
            return None;
        }
        Some(self.token())
    }

    /// Drains the whole `TokenStream`, handing each token to `sink`
    /// in order.
    fn process(&mut self, sink: &mut dyn FnMut(&Token)) {
        while self.advance() {
            let current = self.token();
            sink(current);
        }
    }
}

/// Trait for the pluggable components of `Tokenizer`s.
///
/// A filter consumes a tokenizer and returns a new tokenizer built on top
/// of it. Implementors must be `'static`, [`Send`] and [`Sync`].
pub trait TokenFilter: 'static + Send + Sync {
    /// The Tokenizer type returned by this filter, typically parametrized by the underlying
    /// Tokenizer.
    type Tokenizer<T: Tokenizer>: Tokenizer;
    /// Wraps a Tokenizer and returns a new one.
    ///
    /// Both the filter and the wrapped `tokenizer` are taken by value.
    fn transform<T: Tokenizer>(self, tokenizer: T) -> Self::Tokenizer<T>;
}

#[cfg(test)]
mod test {
    use super::*;

    /// Cloning a `Token` must preserve every one of its fields.
    #[test]
    fn clone() {
        let t1 = Token {
            position: 1,
            offset_from: 2,
            offset_to: 3,
            text: "abc".to_string(),
            position_length: 1,
        };
        let t2 = t1.clone();

        assert_eq!(t1.position, t2.position);
        assert_eq!(t1.offset_from, t2.offset_from);
        assert_eq!(t1.offset_to, t2.offset_to);
        assert_eq!(t1.text, t2.text);
        assert_eq!(t1.position_length, t2.position_length);
        // Whole-value comparison, so that a field added to `Token` later on
        // is covered as well.
        assert_eq!(t1, t2);
    }
}