gitextract_4p4dwrk2/

├── .gitignore
├── LICENSE
├── README.md
├── dataspeech/
│   ├── __init__.py
│   ├── cpu_enrichments/
│   │   ├── __init__.py
│   │   └── rate.py
│   └── gpu_enrichments/
│       ├── __init__.py
│       ├── pitch.py
│       ├── snr_and_reverb.py
│       └── squim.py
├── examples/
│   ├── prompt_creation/
│   │   ├── run_prompt_creation_10k.sh
│   │   ├── run_prompt_creation_1k.sh
│   │   ├── run_prompt_creation_1k_with_speaker_consistency.sh
│   │   ├── run_prompt_creation_45k.sh
│   │   ├── run_prompt_creation_dummy.sh
│   │   ├── run_prompt_creation_jenny.sh
│   │   └── speaker_ids_to_names.json
│   ├── prompt_creation_llm_swarm/
│   │   ├── nginx.template.conf
│   │   ├── run_prompt_creation_10k.sh
│   │   ├── run_prompt_creation_1k.sh
│   │   ├── run_prompt_creation_dummy.sh
│   │   ├── run_prompt_creation_full_mls.sh
│   │   └── tgi_h100.template.slurm
│   ├── tagging/
│   │   ├── run_main_10k.sh
│   │   ├── run_main_1k.sh
│   │   ├── run_main_45k.sh
│   │   └── run_main_dummy.sh
│   └── tags_to_annotations/
│       ├── run_metadata_to_text_10k.sh
│       ├── run_metadata_to_text_10k_v02.sh
│       ├── run_metadata_to_text_for_finetuning.sh
│       ├── v01_bin_edges.json
│       ├── v01_text_bins.json
│       ├── v02_bin_edges.json
│       └── v02_text_bins.json
├── main.py
├── requirements.txt
└── scripts/
    ├── filter_audio_separation.py
    ├── merge_audio_to_metadata.py
    ├── metadata_to_text.py
    ├── per_dataset_script/
    │   ├── add_gender_to_MLS.py
    │   ├── add_gender_to_libritts_r.py
    │   └── clean_libritts_r.py
    ├── run_prompt_creation.py
    └── run_prompt_creation_llm_swarm.py