gitextract_pb8s4_gh/

├── .github/
│   └── workflows/
│       └── publish_action.yml
├── .gitignore
├── LICENSE
├── README-CN.md
├── README.md
├── __init__.py
├── megatts3node.py
├── pyproject.toml
├── requirements.txt
├── tts/
│   ├── frontend_function.py
│   ├── modules/
│   │   ├── aligner/
│   │   │   └── whisper_small.py
│   │   ├── ar_dur/
│   │   │   ├── ar_dur_predictor.py
│   │   │   └── commons/
│   │   │       ├── layers.py
│   │   │       ├── nar_tts_modules.py
│   │   │       ├── rel_transformer.py
│   │   │       ├── rot_transformer.py
│   │   │       ├── seq_utils.py
│   │   │       └── transformer.py
│   │   ├── llm_dit/
│   │   │   ├── cfm.py
│   │   │   ├── dit.py
│   │   │   ├── time_embedding.py
│   │   │   └── transformer.py
│   │   └── wavvae/
│   │       ├── decoder/
│   │       │   ├── diag_gaussian.py
│   │       │   ├── hifigan_modules.py
│   │       │   ├── seanet_encoder.py
│   │       │   └── wavvae_v3.py
│   │       └── encoder/
│   │           └── common_modules/
│   │               ├── conv.py
│   │               ├── lstm.py
│   │               └── seanet.py
│   └── utils/
│       ├── audio_utils/
│       │   ├── align.py
│       │   ├── io.py
│       │   └── plot.py
│       ├── commons/
│       │   ├── ckpt_utils.py
│       │   └── hparams.py
│       └── text_utils/
│           ├── dict.json
│           ├── ph_tone_convert.py
│           ├── split_text.py
│           └── text_encoder.py
└── workflow-examples/
    ├── 单人语音.json
    └── 双人会话.json