gitextract_6xpfra6z/

├── .gitignore
├── .gradio/
│   └── certificate.pem
├── LICENCE
├── README.md
├── assets/
│   ├── ReadMe.md
│   ├── crop_faces.py
│   ├── rename.py
│   └── segmentation.py
├── eval/
│   ├── eval_scripts/
│   │   ├── run_eval_multi.sh
│   │   └── run_eval_single.sh
│   ├── grounded_sam/
│   │   ├── florence2/
│   │   │   ├── config.json
│   │   │   ├── configuration_florence2.py
│   │   │   ├── generation_config.json
│   │   │   ├── modeling_florence2.py
│   │   │   ├── preprocessor_config.json
│   │   │   ├── processing_florence2.py
│   │   │   ├── tokenizer.json
│   │   │   ├── tokenizer_config.json
│   │   │   └── vocab.json
│   │   ├── grounded_sam2_florence2_autolabel_pipeline.py
│   │   └── sam2/
│   │       ├── __init__.py
│   │       ├── automatic_mask_generator.py
│   │       ├── build_sam.py
│   │       ├── configs/
│   │       │   ├── sam2/
│   │       │   │   ├── sam2_hiera_b+.yaml
│   │       │   │   ├── sam2_hiera_l.yaml
│   │       │   │   ├── sam2_hiera_s.yaml
│   │       │   │   └── sam2_hiera_t.yaml
│   │       │   ├── sam2.1/
│   │       │   │   ├── sam2.1_hiera_b+.yaml
│   │       │   │   ├── sam2.1_hiera_l.yaml
│   │       │   │   ├── sam2.1_hiera_s.yaml
│   │       │   │   └── sam2.1_hiera_t.yaml
│   │       │   └── sam2.1_training/
│   │       │       └── sam2.1_hiera_b+_MOSE_finetune.yaml
│   │       ├── csrc/
│   │       │   └── connected_components.cu
│   │       ├── modeling/
│   │       │   ├── __init__.py
│   │       │   ├── backbones/
│   │       │   │   ├── __init__.py
│   │       │   │   ├── hieradet.py
│   │       │   │   ├── image_encoder.py
│   │       │   │   └── utils.py
│   │       │   ├── memory_attention.py
│   │       │   ├── memory_encoder.py
│   │       │   ├── position_encoding.py
│   │       │   ├── sam/
│   │       │   │   ├── __init__.py
│   │       │   │   ├── mask_decoder.py
│   │       │   │   ├── prompt_encoder.py
│   │       │   │   └── transformer.py
│   │       │   ├── sam2_base.py
│   │       │   └── sam2_utils.py
│   │       ├── sam2_hiera_b+.yaml
│   │       ├── sam2_hiera_l.yaml
│   │       ├── sam2_hiera_s.yaml
│   │       ├── sam2_hiera_t.yaml
│   │       ├── sam2_image_predictor.py
│   │       ├── sam2_video_predictor.py
│   │       └── utils/
│   │           ├── __init__.py
│   │           ├── amg.py
│   │           ├── misc.py
│   │           └── transforms.py
│   └── tools/
│       ├── XVerseBench_multi.json
│       ├── XVerseBench_multi_DSG.json
│       ├── XVerseBench_single.json
│       ├── XVerseBench_single_DSG.json
│       ├── dino.py
│       ├── dpg_score.py
│       ├── face_id.py
│       ├── face_utils/
│       │   ├── face.py
│       │   └── face_recg.py
│       ├── florence_sam.py
│       ├── idip_aes_score.py
│       ├── idip_dpg_score.py
│       ├── idip_face_score.py
│       ├── idip_gen_split_idip.py
│       ├── idip_sam-dino_score.py
│       └── log_scores.py
├── inference_single_sample.py
├── requirements.txt
├── run_demo.sh
├── run_gradio.py
├── src/
│   ├── adapters/
│   │   ├── __init__.py
│   │   └── mod_adapters.py
│   ├── flux/
│   │   ├── block.py
│   │   ├── condition.py
│   │   ├── generate.py
│   │   ├── lora_controller.py
│   │   ├── pipeline_tools.py
│   │   └── transformer.py
│   └── utils/
│       ├── data_utils.py
│       ├── gpu_momory_utils.py
│       └── modulation_utils.py
└── train/
    └── config/
        ├── XVerse_config_INF.yaml
        └── XVerse_config_demo.yaml