gitextract_qaxjy5oq/

├── README.md
├── README_en.md
├── VisCPM/
│   ├── __init__.py
│   ├── cpm_tokenizers/
│   │   ├── __init__.py
│   │   ├── bee.py
│   │   └── vocabs/
│   │       └── bee.txt
│   ├── generation/
│   │   ├── __init__.py
│   │   ├── generation_utils.py
│   │   └── vllm_bee.py
│   ├── models/
│   │   ├── __init__.py
│   │   ├── beit3.py
│   │   ├── cpmbee.py
│   │   ├── modeling_utils.py
│   │   ├── modules/
│   │   │   ├── __init__.py
│   │   │   ├── attention.py
│   │   │   ├── blocks.py
│   │   │   ├── config.py
│   │   │   ├── embedding.py
│   │   │   ├── feedforward.py
│   │   │   ├── layernorm.py
│   │   │   ├── linear.py
│   │   │   ├── position_embedding.py
│   │   │   └── transformer.py
│   │   ├── stablediffusion.py
│   │   ├── vlg_cpmbee.py
│   │   └── vlu_cpmbee.py
│   ├── utils/
│   │   ├── __init__.py
│   │   └── utils.py
│   ├── viscpm_chat.py
│   └── viscpm_paint.py
├── config/
│   └── cpm-bee-10b.json
├── data/
│   ├── prompts.txt
│   └── translated_LLaVA_qa90/
│       ├── caps_boxes_coco2014_val_80_zh.jsonl
│       ├── qa90_gpt4_answer_zh.jsonl
│       ├── qa90_questions_zh.jsonl
│       └── rule_zh.json
├── demo_chat.py
├── demo_paint.py
├── figures/
│   └── wechat.md
├── finetune/
│   ├── README.md
│   ├── __init__.py
│   ├── dataset/
│   │   ├── __init__.py
│   │   ├── bee.py
│   │   ├── itembuilder.py
│   │   └── transformeddataset.py
│   ├── exporter.py
│   ├── ft_viscpm_chat/
│   │   ├── __init__.py
│   │   ├── config/
│   │   │   └── deepspeed/
│   │   │       └── viscpm_chat_ft.json
│   │   ├── get_llava150k_zh.sh
│   │   ├── run_viscpm_chat_ft.sh
│   │   └── train_viscpm_chat.py
│   ├── initializer.py
│   └── utils/
│       ├── __init__.py
│       ├── logger.py
│       ├── prompts.py
│       └── utils.py
├── requirements.txt
└── setup.py